All Downloads are FREE. Search and download functionalities are using the official Maven repository.

com.google.cloud.hadoop.io.bigquery.Export Maven / Gradle / Ivy

There is a newer version: 0.13.4-hadoop3
Show newest version
package com.google.cloud.hadoop.io.bigquery;

import java.io.IOException;
import java.util.List;
import org.apache.hadoop.mapreduce.InputSplit;
import org.apache.hadoop.mapreduce.JobContext;

/**
 * A single BigQuery export for the purpose of running a Hadoop MapReduce.
 *
 * <p>The methods below are declared in the order of the steps their comments describe: prepare,
 * begin the export, wait for usable input, obtain splits, and finally clean up.
 * NOTE(review): the required call order is not enforced or stated by this interface itself;
 * confirm against the implementations and callers.
 */
public interface Export {

  /**
   * Creates any temporary directories, tables, etc. needed by the export.
   *
   * @throws IOException if the preparation fails
   */
  void prepare() throws IOException;

  /**
   * Starts exporting data.
   *
   * @throws IOException if the export cannot be started
   */
  void beginExport() throws IOException;

  /**
   * Waits for enough data to be available for us to start a MapReduce. Depending on the
   * implementation, "enough" may be all data or no data.
   *
   * @throws IOException if waiting on the export fails
   * @throws InterruptedException if the calling thread is interrupted while waiting
   */
  void waitForUsableMapReduceInput() throws IOException, InterruptedException;

  /**
   * Gets the input splits that should be passed to Hadoop.
   *
   * @param context the Hadoop job context
   * @return the input splits to hand to Hadoop
   * @throws IOException if the splits cannot be computed
   * @throws InterruptedException if the calling thread is interrupted
   */
  List<InputSplit> getSplits(JobContext context) throws IOException, InterruptedException;

  /**
   * Gets the list of export paths to provide to BigQuery.
   *
   * @return the export paths, as strings
   * @throws IOException if the paths cannot be determined
   */
  List<String> getExportPaths() throws IOException;

  /**
   * Deletes any temp tables or temporary data locations.
   *
   * @throws IOException if the cleanup fails
   */
  void cleanupExport() throws IOException;
}




© 2015 - 2025 Weber Informatics LLC | Privacy Policy