net.starschema.clouddb.jdbc.BQSupportFuncts Maven / Gradle / Ivy

Go to download
Show more of this group Show more artifacts with this name
Show all versions of bqjdbc Show documentation
A simple JDBC driver, to reach Google's BigQuery
The newest version!
/**
 * Copyright (c) 2015, STARSCHEMA LTD. All rights reserved.
 *
 * Redistribution and use in source and binary forms, with or without modification, are permitted
 * provided that the following conditions are met:
 *
 * <p>1. Redistributions of source code must retain the above copyright notice, this list of
 * conditions and the following disclaimer. 2. Redistributions in binary form must reproduce the
 * above copyright notice, this list of conditions and the following disclaimer in the documentation
 * and/or other materials provided with the distribution.
 *
 * <p>THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS "AS IS" AND ANY EXPRESS OR
 * IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE IMPLIED WARRANTIES OF MERCHANTABILITY AND
 * FITNESS FOR A PARTICULAR PURPOSE ARE DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT OWNER OR
 * CONTRIBUTORS BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL
 * DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; LOSS OF USE,
 * DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY,
 * WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY
 * WAY OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
 *
 * <p>This class implements functions such as connecting to BigQuery, checking out the results and
 * displaying them on console
 */
package net.starschema.clouddb.jdbc;

import com.google.api.services.bigquery.Bigquery;
import com.google.api.services.bigquery.Bigquery.Jobs.Insert;
import com.google.api.services.bigquery.model.*;
import com.google.api.services.bigquery.model.DatasetList.Datasets;
import com.google.api.services.bigquery.model.ProjectList.Projects;
import com.google.api.services.bigquery.model.TableList.Tables;
import java.io.FileInputStream;
import java.io.IOException;
import java.io.UnsupportedEncodingException;
import java.math.BigInteger;
import java.net.URLDecoder;
import java.net.URLEncoder;
import java.util.ArrayList;
import java.util.List;
import java.util.Map;
import java.util.Objects;
import java.util.Properties;
import java.util.UUID;
import java.util.regex.Matcher;
import java.util.regex.Pattern;
import java.util.stream.Stream;
import net.starschema.clouddb.jdbc.BQConnection.JobCreationMode;
import org.slf4j.Logger;
import org.slf4j.LoggerFactory;

// import net.starschema.clouddb.bqjdbc.logging.Logger;

/**
 * This class contains static methods for interacting with BigQuery
 *
 * @author Gunics Balázs, Horváth Attila
 */
public class BQSupportFuncts {
  /** SLF4J logger used by the static helper methods of this class. */
  static Logger logger = LoggerFactory.getLogger(BQSupportFuncts.class);

  /**
   * Constructs a BigQuery JDBC driver URL from the specified properties.
   *
   * <p>The {@code type} property selects the URL flavour:
   *
   * <ul>
   *   <li>{@code installed}: requires {@code user} and {@code password}; the URL only carries the
   *       project id.
   *   <li>{@code service}: requires {@code user} and {@code password}; always adds {@code
   *       withServiceAccount=true}, and when {@code full} is set also the user, password and
   *       optional {@code path}.
   *   <li>{@code oauth}: requires {@code oauthaccesstoken}; the token is only added when {@code
   *       full} is set.
   *   <li>{@code applicationDefault}: always adds {@code withApplicationDefaultCredentials=true}.
   * </ul>
   *
   * <p>For every flavour except {@code installed} the default dataset is appended as a path
   * segment when {@code full} is set. The optional {@code useLegacySql}, {@code rootUrl}, {@code
   * queryCache} and {@code timeoutMs} properties are appended as URL-encoded query parameters.
   *
   * @param properties properties, most commonly read by {@link #readFromPropFile(String)}
   * @param full whether to include the default dataset and the credentials in the URL
   * @param dataset default dataset; when null the {@code dataset} property is used instead. The
   *     value can optionally include a reference to a project id, which will be used in
   *     conjunction with the default dataset to handle unqualified table references.
   * @return the driver URL, or null if {@code type} is missing or unknown, or if a property
   *     required by the selected type (including {@code projectid}) is missing
   * @throws UnsupportedEncodingException if UTF-8 is not supported by the runtime
   */
  public static String constructUrlFromPropertiesFile(
      Properties properties, boolean full, String dataset) throws UnsupportedEncodingException {
    String projectId = properties.getProperty("projectid"); // Represents the billing project.
    logger.debug("projectId is: {}", projectId);

    String type = properties.getProperty("type");
    // Every supported type needs a project id; a missing type cannot be dispatched at all.
    if (type == null || projectId == null) {
      return null;
    }

    String user = properties.getProperty("user");
    String password = properties.getProperty("password");
    String path = properties.getProperty("path");
    String defaultDataset = dataset == null ? properties.getProperty("dataset") : dataset;
    String datasetSegment =
        defaultDataset != null && full ? "/" + URLEncoder.encode(defaultDataset, "UTF-8") : "";

    StringBuilder url = new StringBuilder();
    // Set to '?' for the first param and '&' for subsequent params.
    String paramSep = "?";

    switch (type) {
      case "installed":
        if (user == null || password == null) {
          return null;
        }
        url.append(BQDriver.getURLPrefix()).append(URLEncoder.encode(projectId, "UTF-8"));
        break;
      case "service":
        if (user == null || password == null) {
          return null;
        }
        url.append(BQDriver.getURLPrefix())
            .append(URLEncoder.encode(projectId, "UTF-8"))
            .append(datasetSegment)
            .append("?withServiceAccount=true");
        paramSep = "&";
        if (full) {
          url.append("&user=")
              .append(URLEncoder.encode(user, "UTF-8"))
              .append("&password=")
              .append(URLEncoder.encode(password, "UTF-8"));
          if (path != null) {
            url.append("&path=").append(URLEncoder.encode(path, "UTF-8"));
          }
        }
        break;
      case "oauth":
        String accessToken = properties.getProperty("oauthaccesstoken");
        if (accessToken == null) {
          return null;
        }
        url.append(BQDriver.getURLPrefix())
            .append(URLEncoder.encode(projectId, "UTF-8"))
            .append(datasetSegment);
        if (full) {
          url.append("?oAuthAccessToken=").append(URLEncoder.encode(accessToken, "UTF-8"));
          paramSep = "&";
        }
        break;
      case "applicationDefault":
        url.append(BQDriver.getURLPrefix())
            .append(URLEncoder.encode(projectId, "UTF-8"))
            .append(datasetSegment)
            .append("?withApplicationDefaultCredentials=true");
        paramSep = "&";
        break;
      default:
        return null;
    }

    // Optional settings; the property name doubles as the URL parameter name.
    String[] optionalParams = {"useLegacySql", "rootUrl", "queryCache", "timeoutMs"};
    for (String name : optionalParams) {
      String value = properties.getProperty(name);
      if (value != null) {
        url.append(paramSep).append(name).append('=').append(URLEncoder.encode(value, "UTF-8"));
        paramSep = "&";
      }
    }

    return url.toString();
  }

  /**
   * Short-form overload: builds the driver URL without the optional "full" details and without a
   * dataset override.
   *
   * @param properties the properties to build the URL from
   * @return the result of the three-argument overload called with {@code full = false} and a null
   *     dataset
   * @throws UnsupportedEncodingException propagated from the three-argument overload
   */
  public static String constructUrlFromPropertiesFile(Properties properties)
      throws UnsupportedEncodingException {
    final boolean includeFullDetails = false;
    final String datasetOverride = null;
    return constructUrlFromPropertiesFile(properties, includeFullDetails, datasetOverride);
  }

  /**
   * Parses the query string of a driver URL into a {@link Properties} object.
   *
   * <p>The part of the URL between the first and the second {@code ?} (or the end of the URL) is
   * split at {@code &}. Each {@code key=value} component is split at its first {@code =}; the key
   * is lower-cased and the value is URL-decoded as UTF-8. Components without {@code =} are ignored.
   *
   * @param url the URL to parse
   * @param defaults properties to start from; they are copied, never modified. May be null, in
   *     which case the result starts out empty.
   * @return a new Properties object holding the defaults overlaid with the URL's query parameters
   * @throws UnsupportedEncodingException if UTF-8 is not supported by the runtime
   */
  public static Properties getUrlQueryComponents(String url, Properties defaults)
      throws UnsupportedEncodingException {
    String[] splitAtQP = url.split("\\?");
    Properties components = defaults == null ? new Properties() : (Properties) defaults.clone();

    // split() drops trailing empty strings, so "?" alone yields a zero-length array.
    if (splitAtQP.length < 2) {
      return components;
    }

    for (String subComponent : splitAtQP[1].split("&")) {
      // Split at the FIRST '=' so values that themselves contain '=' stay intact.
      int separator = subComponent.indexOf('=');
      if (separator < 0) {
        continue;
      }
      // Locale.ROOT keeps key casing independent of the JVM's default locale.
      String key = subComponent.substring(0, separator).toLowerCase(java.util.Locale.ROOT);
      String value = URLDecoder.decode(subComponent.substring(separator + 1), "UTF-8");
      components.setProperty(key, value);
    }

    return components;
  }

  /**
   * Lists the projects visible to the connection, optionally restricted to a single project id.
   *
   * @param projectIdFilter when non-null, only the project whose id equals this value is returned
   * @param connection a valid BQConnection instance
   * @return the matching projects, or null when there are none
   * @throws IOException if the request for the list of projects fails
   */
  private static List<Projects> getProjects(String projectIdFilter, BQConnection connection)
      throws IOException {
    logger.debug("Function call getProjects catalogName: {}", projectIdFilter);
    List<Projects> projects =
        connection.getBigquery().projects().list().execute().getProjects();

    if (projects == null || projects.isEmpty()) {
      return null;
    }
    if (projectIdFilter == null) {
      return projects;
    }

    List<Projects> matching = new ArrayList<>();
    for (Projects project : projects) {
      if (projectIdFilter.equals(project.getId())) {
        matching.add(project);
      }
    }
    // Callers in this class treat null as "nothing found".
    return matching.isEmpty() ? null : matching;
  }

  /**
   * Lists the datasets of a project, optionally restricted to those whose id matches a pattern.
   *
   * @param projectId the id of the project whose datasets are listed
   * @param datasetname when non-null, a pattern (see {@link #matchPattern(String, String)}) the
   *     dataset id must match
   * @param connection a valid BQConnection instance
   * @return the matching datasets, or null when there are none
   * @throws IOException if the request for the project's datasets fails
   */
  private static List<Datasets> getDatasets(
      String projectId, String datasetname, BQConnection connection) throws IOException {
    logger.debug("function call getDatasets, datasetName: {}, projectId: {}", datasetname, projectId);
    List<Datasets> datasets =
        connection.getBigquery().datasets().list(projectId).execute().getDatasets();

    if (datasets == null || datasets.isEmpty()) {
      return null;
    }
    if (datasetname == null) {
      return datasets;
    }

    List<Datasets> matching = new ArrayList<>();
    for (Datasets candidate : datasets) {
      if (matchPattern(candidate.getDatasetReference().getDatasetId(), datasetname)) {
        matching.add(candidate);
      }
    }
    // Callers in this class treat null as "nothing found".
    return matching.isEmpty() ? null : matching;
  }

  /**
   * Returns the complete result of a completed query, fetching follow-up pages until the number of
   * collected rows reaches the total reported by the first response.
   *
   * @param bigquery Instance of authorized Bigquery client
   * @param projectId The id of the Project the completed job was run in
   * @param completedJob The Job instance of the completed job
   * @return the first response, with the rows of all follow-up pages appended to its row list. If
   *     the response reports no total row count, or a total of zero, it is returned unchanged.
   * @throws IOException if a request for the query results fails, or if a follow-up page comes
   *     back without rows although more rows were expected
   */
  public static GetQueryResultsResponse getQueryResults(
      Bigquery bigquery, String projectId, Job completedJob) throws IOException {
    JobReference completedJobReference = completedJob.getJobReference();
    GetQueryResultsResponse queryResult =
        bigquery
            .jobs()
            .getQueryResults(projectId, completedJobReference.getJobId())
            .setLocation(completedJobReference.getLocation())
            .execute();

    BigInteger reportedTotal = queryResult.getTotalRows();
    if (reportedTotal == null || reportedTotal.longValue() == 0) {
      return queryResult;
    }
    long totalRows = reportedTotal.longValue();

    List<TableRow> rows = queryResult.getRows();
    if (rows == null) {
      // Rows are expected but the first page carried none: start from an empty list.
      rows = new ArrayList<>();
      queryResult.setRows(rows);
    }

    while (totalRows > rows.size()) {
      List<TableRow> page =
          bigquery
              .jobs()
              .getQueryResults(projectId, completedJobReference.getJobId())
              .setLocation(completedJobReference.getLocation())
              .setStartIndex(BigInteger.valueOf(rows.size()))
              .execute()
              .getRows();
      if (page == null || page.isEmpty()) {
        // Without this check the loop would never terminate (or fail with an NPE).
        throw new IOException(
            "Query results ended after " + rows.size() + " of " + totalRows + " rows.");
      }
      rows.addAll(page);
    }
    return queryResult;
  }

  /**
   * Fetches one page of the result of a completed query.
   *
   * @param bigquery Instance of authorized Bigquery client
   * @param projectId The id of the Project the completed job was run in
   * @param completedJob The Job instance of the completed job
   * @param startAtRow value passed to the request as its start index
   * @param fetchCount value passed to the request as its maximum number of results
   * @return the response of the single getQueryResults request
   * @throws IOException if the request to get QueryResults specified by the given ProjectId and
   *     Job id fails
   */
  public static GetQueryResultsResponse getQueryResultsDivided(
      Bigquery bigquery, String projectId, Job completedJob, BigInteger startAtRow, int fetchCount)
      throws IOException {
    final JobReference jobRef = completedJob.getJobReference();
    final long pageSize = fetchCount;
    return bigquery
        .jobs()
        .getQueryResults(projectId, jobRef.getJobId())
        .setLocation(jobRef.getLocation())
        .setStartIndex(startAtRow)
        .setMaxResults(pageSize)
        .execute();
  }

  /**
   * Fetches the current Job resource for a job reference.
   *
   * @param jobRef reference supplying the job id and location
   * @param bq Instance of authorized Bigquery client
   * @param projectId The id of the Project the job is contained in
   * @return the Job returned by the jobs.get request
   * @throws IOException if the request fails
   */
  public static Job getPollJob(JobReference jobRef, Bigquery bq, String projectId)
      throws IOException {
    return bq.jobs()
        .get(projectId, jobRef.getJobId())
        .setLocation(jobRef.getLocation())
        .execute();
  }

  /**
   * Polls a job and returns its current state.
   *
   * @param myjob Instance of Job
   * @param bigquery Instance of authorized Bigquery client
   * @param projectId The id of the Project the job is contained in
   * @return the state of the freshly polled job
   * @throws IOException if the request to get the job specified by myjob and projectId fails
   */
  public static String getQueryState(Job myjob, Bigquery bigquery, String projectId)
      throws IOException {
    // Re-fetch the job first; the passed-in instance is only used for its reference.
    return logAndGetQueryState(getPollJob(myjob.getJobReference(), bigquery, projectId));
  }

  /**
   * Logs the status and running time of a job and returns its current state.
   *
   * <p>The running time is measured from the job's creation time, falling back to its start time
   * when no creation time is present.
   *
   * @param pollJob Instance of Job
   * @return the state of the job
   * @throws IOException if the job, its status or its statistics are missing or empty
   * @throws IllegalStateException if the statistics carry neither a creation nor a start time
   */
  public static String logAndGetQueryState(Job pollJob) throws IOException {
    if (pollJob == null
        || pollJob.isEmpty()
        || pollJob.getStatus() == null
        || pollJob.getStatus().isEmpty()
        || pollJob.getStatistics() == null
        || pollJob.getStatistics().isEmpty()) {
      throw new IOException("Failed to fetch query state.");
    }

    JobStatistics stats = pollJob.getStatistics();
    Long referenceTime =
        stats.getCreationTime() != null ? stats.getCreationTime() : stats.getStartTime();
    if (referenceTime == null) {
      throw new IllegalStateException("Failed to fetch start or creation time.");
    }

    String state = pollJob.getStatus().getState();
    // The job id is only needed for the log line, so a missing reference must not fail the call.
    JobReference reference = pollJob.getJobReference();
    String jobId = reference == null ? null : reference.getJobId();
    logger.info(
        "Job status: {} ; {} ; {}", state, jobId, System.currentTimeMillis() - referenceTime);
    return state;
  }

  /**
   * Cancels a job. Returning the JobCancelResponse helps enforce that .execute() is actually
   * called on the cancel request.
   *
   * @param jobReference Instance of JobReference to cancel
   * @param bigquery Instance of authorized Bigquery client
   * @param projectId The id of the Project the job is contained in
   * @return the response of the executed cancel request
   * @throws IOException if the cancel request fails
   */
  public static JobCancelResponse cancelQuery(
      JobReference jobReference, Bigquery bigquery, String projectId) throws IOException {
    final JobCancelResponse cancelResponse =
        bigquery
            .jobs()
            .cancel(projectId, jobReference.getJobId())
            .setLocation(jobReference.getLocation())
            .execute();
    return cancelResponse;
  }

  /**
   * Lists the tables of one dataset, optionally restricted to those whose id matches a pattern.
   *
   * @param tableNamePattern when non-null, a pattern (see {@link #matchPattern(String, String)})
   *     the table id must match
   * @param projectId The exact Id of the Project that the tables must be in
   * @param datasetId The exact Id of the Dataset that the tables must be in
   * @param connection Instance of a valid BQConnection
   * @return the matching tables, or null when there are none
   * @throws IOException if the request to list the tables of the given project and dataset fails
   */
  private static List<Tables> getTables(
      String tableNamePattern, String projectId, String datasetId, BQConnection connection)
      throws IOException {
    logger.debug(
        "Function call getTables : tableNamePattern: {}, projectId: {}, datasetID:{}connection",
        tableNamePattern,
        projectId,
        datasetId);
    Bigquery.Tables.List listCall =
        connection
            .getBigquery()
            .tables()
            .list(projectId, datasetId)
            .setMaxResults(10000000L); // Really big number that we'll never hit
    List<Tables> tables = listCall.execute().getTables();

    if (tables == null || tables.isEmpty()) {
      logger.debug("returning null");
      return null;
    }
    if (tableNamePattern == null) {
      return tables;
    }

    List<Tables> matching = new ArrayList<>();
    for (Tables candidate : tables) {
      if (matchPattern(candidate.getTableReference().getTableId(), tableNamePattern)) {
        matching.add(candidate);
      }
    }
    if (matching.isEmpty()) {
      logger.debug("returning null");
      return null;
    }
    return matching;
  }

  /**
   * Collects full table information for every table that matches the given project, schema
   * (dataset) and table name filters.
   *
   * <p>For each matching project, its matching datasets are listed, then the matching tables of
   * each dataset, and finally each table is fetched individually.
   *
   * @param connection Valid instance of BQConnection
   * @param projectIdFilter when non-null, only the project with exactly this id is searched
   * @param schema when non-null, pattern the dataset id must match
   * @param tablename when non-null, pattern the table id must match
   * @return the fetched tables, or null when nothing matched
   * @throws IOException if listing the projects, datasets or tables fails, or if fetching the
   *     information of a single table fails
   */
  public static List<Table> getTables(
      BQConnection connection, String projectIdFilter, String schema, String tablename)
      throws IOException {
    List<Table> result = new ArrayList<>();
    logger.debug(
        "Function call getTables : projectIdFilter: {}, schema: {}, tablename:{}connection",
        projectIdFilter,
        schema,
        tablename);

    // getting the projects for this connection
    List<Projects> projects = BQSupportFuncts.getProjects(projectIdFilter, connection);
    if (projects == null || projects.isEmpty()) {
      return null;
    }

    for (Projects project : projects) {
      String projectId = project.getId();
      List<Datasets> datasets = BQSupportFuncts.getDatasets(projectId, schema, connection);
      if (datasets == null) {
        continue;
      }
      for (Datasets dataset : datasets) {
        String datasetId = dataset.getDatasetReference().getDatasetId();
        List<Tables> tables =
            BQSupportFuncts.getTables(tablename, projectId, datasetId, connection);
        if (tables == null) {
          continue;
        }
        for (Tables table : tables) {
          String tableId = table.getTableReference().getTableId();
          logger.debug(
              "Calling connection.getBigquery().tables() dataset is: {}, table is: {}, project is: {}",
              datasetId,
              tableId,
              projectId);
          Table tbl =
              connection.getBigquery().tables().get(projectId, datasetId, tableId).execute();
          if (tbl != null) {
            result.add(tbl);
          }
        }
      }
    }
    return result.isEmpty() ? null : result;
  }

  /**
   * Checks whether the input matches a DatabaseMetaData-style search pattern.
   *
   * <p>Some DatabaseMetaData methods take arguments that are String patterns. These arguments all
   * have names such as fooPattern. Within a pattern String, "%" means match any substring of 0 or
   * more characters, and "_" means match any one character. Only metadata entries matching the
   * search pattern are returned. If a search pattern argument is set to null, that argument's
   * criterion will be dropped from the search.
   *
   * <p>Every character other than "%" and "_" is matched literally, so regular-expression
   * metacharacters in the pattern carry no special meaning. A pattern without wildcards must equal
   * the input exactly.
   *
   * @param input the string to test
   * @param pattern the search pattern, or null to match everything
   * @return true if the pattern is null or the input matches it; false otherwise, including when
   *     the input is null and the pattern is not
   */
  public static boolean matchPattern(String input, String pattern) {
    if (pattern == null) {
      return true;
    }
    if (input == null) {
      return false;
    }
    if (pattern.indexOf('%') < 0 && pattern.indexOf('_') < 0) {
      return input.equals(pattern);
    }

    // Translate the wildcards to regex and quote every literal run in between, so characters
    // such as '.', '(' or '$' in an identifier are not interpreted as regex syntax.
    StringBuilder regex = new StringBuilder();
    StringBuilder literal = new StringBuilder();
    for (int i = 0; i < pattern.length(); i++) {
      char c = pattern.charAt(i);
      if (c == '%' || c == '_') {
        if (literal.length() > 0) {
          regex.append(Pattern.quote(literal.toString()));
          literal.setLength(0);
        }
        regex.append(c == '%' ? ".*" : ".");
      } else {
        literal.append(c);
      }
    }
    if (literal.length() > 0) {
      regex.append(Pattern.quote(literal.toString()));
    }
    return Pattern.matches(regex.toString(), input);
  }

  /**
   * Maps a BigQuery field type name to the corresponding {@link java.sql.Types} constant.
   *
   * @param columntype name of the column type; compared case-sensitively
   * @return the java.sql.Types value for FLOAT, BOOLEAN, INTEGER, STRING (as VARCHAR) or BIGINT,
   *     and 0 for any other name
   */
  public static int parseToSqlFieldType(String columntype) {
    switch (columntype) {
      case "FLOAT":
        return java.sql.Types.FLOAT;
      case "BOOLEAN":
        return java.sql.Types.BOOLEAN;
      case "INTEGER":
        return java.sql.Types.INTEGER;
      case "STRING":
        return java.sql.Types.VARCHAR;
      case "BIGINT":
        return java.sql.Types.BIGINT;
      default:
        return 0;
    }
  }

  /**
   * Reads a Properties file from the given location.
   *
   * @param filePath Location of the Properties File
   * @return Properties The Properties object made from the Properties File
   * @throws IOException if the file cannot be opened or the load from file fails
   */
  public static Properties readFromPropFile(String filePath) throws IOException {
    Properties properties = new Properties();
    // try-with-resources closes the stream even when load() throws.
    try (FileInputStream in = new FileInputStream(filePath)) {
      properties.load(in);
    }
    return properties;
  }

  /**
   * Run a query using the synchronous jobs.query() BigQuery endpoint.
   *
   * <p>Builds the request with {@code getSyncQuery} using the same arguments and executes it.
   *
   * @param bigquery The BigQuery API wrapper
   * @param projectId The ProjectId to use for billing
   * @param querySql The SQL to execute
   * @param dataSet default dataset, can be null
   * @param dataSetProjectId default dataset project id, only specified when the default dataset is
   *     non-null
   * @param useLegacySql Use the legacy SQL dialect when true
   * @param maxBillingBytes Maximum bytes that the API will allow to bill
   * @param queryTimeoutMs The timeout at which point the API will return with an incomplete result
   *     NOTE: this does _not_ mean the query fails, just we have to get the results async
   * @param maxResults The maximum number of rows to return with the synchronous response. Can be
   *     null for no max, but the API always has a 10MB limit. If more results exist, we need to
   *     fetch them in subsequent API requests.
   * @param labels labels forwarded to the query request
   * @param useQueryCache query-cache flag forwarded to the query request
   * @param jobCreationMode job creation mode forwarded to the query request, can be null
   * @return A [QueryResponse] with the results of the query, may be incomplete, may not have all
   *     rows.
   * @throws IOException if building or executing the request fails
   */
  static QueryResponse runSyncQuery(
      Bigquery bigquery,
      String projectId,
      String querySql,
      String dataSet,
      String dataSetProjectId,
      Boolean useLegacySql,
      Long maxBillingBytes,
      Long queryTimeoutMs,
      Long maxResults,
      Map<String, String> labels,
      boolean useQueryCache,
      JobCreationMode jobCreationMode)
      throws IOException {
    return getSyncQuery(
            bigquery,
            projectId,
            querySql,
            dataSet,
            dataSetProjectId,
            useLegacySql,
            maxBillingBytes,
            queryTimeoutMs,
            maxResults,
            labels,
            useQueryCache,
            jobCreationMode)
        .execute();
  }

  /**
   * Builds a synchronous jobs.query() request as specified, but does not execute it. Introduced
   * for assertions on the properties of the query.
   *
   * @param bigquery The BigQuery API wrapper
   * @param projectId The ProjectId the request is issued against
   * @param querySql The SQL to execute
   * @param dataSet default dataset, can be null; only set on the request when non-null
   * @param dataSetProjectId project id of the default dataset, used only when dataSet is non-null
   * @param useLegacySql legacy SQL flag set on the request
   * @param maxBillingBytes maximum bytes billed set on the request
   * @param queryTimeoutMs timeout in milliseconds set on the request
   * @param maxResults maximum number of results, can be null; only set on the request when
   *     non-null
   * @param labels labels set on the request
   * @param useQueryCache query-cache flag set on the request
   * @param jobCreationMode job creation mode, can be null; when non-null its enum name is set on
   *     the request
   * @return the prepared, not yet executed, query request
   * @throws IOException if creating the request fails
   */
  static Bigquery.Jobs.Query getSyncQuery(
      Bigquery bigquery,
      String projectId,
      String querySql,
      String dataSet,
      String dataSetProjectId,
      Boolean useLegacySql,
      Long maxBillingBytes,
      Long queryTimeoutMs,
      Long maxResults,
      Map<String, String> labels,
      boolean useQueryCache,
      JobCreationMode jobCreationMode)
      throws IOException {
    QueryRequest qr =
        new QueryRequest()
            .setLabels(labels)
            .setUseQueryCache(useQueryCache)
            .setTimeoutMs(queryTimeoutMs)
            .setQuery(querySql)
            .setUseLegacySql(useLegacySql)
            .setMaximumBytesBilled(maxBillingBytes);
    // The remaining settings are optional and only applied when a value was supplied.
    if (jobCreationMode != null) {
      qr = qr.setJobCreationMode(jobCreationMode.name());
    }
    if (dataSet != null) {
      qr.setDefaultDataset(
          new DatasetReference().setDatasetId(dataSet).setProjectId(dataSetProjectId));
    }
    if (maxResults != null) {
      qr.setMaxResults(maxResults);
    }

    return bigquery.jobs().query(projectId, qr);
  }

  /**
   * Starts a new query in async mode, using the billing project as the default dataset's project.
   *
   * <p>This method exists to maintain backwards compatibility with prior bqjdbc releases.
   *
   * @param bigquery The bigquery instance, which is authorized
   * @param projectId The project ID to use for both the billing and default dataset project ids
   * @param querySql The sql query which we want to run
   * @param dataSet The default dataset, can be null
   * @param useLegacySql Use the legacy SQL dialect when true
   * @param maxBillingBytes Maximum bytes that the API will allow to bill
   * @return the Job returned by the seven-argument overload, which we'll use to poll the bigquery
   *     for its state, then for its mined data.
   * @throws IOException if the request for initializing or executing job fails
   */
  public static Job startQuery(
      Bigquery bigquery,
      String projectId,
      String querySql,
      String dataSet,
      Boolean useLegacySql,
      Long maxBillingBytes)
      throws IOException {
    // The billing project doubles as the project of the default dataset.
    final String dataSetProjectId = projectId;
    return startQuery(
        bigquery, projectId, querySql, dataSet, dataSetProjectId, useLegacySql, maxBillingBytes);
  }

  /**
   * Starts a new query in async mode by inserting a query job with a freshly generated job id.
   *
   * @param bigquery The bigquery instance, which is authorized
   * @param projectId The project ID to use for billing
   * @param querySql The sql query which we want to run
   * @param dataSet The default dataset, can be null
   * @param dataSetProjectId The default dataset project id, only specified when the default dataset
   *     is non-null
   * @param useLegacySql Use the legacy SQL dialect when true
   * @param maxBillingBytes Maximum bytes that the API will allow to bill
   * @return The Job returned by the insert request, which we'll use to poll the bigquery for its
   *     state, then for its mined data.
   * @throws IOException if the request for initializing or executing job fails
   */
  public static Job startQuery(
      Bigquery bigquery,
      String projectId,
      String querySql,
      String dataSet,
      String dataSetProjectId,
      Boolean useLegacySql,
      Long maxBillingBytes)
      throws IOException {
    JobConfigurationQuery queryConfig = new JobConfigurationQuery();
    queryConfig.setQuery(querySql);
    queryConfig.setUseLegacySql(useLegacySql);
    queryConfig.setMaximumBytesBilled(maxBillingBytes);
    if (dataSet != null) {
      queryConfig.setDefaultDataset(
          new DatasetReference().setDatasetId(dataSet).setProjectId(dataSetProjectId));
    }

    JobConfiguration config = new JobConfiguration();
    config.setQuery(queryConfig);

    // Client-generated job id: a random UUID without the dashes.
    String jobId = UUID.randomUUID().toString().replace("-", "");
    Job job = new Job();
    job.setJobReference(new JobReference().setProjectId(projectId).setJobId(jobId));
    job.setConfiguration(config);

    // The first argument of insert() is the project id. The previous code passed the SQL text
    // here and then overwrote it via setProjectId(); pass the project id directly instead.
    Insert insert = bigquery.jobs().insert(projectId, job);
    logger.info(
        "Inserting Query Job ({}): {}",
        jobId,
        querySql.replace("\t", "").replace("\n", " ").replace("\r", ""));
    return insert.execute();
  }
}
    

    







    © 2015 - 2025 Weber Informatics LLC | Privacy Policy