All Downloads are FREE. Search and download functionalities are using the official Maven repository.

com.google.cloud.bigquery.Job Maven / Gradle / Ivy

There is a newer version: 2.44.0
Show newest version
/*
 * Copyright 2015 Google LLC
 *
 * Licensed under the Apache License, Version 2.0 (the "License");
 * you may not use this file except in compliance with the License.
 * You may obtain a copy of the License at
 *
 *       http://www.apache.org/licenses/LICENSE-2.0
 *
 * Unless required by applicable law or agreed to in writing, software
 * distributed under the License is distributed on an "AS IS" BASIS,
 * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
 * See the License for the specific language governing permissions and
 * limitations under the License.
 */

package com.google.cloud.bigquery;

import static com.google.common.base.Preconditions.checkNotNull;

import com.google.api.gax.retrying.BasicResultRetryAlgorithm;
import com.google.api.gax.retrying.RetrySettings;
import com.google.api.gax.retrying.TimedAttemptSettings;
import com.google.cloud.RetryHelper;
import com.google.cloud.RetryOption;
import com.google.cloud.bigquery.BigQuery.JobOption;
import com.google.cloud.bigquery.BigQuery.QueryResultsOption;
import com.google.cloud.bigquery.BigQuery.TableDataListOption;
import com.google.cloud.bigquery.JobConfiguration.Type;
import com.google.common.collect.ImmutableList;
import java.io.IOException;
import java.io.ObjectInputStream;
import java.util.ArrayList;
import java.util.Arrays;
import java.util.List;
import java.util.Objects;
import java.util.concurrent.Callable;
import java.util.concurrent.ExecutionException;
import org.threeten.bp.Duration;

/**
 * A Google BigQuery Job.
 *
 * 

Objects of this class are immutable. To get a {@code Job} object with the most recent * information use {@link #reload}. {@code Job} adds a layer of service-related functionality over * {@link JobInfo}. */ public class Job extends JobInfo { private static final long serialVersionUID = -4324100991693024704L; private static final RetrySettings DEFAULT_JOB_WAIT_SETTINGS = RetrySettings.newBuilder() .setTotalTimeout(Duration.ofHours(12L)) .setInitialRetryDelay(Duration.ofSeconds(1L)) .setRetryDelayMultiplier(2.0) .setJittered(true) .setMaxRetryDelay(Duration.ofMinutes(1L)) .build(); static final RetrySettings DEFAULT_QUERY_JOB_WAIT_SETTINGS = RetrySettings.newBuilder() .setTotalTimeout(Duration.ofHours(12L)) .setInitialRetryDelay(Duration.ofSeconds(3L)) .setRetryDelayMultiplier(1.0) .setJittered(true) .setMaxRetryDelay(Duration.ofSeconds(3L)) .build(); static final QueryResultsOption[] DEFAULT_QUERY_WAIT_OPTIONS = { QueryResultsOption.pageSize(0L), }; private final BigQueryOptions options; private transient BigQuery bigquery; private static final BigQueryRetryConfig DEFAULT_RETRY_CONFIG = BigQueryRetryConfig.newBuilder() .retryOnMessage(BigQueryErrorMessages.RATE_LIMIT_EXCEEDED_MSG) .build(); // retry config with Error Message for RateLimitExceeded Error /** A builder for {@code Job} objects. */ public static final class Builder extends JobInfo.Builder { private final BigQuery bigquery; private final JobInfo.BuilderImpl infoBuilder; Builder(BigQuery bigquery, JobConfiguration configuration) { this.bigquery = bigquery; this.infoBuilder = new JobInfo.BuilderImpl(); this.infoBuilder.setConfiguration(configuration); } Builder(Job job) { this.bigquery = job.bigquery; this.infoBuilder = new JobInfo.BuilderImpl(job); } @Override Builder setEtag(String etag) { infoBuilder.setEtag(etag); return this; } @Override Builder setGeneratedId(String generatedId) { infoBuilder.setGeneratedId(generatedId); return this; } @Override public Builder setJobId(JobId jobId) { infoBuilder.setJobId(jobId); return this; } @Override Builder setSelfLink(String selfLink) { infoBuilder.setSelfLink(selfLink); return this; } @Override Builder setStatus(JobStatus status) { infoBuilder.setStatus(status); return this; } @Override Builder setStatistics(JobStatistics statistics) { infoBuilder.setStatistics(statistics); return this; } @Override Builder setUserEmail(String userEmail) { infoBuilder.setUserEmail(userEmail); return this; } @Override public Builder setConfiguration(JobConfiguration configuration) { infoBuilder.setConfiguration(configuration); return this; } @Override public Job build() { return new Job(bigquery, infoBuilder); } } Job(BigQuery bigquery, JobInfo.BuilderImpl infoBuilder) { super(infoBuilder); this.bigquery = checkNotNull(bigquery); this.options = bigquery.getOptions(); } /** * Checks if this job exists. * *

Example of checking that a job exists. * *

{@code
   * if (!job.exists()) {
   *   // job doesn't exist
   * }
   * }
* * @return {@code true} if this job exists, {@code false} otherwise * @throws BigQueryException upon failure */ public boolean exists() { checkNotDryRun("exists"); return bigquery.getJob(getJobId(), JobOption.fields()) != null; } /** * Checks if this job has completed its execution, either failing or succeeding. If the job does * not exist this method returns {@code true}. * *

Example of waiting for a job until it reports that it is done. * *

{@code
   * while (!job.isDone()) {
   *   Thread.sleep(1000L);
   * }
   * }
* * @return {@code true} if this job is in {@link JobStatus.State#DONE} state or if it does not * exist, {@code false} if the state is not {@link JobStatus.State#DONE} * @throws BigQueryException upon failure */ public boolean isDone() { checkNotDryRun("isDone"); Job job = bigquery.getJob(getJobId(), JobOption.fields(BigQuery.JobField.STATUS)); return job == null || JobStatus.State.DONE.equals(job.getStatus().getState()); } /** * Blocks until this job completes its execution, either failing or succeeding. This method * returns current job's latest information. If the job no longer exists, this method returns * {@code null}. By default, the job status is checked using jittered exponential backoff with 1 * second as an initial delay, 2.0 as a backoff factor, 1 minute as maximum delay between polls, * 12 hours as a total timeout and unlimited number of attempts. * *

Example usage of {@code waitFor()}. * *

{@code
   * Job completedJob = job.waitFor();
   * if (completedJob == null) {
   *   // job no longer exists
   * } else if (completedJob.getStatus().getError() != null) {
   *   // job failed, handle error
   * } else {
   *   // job completed successfully
   * }
   * }
* *

Example usage of {@code waitFor()} with checking period and timeout. * *

{@code
   * Job completedJob =
   *     job.waitFor(
   *         RetryOption.initialRetryDelay(Duration.ofSeconds(1)),
   *         RetryOption.totalTimeout(Duration.ofMinutes(1)));
   * if (completedJob == null) {
   *   // job no longer exists
   * } else if (completedJob.getStatus().getError() != null) {
   *   // job failed, handle error
   * } else {
   *   // job completed successfully
   * }
   * }
* * @param waitOptions options to configure checking period and timeout * @throws BigQueryException upon failure, check {@link BigQueryException#getCause()} for details * @throws InterruptedException if the current thread gets interrupted while waiting for the job * to complete */ public Job waitFor(RetryOption... waitOptions) throws InterruptedException { checkNotDryRun("waitFor"); Object completedJobResponse; if (getConfiguration().getType() == Type.QUERY) { completedJobResponse = waitForQueryResults( RetryOption.mergeToSettings(DEFAULT_JOB_WAIT_SETTINGS, waitOptions), DEFAULT_QUERY_WAIT_OPTIONS); } else { completedJobResponse = waitForJob(RetryOption.mergeToSettings(DEFAULT_QUERY_JOB_WAIT_SETTINGS, waitOptions)); } return completedJobResponse == null ? null : reload(); } /** * Gets the query results of this job. This job must be of type {@code * JobConfiguration.Type.QUERY}, otherwise this method will throw {@link * UnsupportedOperationException}. * *

If the job hasn't finished, this method waits for the job to complete. However, the state of * the current {@code Job} instance is not updated. To get the new state, call {@link * #waitFor(RetryOption...)} or {@link #reload(JobOption...)}. * * @throws BigQueryException upon failure */ public TableResult getQueryResults(QueryResultsOption... options) throws InterruptedException, JobException { checkNotDryRun("getQueryResults"); if (getConfiguration().getType() != Type.QUERY) { throw new UnsupportedOperationException( "Getting query results is supported only for " + Type.QUERY + " jobs"); } List waitOptions = new ArrayList<>(Arrays.asList(DEFAULT_QUERY_WAIT_OPTIONS)); List listOptions = new ArrayList<>(); for (QueryResultsOption option : options) { switch (option.getRpcOption()) { case MAX_RESULTS: listOptions.add(TableDataListOption.pageSize((Long) option.getValue())); break; case PAGE_TOKEN: listOptions.add(TableDataListOption.pageToken((String) option.getValue())); break; case START_INDEX: listOptions.add(TableDataListOption.startIndex((Long) option.getValue())); break; case TIMEOUT: waitOptions.add(QueryResultsOption.maxWaitTime((Long) option.getValue())); break; } } QueryResponse response = waitForQueryResults( DEFAULT_JOB_WAIT_SETTINGS, waitOptions.toArray(new QueryResultsOption[0])); // Get the job resource to determine if it has errored. Job job = this; if (job.getStatus() == null || !JobStatus.State.DONE.equals(job.getStatus().getState())) { job = reload(); } if (job.getStatus() != null && job.getStatus().getError() != null) { throw new BigQueryException( job.getStatus().getExecutionErrors() == null ? ImmutableList.of(job.getStatus().getError()) : ImmutableList.copyOf(job.getStatus().getExecutionErrors())); } // If there are no rows in the result, this may have been a DDL query. // Listing table data might fail, such as with CREATE VIEW queries. // Avoid a tabledata.list API request by returning an empty TableResult. if (response.getTotalRows() == 0) { TableResult emptyTableResult = new EmptyTableResult(response.getSchema()); emptyTableResult.setJobId(job.getJobId()); return emptyTableResult; } TableId table = ((QueryJobConfiguration) getConfiguration()).getDestinationTable() == null ? ((QueryJobConfiguration) job.getConfiguration()).getDestinationTable() : ((QueryJobConfiguration) getConfiguration()).getDestinationTable(); TableResult tableResult = bigquery.listTableData( table, response.getSchema(), listOptions.toArray(new TableDataListOption[0])); tableResult.setJobId(job.getJobId()); return tableResult; } private QueryResponse waitForQueryResults( RetrySettings retrySettings, final QueryResultsOption... resultsOptions) throws InterruptedException { if (getConfiguration().getType() != Type.QUERY) { throw new UnsupportedOperationException( "Waiting for query results is supported only for " + Type.QUERY + " jobs"); } try { return BigQueryRetryHelper.runWithRetries( new Callable() { @Override public QueryResponse call() { return bigquery.getQueryResults(getJobId(), resultsOptions); } }, retrySettings, new BasicResultRetryAlgorithm() { @Override public boolean shouldRetry( Throwable prevThrowable, QueryResponse prevResponse) { // Used by BigQueryRetryAlgorithm.shouldRetryBasedOnResult return prevResponse != null && !prevResponse.getCompleted(); } }, options.getClock(), DEFAULT_RETRY_CONFIG); } catch (BigQueryRetryHelper.BigQueryRetryHelperException e) { throw BigQueryException.translateAndThrow(e); } } private Job waitForJob(RetrySettings waitSettings) throws InterruptedException { try { return RetryHelper.poll( new Callable() { @Override public Job call() throws Exception { return bigquery.getJob(getJobId(), JobOption.fields(BigQuery.JobField.STATUS)); } }, waitSettings, new BasicResultRetryAlgorithm() { @Override public TimedAttemptSettings createNextAttempt( Throwable prevThrowable, Job prevResponse, TimedAttemptSettings prevSettings) { return null; } @Override public boolean shouldRetry(Throwable prevThrowable, Job prevResponse) { return prevResponse != null && !JobStatus.State.DONE.equals(prevResponse.getStatus().getState()); } }, options.getClock()); } catch (ExecutionException e) { throw BigQueryException.translateAndThrow(e); } } /** * Fetches current job's latest information. Returns {@code null} if the job does not exist. * *

Example of reloading all fields until job status is DONE. * *

{@code
   * while (!JobStatus.State.DONE.equals(job.getStatus().getState())) {
   *   Thread.sleep(1000L);
   *   job = job.reload();
   * }
   * }
* *

Example of reloading status field until job status is DONE. * *

{@code
   * while (!JobStatus.State.DONE.equals(job.getStatus().getState())) {
   *   Thread.sleep(1000L);
   *   job = job.reload(BigQuery.JobOption.fields(BigQuery.JobField.STATUS));
   * }
   * }
* * @param options job options * @return a {@code Job} object with latest information or {@code null} if not found * @throws BigQueryException upon failure */ public Job reload(JobOption... options) { checkNotDryRun("reload"); Job job = bigquery.getJob(getJobId(), options); if (job != null && job.getStatus().getError() != null) { throw new BigQueryException( job.getStatus().getExecutionErrors() == null ? ImmutableList.of(job.getStatus().getError()) : ImmutableList.copyOf(job.getStatus().getExecutionErrors())); } return job; } /** * Sends a job cancel request. * *

Example of cancelling a job. * *

{@code
   * if (job.cancel()) {
   *   return true; // job successfully cancelled
   * } else {
   *   // job not found
   * }
   * }
* * @return {@code true} if cancel request was sent successfully, {@code false} if job was not * found * @throws BigQueryException upon failure */ public boolean cancel() { checkNotDryRun("cancel"); return bigquery.cancel(getJobId()); } private void checkNotDryRun(String op) { checkNotDryRun(getConfiguration(), op); } static void checkNotDryRun(JobConfiguration jobConfig, String op) { QueryJobConfiguration config; if (jobConfig instanceof QueryJobConfiguration) { config = (QueryJobConfiguration) jobConfig; } else { return; } Boolean dryRun = config.dryRun(); if (dryRun == null) { dryRun = false; } if (dryRun) { String msg = "Operation \"%s\" does not work for dryrun queries, " + "since a dry run does not actually create a job. " + "To validate a query and obtain some processing statistics, consider calling " + "BigQuery.create(JobInfo)."; throw new UnsupportedOperationException(String.format(msg, op)); } } /** Returns the job's {@code BigQuery} object used to issue requests. */ public BigQuery getBigQuery() { return bigquery; } @Override public Builder toBuilder() { return new Builder(this); } @Override public final boolean equals(Object obj) { if (obj == this) { return true; } if (obj == null || !obj.getClass().equals(Job.class)) { return false; } Job other = (Job) obj; return Objects.equals(toPb(), other.toPb()) && Objects.equals(options, other.options); } @Override public final int hashCode() { return Objects.hash(super.hashCode(), options); } private void readObject(ObjectInputStream in) throws IOException, ClassNotFoundException { in.defaultReadObject(); this.bigquery = options.getService(); } static Job fromPb(BigQuery bigquery, com.google.api.services.bigquery.model.Job jobPb) { return new Job(bigquery, new JobInfo.BuilderImpl(jobPb)); } }




© 2015 - 2024 Weber Informatics LLC | Privacy Policy