All Downloads are FREE. Search and download functionalities are using the official Maven repository.

org.apache.gobblin.converter.AsyncHttpJoinConverter Maven / Gradle / Ivy

/*
 * Licensed to the Apache Software Foundation (ASF) under one or more
 * contributor license agreements.  See the NOTICE file distributed with
 * this work for additional information regarding copyright ownership.
 * The ASF licenses this file to You under the Apache License, Version 2.0
 * (the "License"); you may not use this file except in compliance with
 * the License.  You may obtain a copy of the License at
 *
 *    http://www.apache.org/licenses/LICENSE-2.0
 *
 * Unless required by applicable law or agreed to in writing, software
 * distributed under the License is distributed on an "AS IS" BASIS,
 * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
 * See the License for the specific language governing permissions and
 * limitations under the License.
 */
package org.apache.gobblin.converter;

import java.io.IOException;
import java.util.Queue;
import java.util.concurrent.CompletableFuture;
import java.util.concurrent.LinkedBlockingDeque;

import org.apache.avro.generic.GenericRecord;

import com.google.common.collect.ImmutableMap;
import com.typesafe.config.Config;
import com.typesafe.config.ConfigFactory;

import lombok.Getter;
import lombok.extern.slf4j.Slf4j;

import org.apache.gobblin.async.AsyncRequest;
import org.apache.gobblin.async.AsyncRequestBuilder;
import org.apache.gobblin.async.BufferedRecord;
import org.apache.gobblin.async.Callback;
import org.apache.gobblin.broker.gobblin_scopes.GobblinScopeTypes;
import org.apache.gobblin.broker.iface.SharedResourcesBroker;
import org.apache.gobblin.config.ConfigBuilder;
import org.apache.gobblin.configuration.ConfigurationKeys;
import org.apache.gobblin.configuration.State;
import org.apache.gobblin.configuration.WorkUnitState;
import org.apache.gobblin.http.HttpClient;
import org.apache.gobblin.http.HttpOperation;
import org.apache.gobblin.http.ResponseHandler;
import org.apache.gobblin.http.ResponseStatus;
import org.apache.gobblin.net.Request;
import org.apache.gobblin.utils.HttpConstants;
import org.apache.gobblin.writer.WriteCallback;
import edu.umd.cs.findbugs.annotations.SuppressWarnings;

/**
 * This converter converts an input record (DI) to an output record (DO) which
 * contains original input data and http request & response info.
 *
 * Sequence:
 * Convert DI to HttpOperation
 * Convert HttpOperation to RQ (by internal AsyncRequestBuilder)
 * Execute http request, get response RP (by HttpClient)
 * Combine info (DI, RQ, RP, status, etc..) to generate output DO
 */
@Slf4j
public abstract class AsyncHttpJoinConverter extends AsyncConverter1to1 {
  public static final String CONF_PREFIX = "gobblin.converter.http.";
  public static final Config DEFAULT_FALLBACK =
      ConfigFactory.parseMap(ImmutableMap.builder()
          .put(HttpConstants.CONTENT_TYPE, "application/json")
          .put(HttpConstants.VERB, "GET")
          .build());

  protected HttpClient httpClient = null;
  protected ResponseHandler responseHandler = null;
  protected AsyncRequestBuilder requestBuilder = null;
  protected boolean skipFailedRecord;

  public AsyncHttpJoinConverter init(WorkUnitState workUnitState) {
    super.init(workUnitState);
    Config config = ConfigBuilder.create().loadProps(workUnitState.getProperties(), CONF_PREFIX).build();
    config = config.withFallback(DEFAULT_FALLBACK);
    skipFailedRecord = workUnitState.getPropAsBoolean(ConfigurationKeys.CONVERTER_SKIP_FAILED_RECORD, false);
    httpClient = createHttpClient(config, workUnitState.getTaskBroker());
    responseHandler = createResponseHandler(config);
    requestBuilder = createRequestBuilder(config);
    return this;
  }

  @Override
  public final SO convertSchema(SI inputSchema, WorkUnitState workUnitState)
      throws SchemaConversionException {
    return convertSchemaImpl(inputSchema, workUnitState);
  }

  protected abstract HttpClient   createHttpClient(Config config, SharedResourcesBroker broker);
  protected abstract ResponseHandler createResponseHandler(Config config);
  protected abstract AsyncRequestBuilder createRequestBuilder(Config config);
  protected abstract HttpOperation generateHttpOperation (DI inputRecord, State state);
  protected abstract SO convertSchemaImpl (SI inputSchema, WorkUnitState workUnitState) throws SchemaConversionException;
  protected abstract DO convertRecordImpl (SO outputSchema, DI input, RQ rawRequest, ResponseStatus status) throws DataConversionException;

  /**
   * A helper class which performs the conversion from http response to DO type output, saved as a {@link CompletableFuture}
   */
  private class AsyncHttpJoinConverterContext {
    private final CompletableFuture future;
    private final AsyncHttpJoinConverter converter;

    @Getter
    private final Callback callback;

    public AsyncHttpJoinConverterContext(AsyncHttpJoinConverter converter, SO outputSchema, DI input, Request request) {
      this.future = new CompletableFuture();
      this.converter = converter;
      this.callback = new Callback() {
        @Override
        public void onSuccess(RP result) {
          try {
            ResponseStatus status = AsyncHttpJoinConverterContext.this.converter.responseHandler.handleResponse(request, result);
            switch (status.getType()) {
              case OK:
                AsyncHttpJoinConverterContext.this.onSuccess(request.getRawRequest(), status, outputSchema, input);
                break;
              case CLIENT_ERROR:
                log.error ("Http converter client error with request {}", request.getRawRequest());
                AsyncHttpJoinConverterContext.this.onSuccess(request.getRawRequest(), status, outputSchema, input);
                break;
              case SERVER_ERROR:
                // Server side error. Retry
                log.error ("Http converter server error with request {}", request.getRawRequest());
                throw new DataConversionException(request.getRawRequest() + " send failed due to server error");
              default:
                throw new DataConversionException(request.getRawRequest() + " Should not reach here");
            }
          } catch (Exception e) {
            log.error ("Http converter exception {} with request {}", e.toString(), request.getRawRequest());
            AsyncHttpJoinConverterContext.this.future.completeExceptionally(e);
          }
        }

        @SuppressWarnings(value = "NP_NONNULL_PARAM_VIOLATION",
            justification = "CompletableFuture will replace null value with NIL")
        @Override
        public void onFailure(Throwable throwable) {
          log.error ("Http converter on failure with request {}", request.getRawRequest());

          if (skipFailedRecord) {
            AsyncHttpJoinConverterContext.this.future.complete( null);
          } else {
            AsyncHttpJoinConverterContext.this.future.completeExceptionally(throwable);
          }
        }
      };
    }

    private void onSuccess(RQ rawRequest, ResponseStatus status, SO outputSchema, DI input) throws DataConversionException {
      log.debug("{} send with status type {}", rawRequest, status.getType());
      DO output = this.converter.convertRecordImpl(outputSchema, input, rawRequest, status);
      AsyncHttpJoinConverterContext.this.future.complete(output);
    }
  }

  /**
   * Convert an input record to a future object where an output record will be filled in sometime later
   * Sequence:
   *    Convert input (DI) to an http request
   *    Send http request asynchronously, and registers an http callback
   *    Create an {@link CompletableFuture} object. When the callback is invoked, this future object is filled in by an output record which is converted from http response.
   *    Return the future object.
   */
  @Override
  public final CompletableFuture convertRecordAsync(SO outputSchema, DI inputRecord, WorkUnitState workUnitState)
      throws DataConversionException {

    // Convert DI to HttpOperation
    HttpOperation operation = generateHttpOperation(inputRecord, workUnitState);
    BufferedRecord bufferedRecord = new BufferedRecord<>(operation, WriteCallback.EMPTY);

    // Convert HttpOperation to RQ
    Queue> buffer = new LinkedBlockingDeque<>();
    buffer.add(bufferedRecord);
    AsyncRequest request = this.requestBuilder.buildRequest(buffer);
    RQ rawRequest = request.getRawRequest();

    // Execute query and get response
    AsyncHttpJoinConverterContext context = new AsyncHttpJoinConverterContext(this, outputSchema, inputRecord, request);

    try {
      httpClient.sendAsyncRequest(rawRequest, context.getCallback());
    } catch (IOException e) {
      throw new DataConversionException(e);
    }

    return context.future;
  }

  public void close() throws IOException {
    this.httpClient.close();
  }
}




© 2015 - 2025 Weber Informatics LLC | Privacy Policy