// org.apache.gobblin.converter.AsyncHttpJoinConverter Maven / Gradle / Ivy
/*
* Licensed to the Apache Software Foundation (ASF) under one or more
* contributor license agreements. See the NOTICE file distributed with
* this work for additional information regarding copyright ownership.
* The ASF licenses this file to You under the Apache License, Version 2.0
* (the "License"); you may not use this file except in compliance with
* the License. You may obtain a copy of the License at
*
* http://www.apache.org/licenses/LICENSE-2.0
*
* Unless required by applicable law or agreed to in writing, software
* distributed under the License is distributed on an "AS IS" BASIS,
* WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
* See the License for the specific language governing permissions and
* limitations under the License.
*/
package org.apache.gobblin.converter;
import java.io.IOException;
import java.util.Queue;
import java.util.concurrent.CompletableFuture;
import java.util.concurrent.LinkedBlockingDeque;
import org.apache.avro.generic.GenericRecord;
import com.google.common.collect.ImmutableMap;
import com.typesafe.config.Config;
import com.typesafe.config.ConfigFactory;
import lombok.Getter;
import lombok.extern.slf4j.Slf4j;
import org.apache.gobblin.async.AsyncRequest;
import org.apache.gobblin.async.AsyncRequestBuilder;
import org.apache.gobblin.async.BufferedRecord;
import org.apache.gobblin.async.Callback;
import org.apache.gobblin.broker.gobblin_scopes.GobblinScopeTypes;
import org.apache.gobblin.broker.iface.SharedResourcesBroker;
import org.apache.gobblin.config.ConfigBuilder;
import org.apache.gobblin.configuration.ConfigurationKeys;
import org.apache.gobblin.configuration.State;
import org.apache.gobblin.configuration.WorkUnitState;
import org.apache.gobblin.http.HttpClient;
import org.apache.gobblin.http.HttpOperation;
import org.apache.gobblin.http.ResponseHandler;
import org.apache.gobblin.http.ResponseStatus;
import org.apache.gobblin.net.Request;
import org.apache.gobblin.utils.HttpConstants;
import org.apache.gobblin.writer.WriteCallback;
import edu.umd.cs.findbugs.annotations.SuppressWarnings;
/**
* This converter converts an input record (DI) to an output record (DO) which
* contains the original input data and the HTTP request and response info.
*
* Sequence:
* <ol>
* <li>Convert DI to HttpOperation</li>
* <li>Convert HttpOperation to RQ (by the internal AsyncRequestBuilder)</li>
* <li>Execute the HTTP request and get the response RP (by HttpClient)</li>
* <li>Combine info (DI, RQ, RP, status, etc.) to generate the output DO</li>
* </ol>
*/
@Slf4j
public abstract class AsyncHttpJoinConverter extends AsyncConverter1to1 {
/**
* Prefix handed to {@code ConfigBuilder.loadProps} in {@code init} when building this
* converter's {@link Config} from the work unit properties.
* NOTE(review): presumably only properties under this prefix are picked up; confirm
* against ConfigBuilder.
*/
public static final String CONF_PREFIX = "gobblin.converter.http.";
/**
* Defaults layered under the loaded configuration via {@code withFallback} in {@code init}:
* content type {@code application/json} and verb {@code GET}.
*/
public static final Config DEFAULT_FALLBACK =
ConfigFactory.parseMap(ImmutableMap.builder()
.put(HttpConstants.CONTENT_TYPE, "application/json")
.put(HttpConstants.VERB, "GET")
.build());
/** HTTP client; assigned in {@code init} from {@code createHttpClient}. */
protected HttpClient httpClient = null;
/** Response handler; assigned in {@code init} from {@code createResponseHandler}. */
protected ResponseHandler responseHandler = null;
/** Request builder; assigned in {@code init} from {@code createRequestBuilder}. */
protected AsyncRequestBuilder requestBuilder = null;
/**
* Value of {@code ConfigurationKeys.CONVERTER_SKIP_FAILED_RECORD}, read in {@code init}
* with a default of {@code false}.
* NOTE(review): the code that consumes this flag is outside the visible part of the file.
*/
protected boolean skipFailedRecord;
/**
* Initializes this converter from the supplied work unit state.
*
* <p>Builds a {@link Config} from the work unit properties using {@link #CONF_PREFIX},
* layers {@link #DEFAULT_FALLBACK} beneath it, reads the skip-failed-record flag, and then
* creates the HTTP client, the response handler and the request builder through the
* abstract factory methods.
*
* @param workUnitState state supplying the properties and the task broker
* @return this converter
*/
public AsyncHttpJoinConverter init(WorkUnitState workUnitState) {
  super.init(workUnitState);

  // Values loaded from the work unit take precedence; the fallback only fills missing keys.
  final Config effectiveConfig = ConfigBuilder.create()
      .loadProps(workUnitState.getProperties(), CONF_PREFIX)
      .build()
      .withFallback(DEFAULT_FALLBACK);

  this.skipFailedRecord =
      workUnitState.getPropAsBoolean(ConfigurationKeys.CONVERTER_SKIP_FAILED_RECORD, false);

  // Create the collaborators: client first, then response handler, then request builder.
  this.httpClient = createHttpClient(effectiveConfig, workUnitState.getTaskBroker());
  this.responseHandler = createResponseHandler(effectiveConfig);
  this.requestBuilder = createRequestBuilder(effectiveConfig);

  return this;
}
/**
* Converts the input schema to the output schema.
*
* <p>This method is final; the actual conversion is supplied by subclasses through
* {@code convertSchemaImpl}, to which the arguments are passed unchanged.
*
* @param inputSchema the schema of the incoming records
* @param workUnitState the work unit state handed on to the implementation
* @return the schema produced by {@code convertSchemaImpl}
* @throws SchemaConversionException if the implementation fails to convert the schema
*/
@Override
public final SO convertSchema(SI inputSchema, WorkUnitState workUnitState)
    throws SchemaConversionException {
  final SO outputSchema = convertSchemaImpl(inputSchema, workUnitState);
  return outputSchema;
}
/**
* Creates the HTTP client stored in {@code httpClient}. Called from {@code init}.
*
* @param config the converter configuration built in {@code init} (with defaults applied)
* @param broker the task broker obtained from the work unit state
* @return the client to use for executing requests
*/
protected abstract HttpClient createHttpClient(Config config, SharedResourcesBroker broker);
/**
* Creates the response handler stored in {@code responseHandler}. Called from {@code init}.
*
* @param config the converter configuration built in {@code init} (with defaults applied)
* @return the response handler
*/
protected abstract ResponseHandler createResponseHandler(Config config);
/**
* Creates the request builder stored in {@code requestBuilder}. Called from {@code init}.
* Per the class description, the builder turns an HttpOperation into a raw request (RQ).
*
* @param config the converter configuration built in {@code init} (with defaults applied)
* @return the request builder
*/
protected abstract AsyncRequestBuilder createRequestBuilder(Config config);
/**
* Produces the {@link HttpOperation} for one input record (the first step of the sequence
* in the class description).
* NOTE(review): the call site is outside the visible part of the file.
*
* @param inputRecord the input record (DI)
* @param state state made available to the implementation
* @return the HTTP operation describing the request for this record
*/
protected abstract HttpOperation generateHttpOperation (DI inputRecord, State state);
/**
* Performs the schema conversion on behalf of {@code convertSchema}, which delegates to
* this method with its arguments unchanged.
*
* @param inputSchema the input schema (SI)
* @param workUnitState the work unit state passed to {@code convertSchema}
* @return the output schema (SO)
* @throws SchemaConversionException if the schema cannot be converted
*/
protected abstract SO convertSchemaImpl (SI inputSchema, WorkUnitState workUnitState) throws SchemaConversionException;
/**
* Builds the output record (DO) from the input record, the raw request and the response
* status (the last step of the sequence in the class description).
* NOTE(review): the call site is outside the visible part of the file.
*
* @param outputSchema the output schema (SO)
* @param input the original input record (DI)
* @param rawRequest the raw request (RQ) that was issued for the record
* @param status the status of the response
* @return the combined output record
* @throws DataConversionException if the output record cannot be produced
*/
protected abstract DO convertRecordImpl (SO outputSchema, DI input, RQ rawRequest, ResponseStatus status) throws DataConversionException;
/**
* A helper class which performs the conversion from http response to DO type output, saved as a {@link CompletableFuture}
*/
private class AsyncHttpJoinConverterContext {
private final CompletableFuture future;
private final AsyncHttpJoinConverter converter;
@Getter
private final Callback © 2015 - 2025 Weber Informatics LLC | Privacy Policy