com.tigergraph.spark.write.TigerGraphStreamWriterFactory Maven / Gradle / Ivy
Show all versions of tigergraph-spark-connector Show documentation
/**
* Copyright (c) 2023 TigerGraph Inc.
*
* Licensed under the Apache License, Version 2.0 (the "License"); you may not use this file
* except in compliance with the License. You may obtain a copy of the License at
*
* http://www.apache.org/licenses/LICENSE-2.0
*
* Unless required by applicable law or agreed to in writing, software distributed under the
* License is distributed on an "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either
* express or implied. See the License for the specific language governing permissions and
* limitations under the License.
*/
package com.tigergraph.spark.write;
import com.tigergraph.spark.TigerGraphConnection;
import com.tigergraph.spark.log.LoggerFactory;
import com.tigergraph.spark.util.Options;
import org.apache.spark.sql.connector.write.streaming.StreamingDataWriterFactory;
import org.apache.spark.sql.types.StructType;
import org.slf4j.Logger;
/**
 * A factory of {@link TigerGraphDataWriter} for streaming write, which is responsible for creating
 * and initializing the actual data writer at executor side.
 */
public class TigerGraphStreamWriterFactory implements StreamingDataWriterFactory {
  private static final Logger logger = LoggerFactory.getLogger(TigerGraphStreamWriterFactory.class);

  /** Schema handed to every {@link TigerGraphDataWriter} created by this factory. */
  private final StructType schema;

  /** Connection handed to every created writer; also the source of the logging options. */
  private final TigerGraphConnection conn;

  /**
   * Creates a factory that builds streaming data writers from the given schema and connection.
   *
   * @param schema the schema passed through to each created writer
   * @param conn the TigerGraph connection passed through to each created writer
   */
  TigerGraphStreamWriterFactory(StructType schema, TigerGraphConnection conn) {
    this.schema = schema;
    this.conn = conn;
    // Report this class itself: the message previously named the batch factory, which made
    // streaming jobs show up as batch writes in the logs.
    logger.info("Created {} for executor", TigerGraphStreamWriterFactory.class);
  }

  /**
   * Creates the data writer for one partition/task/epoch of a streaming write.
   *
   * <p>If a log level option is present on the connection, the JUL logger is (re-)initialized
   * with the configured level and log file before the writer is created.
   *
   * @param partitionId the partition id forwarded to the writer
   * @param taskId the task id forwarded to the writer
   * @param epochId the streaming epoch id forwarded to the writer
   * @return a new {@link TigerGraphDataWriter} built from this factory's schema and connection
   */
  @Override
  public TigerGraphDataWriter createWriter(int partitionId, long taskId, long epochId) {
    // re-init logger for spark executors
    Options opts = conn.getOpts();
    if (opts.containsOption(Options.LOG_LEVEL)) {
      LoggerFactory.initJULLogger(opts.getInt(Options.LOG_LEVEL), opts.getString(Options.LOG_FILE));
    }
    logger.info(
        "Create TigerGraph streaming writer for partitionId {}, taskId {}, epochId {}.",
        partitionId,
        taskId,
        epochId);
    return new TigerGraphDataWriter(schema, conn, partitionId, taskId, epochId);
  }
}