io.kestra.plugin.mongodb.AbstractLoad Maven / Gradle / Ivy
package io.kestra.plugin.mongodb;
import com.mongodb.bulk.BulkWriteResult;
import com.mongodb.client.MongoClient;
import com.mongodb.client.MongoCollection;
import com.mongodb.client.model.WriteModel;
import io.kestra.core.models.annotations.PluginProperty;
import io.kestra.core.models.executions.metrics.Counter;
import io.kestra.core.models.tasks.RunnableTask;
import io.kestra.core.runners.RunContext;
import io.kestra.core.serializers.FileSerde;
import io.swagger.v3.oas.annotations.media.Schema;
import lombok.*;
import lombok.experimental.SuperBuilder;
import org.bson.conversions.Bson;
import org.slf4j.Logger;
import java.io.BufferedReader;
import java.io.InputStreamReader;
import java.net.URI;
import java.util.ArrayList;
import java.util.List;
import java.util.concurrent.atomic.AtomicInteger;
import java.util.concurrent.atomic.AtomicLong;
import jakarta.validation.constraints.NotNull;
import reactor.core.publisher.Flux;
@SuperBuilder
@ToString
@EqualsAndHashCode
@Getter
@NoArgsConstructor
public abstract class AbstractLoad extends AbstractTask implements RunnableTask {
@Schema(
title = "The source file."
)
@PluginProperty(dynamic = true)
@NotNull
private String from;
@Schema(
title = "Chunk size for every bulk request."
)
@PluginProperty(dynamic = true)
@Builder.Default
private Integer chunk = 1000;
abstract protected Flux> source(RunContext runContext, BufferedReader inputStream) throws Exception;
@Override
public Output run(RunContext runContext) throws Exception {
Logger logger = runContext.logger();
URI from = new URI(runContext.render(this.from));
try (
MongoClient client = this.connection.client(runContext);
BufferedReader inputStream = new BufferedReader(new InputStreamReader(runContext.storage().getFile(from)), FileSerde.BUFFER_SIZE)
) {
MongoCollection collection = this.collection(runContext, client);
AtomicLong count = new AtomicLong();
AtomicInteger matchedCount = new AtomicInteger();
AtomicInteger insertedCount = new AtomicInteger();
AtomicInteger modifiedCount = new AtomicInteger();
AtomicInteger deletedCount = new AtomicInteger();
Flux flowable = this.source(runContext, inputStream)
.doOnNext(docWriteRequest -> {
count.incrementAndGet();
})
.buffer(this.chunk, this.chunk)
.map(indexRequests -> {
List> bulkOperations = new ArrayList<>(indexRequests);
return collection.bulkWrite(bulkOperations);
})
.doOnNext(bulkItemResponse -> {
matchedCount.addAndGet(bulkItemResponse.getMatchedCount());
insertedCount.addAndGet(bulkItemResponse.getInsertedCount());
modifiedCount.addAndGet(bulkItemResponse.getModifiedCount());
deletedCount.addAndGet(bulkItemResponse.getDeletedCount());
});
// metrics & finalize
Long requestCount = flowable.count().block();
runContext.metric(Counter.of(
"requests.count", requestCount,
"database", collection.getNamespace().getDatabaseName(),
"collection", collection.getNamespace().getCollectionName()
));
runContext.metric(Counter.of(
"records", count.get(),
"database", collection.getNamespace().getDatabaseName(),
"collection", collection.getNamespace().getCollectionName()
));
logger.info(
"Successfully sent {} requests for {} records",
requestCount,
count.get()
);
return Output.builder()
.size(count.get())
.matchedCount(matchedCount.get())
.insertedCount(insertedCount.get())
.modifiedCount(modifiedCount.get())
.deletedCount(deletedCount.get())
.build();
}
}
@Builder
@Getter
public static class Output implements io.kestra.core.models.tasks.Output {
@Schema(
title = "The number of rows processed."
)
private Long size;
@Schema(
title = "The number of documents inserted by the write operation."
)
@Builder.Default
private int insertedCount = 0;
@Schema(
title = "The number of documents matched by updates or replacements in the write operation."
)
@Builder.Default
private int matchedCount = 0;
@Schema(
title = "The number of documents deleted by the write operation."
)
@Builder.Default
private int deletedCount = 0;
@Schema(
title = "The number of documents modified by the write operation."
)
@Builder.Default
private int modifiedCount = 0;
}
}
© 2015 - 2025 Weber Informatics LLC | Privacy Policy