com.marklogic.flux.impl.importdata.ImportFilesCommand Maven / Gradle / Ivy
Go to download
Show more of this group Show more artifacts with this name
Show all versions of flux-api Show documentation
Show all versions of flux-api Show documentation
Flux API for data movement with MarkLogic
/*
* Copyright © 2024 MarkLogic Corporation. All Rights Reserved.
*/
package com.marklogic.flux.impl.importdata;
import com.marklogic.flux.api.CompressionType;
import com.marklogic.flux.api.GenericFilesImporter;
import com.marklogic.flux.impl.OptionsUtil;
import com.marklogic.spark.Options;
import picocli.CommandLine;
import java.util.Map;
import java.util.function.Consumer;
/**
 * Picocli command registered under the name {@code import-files}. It is both a CLI
 * command (via the two mixed-in parameter objects) and an implementation of the
 * {@link GenericFilesImporter} fluent API, whose methods simply forward to those
 * same parameter objects.
 *
 * <p>NOTE(review): {@code Consumer} and {@code Map} are used as raw types throughout
 * this class; the intended type arguments are presumably fixed by
 * {@code GenericFilesImporter} and the parent params classes - confirm and
 * parameterize there rather than guessing here.
 */
@CommandLine.Command(
    name = "import-files",
    description = "Read local, HDFS, and S3 files and write the contents of each file as a document in MarkLogic."
)
public class ImportFilesCommand extends AbstractImportFilesCommand implements GenericFilesImporter {

    /** Options controlling how files are read; populated by picocli or by {@code from(...)}. */
    @CommandLine.Mixin
    private ReadGenericFilesParams readParams = new ReadGenericFilesParams();

    /** Options controlling how documents are written; populated by picocli or by {@code to(...)}. */
    @CommandLine.Mixin
    private WriteGenericDocumentsParams writeParams = new WriteGenericDocumentsParams();

    // ---------------------------------------------------------------
    // GenericFilesImporter fluent API
    // ---------------------------------------------------------------

    /**
     * Hands the read parameters to the caller-supplied callback for configuration.
     *
     * @param consumer callback that receives this command's read parameters
     * @return this command, for chaining
     */
    @Override
    public GenericFilesImporter from(Consumer consumer) {
        consumer.accept(this.readParams);
        return this;
    }

    /**
     * Shortcut for configuring only the paths to read from.
     *
     * @param paths one or more paths, forwarded to the read parameters
     * @return this command, for chaining
     */
    @Override
    public GenericFilesImporter from(String... paths) {
        this.readParams.paths(paths);
        return this;
    }

    /**
     * Hands the write parameters to the caller-supplied callback for configuration.
     *
     * @param consumer callback that receives this command's write parameters
     * @return this command, for chaining
     */
    @Override
    public GenericFilesImporter to(Consumer consumer) {
        consumer.accept(this.writeParams);
        return this;
    }

    // ---------------------------------------------------------------
    // Hooks required by AbstractImportFilesCommand
    // ---------------------------------------------------------------

    /** @return the {@code MARKLOGIC_CONNECTOR} constant as the read format */
    @Override
    protected String getReadFormat() {
        return MARKLOGIC_CONNECTOR;
    }

    /** @return the mixed-in read parameters */
    @Override
    protected ReadFilesParams getReadParams() {
        return this.readParams;
    }

    /** @return the mixed-in write parameters */
    @Override
    protected WriteDocumentParams getWriteParams() {
        return this.writeParams;
    }

    /**
     * Read-side parameters for generic files: adds compression, encoding and
     * partition-count settings on top of whatever {@code ReadFilesParams} provides.
     */
    public static class ReadGenericFilesParams extends ReadFilesParams implements ReadGenericFilesOptions {

        @CommandLine.Option(
            names = "--compression",
            description = "When importing compressed files, specify the type of compression used. "
                + OptionsUtil.VALID_VALUES_DESCRIPTION
        )
        private CompressionType compressionType;

        @CommandLine.Option(
            names = "--encoding",
            description = "Specify an encoding when reading files."
        )
        private String encoding;

        @CommandLine.Option(
            names = "--partitions",
            description = "Specifies the number of partitions used for reading files."
        )
        private int partitions;

        /**
         * @param compressionType compression used by the files being imported
         * @return this params object, for chaining
         */
        @Override
        public ReadGenericFilesOptions compressionType(CompressionType compressionType) {
            this.compressionType = compressionType;
            return this;
        }

        /**
         * @param encoding encoding to apply when reading files
         * @return this params object, for chaining
         */
        @Override
        public ReadGenericFilesOptions encoding(String encoding) {
            this.encoding = encoding;
            return this;
        }

        /**
         * @param partitions number of partitions used for reading files
         * @return this params object, for chaining
         */
        @Override
        public ReadGenericFilesOptions partitions(int partitions) {
            this.partitions = partitions;
            return this;
        }

        /**
         * Starts from the parent's options and adds the partition count, the
         * compression type (by {@code name()}, or {@code null} when unset) and the
         * encoding.
         *
         * <p>NOTE(review): how {@code OptionsUtil.addOptions} treats {@code null}
         * values is not visible here - presumably they are skipped; confirm.
         *
         * @return the combined options map
         */
        @Override
        public Map makeOptions() {
            return OptionsUtil.addOptions(
                super.makeOptions(),
                Options.READ_NUM_PARTITIONS, OptionsUtil.intOption(this.partitions),
                Options.READ_FILES_COMPRESSION, this.compressionType == null ? null : this.compressionType.name(),
                Options.READ_FILES_ENCODING, this.encoding
            );
        }
    }

    /**
     * Write-side parameters for generic documents: adds a forced document type on
     * top of whatever {@code WriteDocumentParams} provides.
     */
    public static class WriteGenericDocumentsParams extends WriteDocumentParams implements WriteGenericDocumentsOptions {

        private DocumentType documentType;

        /**
         * Doubles as the picocli setter for {@code --document-type}.
         *
         * @param documentType type to force for documents with an unrecognized URI extension
         * @return this params object, for chaining
         */
        @Override
        @CommandLine.Option(
            names = "--document-type",
            description = "Forces a type for any document with an unrecognized URI extension. "
                + OptionsUtil.VALID_VALUES_DESCRIPTION
        )
        public WriteGenericDocumentsOptions documentType(DocumentType documentType) {
            this.documentType = documentType;
            return this;
        }

        /**
         * Starts from the parent's options and adds the document type (by
         * {@code name()}, or {@code null} when unset).
         *
         * @return the combined options map
         */
        @Override
        public Map makeOptions() {
            return OptionsUtil.addOptions(
                super.makeOptions(),
                Options.WRITE_DOCUMENT_TYPE, this.documentType == null ? null : this.documentType.name()
            );
        }
    }
}