org.apache.avro.tool.DataFileReadTool Maven / Gradle / Ivy
Go to download
Show more of this group Show more artifacts with this name
Show all versions of avro-tools Show documentation
Show all versions of avro-tools Show documentation
Avro command line tools and utilities
/*
* Licensed to the Apache Software Foundation (ASF) under one
* or more contributor license agreements. See the NOTICE file
* distributed with this work for additional information
* regarding copyright ownership. The ASF licenses this file
* to you under the Apache License, Version 2.0 (the
* "License"); you may not use this file except in compliance
* with the License. You may obtain a copy of the License at
*
* https://www.apache.org/licenses/LICENSE-2.0
*
* Unless required by applicable law or agreed to in writing, software
* distributed under the License is distributed on an "AS IS" BASIS,
* WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
* See the License for the specific language governing permissions and
* limitations under the License.
*/
package org.apache.avro.tool;
import java.io.BufferedInputStream;
import java.io.InputStream;
import java.io.PrintStream;
import java.util.ArrayList;
import java.util.List;
import joptsimple.OptionParser;
import joptsimple.OptionSet;
import joptsimple.OptionSpec;
import org.apache.avro.AvroRuntimeException;
import org.apache.avro.Schema;
import org.apache.avro.file.DataFileStream;
import org.apache.avro.io.DatumWriter;
import org.apache.avro.generic.GenericDatumReader;
import org.apache.avro.generic.GenericDatumWriter;
import org.apache.avro.io.EncoderFactory;
import org.apache.avro.io.JsonEncoder;
/** Reads an Avro data file and dumps its contents as JSON. */
public class DataFileReadTool implements Tool {
/** Record count interpolated as the default into the help text of the {@code head} option. */
private static final long DEFAULT_HEAD_COUNT = 10;
/**
 * Reports the name of this tool.
 *
 * @return the fixed name {@code "tojson"}
 */
@Override
public String getName() {
  final String toolName = "tojson";
  return toolName;
}
/**
 * Supplies a one-line summary of this tool.
 *
 * @return a fixed sentence stating that the tool dumps an Avro data file as
 *         JSON, either one record per line or pretty-printed
 */
@Override
public String getShortDescription() {
  final String summary = "Dumps an Avro data file as JSON, record per line or pretty.";
  return summary;
}
@Override
public int run(InputStream stdin, PrintStream out, PrintStream err, List args) throws Exception {
OptionParser optionParser = new OptionParser();
OptionSpec prettyOption = optionParser.accepts("pretty", "Turns on pretty printing.");
String headDesc = String.format("Converts the first X records (default is %d).", DEFAULT_HEAD_COUNT);
OptionSpec headOption = optionParser.accepts("head", headDesc).withOptionalArg();
OptionSpec readerSchemaFileOption = optionParser.accepts("reader-schema-file", "Reader schema file")
.withOptionalArg().ofType(String.class);
OptionSpec readerSchemaOption = optionParser.accepts("reader-schema", "Reader schema").withOptionalArg()
.ofType(String.class);
OptionSet optionSet = optionParser.parse(args.toArray(new String[0]));
Boolean pretty = optionSet.has(prettyOption);
List nargs = new ArrayList<>((List) optionSet.nonOptionArguments());
String readerSchemaStr = readerSchemaOption.value(optionSet);
String readerSchemaFile = readerSchemaFileOption.value(optionSet);
Schema readerSchema = null;
if (readerSchemaFile != null) {
readerSchema = Util.parseSchemaFromFS(readerSchemaFile);
} else if (readerSchemaStr != null) {
readerSchema = new Schema.Parser().parse(readerSchemaStr);
}
long headCount = getHeadCount(optionSet, headOption, nargs);
if (nargs.size() != 1) {
printHelp(err);
err.println();
optionParser.printHelpOn(err);
return 1;
}
BufferedInputStream inStream = Util.fileOrStdin(nargs.get(0), stdin);
GenericDatumReader
© 2015 - 2025 Weber Informatics LLC | Privacy Policy