org.apache.beam.sdk.io.PatchedSerializableAvroCodecFactory Maven / Gradle / Ivy
Go to download
Show more of this group Show more artifacts with this name
Show all versions of scio-smb_2.13 Show documentation
Show all versions of scio-smb_2.13 Show documentation
Sort Merge Bucket source/sink implementations for Apache Beam
The newest version!
/*
* Copyright 2019 Spotify AB.
*
* Licensed under the Apache License, Version 2.0 (the "License");
* you may not use this file except in compliance with the License.
* You may obtain a copy of the License at
*
* http://www.apache.org/licenses/LICENSE-2.0
*
* Unless required by applicable law or agreed to in writing,
* software distributed under the License is distributed on an
* "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY
* KIND, either express or implied. See the License for the
* specific language governing permissions and limitations
* under the License.
*/
package org.apache.beam.sdk.io;
import static org.apache.avro.file.DataFileConstants.BZIP2_CODEC;
import static org.apache.avro.file.DataFileConstants.DEFLATE_CODEC;
import static org.apache.avro.file.DataFileConstants.NULL_CODEC;
import static org.apache.avro.file.DataFileConstants.SNAPPY_CODEC;
import static org.apache.avro.file.DataFileConstants.XZ_CODEC;
import static org.apache.beam.vendor.guava.v32_1_2_jre.com.google.common.base.Preconditions.checkNotNull;
import static org.apache.beam.vendor.guava.v32_1_2_jre.com.google.common.base.Preconditions.checkState;
import com.spotify.scio.smb.annotations.PatchedFromBeam;
import java.io.Externalizable;
import java.io.IOException;
import java.io.ObjectInput;
import java.io.ObjectOutput;
import java.util.Arrays;
import java.util.List;
import java.util.regex.Matcher;
import java.util.regex.Pattern;
import javax.annotation.Nullable;
import org.apache.avro.file.CodecFactory;
/**
* A wrapper that allows {@link org.apache.avro.file.CodecFactory}s to be serialized using Java's
* standard serialization mechanisms.
*/
@PatchedFromBeam(origin = "org.apache.beam.sdk.io.SerializableAvroCodecFactory")
public class PatchedSerializableAvroCodecFactory implements Externalizable {
// Matches Beam 2.16.0
private static final long serialVersionUID = 7445324844109564303L;
private static final List noOptAvroCodecs =
Arrays.asList(NULL_CODEC, SNAPPY_CODEC, BZIP2_CODEC);
private static final Pattern deflatePattern = Pattern.compile(DEFLATE_CODEC + "-(?-?\\d)");
private static final Pattern xzPattern = Pattern.compile(XZ_CODEC + "-(?\\d)");
private @Nullable CodecFactory codecFactory;
// For java.io.Externalizable
public PatchedSerializableAvroCodecFactory() {}
public PatchedSerializableAvroCodecFactory(CodecFactory codecFactory) {
checkNotNull(codecFactory, "Codec can't be null");
checkState(checkIsSupportedCodec(codecFactory), "%s is not supported", codecFactory);
this.codecFactory = codecFactory;
}
private boolean checkIsSupportedCodec(CodecFactory codecFactory) {
final String codecStr = codecFactory.toString();
return noOptAvroCodecs.contains(codecStr)
|| deflatePattern.matcher(codecStr).matches()
|| xzPattern.matcher(codecStr).matches();
}
@Override
public void writeExternal(ObjectOutput out) throws IOException {
out.writeUTF(codecFactory.toString());
}
@Override
public void readExternal(ObjectInput in) throws IOException, ClassNotFoundException {
final String codecStr = in.readUTF();
switch (codecStr) {
case NULL_CODEC:
case SNAPPY_CODEC:
case BZIP2_CODEC:
codecFactory = CodecFactory.fromString(codecStr);
return;
}
Matcher deflateMatcher = deflatePattern.matcher(codecStr);
if (deflateMatcher.find()) {
codecFactory = CodecFactory.deflateCodec(Integer.parseInt(deflateMatcher.group("level")));
return;
}
Matcher xzMatcher = xzPattern.matcher(codecStr);
if (xzMatcher.find()) {
codecFactory = CodecFactory.xzCodec(Integer.parseInt(xzMatcher.group("level")));
return;
}
throw new IllegalStateException(codecStr + " is not supported");
}
public CodecFactory getCodec() {
return codecFactory;
}
@Override
public String toString() {
checkNotNull(codecFactory, "Inner CodecFactory is null, please use non default constructor");
return codecFactory.toString();
}
}
© 2015 - 2025 Weber Informatics LLC | Privacy Policy