All Downloads are FREE. Search and download functionalities are using the official Maven repository.

org.apache.beam.sdk.coders.StandardCoder Maven / Gradle / Ivy

/*
 * Licensed to the Apache Software Foundation (ASF) under one
 * or more contributor license agreements.  See the NOTICE file
 * distributed with this work for additional information
 * regarding copyright ownership.  The ASF licenses this file
 * to you under the Apache License, Version 2.0 (the
 * "License"); you may not use this file except in compliance
 * with the License.  You may obtain a copy of the License at
 *
 *     http://www.apache.org/licenses/LICENSE-2.0
 *
 * Unless required by applicable law or agreed to in writing, software
 * distributed under the License is distributed on an "AS IS" BASIS,
 * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
 * See the License for the specific language governing permissions and
 * limitations under the License.
 */
package org.apache.beam.sdk.coders;

import static com.google.common.base.Preconditions.checkNotNull;
import static org.apache.beam.sdk.util.Structs.addList;
import static org.apache.beam.sdk.util.Structs.addString;
import static org.apache.beam.sdk.util.Structs.addStringList;

import com.google.common.collect.Lists;
import com.google.common.io.ByteStreams;
import com.google.common.io.CountingOutputStream;
import java.io.ByteArrayOutputStream;
import java.util.ArrayList;
import java.util.Arrays;
import java.util.Collection;
import java.util.Collections;
import java.util.List;
import org.apache.beam.sdk.util.CloudObject;
import org.apache.beam.sdk.util.PropertyNames;
import org.apache.beam.sdk.util.common.ElementByteSizeObserver;
import org.apache.beam.sdk.values.TypeDescriptor;

/**
 * An abstract base class to implement a {@link Coder} that defines equality, hashing, and printing
 * via the class name and recursively using {@link #getComponents}.
 *
 * 

To extend {@link StandardCoder}, override the following methods as appropriate: * *

    *
  • {@link #getComponents}: the default implementation returns {@link #getCoderArguments}.
  • *
  • {@link #getEncodedElementByteSize} and * {@link #isRegisterByteSizeObserverCheap}: the * default implementation encodes values to bytes and counts the bytes, which is considered * expensive.
  • *
  • {@link #getEncodingId} and {@link #getAllowedEncodings}: by default, the encoding id * is the empty string, so only the canonical name of the subclass will be used for * compatibility checks, and no other encoding ids are allowed.
  • *
*/ public abstract class StandardCoder implements Coder { protected StandardCoder() {} @Override public String getEncodingId() { return ""; } @Override public Collection getAllowedEncodings() { return Collections.emptyList(); } /** * Returns the list of {@link Coder Coders} that are components of this {@link Coder}. */ public List> getComponents() { List> coderArguments = getCoderArguments(); if (coderArguments == null) { return Collections.emptyList(); } else { return coderArguments; } } /** * {@inheritDoc} * * @return {@code true} if the two {@link StandardCoder} instances have the * same class and equal components. */ @Override public boolean equals(Object o) { if (o == null || this.getClass() != o.getClass()) { return false; } StandardCoder that = (StandardCoder) o; return this.getComponents().equals(that.getComponents()); } @Override public int hashCode() { return getClass().hashCode() * 31 + getComponents().hashCode(); } @Override public String toString() { StringBuilder builder = new StringBuilder(); String s = getClass().getName(); builder.append(s.substring(s.lastIndexOf('.') + 1)); List> componentCoders = getComponents(); if (!componentCoders.isEmpty()) { builder.append('('); boolean first = true; for (Coder componentCoder : componentCoders) { if (first) { first = false; } else { builder.append(','); } builder.append(componentCoder.toString()); } builder.append(')'); } return builder.toString(); } /** * Adds the following properties to the {@link CloudObject} representation: *
    *
  • component_encodings: A list of coders represented as {@link CloudObject}s * equivalent to the {@link #getCoderArguments}.
  • *
  • encoding_id: An identifier for the binary format written by {@link #encode}. See * {@link #getEncodingId} for further details.
  • *
  • allowed_encodings: A collection of encodings supported by {@link #decode} in * addition to the encoding from {@link #getEncodingId()} (which is assumed supported). * See {@link #getAllowedEncodings} for further details.
  • *
* *

{@link StandardCoder} implementations should override {@link #initializeCloudObject} * to customize the {@link CloudObject} representation. */ @Override public final CloudObject asCloudObject() { CloudObject result = initializeCloudObject(); List> components = getComponents(); if (!components.isEmpty()) { List cloudComponents = new ArrayList<>(components.size()); for (Coder coder : components) { cloudComponents.add(coder.asCloudObject()); } addList(result, PropertyNames.COMPONENT_ENCODINGS, cloudComponents); } String encodingId = getEncodingId(); checkNotNull(encodingId, "Coder.getEncodingId() must not return null."); if (!encodingId.isEmpty()) { addString(result, PropertyNames.ENCODING_ID, encodingId); } Collection allowedEncodings = getAllowedEncodings(); if (!allowedEncodings.isEmpty()) { addStringList(result, PropertyNames.ALLOWED_ENCODINGS, Lists.newArrayList(allowedEncodings)); } return result; } /** * Subclasses should override this method to customize the {@link CloudObject} * representation. {@link StandardCoder#asCloudObject} delegates to this method * to provide an initial {@link CloudObject}. * *

The default implementation returns a {@link CloudObject} using * {@link Object#getClass} for the type. */ protected CloudObject initializeCloudObject() { return CloudObject.forClass(getClass()); } /** * {@inheritDoc} * * @return {@code false} unless it is overridden. {@link StandardCoder#registerByteSizeObserver} * invokes {@link #getEncodedElementByteSize} which requires re-encoding an element * unless it is overridden. This is considered expensive. */ @Override public boolean isRegisterByteSizeObserverCheap(T value, Context context) { return false; } /** * Returns the size in bytes of the encoded value using this coder. */ protected long getEncodedElementByteSize(T value, Context context) throws Exception { try { CountingOutputStream os = new CountingOutputStream(ByteStreams.nullOutputStream()); encode(value, os, context); return os.getCount(); } catch (Exception exn) { throw new IllegalArgumentException( "Unable to encode element '" + value + "' with coder '" + this + "'.", exn); } } /** * {@inheritDoc} * *

For {@link StandardCoder} subclasses, this notifies {@code observer} about the byte size * of the encoded value using this coder as returned by {@link #getEncodedElementByteSize}. */ @Override public void registerByteSizeObserver( T value, ElementByteSizeObserver observer, Context context) throws Exception { observer.update(getEncodedElementByteSize(value, context)); } protected void verifyDeterministic(String message, Iterable> coders) throws NonDeterministicException { for (Coder coder : coders) { try { coder.verifyDeterministic(); } catch (NonDeterministicException e) { throw new NonDeterministicException(this, message, e); } } } protected void verifyDeterministic(String message, Coder... coders) throws NonDeterministicException { verifyDeterministic(message, Arrays.asList(coders)); } /** * {@inheritDoc} * * @return {@code false} for {@link StandardCoder} unless overridden. */ @Override public boolean consistentWithEquals() { return false; } @Override public Object structuralValue(T value) throws Exception { if (value != null && consistentWithEquals()) { return value; } else { try { ByteArrayOutputStream os = new ByteArrayOutputStream(); encode(value, os, Context.OUTER); return new StructuralByteArray(os.toByteArray()); } catch (Exception exn) { throw new IllegalArgumentException( "Unable to encode element '" + value + "' with coder '" + this + "'.", exn); } } } @SuppressWarnings("unchecked") @Override public TypeDescriptor getEncodedTypeDescriptor() { return (TypeDescriptor) TypeDescriptor.of(getClass()).resolveType(new TypeDescriptor() {}.getType()); } }





© 2015 - 2024 Weber Informatics LLC | Privacy Policy