All downloads are free. Search and download functionality uses the official Maven repository.

org.apache.druid.data.input.avro.GenericAvroJsonProvider Maven / Gradle / Ivy

The newest version!
/*
 * Licensed to the Apache Software Foundation (ASF) under one
 * or more contributor license agreements.  See the NOTICE file
 * distributed with this work for additional information
 * regarding copyright ownership.  The ASF licenses this file
 * to you under the Apache License, Version 2.0 (the
 * "License"); you may not use this file except in compliance
 * with the License.  You may obtain a copy of the License at
 *
 *   http://www.apache.org/licenses/LICENSE-2.0
 *
 * Unless required by applicable law or agreed to in writing,
 * software distributed under the License is distributed on an
 * "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY
 * KIND, either express or implied.  See the License for the
 * specific language governing permissions and limitations
 * under the License.
 */

package org.apache.druid.data.input.avro;

import com.google.common.collect.ImmutableMap;
import org.apache.avro.Schema;
import org.apache.avro.generic.GenericEnumSymbol;
import org.apache.avro.generic.GenericFixed;
import org.apache.avro.generic.GenericRecord;
import org.apache.avro.util.Utf8;
import org.apache.druid.java.util.common.parsers.FlattenerJsonProvider;

import javax.annotation.Nullable;
import java.nio.ByteBuffer;
import java.util.Collection;
import java.util.Collections;
import java.util.List;
import java.util.Map;
import java.util.stream.Collectors;

/**
 * JsonProvider for JsonPath + Avro.
 *
 * <p>Lists are exposed as JSON arrays; {@link Map}s, {@link GenericRecord}s and {@code null} are exposed as JSON
 * objects. When {@code extractUnionsByType} is enabled, the value of a record field whose schema is a union with
 * more than one non-null member is returned as a single-entry map keyed by the name of the member type that is
 * actually present (see {@link #extractUnionTypes(Object)}).
 */
public class GenericAvroJsonProvider extends FlattenerJsonProvider
{
  private final boolean extractUnionsByType;

  /**
   * @param extractUnionsByType whether values of multi-member union fields should be wrapped in a map keyed by the
   *                            member type name instead of being returned directly
   */
  GenericAvroJsonProvider(final boolean extractUnionsByType)
  {
    this.extractUnionsByType = extractUnionsByType;
  }

  /**
   * @return true only for {@link List} instances
   */
  @Override
  public boolean isArray(final Object o)
  {
    return o instanceof List;
  }

  /**
   * @return the element count of a {@link List}, the number of schema fields of a {@link GenericRecord}, and 0 for
   * anything else (including null)
   */
  @Override
  public int length(final Object o)
  {
    if (o instanceof List) {
      return ((List<?>) o).size();
    } else if (o instanceof GenericRecord) {
      return ((GenericRecord) o).getSchema().getFields().size();
    } else {
      return 0;
    }
  }

  /**
   * Returns the property names of a map-like object.
   *
   * @return an empty set for null, the stringified keys of a {@link Map}, or the schema field names of a
   * {@link GenericRecord}
   *
   * @throws UnsupportedOperationException for any other kind of object
   */
  @Override
  public Collection<String> getPropertyKeys(final Object o)
  {
    if (o == null) {
      return Collections.emptySet();
    } else if (o instanceof Map) {
      // Keys may be Utf8 (or any other type), so they are normalized to String via String.valueOf.
      return ((Map<?, ?>) o).keySet().stream().map(String::valueOf).collect(Collectors.toSet());
    } else if (o instanceof GenericRecord) {
      return ((GenericRecord) o).getSchema().getFields().stream().map(Schema.Field::name).collect(Collectors.toSet());
    } else {
      throw new UnsupportedOperationException("Unused");
    }
  }

  /**
   * Looks up the property {@code s} on a map-like object.
   *
   * @param o null, a {@link GenericRecord} or a {@link Map}
   * @param s property name
   *
   * @return null if {@code o} is null; for a record, the field value (wrapped by {@link #extractUnionTypes(Object)}
   * when union extraction is enabled and the field is an extractable union); for a map, the value stored under
   * {@code s}, falling back to the value stored under the equivalent {@link Utf8} key
   *
   * @throws UnsupportedOperationException if {@code o} is any other kind of object
   */
  @Nullable
  @Override
  public Object getMapValue(final Object o, final String s)
  {
    if (o == null) {
      return null;
    } else if (o instanceof GenericRecord) {
      final GenericRecord record = (GenericRecord) o;
      // getField returns null for a name that is not in the schema; isExtractableUnion tolerates that, so a missing
      // field is handled by record.get(s) exactly as it is when union extraction is disabled.
      if (extractUnionsByType && isExtractableUnion(record.getSchema().getField(s))) {
        return extractUnionTypes(record.get(s));
      }
      return record.get(s);
    } else if (o instanceof Map) {
      final Map<?, ?> theMap = (Map<?, ?>) o;
      if (theMap.containsKey(s)) {
        return theMap.get(s);
      } else {
        // The map may be keyed by Utf8 rather than String, so retry the lookup with a Utf8 key.
        final Utf8 utf8Key = new Utf8(s);
        return theMap.get(utf8Key);
      }
    } else {
      throw new UnsupportedOperationException(o.getClass().getName());
    }
  }

  /**
   * Stores {@code o2} under key {@code o1} in a {@link Map}, or under the field named {@code String.valueOf(o1)} in
   * a {@link GenericRecord}.
   *
   * @throws UnsupportedOperationException if {@code o} is neither a map nor a record
   */
  @Override
  public void setProperty(final Object o, final Object o1, final Object o2)
  {
    if (o instanceof Map) {
      // The key/value types of the target map are unknown here; the cast only exists to allow the put.
      @SuppressWarnings("unchecked")
      final Map<Object, Object> target = (Map<Object, Object>) o;
      target.put(o1, o2);
    } else if (o instanceof GenericRecord) {
      ((GenericRecord) o).put(String.valueOf(o1), o2);
    } else {
      throw new UnsupportedOperationException();
    }
  }

  /**
   * @return true for null, {@link Map} and {@link GenericRecord}. Null is accepted so that it behaves like an empty
   * object: {@link #getPropertyKeys(Object)} returns no keys and {@link #getMapValue(Object, String)} returns null.
   */
  @Override
  public boolean isMap(final Object o)
  {
    return o == null || o instanceof Map || o instanceof GenericRecord;
  }

  /**
   * @param field schema field to inspect, or null if the record's schema has no field of the requested name
   *
   * @return true if the field exists and its schema is a union with more than one non-null member type
   */
  private boolean isExtractableUnion(@Nullable final Schema.Field field)
  {
    return field != null &&
           field.schema().isUnion() &&
           field.schema().getTypes().stream().filter(type -> type.getType() != Schema.Type.NULL).count() > 1;
  }

  /**
   * Wraps a union member value in a single-entry map keyed by the name of its Avro type.
   *
   * @param o the value read from a union field
   *
   * @return a single-entry map of type name to {@code o}, or an empty map if {@code o} is null or of an unrecognized
   * type
   */
  private Map<String, Object> extractUnionTypes(final Object o)
  {
    // Primitive types and unnamed complex types are keyed by their type name.
    // Complex named types are keyed by their names.
    // This is safe because an Avro union can only contain a single member of each unnamed type and duplicates
    // of the same named type are not allowed, i.e. only a single array is allowed, multiple records are allowed as
    // long as each has a unique name.
    // The Avro null type is elided as its value can only ever be null.
    if (o instanceof Integer) {
      return ImmutableMap.of("int", o);
    } else if (o instanceof Long) {
      return ImmutableMap.of("long", o);
    } else if (o instanceof Float) {
      return ImmutableMap.of("float", o);
    } else if (o instanceof Double) {
      return ImmutableMap.of("double", o);
    } else if (o instanceof Boolean) {
      return ImmutableMap.of("boolean", o);
    } else if (o instanceof CharSequence) {
      // Avro strings may be materialized as Utf8 or as java.lang.String; both are CharSequences.
      return ImmutableMap.of("string", o);
    } else if (o instanceof ByteBuffer) {
      return ImmutableMap.of("bytes", o);
    } else if (o instanceof Map) {
      return ImmutableMap.of("map", o);
    } else if (o instanceof List) {
      return ImmutableMap.of("array", o);
    } else if (o instanceof GenericRecord) {
      return ImmutableMap.of(((GenericRecord) o).getSchema().getName(), o);
    } else if (o instanceof GenericFixed) {
      return ImmutableMap.of(((GenericFixed) o).getSchema().getName(), o);
    } else if (o instanceof GenericEnumSymbol) {
      return ImmutableMap.of(((GenericEnumSymbol) o).getSchema().getName(), o);
    }
    return ImmutableMap.of();
  }

  /**
   * Converts {@link Utf8} values to {@link String}; every other value is returned unchanged.
   */
  @Override
  public Object unwrap(final Object o)
  {
    if (o instanceof Utf8) {
      return o.toString();
    }

    return o;
  }
}




© 2015 - 2025 Weber Informatics LLC | Privacy Policy