// org.apache.hadoop.hive.serde2.lazy.LazyFactory Maven / Gradle / Ivy
/**
* Licensed to the Apache Software Foundation (ASF) under one
* or more contributor license agreements. See the NOTICE file
* distributed with this work for additional information
* regarding copyright ownership. The ASF licenses this file
* to you under the Apache License, Version 2.0 (the
* "License"); you may not use this file except in compliance
* with the License. You may obtain a copy of the License at
*
* http://www.apache.org/licenses/LICENSE-2.0
*
* Unless required by applicable law or agreed to in writing, software
* distributed under the License is distributed on an "AS IS" BASIS,
* WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
* See the License for the specific language governing permissions and
* limitations under the License.
*/
package org.apache.hadoop.hive.serde2.lazy;
import java.util.ArrayList;
import java.util.List;
import org.apache.hadoop.hive.serde2.SerDeException;
import org.apache.hadoop.hive.serde2.lazy.objectinspector.LazyListObjectInspector;
import org.apache.hadoop.hive.serde2.lazy.objectinspector.LazyMapObjectInspector;
import org.apache.hadoop.hive.serde2.lazy.objectinspector.LazyObjectInspectorFactory;
import org.apache.hadoop.hive.serde2.lazy.objectinspector.LazySimpleStructObjectInspector;
import org.apache.hadoop.hive.serde2.lazy.objectinspector.LazyUnionObjectInspector;
import org.apache.hadoop.hive.serde2.lazy.objectinspector.primitive.LazyBinaryObjectInspector;
import org.apache.hadoop.hive.serde2.lazy.objectinspector.primitive.LazyBooleanObjectInspector;
import org.apache.hadoop.hive.serde2.lazy.objectinspector.primitive.LazyByteObjectInspector;
import org.apache.hadoop.hive.serde2.lazy.objectinspector.primitive.LazyDateObjectInspector;
import org.apache.hadoop.hive.serde2.lazy.objectinspector.primitive.LazyDoubleObjectInspector;
import org.apache.hadoop.hive.serde2.lazy.objectinspector.primitive.LazyFloatObjectInspector;
import org.apache.hadoop.hive.serde2.lazy.objectinspector.primitive.LazyHiveCharObjectInspector;
import org.apache.hadoop.hive.serde2.lazy.objectinspector.primitive.LazyHiveDecimalObjectInspector;
import org.apache.hadoop.hive.serde2.lazy.objectinspector.primitive.LazyHiveIntervalYearMonthObjectInspector;
import org.apache.hadoop.hive.serde2.lazy.objectinspector.primitive.LazyHiveIntervalDayTimeObjectInspector;
import org.apache.hadoop.hive.serde2.lazy.objectinspector.primitive.LazyHiveVarcharObjectInspector;
import org.apache.hadoop.hive.serde2.lazy.objectinspector.primitive.LazyIntObjectInspector;
import org.apache.hadoop.hive.serde2.lazy.objectinspector.primitive.LazyLongObjectInspector;
import org.apache.hadoop.hive.serde2.lazy.objectinspector.primitive.LazyObjectInspectorParameters;
import org.apache.hadoop.hive.serde2.lazy.objectinspector.primitive.LazyObjectInspectorParametersImpl;
import org.apache.hadoop.hive.serde2.lazy.objectinspector.primitive.LazyPrimitiveObjectInspectorFactory;
import org.apache.hadoop.hive.serde2.lazy.objectinspector.primitive.LazyShortObjectInspector;
import org.apache.hadoop.hive.serde2.lazy.objectinspector.primitive.LazyStringObjectInspector;
import org.apache.hadoop.hive.serde2.lazy.objectinspector.primitive.LazyTimestampObjectInspector;
import org.apache.hadoop.hive.serde2.lazy.objectinspector.primitive.LazyVoidObjectInspector;
import org.apache.hadoop.hive.serde2.lazydio.LazyDioBoolean;
import org.apache.hadoop.hive.serde2.lazydio.LazyDioByte;
import org.apache.hadoop.hive.serde2.lazydio.LazyDioDouble;
import org.apache.hadoop.hive.serde2.lazydio.LazyDioFloat;
import org.apache.hadoop.hive.serde2.lazydio.LazyDioInteger;
import org.apache.hadoop.hive.serde2.lazydio.LazyDioLong;
import org.apache.hadoop.hive.serde2.lazydio.LazyDioShort;
import org.apache.hadoop.hive.serde2.objectinspector.ObjectInspector;
import org.apache.hadoop.hive.serde2.objectinspector.ObjectInspector.Category;
import org.apache.hadoop.hive.serde2.objectinspector.ObjectInspectorFactory;
import org.apache.hadoop.hive.serde2.objectinspector.ObjectInspectorFactory.ObjectInspectorOptions;
import org.apache.hadoop.hive.serde2.objectinspector.PrimitiveObjectInspector;
import org.apache.hadoop.hive.serde2.objectinspector.PrimitiveObjectInspector.PrimitiveCategory;
import org.apache.hadoop.hive.serde2.typeinfo.ListTypeInfo;
import org.apache.hadoop.hive.serde2.typeinfo.MapTypeInfo;
import org.apache.hadoop.hive.serde2.typeinfo.PrimitiveTypeInfo;
import org.apache.hadoop.hive.serde2.typeinfo.StructTypeInfo;
import org.apache.hadoop.hive.serde2.typeinfo.TypeInfo;
import org.apache.hadoop.hive.serde2.typeinfo.UnionTypeInfo;
import org.apache.hadoop.io.Text;
import org.apache.hadoop.io.Writable;
/**
* LazyFactory.
*
*/
public final class LazyFactory {
/**
* Create a lazy primitive object instance given a primitive object inspector based on it's
* type. It takes a boolean switch to decide whether to return a binary or standard variant
* of the lazy object.
*
* @param poi PrimitiveObjectInspector
* @param typeBinary a switch to return either a LazyPrimtive class or it's binary
* companion
* @return LazyPrimitive extends ObjectInspector, ? extends Writable>
*/
public static LazyPrimitive extends ObjectInspector, ? extends Writable>
createLazyPrimitiveClass(PrimitiveObjectInspector poi, boolean typeBinary) {
if (typeBinary) {
return createLazyPrimitiveBinaryClass(poi);
} else {
return createLazyPrimitiveClass(poi);
}
}
/**
* Create a lazy primitive class given the type name.
*/
public static LazyPrimitive extends ObjectInspector, ? extends Writable>
createLazyPrimitiveClass(PrimitiveObjectInspector oi) {
PrimitiveCategory p = oi.getPrimitiveCategory();
switch (p) {
case BOOLEAN:
return new LazyBoolean((LazyBooleanObjectInspector) oi);
case BYTE:
return new LazyByte((LazyByteObjectInspector) oi);
case SHORT:
return new LazyShort((LazyShortObjectInspector) oi);
case INT:
return new LazyInteger((LazyIntObjectInspector) oi);
case LONG:
return new LazyLong((LazyLongObjectInspector) oi);
case FLOAT:
return new LazyFloat((LazyFloatObjectInspector) oi);
case DOUBLE:
return new LazyDouble((LazyDoubleObjectInspector) oi);
case STRING:
return new LazyString((LazyStringObjectInspector) oi);
case CHAR:
return new LazyHiveChar((LazyHiveCharObjectInspector) oi);
case VARCHAR:
return new LazyHiveVarchar((LazyHiveVarcharObjectInspector) oi);
case DATE:
return new LazyDate((LazyDateObjectInspector) oi);
case TIMESTAMP:
return new LazyTimestamp((LazyTimestampObjectInspector) oi);
case INTERVAL_YEAR_MONTH:
return new LazyHiveIntervalYearMonth((LazyHiveIntervalYearMonthObjectInspector) oi);
case INTERVAL_DAY_TIME:
return new LazyHiveIntervalDayTime((LazyHiveIntervalDayTimeObjectInspector) oi);
case BINARY:
return new LazyBinary((LazyBinaryObjectInspector) oi);
case DECIMAL:
return new LazyHiveDecimal((LazyHiveDecimalObjectInspector) oi);
case VOID:
return new LazyVoid((LazyVoidObjectInspector) oi);
default:
throw new RuntimeException("Internal error: no LazyObject for " + p);
}
}
public static LazyPrimitive extends ObjectInspector, ? extends Writable>
createLazyPrimitiveBinaryClass(PrimitiveObjectInspector poi) {
PrimitiveCategory pc = poi.getPrimitiveCategory();
switch (pc) {
case BOOLEAN:
return new LazyDioBoolean((LazyBooleanObjectInspector) poi);
case BYTE:
return new LazyDioByte((LazyByteObjectInspector) poi);
case SHORT:
return new LazyDioShort((LazyShortObjectInspector) poi);
case INT:
return new LazyDioInteger((LazyIntObjectInspector) poi);
case LONG:
return new LazyDioLong((LazyLongObjectInspector) poi);
case FLOAT:
return new LazyDioFloat((LazyFloatObjectInspector) poi);
case DOUBLE:
return new LazyDioDouble((LazyDoubleObjectInspector) poi);
default:
throw new RuntimeException("Hive Internal Error: no LazyObject for " + poi);
}
}
/**
* Create a hierarchical LazyObject based on the given typeInfo.
*/
public static LazyObject extends ObjectInspector> createLazyObject(ObjectInspector oi) {
ObjectInspector.Category c = oi.getCategory();
switch (c) {
case PRIMITIVE:
return createLazyPrimitiveClass((PrimitiveObjectInspector) oi);
case MAP:
return new LazyMap((LazyMapObjectInspector) oi);
case LIST:
return new LazyArray((LazyListObjectInspector) oi);
case STRUCT:
return new LazyStruct((LazySimpleStructObjectInspector) oi);
case UNION:
return new LazyUnion((LazyUnionObjectInspector) oi);
}
throw new RuntimeException("Hive LazySerDe Internal error.");
}
/**
* Creates a LazyObject based on the LazyObjectInspector. Will create binary variants for
* primitive objects when the switch typeBinary
is specified as true.
*
* @param oi ObjectInspector
* @param typeBinary Boolean value used as switch to return variants of LazyPrimitive
* objects which are initialized from a binary format for the data.
* @return LazyObject extends ObjectInspector>
*/
public static LazyObject extends ObjectInspector>
createLazyObject(ObjectInspector oi, boolean typeBinary) {
if (oi.getCategory() == Category.PRIMITIVE) {
return createLazyPrimitiveClass((PrimitiveObjectInspector) oi, typeBinary);
} else {
return createLazyObject(oi);
}
}
/**
* Create a hierarchical ObjectInspector for LazyObject with the given
* typeInfo.
*
* @param typeInfo
* The type information for the LazyObject
* @param separator
* The array of separators for delimiting each level
* @param separatorIndex
* The current level (for separators). List(array), struct uses 1
* level of separator, and map uses 2 levels: the first one for
* delimiting entries, the second one for delimiting key and values.
* @param nullSequence
* The sequence of bytes representing NULL.
* @return The ObjectInspector
* @throws SerDeException
*/
@Deprecated
public static ObjectInspector createLazyObjectInspector(TypeInfo typeInfo,
byte[] separators, int separatorIndex, Text nullSequence, boolean escaped,
byte escapeChar, ObjectInspectorOptions option) throws SerDeException {
return createLazyObjectInspector(typeInfo, separators, separatorIndex, nullSequence,
escaped, escapeChar, false, option);
}
/**
* Create a hierarchical ObjectInspector for LazyObject with the given
* typeInfo.
*
* @param typeInfo
* The type information for the LazyObject
* @param separator
* The array of separators for delimiting each level
* @param separatorIndex
* The current level (for separators). List(array), struct uses 1
* level of separator, and map uses 2 levels: the first one for
* delimiting entries, the second one for delimiting key and values.
* @param nullSequence
* The sequence of bytes representing NULL.
* @return The ObjectInspector
* @throws SerDeException
*/
@Deprecated
public static ObjectInspector createLazyObjectInspector(TypeInfo typeInfo,
byte[] separators, int separatorIndex, Text nullSequence, boolean escaped,
byte escapeChar) throws SerDeException {
return createLazyObjectInspector(typeInfo, separators, separatorIndex, nullSequence,
escaped, escapeChar, false, ObjectInspectorOptions.JAVA);
}
/**
* Create a hierarchical ObjectInspector for LazyObject with the given typeInfo.
*
* @param typeInfo The type information for the LazyObject
* @param separator The array of separators for delimiting each level
* @param separatorIndex The current level (for separators). List(array), struct uses 1 level of
* separator, and map uses 2 levels: the first one for delimiting entries, the second one
* for delimiting key and values.
* @param nullSequence The sequence of bytes representing NULL.
* @param extendedBooleanLiteral whether extended boolean literal set is legal
* @param option the {@link ObjectInspectorOption}
* @return The ObjectInspector
* @throws SerDeException
*/
@Deprecated
public static ObjectInspector createLazyObjectInspector(TypeInfo typeInfo,
byte[] separators, int separatorIndex, Text nullSequence, boolean escaped,
byte escapeChar, boolean extendedBooleanLiteral) throws SerDeException {
return createLazyObjectInspector(typeInfo, separators, separatorIndex, nullSequence, escaped,
escapeChar, extendedBooleanLiteral, ObjectInspectorOptions.JAVA);
}
/**
* Create a hierarchical ObjectInspector for LazyObject with the given typeInfo.
*
* @param typeInfo The type information for the LazyObject
* @param separator The array of separators for delimiting each level
* @param separatorIndex The current level (for separators). List(array), struct uses 1 level of
* separator, and map uses 2 levels: the first one for delimiting entries, the second one
* for delimiting key and values.
* @param nullSequence The sequence of bytes representing NULL.
* @param extendedBooleanLiteral whether extended boolean literal set is legal
* @param option the {@link ObjectInspectorOption}
* @return The ObjectInspector
* @throws SerDeException
*/
@Deprecated
public static ObjectInspector createLazyObjectInspector(TypeInfo typeInfo,
byte[] separators, int separatorIndex, Text nullSequence, boolean escaped,
byte escapeChar, boolean extendedBooleanLiteral, ObjectInspectorOptions option) throws SerDeException {
LazyObjectInspectorParametersImpl lazyParams = new LazyObjectInspectorParametersImpl(
escaped, escapeChar, extendedBooleanLiteral, null, separators, nullSequence);
return createLazyObjectInspector(typeInfo, separatorIndex, lazyParams, option);
}
/**
* Create a hierarchical ObjectInspector for LazyObject with the given typeInfo.
*
* @param typeInfo The type information for the LazyObject
* @param separator The array of separators for delimiting each level
* @param separatorIndex The current level (for separators). List(array), struct uses 1 level of
* separator, and map uses 2 levels: the first one for delimiting entries, the second one
* for delimiting key and values.
* @param lazyParams Params for lazy types
* @param option the {@link ObjectInspectorOption}
* @return The ObjectInspector
* @throws SerDeException
*/
public static ObjectInspector createLazyObjectInspector(TypeInfo typeInfo,
int separatorIndex, LazyObjectInspectorParameters lazyParams,
ObjectInspectorOptions option) throws SerDeException {
ObjectInspector.Category c = typeInfo.getCategory();
switch (c) {
case PRIMITIVE:
return LazyPrimitiveObjectInspectorFactory.getLazyObjectInspector(
(PrimitiveTypeInfo) typeInfo, lazyParams);
case MAP:
return LazyObjectInspectorFactory.getLazySimpleMapObjectInspector(
createLazyObjectInspector(((MapTypeInfo) typeInfo).getMapKeyTypeInfo(),
separatorIndex + 2, lazyParams, option),
createLazyObjectInspector(((MapTypeInfo) typeInfo).getMapValueTypeInfo(),
separatorIndex + 2, lazyParams, option),
LazyUtils.getSeparator(lazyParams.getSeparators(), separatorIndex),
LazyUtils.getSeparator(lazyParams.getSeparators(), separatorIndex+1),
lazyParams);
case LIST:
return LazyObjectInspectorFactory.getLazySimpleListObjectInspector(
createLazyObjectInspector(((ListTypeInfo) typeInfo)
.getListElementTypeInfo(), separatorIndex + 1,
lazyParams, option), LazyUtils.getSeparator(lazyParams.getSeparators(), separatorIndex),
lazyParams);
case STRUCT:
StructTypeInfo structTypeInfo = (StructTypeInfo) typeInfo;
List fieldNames = structTypeInfo.getAllStructFieldNames();
List fieldTypeInfos = structTypeInfo
.getAllStructFieldTypeInfos();
List fieldObjectInspectors = new ArrayList(
fieldTypeInfos.size());
for (int i = 0; i < fieldTypeInfos.size(); i++) {
fieldObjectInspectors.add(createLazyObjectInspector(fieldTypeInfos
.get(i), separatorIndex + 1, lazyParams, option));
}
return LazyObjectInspectorFactory.getLazySimpleStructObjectInspector(
fieldNames, fieldObjectInspectors, null,
LazyUtils.getSeparator(lazyParams.getSeparators(), separatorIndex),
lazyParams, option);
case UNION:
UnionTypeInfo unionTypeInfo = (UnionTypeInfo) typeInfo;
List lazyOIs = new ArrayList();
for (TypeInfo uti : unionTypeInfo.getAllUnionObjectTypeInfos()) {
lazyOIs.add(createLazyObjectInspector(uti,
separatorIndex + 1, lazyParams, option));
}
return LazyObjectInspectorFactory.getLazyUnionObjectInspector(lazyOIs,
LazyUtils.getSeparator(lazyParams.getSeparators(), separatorIndex),
lazyParams);
}
throw new RuntimeException("Hive LazySerDe Internal error.");
}
/**
* Create a hierarchical ObjectInspector for LazyStruct with the given
* columnNames and columnTypeInfos.
*
* @param lastColumnTakesRest
* whether the last column of the struct should take the rest of the
* row if there are extra fields.
* @throws SerDeException
* @see LazyFactory#createLazyObjectInspector(TypeInfo, byte[], int, Text,
* boolean, byte)
*/
@Deprecated
public static ObjectInspector createLazyStructInspector(
List columnNames, List typeInfos, byte[] separators,
Text nullSequence, boolean lastColumnTakesRest, boolean escaped,
byte escapeChar) throws SerDeException {
return createLazyStructInspector(columnNames, typeInfos, separators,
nullSequence, lastColumnTakesRest, escaped, escapeChar, false);
}
/**
* Create a hierarchical ObjectInspector for LazyStruct with the given
* columnNames and columnTypeInfos.
*
* @param lastColumnTakesRest
* whether the last column of the struct should take the rest of the
* row if there are extra fields.
* @param extendedBooleanLiteral whether extended boolean literal set is legal
* @throws SerDeException
* @see LazyFactory#createLazyObjectInspector(TypeInfo, byte[], int, Text,
* boolean, byte)
*/
@Deprecated
public static ObjectInspector createLazyStructInspector(
List columnNames, List typeInfos, byte[] separators,
Text nullSequence, boolean lastColumnTakesRest, boolean escaped,
byte escapeChar, boolean extendedBooleanLiteral) throws SerDeException {
LazyObjectInspectorParametersImpl lazyParams = new LazyObjectInspectorParametersImpl(
escaped, escapeChar, extendedBooleanLiteral, null, separators, nullSequence, lastColumnTakesRest);
return createLazyStructInspector(columnNames, typeInfos, lazyParams);
}
/**
* Create a hierarchical ObjectInspector for LazyStruct with the given
* columnNames and columnTypeInfos.
*
* @param lastColumnTakesRest
* whether the last column of the struct should take the rest of the
* row if there are extra fields.
* @param lazyParams parameters for the lazy types
* @throws SerDeException
* @see LazyFactory#createLazyObjectInspector(TypeInfo, byte[], int, Text,
* boolean, byte)
*/
public static ObjectInspector createLazyStructInspector(
List columnNames, List typeInfos,
LazyObjectInspectorParameters lazyParams) throws SerDeException {
ArrayList columnObjectInspectors = new ArrayList(
typeInfos.size());
for (int i = 0; i < typeInfos.size(); i++) {
columnObjectInspectors.add(LazyFactory.createLazyObjectInspector(
typeInfos.get(i), 1,
lazyParams, ObjectInspectorOptions.JAVA));
}
return LazyObjectInspectorFactory.getLazySimpleStructObjectInspector(
columnNames, columnObjectInspectors, null, lazyParams.getSeparators()[0],
lazyParams, ObjectInspectorOptions.JAVA);
}
/**
* Create a hierarchical ObjectInspector for ColumnarStruct with the given
* columnNames and columnTypeInfos.
* @throws SerDeException
*
* @see LazyFactory#createLazyObjectInspector(TypeInfo, byte[], int, Text,
* boolean, byte)
*/
@Deprecated
public static ObjectInspector createColumnarStructInspector(
List columnNames, List columnTypes, byte[] separators,
Text nullSequence, boolean escaped, byte escapeChar) throws SerDeException {
LazyObjectInspectorParametersImpl lazyParams = new LazyObjectInspectorParametersImpl(
escaped, escapeChar, false, null, separators, nullSequence);
return createColumnarStructInspector(columnNames, columnTypes, lazyParams);
}
/**
* Create a hierarchical ObjectInspector for ColumnarStruct with the given
* columnNames and columnTypeInfos.
* @throws SerDeException
*
* @see LazyFactory#createLazyObjectInspector(TypeInfo, byte[], int, Text,
* boolean, byte)
*/
public static ObjectInspector createColumnarStructInspector(
List columnNames, List columnTypes,
LazyObjectInspectorParameters lazyParams) throws SerDeException {
ArrayList columnObjectInspectors = new ArrayList(
columnTypes.size());
for (int i = 0; i < columnTypes.size(); i++) {
columnObjectInspectors
.add(LazyFactory.createLazyObjectInspector(columnTypes.get(i), 1,
lazyParams, ObjectInspectorOptions.JAVA));
}
return ObjectInspectorFactory.getColumnarStructObjectInspector(columnNames,
columnObjectInspectors);
}
private LazyFactory() {
// prevent instantiation
}
}
// © 2015 - 2025 Weber Informatics LLC | Privacy Policy