io.prestosql.plugin.hive.HiveCoercionRecordCursor Maven / Gradle / Ivy
/*
* Licensed under the Apache License, Version 2.0 (the "License");
* you may not use this file except in compliance with the License.
* You may obtain a copy of the License at
*
* http://www.apache.org/licenses/LICENSE-2.0
*
* Unless required by applicable law or agreed to in writing, software
* distributed under the License is distributed on an "AS IS" BASIS,
* WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
* See the License for the specific language governing permissions and
* limitations under the License.
*/
package io.prestosql.plugin.hive;
import com.google.common.annotations.VisibleForTesting;
import com.google.common.collect.ImmutableList;
import io.airlift.slice.Slice;
import io.prestosql.plugin.hive.HivePageSourceProvider.ColumnMapping;
import io.prestosql.spi.PageBuilder;
import io.prestosql.spi.PrestoException;
import io.prestosql.spi.block.Block;
import io.prestosql.spi.block.BlockBuilder;
import io.prestosql.spi.connector.RecordCursor;
import io.prestosql.spi.type.Type;
import io.prestosql.spi.type.TypeManager;
import io.prestosql.spi.type.VarcharType;
import org.apache.hadoop.hive.serde2.typeinfo.ListTypeInfo;
import org.apache.hadoop.hive.serde2.typeinfo.MapTypeInfo;
import java.util.List;
import static io.airlift.slice.Slices.utf8Slice;
import static io.prestosql.plugin.hive.HiveType.HIVE_BYTE;
import static io.prestosql.plugin.hive.HiveType.HIVE_DOUBLE;
import static io.prestosql.plugin.hive.HiveType.HIVE_FLOAT;
import static io.prestosql.plugin.hive.HiveType.HIVE_INT;
import static io.prestosql.plugin.hive.HiveType.HIVE_LONG;
import static io.prestosql.plugin.hive.HiveType.HIVE_SHORT;
import static io.prestosql.plugin.hive.util.HiveUtil.extractStructFieldTypes;
import static io.prestosql.plugin.hive.util.HiveUtil.isArrayType;
import static io.prestosql.plugin.hive.util.HiveUtil.isMapType;
import static io.prestosql.plugin.hive.util.HiveUtil.isRowType;
import static io.prestosql.spi.StandardErrorCode.NOT_SUPPORTED;
import static java.lang.Float.intBitsToFloat;
import static java.lang.Math.min;
import static java.lang.String.format;
import static java.util.Objects.requireNonNull;
public class HiveCoercionRecordCursor
implements RecordCursor
{
// Cursor that supplies the raw, un-coerced values.
private final RecordCursor delegate;
// Immutable copy of the column mappings handed to the constructor.
private final List<ColumnMapping> columnMappings;
// Indexed by field; an entry is null when that field needs no coercion.
private final Coercer[] coercers;
/**
 * Wraps {@code delegate} and prepares a {@link Coercer} for every column mapping
 * that declares a base type to coerce from.
 *
 * @param columnMappings column mappings, in field order; copied defensively
 * @param typeManager used to resolve the Hive types into engine types
 * @param delegate cursor that supplies the un-coerced values
 * @throws NullPointerException if any argument is null
 * @throws PrestoException with {@code NOT_SUPPORTED} if a declared coercion has no coercer
 */
public HiveCoercionRecordCursor(
        List<ColumnMapping> columnMappings,
        TypeManager typeManager,
        RecordCursor delegate)
{
    requireNonNull(columnMappings, "columns is null");
    requireNonNull(typeManager, "typeManager is null");
    this.delegate = requireNonNull(delegate, "delegate is null");
    this.columnMappings = ImmutableList.copyOf(columnMappings);

    int size = columnMappings.size();
    this.coercers = new Coercer[size];

    // One bridging cursor instance is handed to every coercer created here.
    BridgingRecordCursor bridgingRecordCursor = new BridgingRecordCursor();

    for (int columnIndex = 0; columnIndex < size; columnIndex++) {
        ColumnMapping columnMapping = columnMappings.get(columnIndex);
        // Fields without a coercion source keep a null slot and are served by the delegate directly.
        if (columnMapping.getBaseTypeCoercionFrom().isPresent()) {
            coercers[columnIndex] = createCoercer(
                    typeManager,
                    columnMapping.getBaseTypeCoercionFrom().get(),
                    columnMapping.getHiveColumnHandle().getHiveType(),
                    bridgingRecordCursor);
        }
    }
}
/**
 * Reports the number of completed bytes exactly as the wrapped cursor reports it.
 */
@Override
public long getCompletedBytes()
{
    long completedBytes = delegate.getCompletedBytes();
    return completedBytes;
}
/**
 * Returns the type the wrapped cursor reports for {@code field}; no coercer is consulted.
 */
@Override
public Type getType(int field)
{
    Type delegateType = delegate.getType(field);
    return delegateType;
}
/**
 * Clears the cached state of every coercer, then advances the wrapped cursor.
 *
 * @return whatever the wrapped cursor returns from {@code advanceNextPosition()}
 */
@Override
public boolean advanceNextPosition()
{
    // Cached coerced values belong to the previous position and must be dropped first.
    for (Coercer coercer : coercers) {
        if (coercer == null) {
            continue;
        }
        coercer.reset();
    }
    return delegate.advanceNextPosition();
}
/**
 * Reads a boolean from the field's coercer when one exists, otherwise straight from the delegate.
 */
@Override
public boolean getBoolean(int field)
{
    Coercer coercer = coercers[field];
    return coercer != null
            ? coercer.getBoolean(delegate, field)
            : delegate.getBoolean(field);
}
/**
 * Reads a long from the field's coercer when one exists, otherwise straight from the delegate.
 */
@Override
public long getLong(int field)
{
    Coercer coercer = coercers[field];
    return coercer != null
            ? coercer.getLong(delegate, field)
            : delegate.getLong(field);
}
/**
 * Reads a double from the field's coercer when one exists, otherwise straight from the delegate.
 */
@Override
public double getDouble(int field)
{
    Coercer coercer = coercers[field];
    return coercer != null
            ? coercer.getDouble(delegate, field)
            : delegate.getDouble(field);
}
/**
 * Reads a slice from the field's coercer when one exists, otherwise straight from the delegate.
 */
@Override
public Slice getSlice(int field)
{
    Coercer coercer = coercers[field];
    return coercer != null
            ? coercer.getSlice(delegate, field)
            : delegate.getSlice(field);
}
/**
 * Reads an object from the field's coercer when one exists, otherwise straight from the delegate.
 */
@Override
public Object getObject(int field)
{
    Coercer coercer = coercers[field];
    return coercer != null
            ? coercer.getObject(delegate, field)
            : delegate.getObject(field);
}
/**
 * Reports nullness through the field's coercer when one exists (a coercion may itself
 * produce null), otherwise asks the delegate.
 */
@Override
public boolean isNull(int field)
{
    Coercer coercer = coercers[field];
    return coercer != null
            ? coercer.isNull(delegate, field)
            : delegate.isNull(field);
}
/**
 * Closes the wrapped cursor.
 */
@Override
public void close()
{
    this.delegate.close();
}
/**
 * Reports the read time in nanoseconds exactly as the wrapped cursor reports it.
 */
@Override
public long getReadTimeNanos()
{
    long readTimeNanos = delegate.getReadTimeNanos();
    return readTimeNanos;
}
/**
 * Reports the system memory usage exactly as the wrapped cursor reports it.
 */
@Override
public long getSystemMemoryUsage()
{
    long memoryUsage = delegate.getSystemMemoryUsage();
    return memoryUsage;
}
/**
 * Exposes the wrapped cursor; package-private and intended for tests only.
 */
@VisibleForTesting
RecordCursor getRegularColumnRecordCursor()
{
    return this.delegate;
}
/**
 * Base class for per-field value converters.
 *
 * <p>A coercer computes its value lazily on the first read after {@link #reset()} and
 * caches it until the next reset. Subclasses implement {@link #coerce} and publish the
 * result through one of the {@code set*} methods, or mark the result null via
 * {@link #setIsNull(boolean)}.
 */
private abstract static class Coercer
{
    // Cache state: whether a value was computed since the last reset, and whether it is null.
    private boolean loaded;
    private boolean isNull;

    // One slot per Java carrier type; only the slot written by coerce() is meaningful.
    private boolean booleanValue;
    private long longValue;
    private double doubleValue;
    private Slice sliceValue;
    private Object objectValue;

    /**
     * Converts the current value of {@code field} in {@code delegate} and stores the result
     * with a {@code set*} method. Only invoked when the delegate reports the field as non-null.
     */
    protected abstract void coerce(RecordCursor delegate, int field);

    /**
     * Forgets the cached result so the next read recomputes it.
     */
    public void reset()
    {
        loaded = false;
        isNull = false;
    }

    /**
     * Returns true when the source value is null or the coercion marked the result null.
     */
    public boolean isNull(RecordCursor delegate, int field)
    {
        assureLoaded(delegate, field);
        return this.isNull;
    }

    public boolean getBoolean(RecordCursor delegate, int field)
    {
        assureLoaded(delegate, field);
        return this.booleanValue;
    }

    public long getLong(RecordCursor delegate, int field)
    {
        assureLoaded(delegate, field);
        return this.longValue;
    }

    public double getDouble(RecordCursor delegate, int field)
    {
        assureLoaded(delegate, field);
        return this.doubleValue;
    }

    public Slice getSlice(RecordCursor delegate, int field)
    {
        assureLoaded(delegate, field);
        return this.sliceValue;
    }

    public Object getObject(RecordCursor delegate, int field)
    {
        assureLoaded(delegate, field);
        return this.objectValue;
    }

    /**
     * Computes and caches the coerced value unless that already happened since the last reset.
     */
    private void assureLoaded(RecordCursor delegate, int field)
    {
        if (loaded) {
            return;
        }
        isNull = delegate.isNull(field);
        if (!isNull) {
            // coerce() may still flip isNull to true, e.g. for an unparsable value
            coerce(delegate, field);
        }
        // only marked loaded once coerce() completed without throwing
        loaded = true;
    }

    protected void setIsNull(boolean isNull)
    {
        this.isNull = isNull;
    }

    protected void setBoolean(boolean value)
    {
        this.booleanValue = value;
    }

    protected void setLong(long value)
    {
        this.longValue = value;
    }

    protected void setDouble(double value)
    {
        this.doubleValue = value;
    }

    protected void setSlice(Slice value)
    {
        this.sliceValue = value;
    }

    protected void setObject(Object value)
    {
        this.objectValue = value;
    }
}
/**
 * Selects the coercer that converts values of {@code fromHiveType} into {@code toHiveType}.
 *
 * <p>Supported conversions: integer number to varchar, varchar to integer number,
 * integer widening (byte to short/int/long, short to int/long, int to long),
 * float to double, and array/map/row types whose nested types are converted recursively.
 *
 * @param typeManager resolves the Hive type signatures into engine types
 * @param fromHiveType type of the stored data
 * @param toHiveType type the column is declared as
 * @param bridgingRecordCursor cursor passed on to the container coercers
 * @return a coercer for the requested conversion
 * @throws PrestoException with {@code NOT_SUPPORTED} when no coercer handles the pair
 */
private static Coercer createCoercer(TypeManager typeManager, HiveType fromHiveType, HiveType toHiveType, BridgingRecordCursor bridgingRecordCursor)
{
    Type fromType = typeManager.getType(fromHiveType.getTypeSignature());
    Type toType = typeManager.getType(toHiveType.getTypeSignature());
    if (toType instanceof VarcharType && (fromHiveType.equals(HIVE_BYTE) || fromHiveType.equals(HIVE_SHORT) || fromHiveType.equals(HIVE_INT) || fromHiveType.equals(HIVE_LONG))) {
        return new IntegerNumberToVarcharCoercer();
    }
    if (fromType instanceof VarcharType && (toHiveType.equals(HIVE_BYTE) || toHiveType.equals(HIVE_SHORT) || toHiveType.equals(HIVE_INT) || toHiveType.equals(HIVE_LONG))) {
        return new VarcharToIntegerNumberCoercer(toHiveType);
    }
    // The target alternatives must be grouped explicitly: && binds tighter than ||, so without
    // the parentheses any conversion *to* INT or LONG would match regardless of the source type.
    if (fromHiveType.equals(HIVE_BYTE) && (toHiveType.equals(HIVE_SHORT) || toHiveType.equals(HIVE_INT) || toHiveType.equals(HIVE_LONG))) {
        return new IntegerNumberUpscaleCoercer();
    }
    if (fromHiveType.equals(HIVE_SHORT) && (toHiveType.equals(HIVE_INT) || toHiveType.equals(HIVE_LONG))) {
        return new IntegerNumberUpscaleCoercer();
    }
    if (fromHiveType.equals(HIVE_INT) && toHiveType.equals(HIVE_LONG)) {
        return new IntegerNumberUpscaleCoercer();
    }
    if (fromHiveType.equals(HIVE_FLOAT) && toHiveType.equals(HIVE_DOUBLE)) {
        return new FloatToDoubleCoercer();
    }
    if (isArrayType(fromType) && isArrayType(toType)) {
        return new ListCoercer(typeManager, fromHiveType, toHiveType, bridgingRecordCursor);
    }
    if (isMapType(fromType) && isMapType(toType)) {
        return new MapCoercer(typeManager, fromHiveType, toHiveType, bridgingRecordCursor);
    }
    if (isRowType(fromType) && isRowType(toType)) {
        return new StructCoercer(typeManager, fromHiveType, toHiveType, bridgingRecordCursor);
    }
    throw new PrestoException(NOT_SUPPORTED, format("Unsupported coercion from %s to %s", fromHiveType, toHiveType));
}
/**
 * Widening integer coercion: the long read from the source is stored unchanged.
 */
private static class IntegerNumberUpscaleCoercer
        extends Coercer
{
    @Override
    public void coerce(RecordCursor delegate, int field)
    {
        long sourceValue = delegate.getLong(field);
        setLong(sourceValue);
    }
}
/**
 * Renders an integer number as its decimal string and stores it as a UTF-8 slice.
 */
private static class IntegerNumberToVarcharCoercer
        extends Coercer
{
    @Override
    public void coerce(RecordCursor delegate, int field)
    {
        long sourceValue = delegate.getLong(field);
        String decimalText = Long.toString(sourceValue);
        setSlice(utf8Slice(decimalText));
    }
}
/**
 * Converts a float, read from the source as raw int bits carried in a long, into a double.
 */
private static class FloatToDoubleCoercer
        extends Coercer
{
    @Override
    protected void coerce(RecordCursor delegate, int field)
    {
        // The long is narrowed to int and reinterpreted as float bits before widening.
        int floatBits = (int) delegate.getLong(field);
        float floatValue = intBitsToFloat(floatBits);
        setDouble(floatValue);
    }
}
/**
 * Parses a varchar value as an integer number of the target Hive type.
 *
 * <p>Text that is not a valid long, or that parses to a value outside the range of the
 * target type, yields null instead of an error.
 */
private static class VarcharToIntegerNumberCoercer
        extends Coercer
{
    private final long maxValue;
    private final long minValue;

    /**
     * @param type target Hive type; must be one of byte, short, int or long
     * @throws PrestoException with {@code NOT_SUPPORTED} for any other target type
     */
    public VarcharToIntegerNumberCoercer(HiveType type)
    {
        long lowerBound;
        long upperBound;
        if (type.equals(HIVE_BYTE)) {
            lowerBound = Byte.MIN_VALUE;
            upperBound = Byte.MAX_VALUE;
        }
        else if (type.equals(HIVE_SHORT)) {
            lowerBound = Short.MIN_VALUE;
            upperBound = Short.MAX_VALUE;
        }
        else if (type.equals(HIVE_INT)) {
            lowerBound = Integer.MIN_VALUE;
            upperBound = Integer.MAX_VALUE;
        }
        else if (type.equals(HIVE_LONG)) {
            lowerBound = Long.MIN_VALUE;
            upperBound = Long.MAX_VALUE;
        }
        else {
            throw new PrestoException(NOT_SUPPORTED, format("Could not create Coercer from varchar to %s", type));
        }
        this.minValue = lowerBound;
        this.maxValue = upperBound;
    }

    @Override
    public void coerce(RecordCursor delegate, int field)
    {
        long parsed;
        try {
            parsed = Long.parseLong(delegate.getSlice(field).toStringUtf8());
        }
        catch (NumberFormatException e) {
            // not a number: the coerced value is null
            setIsNull(true);
            return;
        }

        boolean outOfRange = parsed < minValue || parsed > maxValue;
        if (outOfRange) {
            setIsNull(true);
            return;
        }
        setLong(parsed);
    }
}
/**
 * Coerces an array value by rebuilding it element by element in the target element type.
 */
private static class ListCoercer
        extends Coercer
{
    private final Type fromElementType;
    private final Type toType;
    private final Type toElementType;
    // null when source and target element Hive types are equal
    private final Coercer elementCoercer;
    private final BridgingRecordCursor bridgingRecordCursor;
    private final PageBuilder pageBuilder;

    /**
     * @param typeManager resolves Hive types into engine types
     * @param fromHiveType array type of the stored data
     * @param toHiveType array type the column is declared as
     * @param bridgingRecordCursor cursor used to feed single elements to the element coercer
     * @throws NullPointerException if any argument is null
     */
    public ListCoercer(TypeManager typeManager, HiveType fromHiveType, HiveType toHiveType, BridgingRecordCursor bridgingRecordCursor)
    {
        requireNonNull(typeManager, "typeManager is null");
        requireNonNull(fromHiveType, "fromHiveType is null");
        requireNonNull(toHiveType, "toHiveType is null");
        this.bridgingRecordCursor = requireNonNull(bridgingRecordCursor, "bridgingRecordCursor is null");
        HiveType fromElementHiveType = HiveType.valueOf(((ListTypeInfo) fromHiveType.getTypeInfo()).getListElementTypeInfo().getTypeName());
        HiveType toElementHiveType = HiveType.valueOf(((ListTypeInfo) toHiveType.getTypeInfo()).getListElementTypeInfo().getTypeName());
        this.fromElementType = fromElementHiveType.getType(typeManager);
        this.toType = toHiveType.getType(typeManager);
        this.toElementType = toElementHiveType.getType(typeManager);
        this.elementCoercer = fromElementHiveType.equals(toElementHiveType) ? null : createCoercer(typeManager, fromElementHiveType, toElementHiveType, bridgingRecordCursor);
        // Always allocated: coerce() uses the builder even on its elementCoercer == null path,
        // so leaving it null in that case would fail with a NullPointerException.
        this.pageBuilder = new PageBuilder(ImmutableList.of(toType));
    }

    @Override
    public void coerce(RecordCursor delegate, int field)
    {
        if (delegate.isNull(field)) {
            setIsNull(true);
            return;
        }
        Block block = (Block) delegate.getObject(field);
        if (pageBuilder.isFull()) {
            pageBuilder.reset();
        }
        BlockBuilder blockBuilder = pageBuilder.getBlockBuilder(0);
        BlockBuilder listBuilder = blockBuilder.beginBlockEntry();
        for (int i = 0; i < block.getPositionCount(); i++) {
            if (elementCoercer == null) {
                // identical element types: copy the element as is
                toElementType.appendTo(block, i, listBuilder);
            }
            else {
                if (block.isNull(i)) {
                    listBuilder.appendNull();
                }
                else {
                    rewriteBlock(fromElementType, toElementType, block, i, listBuilder, elementCoercer, bridgingRecordCursor);
                }
            }
        }
        blockBuilder.closeEntry();
        pageBuilder.declarePosition();
        // the entry just closed is the last position of the builder
        setObject(toType.getObject(blockBuilder, blockBuilder.getPositionCount() - 1));
    }
}
/**
 * Coerces a map value by rebuilding it with keys and values converted to the target types.
 */
private static class MapCoercer
        extends Coercer
{
    // index 0 is the key type, index 1 the value type
    private final List<Type> fromKeyValueTypes;
    private final Type toType;
    private final List<Type> toKeyValueTypes;
    // coercers[0] converts keys, coercers[1] values; an entry is null when the Hive types are equal
    private final Coercer[] coercers;
    private final BridgingRecordCursor bridgingRecordCursor;
    private final PageBuilder pageBuilder;

    /**
     * @param typeManager resolves Hive types into engine types
     * @param fromHiveType map type of the stored data
     * @param toHiveType map type the column is declared as
     * @param bridgingRecordCursor cursor used to feed single keys/values to their coercer
     * @throws NullPointerException if any argument is null
     */
    public MapCoercer(TypeManager typeManager, HiveType fromHiveType, HiveType toHiveType, BridgingRecordCursor bridgingRecordCursor)
    {
        requireNonNull(typeManager, "typeManager is null");
        requireNonNull(fromHiveType, "fromHiveType is null");
        requireNonNull(toHiveType, "toHiveType is null");
        this.bridgingRecordCursor = requireNonNull(bridgingRecordCursor, "bridgingRecordCursor is null");
        HiveType fromKeyHiveType = HiveType.valueOf(((MapTypeInfo) fromHiveType.getTypeInfo()).getMapKeyTypeInfo().getTypeName());
        HiveType fromValueHiveType = HiveType.valueOf(((MapTypeInfo) fromHiveType.getTypeInfo()).getMapValueTypeInfo().getTypeName());
        HiveType toKeyHiveType = HiveType.valueOf(((MapTypeInfo) toHiveType.getTypeInfo()).getMapKeyTypeInfo().getTypeName());
        HiveType toValueHiveType = HiveType.valueOf(((MapTypeInfo) toHiveType.getTypeInfo()).getMapValueTypeInfo().getTypeName());
        this.fromKeyValueTypes = fromHiveType.getType(typeManager).getTypeParameters();
        this.toType = toHiveType.getType(typeManager);
        this.toKeyValueTypes = toType.getTypeParameters();
        this.coercers = new Coercer[2];
        coercers[0] = fromKeyHiveType.equals(toKeyHiveType) ? null : createCoercer(typeManager, fromKeyHiveType, toKeyHiveType, bridgingRecordCursor);
        coercers[1] = fromValueHiveType.equals(toValueHiveType) ? null : createCoercer(typeManager, fromValueHiveType, toValueHiveType, bridgingRecordCursor);
        // Always allocated: coerce() uses the builder unconditionally, so leaving it null
        // when neither side needs a coercer would fail with a NullPointerException.
        this.pageBuilder = new PageBuilder(ImmutableList.of(toType));
    }

    @Override
    public void coerce(RecordCursor delegate, int field)
    {
        if (delegate.isNull(field)) {
            setIsNull(true);
            return;
        }
        Block block = (Block) delegate.getObject(field);
        if (pageBuilder.isFull()) {
            pageBuilder.reset();
        }
        BlockBuilder blockBuilder = pageBuilder.getBlockBuilder(0);
        BlockBuilder mapBuilder = blockBuilder.beginBlockEntry();
        for (int i = 0; i < block.getPositionCount(); i++) {
            // even positions are handled as keys (k == 0), odd positions as values (k == 1)
            int k = i % 2;
            if (coercers[k] == null) {
                toKeyValueTypes.get(k).appendTo(block, i, mapBuilder);
            }
            else {
                if (block.isNull(i)) {
                    mapBuilder.appendNull();
                }
                else {
                    rewriteBlock(fromKeyValueTypes.get(k), toKeyValueTypes.get(k), block, i, mapBuilder, coercers[k], bridgingRecordCursor);
                }
            }
        }
        blockBuilder.closeEntry();
        pageBuilder.declarePosition();
        // the entry just closed is the last position of the builder
        setObject(toType.getObject(blockBuilder, blockBuilder.getPositionCount() - 1));
    }
}
/**
 * Coerces a row (struct) value field by field into the target row type.
 *
 * <p>Fields are matched by position. Target fields that have no counterpart in the source
 * row are filled with null.
 */
private static class StructCoercer
        extends Coercer
{
    private final Type toType;
    private final List<Type> fromFieldTypes;
    private final List<Type> toFieldTypes;
    // one slot per target field; null where the field needs no conversion
    private final Coercer[] coercers;
    private final BridgingRecordCursor bridgingRecordCursor;
    private final PageBuilder pageBuilder;

    /**
     * @param typeManager resolves Hive types into engine types
     * @param fromHiveType row type of the stored data
     * @param toHiveType row type the column is declared as
     * @param bridgingRecordCursor cursor used to feed single field values to their coercer
     * @throws NullPointerException if any argument is null
     */
    public StructCoercer(TypeManager typeManager, HiveType fromHiveType, HiveType toHiveType, BridgingRecordCursor bridgingRecordCursor)
    {
        requireNonNull(typeManager, "typeManager is null");
        requireNonNull(fromHiveType, "fromHiveType is null");
        requireNonNull(toHiveType, "toHiveType is null");
        this.bridgingRecordCursor = requireNonNull(bridgingRecordCursor, "bridgingRecordCursor is null");
        List<HiveType> fromFieldHiveTypes = extractStructFieldTypes(fromHiveType);
        List<HiveType> toFieldHiveTypes = extractStructFieldTypes(toHiveType);
        this.fromFieldTypes = fromHiveType.getType(typeManager).getTypeParameters();
        this.toType = toHiveType.getType(typeManager);
        this.toFieldTypes = toType.getTypeParameters();
        this.coercers = new Coercer[toFieldHiveTypes.size()];
        // only positions present on both sides can need a coercer
        for (int i = 0; i < min(fromFieldHiveTypes.size(), toFieldHiveTypes.size()); i++) {
            if (!fromFieldTypes.get(i).equals(toFieldTypes.get(i))) {
                coercers[i] = createCoercer(typeManager, fromFieldHiveTypes.get(i), toFieldHiveTypes.get(i), bridgingRecordCursor);
            }
        }
        this.pageBuilder = new PageBuilder(ImmutableList.of(toType));
    }

    @Override
    public void coerce(RecordCursor delegate, int field)
    {
        if (delegate.isNull(field)) {
            setIsNull(true);
            return;
        }
        Block block = (Block) delegate.getObject(field);
        if (pageBuilder.isFull()) {
            pageBuilder.reset();
        }
        BlockBuilder blockBuilder = pageBuilder.getBlockBuilder(0);
        BlockBuilder rowBuilder = blockBuilder.beginBlockEntry();
        for (int i = 0; i < toFieldTypes.size(); i++) {
            // target field missing from the source row, or source field is null
            if (i >= fromFieldTypes.size() || block.isNull(i)) {
                rowBuilder.appendNull();
            }
            else if (coercers[i] == null) {
                toFieldTypes.get(i).appendTo(block, i, rowBuilder);
            }
            else {
                rewriteBlock(fromFieldTypes.get(i), toFieldTypes.get(i), block, i, rowBuilder, coercers[i], bridgingRecordCursor);
            }
        }
        blockBuilder.closeEntry();
        pageBuilder.declarePosition();
        // the entry just closed is the last position of the builder
        setObject(toType.getObject(blockBuilder, blockBuilder.getPositionCount() - 1));
    }
}
/**
 * Coerces the value at {@code position} of {@code block} and appends the result to
 * {@code blockBuilder}.
 *
 * <p>The source value is read according to the Java carrier type of {@code fromType},
 * exposed to {@code coercer} through {@code bridgingRecordCursor} as field 0, and the
 * coerced result is written according to the Java carrier type of {@code toType}.
 * A source carrier type other than long, double, boolean, Slice or Block is presented
 * to the coercer as null.
 *
 * @throws PrestoException with {@code NOT_SUPPORTED} when the coerced value is non-null and
 *         {@code toType} has a carrier type other than long, double, boolean, Slice or Block
 */
private static void rewriteBlock(
        Type fromType,
        Type toType,
        Block block,
        int position,
        BlockBuilder blockBuilder,
        Coercer coercer,
        BridgingRecordCursor bridgingRecordCursor)
{
    Class<?> fromJavaType = fromType.getJavaType();
    if (fromJavaType == long.class) {
        bridgingRecordCursor.setValue(fromType.getLong(block, position));
    }
    else if (fromJavaType == double.class) {
        bridgingRecordCursor.setValue(fromType.getDouble(block, position));
    }
    else if (fromJavaType == boolean.class) {
        bridgingRecordCursor.setValue(fromType.getBoolean(block, position));
    }
    else if (fromJavaType == Slice.class) {
        bridgingRecordCursor.setValue(fromType.getSlice(block, position));
    }
    else if (fromJavaType == Block.class) {
        bridgingRecordCursor.setValue(fromType.getObject(block, position));
    }
    else {
        bridgingRecordCursor.setValue(null);
    }

    // drop whatever the coercer cached for a previous value before reading through it
    coercer.reset();
    Class<?> toJavaType = toType.getJavaType();
    if (coercer.isNull(bridgingRecordCursor, 0)) {
        blockBuilder.appendNull();
    }
    else if (toJavaType == long.class) {
        toType.writeLong(blockBuilder, coercer.getLong(bridgingRecordCursor, 0));
    }
    else if (toJavaType == double.class) {
        toType.writeDouble(blockBuilder, coercer.getDouble(bridgingRecordCursor, 0));
    }
    else if (toJavaType == boolean.class) {
        toType.writeBoolean(blockBuilder, coercer.getBoolean(bridgingRecordCursor, 0));
    }
    else if (toJavaType == Slice.class) {
        toType.writeSlice(blockBuilder, coercer.getSlice(bridgingRecordCursor, 0));
    }
    else if (toJavaType == Block.class) {
        toType.writeObject(blockBuilder, coercer.getObject(bridgingRecordCursor, 0));
    }
    else {
        throw new PrestoException(NOT_SUPPORTED, format("Unsupported coercion from %s to %s", fromType.getDisplayName(), toType.getDisplayName()));
    }

    // leave neither the coercer nor the bridging cursor holding on to this value
    coercer.reset();
    bridgingRecordCursor.close();
}
/**
 * Minimal {@link RecordCursor} that holds a single value and returns it for every field
 * index, so that a {@link Coercer} can be applied to a value that does not come from a
 * real cursor.
 */
private static class BridgingRecordCursor
        implements RecordCursor
{
    // The value currently exposed; null means "the field is null".
    private Object value;

    /**
     * Replaces the exposed value.
     */
    public void setValue(Object value)
    {
        this.value = value;
    }

    @Override
    public boolean isNull(int field)
    {
        return this.value == null;
    }

    @Override
    public boolean getBoolean(int field)
    {
        Boolean boxed = (Boolean) this.value;
        return boxed;
    }

    @Override
    public long getLong(int field)
    {
        Long boxed = (Long) this.value;
        return boxed;
    }

    @Override
    public double getDouble(int field)
    {
        Double boxed = (Double) this.value;
        return boxed;
    }

    @Override
    public Slice getSlice(int field)
    {
        Slice slice = (Slice) this.value;
        return slice;
    }

    @Override
    public Object getObject(int field)
    {
        return this.value;
    }

    /**
     * Always reports success; this cursor has no positions of its own.
     */
    @Override
    public boolean advanceNextPosition()
    {
        return true;
    }

    @Override
    public Type getType(int field)
    {
        throw new UnsupportedOperationException();
    }

    @Override
    public long getCompletedBytes()
    {
        return 0;
    }

    @Override
    public long getReadTimeNanos()
    {
        return 0;
    }

    /**
     * Releases the held value; the cursor can be reused after another {@code setValue}.
     */
    @Override
    public void close()
    {
        value = null;
    }
}
}
© 2015 - 2025 Weber Informatics LLC | Privacy Policy