Please wait. This can take some minutes ...
Many resources are needed to download a project. Please understand that we have to compensate our server costs. Thank you in advance.
Project price only 1 $
You can buy this project and download/modify it how often you want.
com.facebook.presto.decoder.raw.RawColumnDecoder Maven / Gradle / Ivy
/*
* Licensed under the Apache License, Version 2.0 (the "License");
* you may not use this file except in compliance with the License.
* You may obtain a copy of the License at
*
* http://www.apache.org/licenses/LICENSE-2.0
*
* Unless required by applicable law or agreed to in writing, software
* distributed under the License is distributed on an "AS IS" BASIS,
* WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
* See the License for the specific language governing permissions and
* limitations under the License.
*/
package com.facebook.presto.decoder.raw;
import com.facebook.presto.common.type.Type;
import com.facebook.presto.common.type.Varchars;
import com.facebook.presto.decoder.DecoderColumnHandle;
import com.facebook.presto.decoder.FieldValueProvider;
import com.facebook.presto.spi.PrestoException;
import com.facebook.presto.spi.StandardErrorCode;
import com.google.common.base.Joiner;
import com.google.common.collect.ImmutableList;
import io.airlift.slice.Slice;
import io.airlift.slice.Slices;
import java.nio.ByteBuffer;
import java.util.Arrays;
import java.util.Locale;
import java.util.Optional;
import java.util.OptionalInt;
import java.util.regex.Matcher;
import java.util.regex.Pattern;
import static com.facebook.presto.common.type.BigintType.BIGINT;
import static com.facebook.presto.common.type.BooleanType.BOOLEAN;
import static com.facebook.presto.common.type.DoubleType.DOUBLE;
import static com.facebook.presto.common.type.IntegerType.INTEGER;
import static com.facebook.presto.common.type.SmallintType.SMALLINT;
import static com.facebook.presto.common.type.TinyintType.TINYINT;
import static com.facebook.presto.common.type.Varchars.isVarcharType;
import static com.facebook.presto.decoder.DecoderErrorCode.DECODER_CONVERSION_NOT_SUPPORTED;
import static com.google.common.base.Preconditions.checkArgument;
import static com.google.common.base.Preconditions.checkState;
import static java.lang.Integer.parseInt;
import static java.lang.String.format;
import static java.util.Objects.requireNonNull;
public class RawColumnDecoder
{
private enum FieldType
{
BYTE(Byte.SIZE),
SHORT(Short.SIZE),
INT(Integer.SIZE),
LONG(Long.SIZE),
FLOAT(Float.SIZE),
DOUBLE(Double.SIZE);
private final int size;
FieldType(int bitSize)
{
this.size = bitSize / 8;
}
public int getSize()
{
return size;
}
}
private static final Pattern MAPPING_PATTERN = Pattern.compile("(\\d+)(?::(\\d+))?");
private final String columnName;
private final Type columnType;
private final FieldType fieldType;
private final int start;
private final OptionalInt end;
public RawColumnDecoder(DecoderColumnHandle columnHandle)
{
try {
requireNonNull(columnHandle, "columnHandle is null");
checkArgument(!columnHandle.isInternal(), "unexpected internal column '%s'", columnHandle.getName());
checkArgument(columnHandle.getFormatHint() == null, "unexpected format hint '%s' defined for column '%s'", columnHandle.getFormatHint(), columnHandle.getName());
columnName = columnHandle.getName();
columnType = columnHandle.getType();
try {
fieldType = columnHandle.getDataFormat() == null ?
FieldType.BYTE :
FieldType.valueOf(columnHandle.getDataFormat().toUpperCase(Locale.ENGLISH));
}
catch (IllegalArgumentException e) {
throw new IllegalArgumentException(format("invalid dataFormat '%s' for column '%s'", columnHandle.getDataFormat(), columnName));
}
String mapping = Optional.ofNullable(columnHandle.getMapping()).orElse("0");
Matcher mappingMatcher = MAPPING_PATTERN.matcher(mapping);
if (!mappingMatcher.matches()) {
throw new IllegalArgumentException(format("invalid mapping format '%s' for column '%s'", mapping, columnName));
}
start = parseInt(mappingMatcher.group(1));
if (mappingMatcher.group(2) != null) {
end = OptionalInt.of(parseInt(mappingMatcher.group(2)));
}
else {
if (!isVarcharType(columnType)) {
end = OptionalInt.of(start + fieldType.getSize());
}
else {
end = OptionalInt.empty();
}
}
checkArgument(start >= 0, "start offset %s for column '%s' must be greater or equal 0", start, columnName);
end.ifPresent(endValue -> {
checkArgument(endValue >= 0, "end offset %s for column '%s' must be greater or equal 0", endValue, columnName);
checkArgument(endValue >= start, "end offset %s for column '%s' must greater or equal start offset", endValue, columnName);
});
checkArgument(isSupportedType(columnType), "Unsupported column type '%s' for column '%s'", columnType.getDisplayName(), columnName);
if (columnType == BIGINT) {
checkFieldTypeOneOf(fieldType, columnName, FieldType.BYTE, FieldType.SHORT, FieldType.INT, FieldType.LONG);
}
if (columnType == INTEGER) {
checkFieldTypeOneOf(fieldType, columnName, FieldType.BYTE, FieldType.SHORT, FieldType.INT);
}
if (columnType == SMALLINT) {
checkFieldTypeOneOf(fieldType, columnName, FieldType.BYTE, FieldType.SHORT);
}
if (columnType == TINYINT) {
checkFieldTypeOneOf(fieldType, columnName, FieldType.BYTE);
}
if (columnType == BOOLEAN) {
checkFieldTypeOneOf(fieldType, columnName, FieldType.BYTE, FieldType.SHORT, FieldType.INT, FieldType.LONG);
}
if (columnType.equals(DOUBLE)) {
checkFieldTypeOneOf(fieldType, columnName, FieldType.DOUBLE, FieldType.FLOAT);
}
if (isVarcharType(columnType)) {
checkFieldTypeOneOf(fieldType, columnName, FieldType.BYTE);
}
if (!isVarcharType(columnType)) {
checkArgument(!end.isPresent() || end.getAsInt() - start == fieldType.getSize(),
"Bytes mapping for column '%s' does not match dataFormat '%s'; expected %s bytes but got %s",
columnName,
fieldType.getSize(),
end.getAsInt() - start);
}
}
catch (IllegalArgumentException e) {
throw new PrestoException(StandardErrorCode.GENERIC_USER_ERROR, e);
}
}
private static boolean isSupportedType(Type type)
{
if (isVarcharType(type)) {
return true;
}
if (ImmutableList.of(BIGINT, INTEGER, SMALLINT, TINYINT, BOOLEAN, DOUBLE).contains(type)) {
return true;
}
return false;
}
private void checkFieldTypeOneOf(FieldType declaredFieldType, String columnName, FieldType... allowedFieldTypes)
{
if (!Arrays.asList(allowedFieldTypes).contains(declaredFieldType)) {
throw new IllegalArgumentException(format(
"Wrong dataFormat '%s' specified for column '%s'; %s type implies use of %s",
declaredFieldType.name(),
columnName,
columnType.getDisplayName(),
Joiner.on("/").join(allowedFieldTypes)));
}
}
public FieldValueProvider decodeField(byte[] value)
{
requireNonNull(value, "value is null");
int actualEnd = end.orElse(value.length);
if (start > value.length) {
throw new PrestoException(DECODER_CONVERSION_NOT_SUPPORTED, format(
"start offset %s for column '%s' must be less that or equal to value length %s",
start,
columnName,
value.length));
}
if (actualEnd > value.length) {
throw new PrestoException(DECODER_CONVERSION_NOT_SUPPORTED, format(
"end offset %s for column '%s' must be less that or equal to value length %s",
actualEnd,
columnName,
value.length));
}
return new RawValueProvider(ByteBuffer.wrap(value, start, actualEnd - start), fieldType, columnName, columnType);
}
private static class RawValueProvider
extends FieldValueProvider
{
private final ByteBuffer value;
private final FieldType fieldType;
private final String columnName;
private final Type columnType;
private final int size;
public RawValueProvider(ByteBuffer value, FieldType fieldType, String columnName, Type columnType)
{
this.value = value;
this.fieldType = fieldType;
this.columnName = columnName;
this.columnType = columnType;
this.size = value.limit() - value.position();
}
@Override
public final boolean isNull()
{
return size == 0;
}
@Override
public boolean getBoolean()
{
checkEnoughBytes();
switch (fieldType) {
case BYTE:
return value.get() != 0;
case SHORT:
return value.getShort() != 0;
case INT:
return value.getInt() != 0;
case LONG:
return value.getLong() != 0;
default:
throw new PrestoException(DECODER_CONVERSION_NOT_SUPPORTED, format("conversion '%s' to boolean not supported", fieldType));
}
}
@Override
public long getLong()
{
checkEnoughBytes();
switch (fieldType) {
case BYTE:
return value.get();
case SHORT:
return value.getShort();
case INT:
return value.getInt();
case LONG:
return value.getLong();
default:
throw new PrestoException(DECODER_CONVERSION_NOT_SUPPORTED, format("conversion '%s' to long not supported", fieldType));
}
}
@Override
public double getDouble()
{
checkEnoughBytes();
switch (fieldType) {
case FLOAT:
return value.getFloat();
case DOUBLE:
return value.getDouble();
default:
throw new PrestoException(DECODER_CONVERSION_NOT_SUPPORTED, format("conversion '%s' to double not supported", fieldType));
}
}
private void checkEnoughBytes()
{
checkState(size >= fieldType.getSize(), "minimum byte size for column '%s' is %s, found %s,", columnName, fieldType.getSize(), size);
}
@Override
public Slice getSlice()
{
Slice slice = Slices.wrappedBuffer(value.slice());
return Varchars.truncateToLength(slice, columnType);
}
}
}