// org.apache.hadoop.hive.serde2.lazy.LazyBinary (Maven / Gradle / Ivy artifact listing)
/**
* Licensed to the Apache Software Foundation (ASF) under one
* or more contributor license agreements. See the NOTICE file
* distributed with this work for additional information
* regarding copyright ownership. The ASF licenses this file
* to you under the Apache License, Version 2.0 (the
* "License"); you may not use this file except in compliance
* with the License. You may obtain a copy of the License at
*
* http://www.apache.org/licenses/LICENSE-2.0
*
* Unless required by applicable law or agreed to in writing, software
* distributed under the License is distributed on an "AS IS" BASIS,
* WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
* See the License for the specific language governing permissions and
* limitations under the License.
*/
package org.apache.hadoop.hive.serde2.lazy;
import org.apache.commons.codec.binary.Base64;
import org.slf4j.Logger;
import org.slf4j.LoggerFactory;
import org.apache.hadoop.hive.serde2.lazy.objectinspector.primitive.LazyBinaryObjectInspector;
import org.apache.hadoop.io.BytesWritable;
/**
 * Lazy primitive holding a binary value in a {@link BytesWritable}.
 *
 * <p>On {@link #init(ByteArrayRef, int, int)} the field bytes are copied out of the
 * backing buffer. If every byte belongs to the Base64 alphabet the field is treated as
 * Base64 text and decoded; otherwise the raw bytes are stored unchanged.
 *
 * <p>NOTE(review): because the Base64 detection is purely content-based, raw binary
 * values that happen to consist only of Base64-alphabet bytes are decoded as well.
 * Making this configurable is tracked by the todo on {@link #decodeIfNeeded(byte[])}.
 */
public class LazyBinary extends LazyPrimitive<LazyBinaryObjectInspector, BytesWritable> {

  private static final Logger LOG = LoggerFactory.getLogger(LazyBinary.class);

  /**
   * Creates an empty lazy binary bound to the given object inspector.
   *
   * @param oi object inspector describing this binary field
   */
  public LazyBinary(LazyBinaryObjectInspector oi) {
    super(oi);
    data = new BytesWritable();
  }

  /**
   * Copy constructor; the new instance gets its own copy of the other's bytes.
   *
   * @param other instance to copy from
   */
  public LazyBinary(LazyBinary other) {
    super(other);
    BytesWritable incoming = other.getWritableObject();
    // Copy only getLength() bytes: the array returned by getBytes() is the backing
    // buffer and is not guaranteed to be exactly as long as the valid data.
    int validLength = incoming.getLength();
    byte[] bytes = new byte[validLength];
    System.arraycopy(incoming.getBytes(), 0, bytes, 0, validLength);
    data = new BytesWritable(bytes);
  }

  /**
   * Loads this object from {@code length} bytes of {@code bytes} beginning at
   * {@code start}, Base64-decoding them when they look like Base64 text.
   *
   * @param bytes  reference to the buffer holding the serialized field
   * @param start  offset of the first byte of the field
   * @param length number of bytes in the field
   */
  @Override
  public void init(ByteArrayRef bytes, int start, int length) {
    super.init(bytes, start, length);

    // Isolate the field bytes; the Base64 helpers operate on whole arrays.
    byte[] recv = new byte[length];
    System.arraycopy(bytes.getData(), start, recv, 0, length);

    byte[] decoded = decodeIfNeeded(recv);
    // use the original bytes in case decoding should fail
    if (decoded.length == 0) {
      decoded = recv;
    }
    data.set(decoded, 0, decoded.length);
  }

  // todo this should be configured in serde
  /**
   * Returns the Base64-decoded form of {@code recv} when every byte of it is a valid
   * Base64 character, and {@code recv} itself otherwise.
   *
   * @param recv bytes to inspect; must not be {@code null}
   * @return the decoded bytes, or {@code recv} unchanged when it is empty or is not
   *         Base64 text
   */
  public static byte[] decodeIfNeeded(byte[] recv) {
    if (recv.length == 0) {
      // Nothing to decode; also avoids a misleading "try to decode" debug message.
      return recv;
    }
    if (!Base64.isArrayByteBase64(recv)) {
      return recv;
    }
    // The logger checks the debug level itself at call time, so changes to the log
    // level made after class initialization are honored.
    LOG.debug("Data only contains Base64 alphabets only so try to decode the data.");
    return Base64.decodeBase64(recv);
  }
}