All downloads are free. The search and download functionality uses the official Maven repository.

hivemall.tools.vector.VectorAddUDF Maven / Gradle / Ivy

The newest version!
/*
 * Licensed to the Apache Software Foundation (ASF) under one
 * or more contributor license agreements.  See the NOTICE file
 * distributed with this work for additional information
 * regarding copyright ownership.  The ASF licenses this file
 * to you under the Apache License, Version 2.0 (the
 * "License"); you may not use this file except in compliance
 * with the License.  You may obtain a copy of the License at
 *
 *   http://www.apache.org/licenses/LICENSE-2.0
 *
 * Unless required by applicable law or agreed to in writing,
 * software distributed under the License is distributed on an
 * "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY
 * KIND, either express or implied.  See the License for the
 * specific language governing permissions and limitations
 * under the License.
 */
package hivemall.tools.vector;

import hivemall.utils.hadoop.HiveUtils;
import hivemall.utils.lang.StringUtils;

import java.util.Arrays;
import java.util.List;

import javax.annotation.Nonnegative;
import javax.annotation.Nonnull;
import javax.annotation.Nullable;

import org.apache.hadoop.hive.ql.exec.Description;
import org.apache.hadoop.hive.ql.exec.UDFArgumentException;
import org.apache.hadoop.hive.ql.exec.UDFArgumentLengthException;
import org.apache.hadoop.hive.ql.metadata.HiveException;
import org.apache.hadoop.hive.ql.udf.UDFType;
import org.apache.hadoop.hive.ql.udf.generic.GenericUDF;
import org.apache.hadoop.hive.serde2.objectinspector.ListObjectInspector;
import org.apache.hadoop.hive.serde2.objectinspector.ObjectInspector;
import org.apache.hadoop.hive.serde2.objectinspector.ObjectInspectorFactory;
import org.apache.hadoop.hive.serde2.objectinspector.PrimitiveObjectInspector;
import org.apache.hadoop.hive.serde2.objectinspector.primitive.PrimitiveObjectInspectorFactory;
import org.apache.hadoop.hive.serde2.objectinspector.primitive.PrimitiveObjectInspectorUtils;

/**
 * Hive UDF {@code vector_add(x, y)} that adds two numeric arrays element by element.
 *
 * <p>
 * When the elements of both arrays are integer typed (as judged by
 * {@code HiveUtils.isIntegerOI}) the result is a list of {@code Long}; in every other case it is
 * a list of {@code Double}. An output slot is left {@code null} whenever either of the
 * corresponding input elements is {@code null}.
 */
@Description(name = "vector_add",
        value = "_FUNC_(array x, array y) - Perform vector ADD operation.",
        extended = "SELECT vector_add(array(1.0,2.0,3.0), array(2, 3, 4));\n" + "[3.0,5.0,7.0]")
@UDFType(deterministic = true, stateful = false)
public final class VectorAddUDF extends GenericUDF {

    /** Inspectors for the two list arguments; assigned in {@link #initialize}. */
    private ListObjectInspector xOI, yOI;
    /** Inspectors for the elements of each list argument; assigned in {@link #initialize}. */
    private PrimitiveObjectInspector xElemOI, yElemOI;
    /** {@code true} when the sum is computed as double, {@code false} when computed as long. */
    private boolean floatingPoints;

    /**
     * Validates the argument inspectors and selects the element type of the result.
     *
     * @param argOIs inspectors of the call arguments; exactly two are required
     * @return a standard list inspector over Java {@code Long} when both element inspectors are
     *         integer typed, otherwise over Java {@code Double}
     * @throws UDFArgumentException if the number of arguments is not 2, or propagated from the
     *         {@code HiveUtils} conversions of the argument inspectors
     */
    @Override
    public ObjectInspector initialize(ObjectInspector[] argOIs) throws UDFArgumentException {
        final int numArgs = argOIs.length;
        if (numArgs != 2) {
            throw new UDFArgumentLengthException("Expected 2 arguments, but got " + numArgs);
        }

        this.xOI = HiveUtils.asListOI(argOIs[0]);
        this.yOI = HiveUtils.asListOI(argOIs[1]);
        this.xElemOI = HiveUtils.asNumberOI(xOI.getListElementObjectInspector());
        this.yElemOI = HiveUtils.asNumberOI(yOI.getListElementObjectInspector());

        // Long arithmetic is used only when BOTH sides are integer typed.
        final boolean bothIntegers =
                HiveUtils.isIntegerOI(xElemOI) && HiveUtils.isIntegerOI(yElemOI);
        this.floatingPoints = !bothIntegers;

        final ObjectInspector resultElemOI =
                bothIntegers ? PrimitiveObjectInspectorFactory.javaLongObjectInspector
                        : PrimitiveObjectInspectorFactory.javaDoubleObjectInspector;
        return ObjectInspectorFactory.getStandardListObjectInspector(resultElemOI);
    }

    /**
     * Computes the element-wise sum of the two array arguments.
     *
     * @param args the two deferred array arguments
     * @return the list of sums, or {@code null} if either argument evaluates to {@code null}
     * @throws HiveException if the two arrays differ in length
     */
    @Nullable
    @Override
    public List evaluate(@Nonnull DeferredObject[] args) throws HiveException {
        // Both arguments are materialized before the null check.
        final Object left = args[0].get();
        final Object right = args[1].get();
        if (left == null || right == null) {
            return null;
        }

        final int leftLen = xOI.getListLength(left);
        final int rightLen = yOI.getListLength(right);
        if (leftLen != rightLen) {
            throw new HiveException("vector lengths do not match. x=" + xOI.getList(left)
                    + ", y=" + yOI.getList(right));
        }

        return floatingPoints ? evaluateDouble(left, right, leftLen)
                : evaluateLong(left, right, leftLen);
    }

    /**
     * Adds the two vectors using double arithmetic.
     *
     * @param vecX the first list object, read through {@code xOI}
     * @param vecY the second list object, read through {@code yOI}
     * @param size number of elements to process
     * @return a fixed-size list of {@code size} sums; a slot is {@code null} where either input
     *         element is {@code null}
     */
    @Nonnull
    private List evaluateDouble(@Nonnull final Object vecX, @Nonnull final Object vecY,
            @Nonnegative final int size) {
        final Double[] sums = new Double[size];
        for (int idx = 0; idx < size; idx++) {
            final Object lhs = xOI.getListElement(vecX, idx);
            final Object rhs = yOI.getListElement(vecY, idx);
            if (lhs != null && rhs != null) {
                final double a = PrimitiveObjectInspectorUtils.getDouble(lhs, xElemOI);
                final double b = PrimitiveObjectInspectorUtils.getDouble(rhs, yElemOI);
                sums[idx] = Double.valueOf(a + b);
            }
            // otherwise the slot keeps its default null
        }
        return Arrays.asList(sums);
    }

    /**
     * Adds the two vectors using long arithmetic.
     *
     * @param vecX the first list object, read through {@code xOI}
     * @param vecY the second list object, read through {@code yOI}
     * @param size number of elements to process
     * @return a fixed-size list of {@code size} sums; a slot is {@code null} where either input
     *         element is {@code null}
     */
    @Nonnull
    private List evaluateLong(@Nonnull final Object vecX, @Nonnull final Object vecY,
            @Nonnegative final int size) {
        final Long[] sums = new Long[size];
        for (int idx = 0; idx < size; idx++) {
            final Object lhs = xOI.getListElement(vecX, idx);
            final Object rhs = yOI.getListElement(vecY, idx);
            if (lhs != null && rhs != null) {
                final long a = PrimitiveObjectInspectorUtils.getLong(lhs, xElemOI);
                final long b = PrimitiveObjectInspectorUtils.getLong(rhs, yElemOI);
                sums[idx] = Long.valueOf(a + b);
            }
            // otherwise the slot keeps its default null
        }
        return Arrays.asList(sums);
    }

    /**
     * Renders the call for display as {@code vector_add(<args joined by commas>)}.
     *
     * @param args string forms of the call arguments
     * @return the display string
     */
    @Override
    public String getDisplayString(String[] args) {
        return "vector_add(" + StringUtils.join(args, ',') + ")";
    }

}




© 2015 - 2025 Weber Informatics LLC | Privacy Policy