org.apache.mahout.vectorizer.encoders.ContinuousValueEncoder Maven / Gradle / Ivy
Go to download
Show more of this group Show more artifacts with this name
Show all versions of mahout-mr Show documentation
Show all versions of mahout-mr Show documentation
Scalable machine learning libraries
/*
* Licensed to the Apache Software Foundation (ASF) under one or more
* contributor license agreements. See the NOTICE file distributed with
* this work for additional information regarding copyright ownership.
* The ASF licenses this file to You under the Apache License, Version 2.0
* (the "License"); you may not use this file except in compliance with
* the License. You may obtain a copy of the License at
*
* http://www.apache.org/licenses/LICENSE-2.0
*
* Unless required by applicable law or agreed to in writing, software
* distributed under the License is distributed on an "AS IS" BASIS,
* WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
* See the License for the specific language governing permissions and
* limitations under the License.
*/
package org.apache.mahout.vectorizer.encoders;
import com.google.common.base.Charsets;
import org.apache.mahout.math.Vector;
/**
 * Encodes a continuous (numeric) value into a feature vector. Continuous values are stored in
 * fixed randomized locations in the feature vector.
 *
 * <p>The value arrives as the UTF-8 text of a number. It is parsed, multiplied by the caller's
 * weight, and the product is added at every probe location reported by {@code hashForProbe}.
 */
public class ContinuousValueEncoder extends CachingValueEncoder {

  /**
   * Creates an encoder with the given name, passing {@code CONTINUOUS_VALUE_HASH_SEED} to the
   * superclass as the seed.
   *
   * @param name The name of this encoder; handed through to the superclass constructor.
   */
  public ContinuousValueEncoder(String name) {
    super(name, CONTINUOUS_VALUE_HASH_SEED);
  }

  /**
   * Adds a value to a vector. The same increment, {@code getWeight(originalForm, weight)}, is
   * added to the current content of each probe location.
   *
   * @param originalForm The original form of the value: the UTF-8 bytes of a number, or
   *                     {@code null} to add {@code weight} itself (see {@link #getWeight}).
   * @param weight       The multiplier applied to the parsed value.
   * @param data         The vector to which the value should be added.
   * @throws NumberFormatException if there is at least one probe and {@code originalForm} is
   *                               non-null but does not hold a parsable number.
   */
  @Override
  public void addToVector(byte[] originalForm, double weight, Vector data) {
    int probes = getProbes();
    String name = getName();
    if (probes <= 0) {
      // Nothing to update. Returning before the parse keeps the no-probe case a silent no-op,
      // even for input that would not parse.
      return;
    }

    // The increment depends only on the arguments, not on the probe index, so decode and parse
    // the value once instead of once per probe.
    double increment = getWeight(originalForm, weight);

    for (int i = 0; i < probes; i++) {
      int n = hashForProbe(originalForm, data.size(), name, i);
      if (isTraceEnabled()) {
        // NOTE(review): a null string is passed to trace here; presumably only the location
        // matters for a continuous value -- confirm against the superclass trace method.
        trace((String) null, n);
      }
      data.set(n, data.get(n) + increment);
    }
  }

  /**
   * Computes the amount to add to the vector for a value.
   *
   * @param originalForm The UTF-8 bytes of a number, or {@code null}.
   * @param w            The weight supplied by the caller.
   * @return {@code w} unchanged when {@code originalForm} is {@code null}; otherwise {@code w}
   *         multiplied by the number parsed from {@code originalForm}.
   * @throws NumberFormatException if {@code originalForm} is non-null and does not hold a
   *                               parsable number.
   */
  @Override
  protected double getWeight(byte[] originalForm, double w) {
    if (originalForm == null) {
      return w;
    }
    return w * Double.parseDouble(new String(originalForm, Charsets.UTF_8));
  }

  /**
   * Converts a value into a form that would help a human understand how the value is being
   * interpreted. For this encoder that is the encoder name and the original form separated by
   * a colon.
   *
   * @param originalForm The original form of the value as a string.
   * @return A string that a human can read, of the form {@code name:originalForm}.
   */
  @Override
  public String asString(String originalForm) {
    return getName() + ':' + originalForm;
  }

  /**
   * Returns the hash seed used by this encoder.
   *
   * @return {@code CONTINUOUS_VALUE_HASH_SEED}.
   */
  @Override
  protected int getSeed() {
    return CONTINUOUS_VALUE_HASH_SEED;
  }
}
© 2015 - 2024 Weber Informatics LLC | Privacy Policy