All downloads are free. Search and download functionality uses the official Maven repository.

cc.mallet.share.upenn.ner.FeatureWindow Maven / Gradle / Ivy

Go to download

MALLET is a Java-based package for statistical natural language processing, document classification, clustering, topic modeling, information extraction, and other machine learning applications to text.

The newest version!
package cc.mallet.share.upenn.ner;


import java.util.*;

import cc.mallet.pipe.*;
import cc.mallet.types.*;
import cc.mallet.util.*;
import gnu.trove.*;

/**
 * Adds all features of tokens in the window to the center token.
 */
public class FeatureWindow extends Pipe implements java.io.Serializable {

    int left, right;
    /**
     * Creates a pipe with the given left and right window extents.
     *
     * @param left  extent of the window to the left; must be non-negative
     * @param right extent of the window to the right; must be non-negative
     * @throws IllegalArgumentException if either extent is negative
     */
    public FeatureWindow (int left, int right) {
        // Validate explicitly rather than with assert: assertions are disabled
        // unless the JVM is started with -ea, so an assert would let negative
        // extents through silently in normal runs.
        if (left < 0 || right < 0) {
            throw new IllegalArgumentException(
                "Window extents must be non-negative: left=" + left + ", right=" + right);
        }
        this.left = left;
        this.right = right;
    }

    public Instance pipe (Instance carrier) {
        TokenSequence seq = (TokenSequence)carrier.getData();
        TObjectDoubleHashMap[] original = new TObjectDoubleHashMap[seq.size()];
        for (int i=0; i=original.length) continue;
                
                Token t = seq.get(i);
                Object[] features = original[index].keys();
                for (int k=0; k




© 2015 - 2025 Weber Informatics LLC | Privacy Policy