All Downloads are FREE. Search and download functionalities are using the official Maven repository.

opennlp.tools.util.featuregen.WordClusterFeatureGeneratorFactory Maven / Gradle / Ivy

There is a newer version: 2.5.0
Show newest version
/*
 * Licensed to the Apache Software Foundation (ASF) under one or more
 * contributor license agreements.  See the NOTICE file distributed with
 * this work for additional information regarding copyright ownership.
 * The ASF licenses this file to You under the Apache License, Version 2.0
 * (the "License"); you may not use this file except in compliance with
 * the License. You may obtain a copy of the License at
 *
 *     http://www.apache.org/licenses/LICENSE-2.0
 *
 * Unless required by applicable law or agreed to in writing, software
 * distributed under the License is distributed on an "AS IS" BASIS,
 * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
 * See the License for the specific language governing permissions and
 * limitations under the License.
 */

package opennlp.tools.util.featuregen;

import java.util.HashMap;
import java.util.Map;

import org.w3c.dom.Element;

import opennlp.tools.util.InvalidFormatException;
import opennlp.tools.util.model.ArtifactSerializer;

/**
 * Defines a word cluster generator factory; it reads an element containing
 * 'w2vwordcluster' as a tag name; these clusters are typically produced by
 * word2vec or clark pos induction systems.
 */
public class WordClusterFeatureGeneratorFactory
    extends GeneratorFactory.AbstractXmlFeatureGeneratorFactory
    implements GeneratorFactory.XmlFeatureGeneratorFactory {

  public WordClusterFeatureGeneratorFactory() {
    super();
  }

  @Deprecated // TODO: (OPENNLP-1174) just remove when back-compat is no longer needed
  public AdaptiveFeatureGenerator create(Element generatorElement,
             FeatureGeneratorResourceProvider resourceManager) throws InvalidFormatException {

    String dictResourceKey = generatorElement.getAttribute("dict");
    boolean lowerCaseDictionary = "true".equals(generatorElement.getAttribute("lowerCase"));

    Object dictResource = resourceManager.getResource(dictResourceKey);


    if (!(dictResource instanceof WordClusterDictionary)) {
      throw new InvalidFormatException("Not a WordClusterDictionary resource for key: "
          + dictResourceKey);
    }

    return new WordClusterFeatureGenerator((WordClusterDictionary) dictResource,
        dictResourceKey, lowerCaseDictionary);
  }

  @Deprecated // TODO: (OPENNLP-1174) just remove when back-compat is no longer needed
  static void register(Map factoryMap) {
    factoryMap.put("wordcluster", new WordClusterFeatureGeneratorFactory());
  }

  @Override
  public AdaptiveFeatureGenerator create() throws InvalidFormatException {
    // if resourceManager is null, we don't instantiate
    if (resourceManager == null)
      return null;

    String dictResourceKey = getStr("dict");
    boolean lowerCaseDictionary = getBool("lowerCase");
    Object dictResource = resourceManager.getResource(dictResourceKey);
    if (!(dictResource instanceof WordClusterDictionary)) {
      throw new InvalidFormatException("Not a WordClusterDictionary resource for key: "
          + dictResourceKey);
    }

    return new WordClusterFeatureGenerator((WordClusterDictionary) dictResource,
        dictResourceKey, lowerCaseDictionary);
  }

  @Override
  public Map> getArtifactSerializerMapping() throws InvalidFormatException {
    Map> mapping = new HashMap<>();
    mapping.put(getStr("dict"), new WordClusterDictionary.WordClusterDictionarySerializer());
    return mapping;
  }
}




© 2015 - 2024 Weber Informatics LLC | Privacy Policy