All downloads are free. Search and download functionality uses the official Maven repository.

com.simiacryptus.text.SimpleModel Maven / Gradle / Ivy

There is a newer version: 2.1.0
Show newest version
/*
 * Copyright (c) 2019 by Andrew Charneski.
 *
 * The author licenses this file to you under the
 * Apache License, Version 2.0 (the "License");
 * you may not use this file except in compliance
 * with the License.  You may obtain a copy
 * of the License at
 *
 *   http://www.apache.org/licenses/LICENSE-2.0
 *
 * Unless required by applicable law or agreed to in writing,
 * software distributed under the License is distributed on an
 * "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY
 * KIND, either express or implied.  See the License for the
 * specific language governing permissions and limitations
 * under the License.
 */

package com.simiacryptus.text;

import com.simiacryptus.text.gpt2.GPT2Codec;
import org.tensorflow.Tensor;

import java.util.Arrays;
import java.util.List;
import java.util.Map;
import java.util.function.BiFunction;
import java.util.stream.Collectors;

/**
 * A context-free {@link LanguageCodeModel} that answers every evaluation with
 * the same fixed vector of per-token values.
 *
 * <p>The vector is stored privately and only ever handed out as a copy, so an
 * instance cannot be altered through the arrays passed in or returned.
 */
public class SimpleModel implements LanguageCodeModel {

  /** Fixed per-token values, indexed by token id; returned (as a copy) by every {@link #eval(int)} call. */
  private final float[] result;

  /**
   * Creates a model around a private copy of the given values.
   *
   * @param result per-token values; copied, so later changes to the caller's array have no effect
   */
  public SimpleModel(float... result) {
    this.result = Arrays.copyOf(result, result.length);
  }

  /**
   * Builds a model whose values are the relative frequencies of each token id
   * in the encoded form of {@code text}.
   *
   * <p>Entry {@code i} of the resulting vector is the number of occurrences of
   * token id {@code i} divided by the total number of encoded tokens. Token ids
   * outside {@code [0, codec.getVocabSize())} are not represented in the vector.
   * If the text encodes to no tokens at all, every entry is {@code 0} rather
   * than the {@code NaN} a zero-by-zero division would produce.
   *
   * @param codec codec used to tokenize the text and to size the vector
   * @param text  text whose token frequencies are measured
   * @return a new model holding the frequency vector
   */
  public static SimpleModel build(GPT2Codec codec, String text) {
    // NOTE(review): assumes GPT2Codec.encode returns List<Integer> (token ids) - confirm against the codec.
    List<Integer> tokens = codec.encode(text);
    float[] frequencies = new float[codec.getVocabSize()];
    if (tokens.isEmpty()) {
      // Nothing was observed: keep all frequencies at zero instead of dividing 0 by 0.
      return new SimpleModel(frequencies);
    }
    Map<Integer, Long> counts = tokens.stream()
        .collect(Collectors.groupingBy(token -> token, Collectors.counting()));
    float total = tokens.size();
    for (int i = 0; i < frequencies.length; i++) {
      frequencies[i] = counts.getOrDefault(i, 0L).floatValue() / total;
    }
    return new SimpleModel(frequencies);
  }

  /**
   * Returns a new model holding its own copy of the same values.
   *
   * @return an independent {@code SimpleModel}
   */
  @Override
  public LanguageCodeModel copy() {
    // The constructor copies the array, so the two instances share no storage.
    return new SimpleModel(result);
  }

  /**
   * Does nothing; the only field of this model is its fixed value vector.
   *
   * @return this instance
   */
  @Override
  public LanguageCodeModel clear() {
    return this;
  }

  /**
   * Returns the fixed value vector; the supplied token is ignored.
   *
   * @param data_X token id being evaluated (unused)
   * @return a fresh copy of the stored values, safe for the caller to modify
   */
  @Override
  public float[] eval(int data_X) {
    return Arrays.copyOf(result, result.length);
  }

  /**
   * This model keeps no filter function.
   *
   * @return always {@code null}
   */
  // NOTE(review): BiFunction is left raw because the interface's type arguments are not visible here.
  @Override
  public BiFunction getFilterFn() {
    return null;
  }

  /**
   * Ignores the supplied filter function; nothing is stored.
   *
   * @param filterFn filter function (unused)
   * @return this instance
   */
  @Override
  public LanguageCodeModel setFilterFn(BiFunction filterFn) {
    return this;
  }

  /**
   * This model exposes no tensor state.
   *
   * @return always {@code null}
   */
  @Override
  public Tensor state() {
    return null;
  }

  /**
   * Ignores the supplied temperature; the stored values are never rescaled.
   *
   * @param temperature sampling temperature (unused)
   * @return this instance
   */
  public LanguageCodeModel setTemperature(double temperature) {
    return this;
  }

}




© 2015 - 2025 Weber Informatics LLC | Privacy Policy