com.simiacryptus.text.SimpleModel Maven / Gradle / Ivy
Go to download
Show more of this group Show more artifacts with this name
Show all versions of tf-gpt-2 Show documentation
Show all versions of tf-gpt-2 Show documentation
GPT-2 Text Prediction via Tensorflow Java API
/*
* Copyright (c) 2019 by Andrew Charneski.
*
* The author licenses this file to you under the
* Apache License, Version 2.0 (the "License");
* you may not use this file except in compliance
* with the License. You may obtain a copy
* of the License at
*
* http://www.apache.org/licenses/LICENSE-2.0
*
* Unless required by applicable law or agreed to in writing,
* software distributed under the License is distributed on an
* "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY
* KIND, either express or implied. See the License for the
* specific language governing permissions and limitations
* under the License.
*/
package com.simiacryptus.text;
import com.simiacryptus.text.gpt2.GPT2Codec;
import org.tensorflow.Tensor;
import java.util.Arrays;
import java.util.List;
import java.util.Map;
import java.util.function.BiFunction;
import java.util.stream.Collectors;
public class SimpleModel implements LanguageCodeModel {
private final float[] result;
public SimpleModel(float... result) {
this.result = Arrays.copyOf(result, result.length);
}
public static SimpleModel build(GPT2Codec codec, String text) {
List encode = codec.encode(text);
Map counts = encode.stream().collect(Collectors.groupingBy(x -> x, Collectors.counting()));
float[] result = new float[codec.getVocabSize()];
for (int i = 0; i < result.length; i++) {
result[i] = ((float) counts.getOrDefault(i, 0l)) / encode.size();
}
return new SimpleModel(result);
}
@Override
public LanguageCodeModel copy() {
return new SimpleModel(result);
}
@Override
public LanguageCodeModel clear() {
return this;
}
@Override
public float[] eval(int data_X) {
return Arrays.copyOf(result, result.length);
}
@Override
public BiFunction getFilterFn() {
return null;
}
@Override
public LanguageCodeModel setFilterFn(BiFunction filterFn) {
return this;
}
@Override
public Tensor> state() {
return null;
}
public LanguageCodeModel setTemperature(double temperature) {
return this;
}
}
© 2015 - 2025 Weber Informatics LLC | Privacy Policy