All downloads are free. Search and download functionality uses the official Maven repository.

com.simiacryptus.text.MinEntropyWrapper Maven / Gradle / Ivy

There is a newer version: 2.1.0
Show newest version
/*
 * Copyright (c) 2019 by Andrew Charneski.
 *
 * The author licenses this file to you under the
 * Apache License, Version 2.0 (the "License");
 * you may not use this file except in compliance
 * with the License.  You may obtain a copy
 * of the License at
 *
 *   http://www.apache.org/licenses/LICENSE-2.0
 *
 * Unless required by applicable law or agreed to in writing,
 * software distributed under the License is distributed on an
 * "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY
 * KIND, either express or implied.  See the License for the
 * specific language governing permissions and limitations
 * under the License.
 */

package com.simiacryptus.text;

import com.simiacryptus.ref.wrappers.RefString;
import org.slf4j.Logger;
import org.slf4j.LoggerFactory;

import javax.annotation.Nonnull;
import java.util.ArrayList;
import java.util.Arrays;
import java.util.stream.DoubleStream;
import java.util.stream.IntStream;

/**
 * Wraps a child {@link LanguageCodeModel} and flattens its output until the
 * entropy of the result exceeds a configurable threshold.
 *
 * <p>On each {@link #eval(int)} the child's output is raised element-wise to a
 * sequence of decreasing exponents (1.0, 0.9, 0.81, ...), passed through
 * {@code SumModel.normalize}, and the first candidate whose entropy (in bits)
 * is strictly greater than {@link #getValue()} is returned.
 */
public class MinEntropyWrapper extends ModelWrapper {
  protected static final Logger logger = LoggerFactory.getLogger(MinEntropyWrapper.class);
  /**
   * Exponents tried by {@link #eval(int)}, in order: 1.0 followed by repeated
   * multiplication by 0.9, 1000 entries in total. Computed once because the
   * values never depend on the input. Must not be modified.
   */
  private static final double[] POWER_SCHEDULE = DoubleStream.iterate(1.0, x -> x * 0.9).limit(1000).toArray();
  /**
   * Entropy of the child's raw output, one entry per {@link #eval(int)} call.
   * NOTE(review): nothing in this class reads or trims this list, so it grows
   * for the lifetime of the instance - confirm whether it is still needed.
   */
  private final ArrayList<Double> entropyHistory = new ArrayList<>();
  /** Entropy threshold, in bits, that the returned values should exceed. */
  private double value;

  /**
   * @param value entropy threshold in bits
   * @param child the model whose output is adjusted
   */
  public MinEntropyWrapper(double value, LanguageCodeModel child) {
    super(child);
    this.value = value;
  }

  /**
   * @return the current entropy threshold in bits
   */
  public double getValue() {
    return value;
  }

  /**
   * @param value the new entropy threshold in bits
   */
  public void setValue(double value) {
    this.value = value;
  }

  /**
   * Computes {@code -sum(p * log2(p))} over the given values.
   * Entries that are zero or negative contribute nothing to the sum.
   *
   * @param floats the values to measure; not modified
   * @return the entropy in bits
   */
  public static double entropy(@Nonnull float[] floats) {
    return IntStream.range(0, floats.length).mapToDouble(i -> {
      float p = floats[i];
      return p <= 0 ? 0 : -p * Math.log(p);
    }).sum() / Math.log(2);
  }

  /**
   * Returns a new array holding each input element raised to {@code value}.
   *
   * @param floats the source values; not modified
   * @param value  the exponent
   * @return a fresh array of the same length as {@code floats}
   */
  @Nonnull
  public static float[] powCopy(@Nonnull float[] floats, double value) {
    float[] copy = Arrays.copyOf(floats, floats.length);
    pow(copy, value);
    return copy;
  }

  /**
   * Raises every element of {@code floats} to {@code value}, in place.
   *
   * @param floats the array to overwrite
   * @param value  the exponent
   */
  public static void pow(@Nonnull float[] floats, double value) {
    for (int i = 0; i < floats.length; i++) {
      floats[i] = (float) Math.pow(floats[i], value);
    }
  }

  /**
   * Evaluates the first child model and returns the first flattened, normalized
   * copy of its output whose entropy is strictly greater than the threshold.
   *
   * <p>If no exponent in the schedule produces such a copy, the child's output
   * is returned exactly as the child produced it (no normalization is applied
   * on that path).
   *
   * @param data_X the input forwarded unchanged to the child model
   * @return the adjusted values, or the child's own output if the threshold was never exceeded
   */
  @Override
  public float[] eval(int data_X) {
    LanguageCodeModel child = children[0];
    float[] floats = child.eval(data_X);
    double entropy = entropy(floats);
    entropyHistory.add(entropy);
    for (double exponent : POWER_SCHEDULE) {
      // Work on a copy so the child's output stays intact for the next exponent.
      float[] copy = powCopy(floats, exponent);
      // presumably rescales the array to sum to 1 - SumModel is declared elsewhere; verify
      SumModel.normalize(copy);
      if (entropy(copy) > value) {
        floats = copy;
        break;
      }
    }
    // Skip the string formatting and the extra entropy pass unless debug output is wanted.
    if (logger.isDebugEnabled()) {
      logger.debug(RefString.format("Entropy = %s => %s", entropy, entropy(floats)));
    }
    return floats;
  }
}




© 2015 - 2024 Weber Informatics LLC | Privacy Policy