com.simiacryptus.mindseye.layers.java.GaussianActivationLayer Maven / Gradle / Ivy
Go to download
Show more of this group Show more artifacts with this name
Show all versions of mindseye-java Show documentation
Show all versions of mindseye-java Show documentation
Pure Java Neural Networks Components
/*
* Copyright (c) 2019 by Andrew Charneski.
*
* The author licenses this file to you under the
* Apache License, Version 2.0 (the "License");
* you may not use this file except in compliance
* with the License. You may obtain a copy
* of the License at
*
* http://www.apache.org/licenses/LICENSE-2.0
*
* Unless required by applicable law or agreed to in writing,
* software distributed under the License is distributed on an
* "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY
* KIND, either express or implied. See the License for the
* specific language governing permissions and limitations
* under the License.
*/
package com.simiacryptus.mindseye.layers.java;
import com.google.gson.JsonObject;
import com.simiacryptus.mindseye.lang.DataSerializer;
import javax.annotation.Nonnull;
import java.util.Map;
/**
* This activation key uses the unit gaussian curve. The maximal response, at x=0, is y=1. At +/- infinity, the value
* is zero.
*/
@SuppressWarnings("serial")
public final class GaussianActivationLayer extends SimpleActivationLayer {
private static final double MIN_X = -20;
private static final double MAX_X = -GaussianActivationLayer.MIN_X;
private static final double MAX_F = Math.exp(GaussianActivationLayer.MAX_X);
private static final double MIN_F = Math.exp(GaussianActivationLayer.MIN_X);
private final double mean;
private final double stddev;
/**
* Instantiates a new Gaussian activation key.
*
* @param mean the mean
* @param stddev the stddev
*/
public GaussianActivationLayer(final double mean, final double stddev) {
this.mean = mean;
this.stddev = stddev;
}
/**
* Instantiates a new Gaussian activation key.
*
* @param id the id
*/
protected GaussianActivationLayer(@Nonnull final JsonObject id) {
super(id);
mean = id.get("mean").getAsDouble();
stddev = id.get("stddev").getAsDouble();
}
/**
* From json gaussian activation key.
*
* @param json the json
* @param rs the rs
* @return the gaussian activation key
*/
public static GaussianActivationLayer fromJson(@Nonnull final JsonObject json, Map rs) {
return new GaussianActivationLayer(json);
}
@Override
protected final void eval(final double x, final double[] results) {
final double minDeriv = 0;
final double c = x - mean;
final double s2 = stddev * stddev;
final double s3 = stddev * s2;
final double k = Math.sqrt(2 * Math.PI);
final double e = exp(-(c * c / (2 * s2)));
double d = e * c / (s3 * k);
final double f = e / (stddev * k);
// double d = f * (1 - f);
if (!Double.isFinite(d) || Math.abs(d) < minDeriv) {
d = minDeriv * Math.signum(d);
}
assert Double.isFinite(d);
assert minDeriv <= Math.abs(d);
results[0] = f;
results[1] = -d;
}
private double exp(final double x) {
if (x < GaussianActivationLayer.MIN_X) {
return GaussianActivationLayer.MIN_F;
}
if (x > GaussianActivationLayer.MAX_X) {
return GaussianActivationLayer.MAX_F;
}
return Math.exp(x);
}
@Nonnull
@Override
public JsonObject getJson(Map resources, DataSerializer dataSerializer) {
@Nonnull final JsonObject json = super.getJsonStub();
json.addProperty("mean", mean);
json.addProperty("stddev", stddev);
return json;
}
}