All Downloads are FREE. Search and download functionalities are using the official Maven repository.

org.deeplearning4j.arbiter.conf.updater.AdaMaxSpace Maven / Gradle / Ivy

There is a newer version: 1.0.0-beta7
Show newest version
package org.deeplearning4j.arbiter.conf.updater;

import lombok.Data;
import lombok.EqualsAndHashCode;
import org.deeplearning4j.arbiter.optimize.api.ParameterSpace;
import org.nd4j.linalg.learning.config.AdaMax;
import org.nd4j.linalg.learning.config.IUpdater;
import org.nd4j.linalg.schedule.ISchedule;
import org.nd4j.shade.jackson.annotation.JsonProperty;

@Data
@EqualsAndHashCode(callSuper = false)
public class AdaMaxSpace extends BaseUpdaterSpace {

    private ParameterSpace learningRate;
    private ParameterSpace learningRateSchedule;
    private ParameterSpace beta1;
    private ParameterSpace beta2;
    private ParameterSpace epsilon;

    public AdaMaxSpace(ParameterSpace learningRate) {
        this(learningRate, null, null, null);
    }

    public AdaMaxSpace(ParameterSpace learningRate, ParameterSpace beta1,
                       ParameterSpace beta2, ParameterSpace epsilon) {
        this(learningRate, null, beta1, beta2, epsilon);
    }

    public AdaMaxSpace(@JsonProperty("learningRate") ParameterSpace learningRate,
                       @JsonProperty("learningRateSchedule") ParameterSpace learningRateSchedule,
                       @JsonProperty("beta1") ParameterSpace beta1,
                       @JsonProperty("beta2") ParameterSpace beta2,
                       @JsonProperty("epsilon") ParameterSpace epsilon){
        this.learningRate = learningRate;
        this.learningRateSchedule = learningRateSchedule;
        this.beta1 = beta1;
        this.beta2 = beta2;
        this.epsilon = epsilon;
    }

    public static AdaMaxSpace withLR(ParameterSpace lr){
        return new AdaMaxSpace(lr, null, null, null, null);
    }

    public static AdaMaxSpace withLRSchedule(ParameterSpace lrSchedule){
        return new AdaMaxSpace(null, lrSchedule, null, null, null);
    }

    @Override
    public IUpdater getValue(double[] parameterValues) {
        double lr = learningRate == null ? AdaMax.DEFAULT_ADAMAX_LEARNING_RATE : learningRate.getValue(parameterValues);
        ISchedule lrS = learningRateSchedule == null ? null : learningRateSchedule.getValue(parameterValues);
        double b1 = beta1 == null ? AdaMax.DEFAULT_ADAMAX_LEARNING_RATE : beta1.getValue(parameterValues);
        double b2 = beta2 == null ? AdaMax.DEFAULT_ADAMAX_LEARNING_RATE : beta2.getValue(parameterValues);
        double eps = epsilon == null ? AdaMax.DEFAULT_ADAMAX_LEARNING_RATE : epsilon.getValue(parameterValues);
        if(lrS == null){
            return new AdaMax(lr, b1, b2, eps);
        } else {
            AdaMax a = new AdaMax(lrS);
            a.setBeta1(b1);
            a.setBeta2(b2);
            a.setEpsilon(eps);
            return a;
        }
    }
}




© 2015 - 2025 Weber Informatics LLC | Privacy Policy