org.deeplearning4j.nn.api.ParamInitializer Maven / Gradle / Ivy
/*-
*
* * Copyright 2015 Skymind,Inc.
* *
* * Licensed under the Apache License, Version 2.0 (the "License");
* * you may not use this file except in compliance with the License.
* * You may obtain a copy of the License at
* *
* * http://www.apache.org/licenses/LICENSE-2.0
* *
* * Unless required by applicable law or agreed to in writing, software
* * distributed under the License is distributed on an "AS IS" BASIS,
* * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
* * See the License for the specific language governing permissions and
* * limitations under the License.
*
*/
package org.deeplearning4j.nn.api;
import org.deeplearning4j.nn.conf.NeuralNetConfiguration;
import org.deeplearning4j.nn.conf.layers.*;
import org.nd4j.linalg.api.ndarray.INDArray;
import java.util.Map;
/**
* Param initializer for a layer
*
* @author Adam Gibson
*/
public interface ParamInitializer {
int numParams(NeuralNetConfiguration conf);
int numParams(org.deeplearning4j.nn.conf.layers.Layer layer);
/**
* Initialize the parameters
*
* @param conf the configuration
* @param paramsView a view of the full network (backprop) parameters
* @param initializeParams if true: initialize the parameters according to the configuration. If false: don't modify the
* values in the paramsView array (but do select out the appropriate subset, reshape etc as required)
* @return Map of parameters keyed by type (view of the 'paramsView' array)
*/
Map init(NeuralNetConfiguration conf, INDArray paramsView, boolean initializeParams);
/**
* Return a map of gradients (in their standard non-flattened representation), taken from the flattened (row vector) gradientView array.
* The idea is that operates in exactly the same way as the the paramsView does in {@link #init(Map, NeuralNetConfiguration, INDArray)};
* thus the position in the view (and, the array orders) must match those of the parameters
*
* @param conf Configuration
* @param gradientView The flattened gradients array, as a view of the larger array
* @return A map containing an array by parameter type, that is a view of the full network gradients array
*/
Map getGradientsFromFlattened(NeuralNetConfiguration conf, INDArray gradientView);
}
© 2015 - 2024 Weber Informatics LLC | Privacy Policy