All Downloads are FREE. Search and download functionalities are using the official Maven repository.

org.deeplearning4j.earlystopping.saver.LocalFileModelSaver Maven / Gradle / Ivy

There is a newer version: 1.0.0-M2.1
Show newest version
package org.deeplearning4j.earlystopping.saver;

import org.apache.commons.io.FilenameUtils;
import org.deeplearning4j.earlystopping.EarlyStoppingModelSaver;
import org.deeplearning4j.nn.multilayer.MultiLayerNetwork;
import org.deeplearning4j.util.ModelSerializer;

import java.io.File;
import java.io.IOException;
import java.nio.charset.Charset;

/** Save the best (and latest/most recent) models learned during early stopping training to the local file system.
* Instances of this class will save 3 files for best (and optionally, latest) models:
* (a) The network configuration: bestModelConf.json
* (b) The network parameters: bestModelParams.bin
* (c) The network updater: bestModelUpdater.bin
*
* NOTE: The model updater is an object that contains the internal state for training features such as AdaGrad, Momentum * and RMSProp.
* The updater is not required to use the network at test time; it is saved in case further training is required. * Without saving the updater, any further training would result in the updater being recreated, without the benefit * of the history/internal state. This could negatively impact training performance after loading the network. * * @author Alex Black */ public class LocalFileModelSaver implements EarlyStoppingModelSaver { private static final String bestFileName = "bestModel.bin"; private static final String latestFileName = "latestModel.bin"; private String directory; private Charset encoding; /**Constructor that uses default character set for configuration (json) encoding * @param directory Directory to save networks */ public LocalFileModelSaver(String directory) { this(directory, Charset.defaultCharset()); } /** * @param directory Directory to save networks * @param encoding Character encoding for configuration (json) */ public LocalFileModelSaver(String directory, Charset encoding) { this.directory = directory; this.encoding = encoding; File dir = new File(directory); if (!dir.exists()) { dir.mkdirs(); } } @Override public void saveBestModel(MultiLayerNetwork net, double score) throws IOException { String confOut = FilenameUtils.concat(directory, bestFileName); save(net, confOut); } @Override public void saveLatestModel(MultiLayerNetwork net, double score) throws IOException { String confOut = FilenameUtils.concat(directory, latestFileName); save(net, confOut); } @Override public MultiLayerNetwork getBestModel() throws IOException { String confOut = FilenameUtils.concat(directory, bestFileName); return load(confOut); } @Override public MultiLayerNetwork getLatestModel() throws IOException { String confOut = FilenameUtils.concat(directory, latestFileName); return load(confOut); } private void save(MultiLayerNetwork net, String modelName) throws IOException { ModelSerializer.writeModel(net, modelName, true); } private MultiLayerNetwork load(String modelName) throws IOException { MultiLayerNetwork net = ModelSerializer.restoreMultiLayerNetwork(modelName); return net; } @Override public String toString() { return "LocalFileModelSaver(dir=" + directory + ")"; } }




© 2015 - 2024 Weber Informatics LLC | Privacy Policy