LibtorchANNTrainer.C
//* This file is part of the MOOSE framework
//* https://mooseframework.inl.gov
//*
//* All rights reserved, see COPYRIGHT for full restrictions
//* https://github.com/idaholab/moose/blob/master/COPYRIGHT
//*
//* Licensed under LGPL 2.1, please see LICENSE for details
//* https://www.gnu.org/licenses/lgpl-2.1.html

#ifdef LIBTORCH_ENABLED

#include "LibtorchANNTrainer.h"
#include "LibtorchDataset.h"
#include "Sampler.h"

registerMooseObject("StochasticToolsApp", LibtorchANNTrainer);

InputParameters
LibtorchANNTrainer::validParams()
{
  InputParameters params = SurrogateTrainer::validParams();

  params.addClassDescription("Trains a simple neural network using libtorch.");

  params.addRangeCheckedParam<unsigned int>(
      "num_batches", 1, "1<=num_batches", "Number of batches.");
  params.addRangeCheckedParam<unsigned int>(
      "num_epochs", 1, "0<num_epochs", "Number of training epochs.");
  params.addRangeCheckedParam<Real>(
      "rel_loss_tol",
      0,
      "0<=rel_loss_tol<=1",
      "The relative loss where we stop the training of the neural net.");
  params.addParam<std::vector<unsigned int>>(
      "num_neurons_per_layer", std::vector<unsigned int>(), "Number of neurons per layer.");
  params.addParam<std::vector<std::string>>(
      "activation_function",
      std::vector<std::string>({"relu"}),
      "The type of activation functions to use. It is either one value "
      "or one value per hidden layer.");
  params.addParam<std::string>(
      "nn_filename", "net.pt", "Filename used to output the neural net parameters.");
  params.addParam<bool>("read_from_file",
                        false,
                        "Switch to allow reading old trained neural nets for further training.");
  params.addParam<Real>("learning_rate", 0.001, "Learning rate (relaxation).");
  params.addRangeCheckedParam<unsigned int>(
      "print_epoch_loss",
      0,
      "0<=print_epoch_loss",
      "Epoch training loss printing. 0 - no printing, 1 - every epoch, 10 - every 10th epoch.");
  params.addParam<unsigned int>(
      "seed", 11, "Random number generator seed for stochastic optimizers.");
  params.addParam<unsigned int>(
      "max_processes", 1, "The maximum number of parallel processes that the trainer will use.");

  params.addParam<bool>(
      "standardize_input", true, "Standardize (center and scale) training inputs (x values)");
  params.addParam<bool>(
      "standardize_output", true, "Standardize (center and scale) training outputs (y values)");

  params.suppressParameter<MooseEnum>("response_type");
  return params;
}

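// Example (illustrative sketch only): a minimal input-file block exercising the
// parameters declared above might look like the following. The 'sampler' and
// 'response' parameters come from the SurrogateTrainer base class, and the specific
// object names are placeholders.
//
//   [Trainers]
//     [ann_trainer]
//       type = LibtorchANNTrainer
//       sampler = train_sampler
//       response = results/response
//       num_epochs = 100
//       num_batches = 10
//       num_neurons_per_layer = '16 16'
//       activation_function = 'relu'
//       learning_rate = 0.001
//       nn_filename = net.pt
//     []
//   []
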
LibtorchANNTrainer::LibtorchANNTrainer(const InputParameters & parameters)
  : SurrogateTrainer(parameters),
    _predictor_row(getPredictorData()),
    _num_neurons_per_layer(declareModelData<std::vector<unsigned int>>(
        "num_neurons_per_layer", getParam<std::vector<unsigned int>>("num_neurons_per_layer"))),
    _activation_function(declareModelData<std::vector<std::string>>(
        "activation_function", getParam<std::vector<std::string>>("activation_function"))),
    _nn_filename(getParam<std::string>("nn_filename")),
    _read_from_file(getParam<bool>("read_from_file")),
    _nn(declareModelData<std::shared_ptr<Moose::LibtorchArtificialNeuralNet>>("nn")),
    _standardize_input(getParam<bool>("standardize_input")),
    _standardize_output(getParam<bool>("standardize_output")),
    _input_standardizer(declareModelData<StochasticTools::Standardizer>("input_standardizer")),
    _output_standardizer(declareModelData<StochasticTools::Standardizer>("output_standardizer"))
{
  // Fixing the RNG seed to make sure every experiment is the same.
  // Otherwise sampling / stochastic gradient descent would be different.
  torch::manual_seed(getParam<unsigned int>("seed"));

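  // Collect the user-supplied optimization settings; this struct is handed to the
  // libtorch-based trainer in postTrain()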
  _optim_options.learning_rate = getParam<Real>("learning_rate");
  _optim_options.num_epochs = getParam<unsigned int>("num_epochs");
  _optim_options.num_batches = getParam<unsigned int>("num_batches");
  _optim_options.rel_loss_tol = getParam<Real>("rel_loss_tol");
  _optim_options.print_loss = getParam<unsigned int>("print_epoch_loss") > 0;
  _optim_options.print_epoch_loss = getParam<unsigned int>("print_epoch_loss");
  _optim_options.parallel_processes = getParam<unsigned int>("max_processes");
}

void
LibtorchANNTrainer::preTrain()
{
  // Resize to number of sample points
  _flattened_data.clear();
  _flattened_response.clear();
  _flattened_data.reserve(getLocalSampleSize() * _n_dims);
  _flattened_response.reserve(getLocalSampleSize());
}

void
LibtorchANNTrainer::train()
{
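  // Called once per sample: append the current predictor row and the corresponding
  // response value to the flattened storage used later to build the torch::Tensors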
  for (auto & p : _predictor_row)
    _flattened_data.push_back(p);

  _flattened_response.push_back(*_rval);
}

void
LibtorchANNTrainer::postTrain()
{
  // First, gather the training data collected on each rank onto every processor
  _communicator.allgather(_flattened_data);
  _communicator.allgather(_flattened_response);

  // Then, we create and load our Tensors
  unsigned int num_samples = _flattened_response.size();
  unsigned int num_inputs = _n_dims;

  // We create a neural net (for the definition of the net see the header file)
  _nn = std::make_shared<Moose::LibtorchArtificialNeuralNet>(
      _nn_filename, num_inputs, 1, _num_neurons_per_layer, _activation_function);

  if (_read_from_file)
    try
    {
      torch::load(_nn, _nn_filename);
      _console << "Loaded requested .pt file." << std::endl;
    }
    catch (const c10::Error & e)
    {
      mooseError("The requested pytorch file could not be loaded.\n", e.msg());
    }

  // The default data type in pytorch is float, while we use double in MOOSE.
  // Therefore, in some cases we have to convert Tensors to double.
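  // Note: torch::from_blob below only wraps the memory already owned by the
  // flattened data vectors (which are class members); it does not copy the data.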
  auto options = torch::TensorOptions().dtype(at::kDouble);
  torch::Tensor data_tensor =
      torch::from_blob(_flattened_data.data(), {num_samples, num_inputs}, options).to(at::kDouble);
  torch::Tensor response_tensor =
      torch::from_blob(_flattened_response.data(), {num_samples, 1}, options).to(at::kDouble);

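  // The standardizers store the sample mean and standard deviation so that the
  // surrogate can scale new inputs and un-scale predicted outputs at evaluation time.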
  // We standardize the input/output pairs if the user requested it
  if (_standardize_input)
  {
    auto data_std_mean = torch::std_mean(data_tensor, 0);
    auto & data_std = std::get<0>(data_std_mean);
    auto & data_mean = std::get<1>(data_std_mean);

    data_tensor = (data_tensor - data_mean) / data_std;

    std::vector<Real> converted_data_mean;
    LibtorchUtils::tensorToVector(data_mean, converted_data_mean);
    std::vector<Real> converted_data_std;
    LibtorchUtils::tensorToVector(data_std, converted_data_std);
    _input_standardizer.set(converted_data_mean, converted_data_std);
  }
  else
    _input_standardizer.set(num_inputs);

  if (_standardize_output)
  {
    auto response_std_mean = torch::std_mean(response_tensor, 0);
    auto & response_std = std::get<0>(response_std_mean);
    auto & response_mean = std::get<1>(response_std_mean);

    response_tensor = (response_tensor - response_mean) / response_std;

    std::vector<Real> converted_response_mean;
    LibtorchUtils::tensorToVector(response_mean, converted_response_mean);
    std::vector<Real> converted_response_std;
    LibtorchUtils::tensorToVector(response_std, converted_response_std);
    _output_standardizer.set(converted_response_mean, converted_response_std);
  }
  else
    _output_standardizer.set(1);

  // We create a custom data set from our converted data
  Moose::LibtorchDataset my_data(data_tensor, response_tensor);

  // We create a trainer for our neural net and train it with the dataset
  Moose::LibtorchArtificialNeuralNetTrainer<> trainer(*_nn, comm());
  trainer.train(my_data, _optim_options);
}

#endif