// nnet3/nnet-training.h

// Copyright 2015  Johns Hopkins University (author: Daniel Povey)
//           2016  Xiaohui Zhang

// See ../../COPYING for clarification regarding multiple authors
//
// Licensed under the Apache License, Version 2.0 (the "License");
// you may not use this file except in compliance with the License.
// You may obtain a copy of the License at
//
//  http://www.apache.org/licenses/LICENSE-2.0
//
// THIS CODE IS PROVIDED *AS IS* BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY
// KIND, EITHER EXPRESS OR IMPLIED, INCLUDING WITHOUT LIMITATION ANY IMPLIED
// WARRANTIES OR CONDITIONS OF TITLE, FITNESS FOR A PARTICULAR PURPOSE,
// MERCHANTABILITY OR NON-INFRINGEMENT.
// See the Apache 2 License for the specific language governing permissions and
// limitations under the License.

#ifndef KALDI_NNET3_NNET_TRAINING_H_
#define KALDI_NNET3_NNET_TRAINING_H_

#include "nnet3/nnet-example.h"
#include "nnet3/nnet-computation.h"
#include "nnet3/nnet-compute.h"
#include "nnet3/nnet-optimize.h"
#include "nnet3/nnet-example-utils.h"
#include "nnet3/nnet-utils.h"

namespace kaldi {
namespace nnet3 {

struct NnetTrainerOptions {
  bool zero_component_stats;
  bool store_component_stats;
  int32 print_interval;
  bool debug_computation;
  BaseFloat momentum;
  BaseFloat l2_regularize_factor;
  BaseFloat backstitch_training_scale;
  int32 backstitch_training_interval;
  BaseFloat batchnorm_stats_scale;
  std::string read_cache;
  std::string write_cache;
  bool binary_write_cache;
  BaseFloat max_param_change;
  NnetOptimizeOptions optimize_config;
  NnetComputeOptions compute_config;
  CachingOptimizingCompilerOptions compiler_config;

  NnetTrainerOptions():
      zero_component_stats(true),
      store_component_stats(true),
      print_interval(100),
      debug_computation(false),
      momentum(0.0),
      l2_regularize_factor(1.0),
      backstitch_training_scale(0.0),
      backstitch_training_interval(1),
      batchnorm_stats_scale(0.8),
      binary_write_cache(true),
      max_param_change(2.0) { }
  void Register(OptionsItf *opts) {
    opts->Register("store-component-stats", &store_component_stats,
                   "If true, store activations and derivatives for nonlinear "
                   "components during training.");
    opts->Register("zero-component-stats", &zero_component_stats,
                   "If both this and --store-component-stats are true, then "
                   "the component stats are zeroed before training.");
    opts->Register("print-interval", &print_interval, "Interval (measured in "
                   "minibatches) after which we print out the objective "
                   "function during training.");
    opts->Register("max-param-change", &max_param_change, "The maximum change "
                   "in parameters allowed per minibatch, measured in Euclidean "
                   "norm over the entire model (the change will be clipped to "
                   "this value).");
    opts->Register("momentum", &momentum, "Momentum constant to apply during "
                   "training (helps to stabilize the update), e.g. 0.9. Note: "
                   "we automatically multiply the learning rate by "
                   "(1-momentum) so that the 'effective' learning rate is the "
                   "same as before (because momentum would normally increase "
                   "the effective learning rate by 1/(1-momentum)).");
    opts->Register("l2-regularize-factor", &l2_regularize_factor, "Factor that "
                   "affects the strength of l2 regularization on model "
                   "parameters. The primary way to specify this type of "
                   "l2 regularization is via the 'l2-regularize' "
                   "configuration value at the config-file level. "
                   "--l2-regularize-factor will be multiplied by the "
                   "component-level l2-regularize values, and can be used to "
                   "correct for effects related to parallelization by model "
                   "averaging.");
    opts->Register("batchnorm-stats-scale", &batchnorm_stats_scale,
                   "Factor by which we scale down the accumulated stats of "
                   "batchnorm layers after processing each minibatch. This "
                   "ensures that the final model we write out has batchnorm "
                   "stats that are fairly fresh.");
    opts->Register("backstitch-training-scale", &backstitch_training_scale,
                   "Backstitch training factor; if 0, we do normal training. "
                   "It is referred to as '\\alpha' in our publications.");
    opts->Register("backstitch-training-interval",
                   &backstitch_training_interval,
                   "Do backstitch training with the specified interval of "
                   "minibatches. It is referred to as 'n' in our "
                   "publications.");
    opts->Register("read-cache", &read_cache, "The location from which to "
                   "read the cached computation.");
    opts->Register("write-cache", &write_cache, "The location to which to "
                   "write the cached computation.");
    opts->Register("binary-write-cache", &binary_write_cache, "Write the "
                   "computation cache in binary mode.");

    // Register the optimization options with the prefix "optimization".
    ParseOptions optimization_opts("optimization", opts);
    optimize_config.Register(&optimization_opts);
    // Register the compiler options with the prefix "compiler".
    ParseOptions compiler_opts("compiler", opts);
    compiler_config.Register(&compiler_opts);
    // Register the compute options with the prefix "computation".
    ParseOptions compute_opts("computation", opts);
    compute_config.Register(&compute_opts);
  }
};
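
// Below is a minimal sketch (not part of Kaldi itself) of how these options
// are typically hooked up in a command-line program: Register() puts each
// option on the ParseOptions object, and the nested configs appear under the
// prefixes "optimization", "compiler" and "computation".
//
//   #include "util/parse-options.h"
//   #include "nnet3/nnet-training.h"
//
//   int main(int argc, char *argv[]) {
//     using namespace kaldi;
//     using namespace kaldi::nnet3;
//     ParseOptions po("Sketch: parse nnet3 training options.");
//     NnetTrainerOptions train_config;
//     train_config.Register(&po);
//     po.Read(argc, argv);  // accepts e.g. --momentum=0.9
//                           // --max-param-change=2.0
//     return 0;
//   }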

// This struct is used in multiple nnet training classes for keeping
// track of objective function values.
// Also see struct AccuracyInfo, in nnet-diagnostics.h.
struct ObjectiveFunctionInfo {
  int32 current_phase;
  int32 minibatches_this_phase;  // The number of minibatches' worth of stats
                                 // that we accumulated in the phase numbered
                                 // 'current_phase'.
  double tot_weight;
  double tot_objf;
  double tot_aux_objf;  // An 'auxiliary' objective function that is optional;
                        // it may be used when things like regularization are
                        // being used.

  double tot_weight_this_phase;  // The stats for the current phase only.
  double tot_objf_this_phase;
  double tot_aux_objf_this_phase;

  ObjectiveFunctionInfo():
      current_phase(0),
      minibatches_this_phase(0),
      tot_weight(0.0), tot_objf(0.0), tot_aux_objf(0.0),
      tot_weight_this_phase(0.0), tot_objf_this_phase(0.0),
      tot_aux_objf_this_phase(0.0) { }

  // This function updates the stats and, if the phase has just changed,
  // prints a message indicating progress. The phase equals
  // minibatch_counter / minibatches_per_phase; its only function is to
  // control how frequently we print logging messages.
  void UpdateStats(const std::string &output_name,
                   int32 minibatches_per_phase,
                   int32 minibatch_counter,
                   BaseFloat this_minibatch_weight,
                   BaseFloat this_minibatch_tot_objf,
                   BaseFloat this_minibatch_tot_aux_objf = 0.0);

  // Prints stats for the current phase.
  // Note: 'phase' will normally be this->current_phase + 1, but may under
  // unusual circumstances (e.g. multilingual training, where not all outputs
  // are seen on all minibatches) be larger than that.
  void PrintStatsForThisPhase(const std::string &output_name,
                              int32 minibatches_per_phase,
                              int32 phase) const;
  // Prints total stats, and returns true if the total stats' weight was
  // nonzero.
  bool PrintTotalStats(const std::string &output_name) const;
};
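
// Illustrative sketch (assumed usage, mirroring how the trainer classes use
// this struct): stats are accumulated once per minibatch, and a progress
// line is logged each time the phase index advances.
//
//   ObjectiveFunctionInfo info;
//   for (int32 mb = 0; mb < num_minibatches; mb++) {
//     // this_mb_weight / this_mb_objf would come from the computation:
//     info.UpdateStats("output", 100 /* minibatches_per_phase */, mb,
//                      this_mb_weight, this_mb_objf);
//   }
//   info.PrintTotalStats("output");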


// This class is for single-threaded training of neural nets using standard
// objective functions such as cross-entropy (implemented with logsoftmax
// nonlinearity and a linear objective function) and quadratic loss.
class NnetTrainer {
 public:
  NnetTrainer(const NnetTrainerOptions &config,
              Nnet *nnet);

  // Train on one minibatch.
  void Train(const NnetExample &eg);

  // Prints out the final stats, and returns true if there was a nonzero
  // count.
  bool PrintTotalStats() const;

  ~NnetTrainer();
 private:
  // The internal function for doing one step of conventional SGD training.
  void TrainInternal(const NnetExample &eg,
                     const NnetComputation &computation);

  // The internal function for doing one step of backstitch training.
  // Depending on whether is_backstitch_step1 is true, it could be either the
  // first (backward) step or the second (forward) step of backstitch.
  void TrainInternalBackstitch(const NnetExample &eg,
                               const NnetComputation &computation,
                               bool is_backstitch_step1);

  // Computes the objective-function values for each output of the example
  // (and their derivatives, if we are training), updating objf_info_.
  void ProcessOutputs(bool is_backstitch_step2, const NnetExample &eg,
                      NnetComputer *computer);

  const NnetTrainerOptions config_;
  Nnet *nnet_;
  Nnet *delta_nnet_;  // nnet representing parameter-change for this minibatch
                      // (or, when using momentum, the moving weighted average
                      // of this).
  CachingOptimizingCompiler compiler_;

  // This code supports multiple output layers, even though in the
  // normal case there will be just one output layer named "output".
  // So we store the objective functions per output layer.
  int32 num_minibatches_processed_;

  // Stats for max-change.
  MaxChangeStats max_change_stats_;

  unordered_map<std::string, ObjectiveFunctionInfo, StringHasher> objf_info_;

  // This value is used in backstitch training when we need to ensure
  // consistent dropout masks. It's set to a value derived from rand()
  // when the class is initialized.
  int32 srand_seed_;
};
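
// Typical usage (a sketch; see nnet3bin/nnet3-train.cc for the real program):
// construct the trainer around an Nnet, feed it examples one minibatch at a
// time, and print the accumulated objective-function stats at the end.
//
//   NnetTrainerOptions config;
//   Nnet nnet;
//   ReadKaldiObject(nnet_rxfilename, &nnet);
//   NnetTrainer trainer(config, &nnet);
//   SequentialNnetExampleReader example_reader(examples_rspecifier);
//   for (; !example_reader.Done(); example_reader.Next())
//     trainer.Train(example_reader.Value());
//   bool ok = trainer.PrintTotalStats();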

// This function computes the objective function, and if supply_deriv = true,
// supplies its derivative to the NnetComputer object.
// See also the function ComputeAccuracy(), declared in nnet-diagnostics.h.
// On exit, 'tot_weight' will be set to the total weight of the training
// examples and 'tot_objf' to the total objective function; divide tot_objf
// by tot_weight to get the normalized objective function.
void ComputeObjectiveFunction(const GeneralMatrix &supervision,
                              ObjectiveType objective_type,
                              const std::string &output_name,
                              bool supply_deriv,
                              NnetComputer *computer,
                              BaseFloat *tot_weight,
                              BaseFloat *tot_objf);
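
// For orientation (a sketch of the semantics; the authoritative definitions
// are in the implementation and in the ObjectiveType documentation in
// nnet-nnet.h): with output matrix y and supervision matrix s, kLinear
// accumulates
//     tot_objf += sum_{i,j} s(i,j) * y(i,j)
// (suitable for log-probability outputs, giving a cross-entropy-style
// objective), while kQuadratic accumulates
//     tot_objf += -0.5 * sum_{i,j} (y(i,j) - s(i,j))^2.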


}  // namespace nnet3
}  // namespace kaldi

#endif  // KALDI_NNET3_NNET_TRAINING_H_