doc/nnet-optimize_8h_source.html

 // nnet3/nnet-optimize.h

 // Copyright      2015-2016  Johns Hopkins University (author: Daniel Povey)
 //                2015       Xiaohui Zhang

 // See ../../COPYING for clarification regarding multiple authors
 //
 // Licensed under the Apache License, Version 2.0 (the "License");
 // you may not use this file except in compliance with the License.
 // You may obtain a copy of the License at
 //
 //  http://www.apache.org/licenses/LICENSE-2.0
 //
 // THIS CODE IS PROVIDED *AS IS* BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY
 // KIND, EITHER EXPRESS OR IMPLIED, INCLUDING WITHOUT LIMITATION ANY IMPLIED
 // WARRANTIES OR CONDITIONS OF TITLE, FITNESS FOR A PARTICULAR PURPOSE,
 // MERCHANTABLITY OR NON-INFRINGEMENT.
 // See the Apache 2 License for the specific language governing permissions and
 // limitations under the License.

 #ifndef KALDI_NNET3_NNET_OPTIMIZE_H_
 #define KALDI_NNET3_NNET_OPTIMIZE_H_

 #include "nnet3/nnet-compile.h"
 #include "nnet3/nnet-analyze.h"
 #include "nnet3/nnet-optimize-utils.h"

 namespace kaldi {
 namespace nnet3 {

 // Options class for optimizing a NnetComputation.  The main projected use for
 // this is in debugging the optimization code itself, so that if an error is
 // detected, we can work out which optimization was responsible for the error
 // (most members are switches that turn one optimization off when set to
 // false).  Defaults are set in the constructor; see the Register() function
 // below for option-specific documentation.
 struct NnetOptimizeOptions {
   // Caution: if adding or removing members, the Read and Write functions and
   // the == operator should be modified.  This relates to computation caching.
   bool optimize;  // setting this to false disallows all optimization.
   bool consolidate_model_update;
   bool propagate_in_place;
   bool backprop_in_place;
   bool optimize_row_ops;
   bool split_row_ops;
   bool extend_matrices;
   bool convert_addition;
   bool remove_assignments;
   bool allow_left_merge;
   bool allow_right_merge;
   bool initialize_undefined;
   bool move_sizing_commands;
   bool allocate_from_other;
   // The defaults of the three members below are the extreme values of int32
   // (see the constructor).
   int32 min_deriv_time;
   int32 max_deriv_time;
   int32 max_deriv_time_relative;
   bool snip_row_ops;
   int32 memory_compression_level;
   // optimize_looped_computation is a 'hidden config' not available from
   // the command line; it's set to true to enable the optimization for
   // looped computation that turns a linear computation into a loop.
   bool optimize_looped_computation;

   // Sets every option to its default value: all the boolean optimizations
   // are enabled except the hidden optimize_looped_computation, and
   // memory_compression_level is 1.
   NnetOptimizeOptions():
       optimize(true),
       consolidate_model_update(true),
       propagate_in_place(true),
       backprop_in_place(true),
       optimize_row_ops(true),
       split_row_ops(true),
       extend_matrices(true),
       convert_addition(true),
       remove_assignments(true),
       allow_left_merge(true),
       allow_right_merge(true),
       initialize_undefined(true),
       move_sizing_commands(true),
       allocate_from_other(true),
       min_deriv_time(std::numeric_limits<int32>::min()),
       max_deriv_time(std::numeric_limits<int32>::max()),
       max_deriv_time_relative(std::numeric_limits<int32>::max()),
       snip_row_ops(true),
       memory_compression_level(1),
       optimize_looped_computation(false) { }

   // Registers the command-line options with 'opts', binding each option name
   // to the corresponding member of this struct.  Note that
   // optimize_looped_computation is deliberately not registered here (it is
   // the 'hidden config' described above).
   void Register(OptionsItf *opts) {
     opts->Register("optimize", &optimize, "Set this to false to turn off all "
                    "optimizations");
     opts->Register("consolidate-model-update", &consolidate_model_update,
                    "Set to false to disable optimization that consolidates "
                    "the model-update phase of backprop (e.g. for recurrent "
                    "architectures)");
     opts->Register("propagate-in-place", &propagate_in_place, "Set to false to "
                    "disable optimization that allows in-place propagation");
     opts->Register("backprop-in-place", &backprop_in_place, "Set to false to "
                    "disable optimization that allows in-place backprop");
     opts->Register("extend-matrices", &extend_matrices, "This optimization "
                    "can reduce memory requirements for TDNNs when applied "
                    "together with --convert-addition=true");
     opts->Register("optimize-row-ops", &optimize_row_ops, "Set to false to "
                    "disable certain optimizations that act on operations of "
                    "type *Row*.");
     opts->Register("split-row-ops", &split_row_ops, "Set to false to disable "
                    "an optimization that may replace some operations of type "
                    "kCopyRowsMulti or kAddRowsMulti with up to two simpler "
                    "operations.");
     opts->Register("convert-addition", &convert_addition, "Set to false to "
                    "disable the optimization that converts Add commands into "
                    "Copy commands wherever possible.");
     opts->Register("remove-assignments", &remove_assignments, "Set to false to "
                    "disable optimization that removes redundant assignments");
     opts->Register("allow-left-merge", &allow_left_merge, "Set to false to "
                    "disable left-merging of variables in remove-assignments "
                    "(obscure option)");
     opts->Register("allow-right-merge", &allow_right_merge, "Set to false to "
                    "disable right-merging of variables in remove-assignments "
                    "(obscure option)");
     opts->Register("initialize-undefined", &initialize_undefined, "Set to false "
                    "to disable optimization that avoids redundant zeroing");
     opts->Register("move-sizing-commands", &move_sizing_commands, "Set to false "
                    "to disable optimization that moves matrix allocation and "
                    "deallocation commands to conserve memory.");
     opts->Register("allocate-from-other", &allocate_from_other, "Instead of "
                    "deleting a matrix of a given size and then allocating "
                    "a matrix of the same size, allow re-use of that memory");
     opts->Register("min-deriv-time", &min_deriv_time, "You can set this to "
                    "the minimum t value that you want derivatives to be computed "
                    "at when updating the model.  This is an optimization that "
                    "saves time in the backprop phase for recurrent frameworks");
     opts->Register("max-deriv-time", &max_deriv_time, "You can set this to "
                    "the maximum t value that you want derivatives to be computed "
                    "at when updating the model.  This is an optimization that "
                    "saves time in the backprop phase for recurrent frameworks");
     opts->Register("max-deriv-time-relative", &max_deriv_time_relative,
                    "An alternative mechanism for setting the --max-deriv-time, "
                    "suitable for situations where the length of the egs is "
                    "variable.  If set, it is equivalent to setting the "
                    "--max-deriv-time to this value plus the largest 't' value "
                    "in any 'output' node of the computation request.");
     opts->Register("snip-row-ops", &snip_row_ops, "Set this to false to "
                    "disable an optimization that reduces the size of certain "
                    "per-row operations");
     opts->Register("memory-compression-level", &memory_compression_level,
                    "This is only relevant to training, not decoding.  Set this "
                    "to 0,1,2; higher levels are more aggressive at reducing "
                    "memory by compressing quantities needed for backprop, "
                    "potentially at the expense of speed and the accuracy "
                    "of derivatives.  0 means no compression at all; 1 means "
                    "compression that shouldn't affect results at all.");
   }

   // Serialization and comparison of the options; these are defined outside
   // this header and must be kept in sync with the member list (see the
   // caution at the top of the struct).
   void Read(std::istream &is, bool binary);
   void Write(std::ostream &os, bool binary) const;
   bool operator == (const NnetOptimizeOptions &other) const;
 };


 /* This utility function, used in code that calls LimitDerivativeTimes() (and
    required in code that calls Optimize()), returns the largest time
    't' in any of the 'outputs' in the computation request, or crashes if there
    are no outputs (or no cindexes in those outputs). */
 int32 MaxOutputTimeInRequest(const ComputationRequest &request);


 // This is the top-level function for optimizing a computation.
 //   config: the options that select which optimizations are applied.
 //   nnet: the neural net; presumably the one 'computation' was compiled
 //       for -- confirm against the caller.
 //   max_output_time_in_request: presumably the value returned by
 //       MaxOutputTimeInRequest() for the request being compiled (it looks
 //       like what --max-deriv-time-relative is relative to) -- TODO confirm.
 //   computation: the computation to optimize; it is passed by non-const
 //       pointer, so presumably it is modified in place.
 void Optimize(const NnetOptimizeOptions &config,
               const Nnet &nnet,
               int32 max_output_time_in_request,
               NnetComputation *computation);


 // Configuration for class CachingOptimizingCompiler: whether to attempt
 // 'shortcut' compilation, and how many computations the cache may hold.
 struct CachingOptimizingCompilerOptions {
   bool use_shortcut = true;
   int32 cache_capacity = 64;

   // The defaults are given by the member initializers above.
   CachingOptimizingCompilerOptions() { }

   // Binds the command-line options --use-shortcut and --cache-capacity to
   // the members of this struct.
   void Register(OptionsItf *opts) {
     opts->Register(
         "use-shortcut", &use_shortcut,
         "If true, use the 'shortcut' in compilation whereby computation "
         "requests with regular structure are identified as such, a "
         "computation with a smaller number of distinct values of 'n' is "
         "compiled (e.g. 2), and the compiled computation is expanded to "
         "match the size of the real computation request.");
     opts->Register(
         "cache-capacity", &cache_capacity,
         "Determines how many computations the computation-cache will store "
         "(most-recently-used).");
   }
 };

 // This class lets you do the compilation and the optimization of a
 // ComputationRequest in one call (Compile()), and it keeps compiled
 // computations in an internal cache (cache_).  The Nnet is held by reference
 // (nnet_), so presumably it has to outlive this object.
 class CachingOptimizingCompiler {
  public:
   // Constructor taking only the compiler's own (caching/shortcut) options.
   CachingOptimizingCompiler(
       const Nnet &nnet,
       const CachingOptimizingCompilerOptions config =
           CachingOptimizingCompilerOptions());

   // Constructor that additionally takes the optimization options.
   CachingOptimizingCompiler(
       const Nnet &nnet,
       const NnetOptimizeOptions &opt_config,
       const CachingOptimizingCompilerOptions config =
           CachingOptimizingCompilerOptions());

   ~CachingOptimizingCompiler();

   // Returns the computation corresponding to 'request'.
   std::shared_ptr<const NnetComputation> Compile(
       const ComputationRequest &request);

   // Read / write the computation cache from / to a stream.
   void ReadCache(std::istream &is, bool binary);
   void WriteCache(std::ostream &os, bool binary);

   // Calling GetSimpleNnetContext() is equivalent to calling
   //   ComputeSimpleNnetContext(nnet_, &nnet_left_context,
   //                            &nnet_right_context)
   // except that the result is cached inside this class.  It has nothing to
   // do with the rest of this class's functionality; this class is simply a
   // convenient home for the mechanism.
   void GetSimpleNnetContext(int32 *nnet_left_context,
                             int32 *nnet_right_context);

  private:
   // Does the actual work of Compile().  It is a separate function for the
   // convenience of the timer code, so that the timer is not invoked twice
   // (this function is also called directly from inside the class).
   std::shared_ptr<const NnetComputation> CompileInternal(
       const ComputationRequest &request);

   // Called from CompileInternal() once it has been established that
   // 'request' has not already been cached.  Apart from assuming that nothing
   // is cached for this request yet, its interface is the same as that of
   // CompileInternal().  It compiles the computation and takes care of
   // caching it.
   std::shared_ptr<const NnetComputation> CompileAndCache(
       const ComputationRequest &request);

   // Called from CompileInternal(); attempts 'shortcut' compilation of
   // 'request'.  On success it returns a pointer to a newly allocated
   // computation compiled that way (note: this computation will not yet have
   // been placed in the computation cache).  If shortcut compilation is not
   // possible (e.g. it is disabled in the config, or the request was not
   // decomposable because of too few n values or irregular or unexpected
   // structure), it returns NULL and you should compile via
   // CompileNoShortcut().
   const NnetComputation *CompileViaShortcut(
       const ComputationRequest &request);

   // Called from CompileInternal(); compiles 'request' via the regular (not
   // shortcut) compilation process and returns a pointer to the newly
   // allocated computation (note: this computation will not yet have been
   // placed in the computation cache).
   const NnetComputation *CompileNoShortcut(
       const ComputationRequest &request);

   const Nnet &nnet_;
   CachingOptimizingCompilerOptions config_;
   NnetOptimizeOptions opt_config_;

   // Time, in seconds, spent in the various phases of compilation; used for
   // diagnostic messages.
   double seconds_taken_total_;
   double seconds_taken_compile_;
   double seconds_taken_optimize_;
   double seconds_taken_expand_;
   double seconds_taken_check_;
   double seconds_taken_indexes_;
   double seconds_taken_io_;

   ComputationCache cache_;

   // The two variables below are used only by GetSimpleNnetContext().
   int32 nnet_left_context_;
   int32 nnet_right_context_;
 };


 // NOTE(review): presumably restricts the times at which derivatives are
 // computed in 'computation', using the min_deriv_time, max_deriv_time and
 // max_deriv_time_relative members of 'opts' together with the output times in
 // 'request' -- confirm against the definition, which is not in this header.
 void LimitDerivativeTimes(const Nnet &nnet,
                           const ComputationRequest &request,
                           const NnetOptimizeOptions &opts,
                           NnetComputation *computation);

 // This optimization consolidates the model-update part of backprop commands
 // (per the --consolidate-model-update option text, e.g. for recurrent
 // architectures).
 void ConsolidateModelUpdate(const Nnet &nnet,
                             NnetComputation *computation);

 // This converts addition operations (things with Add in their names) to copy
 // operations; per the --convert-addition option text, this is done wherever
 // possible.
 void ConvertAdditionToAssignment(const Nnet &nnet,
                                  NnetComputation *computation);


 // This wraps class VariableMergingOptimizer in a simplified interface.
 void VariableMergingOptimization(const NnetOptimizeOptions &config,
                                  const Nnet &nnet,
                                  NnetComputation *computation);


 // This optimization function removes, where possible, commands of type
 // kSetConst.
 void RemoveUnnecessaryZeroing(const Nnet &nnet, NnetComputation *computation);


 // This optimization moves commands that allocate and zero matrices to as late
 // as possible, and moves commands that deallocate matrices to as early as
 // possible.
 void MoveSizingCommands(const Nnet &nnet, NnetComputation *computation);

 // This optimization detects cases where we deallocate a matrix, and then
 // later allocate another matrix; per the --allocate-from-other option text,
 // when the two have the same size it allows re-use of that memory.
 void RemoveUnnecessaryAllocation(const Nnet &nnet,
                                  NnetComputation *computation);


 // This optimization repositions the input operations (kAcceptInput) and
 // output operations (kProvideOutput) within the computation.
 // NOTE(review): where exactly they are moved to is not visible from this
 // header -- confirm against the definition.
 void ConsolidateIoOperations(const Nnet &nnet,
                              NnetComputation *computation);


 } // namespace nnet3
 } // namespace kaldi


 #endif
kaldi::nnet3::CachingOptimizingCompiler::seconds_taken_check_
double seconds_taken_check_
Definition: nnet-optimize.h:298

kaldi
This code computes Goodness of Pronunciation (GOP) and extracts phone-level pronunciation feature for...
Definition: chain.dox:20

kaldi::nnet3::NnetOptimizeOptions::allocate_from_other
bool allocate_from_other
Definition: nnet-optimize.h:51

kaldi::nnet3::NnetOptimizeOptions::Register
void Register(OptionsItf *opts)
Definition: nnet-optimize.h:84

kaldi::nnet3::NnetOptimizeOptions::allow_right_merge
bool allow_right_merge
Definition: nnet-optimize.h:48

kaldi::nnet3::NnetOptimizeOptions::optimize_row_ops
bool optimize_row_ops
Definition: nnet-optimize.h:42

kaldi::nnet3::CachingOptimizingCompilerOptions::CachingOptimizingCompilerOptions
CachingOptimizingCompilerOptions()
Definition: nnet-optimize.h:196

kaldi::nnet3::NnetOptimizeOptions::Read
void Read(std::istream &is, bool binary)
Definition: nnet-optimize.cc:30

kaldi::nnet3::NnetOptimizeOptions::max_deriv_time_relative
int32 max_deriv_time_relative
Definition: nnet-optimize.h:54

kaldi::nnet3::ConsolidateIoOperations
void ConsolidateIoOperations(const Nnet &nnet, NnetComputation *computation)
This optimization puts the input operations (kAcceptInput) and output operations (kProvideOutput) at ...
Definition: nnet-optimize.cc:869

kaldi::nnet3::CachingOptimizingCompiler::cache_
ComputationCache cache_
Definition: nnet-optimize.h:302

kaldi::nnet3::NnetOptimizeOptions::Write
void Write(std::ostream &os, bool binary) const
Definition: nnet-optimize.cc:85

kaldi::Compile
ArpaLmCompiler * Compile(bool seps, const std::string &infile)
Definition: arpa-lm-compiler-test.cc:75

kaldi::nnet3::NnetOptimizeOptions::move_sizing_commands
bool move_sizing_commands
Definition: nnet-optimize.h:50

kaldi::nnet3::CachingOptimizingCompiler
This class enables you to do the compilation and optimization in one call, and also ensures that if t...
Definition: nnet-optimize.h:219

kaldi::nnet3::NnetOptimizeOptions::remove_assignments
bool remove_assignments
Definition: nnet-optimize.h:46

kaldi::nnet3::CachingOptimizingCompilerOptions::Register
void Register(OptionsItf *opts)
Definition: nnet-optimize.h:200

kaldi::nnet3::VariableMergingOptimization
void VariableMergingOptimization(const NnetOptimizeOptions &config, const Nnet &nnet, NnetComputation *computation)
This wraps class VariableMergingOptimizer in a simplified interface.
Definition: nnet-optimize.cc:417

nnet-analyze.h
This file contains utilities for analyzing and checking computations, which are used in the optimizat...

kaldi::nnet3::ConvertAdditionToAssignment
void ConvertAdditionToAssignment(const Nnet &nnet, NnetComputation *computation)
This converts addition operations (things with Add in their names) to copy operations (things with Co...
Definition: nnet-optimize.cc:430

kaldi::int32
kaldi::int32 int32
Definition: online-tcp-source.cc:27

kaldi::nnet3::CachingOptimizingCompiler::nnet_
const Nnet & nnet_
Definition: nnet-optimize.h:288

kaldi::nnet3::NnetOptimizeOptions::min_deriv_time
int32 min_deriv_time
Definition: nnet-optimize.h:52

kaldi::nnet3::LimitDerivativeTimes
void LimitDerivativeTimes(const Nnet &nnet, int32 min_deriv_time, int32 max_deriv_time, NnetComputation *computation)
Definition: nnet-optimize-utils.cc:2215

kaldi::OptionsItf::Register
virtual void Register(const std::string &name, bool *ptr, const std::string &doc)=0

kaldi::nnet3::CachingOptimizingCompilerOptions
Definition: nnet-optimize.h:192

kaldi::nnet3::NnetOptimizeOptions::optimize_looped_computation
bool optimize_looped_computation
Definition: nnet-optimize.h:60

kaldi::nnet3::NnetOptimizeOptions::snip_row_ops
bool snip_row_ops
Definition: nnet-optimize.h:55

kaldi::nnet3::NnetOptimizeOptions::split_row_ops
bool split_row_ops
Definition: nnet-optimize.h:43

kaldi::nnet3::MoveSizingCommands
void MoveSizingCommands(const Nnet &nnet, NnetComputation *computation)
This optimization moves commands that allocate and zero matrices to as late as possible, and moves commands that deallocate matrices to as early as possible.
Definition: nnet-optimize.cc:152

kaldi::nnet3::NnetOptimizeOptions::optimize
bool optimize
Definition: nnet-optimize.h:38

kaldi::nnet3::CachingOptimizingCompiler::seconds_taken_expand_
double seconds_taken_expand_
Definition: nnet-optimize.h:297

kaldi::nnet3::NnetOptimizeOptions::consolidate_model_update
bool consolidate_model_update
Definition: nnet-optimize.h:39

kaldi::nnet3::NnetOptimizeOptions::NnetOptimizeOptions
NnetOptimizeOptions()
Definition: nnet-optimize.h:62

kaldi::nnet3::ComputationRequest
Definition: nnet-computation.h:114

kaldi::nnet3::NnetOptimizeOptions::operator==
bool operator==(const NnetOptimizeOptions &other) const
Definition: nnet-optimize.cc:128

kaldi::nnet3::CachingOptimizingCompilerOptions::cache_capacity
int32 cache_capacity
Definition: nnet-optimize.h:194

kaldi::nnet3::CachingOptimizingCompiler::seconds_taken_io_
double seconds_taken_io_
Definition: nnet-optimize.h:300

kaldi::nnet3::CachingOptimizingCompiler::seconds_taken_total_
double seconds_taken_total_
Definition: nnet-optimize.h:294

kaldi::nnet3::MaxOutputTimeInRequest
int32 MaxOutputTimeInRequest(const ComputationRequest &request)
Definition: nnet-optimize.cc:484

kaldi::nnet3::RemoveUnnecessaryAllocation
void RemoveUnnecessaryAllocation(const Nnet &nnet, NnetComputation *computation)
This optimization detects cases where we deallocate a matrix, and then later allocate another matrix ...
Definition: nnet-optimize.cc:355

kaldi::nnet3::RemoveUnnecessaryZeroing
void RemoveUnnecessaryZeroing(const Nnet &nnet, NnetComputation *computation)
This optimization function removes, where possible, commands of type kSetConst.
Definition: nnet-optimize.cc:262

kaldi::nnet3::NnetOptimizeOptions::convert_addition
bool convert_addition
Definition: nnet-optimize.h:45

kaldi::nnet3::NnetOptimizeOptions::propagate_in_place
bool propagate_in_place
Definition: nnet-optimize.h:40

kaldi::nnet3::NnetOptimizeOptions
Definition: nnet-optimize.h:35

kaldi::nnet3::Nnet
Definition: nnet-nnet.h:115

kaldi::nnet3::NnetOptimizeOptions::memory_compression_level
int32 memory_compression_level
Definition: nnet-optimize.h:56

nnet-compile.h

kaldi::nnet3::CachingOptimizingCompiler::seconds_taken_compile_
double seconds_taken_compile_
Definition: nnet-optimize.h:295

kaldi::OptionsItf
Definition: options-itf.h:26

kaldi::nnet3::CachingOptimizingCompiler::seconds_taken_optimize_
double seconds_taken_optimize_
Definition: nnet-optimize.h:296

kaldi::nnet3::Optimize
void Optimize(const NnetOptimizeOptions &config, const Nnet &nnet, int32 max_output_time_in_request, NnetComputation *computation)
This is the top-level function for optimizing a computation.
Definition: nnet-optimize.cc:501

kaldi::nnet3::NnetOptimizeOptions::extend_matrices
bool extend_matrices
Definition: nnet-optimize.h:44

kaldi::nnet3::ConsolidateModelUpdate
void ConsolidateModelUpdate(const Nnet &nnet, NnetComputation *computation)
This optimization consolidates the model-update part of backprop commands, for components in (e...
Definition: nnet-optimize-utils.cc:1551

kaldi::nnet3::CachingOptimizingCompilerOptions::use_shortcut
bool use_shortcut
Definition: nnet-optimize.h:193

kaldi::nnet3::CachingOptimizingCompiler::nnet_left_context_
int32 nnet_left_context_
Definition: nnet-optimize.h:305

kaldi::nnet3::NnetComputation
Definition: nnet-computation.h:303

kaldi::nnet3::NnetOptimizeOptions::allow_left_merge
bool allow_left_merge
Definition: nnet-optimize.h:47

kaldi::nnet3::CachingOptimizingCompiler::nnet_right_context_
int32 nnet_right_context_
Definition: nnet-optimize.h:306

kaldi::nnet3::NnetOptimizeOptions::backprop_in_place
bool backprop_in_place
Definition: nnet-optimize.h:41

kaldi::nnet3::NnetOptimizeOptions::max_deriv_time
int32 max_deriv_time
Definition: nnet-optimize.h:53

nnet-optimize-utils.h

kaldi::nnet3::CachingOptimizingCompiler::seconds_taken_indexes_
double seconds_taken_indexes_
Definition: nnet-optimize.h:299

kaldi::nnet3::CachingOptimizingCompiler::opt_config_
NnetOptimizeOptions opt_config_
Definition: nnet-optimize.h:290

kaldi::nnet3::ComputationCache
Class ComputationCache is used inside class CachingOptimizingCompiler to cache previously computed co...
Definition: nnet-optimize-utils.h:625

kaldi::nnet3::NnetOptimizeOptions::initialize_undefined
bool initialize_undefined
Definition: nnet-optimize.h:49

kaldi::nnet3::CachingOptimizingCompiler::config_
CachingOptimizingCompilerOptions config_
Definition: nnet-optimize.h:289