// nnet3/nnet-optimize-test.cc

// Copyright 2015  Johns Hopkins University (author: Daniel Povey)

// See ../../COPYING for clarification regarding multiple authors
//
// Licensed under the Apache License, Version 2.0 (the "License");
// you may not use this file except in compliance with the License.
// You may obtain a copy of the License at
//
//  http://www.apache.org/licenses/LICENSE-2.0
//
// THIS CODE IS PROVIDED *AS IS* BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY
// KIND, EITHER EXPRESS OR IMPLIED, INCLUDING WITHOUT LIMITATION ANY IMPLIED
// WARRANTIES OR CONDITIONS OF TITLE, FITNESS FOR A PARTICULAR PURPOSE,
// MERCHANTABILITY OR NON-INFRINGEMENT.
// See the Apache 2 License for the specific language governing permissions and
// limitations under the License.
#include "nnet3/nnet-nnet.h"
#include "nnet3/nnet-compile.h"
#include "nnet3/nnet-analyze.h"
#include "nnet3/nnet-test-utils.h"
#include "nnet3/nnet-optimize.h"
#include "nnet3/nnet-compute.h"

namespace kaldi {
namespace nnet3 {

// Run the test without optimizations and with optimizations specified by the
// configs (the optimized version is done with class CachingOptimizingCompiler).
// Only print warnings; we'll fail the whole test later.
static bool UnitTestNnetOptimizeWithOptions(
    int32 srand_seed,
    NnetOptimizeOptions opt_config,
    CachingOptimizingCompilerOptions compiler_config) {

  // opt_config.convert_addition = false;
  // opt_config.remove_assignments = false;
  // opt_config.move_sizing_commands = false;
  // opt_config.allocate_from_other = false;

  srand(srand_seed);  // so that we can compare between different optimization
                      // types, with the randomly generated network staying
                      // the same.

  struct NnetGenerationOptions gen_config;

  std::vector<std::string> configs;
  GenerateConfigSequence(gen_config, &configs);
  Nnet nnet;
  for (size_t j = 0; j < configs.size(); j++) {
    KALDI_LOG << "Input config[" << j << "] is: " << configs[j];
    std::istringstream is(configs[j]);
    nnet.ReadConfig(is);
  }

  ComputationRequest request;
  std::vector<Matrix<BaseFloat> > inputs;
  ComputeExampleComputationRequestSimple(nnet, &request, &inputs);
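  // At this point 'request' describes the inputs and outputs the computation
  // must support (and whether derivatives are needed), and 'inputs' holds
  // randomly generated matrices matching the request's input specifications.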

  NnetComputation computation;
  Compiler compiler(request, nnet);

  CompilerOptions opts;
  compiler.CreateComputation(opts, &computation);
  {
    std::ostringstream os;
    computation.Print(os, nnet);
    KALDI_LOG << "Generated computation with no optimization or shortcut is: "
              << os.str();
  }
  CheckComputationOptions check_config;
  // we can do the rewrite check since it's before optimization.
  check_config.check_rewrite = true;
  ComputationChecker checker(check_config, nnet, computation);
  checker.Check();
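  // The checker validates the un-optimized computation (e.g. that variables
  // are written before they are read); it will throw via KALDI_ERR if the
  // computation is malformed.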

  CachingOptimizingCompiler opt_compiler(nnet, opt_config, compiler_config);

  const NnetComputation &computation_opt = *opt_compiler.Compile(request);
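  // Compile() runs the optimizations enabled in opt_config and caches the
  // resulting computation internally, keyed on the request, so the reference
  // obtained here stays valid for the lifetime of opt_compiler.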

  {
    std::ostringstream os;
    computation_opt.Print(os, nnet);
    KALDI_LOG << "Optimized computation is: " << os.str();
  }

  NnetComputeOptions compute_opts;
  if (RandInt(0, 1) == 0)
    compute_opts.debug = true;

  computation.ComputeCudaIndexes();
  // computation_opt has already had this function called.

  Nnet nnet_to_update(nnet);  // copy of the nnet that we update... needed to
                              // test the consolidation of backprop commands,
                              // otherwise the optimized and non-optimized
                              // computations differ.
  ScaleNnet(0.0, &nnet_to_update);
  // with natural gradient, the consolidation would affect the final model
  // params -> test just the gradient.
  SetNnetAsGradient(&nnet_to_update);

  NnetComputer computer(compute_opts,
                        computation,
                        nnet,
                        &nnet_to_update);

  Nnet nnet_opt(nnet);  // copy of the nnet for the optimized computation.
                        // necessary in case backprop changes parameters.
  Nnet nnet_opt_to_update(nnet_opt);
  ScaleNnet(0.0, &nnet_opt_to_update);
  SetNnetAsGradient(&nnet_opt_to_update);

  // NnetComputer for the optimized version of the computation.
  NnetComputer computer_opt(compute_opts,
                            computation_opt,
                            nnet_opt,
                            &nnet_opt_to_update);

  // provide the input to the computations.
  for (size_t i = 0; i < request.inputs.size(); i++) {
    CuMatrix<BaseFloat> temp(inputs[i]);
    KALDI_LOG << "Input sum is " << temp.Sum();
    computer.AcceptInput(request.inputs[i].name, &temp);
    CuMatrix<BaseFloat> temp2(inputs[i]);
    computer_opt.AcceptInput(request.inputs[i].name, &temp2);
  }

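  // Seed the RNG and reset any random-generator components (e.g. dropout)
  // before each forward pass, so that stochastic components behave
  // identically in the optimized and non-optimized computations.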
  KALDI_LOG << "Running non-optimized forward computation";
  srand(srand_seed);
  ResetGenerators(&nnet);
  computer.Run();
  KALDI_LOG << "Running optimized forward computation";
  srand(srand_seed);
  ResetGenerators(&nnet_opt);
  computer_opt.Run();

  const CuMatrixBase<BaseFloat> &output(computer.GetOutput("output"));
  KALDI_LOG << "Output sum (not optimized) is " << output.Sum();
  const CuMatrixBase<BaseFloat> &output_opt(computer_opt.GetOutput("output"));
  KALDI_LOG << "Output sum (optimized) is " << output_opt.Sum();
  if (!ApproxEqual(output, output_opt)) {
    KALDI_WARN << "Non-optimized and optimized versions of the computation give "
               << "different outputs: " << output << " vs. " << output_opt;
    return false;
  }

  CuMatrix<BaseFloat> output_deriv(output.NumRows(), output.NumCols());
  output_deriv.SetRandn();
  CuMatrix<BaseFloat> output_deriv_opt(output_deriv);

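  // If the request asked for a derivative at the output, feed the same random
  // derivative to both computers and run the backward pass; the resulting
  // input-derivatives and parameter-derivatives should then match.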
  if (request.outputs[0].has_deriv) {
    computer.AcceptInput("output", &output_deriv);
    computer_opt.AcceptInput("output", &output_deriv_opt);

    KALDI_LOG << "Running non-optimized backward computation";
    computer.Run();
    KALDI_LOG << "Running optimized backward computation";
    computer_opt.Run();
    for (size_t i = 0; i < request.inputs.size(); i++) {
      if (request.inputs[i].has_deriv) {
        const CuMatrixBase<BaseFloat> &in_deriv =
            computer.GetOutput(request.inputs[i].name);
        const CuMatrixBase<BaseFloat> &in_deriv_opt =
            computer_opt.GetOutput(request.inputs[i].name);
        KALDI_LOG << "Input-deriv sum for input '" << request.inputs[i].name
                  << "' (non-optimized) is " << in_deriv.Sum();
        KALDI_LOG << "Input-deriv sum for input '" << request.inputs[i].name
                  << "' (optimized) is " << in_deriv_opt.Sum();
        if (!ApproxEqual(in_deriv, in_deriv_opt)) {
          KALDI_WARN << "Non-optimized and optimized versions of the "
                     << "computation give different input-derivs.";
          return false;
        }
      }
    }
  }

  if (!NnetParametersAreIdentical(nnet_to_update,
                                  nnet_opt_to_update, 1.0e-05)) {
    KALDI_WARN << "Neural networks differ after training, between "
               << "optimized and non-optimized computation.";
    return false;
  } else {
    return true;
  }
}


// This test runs the computation with and without optimization, and checks
// that the outputs are the same.
static void UnitTestNnetOptimizeInternal(int32 srand_seed) {
  NnetOptimizeOptions optimize_all;
  CachingOptimizingCompilerOptions compiler_all;

  // randomly sometimes set min_deriv and max_deriv to small/large values,
  // which will cause some of the LimitDerivativeTimes() code to be called
  // (without really changing anything).
  if (RandInt(0, 3) == 0) optimize_all.min_deriv_time = -200;
  if (RandInt(0, 3) == 0) optimize_all.max_deriv_time = 1000;

  // this is useful for debugging as it removes nans:
  // optimize_all.initialize_undefined = false;
  bool success = UnitTestNnetOptimizeWithOptions(srand_seed, optimize_all,
                                                 compiler_all);
  if (success)
    return;

  // Test failed with full optimization.  Retry with the various
  // optimizations switched off, one at a time.
  NnetOptimizeOptions optimize = optimize_all;
  CachingOptimizingCompilerOptions compiler = compiler_all;
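  // Each block below switches off a single optimization, re-runs the test
  // with the same seed, and then restores the default options; the per-option
  // results are summarized in the KALDI_ERR message at the end.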

  compiler.use_shortcut = false;
  bool succ_no_shortcut =
      UnitTestNnetOptimizeWithOptions(srand_seed, optimize, compiler);
  compiler = compiler_all;

  optimize.propagate_in_place = false;
  bool succ_no_propagate_in_place =
      UnitTestNnetOptimizeWithOptions(srand_seed, optimize, compiler);
  optimize = optimize_all;

  optimize.backprop_in_place = false;
  bool succ_no_backprop_in_place =
      UnitTestNnetOptimizeWithOptions(srand_seed, optimize, compiler);
  optimize = optimize_all;

  optimize.optimize_row_ops = false;
  bool succ_no_row_ops =
      UnitTestNnetOptimizeWithOptions(srand_seed, optimize, compiler);
  optimize = optimize_all;

  optimize.convert_addition = false;
  bool succ_no_convert_addition =
      UnitTestNnetOptimizeWithOptions(srand_seed, optimize, compiler);
  optimize = optimize_all;

  optimize.remove_assignments = false;
  bool succ_no_remove_assignments =
      UnitTestNnetOptimizeWithOptions(srand_seed, optimize, compiler);
  optimize = optimize_all;

  optimize.initialize_undefined = false;
  bool succ_no_initialize_undefined =
      UnitTestNnetOptimizeWithOptions(srand_seed, optimize, compiler);
  optimize = optimize_all;

  optimize.allocate_from_other = false;
  bool succ_no_allocate_from_other =
      UnitTestNnetOptimizeWithOptions(srand_seed, optimize, compiler);
  optimize = optimize_all;

  optimize.move_sizing_commands = false;
  bool succ_no_move_sizing_commands =
      UnitTestNnetOptimizeWithOptions(srand_seed, optimize, compiler);
  optimize = optimize_all;

  optimize.snip_row_ops = false;
  bool succ_no_snip_row_ops =
      UnitTestNnetOptimizeWithOptions(srand_seed, optimize, compiler);
  optimize = optimize_all;

  optimize.min_deriv_time = std::numeric_limits<int32>::min();
  optimize.max_deriv_time = std::numeric_limits<int32>::max();
  optimize.max_deriv_time_relative = std::numeric_limits<int32>::max();
  bool succ_no_deriv_time =
      UnitTestNnetOptimizeWithOptions(srand_seed, optimize, compiler);
  optimize = optimize_all;

#define KALDI_SUCCFAIL(b) ((b) ? "SUCCESS" : "FAILURE")
  KALDI_ERR
      << "Test failed with all optimizations enabled.  Retried test with the "
      << "following optimizations turned off:"
      << "\n  use_shortcut         ... " << KALDI_SUCCFAIL(succ_no_shortcut)
      << "\n  propagate_in_place   ... " << KALDI_SUCCFAIL(succ_no_propagate_in_place)
      << "\n  backprop_in_place    ... " << KALDI_SUCCFAIL(succ_no_backprop_in_place)
      << "\n  optimize_row_ops     ... " << KALDI_SUCCFAIL(succ_no_row_ops)
      << "\n  convert_addition     ... " << KALDI_SUCCFAIL(succ_no_convert_addition)
      << "\n  remove_assignments   ... " << KALDI_SUCCFAIL(succ_no_remove_assignments)
      << "\n  initialize_undefined ... " << KALDI_SUCCFAIL(succ_no_initialize_undefined)
      << "\n  allocate_from_other  ... " << KALDI_SUCCFAIL(succ_no_allocate_from_other)
      << "\n  move_sizing_commands ... " << KALDI_SUCCFAIL(succ_no_move_sizing_commands)
      << "\n  snip_row_ops         ... " << KALDI_SUCCFAIL(succ_no_snip_row_ops)
      << "\n  no_deriv_time        ... " << KALDI_SUCCFAIL(succ_no_deriv_time);
#undef KALDI_SUCCFAIL
}

static void UnitTestNnetOptimize() {
  for (int32 srand_seed = 0; srand_seed < 40; srand_seed++) {
    KALDI_LOG << "About to run UnitTestNnetOptimizeInternal with srand_seed = "
              << srand_seed;
    UnitTestNnetOptimizeInternal(srand_seed);
  }
}

} // namespace nnet3
} // namespace kaldi

int main() {
  using namespace kaldi;
  using namespace kaldi::nnet3;
  SetVerboseLevel(3);
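  // Verbose level 3 makes the nnet3 code log extra detail about compilation
  // and optimization, which helps in diagnosing test failures.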

#if HAVE_CUDA == 1
  CuDevice::Instantiate().SetDebugStrideMode(true);
  // Run the test first on CPU, then on GPU.
  CuDevice::Instantiate().SelectGpuId("no");
  UnitTestNnetOptimize();
  CuDevice::Instantiate().SelectGpuId("yes");
#endif
  UnitTestNnetOptimize();

  KALDI_LOG << "Nnet tests succeeded.";

  return 0;
}