nnet3-show-progress.cc
Go to the documentation of this file.
1 // nnet3bin/nnet3-show-progress.cc
2 
3 // Copyright 2015 Johns Hopkins University (author: Daniel Povey)
4 // 2015 Xingyu Na
5 
6 // See ../../COPYING for clarification regarding multiple authors
7 //
8 // Licensed under the Apache License, Version 2.0 (the "License");
9 // you may not use this file except in compliance with the License.
10 // You may obtain a copy of the License at
11 //
12 // http://www.apache.org/licenses/LICENSE-2.0
13 //
14 // THIS CODE IS PROVIDED *AS IS* BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY
15 // KIND, EITHER EXPRESS OR IMPLIED, INCLUDING WITHOUT LIMITATION ANY IMPLIED
16 // WARRANTIES OR CONDITIONS OF TITLE, FITNESS FOR A PARTICULAR PURPOSE,
17 // MERCHANTABILITY OR NON-INFRINGEMENT.
18 // See the Apache 2 License for the specific language governing permissions and
19 // limitations under the License.
20 
21 #include "base/kaldi-common.h"
22 #include "util/common-utils.h"
23 #include "hmm/transition-model.h"
24 #include "nnet3/nnet-utils.h"
25 #include "nnet3/nnet-diagnostics.h"
26 
27 int main(int argc, char *argv[]) {
28  try {
29  using namespace kaldi;
30  using namespace kaldi::nnet3;
31  typedef kaldi::int32 int32;
32  typedef kaldi::int64 int64;
33 
34  const char *usage =
35  "Given an old and a new 'raw' nnet3 network and some training examples\n"
36  "(possibly held-out), show the average objective function given the\n"
37  "mean of the two networks, and the breakdown by component of why this\n"
38  "happened (computed from derivative information). Also shows parameter\n"
39  "differences per layer. If training examples not provided, only shows\n"
40  "parameter differences per layer.\n"
41  "\n"
42  "Usage: nnet3-show-progress [options] <old-net-in> <new-net-in>"
43  " [<training-examples-in>]\n"
44  "e.g.: nnet3-show-progress 1.nnet 2.nnet ark:valid.egs\n";
45 
46  ParseOptions po(usage);
47 
48  int32 num_segments = 1;
49  std::string use_gpu = "no";
50  NnetComputeProbOptions compute_prob_opts;
51  compute_prob_opts.compute_deriv = true;
52 
53  po.Register("num-segments", &num_segments,
54  "Number of line segments used for computing derivatives");
55  po.Register("use-gpu", &use_gpu,
56  "yes|no|optional|wait, only has effect if compiled with CUDA");
57  compute_prob_opts.Register(&po);
58 
59  po.Read(argc, argv);
60 
61  if (po.NumArgs() < 2 || po.NumArgs() > 3) {
62  po.PrintUsage();
63  exit(1);
64  }
65 
66 #if HAVE_CUDA==1
67  CuDevice::Instantiate().SelectGpuId(use_gpu);
68 #endif
69 
70  std::string nnet1_rxfilename = po.GetArg(1),
71  nnet2_rxfilename = po.GetArg(2),
72  examples_rspecifier = po.GetOptArg(3);
73 
74  Nnet nnet1, nnet2;
75  ReadKaldiObject(nnet1_rxfilename, &nnet1);
76  ReadKaldiObject(nnet2_rxfilename, &nnet2);
77 
78  if (NumParameters(nnet1) != NumParameters(nnet2)) {
79  KALDI_WARN << "Parameter-dim mismatch, cannot show progress.";
80  exit(0);
81  }
82 
83  if (!examples_rspecifier.empty() && IsSimpleNnet(nnet1)) {
84  std::vector<NnetExample> examples;
85  SequentialNnetExampleReader example_reader(examples_rspecifier);
86  for (; !example_reader.Done(); example_reader.Next())
87  examples.push_back(example_reader.Value());
88 
89  int32 num_examples = examples.size();
90 
91  if (num_examples == 0)
92  KALDI_ERR << "No examples read.";
93 
94  int32 num_updatable = NumUpdatableComponents(nnet1);
95  Vector<BaseFloat> diff(num_updatable);
96 
97  for (int32 s = 0; s < num_segments; s++) {
98  // start and end segments of the line between 0 and 1
99  BaseFloat start = (s + 0.0) / num_segments,
100  end = (s + 1.0) / num_segments, middle = 0.5 * (start + end);
101  Nnet interp_nnet(nnet2);
102  ScaleNnet(middle, &interp_nnet);
103  AddNnet(nnet1, 1.0 - middle, &interp_nnet);
104 
105  NnetComputeProb prob_computer(compute_prob_opts, interp_nnet);
106  std::vector<NnetExample>::const_iterator eg_iter = examples.begin(),
107  eg_end = examples.end();
108  for (; eg_iter != eg_end; ++eg_iter)
109  prob_computer.Compute(*eg_iter);
110  const SimpleObjectiveInfo *objf_info = prob_computer.GetObjective("output");
111  double objf_per_frame = objf_info->tot_objective / objf_info->tot_weight;
112 
113  prob_computer.PrintTotalStats();
114  const Nnet &nnet_gradient = prob_computer.GetDeriv();
115  KALDI_LOG << "At position " << middle
116  << ", objf per frame is " << objf_per_frame;
117 
118  Vector<BaseFloat> old_dotprod(num_updatable), new_dotprod(num_updatable);
119  ComponentDotProducts(nnet_gradient, nnet1, &old_dotprod);
120  ComponentDotProducts(nnet_gradient, nnet2, &new_dotprod);
121  old_dotprod.Scale(1.0 / objf_info->tot_weight);
122  new_dotprod.Scale(1.0 / objf_info->tot_weight);
123  diff.AddVec(1.0/ num_segments, new_dotprod);
124  diff.AddVec(-1.0 / num_segments, old_dotprod);
125  KALDI_VLOG(1) << "By segment " << s << ", objf change is "
126  << PrintVectorPerUpdatableComponent(nnet1, diff);
127  }
128  KALDI_LOG << "Total objf change per component is "
129  << PrintVectorPerUpdatableComponent(nnet1, diff);
130  }
131 
132  { // Get info about magnitude of parameter change.
133  Nnet diff_nnet(nnet1);
134  AddNnet(nnet2, -1.0, &diff_nnet);
135  if (GetVerboseLevel() >= 1) {
136  KALDI_VLOG(1) << "Printing info for the difference between the neural nets: "
137  << diff_nnet.Info();
138  }
139  int32 num_updatable = NumUpdatableComponents(diff_nnet);
140  Vector<BaseFloat> dot_prod(num_updatable);
141  ComponentDotProducts(diff_nnet, diff_nnet, &dot_prod);
142  dot_prod.ApplyPow(0.5); // take sqrt to get l2 norm of diff
143  KALDI_LOG << "Parameter differences per layer are "
144  << PrintVectorPerUpdatableComponent(nnet1, dot_prod);
145 
146  Vector<BaseFloat> baseline_prod(num_updatable),
147  new_prod(num_updatable);
148  ComponentDotProducts(nnet1, nnet1, &baseline_prod);
149  ComponentDotProducts(nnet2, nnet2, &new_prod);
150  baseline_prod.ApplyPow(0.5);
151  new_prod.ApplyPow(0.5);
152 
153  KALDI_LOG << "Norms of parameter matrices from <new-nnet-in> are "
154  << PrintVectorPerUpdatableComponent(nnet2, new_prod);
155 
156  dot_prod.DivElements(baseline_prod);
157  KALDI_LOG << "Relative parameter differences per layer are "
158  << PrintVectorPerUpdatableComponent(nnet1, dot_prod);
159  }
160 #if HAVE_CUDA==1
161  CuDevice::Instantiate().PrintProfile();
162 #endif
163  return 0;
164  } catch(const std::exception &e) {
165  std::cerr << e.what() << '\n';
166  return -1;
167  }
168 }
This code computes Goodness of Pronunciation (GOP) and extracts phone-level pronunciation feature for...
Definition: chain.dox:20
void ScaleNnet(BaseFloat scale, Nnet *nnet)
Scales the nnet parameters and stats by this scale.
Definition: nnet-utils.cc:312
const Nnet & GetDeriv() const
std::string PrintVectorPerUpdatableComponent(const Nnet &nnet, const VectorBase< BaseFloat > &vec)
This function is for printing, to a string, a vector with one element per updatable component of the ...
Definition: nnet-utils.cc:231
void ComponentDotProducts(const Nnet &nnet1, const Nnet &nnet2, VectorBase< BaseFloat > *dot_prod)
Returns dot products between two networks of the same structure (calls the DotProduct functions of th...
Definition: nnet-utils.cc:211
void PrintUsage(bool print_command_line=false)
Prints the usage documentation [provided in the constructor].
int32 GetVerboseLevel()
Get verbosity level, usually set via command line '--verbose=' switch.
Definition: kaldi-error.h:60
void Compute(const NnetExample &eg)
kaldi::int32 int32
This class is for computing cross-entropy and accuracy values in a neural network, for diagnostics.
void Register(const std::string &name, bool *ptr, const std::string &doc)
void ReadKaldiObject(const std::string &filename, Matrix< float > *m)
Definition: kaldi-io.cc:832
This file contains some miscellaneous functions dealing with class Nnet.
std::string Info() const
returns some human-readable information about the network, mostly for debugging purposes.
Definition: nnet-nnet.cc:821
float BaseFloat
Definition: kaldi-types.h:29
int32 NumParameters(const Nnet &src)
Returns the total of the number of parameters in the updatable components of the nnet.
Definition: nnet-utils.cc:359
The class ParseOptions is for parsing command-line options; see Parsing command-line options for more...
Definition: parse-options.h:36
A templated class for reading objects sequentially from an archive or script file; see The Table conc...
Definition: kaldi-table.h:287
int Read(int argc, const char *const *argv)
Parses the command line options and fills the ParseOptions-registered variables.
#define KALDI_ERR
Definition: kaldi-error.h:147
#define KALDI_WARN
Definition: kaldi-error.h:150
std::string GetArg(int param) const
Returns one of the positional parameters; 1-based indexing for argc/argv compatibility.
void Scale(Real alpha)
Multiplies all elements by this constant.
const SimpleObjectiveInfo * GetObjective(const std::string &output_name) const
int NumArgs() const
Number of positional parameters (c.f. argc-1).
bool IsSimpleNnet(const Nnet &nnet)
This function returns true if the nnet has the following properties: It has an output called "output"...
Definition: nnet-utils.cc:52
A class representing a vector.
Definition: kaldi-vector.h:406
void ApplyPow(Real power)
Take all elements of vector to a power.
Definition: kaldi-vector.h:179
#define KALDI_VLOG(v)
Definition: kaldi-error.h:156
void DivElements(const VectorBase< Real > &v)
Divide element-by-element by a vector.
#define KALDI_LOG
Definition: kaldi-error.h:153
void AddVec(const Real alpha, const VectorBase< OtherReal > &v)
Add vector : *this = *this + alpha * rv (with casting between floats and doubles) ...
int32 NumUpdatableComponents(const Nnet &dest)
Returns the number of updatable components in the nnet.
Definition: nnet-utils.cc:422
std::string GetOptArg(int param) const
void AddNnet(const Nnet &src, BaseFloat alpha, Nnet *dest)
Does *dest += alpha * src (affects nnet parameters and stored stats).
Definition: nnet-utils.cc:349
int main(int argc, char *argv[])