doc/nnet3-discriminative-compute-from-egs_8cc_source.html

 // nnet3bin/nnet3-discriminative-compute-from-egs.cc

 // Copyright 2015  Johns Hopkins University (author: Daniel Povey)

 // See ../../COPYING for clarification regarding multiple authors
 //
 // Licensed under the Apache License, Version 2.0 (the "License");
 // you may not use this file except in compliance with the License.
 // You may obtain a copy of the License at
 //
 //  http://www.apache.org/licenses/LICENSE-2.0
 //
 // THIS CODE IS PROVIDED *AS IS* BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY
 // KIND, EITHER EXPRESS OR IMPLIED, INCLUDING WITHOUT LIMITATION ANY IMPLIED
 // WARRANTIES OR CONDITIONS OF TITLE, FITNESS FOR A PARTICULAR PURPOSE,
 // MERCHANTABLITY OR NON-INFRINGEMENT.
 // See the Apache 2 License for the specific language governing permissions and
 // limitations under the License.

 #include <memory>

 #include "base/kaldi-common.h"
 #include "util/common-utils.h"
 #include "hmm/transition-model.h"
 #include "nnet3/nnet-nnet.h"
 #include "nnet3/nnet-example-utils.h"
 #include "nnet3/nnet-discriminative-example.h"
 #include "nnet3/nnet-optimize.h"


 namespace kaldi {
 namespace nnet3 {

 class NnetComputerFromEg {
  public:
   NnetComputerFromEg(const Nnet &nnet):
       nnet_(nnet), compiler_(nnet) { }

   // Compute the output (which will have the same number of rows as the number
   // of Indexes in the output of the eg), and put it in "output".
   void Compute(const NnetExample &eg, Matrix<BaseFloat> *output) {
     ComputationRequest request;
     bool need_backprop = false, store_stats = false;
     GetComputationRequest(nnet_, eg, need_backprop, store_stats, &request);
     const NnetComputation &computation = *(compiler_.Compile(request));
     NnetComputeOptions options;
     if (GetVerboseLevel() >= 3)
       options.debug = true;
     NnetComputer computer(options, computation, nnet_, NULL);
     computer.AcceptInputs(nnet_, eg.io);
     computer.Run();
     const CuMatrixBase<BaseFloat> &nnet_output = computer.GetOutput("output");
     output->Resize(nnet_output.NumRows(), nnet_output.NumCols());
     nnet_output.CopyToMat(output);
   }
  private:
   const Nnet &nnet_;
   CachingOptimizingCompiler compiler_;

 };

 }
 }

 int main(int argc, char *argv[]) {
   try {
     using namespace kaldi;
     using namespace kaldi::nnet3;
     typedef kaldi::int32 int32;
     typedef kaldi::int64 int64;

     const char *usage =
         "Read input nnet discriminative training examples, and compute the "
         "output for each one. This program is similar to "
         "nnet3-compute-from-egs, but works with discriminative egs. \n"
         "If --apply-exp=true, apply the Exp() function to the output before writing\n"
         "it out.\n"
         "Note: This program uses only the input; it does not do forward-backward\n"
         "over the lattice. See nnet3-discriminative-compute-objf for that.\n"
         "\n"
         "Usage:  nnet3-discriminative-compute-from-egs [options] <raw-nnet-in> <training-examples-in> <matrices-out>\n"
         "e.g.:\n"
         "nnet3-discriminative-compute-from-egs --apply-exp=true 0.raw ark:1.degs ark:- | matrix-sum-rows ark:- ... \n"
         "See also: nnet3-compute nnet3-compute-from-egs\n";

     bool binary_write = true,
         apply_exp = false;
     std::string use_gpu = "yes";

     ParseOptions po(usage);
     po.Register("binary", &binary_write, "Write output in binary mode");
     po.Register("apply-exp", &apply_exp, "If true, apply exp function to "
                 "output");
     po.Register("use-gpu", &use_gpu,
                 "yes|no|optional|wait, only has effect if compiled with CUDA");

     po.Read(argc, argv);

     if (po.NumArgs() != 3) {
       po.PrintUsage();
       exit(1);
     }

 #if HAVE_CUDA==1
     CuDevice::Instantiate().SelectGpuId(use_gpu);
 #endif

     std::string nnet_rxfilename = po.GetArg(1),
         examples_rspecifier = po.GetArg(2),
         matrix_wspecifier = po.GetArg(3);

     Nnet nnet;
     ReadKaldiObject(nnet_rxfilename, &nnet);

     NnetComputerFromEg computer(nnet);

     int64 num_egs = 0;

     SequentialNnetDiscriminativeExampleReader example_reader(examples_rspecifier);
     BaseFloatMatrixWriter matrix_writer(matrix_wspecifier);

     for (; !example_reader.Done(); example_reader.Next(), num_egs++) {
       Matrix<BaseFloat> output;
       NnetExample eg;
       NnetDiscriminativeExample disc_eg = example_reader.Value();
       eg.io.swap(disc_eg.inputs);

       for (int32 i = 0; i < disc_eg.outputs.size(); i++) {
         NnetIo io;
         io.name = disc_eg.outputs[i].name;
         io.indexes = disc_eg.outputs[i].indexes;
         eg.io.push_back(io);
       }

       computer.Compute(eg, &output);
       KALDI_ASSERT(output.NumRows() != 0);
       if (apply_exp)
         output.ApplyExp();
       matrix_writer.Write(example_reader.Key(), output);
     }
 #if HAVE_CUDA==1
     CuDevice::Instantiate().PrintProfile();
 #endif
     KALDI_LOG << "Processed " << num_egs << " examples.";
     return 0;
   } catch(const std::exception &e) {
     std::cerr << e.what() << '\n';
     return -1;
   }
 }
kaldi::nnet3::NnetExample
NnetExample is the input data and corresponding label (or labels) for one or more frames of input...
Definition: nnet-example.h:111

kaldi
This code computes Goodness of Pronunciation (GOP) and extracts phone-level pronunciation feature for...
Definition: chain.dox:20

kaldi::nnet3::NnetIo
Definition: nnet-example.h:33

kaldi::nnet3::NnetComputerFromEg::nnet_
const Nnet & nnet_
Definition: nnet3-compute-from-egs.cc:58

nnet-nnet.h

kaldi::CuMatrixBase::CopyToMat
void CopyToMat(MatrixBase< OtherReal > *dst, MatrixTransposeType trans=kNoTrans) const
Definition: cu-matrix.cc:447

kaldi::nnet3::NnetComputerFromEg::compiler_
CachingOptimizingCompiler compiler_
Definition: nnet3-compute-from-egs.cc:59

main
int main(int argc, char *argv[])
Definition: nnet3-discriminative-compute-from-egs.cc:63

kaldi::ParseOptions::PrintUsage
void PrintUsage(bool print_command_line=false)
Prints the usage documentation [provided in the constructor].
Definition: parse-options.cc:393

kaldi::SequentialTableReader::Key
std::string Key()
Definition: kaldi-table-inl.h:918

kaldi::GetVerboseLevel
int32 GetVerboseLevel()
Get verbosity level, usually set via command line '--verbose=' switch.
Definition: kaldi-error.h:60

kaldi::nnet3::CachingOptimizingCompiler
This class enables you to do the compilation and optimization in one call, and also ensures that if t...
Definition: nnet-optimize.h:219

kaldi::nnet3::NnetComputeOptions::debug
bool debug
Definition: nnet-compute.h:40

kaldi::TableWriter
A templated class for writing objects to an archive or script file; see The Table concept...
Definition: kaldi-table.h:368

kaldi::int32
kaldi::int32 int32
Definition: online-tcp-source.cc:27

common-utils.h

kaldi::Matrix< BaseFloat >

kaldi::nnet3::NnetIo::indexes
std::vector< Index > indexes
"indexes" is a vector the same length as features.NumRows(), explaining the meaning of each row of th...
Definition: nnet-example.h:42

kaldi::nnet3::NnetComputerFromEg::Compute
void Compute(const NnetExample &eg, Matrix< BaseFloat > *output)
Definition: nnet3-discriminative-compute-from-egs.cc:39

kaldi::TableWriter::Write
void Write(const std::string &key, const T &value) const
Definition: kaldi-table-inl.h:1511

kaldi::nnet3
Definition: dnn3_code_compilation.dox:22

kaldi::ParseOptions::Register
void Register(const std::string &name, bool *ptr, const std::string &doc)
Definition: parse-options.cc:56

kaldi::nnet3::NnetComputeOptions
Definition: nnet-compute.h:39

kaldi::ReadKaldiObject
void ReadKaldiObject(const std::string &filename, Matrix< float > *m)
Definition: kaldi-io.cc:832

nnet-optimize.h

kaldi::nnet3::ComputationRequest
Definition: nnet-computation.h:114

kaldi::ParseOptions
The class ParseOptions is for parsing command-line options; see Parsing command-line options for more...
Definition: parse-options.h:36

transition-model.h

kaldi::nnet3::NnetComputer::AcceptInputs
void AcceptInputs(const Nnet &nnet, const std::vector< NnetIo > &io)
This convenience function calls AcceptInput() in turn on all the inputs in the training example...
Definition: nnet-compute.cc:663

kaldi::nnet3::Nnet
Definition: nnet-nnet.h:115

kaldi::SequentialTableReader
A templated class for reading objects sequentially from an archive or script file; see The Table conc...
Definition: kaldi-table.h:287

nnet-example-utils.h

kaldi::ParseOptions::Read
int Read(int argc, const char *const *argv)
Parses the command line options and fills the ParseOptions-registered variables.
Definition: parse-options.cc:311

kaldi::SequentialTableReader::Done
bool Done()
Definition: kaldi-table-inl.h:948

kaldi::ParseOptions::GetArg
std::string GetArg(int param) const
Returns one of the positional parameters; 1-based indexing for argc/argv compatibility.
Definition: parse-options.cc:202

kaldi::SequentialTableReader::Next
void Next()
Definition: kaldi-table-inl.h:942

kaldi::nnet3::NnetComputerFromEg::NnetComputerFromEg
NnetComputerFromEg(const Nnet &nnet)
Definition: nnet3-discriminative-compute-from-egs.cc:34

kaldi::MatrixBase::ApplyExp
void ApplyExp()
Definition: kaldi-matrix.h:362

rnnlm::i
int i
Definition: mikolov-rnnlm-lib.cc:66

kaldi::nnet3::CachingOptimizingCompiler::Compile
std::shared_ptr< const NnetComputation > Compile(const ComputationRequest &request)
Does the compilation and returns a const pointer to the result, which is owned by this class...
Definition: nnet-optimize.cc:716

kaldi::ParseOptions::NumArgs
int NumArgs() const
Number of positional parameters (c.f. argc-1).
Definition: parse-options.cc:198

kaldi::CuMatrixBase
Matrix for CUDA computing.
Definition: matrix-common.h:69

nnet-discriminative-example.h

kaldi::CuMatrixBase::NumCols
MatrixIndexT NumCols() const
Definition: cu-matrix.h:216

kaldi::nnet3::NnetComputer
class NnetComputer is responsible for executing the computation described in the "computation" object...
Definition: nnet-compute.h:59

kaldi::SequentialTableReader::Value
T & Value()
Definition: kaldi-table-inl.h:934

kaldi::nnet3::NnetComputation
Definition: nnet-computation.h:303

KALDI_ASSERT
#define KALDI_ASSERT(cond)
Definition: kaldi-error.h:185

kaldi::MatrixBase::NumRows
MatrixIndexT NumRows() const
Returns number of rows (or zero for empty matrix).
Definition: kaldi-matrix.h:64

kaldi::nnet3::NnetDiscriminativeExample::inputs
std::vector< NnetIo > inputs
'inputs' contains the input to the network -- normally it has just one element called "input"...
Definition: nnet-discriminative-example.h:108

kaldi::nnet3::NnetDiscriminativeExample::outputs
std::vector< NnetDiscriminativeSupervision > outputs
'outputs' contains the sequence output supervision.
Definition: nnet-discriminative-example.h:112

kaldi::Matrix::Resize
void Resize(const MatrixIndexT r, const MatrixIndexT c, MatrixResizeType resize_type=kSetZero, MatrixStrideType stride_type=kDefaultStride)
Sets matrix to a specified size (zero is OK as long as both r and c are zero).
Definition: kaldi-matrix.cc:819

kaldi::nnet3::NnetIo::name
std::string name
the name of the input in the neural net; in simple setups it will just be "input".
Definition: nnet-example.h:36

kaldi::CuMatrixBase::NumRows
MatrixIndexT NumRows() const
Dimensions.
Definition: cu-matrix.h:215

kaldi::nnet3::NnetExample::io
std::vector< NnetIo > io
"io" contains the input and output.
Definition: nnet-example.h:116

KALDI_LOG
#define KALDI_LOG
Definition: kaldi-error.h:153

kaldi-common.h

kaldi::nnet3::NnetDiscriminativeExample
NnetDiscriminativeExample is like NnetExample, but specialized for sequence training.
Definition: nnet-discriminative-example.h:103

kaldi::nnet3::GetComputationRequest
void GetComputationRequest(const Nnet &nnet, const NnetExample &eg, bool need_model_derivative, bool store_component_stats, ComputationRequest *request)
This function takes a NnetExample (which should already have been frame-selected, if desired...
Definition: nnet-example-utils.cc:202