doc/nnet-compute-from-egs_8cc_source.html

 // nnet2bin/nnet-compute-from-egs.cc

 // Copyright 2012-2013  Johns Hopkins University (author:  Daniel Povey)

 // See ../../COPYING for clarification regarding multiple authors
 //
 // Licensed under the Apache License, Version 2.0 (the "License");
 // you may not use this file except in compliance with the License.
 // You may obtain a copy of the License at
 //
 //  http://www.apache.org/licenses/LICENSE-2.0
 //
 // THIS CODE IS PROVIDED *AS IS* BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY
 // KIND, EITHER EXPRESS OR IMPLIED, INCLUDING WITHOUT LIMITATION ANY IMPLIED
 // WARRANTIES OR CONDITIONS OF TITLE, FITNESS FOR A PARTICULAR PURPOSE,
 // MERCHANTABLITY OR NON-INFRINGEMENT.
 // See the Apache 2 License for the specific language governing permissions and
 // limitations under the License.

 #include "base/kaldi-common.h"
 #include "util/common-utils.h"
 #include "hmm/transition-model.h"
 #include "nnet2/train-nnet.h"
 #include "nnet2/am-nnet.h"


 int main(int argc, char *argv[]) {
   try {
     using namespace kaldi;
     using namespace kaldi::nnet2;
     typedef kaldi::int32 int32;
     typedef kaldi::int64 int64;

     const char *usage =
         "Does the neural net computation, taking as input the nnet-training examples\n"
         "(typically an archive with the extension .egs), ignoring the labels; it\n"
         "outputs as a matrix the result.  Used mostly for debugging.\n"
         "\n"
         "Usage:  nnet-compute-from-egs [options] <raw-nnet-in> <egs-rspecifier> "
         "<feature-wspecifier>\n"
         "e.g.:  nnet-compute-from-egs 'nnet-to-raw-nnet final.mdl -|' egs.10.1.ark ark:-\n";

     ParseOptions po(usage);

     po.Read(argc, argv);

     if (po.NumArgs() != 3) {
       po.PrintUsage();
       exit(1);
     }

     std::string raw_nnet_rxfilename = po.GetArg(1),
         examples_rspecifier = po.GetArg(2),
         features_or_loglikes_wspecifier = po.GetArg(3);

     Nnet nnet;
     ReadKaldiObject(raw_nnet_rxfilename, &nnet);

     int64 num_egs = 0;

     SequentialNnetExampleReader example_reader(examples_rspecifier);
     BaseFloatMatrixWriter writer(features_or_loglikes_wspecifier);

     int32 left_context = nnet.LeftContext(),
         context = nnet.LeftContext() + 1 + nnet.RightContext();

     for (; !example_reader.Done(); example_reader.Next()) {
       const NnetExample &eg = example_reader.Value();
       int32 start_offset = eg.left_context - left_context;
       int32 basic_dim = eg.input_frames.NumCols(),
           spk_dim = eg.spk_info.Dim(), dim = basic_dim + spk_dim;
       Matrix<BaseFloat> input_frames(eg.input_frames),
           input_block(context, dim);
       input_block.Range(0, context, 0, basic_dim).CopyFromMat(
           input_frames.Range(start_offset, context, 0, basic_dim));
       if (spk_dim != 0) {
         input_block.Range(0, context, basic_dim, spk_dim).CopyRowsFromVec(
             eg.spk_info);
       }
       CuMatrix<BaseFloat> gpu_input_block;
       gpu_input_block.Swap(&input_block);
       CuMatrix<BaseFloat> gpu_output_block(1, nnet.OutputDim());

       bool pad_input = false;
       NnetComputation(nnet, gpu_input_block, pad_input, &gpu_output_block);
       writer.Write("global", Matrix<BaseFloat>(gpu_output_block));
       num_egs++;
     }

     KALDI_LOG << "Processed " << num_egs << " examples.";

     return (num_egs == 0 ? 1 : 0);
   } catch(const std::exception &e) {
     std::cerr << e.what() << '\n';
     return -1;
   }
 }


kaldi::nnet2::NnetExample::input_frames
CompressedMatrix input_frames
The input data, with NumRows() >= labels.size() + left_context; it includes features to the left and ...
Definition: nnet-example.h:49

kaldi
This code computes Goodness of Pronunciation (GOP) and extracts phone-level pronunciation feature for...
Definition: chain.dox:20

kaldi::nnet2::Nnet::LeftContext
int32 LeftContext() const
Returns the left-context summed over all the Components...
Definition: nnet-nnet.cc:42

kaldi::nnet2::NnetExample
NnetExample is the input data and corresponding label (or labels) for one or more frames of input...
Definition: nnet-example.h:36

kaldi::ParseOptions::PrintUsage
void PrintUsage(bool print_command_line=false)
Prints the usage documentation [provided in the constructor].
Definition: parse-options.cc:393

kaldi::nnet2::NnetExample::left_context
int32 left_context
The number of frames of left context (we can work out the #frames of right context from input_frames...
Definition: nnet-example.h:53

kaldi::nnet2::Nnet::OutputDim
int32 OutputDim() const
The output dimension of the network – typically the number of pdfs.
Definition: nnet-nnet.cc:31

kaldi::TableWriter
A templated class for writing objects to an archive or script file; see The Table concept...
Definition: kaldi-table.h:368

kaldi::int32
kaldi::int32 int32
Definition: online-tcp-source.cc:27

common-utils.h

kaldi::Matrix< BaseFloat >

kaldi::CuMatrix
This class represents a matrix that's stored on the GPU if we have one, and in memory if not...
Definition: matrix-common.h:71

kaldi::nnet2::NnetComputation
void NnetComputation(const Nnet &nnet, const CuMatrixBase< BaseFloat > &input, bool pad_input, CuMatrixBase< BaseFloat > *output)
Does the basic neural net computation, on a sequence of data (e.g.
Definition: nnet-compute.cc:160

kaldi::TableWriter::Write
void Write(const std::string &key, const T &value) const
Definition: kaldi-table-inl.h:1511

kaldi::ReadKaldiObject
void ReadKaldiObject(const std::string &filename, Matrix< float > *m)
Definition: kaldi-io.cc:832

am-nnet.h

kaldi::ParseOptions
The class ParseOptions is for parsing command-line options; see Parsing command-line options for more...
Definition: parse-options.h:36

transition-model.h

kaldi::CuMatrix::Swap
void Swap(Matrix< Real > *mat)
Definition: cu-matrix.cc:123

kaldi::nnet2::Nnet::RightContext
int32 RightContext() const
Returns the right-context summed over all the Components...
Definition: nnet-nnet.cc:56

kaldi::SequentialTableReader
A templated class for reading objects sequentially from an archive or script file; see The Table conc...
Definition: kaldi-table.h:287

main
int main(int argc, char *argv[])
Definition: nnet-compute-from-egs.cc:27

kaldi::nnet2::Nnet
Definition: nnet-nnet.h:63

kaldi::ParseOptions::Read
int Read(int argc, const char *const *argv)
Parses the command line options and fills the ParseOptions-registered variables.
Definition: parse-options.cc:311

kaldi::SequentialTableReader::Done
bool Done()
Definition: kaldi-table-inl.h:948

kaldi::ParseOptions::GetArg
std::string GetArg(int param) const
Returns one of the positional parameters; 1-based indexing for argc/argv compatibility.
Definition: parse-options.cc:202

kaldi::SequentialTableReader::Next
void Next()
Definition: kaldi-table-inl.h:942

kaldi::ParseOptions::NumArgs
int NumArgs() const
Number of positional parameters (c.f. argc-1).
Definition: parse-options.cc:198

kaldi::SequentialTableReader::Value
T & Value()
Definition: kaldi-table-inl.h:934

kaldi::MatrixBase::Range
SubMatrix< Real > Range(const MatrixIndexT row_offset, const MatrixIndexT num_rows, const MatrixIndexT col_offset, const MatrixIndexT num_cols) const
Return a sub-part of matrix.
Definition: kaldi-matrix.h:202

kaldi::nnet2
Definition: am-nnet-test.cc:26

train-nnet.h

kaldi::CompressedMatrix::NumCols
MatrixIndexT NumCols() const
Returns number of columns (or zero for empty matrix).
Definition: compressed-matrix.h:150

KALDI_LOG
#define KALDI_LOG
Definition: kaldi-error.h:153

kaldi-common.h

kaldi::nnet2::NnetExample::spk_info
Vector< BaseFloat > spk_info
The speaker-specific input, if any, or an empty vector if we're not using this feature.
Definition: nnet-example.h:58