doc/nnet-compare-hash-discriminative_8cc_source.html

 // nnet2bin/nnet-compare-hash-discriminative.cc

 // Copyright 2012-2013  Johns Hopkins University (author:  Daniel Povey)

 // See ../../COPYING for clarification regarding multiple authors
 //
 // Licensed under the Apache License, Version 2.0 (the "License");
 // you may not use this file except in compliance with the License.
 // You may obtain a copy of the License at
 //
 //  http://www.apache.org/licenses/LICENSE-2.0
 //
 // THIS CODE IS PROVIDED *AS IS* BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY
 // KIND, EITHER EXPRESS OR IMPLIED, INCLUDING WITHOUT LIMITATION ANY IMPLIED
 // WARRANTIES OR CONDITIONS OF TITLE, FITNESS FOR A PARTICULAR PURPOSE,
 // MERCHANTABLITY OR NON-INFRINGEMENT.
 // See the Apache 2 License for the specific language governing permissions and
 // limitations under the License.

 #include "base/kaldi-common.h"
 #include "util/common-utils.h"
 #include "hmm/transition-model.h"
 #include "nnet2/nnet-example-functions.h"

 // Entry point of nnet-compare-hash-discriminative.
 //
 // Reads a transition model and two archives of discriminative training
 // examples, accumulates a hash matrix (plus a few diagnostic totals) over each
 // archive with UpdateHash(), logs the results, and asserts that the two hashes
 // agree to within the relative --threshold.
 //
 // Returns 0 when the comparison completes, -1 if a std::exception is caught.
 // Exits with status 1 (after printing usage) unless exactly three positional
 // arguments are given.
 int main(int argc, char *argv[]) {
   try {
     using namespace kaldi;
     using namespace kaldi::nnet2;
     typedef kaldi::int64 int64;

     const char *usage =
         "Compares two archives of discriminative training examples and checks\n"
         "that they behave the same way for purposes of discriminative training.\n"
         "This program was created as a way of testing nnet-get-egs-discriminative\n"
         "The model is only needed for its transition-model.\n"
         "\n"
         "Usage:  nnet-compare-hash-discriminative [options] <model-rxfilename> "
         "<egs-rspecifier1> <egs-rspecifier2>\n"
         "\n"
         "Note: options --drop-frames and --criterion should be matched with the\n"
         "command line of nnet-get-egs-discriminative used to get the examples\n"
         "e.g.: nnet-compare-hash-discriminative --drop-frames=true "
         "--criterion=mmi final.mdl ark:1.degs ark:2.degs\n";

     // Defaults for the command-line options registered below.
     std::string criterion = "smbr";
     bool drop_frames = false;
     bool one_silence_class = false;
     BaseFloat threshold = 0.002;
     BaseFloat acoustic_scale = 1.0, lm_scale = 1.0;
     ParseOptions po(usage);

     po.Register("acoustic-scale", &acoustic_scale,
                 "Scaling factor for acoustic likelihoods");
     po.Register("lm-scale", &lm_scale,
                 "Scaling factor for \"graph costs\" (including LM costs)");
     po.Register("criterion", &criterion, "Training criterion, 'mmi'|'mpfe'|'smbr'");
     po.Register("drop-frames", &drop_frames, "If true, for MMI training, drop "
                 "frames where num and den do not intersect.");
     po.Register("one-silence-class", &one_silence_class, "If true, newer "
                  "behavior which will tend to reduce insertions.");
     po.Register("threshold", &threshold, "Threshold for equality testing "
                 "(relative)");

     po.Read(argc, argv);

     // Exactly three positional arguments are required: model, egs1, egs2.
     if (po.NumArgs() != 3) {
       po.PrintUsage();
       exit(1);
     }

     std::string model_rxfilename = po.GetArg(1),
         examples_rspecifier1 = po.GetArg(2),
         examples_rspecifier2 = po.GetArg(3);

     int64 num_done1 = 0, num_done2 = 0;

     // Only the transition model is read from the model file.
     TransitionModel tmodel;
     ReadKaldiObject(model_rxfilename, &tmodel);

     // One hash matrix per archive; both are filled in by UpdateHash().
     Matrix<double> hash1, hash2;

     // some additional diagnostics:
     double num_weight1 = 0.0, den_weight1 = 0.0, tot_t1 = 0.0;
     double num_weight2 = 0.0, den_weight2 = 0.0, tot_t2 = 0.0;

     // Both readers are constructed up front, before either archive is
     // processed.
     SequentialDiscriminativeNnetExampleReader
         example_reader1(examples_rspecifier1),
         example_reader2(examples_rspecifier2);

     KALDI_LOG << "Computing first hash function";
     for (; !example_reader1.Done(); example_reader1.Next(), num_done1++) {
       // Work on a copy of the example, since its denominator lattice is
       // scaled in place before hashing.
       DiscriminativeNnetExample eg = example_reader1.Value();
       fst::ScaleLattice(fst::LatticeScale(lm_scale, acoustic_scale),
                         &(eg.den_lat));
       UpdateHash(tmodel, eg, criterion, drop_frames,
                  one_silence_class, &hash1,
                  &num_weight1, &den_weight1, &tot_t1);
     }
     KALDI_LOG << "Processed " << num_done1 << " examples.";

     // Identical processing for the second archive; keep the two loops in sync.
     KALDI_LOG << "Computing second hash function";
     for (; !example_reader2.Done(); example_reader2.Next(), num_done2++) {
       DiscriminativeNnetExample eg = example_reader2.Value();
       fst::ScaleLattice(fst::LatticeScale(lm_scale, acoustic_scale),
                         &(eg.den_lat));
       UpdateHash(tmodel, eg, criterion, drop_frames,
                  one_silence_class, &hash2,
                  &num_weight2, &den_weight2, &tot_t2);
     }
     KALDI_LOG << "Processed " << num_done2 << " examples.";

     // Self- and cross-products of the two hashes (presumably tr(A B^T), i.e.
     // the element-wise inner product -- confirm against TraceMatMat's docs).
     // If all three agree, the two hash matrices are (approximately) equal.
     double prod1 = TraceMatMat(hash1, hash1, kTrans),
         prod2 = TraceMatMat(hash2, hash2, kTrans),
         cross_prod = TraceMatMat(hash1, hash2, kTrans);

     KALDI_LOG << "Products are as follows (should be the same): prod1 = "
               << prod1 << ", prod2 = " << prod2 << ", cross_prod = "
               << cross_prod;

     KALDI_LOG << "Num-weight1 = " << num_weight1 << ", den-weight1 = "
               << den_weight1 << ", tot_t1 = " << tot_t1;
     KALDI_LOG << "Num-weight2 = " << num_weight2 << ", den-weight2 = "
               << den_weight2 << ", tot_t2 = " << tot_t2;

     // NOTE(review): the pass/fail verdict relies on KALDI_ASSERT; if that
     // macro is compiled out (e.g. under NDEBUG) these checks would be
     // skipped and the program would always return 0 -- confirm.
     KALDI_ASSERT(ApproxEqual(prod1, prod2, threshold) &&
                  ApproxEqual(prod2, cross_prod, threshold));
     // Reject the degenerate case of a zero hash, for which the equality
     // checks above would pass trivially.
     KALDI_ASSERT(prod1 > 0.0);

     return 0;
   } catch(const std::exception &e) {
     std::cerr << e.what() << '\n';
     return -1;
   }
 }


kaldi
This code computes Goodness of Pronunciation (GOP) and extracts phone-level pronunciation feature for...
Definition: chain.dox:20

kaldi::ParseOptions::PrintUsage
void PrintUsage(bool print_command_line=false)
Prints the usage documentation [provided in the constructor].
Definition: parse-options.cc:393

main
int main(int argc, char *argv[])
Definition: nnet-compare-hash-discriminative.cc:25

kaldi::nnet2::UpdateHash
void UpdateHash(const TransitionModel &tmodel, const DiscriminativeNnetExample &eg, std::string criterion, bool drop_frames, bool one_silence_class, Matrix< double > *hash, double *num_weight, double *den_weight, double *tot_t)
This function is used in code that tests the functionality that we provide here, about splitting and ...
Definition: nnet-example-functions.cc:786

kaldi::int32
kaldi::int32 int32
Definition: online-tcp-source.cc:27

common-utils.h

kaldi::Matrix< double >

kaldi::ParseOptions::Register
void Register(const std::string &name, bool *ptr, const std::string &doc)
Definition: parse-options.cc:56

kaldi::TransitionModel
Definition: transition-model.h:123

kaldi::ReadKaldiObject
void ReadKaldiObject(const std::string &filename, Matrix< float > *m)
Definition: kaldi-io.cc:832

kaldi::kTrans
Definition: matrix-common.h:33

kaldi::BaseFloat
float BaseFloat
Definition: kaldi-types.h:29

kaldi::ParseOptions
The class ParseOptions is for parsing command-line options; see Parsing command-line options for more...
Definition: parse-options.h:36

transition-model.h

fst::ScaleLattice
void ScaleLattice(const std::vector< std::vector< ScaleFloat > > &scale, MutableFst< ArcTpl< Weight > > *fst)
Scales the pairs of weights in LatticeWeight or CompactLatticeWeight by viewing the pair (a...
Definition: lattice-utils-inl.h:197

kaldi::SequentialTableReader
A templated class for reading objects sequentially from an archive or script file; see The Table conc...
Definition: kaldi-table.h:287

fst::LatticeScale
std::vector< std::vector< double > > LatticeScale(double lmwt, double acwt)
Definition: lattice-utils.h:156

kaldi::ParseOptions::Read
int Read(int argc, const char *const *argv)
Parses the command line options and fills the ParseOptions-registered variables.
Definition: parse-options.cc:311

kaldi::SequentialTableReader::Done
bool Done()
Definition: kaldi-table-inl.h:948

kaldi::nnet2::DiscriminativeNnetExample::den_lat
CompactLattice den_lat
The denominator lattice.
Definition: nnet-example.h:148

kaldi::ParseOptions::GetArg
std::string GetArg(int param) const
Returns one of the positional parameters; 1-based indexing for argc/argv compatibility.
Definition: parse-options.cc:202

kaldi::SequentialTableReader::Next
void Next()
Definition: kaldi-table-inl.h:942

kaldi::TraceMatMat
Real TraceMatMat(const MatrixBase< Real > &A, const MatrixBase< Real > &B, MatrixTransposeType trans)
We need to declare this here as it will be a friend function.
Definition: kaldi-matrix.cc:2692

kaldi::ParseOptions::NumArgs
int NumArgs() const
Number of positional parameters (c.f. argc-1).
Definition: parse-options.cc:198

kaldi::nnet2::DiscriminativeNnetExample
This struct is used to store the information we need for discriminative training (MMI or MPE)...
Definition: nnet-example.h:136

kaldi::SequentialTableReader::Value
T & Value()
Definition: kaldi-table-inl.h:934

KALDI_ASSERT
#define KALDI_ASSERT(cond)
Definition: kaldi-error.h:185

kaldi::nnet2
Definition: am-nnet-test.cc:26

KALDI_LOG
#define KALDI_LOG
Definition: kaldi-error.h:153

kaldi-common.h

nnet-example-functions.h
Note on how to parse this filename: it contains functions related to neural-net training examples...

kaldi::ApproxEqual
static bool ApproxEqual(float a, float b, float relative_tolerance=0.001)
return abs(a - b) <= relative_tolerance * (abs(a)+abs(b)).
Definition: kaldi-math.h:265