doc/nnet-train-mpe-sequential_8cc_source.html

 // nnetbin/nnet-train-mpe-sequential.cc

 // Copyright 2011-2016  Brno University of Technology (author: Karel Vesely);
 //                      Arnab Ghoshal

 // See ../../COPYING for clarification regarding multiple authors
 //
 // Licensed under the Apache License, Version 2.0 (the "License");
 // you may not use this file except in compliance with the License.
 // You may obtain a copy of the License at
 //
 //  http://www.apache.org/licenses/LICENSE-2.0
 //
 // THIS CODE IS PROVIDED *AS IS* BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY
 // KIND, EITHER EXPRESS OR IMPLIED, INCLUDING WITHOUT LIMITATION ANY IMPLIED
 // WARRANTIES OR CONDITIONS OF TITLE, FITNESS FOR A PARTICULAR PURPOSE,
 // MERCHANTABLITY OR NON-INFRINGEMENT.
 // See the Apache 2 License for the specific language governing permissions and
 // limitations under the License.


 #include "base/kaldi-common.h"
 #include "util/common-utils.h"
 #include "tree/context-dep.h"
 #include "hmm/transition-model.h"
 #include "fstext/fstext-lib.h"
 #include "decoder/faster-decoder.h"
 #include "decoder/decodable-matrix.h"
 #include "lat/kaldi-lattice.h"
 #include "lat/lattice-functions.h"

 #include "nnet/nnet-trnopts.h"
 #include "nnet/nnet-component.h"
 #include "nnet/nnet-activation.h"
 #include "nnet/nnet-nnet.h"
 #include "nnet/nnet-pdf-prior.h"
 #include "nnet/nnet-utils.h"
 #include "base/timer.h"
 #include "cudamatrix/cu-device.h"


 namespace kaldi {
 namespace nnet1 {

 void LatticeAcousticRescore(const Matrix<BaseFloat> &log_like,
                             const TransitionModel &trans_model,
                             const std::vector<int32> &state_times,
                             Lattice *lat) {
   kaldi::uint64 props = lat->Properties(fst::kFstProperties, false);
   if (!(props & fst::kTopSorted))
     KALDI_ERR << "Input lattice must be topologically sorted.";

   KALDI_ASSERT(!state_times.empty());
   std::vector<std::vector<int32> > time_to_state(log_like.NumRows());
   for (size_t i = 0; i < state_times.size(); i++) {
     KALDI_ASSERT(state_times[i] >= 0);
     if (state_times[i] < log_like.NumRows())  // end state may be past this..
       time_to_state[state_times[i]].push_back(i);
     else
       KALDI_ASSERT(state_times[i] == log_like.NumRows()
                    && "There appears to be lattice/feature mismatch.");
   }

   for (int32 t = 0; t < log_like.NumRows(); t++) {
     for (size_t i = 0; i < time_to_state[t].size(); i++) {
       int32 state = time_to_state[t][i];
       for (fst::MutableArcIterator<Lattice> aiter(lat, state); !aiter.Done();
            aiter.Next()) {
         LatticeArc arc = aiter.Value();
         int32 trans_id = arc.ilabel;
         if (trans_id != 0) {  // Non-epsilon input label on arc
           int32 pdf_id = trans_model.TransitionIdToPdf(trans_id);
           arc.weight.SetValue2(-log_like(t, pdf_id) + arc.weight.Value2());
           aiter.SetValue(arc);
         }
       }
     }
   }
 }

 }  // namespace nnet1
 }  // namespace kaldi


 int main(int argc, char *argv[]) {
   using namespace kaldi;
   using namespace kaldi::nnet1;
   typedef kaldi::int32 int32;
   try {
     const char *usage =
       "Perform one iteration of MPE/sMBR training using SGD with per-utterance"
       "updates.\n"

       "Usage:  nnet-train-mpe-sequential [options] "
       "<model-in> <transition-model-in> <feature-rspecifier> "
       "<den-lat-rspecifier> <ali-rspecifier> [<model-out>]\n"

       "e.g.: nnet-train-mpe-sequential nnet.init trans.mdl scp:feats.scp "
       "scp:denlats.scp ark:ali.ark nnet.iter1\n";

     ParseOptions po(usage);

     NnetTrainOptions trn_opts;
     trn_opts.learn_rate = 0.00001;  // changing default,
     trn_opts.Register(&po);

     bool binary = true;
     po.Register("binary", &binary, "Write output in binary mode");

     std::string feature_transform;
     po.Register("feature-transform", &feature_transform,
                 "Feature transform in 'nnet1' format");

     std::string silence_phones_str;
     po.Register("silence-phones", &silence_phones_str,
         "Colon-separated list of integer id's of silence phones, e.g. 46:47");

     PdfPriorOptions prior_opts;
     prior_opts.Register(&po);

     BaseFloat acoustic_scale = 1.0,
         lm_scale = 1.0,
         old_acoustic_scale = 0.0;

     po.Register("acoustic-scale", &acoustic_scale,
         "Scaling factor for acoustic likelihoods");

     po.Register("lm-scale", &lm_scale,
         "Scaling factor for \"graph costs\" (including LM costs)");

     po.Register("old-acoustic-scale", &old_acoustic_scale,
         "Add in the scores in the input lattices with this scale, rather "
         "than discarding them.");

     bool one_silence_class = false;
     po.Register("one-silence-class", &one_silence_class,
         "If true, the newer behavior reduces insertions.");

     kaldi::int32 max_frames = 6000;
     po.Register("max-frames", &max_frames,
         "Maximum number of frames an utterance can have (skipped if longer)");

     bool do_smbr = false;
     po.Register("do-smbr", &do_smbr,
         "Use state-level accuracies instead of phone accuracies.");

     std::string use_gpu="yes";
     po.Register("use-gpu", &use_gpu,
         "yes|no|optional, only has effect if compiled with CUDA");

     po.Read(argc, argv);

     if (po.NumArgs() != 6) {
       po.PrintUsage();
       exit(1);
     }

     std::string model_filename = po.GetArg(1),
         transition_model_filename = po.GetArg(2),
         feature_rspecifier = po.GetArg(3),
         den_lat_rspecifier = po.GetArg(4),
         ref_ali_rspecifier = po.GetArg(5),
         target_model_filename = po.GetArg(6);

     std::vector<int32> silence_phones;
     if (!kaldi::SplitStringToIntegers(silence_phones_str, ":", false,
                                       &silence_phones)) {
       KALDI_ERR << "Invalid silence-phones string " << silence_phones_str;
     }
     kaldi::SortAndUniq(&silence_phones);
     if (silence_phones.empty()) {
       KALDI_LOG << "No silence phones specified.";
     }

 #if HAVE_CUDA == 1
     CuDevice::Instantiate().SelectGpuId(use_gpu);
 #endif

     Nnet nnet_transf;
     if (feature_transform != "") {
       nnet_transf.Read(feature_transform);
     }

     Nnet nnet;
     nnet.Read(model_filename);
     // we will use pre-softmax activations, removing softmax,
     // - pre-softmax activations are equivalent to 'log-posterior + C_frame',
     // - all paths crossing a frame share same 'C_frame',
     // - with GMM, we also have the unnormalized acoustic likelihoods,
     if (nnet.GetLastComponent().GetType() ==
         kaldi::nnet1::Component::kSoftmax) {
       KALDI_LOG << "Removing softmax from the nnet " << model_filename;
       nnet.RemoveLastComponent();
     } else {
       KALDI_LOG << "The nnet was without softmax. "
                 << "The last component in " << model_filename << " was "
                 << Component::TypeToMarker(nnet.GetLastComponent().GetType());
     }
     nnet.SetTrainOptions(trn_opts);

     // Read the class-frame-counts, compute priors,
     PdfPrior log_prior(prior_opts);

     // Read transition model,
     TransitionModel trans_model;
     ReadKaldiObject(transition_model_filename, &trans_model);

     SequentialBaseFloatMatrixReader feature_reader(feature_rspecifier);
     RandomAccessLatticeReader den_lat_reader(den_lat_rspecifier);
     RandomAccessInt32VectorReader ref_ali_reader(ref_ali_rspecifier);

     CuMatrix<BaseFloat> feats_transf, nnet_out, nnet_diff;
     Matrix<BaseFloat> nnet_out_h;

     Timer time;
     double time_now = 0;
     KALDI_LOG << "TRAINING STARTED";

     int32 num_done = 0,
           num_no_ref_ali = 0,
           num_no_den_lat = 0,
           num_other_error = 0;

     kaldi::int64 total_frames = 0;
     double total_frame_acc = 0.0, utt_frame_acc;

     // main loop over utterances,
     for (; !feature_reader.Done(); feature_reader.Next()) {
       std::string utt = feature_reader.Key();
       if (!den_lat_reader.HasKey(utt)) {
         KALDI_WARN << "Missing lattice for " << utt;
         num_no_den_lat++;
         continue;
       }
       if (!ref_ali_reader.HasKey(utt)) {
         KALDI_WARN << "Missing alignment for " << utt;
         num_no_ref_ali++;
         continue;
       }

       // 1) get the features, numerator alignment,
       const Matrix<BaseFloat> &mat = feature_reader.Value();
       const std::vector<int32> &ref_ali = ref_ali_reader.Value(utt);
       // check duration of numerator alignments,
       if (static_cast<MatrixIndexT>(ref_ali.size()) != mat.NumRows()) {
         KALDI_WARN << "Duration mismatch!"
                    << " alignment " << ref_ali.size()
                    << " features " << mat.NumRows();
         num_other_error++;
         continue;
       }
       if (mat.NumRows() > max_frames) {
         KALDI_WARN << "Skipping " << utt
           << " that has " << mat.NumRows() << " frames,"
           << " it is longer than '--max-frames'" << max_frames;
         num_other_error++;
         continue;
       }

       // 2) get the denominator lattice, preprocess
       Lattice den_lat = den_lat_reader.Value(utt);
       if (den_lat.Start() == -1) {
         KALDI_WARN << "Empty lattice of " << utt << ", skipping.";
         num_other_error++;
         continue;
       }
       if (old_acoustic_scale != 1.0) {
         fst::ScaleLattice(fst::AcousticLatticeScale(old_acoustic_scale),
                           &den_lat);
       }
       // optional sort it topologically
       kaldi::uint64 props = den_lat.Properties(fst::kFstProperties, false);
       if (!(props & fst::kTopSorted)) {
         if (fst::TopSort(&den_lat) == false) {
           KALDI_ERR << "Cycles detected in lattice.";
         }
       }
       // get the lattice length and times of states
       std::vector<int32> state_times;
       int32 max_time = kaldi::LatticeStateTimes(den_lat, &state_times);
       // check for temporal length of denominator lattices
       if (max_time != mat.NumRows()) {
         KALDI_WARN << "Duration mismatch!"
           << " denominator lattice " << max_time
           << " features " << mat.NumRows() << ","
           << " skipping " << utt;
         num_other_error++;
         continue;
       }

       // get dims,
       int32 num_frames = mat.NumRows();

       // 3) get the pre-softmax outputs from NN,
       // apply transform,
       nnet_transf.Feedforward(CuMatrix<BaseFloat>(mat), &feats_transf);
       // propagate through the nnet (we know it's w/o softmax),
       nnet.Propagate(feats_transf, &nnet_out);
       // subtract the log_prior,
       if (prior_opts.class_frame_counts != "") {
         log_prior.SubtractOnLogpost(&nnet_out);
       }
       // transfer it back to the host,
       nnet_out_h = Matrix<BaseFloat>(nnet_out);
       // release the buffers we don't need anymore
       feats_transf.Resize(0, 0);
       nnet_out.Resize(0, 0);

       // 4) rescore the latice
       LatticeAcousticRescore(nnet_out_h, trans_model, state_times, &den_lat);
       if (acoustic_scale != 1.0 || lm_scale != 1.0)
         fst::ScaleLattice(fst::LatticeScale(lm_scale, acoustic_scale), &den_lat);

       kaldi::Posterior post;
       if (do_smbr) {
         // use state-level accuracies, i.e. sMBR estimation,
         utt_frame_acc = LatticeForwardBackwardMpeVariants(
             trans_model, silence_phones, den_lat, ref_ali, "smbr",
             one_silence_class, &post);
       } else {
         // use phone-level accuracies, i.e. MPFE (minimum phone frame error),
         utt_frame_acc = LatticeForwardBackwardMpeVariants(
             trans_model, silence_phones, den_lat, ref_ali, "mpfe",
             one_silence_class, &post);
       }

       // 6) convert the Posterior to a matrix,
       PosteriorToPdfMatrix(post, trans_model, &nnet_diff);
       nnet_diff.Scale(-1.0);  // need to flip the sign of derivative,

       KALDI_VLOG(1) << "Lattice #" << num_done + 1 << " processed"
                     << " (" << utt << "): found " << den_lat.NumStates()
                     << " states and " << fst::NumArcs(den_lat) << " arcs.";

       KALDI_VLOG(1) << "Utterance " << utt << ": Average frame accuracy = "
                     << (utt_frame_acc/num_frames) << " over " << num_frames
                     << " frames,"
                     << " diff-range(" << nnet_diff.Min() << ","
                                       << nnet_diff.Max() << ")";

       // 7) backpropagate through the nnet, update,
       nnet.Backpropagate(nnet_diff, NULL);
       nnet_diff.Resize(0, 0);  // release GPU memory,

       // increase time counter
       total_frame_acc += utt_frame_acc;
       total_frames += num_frames;
       num_done++;

       if (num_done % 100 == 0) {
         time_now = time.Elapsed();
         KALDI_VLOG(1) << "After " << num_done << " utterances: "
           << "time elapsed = " << time_now / 60 << " min; "
           << "processed " << total_frames / time_now << " frames per sec.";
 #if HAVE_CUDA == 1
         // check that GPU computes accurately,
         CuDevice::Instantiate().CheckGpuHealth();
 #endif
       }

       // GRADIENT LOGGING
       // First utterance,
       if (num_done == 1) {
         KALDI_VLOG(1) << nnet.InfoPropagate();
         KALDI_VLOG(1) << nnet.InfoBackPropagate();
         KALDI_VLOG(1) << nnet.InfoGradient();
       }
       // Every 1000 utterances (--verbose=2),
       if (GetVerboseLevel() >= 2) {
         if (num_done % 1000 == 0) {
           KALDI_VLOG(2) << nnet.InfoPropagate();
           KALDI_VLOG(2) << nnet.InfoBackPropagate();
           KALDI_VLOG(2) << nnet.InfoGradient();
         }
       }
     }  // main loop over utterances,

     // After last utterance,
     KALDI_VLOG(1) << nnet.InfoPropagate();
     KALDI_VLOG(1) << nnet.InfoBackPropagate();
     KALDI_VLOG(1) << nnet.InfoGradient();

     // Add the softmax layer back before writing,
     KALDI_LOG << "Appending the softmax " << target_model_filename;
     nnet.AppendComponentPointer(new Softmax(nnet.OutputDim(), nnet.OutputDim()));
     // Store the nnet,
     nnet.Write(target_model_filename, binary);

     time_now = time.Elapsed();
     KALDI_LOG << "TRAINING FINISHED; "
               << "Time taken = " << time_now / 60 << " min; processed "
               << total_frames / time_now << " frames per second.";

     KALDI_LOG << "Done " << num_done << " files, "
               << num_no_ref_ali << " with no reference alignments, "
               << num_no_den_lat << " with no lattices, "
               << num_other_error << " with other errors.";

     KALDI_LOG << "Overall average frame-accuracy is "
               << total_frame_acc / total_frames << " over "
               << total_frames << " frames.";

 #if HAVE_CUDA == 1
     CuDevice::Instantiate().PrintProfile();
 #endif

     return 0;
   } catch(const std::exception &e) {
     std::cerr << e.what();
     return -1;
   }
 }
kaldi::nnet1::Nnet::Backpropagate
void Backpropagate(const CuMatrixBase< BaseFloat > &out_diff, CuMatrix< BaseFloat > *in_diff)
Perform backward pass through the network,.
Definition: nnet-nnet.cc:96

kaldi::nnet1::PdfPriorOptions
Definition: nnet-pdf-prior.h:35

fstext-lib.h

kaldi::nnet1::Nnet::RemoveLastComponent
void RemoveLastComponent()
Remove the last of the Components,.
Definition: nnet-nnet.cc:206

kaldi
This code computes Goodness of Pronunciation (GOP) and extracts phone-level pronunciation feature for...
Definition: chain.dox:20

kaldi::nnet1::PosteriorToPdfMatrix
void PosteriorToPdfMatrix(const Posterior &post, const TransitionModel &model, CuMatrix< Real > *mat)
Wrapper of PosteriorToMatrixMapped with CuMatrix argument.
Definition: nnet-utils.h:304

kaldi::nnet1::Component::kSoftmax
Definition: nnet-component.h:59

kaldi::nnet1::Nnet::AppendComponentPointer
void AppendComponentPointer(Component *dynamically_allocated_comp)
Append Component* to &#39;this&#39; instance of Nnet by a shallow copy (&#39;this&#39; instance of Nnet over-takes th...
Definition: nnet-nnet.cc:187

kaldi::nnet1::NnetTrainOptions::learn_rate
BaseFloat learn_rate
Definition: nnet-trnopts.h:32

kaldi::nnet1
Definition: dnn1.dox:21

kaldi::LatticeArc
fst::ArcTpl< LatticeWeight > LatticeArc
Definition: kaldi-lattice.h:40

kaldi::nnet1::Nnet::Propagate
void Propagate(const CuMatrixBase< BaseFloat > &in, CuMatrix< BaseFloat > *out)
Perform forward pass through the network,.
Definition: nnet-nnet.cc:70

kaldi::nnet1::PdfPriorOptions::class_frame_counts
std::string class_frame_counts
Definition: nnet-pdf-prior.h:36

kaldi::LatticeStateTimes
int32 LatticeStateTimes(const Lattice &lat, vector< int32 > *times)
This function iterates over the states of a topologically sorted lattice and counts the time instance...
Definition: lattice-functions.cc:78

cu-device.h

kaldi::SplitStringToIntegers
bool SplitStringToIntegers(const std::string &full, const char *delim, bool omit_empty_strings, std::vector< I > *out)
Split a string (e.g.
Definition: text-utils.h:68

kaldi::ParseOptions::PrintUsage
void PrintUsage(bool print_command_line=false)
Prints the usage documentation [provided in the constructor].
Definition: parse-options.cc:393

kaldi::SequentialTableReader::Key
std::string Key()
Definition: kaldi-table-inl.h:918

kaldi::GetVerboseLevel
int32 GetVerboseLevel()
Get verbosity level, usually set via command line &#39;–verbose=&#39; switch.
Definition: kaldi-error.h:60

kaldi::nnet1::Nnet::Write
void Write(const std::string &wxfilename, bool binary) const
Write Nnet to &#39;wxfilename&#39;,.
Definition: nnet-nnet.cc:367

faster-decoder.h

nnet-pdf-prior.h

kaldi::int32
kaldi::int32 int32
Definition: online-tcp-source.cc:27

common-utils.h

kaldi::CuMatrix
This class represents a matrix that&#39;s stored on the GPU if we have one, and in memory if not...
Definition: matrix-common.h:71

kaldi::CuMatrixBase::Min
void Min(const CuMatrixBase< Real > &A)
Do, elementwise, *this = min(*this, A).
Definition: cu-matrix.cc:740

nnet-component.h

kaldi::SortAndUniq
void SortAndUniq(std::vector< T > *vec)
Sorts and uniq&#39;s (removes duplicates) from a vector.
Definition: stl-utils.h:39

timer.h

kaldi::nnet1::PdfPrior::SubtractOnLogpost
void SubtractOnLogpost(CuMatrixBase< BaseFloat > *llk)
Subtract pdf priors from log-posteriors to get pseudo log-likelihoods.
Definition: nnet-pdf-prior.cc:76

kaldi::nnet1::Nnet::GetLastComponent
const Component & GetLastComponent() const
LastComponent accessor,.
Definition: nnet-nnet.cc:161

kaldi::ParseOptions::Register
void Register(const std::string &name, bool *ptr, const std::string &doc)
Definition: parse-options.cc:56

kaldi::ReadKaldiObject
void ReadKaldiObject(const std::string &filename, Matrix< float > *m)
Definition: kaldi-io.cc:832

kaldi-lattice.h

lattice-functions.h

kaldi::RandomAccessTableReader
Allows random access to a collection of objects in an archive or script file; see The Table concept...
Definition: kaldi-table.h:233

main
int main(int argc, char *argv[])
Definition: nnet-train-mpe-sequential.cc:85

kaldi::nnet1::Component::TypeToMarker
static const char * TypeToMarker(ComponentType t)
Converts component type to marker,.
Definition: nnet-component.cc:84

kaldi::CuMatrixBase::Scale
void Scale(Real value)
Definition: cu-matrix.cc:644

fst::AcousticLatticeScale
std::vector< std::vector< double > > AcousticLatticeScale(double acwt)
Definition: lattice-utils.h:138

kaldi::BaseFloat
float BaseFloat
Definition: kaldi-types.h:29

kaldi::Posterior
std::vector< std::vector< std::pair< int32, BaseFloat > > > Posterior
Posterior is a typedef for storing acoustic-state (actually, transition-id) posteriors over an uttera...
Definition: posterior.h:42

kaldi::ParseOptions
The class ParseOptions is for parsing command-line options; see Parsing command-line options for more...
Definition: parse-options.h:36

kaldi::CuMatrixBase::Max
void Max(const CuMatrixBase< Real > &A)
Do, elementwise, *this = max(*this, A).
Definition: cu-matrix.cc:715

kaldi::nnet1::Nnet::OutputDim
int32 OutputDim() const
Dimensionality of network outputs (posteriors | bn-features | etc.),.
Definition: nnet-nnet.cc:143

kaldi::RandomAccessTableReader::Value
const T & Value(const std::string &key)
Definition: kaldi-table-inl.h:2561

transition-model.h

kaldi::nnet1::Nnet::InfoBackPropagate
std::string InfoBackPropagate(bool header=true) const
Create string with back-propagation-buffer statistics,.
Definition: nnet-nnet.cc:443

fst::ScaleLattice
void ScaleLattice(const std::vector< std::vector< ScaleFloat > > &scale, MutableFst< ArcTpl< Weight > > *fst)
Scales the pairs of weights in LatticeWeight or CompactLatticeWeight by viewing the pair (a...
Definition: lattice-utils-inl.h:197

kaldi::SequentialTableReader
A templated class for reading objects sequentially from an archive or script file; see The Table conc...
Definition: kaldi-table.h:287

fst::LatticeScale
std::vector< std::vector< double > > LatticeScale(double lmwt, double acwt)
Definition: lattice-utils.h:156

kaldi::nnet1::Nnet
Definition: nnet-nnet.h:37

kaldi::Lattice
fst::VectorFst< LatticeArc > Lattice
Definition: kaldi-lattice.h:44

kaldi::ParseOptions::Read
int Read(int argc, const char *const *argv)
Parses the command line options and fills the ParseOptions-registered variables.
Definition: parse-options.cc:311

kaldi::SequentialTableReader::Done
bool Done()
Definition: kaldi-table-inl.h:948

KALDI_ERR
#define KALDI_ERR
Definition: kaldi-error.h:147

kaldi::LatticeForwardBackwardMpeVariants
BaseFloat LatticeForwardBackwardMpeVariants(const TransitionModel &trans, const std::vector< int32 > &silence_phones, const Lattice &lat, const std::vector< int32 > &num_ali, std::string criterion, bool one_silence_class, Posterior *post)
This function implements either the MPFE (minimum phone frame error) or SMBR (state-level minimum bay...
Definition: lattice-functions.cc:794

kaldi::nnet1::Nnet::Read
void Read(const std::string &rxfilename)
Read Nnet from &#39;rxfilename&#39;,.
Definition: nnet-nnet.cc:333

kaldi::nnet1::PdfPrior
Definition: nnet-pdf-prior.h:59

kaldi::nnet1::NnetTrainOptions::Register
void Register(OptionsItf *opts)
Definition: nnet-trnopts.h:46

KALDI_WARN
#define KALDI_WARN
Definition: kaldi-error.h:150

kaldi::ParseOptions::GetArg
std::string GetArg(int param) const
Returns one of the positional parameters; 1-based indexing for argc/argv compatibility.
Definition: parse-options.cc:202

kaldi::SequentialTableReader::Next
void Next()
Definition: kaldi-table-inl.h:942

kaldi::RandomAccessTableReader::HasKey
bool HasKey(const std::string &key)
Definition: kaldi-table-inl.h:2551

kaldi::nnet1::Nnet::Feedforward
void Feedforward(const CuMatrixBase< BaseFloat > &in, CuMatrix< BaseFloat > *out)
Perform forward pass through the network (with 2 swapping buffers),.
Definition: nnet-nnet.cc:131

kaldi::Timer
Definition: timer.h:63

nnet-trnopts.h

kaldi::nnet1::Softmax
Definition: nnet-activation.h:37

kaldi::nnet1::NnetTrainOptions
Definition: nnet-trnopts.h:30

rnnlm::i
int i
Definition: mikolov-rnnlm-lib.cc:66

kaldi::ParseOptions::NumArgs
int NumArgs() const
Number of positional parameters (c.f. argc-1).
Definition: parse-options.cc:198

nnet-nnet.h

nnet-activation.h

kaldi::SequentialTableReader::Value
T & Value()
Definition: kaldi-table-inl.h:934

KALDI_ASSERT
#define KALDI_ASSERT(cond)
Definition: kaldi-error.h:185

kaldi::nnet1::Nnet::InfoGradient
std::string InfoGradient(bool header=true) const
Create string with per-component gradient statistics,.
Definition: nnet-nnet.cc:407

kaldi::nnet1::Nnet::InfoPropagate
std::string InfoPropagate(bool header=true) const
Create string with propagation-buffer statistics,.
Definition: nnet-nnet.cc:420

KALDI_VLOG
#define KALDI_VLOG(v)
Definition: kaldi-error.h:156

kaldi::nnet1::Component::GetType
virtual ComponentType GetType() const =0
Get Type Identification of the component,.

kaldi::nnet1::Nnet::SetTrainOptions
void SetTrainOptions(const NnetTrainOptions &opts)
Set hyper-parameters of the training (pushes to all UpdatableComponents),.
Definition: nnet-nnet.cc:508

decodable-matrix.h

fst::NumArcs
Arc::StateId NumArcs(const ExpandedFst< Arc > &fst)
Returns the total number of arcs in an FST.
Definition: fstext-utils-inl.h:67

KALDI_LOG
#define KALDI_LOG
Definition: kaldi-error.h:153

nnet-utils.h

context-dep.h

kaldi::Timer::Elapsed
double Elapsed() const
Returns time in seconds.
Definition: timer.h:74

kaldi-common.h

kaldi::CuMatrix::Resize
void Resize(MatrixIndexT rows, MatrixIndexT cols, MatrixResizeType resize_type=kSetZero, MatrixStrideType stride_type=kDefaultStride)
Allocate the memory.
Definition: cu-matrix.cc:50

kaldi::nnet1::PdfPriorOptions::Register
void Register(OptionsItf *opts)
Definition: nnet-pdf-prior.h:46

kaldi::nnet1::LatticeAcousticRescore
void LatticeAcousticRescore(const Matrix< BaseFloat > &log_like, const TransitionModel &trans_model, const std::vector< int32 > &state_times, Lattice *lat)
Definition: nnet-train-mmi-sequential.cc:45