nnet-train-multistream.cc
Go to the documentation of this file.
1 // nnetbin/nnet-train-multistream.cc
2 
3 // Copyright 2015-2016 Brno University of Technology (Author: Karel Vesely)
4 // 2014 Jiayu DU (Jerry), Wei Li
5 
6 // See ../../COPYING for clarification regarding multiple authors
7 //
8 // Licensed under the Apache License, Version 2.0 (the "License");
9 // you may not use this file except in compliance with the License.
10 // You may obtain a copy of the License at
11 //
12 // http://www.apache.org/licenses/LICENSE-2.0
13 //
14 // THIS CODE IS PROVIDED *AS IS* BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY
15 // KIND, EITHER EXPRESS OR IMPLIED, INCLUDING WITHOUT LIMITATION ANY IMPLIED
16 // WARRANTIES OR CONDITIONS OF TITLE, FITNESS FOR A PARTICULAR PURPOSE,
17 // MERCHANTABLITY OR NON-INFRINGEMENT.
18 // See the Apache 2 License for the specific language governing permissions and
19 // limitations under the License.
20 
21 #include <numeric>
22 
23 #include "nnet/nnet-trnopts.h"
24 #include "nnet/nnet-nnet.h"
25 #include "nnet/nnet-loss.h"
26 #include "nnet/nnet-randomizer.h"
27 #include "base/kaldi-common.h"
28 #include "util/common-utils.h"
29 #include "base/timer.h"
30 #include "cudamatrix/cu-device.h"
31 
32 
33 namespace kaldi {
34 
36  RandomAccessPosteriorReader& target_reader,
37  RandomAccessBaseFloatVectorReader& weights_reader,
38  int32 length_tolerance,
39  Matrix<BaseFloat>* feats,
40  Posterior* targets,
41  Vector<BaseFloat>* weights,
42  int32* num_no_tgt_mat,
43  int32* num_other_error) {
44 
45  // We're looking for the 1st valid utterance...
46  for ( ; !feature_reader.Done(); feature_reader.Next()) {
47  // Do we have targets?
48  const std::string& utt = feature_reader.Key();
49  KALDI_VLOG(3) << "Reading: " << utt;
50  if (!target_reader.HasKey(utt)) {
51  KALDI_WARN << utt << ", missing targets";
52  (*num_no_tgt_mat)++;
53  continue;
54  }
55  // Do we have frame-weights?
56  if (weights_reader.IsOpen() && !weights_reader.HasKey(utt)) {
57  KALDI_WARN << utt << ", missing frame-weights";
58  (*num_other_error)++;
59  continue;
60  }
61 
62  // get the (feature,target) pair,
63  (*feats) = feature_reader.Value();
64  (*targets) = target_reader.Value(utt);
65 
66  // getting per-frame weights,
67  if (weights_reader.IsOpen()) {
68  (*weights) = weights_reader.Value(utt);
69  } else { // all per-frame weights are 1.0
70  weights->Resize(feats->NumRows());
71  weights->Set(1.0);
72  }
73 
74  // correct small length mismatch ... or drop sentence
75  {
76  // add lengths to vector
77  std::vector<int32> length;
78  length.push_back(feats->NumRows());
79  length.push_back(targets->size());
80  length.push_back(weights->Dim());
81  // find min, max
82  int32 min = *std::min_element(length.begin(), length.end());
83  int32 max = *std::max_element(length.begin(), length.end());
84  // fix or drop ?
85  if (max - min < length_tolerance) {
86  if (feats->NumRows() != min) feats->Resize(min, feats->NumCols(), kCopyData);
87  if (targets->size() != min) targets->resize(min);
88  if (weights->Dim() != min) weights->Resize(min, kCopyData);
89  } else {
90  KALDI_WARN << "Length mismatch! Targets " << targets->size()
91  << ", features " << feats->NumRows() << ", " << utt;
92  num_other_error++;
93  continue;
94  }
95  }
96 
97  // By getting here we got a valid utterance,
98  feature_reader.Next();
99  return true;
100  }
101 
102  // No more data,
103  return false;
104 }
105 
106 } // namespace kaldi
107 
108 
/// Train (or cross-validate) an 'nnet1' network with multi-stream truncated
/// BPTT: 'num_streams' utterances are processed in parallel, sliced into
/// 'batch_size'-frame chunks that are interleaved into one mini-batch
/// (row r*num_streams + s holds frame r of stream s).
int main(int argc, char *argv[]) {
  using namespace kaldi;
  using namespace kaldi::nnet1;
  typedef kaldi::int32 int32;

  try {
    const char *usage =
      "Perform one iteration of Multi-stream training, truncated BPTT for LSTMs.\n"
      "The training targets are pdf-posteriors, usually prepared by ali-to-post.\n"
      "The updates are per-utterance.\n"
      "\n"
      "Usage: nnet-train-multistream [options] "
      "<feature-rspecifier> <targets-rspecifier> <model-in> [<model-out>]\n"
      "e.g.: nnet-train-lstm-streams scp:feature.scp ark:posterior.ark nnet.init nnet.iter1\n";

    ParseOptions po(usage);

    NnetTrainOptions trn_opts;
    trn_opts.Register(&po);
    LossOptions loss_opts;
    loss_opts.Register(&po);

    bool binary = true;
    po.Register("binary", &binary, "Write output in binary mode");

    bool crossvalidate = false;
    po.Register("cross-validate", &crossvalidate,
        "Perform cross-validation (don't back-propagate)");

    std::string feature_transform;
    po.Register("feature-transform", &feature_transform,
        "Feature transform in Nnet format");

    std::string objective_function = "xent";
    po.Register("objective-function", &objective_function,
        "Objective function : xent|mse");

    int32 length_tolerance = 5;
    po.Register("length-tolerance", &length_tolerance,
        "Allowed length difference of features/targets (frames)");

    std::string frame_weights;
    po.Register("frame-weights", &frame_weights,
        "Per-frame weights to scale gradients (frame selection/weighting).");

    int32 batch_size = 20;
    po.Register("batch-size", &batch_size,
        "Length of 'one stream' in the Multi-stream training");

    int32 num_streams = 4;
    po.Register("num-streams", &num_streams,
        "Number of streams in the Multi-stream training");

    // accepted but unused; presumably kept so shared training scripts can
    // pass '--randomize' uniformly to all nnet1 trainers,
    bool dummy = false;
    po.Register("randomize", &dummy, "Dummy option.");

    std::string use_gpu="yes";
    po.Register("use-gpu", &use_gpu,
        "yes|no|optional, only has effect if compiled with CUDA");

    po.Read(argc, argv);

    // 4th positional arg (model-out) is required only when training,
    if (po.NumArgs() != 3 + (crossvalidate ? 0 : 1)) {
      po.PrintUsage();
      exit(1);
    }

    std::string feature_rspecifier = po.GetArg(1),
      targets_rspecifier = po.GetArg(2),
      model_filename = po.GetArg(3);

    std::string target_model_filename;
    if (!crossvalidate) {
      target_model_filename = po.GetArg(4);
    }

    // (redundant re-declarations, kept as-is),
    using namespace kaldi;
    using namespace kaldi::nnet1;
    typedef kaldi::int32 int32;

#if HAVE_CUDA == 1
    CuDevice::Instantiate().SelectGpuId(use_gpu);
#endif

    // optional input feature transform (may contain splicing),
    Nnet nnet_transf;
    if (feature_transform != "") {
      nnet_transf.Read(feature_transform);
    }

    Nnet nnet;
    nnet.Read(model_filename);
    nnet.SetTrainOptions(trn_opts);

    if (crossvalidate) {
      // disable dropout when evaluating held-out data,
      nnet_transf.SetDropoutRate(0.0);
      nnet.SetDropoutRate(0.0);
    }

    kaldi::int64 total_frames = 0;

    SequentialBaseFloatMatrixReader feature_reader(feature_rspecifier);
    RandomAccessPosteriorReader target_reader(targets_rspecifier);
    RandomAccessBaseFloatVectorReader weights_reader;
    if (frame_weights != "") {
      weights_reader.Open(frame_weights);
    }

    Xent xent(loss_opts);
    Mse mse(loss_opts);

    Timer time;
    double time_gpu = 0;  // accumulates time spent in GPU-side calls,
    KALDI_LOG << (crossvalidate ? "CROSS-VALIDATION" : "TRAINING")
              << " STARTED";

    int32 num_done = 0,
          num_no_tgt_mat = 0,
          num_other_error = 0;

    // book-keeping for multi-stream training: per-stream utterance data,
    // plus a read-cursor (frame offset) into each stream's utterance,
    std::vector<Matrix<BaseFloat> > feats_utt(num_streams);
    std::vector<Posterior> labels_utt(num_streams);
    std::vector<Vector<BaseFloat> > weights_utt(num_streams);
    std::vector<int32> cursor_utt(num_streams);  // 0 initialized,
    std::vector<int32> new_utt_flags(num_streams);

    CuMatrix<BaseFloat> feats_transf, nnet_out, obj_diff;

    // MAIN LOOP,
    while (1) {

      // Re-fill the streams, if needed,
      new_utt_flags.assign(num_streams, 0);  // set new-utterance flags to zero,
      for (int s = 0; s < num_streams; s++) {
        // Need a new utterance for stream 's'? (cursor ran past the data),
        if (cursor_utt[s] >= feats_utt[s].NumRows()) {
          Matrix<BaseFloat> feats;
          Posterior targets;
          Vector<BaseFloat> weights;
          // get the data from readers,
          if (ReadData(feature_reader, target_reader, weights_reader,
                       length_tolerance,
                       &feats, &targets, &weights,
                       &num_no_tgt_mat, &num_other_error)) {

            // input transform may contain splicing,
            Timer t;
            nnet_transf.Feedforward(CuMatrix<BaseFloat>(feats), &feats_transf);
            time_gpu += t.Elapsed();

            /* Here we could do the 'targets_delay', BUT...
             * It is better to do it by a <Splice> component!
             *
             * The prototype would look like this (6th frame becomes 1st frame, etc.):
             * '<Splice> <InputDim> dim1 <OutputDim> dim1 <BuildVector> 5 </BuildVector>'
             */

            // store,
            feats_utt[s] = Matrix<BaseFloat>(feats_transf);
            labels_utt[s] = targets;
            weights_utt[s] = weights;
            cursor_utt[s] = 0;
            new_utt_flags[s] = 1;  // tells the nnet to reset this stream's history,
          }
        }
      }

      // End the training when 1st stream is empty
      // (this avoids over-adaptation to last utterances),
      size_t inactive_streams = 0;
      for (int32 s = 0; s < num_streams; s++) {
        if (feats_utt[s].NumRows() - cursor_utt[s] <= 0) {
          inactive_streams += 1;
        }
      }
      if (inactive_streams >= 1) {
        KALDI_LOG << "No more data to re-fill one of the streams, end of the training!";
        KALDI_LOG << "(remaining stubs of data are discarded, don't overtrain on them)";
        break;
      }

      // number of frames we'll pack as the streams,
      std::vector<int32> frame_num_utt;

      // pack the parallel data,
      Matrix<BaseFloat> feat_mat_host;
      Posterior target_host;
      Vector<BaseFloat> weight_host;
      {
        // Number of sequences (can have zero length),
        int32 n_streams = num_streams;

        // Create the final feature matrix with 'interleaved feature-lines':
        // row r*n_streams + s is frame r of stream s,
        feat_mat_host.Resize(n_streams * batch_size, nnet.InputDim(), kSetZero);
        target_host.resize(n_streams * batch_size);
        weight_host.Resize(n_streams * batch_size, kSetZero);
        frame_num_utt.resize(n_streams, 0);

        // we slice at the 'cursor' at most 'batch_size' frames,
        for (int32 s = 0; s < n_streams; s++) {
          int32 num_rows = std::max(0, feats_utt[s].NumRows() - cursor_utt[s]);
          frame_num_utt[s] = std::min(batch_size, num_rows);
        }

        // pack the data,
        {
          // features,
          for (int32 s = 0; s < n_streams; s++) {
            if (frame_num_utt[s] > 0) {
              auto mat_tmp = feats_utt[s].RowRange(cursor_utt[s], frame_num_utt[s]);
              for (int32 r = 0; r < frame_num_utt[s]; r++) {
                feat_mat_host.Row(r*n_streams + s).CopyFromVec(mat_tmp.Row(r));
              }
            }
          }

          // targets,
          for (int32 s = 0; s < n_streams; s++) {
            for (int32 r = 0; r < frame_num_utt[s]; r++) {
              target_host[r*n_streams + s] = labels_utt[s][cursor_utt[s] + r];
            }
          }

          // padded frames will keep initial zero-weight,
          // (so padding does not contribute to the loss/gradient),
          for (int32 s = 0; s < n_streams; s++) {
            if (frame_num_utt[s] > 0) {
              auto weight_tmp = weights_utt[s].Range(cursor_utt[s], frame_num_utt[s]);
              for (int32 r = 0; r < frame_num_utt[s]; r++) {
                weight_host(r*n_streams + s) = weight_tmp(r);
              }
            }
          }
        }

        // advance the cursors,
        for (int32 s = 0; s < n_streams; s++) {
          cursor_utt[s] += frame_num_utt[s];
        }
      }

      // pass the info about padding,
      nnet.SetSeqLengths(frame_num_utt);

      // Show debug info,
      if (GetVerboseLevel() >= 4) {
        // cursors in the feature_matrices,
        {
          std::ostringstream os;
          os << "[ ";
          for (size_t i = 0; i < cursor_utt.size(); i++) {
            os << cursor_utt[i] << " ";
          }
          os << "]";
          KALDI_LOG << "cursor_utt[" << cursor_utt.size() << "]" << os.str();
        }
        // frames in the mini-batch,
        {
          std::ostringstream os;
          os << "[ ";
          for (size_t i = 0; i < frame_num_utt.size(); i++) {
            os << frame_num_utt[i] << " ";
          }
          os << "]";
          KALDI_LOG << "frame_num_utt[" << frame_num_utt.size() << "]" << os.str();
        }
      }

      Timer t;
      // with new utterance we reset the history,
      nnet.ResetStreams(new_utt_flags);

      // forward pass,
      nnet.Propagate(CuMatrix<BaseFloat>(feat_mat_host), &nnet_out);

      // evaluate objective function we've chosen,
      if (objective_function == "xent") {
        xent.Eval(weight_host, nnet_out, target_host, &obj_diff);
      } else if (objective_function == "mse") {
        mse.Eval(weight_host, nnet_out, target_host, &obj_diff);
      } else {
        KALDI_ERR << "Unknown objective function code : "
                  << objective_function;
      }

      if (!crossvalidate) {
        // back-propagate, and do the update,
        nnet.Backpropagate(obj_diff, NULL);
      }
      time_gpu += t.Elapsed();

      // 1st minibatch : show what happens in network,
      if (total_frames == 0) {
        KALDI_LOG << "### After " << total_frames << " frames,";
        KALDI_LOG << nnet.Info();
        KALDI_LOG << nnet.InfoPropagate();
        if (!crossvalidate) {
          KALDI_LOG << nnet.InfoBackPropagate();
          KALDI_LOG << nnet.InfoGradient();
        }
      }

      kaldi::int64 tmp_frames = total_frames;

      // utterances finished = streams that were re-filled this iteration,
      num_done += std::accumulate(new_utt_flags.begin(), new_utt_flags.end(), 0);
      total_frames += std::accumulate(frame_num_utt.begin(), frame_num_utt.end(), 0);

      // monitor the NN training (--verbose=2),
      int32 F = 25000;
      if (GetVerboseLevel() >= 2) {
        // print every 25k frames,
        if (tmp_frames / F != total_frames / F) {
          KALDI_VLOG(2) << "### After " << total_frames << " frames,";
          KALDI_VLOG(2) << nnet.Info();
          KALDI_VLOG(2) << nnet.InfoPropagate();
          if (!crossvalidate) {
            KALDI_VLOG(2) << nnet.InfoBackPropagate();
            KALDI_VLOG(2) << nnet.InfoGradient();
          }
        }
      }
    }

    // after last minibatch : show what happens in network,
    KALDI_LOG << "### After " << total_frames << " frames,";
    KALDI_LOG << nnet.Info();
    KALDI_LOG << nnet.InfoPropagate();
    if (!crossvalidate) {
      KALDI_LOG << nnet.InfoBackPropagate();
      KALDI_LOG << nnet.InfoGradient();
    }

    if (!crossvalidate) {
      nnet.Write(target_model_filename, binary);
    }

    if (objective_function == "xent") {
      KALDI_LOG << xent.ReportPerClass();
    }

    KALDI_LOG << "Done " << num_done << " files, "
              << num_no_tgt_mat << " with no tgt_mats, "
              << num_other_error << " with other errors. "
              << "[" << (crossvalidate ? "CROSS-VALIDATION" : "TRAINING")
              << ", " << time.Elapsed() / 60 << " min, processing "
              << total_frames / time.Elapsed() << " frames per sec, "
              << "GPU_time " << 100.*time_gpu/time.Elapsed() << "% ]";

    if (objective_function == "xent") {
      KALDI_LOG << xent.Report();
    } else if (objective_function == "mse") {
      KALDI_LOG << mse.Report();
    } else {
      KALDI_ERR << "Unknown objective function code : " << objective_function;
    }

#if HAVE_CUDA == 1
    CuDevice::Instantiate().PrintProfile();
#endif

    return 0;
  } catch(const std::exception &e) {
    std::cerr << e.what();
    return -1;
  }
}
void Backpropagate(const CuMatrixBase< BaseFloat > &out_diff, CuMatrix< BaseFloat > *in_diff)
Perform backward pass through the network,.
Definition: nnet-nnet.cc:96
This code computes Goodness of Pronunciation (GOP) and extracts phone-level pronunciation feature for...
Definition: chain.dox:20
void ResetStreams(const std::vector< int32 > &stream_reset_flag)
Reset streams in multi-stream training,.
Definition: nnet-nnet.cc:281
int main(int argc, char *argv[])
void Propagate(const CuMatrixBase< BaseFloat > &in, CuMatrix< BaseFloat > *out)
Perform forward pass through the network,.
Definition: nnet-nnet.cc:70
MatrixIndexT NumCols() const
Returns number of columns (or zero for empty matrix).
Definition: kaldi-matrix.h:67
void SetSeqLengths(const std::vector< int32 > &sequence_lengths)
Set sequence length in LSTM multi-stream training,.
Definition: nnet-nnet.cc:291
void PrintUsage(bool print_command_line=false)
Prints the usage documentation [provided in the constructor].
int32 GetVerboseLevel()
Get verbosity level, usually set via command line '--verbose=' switch.
Definition: kaldi-error.h:60
void Write(const std::string &wxfilename, bool binary) const
Write Nnet to 'wxfilename'.
Definition: nnet-nnet.cc:367
int32 InputDim() const
Dimensionality on network input (input feature dim.),.
Definition: nnet-nnet.cc:148
bool Open(const std::string &rspecifier)
kaldi::int32 int32
This class represents a matrix that's stored on the GPU if we have one, and in memory if not...
Definition: matrix-common.h:71
void Resize(MatrixIndexT length, MatrixResizeType resize_type=kSetZero)
Set vector to a specified size (can be zero).
void Register(const std::string &name, bool *ptr, const std::string &doc)
std::string Report()
Generate string with error report.
Definition: nnet-loss.cc:299
Allows random access to a collection of objects in an archive or script file; see The Table concept...
Definition: kaldi-table.h:233
std::vector< std::vector< std::pair< int32, BaseFloat > > > Posterior
Posterior is a typedef for storing acoustic-state (actually, transition-id) posteriors over an uttera...
Definition: posterior.h:42
The class ParseOptions is for parsing command-line options; see Parsing command-line options for more...
Definition: parse-options.h:36
const SubVector< Real > Row(MatrixIndexT i) const
Return specific row of matrix [const].
Definition: kaldi-matrix.h:188
const T & Value(const std::string &key)
std::string InfoBackPropagate(bool header=true) const
Create string with back-propagation-buffer statistics,.
Definition: nnet-nnet.cc:443
void Eval(const VectorBase< BaseFloat > &frame_weights, const CuMatrixBase< BaseFloat > &net_out, const CuMatrixBase< BaseFloat > &target, CuMatrix< BaseFloat > *diff)
Evaluate cross entropy using target-matrix (supports soft labels),.
Definition: nnet-loss.cc:62
std::string Report()
Generate string with error report,.
Definition: nnet-loss.cc:182
A templated class for reading objects sequentially from an archive or script file; see The Table conc...
Definition: kaldi-table.h:287
void Eval(const VectorBase< BaseFloat > &frame_weights, const CuMatrixBase< BaseFloat > &net_out, const CuMatrixBase< BaseFloat > &target, CuMatrix< BaseFloat > *diff)
Evaluate mean square error using target-matrix,.
Definition: nnet-loss.cc:228
int Read(int argc, const char *const *argv)
Parses the command line options and fills the ParseOptions-registered variables.
#define KALDI_ERR
Definition: kaldi-error.h:147
void Read(const std::string &rxfilename)
Read Nnet from 'rxfilename'.
Definition: nnet-nnet.cc:333
void Register(OptionsItf *opts)
Definition: nnet-trnopts.h:46
std::string GetArg(int param) const
Returns one of the positional parameters; 1-based indexing for argc/argv compatibility.
#define KALDI_WARN
Definition: kaldi-error.h:150
MatrixIndexT Dim() const
Returns the dimension of the vector.
Definition: kaldi-vector.h:64
bool HasKey(const std::string &key)
void Feedforward(const CuMatrixBase< BaseFloat > &in, CuMatrix< BaseFloat > *out)
Perform forward pass through the network (with 2 swapping buffers),.
Definition: nnet-nnet.cc:131
int NumArgs() const
Number of positional parameters (c.f. argc-1).
A class representing a vector.
Definition: kaldi-vector.h:406
MatrixIndexT NumRows() const
Returns number of rows (or zero for empty matrix).
Definition: kaldi-matrix.h:64
void Set(Real f)
Set all members of a vector to a specified value.
void SetDropoutRate(BaseFloat r)
Set the dropout rate.
Definition: nnet-nnet.cc:268
std::string InfoGradient(bool header=true) const
Create string with per-component gradient statistics,.
Definition: nnet-nnet.cc:407
std::string InfoPropagate(bool header=true) const
Create string with propagation-buffer statistics,.
Definition: nnet-nnet.cc:420
std::string Info() const
Create string with human readable description of the nnet,.
Definition: nnet-nnet.cc:386
#define KALDI_VLOG(v)
Definition: kaldi-error.h:156
void SetTrainOptions(const NnetTrainOptions &opts)
Set hyper-parameters of the training (pushes to all UpdatableComponents),.
Definition: nnet-nnet.cc:508
void Resize(const MatrixIndexT r, const MatrixIndexT c, MatrixResizeType resize_type=kSetZero, MatrixStrideType stride_type=kDefaultStride)
Sets matrix to a specified size (zero is OK as long as both r and c are zero).
std::string ReportPerClass()
Generate string with per-class error report,.
Definition: nnet-loss.cc:203
void Register(OptionsItf *opts)
Definition: nnet-loss.h:45
#define KALDI_LOG
Definition: kaldi-error.h:153
double Elapsed() const
Returns time in seconds.
Definition: timer.h:74
bool ReadData(SequentialBaseFloatMatrixReader &feature_reader, RandomAccessPosteriorReader &target_reader, RandomAccessBaseFloatVectorReader &weights_reader, int32 length_tolerance, Matrix< BaseFloat > *feats, Posterior *targets, Vector< BaseFloat > *weights, int32 *num_no_tgt_mat, int32 *num_other_error)