doc/nnet-compute-discriminative_8cc_source.html

 // nnet2/nnet-compute-discriminative.cc

 // Copyright 2012-2013   Johns Hopkins University (author: Daniel Povey)

 // See ../../COPYING for clarification regarding multiple authors
 //
 // Licensed under the Apache License, Version 2.0 (the "License");
 // you may not use this file except in compliance with the License.
 // You may obtain a copy of the License at
 //
 //  http://www.apache.org/licenses/LICENSE-2.0
 //
 // THIS CODE IS PROVIDED *AS IS* BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY
 // KIND, EITHER EXPRESS OR IMPLIED, INCLUDING WITHOUT LIMITATION ANY IMPLIED
 // WARRANTIES OR CONDITIONS OF TITLE, FITNESS FOR A PARTICULAR PURPOSE,
 // MERCHANTABLITY OR NON-INFRINGEMENT.
 // See the Apache 2 License for the specific language governing permissions and
 // limitations under the License.

 #include "nnet2/nnet-compute-discriminative.h"
 #include "hmm/posterior.h"
 #include "lat/lattice-functions.h"

 namespace kaldi {
 namespace nnet2 {

 /*
   Runs the forward pass, the lattice computations and (optionally) the
   backward pass for one DiscriminativeNnetExample, which is typically a whole
   utterance of contiguous features.  Create a fresh object of this class for
   every example you want to process.
 */
 class NnetDiscriminativeUpdater {
  public:

   // All reference arguments are stored as references, not copied.
   // nnet_to_update may be NULL, in which case Update() does no backprop.
   NnetDiscriminativeUpdater(const AmNnet &am_nnet,
                             const TransitionModel &tmodel,
                             const NnetDiscriminativeUpdateOptions &opts,
                             const DiscriminativeNnetExample &eg,
                             Nnet *nnet_to_update,
                             NnetDiscriminativeStats *stats);

   // Runs the complete computation: Propagate(), LatticeComputations() and,
   // when there is a network to update, Backprop().
   void Update() {
     Propagate();
     LatticeComputations();
     if (nnet_to_update_ == NULL)
       return;  // only the objective function was requested.
     Backprop();
   }

   /// The forward-through-the-layers part of the computation.
   void Propagate();

   /// Does the parts between Propagate() and Backprop(), that involve
   /// forward-backward over the lattice.
   void LatticeComputations();

   // Propagates the derivative in backward_data_ back through the components.
   void Backprop();

   /// Assuming the lattice already has the correct scores in it, this function
   /// does the MPE or MMI forward-backward and writes the result to "post".
   double GetDiscriminativePosteriors(Posterior *post);

   // Returns the rows of eg_.input_frames that the network actually needs.
   SubMatrix<BaseFloat> GetInputFeatures() const;

   // The last element of forward_data_, i.e. the output of the final component.
   CuMatrixBase<BaseFloat> &GetOutput() { return forward_data_.back(); }

   // Builds the (first, second) index pair used for the batched matrix lookup.
   static inline Int32Pair MakePair(int32 first, int32 second) {
     Int32Pair pair;
     pair.first = first;
     pair.second = second;
     return pair;
   }

  private:
   typedef LatticeArc Arc;
   typedef Arc::StateId StateId;


   const AmNnet &am_nnet_;
   const TransitionModel &tmodel_;
   const NnetDiscriminativeUpdateOptions &opts_;
   const DiscriminativeNnetExample &eg_;
   // nnet_to_update_ equals am_nnet_.GetNnet() in the SGD case, is another
   // Nnet in the gradient-computation case, and is NULL if we just need the
   // objective function.
   Nnet *nnet_to_update_;
   NnetDiscriminativeStats *stats_; // the objective function, etc.
   std::vector<ChunkInfo> chunk_info_out_; // set up in the constructor.
   // forward_data_[i] is the input of the i'th component and (if i > 0)
   // the output of the i-1'th component.
   std::vector<CuMatrix<BaseFloat> > forward_data_;
   Lattice lat_; // the CompactLattice from the eg, converted to Lattice form.
   CuMatrix<BaseFloat> backward_data_; // derivative being back-propagated.
   std::vector<int32> silence_phones_; // derived from opts_.silence_phones_str
 };


 // Stores the arguments, parses the colon-separated silence-phone list from
 // the options (raising an error if it is malformed), and computes the chunk
 // info for a single chunk covering all rows of the example's input frames.
 NnetDiscriminativeUpdater::NnetDiscriminativeUpdater(
     const AmNnet &am_nnet,
     const TransitionModel &tmodel,
     const NnetDiscriminativeUpdateOptions &opts,
     const DiscriminativeNnetExample &eg,
     Nnet *nnet_to_update,
     NnetDiscriminativeStats *stats):
     am_nnet_(am_nnet), tmodel_(tmodel), opts_(opts), eg_(eg),
     nnet_to_update_(nnet_to_update), stats_(stats) {
   // "false" means empty fields are not omitted while splitting.
   const bool parsed_ok = SplitStringToIntegers(opts_.silence_phones_str, ":",
                                                false, &silence_phones_);
   if (!parsed_ok) {
     KALDI_ERR << "Bad value for --silence-phones option: "
               << opts_.silence_phones_str;
   }
   am_nnet_.GetNnet().ComputeChunkInfo(eg_.input_frames.NumRows(), 1,
                                       &chunk_info_out_);
 }


 // Returns a sub-matrix of eg_.input_frames holding one row per labeled frame
 // plus exactly the left and right context that the network requires.  The
 // example may carry more context than the network needs, but never less.
 SubMatrix<BaseFloat> NnetDiscriminativeUpdater::GetInputFeatures() const {
   const Nnet &nnet = am_nnet_.GetNnet();
   const int32 num_labeled_frames = eg_.num_ali.size();
   const int32 eg_left_context = eg_.left_context;
   // Whatever is left after the labeled frames and the left context is the
   // right context supplied by the example.
   const int32 eg_right_context =
       eg_.input_frames.NumRows() - num_labeled_frames - eg_left_context;
   KALDI_ASSERT(eg_right_context >= 0);
   // Normally the example was generated with the same model and has the exact
   // context; a mismatch is tolerated as long as the example has more context,
   // not less.
   KALDI_ASSERT(eg_left_context >= nnet.LeftContext() &&
                eg_right_context >= nnet.RightContext());

   const int32 nnet_left = nnet.LeftContext(),
       nnet_right = nnet.RightContext();
   // Skip the surplus left-context rows and take just what the network needs.
   const int32 first_row = eg_left_context - nnet_left;
   const int32 num_rows = num_labeled_frames + nnet_left + nnet_right;
   return SubMatrix<BaseFloat>(eg_.input_frames, first_row, num_rows,
                               0, eg_.input_frames.NumCols());
 }

 void NnetDiscriminativeUpdater::Propagate() {
   const Nnet &nnet = am_nnet_.GetNnet();
   forward_data_.resize(nnet.NumComponents() + 1);

   SubMatrix<BaseFloat> input_feats = GetInputFeatures();
   int32 spk_dim = eg_.spk_info.Dim();
   if (spk_dim == 0) {
     forward_data_[0] = input_feats;
   } else {
     forward_data_[0].Resize(input_feats.NumRows(),
                             input_feats.NumCols() + eg_.spk_info.Dim());
     forward_data_[0].Range(0, input_feats.NumRows(),
                            0, input_feats.NumCols()).CopyFromMat(input_feats);
     forward_data_[0].Range(0, input_feats.NumRows(),
                            input_feats.NumCols(), spk_dim).CopyRowsFromVec(
                                eg_.spk_info);
   }

   for (int32 c = 0; c < nnet.NumComponents(); c++) {
     const Component &component = nnet.GetComponent(c);
     CuMatrix<BaseFloat> &input = forward_data_[c],
         &output = forward_data_[c+1];
     component.Propagate(chunk_info_out_[c] , chunk_info_out_[c+1], input, &output);
     const Component *prev_component = (c == 0 ? NULL :
                                        &(nnet.GetComponent(c-1)));
     bool will_do_backprop = (nnet_to_update_ != NULL),
         keep_last_output = will_do_backprop &&
         ((c>0 && prev_component->BackpropNeedsOutput()) ||
          component.BackpropNeedsInput());
     if (!keep_last_output)
       forward_data_[c].Resize(0, 0); // We won't need this data; save memory.
   }
 }


 // Does the parts between Propagate() and Backprop() that involve
 // forward-backward over the lattice.  In order, it:
 //  - converts eg_.den_lat into a topologically sorted Lattice (lat_), boosted
 //    when the criterion is "mmi" and opts_.boost is nonzero;
 //  - looks up, in one batch, the network outputs for every (frame, pdf-id)
 //    pair on the numerator alignment (MMI only) and on the lattice arcs;
 //  - converts them to scaled pseudo-log-likelihoods and writes them into lat_;
 //  - calls GetDiscriminativePosteriors() and accumulates into *stats_;
 //  - leaves the derivative at the network output in backward_data_.
 void NnetDiscriminativeUpdater::LatticeComputations() {
   ConvertLattice(eg_.den_lat, &lat_); // convert to Lattice.
   TopSort(&lat_); // Topologically sort (required by forward-backward algorithms)

   if (opts_.criterion == "mmi" && opts_.boost != 0.0) {
     BaseFloat max_silence_error = 0.0;
     LatticeBoost(tmodel_, eg_.num_ali, silence_phones_,
                  opts_.boost, max_silence_error, &lat_);
   }

   int32 num_frames = static_cast<int32>(eg_.num_ali.size());

   stats_->tot_t += num_frames;
   stats_->tot_t_weighted += num_frames * eg_.weight;

   const VectorBase<BaseFloat> &priors = am_nnet_.Priors();
   const CuMatrix<BaseFloat> &posteriors = forward_data_.back();

   KALDI_ASSERT(posteriors.NumRows() == num_frames);
   int32 num_pdfs = posteriors.NumCols();
   KALDI_ASSERT(num_pdfs == priors.Dim());

   // We need to look up the posteriors of some pdf-ids in the matrix
   // "posteriors".  Rather than looking them all up using operator (), which is
   // very slow because each lookup involves a separate CUDA call with
   // communication over PciExpress, we look them up all at once using
   // CuMatrix::Lookup().
   // Note: the likelihoods of the numerator alignment are only requested for
   // the "mmi" criterion, where they contribute to the objective function
   // (stats_->tot_num_objf); they come first in "requested_indexes".

   std::vector<Int32Pair> requested_indexes;
   BaseFloat wiggle_room = 1.3; // value not critical.. it's just 'reserve'
   requested_indexes.reserve(num_frames + wiggle_room * lat_.NumStates());

   if (opts_.criterion == "mmi") { // need numerator probabilities...
     for (int32 t = 0; t < num_frames; t++) {
       int32 tid = eg_.num_ali[t], pdf_id = tmodel_.TransitionIdToPdf(tid);
       KALDI_ASSERT(pdf_id >= 0 && pdf_id < num_pdfs);
       requested_indexes.push_back(MakePair(t, pdf_id));
     }
   }

   std::vector<int32> state_times;
   int32 T = LatticeStateTimes(lat_, &state_times);
   KALDI_ASSERT(T == num_frames);

   StateId num_states = lat_.NumStates();
   for (StateId s = 0; s < num_states; s++) {
     int32 t = state_times[s];
     for (fst::ArcIterator<Lattice> aiter(lat_, s); !aiter.Done(); aiter.Next()) {
       const Arc &arc = aiter.Value();
       if (arc.ilabel != 0) { // input-side has transition-ids, output-side empty
         int32 tid = arc.ilabel, pdf_id = tmodel_.TransitionIdToPdf(tid);
         // Validate here, as for the numerator alignment, so that a lattice
         // that does not match the model fails with a clear assertion rather
         // than inside the batched lookup or the prior indexing below.
         KALDI_ASSERT(t >= 0 && t < num_frames);
         KALDI_ASSERT(pdf_id >= 0 && pdf_id < num_pdfs);
         requested_indexes.push_back(MakePair(t, pdf_id));
       }
     }
   }

   std::vector<BaseFloat> answers(requested_indexes.size());
   if (!answers.empty()) {
     // Guarded because &(answers[0]) must not be formed for an empty vector.
     CuArray<Int32Pair> cu_requested_indexes(requested_indexes);
     posteriors.Lookup(cu_requested_indexes, &(answers[0]));
   }

   int32 num_floored = 0;

   BaseFloat floor_val = 1.0e-20; // floor for posteriors.
   size_t index;

   // Replace "answers" with the vector of scaled log-probs.  If this step takes
   // too much time, we can look at other ways to do it, using the CUDA card.
   for (index = 0; index < answers.size(); index++) {
     BaseFloat post = answers[index];
     if (post < floor_val) {
       post = floor_val;
       num_floored++;
     }
     int32 pdf_id = requested_indexes[index].second;
     // Posterior divided by prior, in the log domain, times the acoustic scale.
     BaseFloat pseudo_loglike = Log(post / priors(pdf_id)) * opts_.acoustic_scale;
     KALDI_ASSERT(!KALDI_ISINF(pseudo_loglike) && !KALDI_ISNAN(pseudo_loglike));
     answers[index] = pseudo_loglike;
   }
   if (num_floored > 0) {
     KALDI_WARN << "Floored " << num_floored << " probabilities from nnet.";
   }

   index = 0;

   if (opts_.criterion == "mmi") {
     // The first eg_.num_ali.size() answers belong to the numerator alignment.
     double tot_num_like = 0.0;
     for (; index < eg_.num_ali.size(); index++)
       tot_num_like += answers[index];
     stats_->tot_num_objf += eg_.weight * tot_num_like;
   }

   // Now put the (scaled) acoustic log-likelihoods in the lattice.  The arcs
   // are visited in the same order as when the indexes were requested, so
   // "index" walks through the remaining answers in step with them.
   for (StateId s = 0; s < num_states; s++) {
     for (fst::MutableArcIterator<Lattice> aiter(&lat_, s);
          !aiter.Done(); aiter.Next()) {
       Arc arc = aiter.Value();
       if (arc.ilabel != 0) { // input-side has transition-ids, output-side empty
         arc.weight.SetValue2(-answers[index]);
         index++;
         aiter.SetValue(arc);
       }
     }
     LatticeWeight final = lat_.Final(s);
     if (final != LatticeWeight::Zero()) {
       final.SetValue2(0.0); // make sure no acoustic term in final-prob.
       lat_.SetFinal(s, final);
     }
   }
   KALDI_ASSERT(index == answers.size());

   // Get the MPE or MMI posteriors.
   Posterior post;
   stats_->tot_den_objf += eg_.weight * GetDiscriminativePosteriors(&post);

   ScalePosterior(eg_.weight, &post);

   // Flatten the posteriors into (frame, pdf-id, weight) triples, summing the
   // positive weights for the statistics.
   double tot_num_post = 0.0;
   std::vector<MatrixElement<BaseFloat> > sv_labels;
   sv_labels.reserve(answers.size());
   const int32 num_post_frames = static_cast<int32>(post.size());
   for (int32 t = 0; t < num_post_frames; t++) {
     for (size_t i = 0; i < post[t].size(); i++) {
       int32 pdf_id = post[t][i].first;
       BaseFloat weight = post[t][i].second;
       if (weight > 0.0) { tot_num_post += weight; }
       MatrixElement<BaseFloat> elem = {t, pdf_id, weight};
       sv_labels.push_back(elem);
     }
   }
   stats_->tot_num_count += tot_num_post;
   int32 num_components = am_nnet_.GetNnet().NumComponents();
   const CuMatrix<BaseFloat> &output(forward_data_[num_components]);
   backward_data_.Resize(output.NumRows(), output.NumCols()); // zeroes it.

   { // We don't actually need tot_objf and tot_weight; we have already
     // computed the objective function.
     BaseFloat tot_objf, tot_weight;
     backward_data_.CompObjfAndDeriv(sv_labels, output, &tot_objf, &tot_weight);
     // Now backward_data_ will contain the derivative at the output.
     // Our work here is done..
   }
 }


 // Assuming the lattice already has the correct scores in it, runs the
 // forward-backward for the configured criterion and writes pdf-level
 // posteriors to "post".  Returns the objective function for "mpfe"/"smbr";
 // for "mmi", returns the denominator-lattice forward-backward likelihood,
 // which is one term in the objective function.
 double NnetDiscriminativeUpdater::GetDiscriminativePosteriors(Posterior *post) {
   const bool is_mpe_variant =
       (opts_.criterion == "mpfe" || opts_.criterion == "smbr");

   if (!is_mpe_variant) {
     KALDI_ASSERT(opts_.criterion == "mmi");
     // Ask for posteriors over pdf-ids, with cancellation enabled.
     const bool convert_to_pdfs = true, cancel = true;
     return LatticeForwardBackwardMmi(tmodel_, lat_, eg_.num_ali,
                                      opts_.drop_frames, convert_to_pdfs,
                                      cancel, post);
   }

   // The MPE variants give posteriors over transition-ids, so they are
   // converted to pdf-ids afterwards.
   Posterior tid_post;
   double objf = LatticeForwardBackwardMpeVariants(tmodel_, silence_phones_,
                                                   lat_, eg_.num_ali,
                                                   opts_.criterion,
                                                   opts_.one_silence_class,
                                                   &tid_post);
   ConvertPosteriorToPdfs(tmodel_, tid_post, post);
   return objf;
 }


 void NnetDiscriminativeUpdater::Backprop() {
   const Nnet &nnet = am_nnet_.GetNnet();
   for (int32 c = nnet.NumComponents() - 1; c >= 0; c--) {
     const Component &component = nnet.GetComponent(c);
     Component *component_to_update = &(nnet_to_update_->GetComponent(c));
     const CuMatrix<BaseFloat>  &input = forward_data_[c],
                             &output = forward_data_[c+1],
                       &output_deriv = backward_data_;
     CuMatrix<BaseFloat> input_deriv;
     component.Backprop(chunk_info_out_[c], chunk_info_out_[c+1], input, output, output_deriv,
                        component_to_update, &input_deriv);
     backward_data_.Swap(&input_deriv); // backward_data_ = input_deriv.
   }
 }


 // Does the neural net computation, lattice forward-backward, and (when
 // nnet_to_update is not NULL) backprop for one example, by constructing a
 // single-use NnetDiscriminativeUpdater and calling its Update().
 void NnetDiscriminativeUpdate(const AmNnet &am_nnet,
                               const TransitionModel &tmodel,
                               const NnetDiscriminativeUpdateOptions &opts,
                               const DiscriminativeNnetExample &eg,
                               Nnet *nnet_to_update,
                               NnetDiscriminativeStats *stats) {
   NnetDiscriminativeUpdater(am_nnet, tmodel, opts, eg,
                             nnet_to_update, stats).Update();
 }

 // Accumulates every total held in "other" into this object.
 void NnetDiscriminativeStats::Add(const NnetDiscriminativeStats &other) {
   // Frame counts.
   tot_t          += other.tot_t;
   tot_t_weighted += other.tot_t_weighted;
   // Objective-function terms.
   tot_num_objf   += other.tot_num_objf;
   tot_den_objf   += other.tot_den_objf;
   // Posterior count.
   tot_num_count  += other.tot_num_count;
 }

 // Logs the frame counts and the per-frame objective function for the given
 // criterion, which must be "mmi", "smbr" or "mpfe".  All averages are taken
 // over the weighted frame count.
 void NnetDiscriminativeStats::Print(std::string criterion) {
   KALDI_ASSERT(criterion == "mmi" || criterion == "smbr" ||
                criterion == "mpfe");

   KALDI_LOG << "Number of frames is " << tot_t
             << " (weighted: " << tot_t_weighted
             << "), average (num or den) posterior per frame is "
             << (tot_num_count / tot_t_weighted);

   if (criterion != "mmi") {
     // For MPFE and SMBR, tot_den_objf contains the actual summed objf.
     const char *header = (criterion == "mpfe" ?
                           "MPFE objective function is " :
                           "SMBR objective function is ");
     const double objf = tot_den_objf / tot_t_weighted;
     KALDI_LOG << header << objf
               << " per frame, over " << tot_t_weighted << " frames.";
     return;
   }

   // MMI: the objective is the numerator term minus the denominator term.
   const double num_objf = tot_num_objf / tot_t_weighted;
   const double den_objf = tot_den_objf / tot_t_weighted;
   KALDI_LOG << "MMI objective function is " << num_objf << " - "
             << den_objf << " = " << (num_objf - den_objf)
             << " per frame, over " << tot_t_weighted << " frames.";
 }


 } // namespace nnet2
 } // namespace kaldi
fst::StateId
fst::StdArc::StateId StateId
Definition: deterministic-fst-test.cc:58

kaldi
This code computes Goodness of Pronunciation (GOP) and extracts phone-level pronunciation feature for...
Definition: chain.dox:20

kaldi::nnet2::Nnet::GetComponent
const Component & GetComponent(int32 c) const
Definition: nnet-nnet.cc:141

kaldi::nnet2::Nnet::LeftContext
int32 LeftContext() const
Returns the left-context summed over all the Components...
Definition: nnet-nnet.cc:42

kaldi::nnet2::NnetDiscriminativeUpdater::StateId
Arc::StateId StateId
Definition: nnet-compute-discriminative.cc:79

kaldi::nnet2::NnetDiscriminativeUpdater::lat_
Lattice lat_
Definition: nnet-compute-discriminative.cc:94

kaldi::LatticeArc
fst::ArcTpl< LatticeWeight > LatticeArc
Definition: kaldi-lattice.h:40

kaldi::nnet2::NnetDiscriminativeUpdateOptions::acoustic_scale
BaseFloat acoustic_scale
Definition: nnet-compute-discriminative.h:37

kaldi::nnet2::NnetDiscriminativeUpdater::silence_phones_
std::vector< int32 > silence_phones_
Definition: nnet-compute-discriminative.cc:96

kaldi::nnet2::NnetDiscriminativeUpdater::backward_data_
CuMatrix< BaseFloat > backward_data_
Definition: nnet-compute-discriminative.cc:95

kaldi::nnet2::NnetDiscriminativeStats::tot_num_count
double tot_num_count
Definition: nnet-compute-discriminative.h:73

kaldi::LatticeStateTimes
int32 LatticeStateTimes(const Lattice &lat, vector< int32 > *times)
This function iterates over the states of a topologically sorted lattice and counts the time instance...
Definition: lattice-functions.cc:78

kaldi::nnet2::NnetDiscriminativeUpdater::eg_
const DiscriminativeNnetExample & eg_
Definition: nnet-compute-discriminative.cc:85

kaldi::MatrixBase::NumCols
MatrixIndexT NumCols() const
Returns number of columns (or zero for empty matrix).
Definition: kaldi-matrix.h:67

kaldi::nnet2::AmNnet
Definition: am-nnet.h:38

kaldi::nnet2::NnetDiscriminativeUpdater::forward_data_
std::vector< CuMatrix< BaseFloat > > forward_data_
Definition: nnet-compute-discriminative.cc:93

MatrixElement
Definition: cu-matrixdim.h:35

kaldi::SplitStringToIntegers
bool SplitStringToIntegers(const std::string &full, const char *delim, bool omit_empty_strings, std::vector< I > *out)
Split a string (e.g.
Definition: text-utils.h:68

kaldi::nnet2::NnetDiscriminativeStats
Definition: nnet-compute-discriminative.h:70

kaldi::nnet2::Component
Abstract class, basic element of the network, it is a box with defined inputs, outputs, and transformation functions interface.
Definition: nnet-component.h:157

KALDI_ISINF
#define KALDI_ISINF
Definition: kaldi-math.h:73

kaldi::nnet2::Component::BackpropNeedsInput
virtual bool BackpropNeedsInput() const
Definition: nnet-component.h:235

kaldi::nnet2::NnetDiscriminativeUpdater::stats_
NnetDiscriminativeStats * stats_
Definition: nnet-compute-discriminative.cc:89

kaldi::nnet2::NnetDiscriminativeUpdater::MakePair
static Int32Pair MakePair(int32 first, int32 second)
Definition: nnet-compute-discriminative.cc:70

kaldi::int32
kaldi::int32 int32
Definition: online-tcp-source.cc:27

kaldi::CuMatrix
This class represents a matrix that's stored on the GPU if we have one, and in memory if not...
Definition: matrix-common.h:71

kaldi::nnet2::NnetDiscriminativeUpdateOptions::one_silence_class
bool one_silence_class
Definition: nnet-compute-discriminative.h:40

kaldi::TransitionModel::TransitionIdToPdf
int32 TransitionIdToPdf(int32 trans_id) const
Definition: transition-model.h:327

kaldi::nnet2::NnetDiscriminativeUpdater::GetInputFeatures
SubMatrix< BaseFloat > GetInputFeatures() const
Definition: nnet-compute-discriminative.cc:121

fst::LatticeWeightTpl< BaseFloat >

posterior.h

kaldi::nnet2::NnetDiscriminativeUpdater::chunk_info_out_
std::vector< ChunkInfo > chunk_info_out_
Definition: nnet-compute-discriminative.cc:90

kaldi::TransitionModel
Definition: transition-model.h:123

lattice-functions.h

kaldi::nnet2::NnetDiscriminativeStats::Add
void Add(const NnetDiscriminativeStats &other)
Definition: nnet-compute-discriminative.cc:376

kaldi::CuMatrixBase::Lookup
void Lookup(const std::vector< Int32Pair > &indexes, Real *output) const
Definition: cu-matrix.cc:3370

kaldi::nnet2::Nnet::NumComponents
int32 NumComponents() const
Returns number of components -- think of this as similar to # of layers, but e.g.
Definition: nnet-nnet.h:69

kaldi::nnet2::NnetDiscriminativeUpdater
Definition: nnet-compute-discriminative.cc:32

kaldi::Posterior
std::vector< std::vector< std::pair< int32, BaseFloat > > > Posterior
Posterior is a typedef for storing acoustic-state (actually, transition-id) posteriors over an uttera...
Definition: posterior.h:42

kaldi::nnet2::NnetDiscriminativeUpdater::Backprop
void Backprop()
Definition: nnet-compute-discriminative.cc:349

kaldi::LatticeForwardBackwardMmi
BaseFloat LatticeForwardBackwardMmi(const TransitionModel &tmodel, const Lattice &lat, const std::vector< int32 > &num_ali, bool drop_frames, bool convert_to_pdf_ids, bool cancel, Posterior *post)
This function can be used to compute posteriors for MMI, with a positive contribution for the numerat...
Definition: lattice-functions.cc:1414

kaldi::Log
double Log(double x)
Definition: kaldi-math.h:100

kaldi::nnet2::NnetDiscriminativeUpdateOptions
Definition: nnet-compute-discriminative.h:35

float

kaldi::nnet2::NnetDiscriminativeUpdater::am_nnet_
const AmNnet & am_nnet_
Definition: nnet-compute-discriminative.cc:82

kaldi::nnet2::NnetDiscriminativeUpdater::NnetDiscriminativeUpdater
NnetDiscriminativeUpdater(const AmNnet &am_nnet, const TransitionModel &tmodel, const NnetDiscriminativeUpdateOptions &opts, const DiscriminativeNnetExample &eg, Nnet *nnet_to_update, NnetDiscriminativeStats *stats)
Definition: nnet-compute-discriminative.cc:101

kaldi::nnet2::AmNnet::Priors
const VectorBase< BaseFloat > & Priors() const
Definition: am-nnet.h:67

kaldi::nnet2::Nnet::RightContext
int32 RightContext() const
Returns the right-context summed over all the Components...
Definition: nnet-nnet.cc:56

kaldi::nnet2::NnetDiscriminativeUpdater::GetDiscriminativePosteriors
double GetDiscriminativePosteriors(Posterior *post)
Assuming the lattice already has the correct scores in it, this function does the MPE or MMI forward-...
Definition: nnet-compute-discriminative.cc:326

kaldi::nnet2::NnetDiscriminativeStats::tot_t_weighted
double tot_t_weighted
Definition: nnet-compute-discriminative.h:72

fst::ConvertLattice
void ConvertLattice(const ExpandedFst< ArcTpl< Weight > > &ifst, MutableFst< ArcTpl< CompactLatticeWeightTpl< Weight, Int > > > *ofst, bool invert)
Convert lattice from a normal FST to a CompactLattice FST.
Definition: lattice-utils-inl.h:33

kaldi::nnet2::NnetDiscriminativeUpdateOptions::silence_phones_str
std::string silence_phones_str
Definition: nnet-compute-discriminative.h:43

fst::LatticeWeightTpl< BaseFloat >::Zero
static const LatticeWeightTpl Zero()
Definition: lattice-weight.h:76

kaldi::nnet2::DiscriminativeNnetExample::spk_info
Vector< BaseFloat > spk_info
spk_info contains any component of the features that varies slowly or not at all with time (and hence...
Definition: nnet-example.h:171

kaldi::nnet2::Nnet
Definition: nnet-nnet.h:63

kaldi::Lattice
fst::VectorFst< LatticeArc > Lattice
Definition: kaldi-lattice.h:44

kaldi::nnet2::Component::Backprop
virtual void Backprop(const ChunkInfo &in_info, const ChunkInfo &out_info, const CuMatrixBase< BaseFloat > &in_value, const CuMatrixBase< BaseFloat > &out_value, const CuMatrixBase< BaseFloat > &out_deriv, Component *to_update, CuMatrix< BaseFloat > *in_deriv) const =0
Perform backward pass propagation of the derivative, and also either update the model (if to_update =...

KALDI_ERR
#define KALDI_ERR
Definition: kaldi-error.h:147

kaldi::LatticeForwardBackwardMpeVariants
BaseFloat LatticeForwardBackwardMpeVariants(const TransitionModel &trans, const std::vector< int32 > &silence_phones, const Lattice &lat, const std::vector< int32 > &num_ali, std::string criterion, bool one_silence_class, Posterior *post)
This function implements either the MPFE (minimum phone frame error) or SMBR (state-level minimum bay...
Definition: lattice-functions.cc:794

kaldi::nnet2::NnetDiscriminativeUpdateOptions::boost
BaseFloat boost
Definition: nnet-compute-discriminative.h:41

kaldi::nnet2::DiscriminativeNnetExample::den_lat
CompactLattice den_lat
The denominator lattice.
Definition: nnet-example.h:148

KALDI_WARN
#define KALDI_WARN
Definition: kaldi-error.h:150

kaldi::VectorBase::Dim
MatrixIndexT Dim() const
Returns the dimension of the vector.
Definition: kaldi-vector.h:64

kaldi::nnet2::DiscriminativeNnetExample::input_frames
Matrix< BaseFloat > input_frames
The input data -- typically with a number of frames [NumRows()] larger than labels.size(), because it includes features to the left and right as needed for the temporal context of the network.
Definition: nnet-example.h:159

kaldi::nnet2::DiscriminativeNnetExample::num_ali
std::vector< int32 > num_ali
The numerator alignment.
Definition: nnet-example.h:143

kaldi::nnet2::DiscriminativeNnetExample::weight
BaseFloat weight
The weight we assign to this example; this will typically be one, but we include it for the sake of g...
Definition: nnet-example.h:140

kaldi::nnet2::NnetDiscriminativeUpdater::Update
void Update()
Definition: nnet-compute-discriminative.cc:42

kaldi::ScalePosterior
void ScalePosterior(BaseFloat scale, Posterior *post)
Scales the BaseFloat (weight) element in the posterior entries.
Definition: posterior.cc:218

rnnlm::i
int i
Definition: mikolov-rnnlm-lib.cc:66

kaldi::nnet2::NnetDiscriminativeStats::Print
void Print(std::string criterion)
Definition: nnet-compute-discriminative.cc:384

kaldi::CuMatrixBase
Matrix for CUDA computing.
Definition: matrix-common.h:69

kaldi::nnet2::NnetDiscriminativeUpdater::LatticeComputations
void LatticeComputations()
Does the parts between Propagate() and Backprop(), that involve forward-backward over the lattice...
Definition: nnet-compute-discriminative.cc:178

kaldi::CuMatrixBase::NumCols
MatrixIndexT NumCols() const
Definition: cu-matrix.h:216

kaldi::nnet2::NnetDiscriminativeStats::tot_den_objf
double tot_den_objf
Definition: nnet-compute-discriminative.h:78

kaldi::nnet2::DiscriminativeNnetExample
This struct is used to store the information we need for discriminative training (MMI or MPE)...
Definition: nnet-example.h:136

kaldi::nnet2::Component::Propagate
virtual void Propagate(const ChunkInfo &in_info, const ChunkInfo &out_info, const CuMatrixBase< BaseFloat > &in, CuMatrixBase< BaseFloat > *out) const =0
Perform forward pass propagation Input->Output.

nnet-compute-discriminative.h

KALDI_ISNAN
#define KALDI_ISNAN
Definition: kaldi-math.h:72

kaldi::CuArray< Int32Pair >

KALDI_ASSERT
#define KALDI_ASSERT(cond)
Definition: kaldi-error.h:185

kaldi::nnet2::NnetDiscriminativeUpdater::opts_
const NnetDiscriminativeUpdateOptions & opts_
Definition: nnet-compute-discriminative.cc:84

kaldi::MatrixBase::NumRows
MatrixIndexT NumRows() const
Returns number of rows (or zero for empty matrix).
Definition: kaldi-matrix.h:64

kaldi::nnet2::NnetDiscriminativeUpdater::Arc
LatticeArc Arc
Definition: nnet-compute-discriminative.cc:78

kaldi::nnet2::NnetDiscriminativeUpdater::nnet_to_update_
Nnet * nnet_to_update_
Definition: nnet-compute-discriminative.cc:86

kaldi::LatticeBoost
bool LatticeBoost(const TransitionModel &trans, const std::vector< int32 > &alignment, const std::vector< int32 > &silence_phones, BaseFloat b, BaseFloat max_silence_error, Lattice *lat)
Boosts LM probabilities by b * [number of frame errors]; equivalently, adds -b*[number of frame error...
Definition: lattice-functions.cc:735

Int32Pair
Definition: cu-matrixdim.h:78

kaldi::nnet2::NnetDiscriminativeUpdateOptions::criterion
std::string criterion
Definition: nnet-compute-discriminative.h:36

Int32Pair::second
int32_cuda second
Definition: cu-matrixdim.h:80

kaldi::nnet2::NnetDiscriminativeUpdater::Propagate
void Propagate()
The forward-through-the-layers part of the computation.
Definition: nnet-compute-discriminative.cc:142

kaldi::CuMatrixBase::NumRows
MatrixIndexT NumRows() const
Dimensions.
Definition: cu-matrix.h:215

kaldi::VectorBase
Provides a vector abstraction class.
Definition: kaldi-vector.h:41

kaldi::nnet2::NnetDiscriminativeStats::tot_t
double tot_t
Definition: nnet-compute-discriminative.h:71

kaldi::ConvertPosteriorToPdfs
void ConvertPosteriorToPdfs(const TransitionModel &tmodel, const Posterior &post_in, Posterior *post_out)
Converts a posterior over transition-ids to be a posterior over pdf-ids.
Definition: posterior.cc:322

kaldi::nnet2::DiscriminativeNnetExample::left_context
int32 left_context
The number of frames of left context in the features (we can work out the #frames of right context fr...
Definition: nnet-example.h:164

KALDI_LOG
#define KALDI_LOG
Definition: kaldi-error.h:153

kaldi::nnet2::NnetDiscriminativeUpdater::GetOutput
CuMatrixBase< BaseFloat > & GetOutput()
Definition: nnet-compute-discriminative.cc:68

kaldi::nnet2::Nnet::ComputeChunkInfo
void ComputeChunkInfo(int32 input_chunk_size, int32 num_chunks, std::vector< ChunkInfo > *chunk_info_out) const
Uses the output of the Context() functions of the network, to compute a vector of size NumComponents(...
Definition: nnet-nnet.cc:65

kaldi::SubMatrix
Sub-matrix representation.
Definition: kaldi-matrix.h:988

kaldi::nnet2::Component::BackpropNeedsOutput
virtual bool BackpropNeedsOutput() const
Definition: nnet-component.h:237

kaldi::nnet2::NnetDiscriminativeUpdateOptions::drop_frames
bool drop_frames
Definition: nnet-compute-discriminative.h:38

kaldi::nnet2::AmNnet::GetNnet
const Nnet & GetNnet() const
Definition: am-nnet.h:61

kaldi::nnet2::NnetDiscriminativeStats::tot_num_objf
double tot_num_objf
Definition: nnet-compute-discriminative.h:76

kaldi::nnet2::NnetDiscriminativeUpdate
void NnetDiscriminativeUpdate(const AmNnet &am_nnet, const TransitionModel &tmodel, const NnetDiscriminativeUpdateOptions &opts, const DiscriminativeNnetExample &eg, Nnet *nnet_to_update, NnetDiscriminativeStats *stats)
Does the neural net computation, lattice forward-backward, and backprop, for either the MMI...
Definition: nnet-compute-discriminative.cc:365

Int32Pair::first
int32_cuda first
Definition: cu-matrixdim.h:79

kaldi::nnet2::NnetDiscriminativeUpdater::tmodel_
const TransitionModel & tmodel_
Definition: nnet-compute-discriminative.cc:83