doc/online-ivector-feature_8cc_source.html

 // online2/online-ivector-feature.cc

 // Copyright 2014  Daniel Povey

 // See ../../COPYING for clarification regarding multiple authors
 //
 // Licensed under the Apache License, Version 2.0 (the "License");
 // you may not use this file except in compliance with the License.
 // You may obtain a copy of the License at
 //
 //  http://www.apache.org/licenses/LICENSE-2.0
 //
 // THIS CODE IS PROVIDED *AS IS* BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY
 // KIND, EITHER EXPRESS OR IMPLIED, INCLUDING WITHOUT LIMITATION ANY IMPLIED
 // WARRANTIES OR CONDITIONS OF TITLE, FITNESS FOR A PARTICULAR PURPOSE,
 // MERCHANTABLITY OR NON-INFRINGEMENT.
 // See the Apache 2 License for the specific language governing permissions and
 // limitations under the License.

 #include "online2/online-ivector-feature.h"

 namespace kaldi {

 // Constructs the info object directly from a config; all of the work
 // (copying options, reading files, validation) is delegated to Init().
 OnlineIvectorExtractionInfo::OnlineIvectorExtractionInfo(
     const OnlineIvectorExtractionConfig &config) {
   this->Init(config);
 }

 // Fills in this object from 'config': copies the scalar options, reads each
 // file named in the config (LDA matrix, global CMVN stats, CMVN options,
 // splicing options, diagonal UBM, iVector extractor) and finally calls
 // Check().  An empty filename for any of these is reported via KALDI_ERR.
 void OnlineIvectorExtractionInfo::Init(
     const OnlineIvectorExtractionConfig &config) {
   // Scalar options are taken over unchanged.
   online_cmvn_iextractor = config.online_cmvn_iextractor;
   ivector_period = config.ivector_period;
   num_gselect = config.num_gselect;
   min_post = config.min_post;
   posterior_scale = config.posterior_scale;
   max_count = config.max_count;
   num_cg_iters = config.num_cg_iters;
   max_remembered_frames = config.max_remembered_frames;

   // Greedy extraction only makes sense together with "most recent iVector"
   // mode, so the latter is forced on (with a warning) if needed.
   greedy_ivector_extractor = config.greedy_ivector_extractor;
   use_most_recent_ivector = config.use_most_recent_ivector;
   if (greedy_ivector_extractor && !use_most_recent_ivector) {
     KALDI_WARN << "--greedy-ivector-extractor=true implies --use-most-recent-ivector=true";
     use_most_recent_ivector = true;
   }

   // Suffix appended to every "option must be set" error below.
   const std::string note("(note: this may be needed in the file "
                          "supplied to --ivector-extractor-config)");

   // Each file is checked and then read immediately, so that errors are
   // reported in the same order as the options are listed here.
   if (config.lda_mat_rxfilename.empty())
     KALDI_ERR << "--lda-matrix option must be set " << note;
   ReadKaldiObject(config.lda_mat_rxfilename, &lda_mat);

   if (config.global_cmvn_stats_rxfilename.empty())
     KALDI_ERR << "--global-cmvn-stats option must be set " << note;
   ReadKaldiObject(config.global_cmvn_stats_rxfilename, &global_cmvn_stats);

   if (config.cmvn_config_rxfilename.empty())
     KALDI_ERR << "--cmvn-config option must be set " << note;
   ReadConfigFromFile(config.cmvn_config_rxfilename, &cmvn_opts);

   if (config.splice_config_rxfilename.empty())
     KALDI_ERR << "--splice-config option must be set " << note;
   ReadConfigFromFile(config.splice_config_rxfilename, &splice_opts);

   if (config.diag_ubm_rxfilename.empty())
     KALDI_ERR << "--diag-ubm option must be set " << note;
   ReadKaldiObject(config.diag_ubm_rxfilename, &diag_ubm);

   if (config.ivector_extractor_rxfilename.empty())
     KALDI_ERR << "--ivector-extractor option must be set " << note;
   ReadKaldiObject(config.ivector_extractor_rxfilename, &extractor);

   this->Check();
 }

 // Returns the per-frame input feature dimension implied by the LDA matrix
 // and the splicing options: the LDA matrix's column count divided (rounding
 // down) by the number of spliced frames.  A remainder of 0 or 1 is accepted
 // silently; anything else produces a warning.
 int32 OnlineIvectorExtractionInfo::ExpectedFeatureDim() const {
   const int32 spliced_frames =
       splice_opts.left_context + splice_opts.right_context + 1;
   const int32 lda_input_dim = lda_mat.NumCols();
   const int32 leftover = lda_input_dim % spliced_frames;
   if (leftover != 0 && leftover != 1) {
     KALDI_WARN << "Error getting expected feature dimension: full-dim = "
                << lda_input_dim << ", num-splice = " << spliced_frames;
   }
   return lda_input_dim / spliced_frames;
 }

 void OnlineIvectorExtractionInfo::Check() const {
   KALDI_ASSERT(global_cmvn_stats.NumRows() == 2);
   int32 base_feat_dim = global_cmvn_stats.NumCols() - 1,
       num_splice = splice_opts.left_context + 1 + splice_opts.right_context,
       spliced_input_dim = base_feat_dim * num_splice;

   KALDI_ASSERT(lda_mat.NumCols() == spliced_input_dim ||
                lda_mat.NumCols() == spliced_input_dim + 1);
   KALDI_ASSERT(lda_mat.NumRows() == diag_ubm.Dim());
   KALDI_ASSERT(diag_ubm.Dim() == extractor.FeatDim());
   KALDI_ASSERT(ivector_period > 0);
   KALDI_ASSERT(num_gselect > 0);
   KALDI_ASSERT(min_post < 0.5);
   // posterior scale more than one does not really make sense.
   KALDI_ASSERT(posterior_scale > 0.0 && posterior_scale <= 1.0);
   KALDI_ASSERT(max_remembered_frames >= 0);
 }

 // Default constructor.  An object constructed in this way should never be
 // used as-is: it holds no models, and ivector_period / num_gselect are zero,
 // which Check() rejects.  Every scalar member is nevertheless given a
 // definite value so that copying such an object never reads indeterminate
 // data.
 OnlineIvectorExtractionInfo::OnlineIvectorExtractionInfo():
     ivector_period(0), num_gselect(0), min_post(0.0), posterior_scale(0.0),
     use_most_recent_ivector(true), greedy_ivector_extractor(false),
     max_remembered_frames(0) {
   // Assigned in the body (rather than the initializer list) so that this
   // file does not depend on the member declaration order in the header.
   online_cmvn_iextractor = false;
   max_count = 0.0;
   num_cg_iters = 0;
 }

 // Copy constructor: copies both pieces of adaptation state held by 'other',
 // i.e. its CMVN state and its accumulated iVector statistics.
 OnlineIvectorExtractorAdaptationState::OnlineIvectorExtractorAdaptationState(
     const OnlineIvectorExtractorAdaptationState &other):
     cmvn_state(other.cmvn_state), ivector_stats(other.ivector_stats) { }


 // Scales down the stored statistics so that they represent at most
 // 'max_remembered_frames' frames.
 //   max_remembered_frames: upper bound on the frame count; must be >= 0.
 //   posterior_scale: scale that was applied to the iVector stats; the
 //       target count for those stats is multiplied by it.
 // Requires that the CMVN state has no frozen state.
 void OnlineIvectorExtractorAdaptationState::LimitFrames(
     BaseFloat max_remembered_frames, BaseFloat posterior_scale) {
   KALDI_ASSERT(max_remembered_frames >= 0);
   KALDI_ASSERT(cmvn_state.frozen_state.NumRows() == 0);

   const bool have_speaker_stats =
       (cmvn_state.speaker_cmvn_stats.NumRows() != 0);
   if (have_speaker_stats) {
     // The count is read from row 0, last column of the speaker CMVN stats.
     const int32 count_col = cmvn_state.speaker_cmvn_stats.NumCols() - 1;
     const BaseFloat cmvn_count = cmvn_state.speaker_cmvn_stats(0, count_col);
     if (cmvn_count > max_remembered_frames) {
       const BaseFloat cmvn_scale = max_remembered_frames / cmvn_count;
       cmvn_state.speaker_cmvn_stats.Scale(cmvn_scale);
     }
   }

   // The iVector stats were accumulated with posteriors scaled by
   // posterior_scale, so the target count has to be scaled the same way.
   const BaseFloat target_count = max_remembered_frames * posterior_scale;
   if (ivector_stats.Count() > target_count)
     ivector_stats.Scale(target_count / ivector_stats.Count());
 }

 // Serializes the adaptation state to 'os' (binary or text mode according to
 // 'binary'): an opening tag, the CMVN state, the iVector stats, and a
 // closing tag.  Read() expects exactly this layout.
 void OnlineIvectorExtractorAdaptationState::Write(std::ostream &os, bool binary) const {
   const char *open_tag = "<OnlineIvectorExtractorAdaptationState>";  // magic string.
   const char *close_tag = "</OnlineIvectorExtractorAdaptationState>";

   WriteToken(os, binary, open_tag);

   WriteToken(os, binary, "<CmvnState>");
   cmvn_state.Write(os, binary);

   WriteToken(os, binary, "<IvectorStats>");
   ivector_stats.Write(os, binary);

   WriteToken(os, binary, close_tag);
 }

 // Deserializes the adaptation state from 'is' (binary or text mode according
 // to 'binary').  The expected layout mirrors Write(): opening tag, CMVN
 // state, iVector stats, closing tag.
 void OnlineIvectorExtractorAdaptationState::Read(std::istream &is, bool binary) {
   const char *open_tag = "<OnlineIvectorExtractorAdaptationState>";  // magic string.
   const char *close_tag = "</OnlineIvectorExtractorAdaptationState>";

   ExpectToken(is, binary, open_tag);

   ExpectToken(is, binary, "<CmvnState>");
   cmvn_state.Read(is, binary);

   ExpectToken(is, binary, "<IvectorStats>");
   ivector_stats.Read(is, binary);

   ExpectToken(is, binary, close_tag);
 }

 // Returns the dimension of the output feature, which is the iVector
 // dimension reported by the extractor.
 int32 OnlineIvectorFeature::Dim() const {
   const int32 ivector_dim = info_.extractor.IvectorDim();
   return ivector_dim;
 }

 // Returns true if 'frame' is the last frame, as reported by the base
 // feature.
 bool OnlineIvectorFeature::IsLastFrame(int32 frame) const {
   // Asking lda_ might look more natural, since that is the feature the
   // iVector extractor consumes directly, but the answer would be the same:
   // the splicing component pads at the beginning and end, so it always
   // yields as many frames as its input.
   const bool is_last = base_->IsLastFrame(frame);
   return is_last;
 }

 // Returns the number of frames currently available, as reported by the
 // (un-normalized) LDA feature.
 int32 OnlineIvectorFeature::NumFramesReady() const {
   KALDI_ASSERT(lda_ != NULL);
   const int32 frames_ready = lda_->NumFramesReady();
   return frames_ready;
 }

 // Returns the frame shift in seconds, as reported by the (un-normalized)
 // LDA feature.
 BaseFloat OnlineIvectorFeature::FrameShiftInSeconds() const {
   const BaseFloat frame_shift = lda_->FrameShiftInSeconds();
   return frame_shift;
 }

 void OnlineIvectorFeature::UpdateFrameWeights(
     const std::vector<std::pair<int32, BaseFloat> > &delta_weights) {
   // add the elements to delta_weights_, which is a priority queue.  The top
   // element of the priority queue is the lowest numbered frame (we ensured this
   // by making the comparison object std::greater instead of std::less).  Adding
   // elements from top (lower-numbered frames) to bottom (higher-numbered
   // frames) should be most efficient, assuming it's a heap internally.  So we
   // go forward not backward in delta_weights while adding.
   for (size_t i = 0; i < delta_weights.size(); i++) {
     delta_weights_.push(delta_weights[i]);
     int32 frame = delta_weights[i].first;
     KALDI_ASSERT(frame >= 0);
     if (frame > most_recent_frame_with_weight_)
       most_recent_frame_with_weight_ = frame;
   }
   delta_weights_provided_ = true;
 }


 // Returns the posterior-pruning threshold to use for a frame with the given
 // weight: the configured min_post divided by |weight|, capped at 0.99.
 // A value of 0.99 has the same effect as keeping only the most probable
 // Gaussian on that frame.
 BaseFloat OnlineIvectorFeature::GetMinPost(BaseFloat weight) const {
   const BaseFloat abs_weight = fabs(weight);
   if (abs_weight == 0.0)
     return 0.99;   // Not expected to be reached.
   const BaseFloat scaled_min_post = info_.min_post / abs_weight;
   return (scaled_min_post > 0.99 ? 0.99 : scaled_min_post);
 }

 // Accumulates iVector statistics for a batch of weighted frames.
 //   frame_weights_in: (frame index, weight) pairs; entries for the same
 //       frame are merged (their weights summed) before use.
 // For each frame the UBM posteriors are computed on the CMVN-normalized LDA
 // features, pruned, and scaled by posterior_scale * weight; frames whose
 // weight is zero get an empty posterior.  tot_ubm_loglike_ is increased by
 // the weighted value returned by VectorToPosteriorEntry().  The features
 // passed to the extractor are either the un-normalized or the normalized
 // ones, depending on info_.online_cmvn_iextractor.
 void OnlineIvectorFeature::UpdateStatsForFrames(
     const std::vector<std::pair<int32, BaseFloat> > &frame_weights_in) {

   std::vector<std::pair<int32, BaseFloat> > frame_weights(frame_weights_in);
   // Remove duplicates of frames.
   MergePairVectorSumming(&frame_weights);

   if (frame_weights.empty())
     return;

   int32 num_frames = static_cast<int32>(frame_weights.size());
   int32 feat_dim = lda_normalized_->Dim();
   Matrix<BaseFloat> feats(num_frames, feat_dim, kUndefined),
       log_likes;

   std::vector<int32> frames;
   frames.reserve(frame_weights.size());
   for (int32 i = 0; i < num_frames; i++)
     frames.push_back(frame_weights[i].first);
   // The UBM is always evaluated on the CMVN-normalized features.
   lda_normalized_->GetFrames(frames, &feats);

   info_.diag_ubm.LogLikelihoods(feats, &log_likes);

   // "posteriors" stores, for each frame index in the range of frames, the
   // pruned posteriors for the Gaussians in the UBM.
   std::vector<std::vector<std::pair<int32, BaseFloat> > > posteriors(num_frames);
   for (int32 i = 0; i < num_frames; i++) {
     std::vector<std::pair<int32, BaseFloat> > &posterior = posteriors[i];
     BaseFloat weight = frame_weights[i].second;
     if (weight != 0.0) {
       tot_ubm_loglike_ += weight *
           VectorToPosteriorEntry(log_likes.Row(i), info_.num_gselect,
                                  GetMinPost(weight), &posterior);
       for (size_t j = 0; j < posterior.size(); j++)
         posterior[j].second *= info_.posterior_scale * weight;
     }
   }

   if (!info_.online_cmvn_iextractor) {
     // Default: the extractor sees the features without OnlineCmvn, so
     // replace the normalized features fetched above.
     lda_->GetFrames(frames, &feats);
   }
   // Otherwise 'feats' still holds the OnlineCmvn-normalized features that
   // were fetched above for the UBM, so they are not fetched a second time.
   ivector_stats_.AccStats(info_.extractor, feats, posteriors);
 }


 // Un-weighted update: accumulates statistics (each frame with weight 1.0)
 // for all frames from num_frames_stats_ up to and including 'frame', and
 // re-estimates the iVector at the appropriate frames.
 // Must not be called once delta weights have been provided.
 void OnlineIvectorFeature::UpdateStatsUntilFrame(int32 frame) {
   KALDI_ASSERT(frame >= 0 && frame < this->NumFramesReady() &&
                !delta_weights_provided_);
   updated_with_no_delta_weights_ = true;

   const int32 period = info_.ivector_period;
   const int32 cg_iters = info_.num_cg_iters;
   const bool most_recent_only = info_.use_most_recent_ivector;

   // Frames collected since the last batch was flushed to the statistics.
   std::vector<std::pair<int32, BaseFloat> > pending;

   while (num_frames_stats_ <= frame) {
     const int32 t = num_frames_stats_;
     pending.push_back(std::make_pair(t, static_cast<BaseFloat>(1.0)));

     // In "most recent" mode the iVector is estimated only once, at the last
     // requested frame; otherwise once per ivector_period frames.
     const bool estimate_now = (most_recent_only ? (t == frame)
                                                 : (t % period == 0));
     if (estimate_now) {
       // Flush all frames collected so far in a single batched call.
       UpdateStatsForFrames(pending);
       pending.clear();
       ivector_stats_.GetIvector(cg_iters, &current_ivector_);
       if (!most_recent_only) {  // the periodic iVectors must be cached.
         int32 ivec_index = t / period;
         KALDI_ASSERT(ivec_index == static_cast<int32>(ivectors_history_.size()));
         ivectors_history_.push_back(new Vector<BaseFloat>(current_ivector_));
       }
     }
     num_frames_stats_++;
   }
   // Frames after the last estimation point still contribute to the stats.
   if (!pending.empty())
     UpdateStatsForFrames(pending);
 }

 // Weighted update: consumes the queued delta weights for all frames up to
 // and including 'frame', accumulates the corresponding statistics, and
 // re-estimates the iVector at the appropriate frames.
 // Requires that delta weights have been provided (covering at least
 // 'frame') and that the un-weighted update has never been used.
 void OnlineIvectorFeature::UpdateStatsUntilFrameWeighted(int32 frame) {
   KALDI_ASSERT(frame >= 0 && frame < this->NumFramesReady() &&
                delta_weights_provided_ &&
                ! updated_with_no_delta_weights_ &&
                frame <= most_recent_frame_with_weight_);
   // Compile-time switch for tracking the net weight per frame.
   const bool debug_weights = false;

   const int32 period = info_.ivector_period;
   const int32 cg_iters = info_.num_cg_iters;
   const bool most_recent_only = info_.use_most_recent_ivector;

   // Weight changes collected since the last batch was flushed.
   std::vector<std::pair<int32, BaseFloat> > pending;
   pending.reserve(delta_weights_.size());

   while (num_frames_stats_ <= frame) {
     const int32 t = num_frames_stats_;
     // Rather than updating only frame t, take every queued change whose
     // frame index is <= t, in case older frames were reclassified as
     // silence/non-silence.
     while (!delta_weights_.empty() && delta_weights_.top().first <= t) {
       const std::pair<int32, BaseFloat> entry = delta_weights_.top();
       pending.push_back(entry);
       delta_weights_.pop();
       if (debug_weights) {
         const int32 weighted_frame = entry.first;
         if (current_frame_weight_debug_.size() <=
             static_cast<size_t>(weighted_frame))
           current_frame_weight_debug_.resize(weighted_frame + 1, 0.0);
         current_frame_weight_debug_[weighted_frame] += entry.second;
       }
     }

     const bool estimate_now = (most_recent_only ? (t == frame)
                                                 : (t % period == 0));
     if (estimate_now) {
       UpdateStatsForFrames(pending);
       pending.clear();
       ivector_stats_.GetIvector(cg_iters, &current_ivector_);
       if (!most_recent_only) {  // the periodic iVectors must be cached.
         int32 ivec_index = t / period;
         KALDI_ASSERT(ivec_index == static_cast<int32>(ivectors_history_.size()));
         ivectors_history_.push_back(new Vector<BaseFloat>(current_ivector_));
       }
     }
     num_frames_stats_++;
   }
   if (!pending.empty())
     UpdateStatsForFrames(pending);
 }


 // Writes the iVector feature for 'frame' into 'feat', whose dimension must
 // equal Dim().  The statistics are first brought up to date (up to 'frame',
 // or up to the last available frame in greedy mode).  The extractor's prior
 // offset is subtracted from the first element of the output so that it is
 // approximately zero-mean.
 void OnlineIvectorFeature::GetFrame(int32 frame,
                                     VectorBase<BaseFloat> *feat) {
   int32 frame_to_update_until = frame;
   if (info_.greedy_ivector_extractor)
     frame_to_update_until = lda_->NumFramesReady() - 1;

   if (delta_weights_provided_)
     UpdateStatsUntilFrameWeighted(frame_to_update_until);
   else  // No silence weighting.
     UpdateStatsUntilFrame(frame_to_update_until);

   KALDI_ASSERT(feat->Dim() == this->Dim());

   if (info_.use_most_recent_ivector) {
     KALDI_VLOG(5) << "due to --use-most-recent-ivector=true, using iVector "
                   << "from frame " << num_frames_stats_ << " for frame "
                   << frame;
     // Use the latest estimate, even if 'frame' lies well in the past.
     feat->CopyFromVec(current_ivector_);
   } else {
     int32 i = frame / info_.ivector_period;  // rounds down.
     // A failure here would indicate a bug in UpdateStatsUntilFrame.
     KALDI_ASSERT(static_cast<size_t>(i) <  ivectors_history_.size());
     feat->CopyFromVec(*(ivectors_history_[i]));
   }
   // Common to both modes: remove the prior mean from the first dimension.
   (*feat)(0) -= info_.extractor.PriorOffset();
 }

 void OnlineIvectorFeature::PrintDiagnostics() const {
   if (num_frames_stats_ == 0) {
     KALDI_VLOG(3) << "Processed no data.";
   } else {
     KALDI_VLOG(3) << "UBM log-likelihood was "
                   << (tot_ubm_loglike_ / NumFrames())
                   << " per frame, over " << NumFrames()
                   << " frames.";

     Vector<BaseFloat> temp_ivector(current_ivector_);
     temp_ivector(0) -= info_.extractor.PriorOffset();

     KALDI_VLOG(2) << "By the end of the utterance, objf change/frame "
                   << "from estimating iVector (vs. default) was "
                   << ivector_stats_.ObjfChange(current_ivector_)
                   << " and iVector length was "
                   << temp_ivector.Norm(2.0);
   }
 }

 // Destructor: prints diagnostics, then frees the feature-pipeline objects
 // and the cached iVectors that this object allocated.
 OnlineIvectorFeature::~OnlineIvectorFeature() {
   PrintDiagnostics();

   // Pipeline objects, freed in the order in which they were registered.
   const size_t num_owned = to_delete_.size();
   for (size_t n = 0; n != num_owned; ++n)
     delete to_delete_[n];

   // Cached periodic iVectors.
   const size_t num_cached = ivectors_history_.size();
   for (size_t n = 0; n != num_cached; ++n)
     delete ivectors_history_[n];
 }

 // Exports the current adaptation state (CMVN state plus iVector stats) into
 // '*adaptation_state', limiting the stored statistics to
 // info_.max_remembered_frames frames.
 void OnlineIvectorFeature::GetAdaptationState(
     OnlineIvectorExtractorAdaptationState *adaptation_state) const {
   // This also works when cmvn_->NumFramesReady() == 0: the call then returns
   // the unmodified adaptation state that cmvn_ was initialized with.
   const int32 last_cmvn_frame = cmvn_->NumFramesReady() - 1;
   cmvn_->GetState(last_cmvn_frame, &(adaptation_state->cmvn_state));

   adaptation_state->ivector_stats = ivector_stats_;

   adaptation_state->LimitFrames(info_.max_remembered_frames,
                                 info_.posterior_scale);
 }


 // Constructor.
 //   info: models and options for iVector extraction; validated with Check().
 //   base_feature: the input feature; must not be NULL.
 // Builds two processing chains on top of base_feature, both ending in a
 // cache: splice -> LDA (un-normalized, lda_) and
 // CMVN -> splice -> LDA (normalized, lda_normalized_).  Every object
 // allocated here is registered in to_delete_.
 OnlineIvectorFeature::OnlineIvectorFeature(
     const OnlineIvectorExtractionInfo &info,
     OnlineFeatureInterface *base_feature):
     info_(info),
     base_(base_feature),
     ivector_stats_(info_.extractor.IvectorDim(),
                    info_.extractor.PriorOffset(),
                    info_.max_count),
     num_frames_stats_(0), delta_weights_provided_(false),
     updated_with_no_delta_weights_(false),
     most_recent_frame_with_weight_(-1), tot_ubm_loglike_(0.0) {
   info.Check();
   KALDI_ASSERT(base_feature != NULL);

   // Un-normalized chain: base -> splice -> LDA -> cache.
   OnlineFeatureInterface *raw_splice =
       new OnlineSpliceFrames(info_.splice_opts, base_feature);
   to_delete_.push_back(raw_splice);
   OnlineFeatureInterface *raw_lda =
       new OnlineTransform(info.lda_mat, raw_splice);
   to_delete_.push_back(raw_lda);
   OnlineFeatureInterface *raw_cache = new OnlineCacheFeature(raw_lda);
   lda_ = raw_cache;
   to_delete_.push_back(raw_cache);

   // At construction time the CMVN state knows nothing about the speaker.
   // More specific adaptation state can be supplied afterwards through
   // this->SetAdaptationState(), most likely obtained from
   // GetAdaptationState() on a previous object of this type.
   OnlineCmvnState naive_cmvn_state(info.global_cmvn_stats);
   cmvn_ = new OnlineCmvn(info.cmvn_opts, naive_cmvn_state, base_feature);
   to_delete_.push_back(cmvn_);

   // Normalized chain: CMVN -> splice -> LDA -> cache.
   OnlineFeatureInterface *norm_splice =
       new OnlineSpliceFrames(info_.splice_opts, cmvn_);
   OnlineFeatureInterface *norm_lda =
       new OnlineTransform(info.lda_mat, norm_splice);
   OnlineFeatureInterface *norm_cache = new OnlineCacheFeature(norm_lda);
   lda_normalized_ = norm_cache;

   to_delete_.push_back(norm_splice);
   to_delete_.push_back(norm_lda);
   to_delete_.push_back(norm_cache);

   // Start from the default iVector, [ prior_offset, 0, 0, ... ].
   current_ivector_.Resize(info_.extractor.IvectorDim());
   current_ivector_(0) = info_.extractor.PriorOffset();
 }

 void OnlineIvectorFeature::SetAdaptationState(
     const OnlineIvectorExtractorAdaptationState &adaptation_state) {
   KALDI_ASSERT(num_frames_stats_ == 0 &&
                "SetAdaptationState called after frames were processed.");
   KALDI_ASSERT(ivector_stats_.IvectorDim() ==
                adaptation_state.ivector_stats.IvectorDim());
   ivector_stats_ = adaptation_state.ivector_stats;
   cmvn_->SetState(adaptation_state.cmvn_state);
 }

 // Returns the accumulated UBM log-likelihood divided by NumFrames(), or
 // zero if NumFrames() is zero.
 BaseFloat OnlineIvectorFeature::UbmLogLikePerFrame() const {
   if (NumFrames() == 0)
     return 0;
   return tot_ubm_loglike_ / NumFrames();
 }

 // Returns the objective-function change that the iVector statistics report
 // for the current iVector estimate.
 BaseFloat OnlineIvectorFeature::ObjfImprPerFrame() const {
   const BaseFloat objf_change = ivector_stats_.ObjfChange(current_ivector_);
   return objf_change;
 }


 // Constructor.
 //   trans_model: transition model, used later to map transition-ids to
 //       phones.
 //   config: silence-weighting options; config.silence_phones_str is parsed
 //       here as a list of integers separated by ':' or ','.
 //   frame_subsampling_factor: must be >= 1.
 // If the silence-phones string cannot be parsed, a warning is printed and
 // whatever values the parser left in its output are still used, which is
 // what happened (silently) before the warning was added.
 OnlineSilenceWeighting::OnlineSilenceWeighting(
     const TransitionModel &trans_model,
     const OnlineSilenceWeightingConfig &config,
     int32 frame_subsampling_factor):
     trans_model_(trans_model), config_(config),
     frame_subsampling_factor_(frame_subsampling_factor),
     num_frames_output_and_correct_(0) {
   KALDI_ASSERT(frame_subsampling_factor_ >= 1);
   std::vector<int32> silence_phones;
   if (!SplitStringToIntegers(config.silence_phones_str, ":,", false,
                              &silence_phones)) {
     // Do not let a malformed list go unnoticed: the resulting phone set
     // would silently differ from what the user intended.
     KALDI_WARN << "Could not parse silence phones string '"
                << config.silence_phones_str
                << "' as a list of integers separated by ':' or ','; "
                << "silence weighting may not behave as intended.";
   }
   for (size_t i = 0; i < silence_phones.size(); i++)
     silence_phones_.insert(silence_phones[i]);
 }


 template <typename FST>
 void OnlineSilenceWeighting::ComputeCurrentTraceback(
     const LatticeFasterOnlineDecoderTpl<FST> &decoder) {
   int32 num_frames_decoded = decoder.NumFramesDecoded(),
       num_frames_prev = frame_info_.size();
   // note, num_frames_prev is not the number of frames previously decoded,
   // it's the generally-larger number of frames that we were requested to
   // provide weights for.
   if (num_frames_prev < num_frames_decoded)
     frame_info_.resize(num_frames_decoded);
   if (num_frames_prev > num_frames_decoded &&
       frame_info_[num_frames_decoded].transition_id != -1)
     KALDI_ERR << "Number of frames decoded decreased";  // Likely bug

   if (num_frames_decoded == 0)
     return;
   int32 frame = num_frames_decoded - 1;
   bool use_final_probs = false;
   typename LatticeFasterOnlineDecoderTpl<FST>::BestPathIterator iter =
       decoder.BestPathEnd(use_final_probs, NULL);
   while (frame >= 0) {
     LatticeArc arc;
     arc.ilabel = 0;
     while (arc.ilabel == 0)  // the while loop skips over input-epsilons
       iter = decoder.TraceBackBestPath(iter, &arc);
     // note, the iter.frame values are slightly unintuitively defined,
     // they are one less than you might expect.
     KALDI_ASSERT(iter.frame == frame - 1);

     if (frame_info_[frame].token == iter.tok) {
       // we know that the traceback from this point back will be identical, so
       // no point tracing back further.  Note: we are comparing memory addresses
       // of tokens of the decoder; this guarantees it's the same exact token
       // because tokens, once allocated on a frame, are only deleted, never
       // reallocated for that frame.
       break;
     }

     if (num_frames_output_and_correct_ > frame)
       num_frames_output_and_correct_ = frame;

     frame_info_[frame].token = iter.tok;
     frame_info_[frame].transition_id = arc.ilabel;
     frame--;
     // leave frame_info_.current_weight at zero for now (as set in the
     // constructor), reflecting that we haven't already output a weight for that
     // frame.
   }
 }

 template <typename FST>
 void OnlineSilenceWeighting::ComputeCurrentTraceback(
     const LatticeIncrementalOnlineDecoderTpl<FST> &decoder) {
   int32 num_frames_decoded = decoder.NumFramesDecoded(),
       num_frames_prev = frame_info_.size();
   // note, num_frames_prev is not the number of frames previously decoded,
   // it's the generally-larger number of frames that we were requested to
   // provide weights for.
   if (num_frames_prev < num_frames_decoded)
     frame_info_.resize(num_frames_decoded);
   if (num_frames_prev > num_frames_decoded &&
       frame_info_[num_frames_decoded].transition_id != -1)
     KALDI_ERR << "Number of frames decoded decreased";  // Likely bug

   if (num_frames_decoded == 0)
     return;
   int32 frame = num_frames_decoded - 1;
   bool use_final_probs = false;
   typename LatticeIncrementalOnlineDecoderTpl<FST>::BestPathIterator iter =
       decoder.BestPathEnd(use_final_probs, NULL);
   while (frame >= 0) {
     LatticeArc arc;
     arc.ilabel = 0;
     while (arc.ilabel == 0)  // the while loop skips over input-epsilons
       iter = decoder.TraceBackBestPath(iter, &arc);
     // note, the iter.frame values are slightly unintuitively defined,
     // they are one less than you might expect.
     KALDI_ASSERT(iter.frame == frame - 1);

     if (frame_info_[frame].token == iter.tok) {
       // we know that the traceback from this point back will be identical, so
       // no point tracing back further.  Note: we are comparing memory addresses
       // of tokens of the decoder; this guarantees it's the same exact token,
       // because tokens, once allocated on a frame, are only deleted, never
       // reallocated for that frame.
       break;
     }

     if (num_frames_output_and_correct_ > frame)
       num_frames_output_and_correct_ = frame;

     frame_info_[frame].token = iter.tok;
     frame_info_[frame].transition_id = arc.ilabel;
     frame--;
     // leave frame_info_.current_weight at zero for now (as set in the
     // constructor), reflecting that we haven't already output a weight for that
     // frame.
   }
 }


 // Explicitly instantiate the member template
 // OnlineSilenceWeighting::ComputeCurrentTraceback() for each supported
 // combination of decoder class (LatticeFasterOnlineDecoderTpl,
 // LatticeIncrementalOnlineDecoderTpl) and FST type (fst::Fst<fst::StdArc>,
 // fst::GrammarFst).  The template definitions live in this .cc file, so
 // these are the instantiations this file provides.
 template
 void OnlineSilenceWeighting::ComputeCurrentTraceback<fst::Fst<fst::StdArc> >(
     const LatticeFasterOnlineDecoderTpl<fst::Fst<fst::StdArc> > &decoder);
 template
 void OnlineSilenceWeighting::ComputeCurrentTraceback<fst::GrammarFst>(
     const LatticeFasterOnlineDecoderTpl<fst::GrammarFst> &decoder);
 template
 void OnlineSilenceWeighting::ComputeCurrentTraceback<fst::Fst<fst::StdArc> >(
     const LatticeIncrementalOnlineDecoderTpl<fst::Fst<fst::StdArc> > &decoder);
 template
 void OnlineSilenceWeighting::ComputeCurrentTraceback<fst::GrammarFst>(
     const LatticeIncrementalOnlineDecoderTpl<fst::GrammarFst> &decoder);


 // Computes the changes in per-frame weights implied by the most recent
 // traceback stored in frame_info_.
 //   num_frames_ready: number of frames available, at the feature frame
 //       rate; must be greater than first_decoder_frame, or zero.
 //   first_decoder_frame: offset added to the output frame indexes and
 //       subtracted from num_frames_ready when converting to the decoder
 //       frame rate.
 //   delta_weights: output; cleared, then filled with (input frame index,
 //       change in weight) pairs.  Each decoder frame expands to
 //       frame_subsampling_factor_ consecutive input frames.
 // Silence frames, and runs of a repeated transition-id that are at least
 // max_state_duration long (if that option is > 0), get the silence weight;
 // other frames get weight 1.0.  frame_info_[...].current_weight is updated
 // to the newly assigned weights.
 void OnlineSilenceWeighting::GetDeltaWeights(
     int32 num_frames_ready, int32 first_decoder_frame,
     std::vector<std::pair<int32, BaseFloat> > *delta_weights) {
   // num_frames_ready is at the feature frame-rate, most of the code
   // in this function is at the decoder frame-rate.
   // round up, so we are sure to get weights for at least the frame
   // 'num_frames_ready - 1', and maybe one or two frames afterward.
   KALDI_ASSERT(num_frames_ready > first_decoder_frame || num_frames_ready == 0);
   int32 fs = frame_subsampling_factor_,
       num_decoder_frames_ready = (num_frames_ready - first_decoder_frame + fs - 1) / fs;
   // The assertion above permits num_frames_ready == 0 together with a
   // positive first_decoder_frame, in which case the expression above can be
   // negative.  Clamp it, since it is converted to size_t below and a
   // negative value would turn into a request for an enormous resize.
   if (num_decoder_frames_ready < 0)
     num_decoder_frames_ready = 0;

   const int32 max_state_duration = config_.max_state_duration;
   const BaseFloat silence_weight = config_.silence_weight;

   delta_weights->clear();

   int32 prev_num_frames_processed = frame_info_.size();
   if (frame_info_.size() < static_cast<size_t>(num_decoder_frames_ready))
     frame_info_.resize(num_decoder_frames_ready);

   // When modifying weights according to the traceback, don't go further
   // back into the past than 100 frames before the end of the previously
   // processed frames.
   // C.f. the value 200 in template
   // OnlineGenericBaseFeature<C>::OnlineGenericBaseFeature in online-feature.cc,
   // which needs to be more than this value of 100 plus the amount of context
   // that LDA might use plus the chunk size we're likely to decode in one time.
   // The user can always increase the value of --max-feature-vectors in case one
   // of these conditions is broken.  Search for ONLINE_IVECTOR_LIMIT in
   // online-feature.cc
   int32 begin_frame = std::max<int32>(0, prev_num_frames_processed - 100),
       frames_out = static_cast<int32>(frame_info_.size()) - begin_frame;
   // frames_out is the number of frames we will output.
   KALDI_ASSERT(frames_out >= 0);
   std::vector<BaseFloat> frame_weight(frames_out, 1.0);
   // we will set frame_weight to the value silence_weight for silence frames and
   // for transition-ids that repeat with duration >= max_state_duration.  Frames
   // newer than the most recent traceback will get a weight equal to the weight
   // for the most recent frame in the traceback; or the silence weight, if there
   // is no traceback at all available yet.

   // First treat some special cases.
   if (frames_out == 0)  // Nothing to output.
     return;
   if (frame_info_[begin_frame].transition_id == -1) {
     // We do not have any traceback at all within the frames we are to output...
     // find the most recent weight that we output and apply the same weight to
     // all the new output; or output the silence weight, if nothing was output.
     BaseFloat weight = (begin_frame == 0 ? silence_weight :
                         frame_info_[begin_frame - 1].current_weight);
     for (int32 offset = 0; offset < frames_out; offset++)
       frame_weight[offset] = weight;
   } else {
     int32 current_run_start_offset = 0;
     for (int32 offset = 0; offset < frames_out; offset++) {
       int32 frame = begin_frame + offset;
       int32 transition_id = frame_info_[frame].transition_id;
       if (transition_id == -1) {
         // this frame does not yet have a decoder traceback, so just
         // duplicate the silence/non-silence status of the most recent
         // frame we have a traceback for (probably a reasonable guess).
         // Note: offset is at least 1 here, because in this branch the
         // frame at offset 0 is known to have a traceback.
         frame_weight[offset] = frame_weight[offset - 1];
       } else {
         int32 phone = trans_model_.TransitionIdToPhone(transition_id);
         bool is_silence = (silence_phones_.count(phone) != 0);
         if (is_silence)
           frame_weight[offset] = silence_weight;
         // now deal with max-duration issues.
         if (max_state_duration > 0 &&
             (offset + 1 == frames_out ||
              transition_id != frame_info_[frame + 1].transition_id)) {
           // If this is the last frame of a run...
           int32 run_length = offset - current_run_start_offset + 1;
           if (run_length >= max_state_duration) {
             // treat runs of the same transition-id at least as long as the
             // max, as silence, even if they were not silence.
             for (int32 offset2 = current_run_start_offset;
                  offset2 <= offset; offset2++)
               frame_weight[offset2] = silence_weight;
           }
           if (offset + 1 < frames_out)
             current_run_start_offset = offset + 1;
         }
       }
     }
   }
   // Now commit the stats...
   for (int32 offset = 0; offset < frames_out; offset++) {
     int32 frame = begin_frame + offset;
     BaseFloat old_weight = frame_info_[frame].current_weight,
         new_weight = frame_weight[offset],
         weight_diff = new_weight - old_weight;
     frame_info_[frame].current_weight = new_weight;
     // Even if the delta-weight is zero for the last frame, we provide it,
     // because the identity of the most recent frame with a weight is used in
     // some debugging/checking code.
     if (weight_diff != 0.0 || offset + 1 == frames_out) {
       KALDI_VLOG(6) << "Weight for frame " << frame << " changing from "
                     << old_weight << " to " << new_weight;
       // Expand the decoder frame to the input frames it covers.
       for(int32 i = 0; i < frame_subsampling_factor_; i++) {
         int32 input_frame = first_decoder_frame + (frame * frame_subsampling_factor_) + i;
         delta_weights->push_back(std::make_pair(input_frame, weight_diff));
       }
     }
   }
 }

 }  // namespace kaldi
kaldi::OnlineIvectorExtractionConfig::max_remembered_frames
BaseFloat max_remembered_frames
Definition: online-ivector-feature.h:103

kaldi
This code computes Goodness of Pronunciation (GOP) and extracts phone-level pronunciation feature for...
Definition: chain.dox:20

kaldi::OnlineIvectorFeature::NumFrames
BaseFloat NumFrames() const
Definition: online-ivector-feature.h:307

kaldi::DiagGmm::Dim
int32 Dim() const
Returns the dimensionality of the Gaussian mean vectors.
Definition: diag-gmm.h:74

kaldi::OnlineIvectorExtractionConfig::cmvn_config_rxfilename
std::string cmvn_config_rxfilename
Definition: online-ivector-feature.h:60

kaldi::OnlineIvectorExtractionInfo::num_cg_iters
int32 num_cg_iters
Definition: online-ivector-feature.h:188

kaldi::IvectorExtractor::FeatDim
int32 FeatDim() const
Definition: ivector-extractor.cc:28

kaldi::OnlineIvectorEstimationStats::ObjfChange
double ObjfChange(const VectorBase< double > &ivector) const
ObjfChange returns the change in objective function *per frame* from using the default value [ prior_...
Definition: ivector-extractor.cc:758

kaldi::ReadConfigFromFile
void ReadConfigFromFile(const std::string &config_filename, C *c)
This template is provided for convenience in reading config classes from files; this is not the stand...
Definition: parse-options.h:237

kaldi::LatticeArc
fst::ArcTpl< LatticeWeight > LatticeArc
Definition: kaldi-lattice.h:40

kaldi::OnlineIvectorFeature::OnlineIvectorFeature
OnlineIvectorFeature(const OnlineIvectorExtractionInfo &info, OnlineFeatureInterface *base_feature)
Constructor.
Definition: online-ivector-feature.cc:399

kaldi::OnlineIvectorExtractionConfig::min_post
BaseFloat min_post
Definition: online-ivector-feature.h:72

kaldi::kUndefined
Definition: matrix-common.h:39

kaldi::OnlineIvectorFeature::ObjfImprPerFrame
BaseFloat ObjfImprPerFrame() const
Definition: online-ivector-feature.cc:460

kaldi::IvectorExtractor::PriorOffset
double PriorOffset() const
The distribution over iVectors, in our formulation, is not centered at zero; its first dimension has ...
Definition: ivector-extractor.h:159

kaldi::OnlineIvectorExtractionInfo::min_post
BaseFloat min_post
Definition: online-ivector-feature.h:185

kaldi::OnlineCmvnState::speaker_cmvn_stats
Matrix< double > speaker_cmvn_stats
Definition: online-feature.h:269

rnnlm::j
int j
Definition: mikolov-rnnlm-lib.cc:66

kaldi::OnlineIvectorExtractionInfo
This struct contains various things that are needed (as const references) by class OnlineIvectorExtra...
Definition: online-ivector-feature.h:168

kaldi::OnlineIvectorExtractionInfo::OnlineIvectorExtractionInfo
OnlineIvectorExtractionInfo()
Definition: online-ivector-feature.cc:99

kaldi::OnlineIvectorFeature::current_ivector_
Vector< double > current_ivector_
Most recently estimated iVector, will have been estimated at the greatest time t where t <= num_frame...
Definition: online-ivector-feature.h:404

kaldi::OnlineIvectorExtractionInfo::cmvn_opts
OnlineCmvnOptions cmvn_opts
Definition: online-ivector-feature.h:173

kaldi::OnlineCmvnState::Write
void Write(std::ostream &os, bool binary) const
Definition: online-feature.cc:216

kaldi::OnlineIvectorExtractorAdaptationState::cmvn_state
OnlineCmvnState cmvn_state
Definition: online-ivector-feature.h:217

kaldi::LatticeFasterOnlineDecoderTpl::BestPathIterator::frame
int32 frame
Definition: lattice-faster-online-decoder.h:80

kaldi::OnlineIvectorExtractionInfo::extractor
IvectorExtractor extractor
Definition: online-ivector-feature.h:179

kaldi::MatrixBase::NumCols
MatrixIndexT NumCols() const
Returns number of columns (or zero for empty matrix).
Definition: kaldi-matrix.h:67

kaldi::LatticeIncrementalOnlineDecoderTpl
LatticeIncrementalOnlineDecoderTpl is as LatticeIncrementalDecoderTpl but also supports an efficient ...
Definition: lattice-incremental-online-decoder.h:51

kaldi::LatticeFasterOnlineDecoderTpl::BestPathIterator
Definition: lattice-faster-online-decoder.h:78

kaldi::SplitStringToIntegers
bool SplitStringToIntegers(const std::string &full, const char *delim, bool omit_empty_strings, std::vector< I > *out)
Split a string on the given delimiters into a vector of integers.
Definition: text-utils.h:68

kaldi::OnlineIvectorExtractorAdaptationState::OnlineIvectorExtractorAdaptationState
OnlineIvectorExtractorAdaptationState(const OnlineIvectorExtractionInfo &info)
This constructor initializes adaptation-state with no prior speaker history.
Definition: online-ivector-feature.h:223

kaldi::OnlineCmvn
This class does an online version of the cepstral mean and [optionally] variance, but note that this ...
Definition: online-feature.h:321

kaldi::OnlineIvectorFeature::cmvn_
OnlineCmvn * cmvn_
Definition: online-ivector-feature.h:356

kaldi::OnlineIvectorExtractorAdaptationState
This class stores the adaptation state from the online iVector extractor, which can help you to initi...
Definition: online-ivector-feature.h:211

kaldi::VectorToPosteriorEntry
BaseFloat VectorToPosteriorEntry(const VectorBase< BaseFloat > &log_likes, int32 num_gselect, BaseFloat min_post, std::vector< std::pair< int32, BaseFloat > > *post_entry)
Given a vector of log-likelihoods (typically of Gaussians in a GMM but could be of pdf-ids)...
Definition: posterior.cc:440

kaldi::OnlineIvectorFeature::UbmLogLikePerFrame
BaseFloat UbmLogLikePerFrame() const
Definition: online-ivector-feature.cc:455

kaldi::OnlineSilenceWeightingConfig
Definition: online-ivector-feature.h:416

kaldi::OnlineIvectorFeature::PrintDiagnostics
void PrintDiagnostics() const
Definition: online-ivector-feature.cc:357

kaldi::OnlineIvectorFeature::GetAdaptationState
void GetAdaptationState(OnlineIvectorExtractorAdaptationState *adaptation_state) const
Get the adaptation state; you may want to call this before destroying this object, to get adaptation state that can be used to improve decoding of later utterances of this speaker.
Definition: online-ivector-feature.cc:386

kaldi::OnlineIvectorExtractionInfo::ivector_period
int32 ivector_period
Definition: online-ivector-feature.h:183

kaldi::OnlineCmvnState::frozen_state
Matrix< double > frozen_state
Definition: online-feature.h:279

kaldi::OnlineIvectorEstimationStats::Read
void Read(std::istream &is, bool binary)
Definition: ivector-extractor.cc:710

kaldi::int32
kaldi::int32 int32
Definition: online-tcp-source.cc:27

kaldi::Matrix< BaseFloat >

kaldi::OnlineIvectorFeature::Dim
virtual int32 Dim() const
Dim() will return the iVector dimension.
Definition: online-ivector-feature.cc:147

kaldi::LatticeIncrementalOnlineDecoderTpl::BestPathEnd
BestPathIterator BestPathEnd(bool use_final_probs, BaseFloat *final_cost=NULL) const
This function returns an iterator that can be used to trace back the best path.
Definition: lattice-incremental-online-decoder.cc:54

kaldi::OnlineIvectorFeature::IsLastFrame
virtual bool IsLastFrame(int32 frame) const
Returns true if this is the last frame.
Definition: online-ivector-feature.cc:151

kaldi::Vector::Resize
void Resize(MatrixIndexT length, MatrixResizeType resize_type=kSetZero)
Set vector to a specified size (can be zero).
Definition: kaldi-vector.cc:190

kaldi::OnlineSpliceFrames
Definition: online-feature.h:458

kaldi::OnlineIvectorFeature::~OnlineIvectorFeature
virtual ~OnlineIvectorFeature()
Definition: online-ivector-feature.cc:377

kaldi::OnlineSpliceOptions::right_context
int32 right_context
Definition: online-feature.h:448

kaldi::OnlineIvectorFeature::UpdateStatsForFrames
void UpdateStatsForFrames(const std::vector< std::pair< int32, BaseFloat > > &frame_weights)
Definition: online-ivector-feature.cc:201

kaldi::OnlineIvectorExtractorAdaptationState::Read
void Read(std::istream &is, bool binary)
Definition: online-ivector-feature.cc:138

kaldi::OnlineIvectorExtractionConfig::global_cmvn_stats_rxfilename
std::string global_cmvn_stats_rxfilename
Definition: online-ivector-feature.h:57

kaldi::OnlineIvectorExtractionInfo::lda_mat
Matrix< BaseFloat > lda_mat
Definition: online-ivector-feature.h:170

kaldi::OnlineIvectorFeature::num_frames_stats_
int32 num_frames_stats_
num_frames_stats_ is the number of frames of data we have already accumulated from this utterance and...
Definition: online-ivector-feature.h:372

kaldi::VectorBase::Norm
Real Norm(Real p) const
Compute the p-th norm of the vector.
Definition: kaldi-vector.cc:512

kaldi::OnlineIvectorExtractionConfig::max_count
BaseFloat max_count
Definition: online-ivector-feature.h:77

kaldi::OnlineIvectorExtractionInfo::diag_ubm
DiagGmm diag_ubm
Definition: online-ivector-feature.h:178

kaldi::TransitionModel
Definition: transition-model.h:123

kaldi::ReadKaldiObject
void ReadKaldiObject(const std::string &filename, Matrix< float > *m)
Definition: kaldi-io.cc:832

kaldi::OnlineIvectorExtractionConfig::online_cmvn_iextractor
bool online_cmvn_iextractor
Definition: online-ivector-feature.h:61

kaldi::OnlineIvectorExtractionConfig::num_gselect
int32 num_gselect
Definition: online-ivector-feature.h:70

kaldi::OnlineIvectorFeature::SetAdaptationState
void SetAdaptationState(const OnlineIvectorExtractorAdaptationState &adaptation_state)
Set the adaptation state to a particular value.
Definition: online-ivector-feature.cc:445

kaldi::OnlineIvectorEstimationStats::IvectorDim
int32 IvectorDim() const
Definition: ivector-extractor.h:337

kaldi::OnlineIvectorFeature::tot_ubm_loglike_
double tot_ubm_loglike_
The following is only needed for diagnostics.
Definition: online-ivector-feature.h:399

kaldi::OnlineIvectorFeature::lda_normalized_
OnlineFeatureInterface * lda_normalized_
Definition: online-ivector-feature.h:357

kaldi::OnlineIvectorExtractionInfo::num_gselect
int32 num_gselect
Definition: online-ivector-feature.h:184

kaldi::OnlineIvectorExtractionInfo::splice_opts
OnlineSpliceOptions splice_opts
Definition: online-ivector-feature.h:175

kaldi::VectorBase::CopyFromVec
void CopyFromVec(const VectorBase< Real > &v)
Copy data from another vector (must match own size).
Definition: kaldi-vector.cc:228

count
const size_t count
Definition: arpa-file-parser-test.cc:66

kaldi::IvectorExtractor::IvectorDim
int32 IvectorDim() const
Definition: ivector-extractor.cc:33

kaldi::OnlineIvectorExtractorAdaptationState::Write
void Write(std::ostream &os, bool binary) const
Definition: online-ivector-feature.cc:129

kaldi::OnlineIvectorFeature::ivector_stats_
OnlineIvectorEstimationStats ivector_stats_
the iVector estimation stats
Definition: online-ivector-feature.h:364

kaldi::OnlineSilenceWeighting::ComputeCurrentTraceback
void ComputeCurrentTraceback(const LatticeFasterOnlineDecoderTpl< FST > &decoder)
Definition: online-ivector-feature.cc:482

kaldi::OnlineCmvnState::Read
void Read(std::istream &is, bool binary)
Definition: online-feature.cc:227

kaldi::OnlineIvectorExtractorAdaptationState::ivector_stats
OnlineIvectorEstimationStats ivector_stats
Stats for online iVector estimation.
Definition: online-ivector-feature.h:220

kaldi::MatrixBase::Row
const SubVector< Real > Row(MatrixIndexT i) const
Return specific row of matrix [const].
Definition: kaldi-matrix.h:188

float

kaldi::OnlineSilenceWeighting::config_
const OnlineSilenceWeightingConfig & config_
Definition: online-ivector-feature.h:527

kaldi::MatrixBase::Scale
void Scale(Real alpha)
Multiply each element with a scalar value.
Definition: kaldi-matrix.cc:1209

kaldi::LatticeFasterDecoderTpl< FST, decoder::BackpointerToken >::NumFramesDecoded
int32 NumFramesDecoded() const
Definition: lattice-faster-decoder.h:340

kaldi::ExpectToken
void ExpectToken(std::istream &is, bool binary, const char *token)
ExpectToken tries to read in the given token, and throws an exception on failure. ...
Definition: io-funcs.cc:191

kaldi::OnlineCmvn::SetState
void SetState(const OnlineCmvnState &cmvn_state)
Definition: online-feature.cc:489

kaldi::OnlineIvectorExtractionConfig::num_cg_iters
int32 num_cg_iters
Definition: online-ivector-feature.h:83

kaldi::OnlineIvectorExtractorAdaptationState::LimitFrames
void LimitFrames(BaseFloat max_remembered_frames, BaseFloat posterior_scale)
Scales down the stats if needed to ensure the number of frames in the speaker-specific CMVN stats doe...
Definition: online-ivector-feature.cc:109

kaldi::OnlineIvectorFeature::GetMinPost
BaseFloat GetMinPost(BaseFloat weight) const
Definition: online-ivector-feature.cc:188

kaldi::OnlineIvectorExtractionConfig::posterior_scale
BaseFloat posterior_scale
Definition: online-ivector-feature.h:74

kaldi::OnlineCmvnState
Struct OnlineCmvnState stores the state of CMVN adaptation between utterances (but not the state of t...
Definition: online-feature.h:266

kaldi::OnlineIvectorEstimationStats::Write
void Write(std::ostream &os, bool binary) const
Definition: ivector-extractor.cc:695

kaldi::OnlineIvectorExtractionConfig::diag_ubm_rxfilename
std::string diag_ubm_rxfilename
Definition: online-ivector-feature.h:63

kaldi::OnlineIvectorExtractionConfig::use_most_recent_ivector
bool use_most_recent_ivector
Definition: online-ivector-feature.h:91

kaldi::OnlineIvectorExtractionInfo::max_remembered_frames
BaseFloat max_remembered_frames
Definition: online-ivector-feature.h:191

KALDI_ERR
#define KALDI_ERR
Definition: kaldi-error.h:147

kaldi::OnlineTransform
This online-feature class implements any affine or linear transform.
Definition: online-feature.h:493

kaldi::NumFrames
int32 NumFrames(int64 num_samples, const FrameExtractionOptions &opts, bool flush)
This function returns the number of frames that we can extract from a wave file with the given number...
Definition: feature-window.cc:42

kaldi::OnlineIvectorExtractionConfig::ivector_extractor_rxfilename
std::string ivector_extractor_rxfilename
Definition: online-ivector-feature.h:64

KALDI_WARN
#define KALDI_WARN
Definition: kaldi-error.h:150

kaldi::LatticeIncrementalOnlineDecoderTpl::BestPathIterator::tok
void * tok
Definition: lattice-incremental-online-decoder.h:78

kaldi::OnlineIvectorExtractionInfo::Init
void Init(const OnlineIvectorExtractionConfig &config)
Definition: online-ivector-feature.cc:29

kaldi::OnlineIvectorExtractionConfig::greedy_ivector_extractor
bool greedy_ivector_extractor
Definition: online-ivector-feature.h:94

kaldi::WriteToken
void WriteToken(std::ostream &os, bool binary, const char *token)
The WriteToken functions are for writing nonempty sequences of non-space characters.
Definition: io-funcs.cc:134

kaldi::OnlineIvectorFeature::info_
const OnlineIvectorExtractionInfo & info_
Definition: online-ivector-feature.h:350

kaldi::VectorBase::Dim
MatrixIndexT Dim() const
Returns the dimension of the vector.
Definition: kaldi-vector.h:64

kaldi::OnlineIvectorEstimationStats::Count
double Count() const
Definition: ivector-extractor.h:365

kaldi::LatticeFasterOnlineDecoderTpl
LatticeFasterOnlineDecoderTpl is as LatticeFasterDecoderTpl but also supports an efficient way to get...
Definition: lattice-faster-online-decoder.h:54

online-ivector-feature.h
This file contains code for online iVector extraction in a form compatible with OnlineFeatureInterfac...

kaldi::LatticeFasterOnlineDecoderTpl::TraceBackBestPath
BestPathIterator TraceBackBestPath(BestPathIterator iter, LatticeArc *arc) const
This function can be used in conjunction with BestPathEnd() to trace back the best path one link at a...
Definition: lattice-faster-online-decoder.cc:132

kaldi::LatticeFasterOnlineDecoderTpl::BestPathIterator::tok
void * tok
Definition: lattice-faster-online-decoder.h:79

kaldi::OnlineIvectorFeature::UpdateStatsUntilFrame
void UpdateStatsUntilFrame(int32 frame)
Definition: online-ivector-feature.cc:248

kaldi::OnlineIvectorExtractionInfo::ExpectedFeatureDim
int32 ExpectedFeatureDim() const
Definition: online-ivector-feature.cc:70

kaldi::OnlineSpliceOptions::left_context
int32 left_context
Definition: online-feature.h:447

kaldi::OnlineSilenceWeightingConfig::silence_phones_str
std::string silence_phones_str
Definition: online-ivector-feature.h:417

kaldi::LatticeIncrementalOnlineDecoderTpl::BestPathIterator::frame
int32 frame
Definition: lattice-incremental-online-decoder.h:79

rnnlm::i
int i
Definition: mikolov-rnnlm-lib.cc:66

kaldi::OnlineIvectorExtractionInfo::Check
void Check() const
Definition: online-ivector-feature.cc:80

kaldi::OnlineIvectorExtractionConfig::lda_mat_rxfilename
std::string lda_mat_rxfilename
Definition: online-ivector-feature.h:56

kaldi::OnlineIvectorExtractionInfo::use_most_recent_ivector
bool use_most_recent_ivector
Definition: online-ivector-feature.h:189

kaldi::OnlineIvectorFeature::UpdateFrameWeights
void UpdateFrameWeights(const std::vector< std::pair< int32, BaseFloat > > &delta_weights)
Definition: online-ivector-feature.cc:169

kaldi::OnlineIvectorFeature::to_delete_
std::vector< OnlineFeatureInterface * > to_delete_
Definition: online-ivector-feature.h:361

kaldi::OnlineSilenceWeighting::silence_phones_
unordered_set< int32 > silence_phones_
Definition: online-ivector-feature.h:531

kaldi::OnlineIvectorFeature::GetFrame
virtual void GetFrame(int32 frame, VectorBase< BaseFloat > *feat)
Gets the feature vector for this frame.
Definition: online-ivector-feature.cc:327

kaldi::Vector
A class representing a vector.
Definition: kaldi-vector.h:406

kaldi::OnlineIvectorExtractionInfo::max_count
BaseFloat max_count
Definition: online-ivector-feature.h:187

kaldi::LatticeIncrementalDecoderTpl< FST, decoder::BackpointerToken >::NumFramesDecoded
int32 NumFramesDecoded() const
Returns the number of frames decoded so far.
Definition: lattice-incremental-decoder.h:600

KALDI_ASSERT
#define KALDI_ASSERT(cond)
Definition: kaldi-error.h:185

kaldi::MatrixBase::NumRows
MatrixIndexT NumRows() const
Returns number of rows (or zero for empty matrix).
Definition: kaldi-matrix.h:64

kaldi::OnlineIvectorExtractionConfig::splice_config_rxfilename
std::string splice_config_rxfilename
Definition: online-ivector-feature.h:59

kaldi::OnlineSilenceWeightingConfig::max_state_duration
BaseFloat max_state_duration
Definition: online-ivector-feature.h:425

kaldi::MergePairVectorSumming
void MergePairVectorSumming(std::vector< std::pair< I, F > > *vec)
For a vector of pair<I, F> where I is an integer and F a floating-point or integer type...
Definition: stl-utils.h:288

kaldi::OnlineIvectorFeature::FrameShiftInSeconds
virtual BaseFloat FrameShiftInSeconds() const
Definition: online-ivector-feature.cc:165

KALDI_VLOG
#define KALDI_VLOG(v)
Definition: kaldi-error.h:156

kaldi::OnlineIvectorExtractionConfig::ivector_period
int32 ivector_period
Definition: online-ivector-feature.h:69

kaldi::OnlineSilenceWeightingConfig::silence_weight
BaseFloat silence_weight
Definition: online-ivector-feature.h:421

kaldi::OnlineFeatureInterface
OnlineFeatureInterface is an interface for online feature processing (it is also usable in the offlin...
Definition: online-feature-itf.h:49

kaldi::OnlineIvectorFeature::NumFramesReady
virtual int32 NumFramesReady() const
Returns the number of frames that are currently ready.
Definition: online-ivector-feature.cc:160

kaldi::OnlineIvectorExtractionInfo::greedy_ivector_extractor
bool greedy_ivector_extractor
Definition: online-ivector-feature.h:190

kaldi::LatticeFasterOnlineDecoderTpl::BestPathEnd
BestPathIterator BestPathEnd(bool use_final_probs, BaseFloat *final_cost=NULL) const
This function returns an iterator that can be used to trace back the best path.
Definition: lattice-faster-online-decoder.cc:78

kaldi::OnlineIvectorExtractionConfig
This class includes configuration variables relating to the online iVector extraction, but not including configuration for the "base feature".
Definition: online-ivector-feature.h:55

kaldi::OnlineSilenceWeighting::trans_model_
const TransitionModel & trans_model_
Definition: online-ivector-feature.h:526

kaldi::OnlineIvectorFeature::UpdateStatsUntilFrameWeighted
void UpdateStatsUntilFrameWeighted(int32 frame)
Definition: online-ivector-feature.cc:281

kaldi::OnlineIvectorExtractionInfo::online_cmvn_iextractor
bool online_cmvn_iextractor
Definition: online-ivector-feature.h:174

kaldi::VectorBase
Provides a vector abstraction class.
Definition: kaldi-vector.h:41

kaldi::OnlineIvectorExtractionInfo::global_cmvn_stats
Matrix< double > global_cmvn_stats
Definition: online-ivector-feature.h:171

kaldi::OnlineIvectorExtractionInfo::posterior_scale
BaseFloat posterior_scale
Definition: online-ivector-feature.h:186

kaldi::TransitionModel::TransitionIdToPhone
int32 TransitionIdToPhone(int32 trans_id) const
Definition: transition-model.cc:785

kaldi::LatticeIncrementalOnlineDecoderTpl::BestPathIterator
Definition: lattice-incremental-online-decoder.h:77

kaldi::OnlineSilenceWeighting::frame_info_
std::vector< FrameInfo > frame_info_
Definition: online-ivector-feature.h:551

kaldi::OnlineSilenceWeighting::num_frames_output_and_correct_
int32 num_frames_output_and_correct_
Definition: online-ivector-feature.h:561

kaldi::OnlineCacheFeature
This feature type can be used to cache its input, to avoid repetition of computation in a multi-pass ...
Definition: online-feature.h:564

kaldi::LatticeIncrementalOnlineDecoderTpl::TraceBackBestPath
BestPathIterator TraceBackBestPath(BestPathIterator iter, LatticeArc *arc) const
This function can be used in conjunction with BestPathEnd() to trace back the best path one link at a...
Definition: lattice-incremental-online-decoder.cc:108

kaldi::OnlineIvectorFeature::lda_
OnlineFeatureInterface * lda_
Definition: online-ivector-feature.h:355

kaldi::OnlineSilenceWeighting::OnlineSilenceWeighting
OnlineSilenceWeighting(const TransitionModel &trans_model, const OnlineSilenceWeightingConfig &config, int32 frame_subsampling_factor=1)
Definition: online-ivector-feature.cc:465

kaldi::OnlineSilenceWeighting::frame_subsampling_factor_
int32 frame_subsampling_factor_
Definition: online-ivector-feature.h:529

kaldi::OnlineIvectorEstimationStats::Scale
void Scale(double scale)
Scales the number of frames of stats by 0 <= scale <= 1, to make it as if we had fewer frames of adap...
Definition: ivector-extractor.cc:671

kaldi::OnlineSilenceWeighting::GetDeltaWeights
void GetDeltaWeights(int32 num_frames_ready, int32 first_decoder_frame, std::vector< std::pair< int32, BaseFloat > > *delta_weights)
Definition: online-ivector-feature.cc:597