ivector-extractor.h
// ivector/ivector-extractor.h

// Copyright 2013-2014    Daniel Povey
//           2015         David Snyder


// See ../../COPYING for clarification regarding multiple authors
//
// Licensed under the Apache License, Version 2.0 (the "License");
// you may not use this file except in compliance with the License.
// You may obtain a copy of the License at
//
//  http://www.apache.org/licenses/LICENSE-2.0
//
// THIS CODE IS PROVIDED *AS IS* BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY
// KIND, EITHER EXPRESS OR IMPLIED, INCLUDING WITHOUT LIMITATION ANY IMPLIED
// WARRANTIES OR CONDITIONS OF TITLE, FITNESS FOR A PARTICULAR PURPOSE,
// MERCHANTABILITY OR NON-INFRINGEMENT.
// See the Apache 2 License for the specific language governing permissions and
// limitations under the License.

#ifndef KALDI_IVECTOR_IVECTOR_EXTRACTOR_H_
#define KALDI_IVECTOR_IVECTOR_EXTRACTOR_H_

#include <vector>
#include <mutex>
#include "base/kaldi-common.h"
#include "matrix/matrix-lib.h"
#include "gmm/model-common.h"
#include "gmm/diag-gmm.h"
#include "gmm/full-gmm.h"
#include "itf/options-itf.h"
#include "util/common-utils.h"
#include "hmm/posterior.h"

namespace kaldi {

// Note, throughout this file we use SGMM-type notation because
// that's what I'm comfortable with.
// Dimensions:
//  D is the feature dim (e.g. D = 60)
//  I is the number of Gaussians (e.g. I = 2048)
//  S is the ivector dim (e.g. S = 400)


// Options for estimating iVectors, during both training and test.  Note: the
// "acoustic_weight" is not read by any class declared in this header; it has to
// be applied by calling IvectorExtractorUtteranceStats::Scale() before
// obtaining the iVector.
// The same is true of max_count: it has to be applied by the programs
// themselves, e.g. see ../ivectorbin/ivector-extract.cc.
struct IvectorEstimationOptions {
  double acoustic_weight;
  double max_count;
  IvectorEstimationOptions(): acoustic_weight(1.0), max_count(0.0) {}
  void Register(OptionsItf *opts) {
    opts->Register("acoustic-weight", &acoustic_weight,
                   "Weight on part of auxf that involves the data (e.g. 0.2); "
                   "if this weight is small, the prior will have more effect.");
    opts->Register("max-count", &max_count,
                   "Maximum frame count (affects prior scaling): if >0, the prior "
                   "term will be scaled up after the frame count exceeds this "
                   "value.  Note that this count is considered after posterior "
                   "scaling (e.g. --acoustic-weight option, or scale argument to "
                   "scale-post), so you would normally use a cutoff 10 times "
                   "smaller than the corresponding number of frames.");
  }
};
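
// Example sketch of how these options are typically wired up and applied by a
// program such as ../ivectorbin/ivector-extract.cc.  The variables "po",
// "usage" and "utt_stats" are hypothetical; the point is that the options are
// only declared here, and the caller applies them itself:
//
//   ParseOptions po(usage);
//   IvectorEstimationOptions opts;
//   opts.Register(&po);
//   po.Read(argc, argv);
//   ...
//   utt_stats.Scale(opts.acoustic_weight);  // apply the acoustic weight to the
//                                           // stats before estimating the iVector.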


class IvectorExtractor;

/// These are the stats for a particular utterance, i.e. the sufficient
/// statistics for estimating an iVector.
class IvectorExtractorUtteranceStats {
 public:
  IvectorExtractorUtteranceStats(int32 num_gauss, int32 feat_dim,
                                 bool need_2nd_order_stats):
      gamma_(num_gauss), X_(num_gauss, feat_dim) {
    if (need_2nd_order_stats) {
      S_.resize(num_gauss);
      for (int32 i = 0; i < num_gauss; i++)
        S_[i].Resize(feat_dim);
    }
  }

  void AccStats(const MatrixBase<BaseFloat> &feats,
                const Posterior &post);

  void Scale(double scale);  // Used to apply acoustic scale.

  double NumFrames() { return gamma_.Sum(); }

 protected:
  friend class IvectorExtractor;
  friend class IvectorExtractorStats;
  Vector<double> gamma_;  // zeroth-order stats (summed posteriors), dimension [I]
  Matrix<double> X_;      // first-order stats, dimension [I][D]
  std::vector<SpMatrix<double> > S_;  // 2nd-order stats, dimension [I][D][D],
                                      // if required.
};


struct IvectorExtractorOptions {
  int32 ivector_dim;
  int32 num_iters;
  bool use_weights;
  IvectorExtractorOptions(): ivector_dim(400), num_iters(2),
                             use_weights(true) { }
  void Register(OptionsItf *opts) {
    opts->Register("num-iters", &num_iters, "Number of iterations in "
                   "iVector estimation (>1 needed due to weights)");
    opts->Register("ivector-dim", &ivector_dim, "Dimension of iVector");
    opts->Register("use-weights", &use_weights, "If true, regress the "
                   "log-weights on the iVector");
  }
};
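
// Example sketch of constructing an IvectorExtractor (declared below) from
// these options and a full-covariance UBM; "final.ubm" is a placeholder path:
//
//   FullGmm fgmm;
//   ReadKaldiObject("final.ubm", &fgmm);
//   IvectorExtractorOptions extractor_opts;
//   extractor_opts.ivector_dim = 400;
//   IvectorExtractor extractor(extractor_opts, fgmm);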


// Forward declaration.  This class is used together with IvectorExtractor to
// compute iVectors in an online way, so we can update the estimate efficiently
// as we add frames.
class OnlineIvectorEstimationStats;

// Caution: the IvectorExtractor is not the only thing required to get an
// ivector.  We also need to get posteriors from a GMM, typically a FullGmm.
// Typically these will be obtained in a process that involves using a DiagGmm
// for Gaussian selection, followed by getting posteriors from the FullGmm.  To
// keep track of these, we keep them all in the same directory,
// e.g. final.{ubm,dubm,ie}.

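// Example sketch (no Gaussian selection or pruning, so only suitable for small
// tests): computing per-frame posteriors from the FullGmm in the Posterior
// format this header uses.  "feats" and "fgmm" are hypothetical variables:
//
//   Posterior post(feats.NumRows());
//   for (int32 t = 0; t < feats.NumRows(); t++) {
//     Vector<BaseFloat> frame_post(fgmm.NumGauss());
//     fgmm.ComponentPosteriors(feats.Row(t), &frame_post);
//     for (int32 i = 0; i < frame_post.Dim(); i++)
//       if (frame_post(i) > 1.0e-05)  // drop negligible posteriors.
//         post[t].push_back(std::make_pair(i, frame_post(i)));
//   }
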
class IvectorExtractor {
 public:
  friend class IvectorExtractorStats;
  friend class OnlineIvectorEstimationStats;

  IvectorExtractor(): prior_offset_(0.0) { }

  IvectorExtractor(
      const IvectorExtractorOptions &opts,
      const FullGmm &fgmm);

  /// Gets the distribution over iVectors (a Gaussian approximation to the
  /// posterior).  "var" may be NULL if you only need the mean; "mean" and
  /// "var", if supplied, must have dimension IvectorDim().
  void GetIvectorDistribution(
      const IvectorExtractorUtteranceStats &utt_stats,
      VectorBase<double> *mean,
      SpMatrix<double> *var) const;

  /// The distribution over iVectors, in our formulation, is not centered at
  /// zero; its first dimension has a nonzero offset.  This function returns
  /// that offset.
  double PriorOffset() const { return prior_offset_; }

  double GetAuxf(const IvectorExtractorUtteranceStats &utt_stats,
                 const VectorBase<double> &mean,
                 const SpMatrix<double> *var = NULL) const;

  double GetAcousticAuxf(const IvectorExtractorUtteranceStats &utt_stats,
                         const VectorBase<double> &mean,
                         const SpMatrix<double> *var = NULL) const;

  double GetPriorAuxf(const VectorBase<double> &mean,
                      const SpMatrix<double> *var = NULL) const;

  double GetAcousticAuxfVariance(
      const IvectorExtractorUtteranceStats &utt_stats) const;

  double GetAcousticAuxfMean(
      const IvectorExtractorUtteranceStats &utt_stats,
      const VectorBase<double> &mean,
      const SpMatrix<double> *var = NULL) const;

  double GetAcousticAuxfGconst(
      const IvectorExtractorUtteranceStats &utt_stats) const;

  double GetAcousticAuxfWeight(
      const IvectorExtractorUtteranceStats &utt_stats,
      const VectorBase<double> &mean,
      const SpMatrix<double> *var = NULL) const;


  void GetIvectorDistMean(
      const IvectorExtractorUtteranceStats &utt_stats,
      VectorBase<double> *linear,
      SpMatrix<double> *quadratic) const;

  void GetIvectorDistPrior(
      const IvectorExtractorUtteranceStats &utt_stats,
      VectorBase<double> *linear,
      SpMatrix<double> *quadratic) const;

  void GetIvectorDistWeight(
      const IvectorExtractorUtteranceStats &utt_stats,
      const VectorBase<double> &mean,
      VectorBase<double> *linear,
      SpMatrix<double> *quadratic) const;

  // Note: the function GetStats no longer exists due to code refactoring.
  // Instead of this->GetStats(feats, posterior, &utt_stats), call
  // utt_stats.AccStats(feats, posterior).  (See also the usage sketch just
  // after this class.)

  int32 FeatDim() const;
  int32 IvectorDim() const;
  int32 NumGauss() const;
  bool IvectorDependentWeights() const { return w_.NumRows() != 0; }
  void Write(std::ostream &os, bool binary) const;
  void Read(std::istream &is, bool binary);

  // Note: we allow the default assignment and copy operators
  // because they do what we want.
 protected:
  void ComputeDerivedVars();
  void ComputeDerivedVars(int32 i);

  // Imagine we'll project the iVectors with transformation T, so apply T^{-1}
  // where necessary to keep the model equivalent.  Used to keep unit variance
  // (like prior re-estimation).
  void TransformIvectors(const MatrixBase<double> &T,
                         double new_prior_offset);


  /// Weight projection vectors, if used.  Dimension is [I][S].
  Matrix<double> w_;

  /// If we are not using weight-projection vectors, stores the Gaussian
  /// mixture weights from the UBM.
  Vector<double> w_vec_;

  /// Ivector-subspace projection matrices, dimension is [I][D][S].
  std::vector<Matrix<double> > M_;

  /// Inverse variances of speaker-adapted model, dimension [I][D][D].
  std::vector<SpMatrix<double> > Sigma_inv_;

  /// 1st dim of the prior over the ivector has an offset, so it is not zero.
  double prior_offset_;

  // Below are *derived variables* that can be computed from the
  // variables above.

  /// The constant term in the log-likelihood of each Gaussian (not counting
  /// any weight).
  Vector<double> gconsts_;

  /// U_i = M_i^T Sigma_i^{-1} M_i is a quantity that comes up in iVector
  /// estimation.
  Matrix<double> U_;

  /// The product of Sigma_inv_[i] with M_[i].
  std::vector<Matrix<double> > Sigma_inv_M_;

 private:
  // var <-- quadratic_term^{-1}, but done carefully, first flooring eigenvalues
  // of quadratic_term to 1.0, which mathematically is the least they can be,
  // due to the prior term.
  static void InvertWithFlooring(const SpMatrix<double> &quadratic_term,
                                 SpMatrix<double> *var);
};
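
// Example sketch of extracting a single utterance-level iVector with the class
// above, assuming features "feats", posteriors "post" (see the posterior sketch
// earlier) and a trained "extractor" (hypothetical names):
//
//   IvectorExtractorUtteranceStats utt_stats(extractor.NumGauss(),
//                                            extractor.FeatDim(),
//                                            false /* no 2nd-order stats */);
//   utt_stats.AccStats(feats, post);
//   utt_stats.Scale(0.2);  // optional: --acoustic-weight, see IvectorEstimationOptions.
//   Vector<double> ivector(extractor.IvectorDim());
//   extractor.GetIvectorDistribution(utt_stats, &ivector, NULL);
//   ivector(0) -= extractor.PriorOffset();  // if a zero-centered iVector is wanted.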


/// This class helps us to efficiently estimate iVectors in situations where
/// the data is coming in frame by frame.
class OnlineIvectorEstimationStats {
 public:
  // Search above for max_count to see an explanation; if nonzero, it will
  // put a higher weight on the prior (vs. the stats) once the count passes
  // that value.
  OnlineIvectorEstimationStats(int32 ivector_dim,
                               BaseFloat prior_offset,
                               BaseFloat max_count);

  OnlineIvectorEstimationStats(const OnlineIvectorEstimationStats &other);


  // Accumulate stats for one frame.
  void AccStats(const IvectorExtractor &extractor,
                const VectorBase<BaseFloat> &feature,
                const std::vector<std::pair<int32, BaseFloat> > &gauss_post);

  // Accumulate stats for a sequence (or collection) of frames.
  void AccStats(const IvectorExtractor &extractor,
                const MatrixBase<BaseFloat> &features,
                const std::vector<std::vector<std::pair<int32, BaseFloat> > > &gauss_post);


  int32 IvectorDim() const { return linear_term_.Dim(); }

  // Gets the current estimate of the iVector; *ivector must have dimension
  // IvectorDim() at entry.  num_cg_iters limits the conjugate-gradient
  // iterations used (see the comment above EstimateIvectorsOnline, below); a
  // previous estimate left in *ivector gives the optimization a better
  // starting point.
  void GetIvector(int32 num_cg_iters,
                  VectorBase<double> *ivector) const;

  double NumFrames() const { return num_frames_; }

  double PriorOffset() const { return prior_offset_; }

  // Returns the objective-function change per frame from the "default" iVector
  // to the given value.
  double ObjfChange(const VectorBase<double> &ivector) const;

  double Count() const { return num_frames_; }

  // Scales the stats, as if we had seen "scale" times as many frames.
  void Scale(double scale);

  void Write(std::ostream &os, bool binary) const;
  void Read(std::istream &is, bool binary);

  // Override the default assignment operator.
  OnlineIvectorEstimationStats &operator = (const OnlineIvectorEstimationStats &other) {
    this->prior_offset_ = other.prior_offset_;
    this->max_count_ = other.max_count_;
    this->num_frames_ = other.num_frames_;
    this->quadratic_term_ = other.quadratic_term_;
    this->linear_term_ = other.linear_term_;
    return *this;
  }

 protected:
  // Returns the objective function (per frame) evaluated at this iVector value.
  double Objf(const VectorBase<double> &ivector) const;

  // Returns the objective function evaluated at the "default" iVector,
  // i.e. [ prior_offset_, 0, 0, ... ].
  double DefaultObjf() const;

  friend class IvectorExtractor;
  double prior_offset_;
  double max_count_;
  double num_frames_;  // num frames (weighted, if applicable).
  SpMatrix<double> quadratic_term_;
  Vector<double> linear_term_;
};
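
// Example sketch of frame-by-frame (online) estimation with the class above;
// "extractor", "feats" and "post" are hypothetical, and max_count may be 0.0
// (meaning no limit):
//
//   OnlineIvectorEstimationStats online_stats(extractor.IvectorDim(),
//                                             extractor.PriorOffset(),
//                                             max_count);
//   Vector<double> ivector(extractor.IvectorDim());
//   ivector(0) = extractor.PriorOffset();  // a sensible starting point.
//   for (int32 t = 0; t < feats.NumRows(); t++) {
//     online_stats.AccStats(extractor, feats.Row(t), post[t]);
//     online_stats.GetIvector(15, &ivector);  // current estimate, raw (uncentered).
//   }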


// This function obtains, every "ivector_period" frames (e.g. every 10 frames),
// an estimate of the iVector including all frames up to that point.
// This emulates what you could do in an online/streaming algorithm; its use is
// for neural network training in a way that's matched to online decoding.
// [note: I don't believe we are currently using the program,
// ivector-extract-online.cc, that calls this function, in any of the scripts.]
// Caution: this function outputs the raw iVectors, where the first component
// will generally be very positive.  You probably want to subtract PriorOffset()
// from the first element of each row of the output before writing it out.
// For num_cg_iters, we suggest 15.  It can be a positive number (more -> more
// exact, less -> faster), or if it's negative it will do the optimization
// exactly each time, which is slower.
// It returns the objective-function improvement per frame from the "default"
// iVector to the last iVector estimated.
double EstimateIvectorsOnline(
    const Matrix<BaseFloat> &feats,
    const Posterior &post,
    const IvectorExtractor &extractor,
    int32 ivector_period,
    int32 num_cg_iters,
    BaseFloat max_count,
    Matrix<BaseFloat> *ivectors);
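
// Example sketch of calling the function above and centering the output, with
// hypothetical "feats", "post" and "extractor":
//
//   Matrix<BaseFloat> ivectors;
//   EstimateIvectorsOnline(feats, post, extractor,
//                          10,   // ivector_period: one output row per 10 frames.
//                          15,   // num_cg_iters, as suggested above.
//                          0.0,  // max_count: 0 means no limit.
//                          &ivectors);
//   for (int32 r = 0; r < ivectors.NumRows(); r++)
//     ivectors(r, 0) -= extractor.PriorOffset();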


/// Options for IvectorExtractorStats, which is used to update the parameters
/// of IvectorExtractor.
struct IvectorExtractorStatsOptions {
  bool update_variances;
  bool compute_auxf;
  int32 num_samples_for_weights;
  int32 cache_size;

  IvectorExtractorStatsOptions(): update_variances(true),
                                  compute_auxf(true),
                                  num_samples_for_weights(10),
                                  cache_size(100) { }
  void Register(OptionsItf *opts) {
    opts->Register("update-variances", &update_variances, "If true, update the "
                   "Gaussian variances");
    opts->Register("compute-auxf", &compute_auxf, "If true, compute the "
                   "auxiliary functions on training data; can be used to "
                   "debug and check convergence.");
    opts->Register("num-samples-for-weights", &num_samples_for_weights,
                   "Number of samples from iVector distribution to use "
                   "for accumulating stats for weight update.  Must be >1");
    opts->Register("cache-size", &cache_size, "Size of an internal "
                   "cache (not critical, only affects speed/memory)");
  }
};


/// Options for training the IvectorExtractor, e.g. variance flooring.
struct IvectorExtractorEstimationOptions {
  double variance_floor_factor;
  double gaussian_min_count;
  bool diagonalize;
  IvectorExtractorEstimationOptions(): variance_floor_factor(0.1),
                                       gaussian_min_count(100.0),
                                       diagonalize(true) { }
  void Register(OptionsItf *opts) {
    opts->Register("variance-floor-factor", &variance_floor_factor,
                   "Factor that determines variance flooring (we floor each covar "
                   "to this times the global average covariance).");
    opts->Register("gaussian-min-count", &gaussian_min_count,
                   "Minimum total count per Gaussian, below which we refuse to "
                   "update any associated parameters.");
    opts->Register("diagonalize", &diagonalize,
                   "If true, diagonalize the quadratic term in the "
                   "objective function.  This reorders the ivector dimensions "
                   "from most to least important.");
  }
};


/// IvectorExtractorStats is a class used to update the parameters of the
/// ivector extractor.
class IvectorExtractorStats {
 public:
  friend class IvectorExtractor;

  IvectorExtractorStats(): tot_auxf_(0.0), R_num_cached_(0), num_ivectors_(0) { }

  IvectorExtractorStats(const IvectorExtractor &extractor,
                        const IvectorExtractorStatsOptions &stats_opts);

  void Add(const IvectorExtractorStats &other);

  void AccStatsForUtterance(const IvectorExtractor &extractor,
                            const MatrixBase<BaseFloat> &feats,
                            const Posterior &post);

  // This version (intended mainly for testing) works out the Gaussian
  // posteriors from the model.  Returns the total log-like for feats, given
  // the unadapted fgmm.  You'd want to add Gaussian pruning and preselection
  // using the diagonal GMM, for speed, if you used this outside testing code.
  double AccStatsForUtterance(const IvectorExtractor &extractor,
                              const MatrixBase<BaseFloat> &feats,
                              const FullGmm &fgmm);

  void Read(std::istream &is, bool binary, bool add = false);

  void Write(std::ostream &os, bool binary);  // non-const version; relates to cache.

  // const version of Write; may use extra memory if we have stuff cached.
  void Write(std::ostream &os, bool binary) const;

  // Returns the objf improvement per frame.
  double Update(const IvectorExtractorEstimationOptions &opts,
                IvectorExtractor *extractor) const;

  double AuxfPerFrame() { return tot_auxf_ / gamma_.Sum(); }

  void IvectorVarianceDiagnostic(const IvectorExtractor &extractor);

  // Copy constructor.
  explicit IvectorExtractorStats (const IvectorExtractorStats &other);

 protected:


  // This is called by AccStatsForUtterance
  void CommitStatsForUtterance(const IvectorExtractor &extractor,
                               const IvectorExtractorUtteranceStats &utt_stats);

  void CommitStatsForM(const IvectorExtractor &extractor,
                       const IvectorExtractorUtteranceStats &utt_stats,
                       const VectorBase<double> &ivec_mean,
                       const SpMatrix<double> &ivec_var);

  void FlushCache();

  void CommitStatsForSigma(const IvectorExtractor &extractor,
                           const IvectorExtractorUtteranceStats &utt_stats);

  void CommitStatsForWPoint(const IvectorExtractor &extractor,
                            const IvectorExtractorUtteranceStats &utt_stats,
                            const VectorBase<double> &ivector,
                            double weight);


  void CommitStatsForW(const IvectorExtractor &extractor,
                       const IvectorExtractorUtteranceStats &utt_stats,
                       const VectorBase<double> &ivec_mean,
                       const SpMatrix<double> &ivec_var);

  void CommitStatsForPrior(const VectorBase<double> &ivec_mean,
                           const SpMatrix<double> &ivec_var);

  // Updates M.  Returns the objf improvement per frame.
  double UpdateProjections(const IvectorExtractorEstimationOptions &opts,
                           IvectorExtractor *extractor) const;

  // This internally called function returns the objf improvement
  // for this Gaussian index.  Updates one M.
  double UpdateProjection(const IvectorExtractorEstimationOptions &opts,
                          int32 gaussian,
                          IvectorExtractor *extractor) const;

  // Updates the weight projections.  Returns the objf improvement per
  // frame.
  double UpdateWeights(const IvectorExtractorEstimationOptions &opts,
                       IvectorExtractor *extractor) const;

  // Updates the weight projection for one Gaussian index.  Returns the objf
  // improvement for this index.
  double UpdateWeight(const IvectorExtractorEstimationOptions &opts,
                      int32 gaussian,
                      IvectorExtractor *extractor) const;

  // Returns the objf improvement per frame.
  double UpdateVariances(const IvectorExtractorEstimationOptions &opts,
                         IvectorExtractor *extractor) const;


  // Updates the prior; returns obj improvement per frame.
  double UpdatePrior(const IvectorExtractorEstimationOptions &opts,
                     IvectorExtractor *extractor) const;

  // Called from UpdatePrior, separating out some code that
  // computes likelihood changes.
  double PriorDiagnostics(double old_prior_offset) const;


  void CheckDims(const IvectorExtractor &extractor) const;

  IvectorExtractorStatsOptions config_;

  double tot_auxf_;

  /// This mutex guards gamma_ and Y_ (for multi-threaded update).
  std::mutex gamma_Y_lock_;

  /// Total occupation count for each Gaussian index (zeroth-order stats).
  Vector<double> gamma_;

  /// Stats Y_i for estimating projections M.
  std::vector<Matrix<double> > Y_;

  /// This mutex guards R_ (for multi-threaded update).
  std::mutex R_lock_;

  /// R_i, quadratic term for ivector subspace (M matrix) estimation.
  Matrix<double> R_;

  /// This mutex guards R_num_cached_, R_gamma_cache_ and R_ivec_scatter_cache_
  /// (for multi-threaded update).
  std::mutex R_cache_lock_;

  /// To avoid too-frequent rank-1 updates of R_, which are slow, we cache some
  /// quantities here.
  int32 R_num_cached_;
  /// dimension: [num-to-cache][I]
  Matrix<double> R_gamma_cache_;
  /// dimension: [num-to-cache][S*(S+1)/2]
  Matrix<double> R_ivec_scatter_cache_;

  /// This mutex guards Q_ and G_ (for multi-threaded update).
  std::mutex weight_stats_lock_;

  /// Q_ is like R_ (with the same dimensions), except used for weight
  /// estimation.
  Matrix<double> Q_;

  /// G_ is the linear term in the weight projection matrix w_.
  Matrix<double> G_;

  /// This mutex guards S_ (for multi-threaded update).
  std::mutex variance_stats_lock_;

  /// S_{i}, raw second-order stats per Gaussian which we will use to update
  /// the variances Sigma_inv_.
  std::vector< SpMatrix<double> > S_;


  /// This mutex guards num_ivectors_, ivector_sum_ and ivector_scatter_ (for
  /// multi-threaded update).
  std::mutex prior_stats_lock_;

  /// Count of the number of iVectors we trained on.
  double num_ivectors_;

  /// Sum of all the iVector means.  Needed for prior re-estimation.
  Vector<double> ivector_sum_;

  /// Second-order stats for the iVectors.  Needed for prior re-estimation.
  SpMatrix<double> ivector_scatter_;

 private:
  // Computes an orthogonal matrix A from the iVector transform T such that
  // T' = A*T is an alternative transform which diagonalizes the quadratic
  // term in the iVector estimation objective function (see the "diagonalize"
  // option above); this reorders the iVector dimensions from most to least
  // important.
  void GetOrthogonalIvectorTransform(const SubMatrix<double> &T,
                                     IvectorExtractor *extractor,
                                     Matrix<double> *A) const;

  IvectorExtractorStats &operator = (const IvectorExtractorStats &other);  // Disallow.
};
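
// Example sketch of one training iteration using the classes above; the
// rspecifiers and the starting "extractor" are hypothetical, and this is
// roughly what binaries like ivector-extractor-acc-stats and
// ivector-extractor-est do, repeated over several iterations:
//
//   IvectorExtractorStatsOptions stats_opts;
//   IvectorExtractorStats stats(extractor, stats_opts);
//   SequentialBaseFloatMatrixReader feats_reader(feats_rspecifier);
//   RandomAccessPosteriorReader post_reader(post_rspecifier);
//   for (; !feats_reader.Done(); feats_reader.Next()) {
//     const Matrix<BaseFloat> &feats = feats_reader.Value();
//     const Posterior &post = post_reader.Value(feats_reader.Key());
//     stats.AccStatsForUtterance(extractor, feats, post);
//   }
//   IvectorExtractorEstimationOptions update_opts;
//   stats.Update(update_opts, &extractor);  // returns the auxf improvement per frame.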



}  // namespace kaldi


#endif