doc/estimate-am-sgmm2_8h_source.html

 // sgmm2/estimate-am-sgmm2.h

 // Copyright 2009-2011  Microsoft Corporation;  Lukas Burget;
 //                      Saarland University (Author: Arnab Ghoshal);
 //                      Ondrej Glembek;  Yanmin Qian;
 // Copyright 2012-2013  Johns Hopkins University (Author: Daniel Povey)
 //                      Liang Lu;  Arnab Ghoshal

 // See ../../COPYING for clarification regarding multiple authors
 //
 // Licensed under the Apache License, Version 2.0 (the "License");
 // you may not use this file except in compliance with the License.
 // You may obtain a copy of the License at
 //
 //  http://www.apache.org/licenses/LICENSE-2.0
 //
 // THIS CODE IS PROVIDED *AS IS* BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY
 // KIND, EITHER EXPRESS OR IMPLIED, INCLUDING WITHOUT LIMITATION ANY IMPLIED
 // WARRANTIES OR CONDITIONS OF TITLE, FITNESS FOR A PARTICULAR PURPOSE,
 // MERCHANTABLITY OR NON-INFRINGEMENT.
 // See the Apache 2 License for the specific language governing permissions and
 // limitations under the License.

 #ifndef KALDI_SGMM2_ESTIMATE_AM_SGMM2_H_
 #define KALDI_SGMM2_ESTIMATE_AM_SGMM2_H_ 1

 #include <string>
 #include <vector>

 #include "sgmm2/am-sgmm2.h"
 #include "gmm/model-common.h"
 #include "itf/options-itf.h"
 #include "util/kaldi-thread.h"

 namespace kaldi {

 struct MleAmSgmm2Options {
   BaseFloat tau_c;
   BaseFloat cov_floor;
   BaseFloat cov_diag_ratio;
   BaseFloat max_cond;

   bool renormalize_V;  // Renormalize the phonetic space.
   bool renormalize_N;  // Renormalize the speaker space.

   int weight_projections_iters;

   BaseFloat epsilon;
   BaseFloat max_impr_u;

   BaseFloat tau_map_M;
   int map_M_prior_iters;
   bool full_row_cov;
   bool full_col_cov;

   MleAmSgmm2Options() {
     cov_floor = 0.025;
     tau_c  = 2.0;
     cov_diag_ratio = 2.0;  // set this to very large to get diagonal-cov models.
     max_cond = 1.0e+05;
     epsilon = 1.0e-40;
     renormalize_V = true;
     renormalize_N = false;  // default to false since will invalidate spk vectors
     // on disk.
     weight_projections_iters = 3;
     max_impr_u = 0.25;

     map_M_prior_iters = 5;
     tau_map_M = 0.0;  // No MAP update by default (~500-1000 depending on prior)
     full_row_cov = false;
     full_col_cov = false;
   }

   void Register(OptionsItf *opts) {
     std::string module = "MleAmSgmm2Options: ";
     opts->Register("tau-c", &tau_c, module+
                    "Count for smoothing weight update.");
     opts->Register("cov-floor", &cov_floor, module+
                    "Covariance floor (fraction of average covariance).");
     opts->Register("cov-diag-ratio", &cov_diag_ratio, module+
                    "Minimum occ/dim ratio below which use diagonal covariances.");
     opts->Register("max-cond", &max_cond, module+"Maximum condition number used to "
                    "regularize the solution of certain quadratic auxiliary functions.");
     opts->Register("weight-projections-iters", &weight_projections_iters, module+
                    "Number for iterations for weight projection estimation.");
     opts->Register("renormalize-v", &renormalize_V, module+"If true, renormalize "
                    "the phonetic-subspace vectors to have meaningful sizes.");
     opts->Register("renormalize-n", &renormalize_N, module+"If true, renormalize "
                    "the speaker subspace to have meaningful sizes.");
     opts->Register("max-impr-u", &max_impr_u, module+"Maximum objective function "
                    "improvement per frame allowed in update of u (to "
                    "maintain stability.");

     opts->Register("tau-map-M", &tau_map_M, module+"Smoothing for MAP estimate "
                    "of M (0 means ML update).");
     opts->Register("map-M-prior-iters", &map_M_prior_iters, module+
                    "Number of iterations to estimate prior covariances for M.");
     opts->Register("full-row-cov", &full_row_cov, module+
                    "Estimate row covariance instead of using I.");
     opts->Register("full-col-cov", &full_col_cov, module+
                    "Estimate column covariance instead of using I.");
   }
 };

 /// Class for the accumulators associated with the phonetic-subspace model
 /// parameters.
 class MleAmSgmm2Accs {
  public:
   /// Creates an accumulator with all totals and dimensions set to zero.
   /// @param rand_prune  Value stored in rand_prune_.
   explicit MleAmSgmm2Accs(BaseFloat rand_prune = 1.0e-05)
       : total_frames_(0.0), total_like_(0.0), feature_dim_(0),
         phn_space_dim_(0), spk_space_dim_(0), num_gaussians_(0),
         num_pdfs_(0), num_groups_(0), rand_prune_(rand_prune) {}

   /// Creates an accumulator and immediately calls ResizeAccumulators()
   /// with the given model, flags and have_spk_vecs.
   /// The dimension members are zero-initialized first, as in the default
   /// constructor, so they never hold indeterminate values even if
   /// ResizeAccumulators() does not assign every one of them.
   MleAmSgmm2Accs(const AmSgmm2 &model, SgmmUpdateFlagsType flags,
                  bool have_spk_vecs,
                  BaseFloat rand_prune = 1.0e-05)
       : total_frames_(0.0), total_like_(0.0), feature_dim_(0),
         phn_space_dim_(0), spk_space_dim_(0), num_gaussians_(0),
         num_pdfs_(0), num_groups_(0), rand_prune_(rand_prune) {
     ResizeAccumulators(model, flags, have_spk_vecs);
   }

   ~MleAmSgmm2Accs();

   /// Reads the accumulators from a stream.
   /// NOTE(review): `add` presumably means "add to existing stats rather
   /// than overwrite" -- confirm against the definition in the .cc file.
   void Read(std::istream &in_stream, bool binary, bool add);
   /// Writes the accumulators to a stream.
   void Write(std::ostream &out_stream, bool binary) const;

   /// Checks the accumulators against the given model (defined in the .cc).
   void Check(const AmSgmm2 &model, bool show_properties = true) const;

   /// Sizes the accumulators for the given model and update flags
   /// (defined in the .cc).
   void ResizeAccumulators(const AmSgmm2 &model, SgmmUpdateFlagsType flags,
                           bool have_spk_vecs);

   /// Accumulates statistics for one frame with the given weight.
   /// NOTE(review): the meaning of the BaseFloat return value is not
   /// visible in this header -- see the .cc file.
   BaseFloat Accumulate(const AmSgmm2 &model,
                        const Sgmm2PerFrameDerivedVars &frame_vars,
                        int32 pdf_index, // == j2.
                        BaseFloat weight,
                        Sgmm2PerSpkDerivedVars *spk_vars);

   /// Accumulates statistics for one frame from a matrix of posteriors.
   BaseFloat AccumulateFromPosteriors(const AmSgmm2 &model,
                                      const Sgmm2PerFrameDerivedVars &frame_vars,
                                      const Matrix<BaseFloat> &posteriors,
                                      int32 pdf_index, // == j2.
                                      Sgmm2PerSpkDerivedVars *spk_vars);

   /// Commits the per-speaker statistics (defined in the .cc).
   void CommitStatsForSpk(const AmSgmm2 &model,
                          const Sgmm2PerSpkDerivedVars &spk_vars);

   /// Writes the state occupancies to *occs.
   void GetStateOccupancies(Vector<BaseFloat> *occs) const;
   int32 FeatureDim() const { return feature_dim_; }
   int32 PhoneSpaceDim() const { return phn_space_dim_; }
   int32 NumPdfs() const { return num_pdfs_; } // returns J2
   int32 NumGroups() const { return num_groups_; } // returns J1
   int32 NumGauss() const { return num_gaussians_; }

  private:
   /// The stats which are not tied to any state.
   std::vector< Matrix<double> > Y_;
   /// Stats Z_{i} for speaker-subspace projections N. Dim is [I][D][T].
   std::vector< Matrix<double> > Z_;
   /// R_{i}, quadratic term for speaker subspace estimation. Dim is [I][T][T].
   std::vector< SpMatrix<double> > R_;
   /// S_{i}^{-}, scatter of adapted feature vectors x_{i}(t). Dim is [I][D][D].
   std::vector< SpMatrix<double> > S_;

   /// The SGMM state specific stats.
   std::vector< Matrix<double> > y_;
   /// Gaussian occupancies gamma_{jmi} for each substate and Gaussian index.
   std::vector< Matrix<double> > gamma_;

   /// [SSGMM] These a_{jmi} quantities are dimensionally the same as the
   /// gamma quantities.
   std::vector< Matrix<double> > a_;

   /// [SSGMM] each row is one of the t_i quantities in the less-exact
   /// version of the SSGMM update.
   Matrix<double> t_;

   /// [SSGMM] per-speaker variable storing the a_i^{(s)} quantities.
   Vector<double> a_s_;

   /// The U_i quantities from the less-exact version of the SSGMM update
   /// for the speaker weight projections.
   std::vector<SpMatrix<double> > U_;

   /// Sub-state occupancies gamma_{jm}^{(c)} for each sub-state.
   std::vector< Vector<double> > gamma_c_;

   /// gamma_{i}^{(s)}.
   Vector<double> gamma_s_;

   double total_frames_, total_like_;

   /// Dimensionality of various subspaces.
   int32 feature_dim_, phn_space_dim_, spk_space_dim_;
   /// Other model specifications.
   int32 num_gaussians_, num_pdfs_, num_groups_;

   BaseFloat rand_prune_;

   KALDI_DISALLOW_COPY_AND_ASSIGN(MleAmSgmm2Accs);
   // The updaters read the accumulated statistics directly.
   friend class MleAmSgmm2Updater;
   friend class EbwAmSgmm2Updater;
 };

 /// Updates an AmSgmm2 model from the statistics held in an MleAmSgmm2Accs,
 /// using the settings in an MleAmSgmm2Options.  Only the constructor and
 /// Reconfigure() are defined inline; everything else is defined in the
 /// corresponding .cc file.
 class MleAmSgmm2Updater {
  public:
   /// Stores a copy of the given options.
   explicit MleAmSgmm2Updater(const MleAmSgmm2Options &options)
       : options_(options) {}
   /// Replaces the stored options with a copy of @p options.
   void Reconfigure(const MleAmSgmm2Options &options) {
     options_ = options;
   }

   /// Main entry point: updates *model from accs; `flags` selects what is
   /// updated (SgmmUpdateFlagsType is a bitwise OR of update flags).
   void Update(const MleAmSgmm2Accs &accs,
               AmSgmm2 *model,
               SgmmUpdateFlagsType flags);

  private:
   // Helper classes that need access to the private static/internal routines
   // below.  UpdateWClass is defined later in this header;
   // UpdatePhoneVectorsClass is defined in estimate-am-sgmm2.cc.
   // NOTE(review): EbwEstimateAmSgmm2 is not declared anywhere visible here;
   // possibly a stale name for EbwAmSgmm2Updater -- confirm.
   friend class UpdateWClass;
   friend class UpdatePhoneVectorsClass;
   friend class EbwEstimateAmSgmm2;

   // Computes the quantities Q from the accumulators and the model; one
   // SpMatrix per entry of *Q.
   static void ComputeQ(const MleAmSgmm2Accs &accs,
                        const AmSgmm2 &model,
                        std::vector< SpMatrix<double> > *Q);

   // Computes the quantities S_means from the accumulators and the model.
   static void ComputeSMeans(const MleAmSgmm2Accs &accs,
                             const AmSgmm2 &model,
                             std::vector< SpMatrix<double> > *S_means);
   // EbwAmSgmm2Updater is defined in estimate-am-sgmm2-ebw.h.
   friend class EbwAmSgmm2Updater;

   // Configuration in effect for the update; set by the constructor or
   // Reconfigure().
   MleAmSgmm2Options options_;

   // Called from UpdatePhoneVectors; updates a subset of states
   // (relates to multi-threading).
   void UpdatePhoneVectorsInternal(const MleAmSgmm2Accs &accs,
                                   const std::vector<SpMatrix<double> > &H,
                                   const std::vector<Matrix<double> > &log_a,
                                   AmSgmm2 *model,
                                   double *auxf_impr,
                                   int32 num_threads,
                                   int32 thread_id) const;

   // Update of the phone vectors.
   // NOTE(review): the double returned by this and the other Update*
   // routines is presumably an objective-function improvement -- confirm
   // in the .cc file.
   double UpdatePhoneVectors(const MleAmSgmm2Accs &accs,
                             const std::vector<SpMatrix<double> > &H,
                             const std::vector<Matrix<double> > &log_a,
                             AmSgmm2 *model) const;

   // Update of M (see also MapUpdateM below for the MAP variant).
   double UpdateM(const MleAmSgmm2Accs &accs,
                  const std::vector< SpMatrix<double> > &Q,
                  const Vector<double> &gamma_i,
                  AmSgmm2 *model);

   // Renormalization of the phonetic space (cf. options_.renormalize_V).
   void RenormalizeV(const MleAmSgmm2Accs &accs, AmSgmm2 *model,
                     const Vector<double> &gamma_i,
                     const std::vector<SpMatrix<double> > &H);

   // Update of N.
   double UpdateN(const MleAmSgmm2Accs &accs, const Vector<double> &gamma_i,
                  AmSgmm2 *model);
   // Renormalization of the speaker space (cf. options_.renormalize_N).
   void RenormalizeN(const MleAmSgmm2Accs &accs, const Vector<double> &gamma_i,
                     AmSgmm2 *model);
   // Update of the variances, given the precomputed S_means.
   double UpdateVars(const MleAmSgmm2Accs &accs,
                     const std::vector< SpMatrix<double> > &S_means,
                     const Vector<double> &gamma_i,
                     AmSgmm2 *model);
   // Update for the phonetic-subspace weight projections w_i
   double UpdateW(const MleAmSgmm2Accs &accs,
                  const std::vector<Matrix<double> > &log_a,
                  const Vector<double> &gamma_i,
                  AmSgmm2 *model);
   // Update for the speaker-subspace weight projections u_i [SSGMM]
   double UpdateU(const MleAmSgmm2Accs &accs, const Vector<double> &gamma_i,
                  AmSgmm2 *model);

   // Called, multithreaded, inside UpdateW.  UpdateWClass::operator() passes
   // its own F_i/g_i/tot_like buffers plus its num_threads_ and thread_id_.
   static
   void UpdateWGetStats(const MleAmSgmm2Accs &accs,
                        const AmSgmm2 &model,
                        const Matrix<double> &w,
                        const std::vector<Matrix<double> > &log_a,
                        Matrix<double> *F_i,
                        Matrix<double> *g_i,
                        double *tot_like,
                        int32 num_threads,
                        int32 thread_id);

   // Update of the sub-state weights.
   double UpdateSubstateWeights(const MleAmSgmm2Accs &accs,
                                AmSgmm2 *model);

   // Fills *log_a from the accumulators; the result is what the routines
   // above take as their `log_a` argument.
   static void ComputeLogA(const MleAmSgmm2Accs &accs,
                           std::vector<Matrix<double> > *log_a); // [SSGMM]

   // Routines for the MAP update of M (cf. options_.tau_map_M).
   void ComputeMPrior(AmSgmm2 *model);  // TODO(arnab): Maybe make this static?
   double MapUpdateM(const MleAmSgmm2Accs &accs,
                     const std::vector< SpMatrix<double> > &Q,
                     const Vector<double> &gamma_i, AmSgmm2 *model);

   KALDI_DISALLOW_COPY_AND_ASSIGN(MleAmSgmm2Updater);
   MleAmSgmm2Updater() {}  // Prevent unconfigured updater.
 };


 /// Class for the accumulators required to update the speaker vectors v_s.
 /// All member functions are defined in the corresponding .cc file.
 class MleSgmm2SpeakerAccs {
  public:
   /// Initializes the accumulator for the given model.
   /// NOTE(review): this constructor is callable with a single argument and
   /// is not marked `explicit`, so an AmSgmm2 converts implicitly to this
   /// type -- confirm whether that is intended.
   MleSgmm2SpeakerAccs(const AmSgmm2 &model,
                       BaseFloat rand_prune_ = 1.0e-05);

   /// Clears the statistics.
   void Clear();

   /// Accumulates statistics for one frame with the given weight.
   /// NOTE(review): the meaning of the BaseFloat return value is not
   /// visible in this header -- see the .cc file.
   BaseFloat Accumulate(const AmSgmm2 &model,
                        const Sgmm2PerFrameDerivedVars &frame_vars,
                        int32 pdf_index,
                        BaseFloat weight,
                        Sgmm2PerSpkDerivedVars *spk_vars);

   /// Accumulates statistics for one frame from a matrix of posteriors.
   BaseFloat AccumulateFromPosteriors(const AmSgmm2 &model,
                                      const Sgmm2PerFrameDerivedVars &frame_vars,
                                      const Matrix<BaseFloat> &posteriors,
                                      int32 pdf_index,
                                      Sgmm2PerSpkDerivedVars *spk_vars);

   /// Updates the speaker vector *v_s.  The objective-function improvement
   /// and the count are written through objf_impr_out and count_out.
   void Update(const AmSgmm2 &model,
               BaseFloat min_count,  // e.g. 100
               Vector<BaseFloat> *v_s,
               BaseFloat *objf_impr_out,
               BaseFloat *count_out);

  private:
   // Update without speaker-dependent weights (vectors u_i),
   // i.e. not symmetric SGMM (SSGMM)
   void UpdateNoU(Vector<BaseFloat> *v_s,
                  BaseFloat *objf_impr_out,
                  BaseFloat *count_out);
   // Update for SSGMM
   void UpdateWithU(const AmSgmm2 &model,
                    Vector<BaseFloat> *v_s,
                    BaseFloat *objf_impr_out,
                    BaseFloat *count_out);


   /// Statistics for speaker adaptation (vectors), stored per-speaker.
   Vector<double> y_s_;
   /// gamma_{i}^{(s)}.  Per-speaker counts for each Gaussian. Dimension is [I]
   Vector<double> gamma_s_;
   /// a_i^{(s)}.  For SSGMM.
   Vector<double> a_s_;

   /// The following variable does not change per speaker, it just relates
   /// to the speaker subspace.
   std::vector< SpMatrix<double> > H_spk_;

   /// N_i^T \Sigma_{i}^{-1}. Needed for y^{(s)}.
   std::vector< Matrix<double> > NtransSigmaInv_;

   /// Small constant to randomly prune tiny posteriors.
   BaseFloat rand_prune_;
 };

 // This class, used in multi-core implementation of the updates of the "w_i"
 // quantities, was previously in estimate-am-sgmm.cc, but is being moved to the
 // header so it can be used in estimate-am-sgmm-ebw.cc.  It is responsible for
 // computing, in parallel, the F_i and g_i quantities used in the updates of
 // w_i.
 class UpdateWClass: public MultiThreadable {
  public:
   UpdateWClass(const MleAmSgmm2Accs &accs,
                const AmSgmm2 &model,
                const Matrix<double> &w,
                const std::vector<Matrix<double> > &log_a,
                Matrix<double> *F_i,
                Matrix<double> *g_i,
                double *tot_like):
       accs_(accs), model_(model), w_(w), log_a_(log_a),
       F_i_ptr_(F_i), g_i_ptr_(g_i), tot_like_ptr_(tot_like) {
     tot_like_ = 0.0;
     F_i_.Resize(F_i->NumRows(), F_i->NumCols());
     g_i_.Resize(g_i->NumRows(), g_i->NumCols());
   }

   UpdateWClass(const UpdateWClass &other) :
       MultiThreadable(other),
       accs_(other.accs_), model_(other.model_), w_(other.w_),
       log_a_(other.log_a_), F_i_ptr_(other.F_i_ptr_), g_i_ptr_(other.g_i_ptr_),
       F_i_(other.F_i_), g_i_(other.g_i_), tot_like_ptr_(other.tot_like_ptr_),
       tot_like_(0.0) { }

   ~UpdateWClass() {
     F_i_ptr_->AddMat(1.0, F_i_, kNoTrans);
     g_i_ptr_->AddMat(1.0, g_i_, kNoTrans);
     *tot_like_ptr_ += tot_like_;
   }

   inline void operator() () {
     // Note: give them local copy of the sums we're computing,
     // which will be propagated to the total sums in the destructor.
     MleAmSgmm2Updater::UpdateWGetStats(accs_, model_, w_, log_a_,
                                       &F_i_, &g_i_, &tot_like_,
                                       num_threads_, thread_id_);
   }
  private:
   const MleAmSgmm2Accs &accs_;
   const AmSgmm2 &model_;
   const Matrix<double> &w_;
   const std::vector<Matrix<double> > &log_a_;
   Matrix<double> *F_i_ptr_;
   Matrix<double> *g_i_ptr_;
   Matrix<double> F_i_;
   Matrix<double> g_i_;
   double *tot_like_ptr_;
   double tot_like_;
 };


 }  // namespace kaldi


 #endif  // KALDI_SGMM2_ESTIMATE_AM_SGMM2_H_
kaldi
This code computes Goodness of Pronunciation (GOP) and extracts phone-level pronunciation feature for...
Definition: chain.dox:20

kaldi::MleAmSgmm2Accs::t_
Matrix< double > t_
[SSGMM] each row is one of the t_i quantities in the less-exact version of the SSGMM update for the s...
Definition: estimate-am-sgmm2.h:205

kaldi::MleAmSgmm2Accs::gamma_c_
std::vector< Vector< double > > gamma_c_
Sub-state occupancies gamma_{jm}^{(c)} for each sub-state.
Definition: estimate-am-sgmm2.h:223

kaldi::UpdateWClass::g_i_
Matrix< double > g_i_
Definition: estimate-am-sgmm2.h:469

kaldi::AmSgmm2
Class for definition of the subspace Gmm acoustic model.
Definition: am-sgmm2.h:231

kaldi::SpMatrix< double >

kaldi::MleAmSgmm2Options::cov_floor
BaseFloat cov_floor
Floor covariance matrices Sigma_i to this times average cov.
Definition: estimate-am-sgmm2.h:44

kaldi::MleAmSgmm2Accs::num_pdfs_
int32 num_pdfs_
Definition: estimate-am-sgmm2.h:234

kaldi-thread.h

kaldi::MleAmSgmm2Accs::spk_space_dim_
int32 spk_space_dim_
Definition: estimate-am-sgmm2.h:233

kaldi::MleAmSgmm2Options::map_M_prior_iters
int map_M_prior_iters
num of iterations to update the prior of M
Definition: estimate-am-sgmm2.h:62

kaldi::UpdateWClass::tot_like_
double tot_like_
Definition: estimate-am-sgmm2.h:471

kaldi::MatrixBase::NumCols
MatrixIndexT NumCols() const
Returns number of columns (or zero for empty matrix).
Definition: kaldi-matrix.h:67

kaldi::UpdatePhoneVectorsClass
Definition: estimate-am-sgmm2.cc:738

kaldi::UpdateWClass::UpdateWClass
UpdateWClass(const UpdateWClass &other)
Definition: estimate-am-sgmm2.h:441

kaldi::MleAmSgmm2Updater::UpdateWGetStats
static void UpdateWGetStats(const MleAmSgmm2Accs &accs, const AmSgmm2 &model, const Matrix< double > &w, const std::vector< Matrix< double > > &log_a, Matrix< double > *F_i, Matrix< double > *g_i, double *tot_like, int32 num_threads, int32 thread_id)
Called, multithreaded, inside UpdateW.
Definition: estimate-am-sgmm2.cc:1258

kaldi::MleAmSgmm2Options::tau_c
BaseFloat tau_c
Smoothing constant for sub-state weights [count to add to each one].
Definition: estimate-am-sgmm2.h:42

kaldi::MleSgmm2SpeakerAccs
Class for the accumulators required to update the speaker vectors v_s.
Definition: estimate-am-sgmm2.h:354

kaldi::MleAmSgmm2Updater::MleAmSgmm2Updater
MleAmSgmm2Updater(const MleAmSgmm2Options &options)
Definition: estimate-am-sgmm2.h:248

kaldi::MleAmSgmm2Accs::total_like_
double total_like_
Definition: estimate-am-sgmm2.h:230

kaldi::MleAmSgmm2Options::renormalize_V
bool renormalize_V
Definition: estimate-am-sgmm2.h:52

kaldi::UpdateWClass::~UpdateWClass
~UpdateWClass()
Definition: estimate-am-sgmm2.h:448

kaldi::MleAmSgmm2Accs::rand_prune_
BaseFloat rand_prune_
Definition: estimate-am-sgmm2.h:236

kaldi::MleSgmm2SpeakerAccs::a_s_
Vector< double > a_s_
a_i^{(s)}. For SSGMM.
Definition: estimate-am-sgmm2.h:406

kaldi::int32
kaldi::int32 int32
Definition: online-tcp-source.cc:27

kaldi::MleAmSgmm2Options::epsilon
BaseFloat epsilon
very small value used to prevent SVD crashing.
Definition: estimate-am-sgmm2.h:58

kaldi::MleAmSgmm2Updater::MleAmSgmm2Updater
MleAmSgmm2Updater()
Definition: estimate-am-sgmm2.h:341

kaldi::MleSgmm2SpeakerAccs::rand_prune_
BaseFloat rand_prune_
small constant to randomly prune tiny posteriors
Definition: estimate-am-sgmm2.h:417

kaldi::Matrix< BaseFloat >

kaldi::MleAmSgmm2Accs::S_
std::vector< SpMatrix< double > > S_
S_{i}^{-}, scatter of adapted feature vectors x_{i}(t). Dim is [I][D][D].
Definition: estimate-am-sgmm2.h:188

kaldi::MleAmSgmm2Accs::gamma_
std::vector< Matrix< double > > gamma_
Gaussian occupancies gamma_{jmi} for each substate and Gaussian index, pooled over groups...
Definition: estimate-am-sgmm2.h:195

KALDI_DISALLOW_COPY_AND_ASSIGN
#define KALDI_DISALLOW_COPY_AND_ASSIGN(type)
Definition: kaldi-utils.h:121

kaldi::MleAmSgmm2Options::full_row_cov
bool full_row_cov
Estimate row covariance instead of using I.
Definition: estimate-am-sgmm2.h:63

kaldi::UpdateWClass::model_
const AmSgmm2 & model_
Definition: estimate-am-sgmm2.h:463

kaldi::UpdateWClass::F_i_ptr_
Matrix< double > * F_i_ptr_
Definition: estimate-am-sgmm2.h:466

kaldi::MleAmSgmm2Updater::options_
MleAmSgmm2Options options_
Definition: estimate-am-sgmm2.h:274

kaldi::OptionsItf::Register
virtual void Register(const std::string &name, bool *ptr, const std::string &doc)=0

kaldi::MleAmSgmm2Options::cov_diag_ratio
BaseFloat cov_diag_ratio
ratio to dim below which we use diagonal. default 2, set to inf for diag.
Definition: estimate-am-sgmm2.h:46

kaldi::MleAmSgmm2Accs::U_
std::vector< SpMatrix< double > > U_
the U_i quantities from the less-exact version of the SSGMM update for the speaker weight projections...
Definition: estimate-am-sgmm2.h:217

kaldi::EbwAmSgmm2Updater
Definition: estimate-am-sgmm2-ebw.h:147

kaldi::MleAmSgmm2Options::Register
void Register(OptionsItf *opts)
Definition: estimate-am-sgmm2.h:84

options-itf.h

kaldi::MleAmSgmm2Updater::Reconfigure
void Reconfigure(const MleAmSgmm2Options &options)
Definition: estimate-am-sgmm2.h:250

kaldi::UpdateWClass
Definition: estimate-am-sgmm2.h:425

kaldi::MleAmSgmm2Options::weight_projections_iters
int weight_projections_iters
Number of iters when re-estimating weight projections "w".
Definition: estimate-am-sgmm2.h:56

kaldi::UpdateWClass::log_a_
const std::vector< Matrix< double > > & log_a_
Definition: estimate-am-sgmm2.h:465

kaldi::MleAmSgmm2Accs::Y_
std::vector< Matrix< double > > Y_
The stats which are not tied to any state.
Definition: estimate-am-sgmm2.h:182

kaldi::SgmmUpdateFlagsType
uint16 SgmmUpdateFlagsType
Bitwise OR of the above flags.
Definition: model-common.h:59

kaldi::MleAmSgmm2Options::full_col_cov
bool full_col_cov
Estimate col covariance instead of using I.
Definition: estimate-am-sgmm2.h:64

kaldi::UpdateWClass::F_i_
Matrix< double > F_i_
Definition: estimate-am-sgmm2.h:468

float

kaldi::MleAmSgmm2Accs::y_
std::vector< Matrix< double > > y_
The SGMM state specific stats.
Definition: estimate-am-sgmm2.h:192

kaldi::MleAmSgmm2Accs::MleAmSgmm2Accs
MleAmSgmm2Accs(BaseFloat rand_prune=1.0e-05)
Definition: estimate-am-sgmm2.h:121

kaldi::MleAmSgmm2Accs::PhoneSpaceDim
int32 PhoneSpaceDim() const
Definition: estimate-am-sgmm2.h:174

kaldi::MleAmSgmm2Options::renormalize_N
bool renormalize_N
Definition: estimate-am-sgmm2.h:53

am-sgmm2.h

kaldi::kNoTrans
Definition: matrix-common.h:34

kaldi::MleAmSgmm2Options::max_impr_u
BaseFloat max_impr_u
max improvement per frame allowed in update of u.
Definition: estimate-am-sgmm2.h:59

kaldi::MleSgmm2SpeakerAccs::NtransSigmaInv_
std::vector< Matrix< double > > NtransSigmaInv_
N_i^T \Sigma_{i}^{-1}. Needed for y^{(s)}.
Definition: estimate-am-sgmm2.h:414

kaldi::UpdateWClass::g_i_ptr_
Matrix< double > * g_i_ptr_
Definition: estimate-am-sgmm2.h:467

kaldi::OptionsItf
Definition: options-itf.h:26

kaldi::MleAmSgmm2Accs::FeatureDim
int32 FeatureDim() const
Definition: estimate-am-sgmm2.h:173

kaldi::UpdateWClass::UpdateWClass
UpdateWClass(const MleAmSgmm2Accs &accs, const AmSgmm2 &model, const Matrix< double > &w, const std::vector< Matrix< double > > &log_a, Matrix< double > *F_i, Matrix< double > *g_i, double *tot_like)
Definition: estimate-am-sgmm2.h:427

kaldi::MleAmSgmm2Accs::a_
std::vector< Matrix< double > > a_
[SSGMM] These a_{jmi} quantities are dimensionally the same as the gamma quantities.
Definition: estimate-am-sgmm2.h:200

kaldi::MleSgmm2SpeakerAccs::y_s_
Vector< double > y_s_
Statistics for speaker adaptation (vectors), stored per-speaker.
Definition: estimate-am-sgmm2.h:402

kaldi::MleSgmm2SpeakerAccs::H_spk_
std::vector< SpMatrix< double > > H_spk_
The following variable does not change per speaker, it just relates to the speaker subspace...
Definition: estimate-am-sgmm2.h:411

kaldi::UpdateWClass::tot_like_ptr_
double * tot_like_ptr_
Definition: estimate-am-sgmm2.h:470

kaldi::MleAmSgmm2Accs::a_s_
Vector< double > a_s_
[SSGMM], this is a per-speaker variable storing the a_i^{(s)} quantities that we will use in order to...
Definition: estimate-am-sgmm2.h:213

kaldi::MleAmSgmm2Options::max_cond
BaseFloat max_cond
Max on condition of matrices in update beyond which we do not update.
Definition: estimate-am-sgmm2.h:50

kaldi::Vector
A class representing a vector.
Definition: kaldi-vector.h:406

kaldi::MleAmSgmm2Accs::R_
std::vector< SpMatrix< double > > R_
R_{i}, quadratic term for speaker subspace estimation. Dim is [I][T][T].
Definition: estimate-am-sgmm2.h:186

kaldi::MatrixBase::NumRows
MatrixIndexT NumRows() const
Returns number of rows (or zero for empty matrix).
Definition: kaldi-matrix.h:64

kaldi::MultiThreadable
Definition: kaldi-thread.h:67

kaldi::Sgmm2PerSpkDerivedVars
Definition: am-sgmm2.h:165

kaldi::UpdateWClass::w_
const Matrix< double > & w_
Definition: estimate-am-sgmm2.h:464

kaldi::MleAmSgmm2Accs::Z_
std::vector< Matrix< double > > Z_
Stats Z_{i} for speaker-subspace projections N. Dim is [I][D][T].
Definition: estimate-am-sgmm2.h:184

kaldi::MleAmSgmm2Options::tau_map_M
BaseFloat tau_map_M
For MAP update of the phonetic subspace M.
Definition: estimate-am-sgmm2.h:61

model-common.h

kaldi::UpdateWClass::accs_
const MleAmSgmm2Accs & accs_
Definition: estimate-am-sgmm2.h:462

kaldi::MleAmSgmm2Accs::NumGroups
int32 NumGroups() const
Definition: estimate-am-sgmm2.h:176

kaldi::MleAmSgmm2Accs::NumGauss
int32 NumGauss() const
Definition: estimate-am-sgmm2.h:177

kaldi::MleAmSgmm2Options
Configuration variables needed in the SGMM estimation process.
Definition: estimate-am-sgmm2.h:40

kaldi::MleAmSgmm2Options::MleAmSgmm2Options
MleAmSgmm2Options()
Definition: estimate-am-sgmm2.h:66

kaldi::MleAmSgmm2Accs
Class for the accumulators associated with the phonetic-subspace model parameters.
Definition: estimate-am-sgmm2.h:119

kaldi::MleSgmm2SpeakerAccs::gamma_s_
Vector< double > gamma_s_
gamma_{i}^{(s)}. Per-speaker counts for each Gaussian. Dimension is [I]
Definition: estimate-am-sgmm2.h:404

kaldi::Sgmm2PerFrameDerivedVars
Holds the per-frame precomputed quantities x(t), x_{i}(t), z_{i}(t), and n_{i}(t) (cf...
Definition: am-sgmm2.h:142

kaldi::MleAmSgmm2Accs::NumPdfs
int32 NumPdfs() const
Definition: estimate-am-sgmm2.h:175

kaldi::MleAmSgmm2Accs::gamma_s_
Vector< double > gamma_s_
gamma_{i}^{(s)}.
Definition: estimate-am-sgmm2.h:228

kaldi::MleAmSgmm2Updater
Definition: estimate-am-sgmm2.h:246

kaldi::MleAmSgmm2Accs::MleAmSgmm2Accs
MleAmSgmm2Accs(const AmSgmm2 &model, SgmmUpdateFlagsType flags, bool have_spk_vecs, BaseFloat rand_prune=1.0e-05)
Definition: estimate-am-sgmm2.h:126