doc/mle-full-gmm-test_8cc_source.html

 // gmm/mle-full-gmm-test.cc

 // Copyright 2009-2011  Jan Silovsky;  Saarland University;
 //                      Microsoft Corporation;   Yanmin Qian;  Georg Stemmer

 // See ../../COPYING for clarification regarding multiple authors
 //
 // Licensed under the Apache License, Version 2.0 (the "License");
 // you may not use this file except in compliance with the License.
 // You may obtain a copy of the License at
 //
 //  http://www.apache.org/licenses/LICENSE-2.0
 //
 // THIS CODE IS PROVIDED *AS IS* BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY
 // KIND, EITHER EXPRESS OR IMPLIED, INCLUDING WITHOUT LIMITATION ANY IMPLIED
 // WARRANTIES OR CONDITIONS OF TITLE, FITNESS FOR A PARTICULAR PURPOSE,
 // MERCHANTABLITY OR NON-INFRINGEMENT.
 // See the Apache 2 License for the specific language governing permissions and
 // limitations under the License.

 #include "gmm/full-gmm.h"
 #include "gmm/diag-gmm.h"
 #include "gmm/model-common.h"
 #include "gmm/mle-full-gmm.h"
 #include "gmm/mle-diag-gmm.h"
 #include "util/stl-utils.h"
 #include "util/kaldi-io.h"

 using namespace kaldi;

 void TestComponentAcc(const FullGmm &gmm, const Matrix<BaseFloat> &feats) {
   MleFullGmmOptions config;
   AccumFullGmm est_atonce;    // updates all components
   AccumFullGmm est_compwise;  // updates single components

   // Initialize estimators
   est_atonce.Resize(gmm.NumGauss(), gmm.Dim(), kGmmAll);
   est_atonce.SetZero(kGmmAll);
   est_compwise.Resize(gmm.NumGauss(),
       gmm.Dim(), kGmmAll);
   est_compwise.SetZero(kGmmAll);

   // accumulate estimators
   for (int32 i = 0; i < feats.NumRows(); i++) {
     est_atonce.AccumulateFromFull(gmm, feats.Row(i), 1.0F);
     Vector<BaseFloat> post(gmm.NumGauss());
     gmm.ComponentPosteriors(feats.Row(i), &post);
     for (int32 m = 0; m < gmm.NumGauss(); m++) {
       est_compwise.AccumulateForComponent(feats.Row(i), m, post(m));
     }
   }

   FullGmm gmm_atonce;    // model with all components accumulated together
   FullGmm gmm_compwise;  // model with each component accumulated separately
   gmm_atonce.Resize(gmm.NumGauss(), gmm.Dim());
   gmm_compwise.Resize(gmm.NumGauss(), gmm.Dim());

   MleFullGmmUpdate(config, est_atonce, kGmmAll, &gmm_atonce, NULL, NULL);
   MleFullGmmUpdate(config, est_compwise, kGmmAll, &gmm_compwise, NULL, NULL);

   // the two ways of updating should result in the same model
   double loglike0 = 0.0;
   double loglike1 = 0.0;
   double loglike2 = 0.0;
   for (int32 i = 0; i < feats.NumRows(); i++) {
     loglike0 += static_cast<double>(gmm.LogLikelihood(feats.Row(i)));
     loglike1 += static_cast<double>(gmm_atonce.LogLikelihood(feats.Row(i)));
     loglike2 += static_cast<double>(gmm_compwise.LogLikelihood(feats.Row(i)));
   }

   std::cout << "Per-frame log-likelihood before update = "
       << (loglike0/feats.NumRows()) << '\n';
   std::cout << "Per-frame log-likelihood (accumulating at once) = "
       << (loglike1/feats.NumRows()) << '\n';
   std::cout << "Per-frame log-likelihood (accumulating component-wise) = "
       << (loglike2/feats.NumRows()) << '\n';

   AssertEqual(loglike1, loglike2, 1.0e-6);

   if (est_atonce.NumGauss() != gmm.NumGauss()) {
     KALDI_WARN << "Unable to pass test_update_flags() test because of "
       "component removal during Update() call (this is normal)";
     return;
   } else {
     KALDI_ASSERT(loglike1 >= loglike0 - (std::abs(loglike1)+std::abs(loglike0))*1.0e-06);
     KALDI_ASSERT(loglike2 >= loglike0 - (std::abs(loglike2)+std::abs(loglike0))*1.0e-06);
   }
 }

 void rand_posdef_spmatrix(size_t dim, SpMatrix<BaseFloat> *matrix,
                           TpMatrix<BaseFloat> *matrix_sqrt = NULL,
                           BaseFloat *logdet = NULL) {
   // generate random (non-singular) matrix
   Matrix<BaseFloat> tmp(dim, dim);
   while (1) {
     tmp.SetRandn();
     if (tmp.Cond() < 100) break;
     std::cout << "Condition number of random matrix large "
       << static_cast<float>(tmp.Cond()) << ", trying again (this is normal)"
       << '\n';
   }
   // tmp * tmp^T will give positive definite matrix
   matrix->AddMat2(1.0, tmp, kNoTrans, 0.0);

   if (matrix_sqrt != NULL) matrix_sqrt->Cholesky(*matrix);
   if (logdet != NULL) *logdet = matrix->LogPosDefDet();
   if ((matrix_sqrt == NULL) && (logdet == NULL)) {
     TpMatrix<BaseFloat> sqrt(dim);
     sqrt.Cholesky(*matrix);
   }
 }

 BaseFloat GetLogLikeTest(const FullGmm &gmm,
                          const VectorBase<BaseFloat> &feats,
                          bool print_eigs) {
   BaseFloat log_like_sum = -1.0e+10;
   Matrix<BaseFloat> means;
   gmm.GetMeans(&means);
   const std::vector<SpMatrix<BaseFloat> > inv_covars = gmm.inv_covars();

   if (print_eigs)
     for (size_t i = 0; i < inv_covars.size(); i++) {
       SpMatrix<BaseFloat> cov(inv_covars[i]);
       size_t dim = cov.NumRows();
       cov.Invert();
       std::cout << i << "'th component eigs are: ";
       Vector<BaseFloat> s(dim);
       Matrix<BaseFloat> P(dim, dim);
       cov.SymPosSemiDefEig(&s, &P);
       std::cout << s;
     }

   for (int32 i = 0; i < gmm.NumGauss(); i++) {
     BaseFloat logdet = -(inv_covars[i].LogPosDefDet());
     BaseFloat log_like = Log(gmm.weights()(i))
       -0.5 * (gmm.Dim() * M_LOG_2PI + logdet);
     Vector<BaseFloat> offset(feats);
     offset.AddVec(-1.0, means.Row(i));
     log_like -= 0.5 * VecSpVec(offset, inv_covars[i], offset);
     log_like_sum = LogAdd(log_like_sum, log_like);
   }
   return log_like_sum;
 }

 void test_flags_driven_update(const FullGmm &gmm,
                               const Matrix<BaseFloat> &feats,
                               GmmFlagsType flags) {
   MleFullGmmOptions config;
   AccumFullGmm est_gmm_allp;   // updates all params
   // let's trust that all-params update works
   AccumFullGmm est_gmm_somep;  // updates params indicated by flags

   // warm-up estimators
   est_gmm_allp.Resize(gmm.NumGauss(), gmm.Dim(), kGmmAll);
   est_gmm_allp.SetZero(kGmmAll);

   est_gmm_somep.Resize(gmm.NumGauss(), gmm.Dim(), flags);
   est_gmm_somep.SetZero(flags);

   // accumulate estimators
   for (int32 i = 0; i < feats.NumRows(); i++) {
     est_gmm_allp.AccumulateFromFull(gmm, feats.Row(i), 1.0F);
     est_gmm_somep.AccumulateFromFull(gmm, feats.Row(i), 1.0F);
   }

   FullGmm gmm_all_update;   // model with all params updated
   FullGmm gmm_some_update;  // model with some params updated
   gmm_all_update.CopyFromFullGmm(gmm);   // init with orig. model
   gmm_some_update.CopyFromFullGmm(gmm);  // init with orig. model

   MleFullGmmUpdate(config, est_gmm_allp, kGmmAll, &gmm_all_update, NULL, NULL);
   MleFullGmmUpdate(config, est_gmm_somep, flags, &gmm_some_update, NULL, NULL);

   if (gmm_all_update.NumGauss() != gmm.NumGauss()) {
     KALDI_WARN << "Unable to pass test_update_flags() test because of "
       "component removal during Update() call (this is normal)";
     return;
   }

   // now back-off the gmm_all_update params that were not updated
   // in gmm_some_update to orig.
   if (~flags & kGmmWeights)
     gmm_all_update.SetWeights(gmm.weights());
   if (~flags & kGmmMeans) {
     Matrix<BaseFloat> means(gmm.NumGauss(), gmm.Dim());
     gmm.GetMeans(&means);
     gmm_all_update.SetMeans(means);
   }
   if (~flags & kGmmVariances) {
     std::vector<SpMatrix<BaseFloat> > vars(gmm.NumGauss());
     for (int32 i = 0; i < gmm.NumGauss(); i++)
       vars[i].Resize(gmm.Dim());
     gmm.GetCovars(&vars);
     for (int32 i = 0; i < gmm.NumGauss(); i++)
       vars[i].InvertDouble();
     gmm_all_update.SetInvCovars(vars);
   }
   gmm_some_update.ComputeGconsts();
   gmm_all_update.ComputeGconsts();

   // now both models gmm_all_update, gmm_all_update have the same params updated
   // compute loglike for models for check
   double loglike0 = 0.0;
   double loglike1 = 0.0;
   double loglike2 = 0.0;
   for (int32 i = 0; i < feats.NumRows(); i++) {
     loglike0 += static_cast<double>(
       gmm.LogLikelihood(feats.Row(i)));
     loglike1 += static_cast<double>(
       gmm_all_update.LogLikelihood(feats.Row(i)));
     loglike2 += static_cast<double>(
       gmm_some_update.LogLikelihood(feats.Row(i)));
   }
   KALDI_LOG << "loglike1 = " << loglike1 << " loglike2 = " << loglike2;
   AssertEqual(loglike1, loglike2, 0.01);
 }

 void
 test_io(const FullGmm &gmm, const AccumFullGmm &est_gmm, bool binary,
         const Matrix<BaseFloat> &feats) {
   std::cout << "Testing I/O, binary = " << binary << '\n';

   est_gmm.Write(Output("tmp_stats", binary).Stream(), binary);

   bool binary_in;
   AccumFullGmm est_gmm2;
   est_gmm2.Resize(gmm.NumGauss(),
     gmm.Dim(), kGmmAll);
   Input ki("tmp_stats", &binary_in);
   est_gmm2.Read(ki.Stream(), binary_in, false);  // not adding

   Input ki2("tmp_stats", &binary_in);
   est_gmm2.Read(ki2.Stream(), binary_in, true);  // adding

   est_gmm2.Scale(0.5, kGmmAll);
     // 0.5 -> make it same as what it would have been if we read just once.
     // [may affect it due to removal of components with small counts].

   MleFullGmmOptions config;
   FullGmm gmm1;
   FullGmm gmm2;
   gmm1.CopyFromFullGmm(gmm);
   gmm2.CopyFromFullGmm(gmm);
   MleFullGmmUpdate(config, est_gmm, est_gmm.Flags(), &gmm1, NULL, NULL);
   MleFullGmmUpdate(config, est_gmm2, est_gmm2.Flags(), &gmm2, NULL, NULL);

   BaseFloat loglike1 = 0.0;
   BaseFloat loglike2 = 0.0;
   for (int32 i = 0; i < feats.NumRows(); i++) {
     loglike1 += gmm1.LogLikelihood(feats.Row(i));
     loglike2 += gmm2.LogLikelihood(feats.Row(i));
   }

   AssertEqual(loglike1, loglike2, 0.01);

   unlink("tmp_stats");
 }

 void
 UnitTestEstimateFullGmm() {
   // using namespace kaldi;

   // dimension of the gmm
   int32 dim = 10;

   // number of mixtures in the data
   int32 nMix = 7;

   // number of iterations for estimation
   int32 maxiterations = 20;

   // maximum number of densities in the GMM
   // larger than the number of mixtures in the data
   // so that we can test the removal of unseen components
   int32 maxcomponents = 50;

   // generate random feature vectors
   // first, generate parameters of vectors distribution
   // (mean and covariance matrices)
   Matrix<BaseFloat> means_f(nMix, dim);
   std::vector<SpMatrix<BaseFloat> > vars_f(nMix);
   std::vector<TpMatrix<BaseFloat> > vars_f_sqrt(nMix);
   for (int32 mix = 0; mix < nMix; mix++) {
     vars_f[mix].Resize(dim);
     vars_f_sqrt[mix].Resize(dim);
   }

   for (int32 m = 0; m < nMix; m++) {
     for (int32 d = 0; d < dim; d++) {
       means_f(m, d) = kaldi::RandGauss();
     }
     rand_posdef_spmatrix(dim, &vars_f[m], &vars_f_sqrt[m], NULL);
   }

   // second, generate 1000 feature vectors for each of the mixture components
   int32 counter = 0, multiple = 200;
   Matrix<BaseFloat> feats(nMix*200, dim);
   Vector<BaseFloat> rnd_vec(dim);
   for (int32 m = 0; m < nMix; m++) {
     for (int32 i = 0; i < multiple; i++) {
       for (int32 d = 0; d < dim; d++) {
         rnd_vec(d) = RandGauss();
       }
       feats.Row(counter).CopyFromVec(means_f.Row(m));
       feats.Row(counter).AddTpVec(1.0, vars_f_sqrt[m], kNoTrans, rnd_vec, 1.0);
       ++counter;
     }
   }

   {
     // Work out "perfect" log-like w/ one component.
     Matrix<BaseFloat> cov(dim, dim);
     Vector<BaseFloat> mean(dim);
     cov.AddMatMat(1.0, feats, kTrans, feats, kNoTrans, 0.0);
     cov.Scale(1.0 / feats.NumRows());
     mean.AddRowSumMat(1.0, feats);
     mean.Scale(1.0 / feats.NumRows());
     cov.AddVecVec(-1.0, mean, mean);
     BaseFloat logdet = cov.LogDet();
     BaseFloat avg_log = -0.5*(logdet + dim*(M_LOG_2PI + 1));
     std::cout << "Avg log-like per frame [full-cov, 1-mix] should be: "
       << avg_log << '\n';
     std::cout << "Total log-like [full-cov, 1-mix] should be: "
       << (feats.NumRows()*avg_log) << '\n';

     Vector<BaseFloat> s(dim);
     Matrix<BaseFloat> P(dim, dim);
     cov.SymPosSemiDefEig(&s, &P);
     std::cout << "Cov eigs are " << s;
   }

   // write the feature vectors to a file
   //  std::ofstream of("tmpfeats");
   //  of.precision(10);
   //  of << feats;
   //  of.close();

   // now generate randomly initial values for the GMM
   Vector<BaseFloat> weights(1);
   Matrix<BaseFloat> means(1, dim);
   std::vector<SpMatrix<BaseFloat> > invcovars(1);
   invcovars[0].Resize(dim);

   for (int32 d = 0; d < dim; d++) {
     means(0, d) = kaldi::RandGauss()*5.0F;
   }
   SpMatrix<BaseFloat> covar(dim);
   rand_posdef_spmatrix(dim, &covar, NULL, NULL);
   covar.AddToDiag(0.1);  // Ensure the condition is reasonable, otherwise
                          // we can get arbitrarily large inverse.
   invcovars[0].CopyFromSp(covar);
   invcovars[0].InvertDouble();
   weights(0) = 1.0F;

   // new GMM
   FullGmm *gmm = new FullGmm();
   gmm->Resize(1, dim);
   gmm->SetWeights(weights);
   gmm->SetInvCovarsAndMeans(invcovars, means);
   gmm->ComputeGconsts();

   {
     KALDI_LOG << "Testing natural<>normal conversion";
     FullGmmNormal ngmm(*gmm);
     FullGmm rgmm;
     rgmm.Resize(1, dim);
     ngmm.CopyToFullGmm(&rgmm, kGmmAll);

     // check contents
     KALDI_ASSERT(ApproxEqual(weights(0), 1.0F, 1e-6));
     KALDI_ASSERT(ApproxEqual(gmm->weights()(0), rgmm.weights()(0), 1e-6));
     double prec_m = 1e-3;
     double prec_v = 1e-3;
     for (int32 d = 0; d < dim; d++) {
       KALDI_ASSERT(std::abs(means.Row(0)(d) -  ngmm.means_.Row(0)(d)) < prec_m);
       KALDI_ASSERT(std::abs(gmm->means_invcovars().Row(0)(d) - rgmm.means_invcovars().Row(0)(d)) < prec_v);
       for (int32 d2 = d; d2 < dim; ++d2) {
         KALDI_ASSERT(std::abs(covar(d, d2) - ngmm.vars_[0](d, d2)) < prec_v);
         KALDI_ASSERT(std::abs(gmm->inv_covars()[0](d, d2) - rgmm.inv_covars()[0](d, d2)) < prec_v);
       }
     }
     KALDI_LOG << "OK";
   }

   MleFullGmmOptions config;
   GmmFlagsType flags_all = kGmmAll;


   AccumFullGmm est_gmm;
   est_gmm.Resize(gmm->NumGauss(), gmm->Dim(), flags_all);

   // iterate
   int32 iteration = 0;
   float lastloglike = 0.0;
   int32 lastloglike_nM = 0;

   while (iteration < maxiterations) {
     // First, resize accums for the case of component splitting
     est_gmm.Resize(gmm->NumGauss(),
       gmm->Dim(), flags_all);
     est_gmm.SetZero(flags_all);
     double loglike = 0.0;
     double loglike_test = 0.0;
     for (int32 i = 0; i < counter; i++) {
       loglike += static_cast<double>(
         est_gmm.AccumulateFromFull(*gmm, feats.Row(i), 1.0F));
       if (iteration < 4) {
         loglike_test += GetLogLikeTest(*gmm, feats.Row(i), (i == 0));
         AssertEqual(loglike, loglike_test);
       }
     }

     std::cout << "Loglikelihood before iteration "
       << iteration << " : " << std::scientific << loglike
       << " number of components: " << gmm->NumGauss() << '\n';

     // std::cout << "Model is: " << *gmm;

     // every 5th iteration check loglike change and update lastloglike
     if (iteration % 5 == 0) {
       // likelihood should be increasing on the long term
       if ((iteration > 0) && (gmm->NumGauss() >= lastloglike_nM)) {
         KALDI_ASSERT(loglike > lastloglike);
       }
       lastloglike = loglike;
       lastloglike_nM = gmm->NumGauss();
     }

     BaseFloat obj, count;
     MleFullGmmUpdate(config, est_gmm, flags_all, gmm, &obj, &count);
     KALDI_LOG << "ML objective function change = " << (obj/count)
               << " per frame, over " << (count) << " frames.";

     // split components to double count at second iteration
     // and every next 3rd iteration
     // stop splitting when maxcomponents reached
     if ( (iteration < maxiterations - 3) && (iteration % 4 == 1)
         && (gmm->NumGauss() * 2 <= maxcomponents)) {
       gmm->Split(gmm->NumGauss() * 2, 0.01);
     }

     if (iteration == 5) {  // run following tests with not too overfitted model
       std::cout << "Testing flags-driven updates kGmmAll" << '\n';
       test_flags_driven_update(*gmm, feats, kGmmAll);
       std::cout << "Testing flags-driven updates kGmmWeights" << '\n';
       test_flags_driven_update(*gmm, feats, kGmmWeights);
       std::cout << "Testing flags-driven kGmmMeans" << '\n';
       test_flags_driven_update(*gmm, feats, kGmmMeans);
       std::cout << "Testing flags-driven kGmmVariances" << '\n';
       test_flags_driven_update(*gmm, feats, kGmmVariances);
       std::cout << "Testing flags-driven kGmmWeights | kGmmMeans" << '\n';
       test_flags_driven_update(*gmm, feats, kGmmWeights | kGmmMeans);
       std::cout << "Testing component-wise accumulation" << '\n';
       TestComponentAcc(*gmm, feats);
     }

     iteration++;
   }

   {  // I/O tests
     GmmFlagsType flags_all = kGmmAll;
     est_gmm.Resize(gmm->NumGauss(),
       gmm->Dim(), flags_all);
     est_gmm.SetZero(flags_all);
     float loglike = 0.0;
     for (int32 i = 0; i < counter; i++) {
       loglike += est_gmm.AccumulateFromFull(*gmm, feats.Row(i), 1.0F);
     }
     test_io(*gmm, est_gmm, false, feats);
     test_io(*gmm, est_gmm, true, feats);
   }

   delete gmm;
   gmm = NULL;
 }

 int
 main() {
   // repeat the test five times
   for (int i = 0; i < 2; i++)
     UnitTestEstimateFullGmm();
   std::cout << "Test OK.\n";
 }
kaldi::AccumFullGmm::Write
void Write(std::ostream &out_stream, bool binary) const
Definition: mle-full-gmm.cc:230

kaldi::SpMatrix::AddMat2
void AddMat2(const Real alpha, const MatrixBase< Real > &M, MatrixTransposeType transM, const Real beta)
rank-N update: if (transM == kNoTrans) (*this) = beta*(*this) + alpha * M * M^T, or (if transM == kTr...
Definition: sp-matrix.cc:1110

kaldi
This code computes Goodness of Pronunciation (GOP) and extracts phone-level pronunciation feature for...
Definition: chain.dox:20

kaldi::FullGmm::SetWeights
void SetWeights(const Vector< Real > &w)
Mutators for both float or double.
Definition: full-gmm-inl.h:31

test_io
void test_io(const FullGmm &gmm, const AccumFullGmm &est_gmm, bool binary, const Matrix< BaseFloat > &feats)
Definition: mle-full-gmm-test.cc:219

kaldi::SpMatrix
Packed symetric matrix class.
Definition: matrix-common.h:62

rand_posdef_spmatrix
void rand_posdef_spmatrix(size_t dim, SpMatrix< BaseFloat > *matrix, TpMatrix< BaseFloat > *matrix_sqrt=NULL, BaseFloat *logdet=NULL)
Definition: mle-full-gmm-test.cc:90

kaldi::FullGmm::inv_covars
const std::vector< SpMatrix< BaseFloat > > & inv_covars() const
Definition: full-gmm.h:146

stl-utils.h

M_LOG_2PI
#define M_LOG_2PI
Definition: kaldi-math.h:60

kaldi::AccumFullGmm::NumGauss
int32 NumGauss() const
Returns the number of mixture components.
Definition: mle-full-gmm.h:97

diag-gmm.h

kaldi::Input
Definition: kaldi-io.h:190

kaldi::VectorBase::AddRowSumMat
void AddRowSumMat(Real alpha, const MatrixBase< Real > &M, Real beta=1.0)
Does *this = alpha * (sum of rows of M) + beta * *this.
Definition: kaldi-vector.cc:714

kaldi::FullGmm::ComponentPosteriors
BaseFloat ComponentPosteriors(const VectorBase< BaseFloat > &data, VectorBase< BaseFloat > *posterior) const
Computes the posterior probabilities of all Gaussian components given a data point.
Definition: full-gmm.cc:719

kaldi::FullGmm::Dim
int32 Dim() const
Returns the dimensionality of the Gaussian mean vectors.
Definition: full-gmm.h:60

kaldi::FullGmmNormal
Definition for Gaussian Mixture Model with full covariances in normal mode: where the parameters are ...
Definition: full-gmm-normal.h:45

kaldi::MatrixBase::Cond
Real Cond() const
Returns condition number by computing Svd.
Definition: kaldi-matrix.cc:1696

kaldi::MleFullGmmOptions
Configuration variables like variance floor, minimum occupancy, etc.
Definition: mle-full-gmm.h:38

kaldi::FullGmm::ComputeGconsts
int32 ComputeGconsts()
Sets the gconsts.
Definition: full-gmm.cc:92

kaldi::FullGmm::Split
void Split(int32 target_components, float perturb_factor, std::vector< int32 > *history=NULL)
Merge the components and remember the order in which the components were merged (flat list of pairs) ...
Definition: full-gmm.cc:132

kaldi::FullGmm
Definition for Gaussian Mixture Model with full covariances.
Definition: full-gmm.h:40

mle-diag-gmm.h

kaldi::MatrixBase::SymPosSemiDefEig
void SymPosSemiDefEig(VectorBase< Real > *s, MatrixBase< Real > *P, Real check_thresh=0.001)
Uses Svd to compute the eigenvalue decomposition of a symmetric positive semi-definite matrix: (*this...
Definition: kaldi-matrix.cc:1996

main
int main()
Definition: mle-full-gmm-test.cc:478

kaldi::FullGmm::SetInvCovarsAndMeans
void SetInvCovarsAndMeans(const std::vector< SpMatrix< Real > > &invcovars, const Matrix< Real > &means)
Use SetInvCovarsAndMeans if updating both means and (inverse) covariances.
Definition: full-gmm-inl.h:50

kaldi::RandGauss
float RandGauss(struct RandomState *state=NULL)
Definition: kaldi-math.h:155

kaldi::int32
kaldi::int32 int32
Definition: online-tcp-source.cc:27

kaldi::Matrix< BaseFloat >

kaldi::GmmFlagsType
uint16 GmmFlagsType
Bitwise OR of the above flags.
Definition: model-common.h:35

kaldi::AccumFullGmm::SetZero
void SetZero(GmmFlagsType flags)
Definition: mle-full-gmm.cc:63

kaldi::AccumFullGmm::Flags
GmmFlagsType Flags() const
Accessors.
Definition: mle-full-gmm.h:126

kaldi::PackedMatrix::NumRows
MatrixIndexT NumRows() const
Definition: packed-matrix.h:104

kaldi::FullGmm::GetCovars
void GetCovars(std::vector< SpMatrix< Real > > *v) const
Accessor for covariances.
Definition: full-gmm-inl.h:106

kaldi::FullGmmNormal::vars_
std::vector< SpMatrix< double > > vars_
covariances
Definition: full-gmm-normal.h:68

kaldi::kTrans
Definition: matrix-common.h:33

mle-full-gmm.h

kaldi::AccumFullGmm::Resize
void Resize(int32 num_components, int32 dim, GmmFlagsType flags)
Allocates memory for accumulators.
Definition: mle-full-gmm.cc:37

full-gmm.h

kaldi::PackedMatrix::AddToDiag
void AddToDiag(const Real r)
Definition: packed-matrix.cc:123

count
const size_t count
Definition: arpa-file-parser-test.cc:66

kaldi::FullGmm::CopyFromFullGmm
void CopyFromFullGmm(const FullGmm &fullgmm)
Copies from given FullGmm.
Definition: full-gmm.cc:65

kaldi::Input::Stream
std::istream & Stream()
Definition: kaldi-io.cc:826

kaldi::TpMatrix::Cholesky
void Cholesky(const SpMatrix< Real > &orig)
Definition: tp-matrix.cc:88

kaldi::BaseFloat
float BaseFloat
Definition: kaldi-types.h:29

kaldi::kGmmMeans
Definition: model-common.h:29

kaldi::FullGmm::Resize
void Resize(int32 nMix, int32 dim)
Resizes arrays to this dim. Does not initialize data.
Definition: full-gmm.cc:41

test_flags_driven_update
void test_flags_driven_update(const FullGmm &gmm, const Matrix< BaseFloat > &feats, GmmFlagsType flags)
Definition: mle-full-gmm-test.cc:145

kaldi::SpMatrix::LogPosDefDet
Real LogPosDefDet() const
Computes log determinant but only for +ve-def matrices (it uses Cholesky).
Definition: sp-matrix.cc:36

kaldi::MatrixBase::Row
const SubVector< Real > Row(MatrixIndexT i) const
Return specific row of matrix [const].
Definition: kaldi-matrix.h:188

kaldi::Log
double Log(double x)
Definition: kaldi-math.h:100

kaldi::kGmmVariances
Definition: model-common.h:30

kaldi::MatrixBase::Scale
void Scale(Real alpha)
Multiply each element with a scalar value.
Definition: kaldi-matrix.cc:1209

kaldi-io.h

UnitTestEstimateFullGmm
void UnitTestEstimateFullGmm()
Definition: mle-full-gmm-test.cc:260

kaldi::MleFullGmmUpdate
void MleFullGmmUpdate(const MleFullGmmOptions &config, const AccumFullGmm &fullgmm_acc, GmmFlagsType flags, FullGmm *gmm, BaseFloat *obj_change_out, BaseFloat *count_out)
for computing the maximum-likelihood estimates of the parameters of a Gaussian mixture model...
Definition: mle-full-gmm.cc:282

kaldi::MatrixBase::SetRandn
void SetRandn()
Sets to random values of a normal distribution.
Definition: kaldi-matrix.cc:1355

kaldi::MatrixBase::AddMatMat
void AddMatMat(const Real alpha, const MatrixBase< Real > &A, MatrixTransposeType transA, const MatrixBase< Real > &B, MatrixTransposeType transB, const Real beta)
Definition: kaldi-matrix.cc:171

kaldi::kNoTrans
Definition: matrix-common.h:34

kaldi::AccumFullGmm
Class for computing the maximum-likelihood estimates of the parameters of a Gaussian mixture model...
Definition: mle-full-gmm.h:74

kaldi::VecSpVec
Real VecSpVec(const VectorBase< Real > &v1, const SpMatrix< Real > &M, const VectorBase< Real > &v2)
Computes v1^T * M * v2.
Definition: sp-matrix.cc:964

kaldi::TpMatrix
Packed symetric matrix class.
Definition: matrix-common.h:63

GetLogLikeTest
BaseFloat GetLogLikeTest(const FullGmm &gmm, const VectorBase< BaseFloat > &feats, bool print_eigs)
Definition: mle-full-gmm-test.cc:113

KALDI_WARN
#define KALDI_WARN
Definition: kaldi-error.h:150

kaldi::FullGmmNormal::CopyToFullGmm
void CopyToFullGmm(FullGmm *fullgmm, GmmFlagsType flags=kGmmAll)
Copies to FullGmm.
Definition: full-gmm-normal.cc:76

kaldi::FullGmm::NumGauss
int32 NumGauss() const
Returns the number of mixture components in the GMM.
Definition: full-gmm.h:58

kaldi::VectorBase::Scale
void Scale(Real alpha)
Multiplies all elements by this constant.
Definition: kaldi-vector.cc:963

kaldi::FullGmm::weights
const Vector< BaseFloat > & weights() const
Definition: full-gmm.h:144

kaldi::kGmmAll
Definition: model-common.h:33

kaldi::AccumFullGmm::Read
void Read(std::istream &in_stream, bool binary, bool add)
Definition: mle-full-gmm.cc:171

kaldi::LogAdd
double LogAdd(double x, double y)
Definition: kaldi-math.h:184

kaldi::FullGmm::GetMeans
void GetMeans(Matrix< Real > *m) const
Accessor for means.
Definition: full-gmm-inl.h:118

TestComponentAcc
void TestComponentAcc(const FullGmm &gmm, const Matrix< BaseFloat > &feats)
Definition: mle-full-gmm-test.cc:31

rnnlm::i
int i
Definition: mikolov-rnnlm-lib.cc:66

kaldi::FullGmm::SetInvCovars
void SetInvCovars(const std::vector< SpMatrix< Real > > &v)
Set the (inverse) covariances and recompute means_invcovars_.
Definition: full-gmm-inl.h:83

kaldi::Vector
A class representing a vector.
Definition: kaldi-vector.h:406

KALDI_ASSERT
#define KALDI_ASSERT(cond)
Definition: kaldi-error.h:185

kaldi::MatrixBase::NumRows
MatrixIndexT NumRows() const
Returns number of rows (or zero for empty matrix).
Definition: kaldi-matrix.h:64

kaldi::MatrixBase::LogDet
Real LogDet(Real *det_sign=NULL) const
Returns logdet of matrix.
Definition: kaldi-matrix.cc:2038

kaldi::MatrixBase::AddVecVec
void AddVecVec(const Real alpha, const VectorBase< OtherReal > &a, const VectorBase< OtherReal > &b)
*this += alpha * a * b^T
Definition: kaldi-matrix.cc:129

kaldi::AssertEqual
static void AssertEqual(float a, float b, float relative_tolerance=0.001)
assert abs(a - b) <= relative_tolerance * (abs(a)+abs(b))
Definition: kaldi-math.h:276

kaldi::Output
Definition: kaldi-io.h:124

model-common.h

kaldi::AccumFullGmm::AccumulateFromFull
BaseFloat AccumulateFromFull(const FullGmm &gmm, const VectorBase< BaseFloat > &data, BaseFloat frame_posterior)
Accumulate for all components given a full-covariance GMM.
Definition: mle-full-gmm.cc:143

kaldi::kGmmWeights
Definition: model-common.h:31

kaldi::FullGmm::means_invcovars
const Matrix< BaseFloat > & means_invcovars() const
Definition: full-gmm.h:145

kaldi::SpMatrix::SymPosSemiDefEig
void SymPosSemiDefEig(VectorBase< Real > *s, MatrixBase< Real > *P, Real tolerance=0.001) const
This is the version of SVD that we implement for symmetric positive definite matrices.
Definition: sp-matrix.cc:57

kaldi::VectorBase
Provides a vector abstraction class.
Definition: kaldi-vector.h:41

kaldi::FullGmmNormal::means_
Matrix< double > means_
Means.
Definition: full-gmm-normal.h:67

kaldi::SpMatrix::Invert
void Invert(Real *logdet=NULL, Real *det_sign=NULL, bool inverse_needed=true)
matrix inverse.
Definition: sp-matrix.cc:219

KALDI_LOG
#define KALDI_LOG
Definition: kaldi-error.h:153

kaldi::VectorBase::AddVec
void AddVec(const Real alpha, const VectorBase< OtherReal > &v)
Add vector : *this = *this + alpha * rv (with casting between floats and doubles) ...
Definition: kaldi-vector.cc:1044

kaldi::FullGmm::LogLikelihood
BaseFloat LogLikelihood(const VectorBase< BaseFloat > &data) const
Returns the log-likelihood of a data point (vector) given the GMM.
Definition: full-gmm.cc:582

kaldi::FullGmm::SetMeans
void SetMeans(const Matrix< Real > &m)
Use SetMeans to update only the Gaussian means (and not variances)
Definition: full-gmm-inl.h:38

kaldi::ApproxEqual
static bool ApproxEqual(float a, float b, float relative_tolerance=0.001)
return abs(a - b) <= relative_tolerance * (abs(a)+abs(b)).
Definition: kaldi-math.h:265

kaldi::AccumFullGmm::Scale
void Scale(BaseFloat f, GmmFlagsType flags)
Definition: mle-full-gmm.cc:79

rnnlm::d
double d
Definition: mikolov-rnnlm-lib.cc:64

kaldi::AccumFullGmm::AccumulateForComponent
void AccumulateForComponent(const VectorBase< BaseFloat > &data, int32 comp_index, BaseFloat weight)
Accumulate for a single component, given the posterior.
Definition: mle-full-gmm.cc:96