doc/estimate-am-sgmm2-test_8cc_source.html

 // sgmm2/estimate-am-sgmm2-test.cc

 // Copyright 2009-2011  Saarland University (author:  Arnab Ghoshal)
 //           2012-2013  Johns Hopkins University (author: Daniel Povey)
 //                      Arnab Ghoshal

 // See ../../COPYING for clarification regarding multiple authors
 //
 // Licensed under the Apache License, Version 2.0 (the "License");
 // you may not use this file except in compliance with the License.
 // You may obtain a copy of the License at
 //
 //  http://www.apache.org/licenses/LICENSE-2.0
 //
 // THIS CODE IS PROVIDED *AS IS* BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY
 // KIND, EITHER EXPRESS OR IMPLIED, INCLUDING WITHOUT LIMITATION ANY IMPLIED
 // WARRANTIES OR CONDITIONS OF TITLE, FITNESS FOR A PARTICULAR PURPOSE,
 // MERCHANTABLITY OR NON-INFRINGEMENT.
 // See the Apache 2 License for the specific language governing permissions and
 // limitations under the License.

 #include "base/kaldi-math.h"
 #include "gmm/model-test-common.h"
 #include "sgmm2/am-sgmm2.h"
 #include "sgmm2/estimate-am-sgmm2.h"
 #include "util/kaldi-io.h"

 using kaldi::AmSgmm2;
 using kaldi::MleAmSgmm2Accs;
 using kaldi::int32;
 using kaldi::BaseFloat;
 using kaldi::Exp;

 namespace ut = kaldi::unittest;

 // Tests the Read() and Write() methods for the accumulators, in both binary
 // and ASCII mode, as well as Check().
 //
 // Procedure:
 //   1. Accumulate statistics over every row of `feats` against `sgmm`.
 //   2. Update a copy of `sgmm` from the in-memory statistics and record the
 //      log-likelihood of the first frame as the reference value.
 //   3. Write the statistics to "tmpf" (text) and "tmpfb" (binary), read each
 //      back, run Check(), repeat the update on a fresh copy of `sgmm`, and
 //      require the first-frame log-likelihood to match the reference.
 //   4. Run one more update with the MAP prior on M enabled (tau_map_M = 10)
 //      and randomly chosen row/column covariance options; nothing is asserted
 //      on its result.
 //
 // sgmm:  the model the statistics are accumulated against.  It is never
 //        modified; every update is applied to a copy.
 // feats: one feature vector per row.  Row 0 is used for the likelihood
 //        comparison, so the matrix must have at least one row.
 //
 // Side effects: creates and then removes the files "tmpf" and "tmpfb" in the
 // current working directory.
 void TestSgmm2AccsIO(const AmSgmm2 &sgmm,
                      const kaldi::Matrix<BaseFloat> &feats) {
   using namespace kaldi;
   // Update every parameter type except the speaker weight projections.
   kaldi::SgmmUpdateFlagsType flags = kaldi::kSgmmAll & ~kSgmmSpeakerWeightProjections;
   kaldi::Sgmm2PerFrameDerivedVars frame_vars;
   kaldi::Sgmm2PerSpkDerivedVars empty;  // default-constructed speaker vars
   frame_vars.Resize(sgmm.NumGauss(), sgmm.FeatureDim(),
                     sgmm.PhoneSpaceDim());
   kaldi::Sgmm2GselectConfig sgmm_config;
   // The test model may have fewer Gaussians than the default n-best size.
   sgmm_config.full_gmm_nbest = std::min(sgmm_config.full_gmm_nbest,
                                         sgmm.NumGauss());
   MleAmSgmm2Accs accs(sgmm, flags, true);

   // Accumulate statistics for all frames.  The arguments 0 and 1.0 are
   // presumably the pdf index and the frame weight (TODO confirm against
   // MleAmSgmm2Accs::Accumulate); the returned value is not needed here.
   for (int32 i = 0; i < feats.NumRows(); i++) {
     std::vector<int32> gselect;
     sgmm.GaussianSelection(sgmm_config, feats.Row(i), &gselect);
     sgmm.ComputePerFrameVars(feats.Row(i), gselect, empty, &frame_vars);
     accs.Accumulate(sgmm, frame_vars, 0, 1.0, &empty);
   }
   accs.CommitStatsForSpk(sgmm, empty);

   kaldi::MleAmSgmm2Options update_opts;
   kaldi::MleAmSgmm2Updater updater(update_opts);
   std::vector<int32> gselect;

   // Reference: update from the in-memory accumulators and score frame 0.
   BaseFloat loglike1;
   {
     AmSgmm2 sgmm1;
     sgmm1.CopyFromSgmm2(sgmm, false, false);
     updater.Update(accs, &sgmm1, flags);
     sgmm1.ComputeDerivedVars();
     Sgmm2LikelihoodCache like_cache(sgmm.NumGroups(), sgmm.NumPdfs());

     sgmm1.GaussianSelection(sgmm_config, feats.Row(0), &gselect);
     sgmm1.ComputePerFrameVars(feats.Row(0), gselect, empty, &frame_vars);
     loglike1 = sgmm1.LogLikelihood(frame_vars, 0, &like_cache, &empty);
   }

   {
     // First, non-binary write.  The temporary Output is destroyed at the end
     // of the statement, so the file is complete before it is read back.
     accs.Write(kaldi::Output("tmpf", false).Stream(), false);
     bool binary_in;
     MleAmSgmm2Accs accs1;
     // Non-binary read
     kaldi::Input ki1("tmpf", &binary_in);
     accs1.Read(ki1.Stream(), binary_in, false);
     accs1.Check(sgmm, true);
     AmSgmm2 sgmm2;
     sgmm2.CopyFromSgmm2(sgmm, false, false);
     updater.Update(accs1, &sgmm2, flags);
     sgmm2.ComputeDerivedVars();
     sgmm2.GaussianSelection(sgmm_config, feats.Row(0), &gselect);
     sgmm2.ComputePerFrameVars(feats.Row(0), gselect, empty, &frame_vars);
     Sgmm2LikelihoodCache like_cache2(sgmm2.NumGroups(), sgmm2.NumPdfs());
     BaseFloat loglike2 = sgmm2.LogLikelihood(frame_vars, 0, &like_cache2, &empty);
     // Looser tolerance than the binary case below.
     kaldi::AssertEqual(loglike1, loglike2, 1e-4);
   }

   {
     // Next, binary write
     accs.Write(kaldi::Output("tmpfb", true).Stream(), true);
     bool binary_in;
     MleAmSgmm2Accs accs2;
     // Binary read
     kaldi::Input ki2("tmpfb", &binary_in);
     accs2.Read(ki2.Stream(), binary_in, false);
     accs2.Check(sgmm, true);
     AmSgmm2 sgmm3;
     sgmm3.CopyFromSgmm2(sgmm, false, false);
     updater.Update(accs2, &sgmm3, flags);
     sgmm3.ComputeDerivedVars();
     sgmm3.GaussianSelection(sgmm_config, feats.Row(0), &gselect);
     sgmm3.ComputePerFrameVars(feats.Row(0), gselect, empty, &frame_vars);
     Sgmm2LikelihoodCache like_cache3(sgmm3.NumGroups(), sgmm3.NumPdfs());
     BaseFloat loglike3 = sgmm3.LogLikelihood(frame_vars, 0, &like_cache3, &empty);
     kaldi::AssertEqual(loglike1, loglike3, 1e-6);

     // Testing the MAP update of M
     update_opts.tau_map_M = 10;
     update_opts.full_col_cov = (RandUniform() > 0.5);
     update_opts.full_row_cov = (RandUniform() > 0.5);
     kaldi::MleAmSgmm2Updater updater_map(update_opts);
     sgmm3.CopyFromSgmm2(sgmm, false, false);
     updater_map.Update(accs2, &sgmm3, flags);
   }

   // Both Input objects went out of scope above, so neither file is still
   // held open by this function when it is removed.
   unlink("tmpf");
   unlink("tmpfb");
 }

 void UnitTestEstimateSgmm2() {
   int32 dim = 1 + kaldi::RandInt(0, 9);  // random dimension of the gmm
   int32 num_comp = 2 + kaldi::RandInt(0, 9);  // random mixture size
   kaldi::FullGmm full_gmm;
   ut::InitRandFullGmm(dim, num_comp, &full_gmm);

   AmSgmm2 sgmm;
   kaldi::Sgmm2GselectConfig config;
   std::vector<int32> pdf2group;
   pdf2group.push_back(0);
   sgmm.InitializeFromFullGmm(full_gmm, pdf2group, dim+1, dim, false, 0.9); // TODO-- make this true!
   sgmm.ComputeNormalizers();

   kaldi::Matrix<BaseFloat> feats;

   {  // First, generate random means and variances
     int32 num_feat_comp = num_comp + kaldi::RandInt(-num_comp/2, num_comp/2);
     kaldi::Matrix<BaseFloat> means(num_feat_comp, dim),
         vars(num_feat_comp, dim);
     for (int32 m = 0; m < num_feat_comp; m++) {
       for (int32 d= 0; d < dim; d++) {
         means(m, d) = kaldi::RandGauss();
         vars(m, d) = Exp(kaldi::RandGauss()) + 1e-2;
       }
     }
     // Now generate random features with those means and variances.
     feats.Resize(num_feat_comp * 200, dim);
     for (int32 m = 0; m < num_feat_comp; m++) {
       kaldi::SubMatrix<BaseFloat> tmp(feats, m*200, 200, 0, dim);
       ut::RandDiagGaussFeatures(200, means.Row(m), vars.Row(m), &tmp);
     }
   }
   sgmm.ComputeDerivedVars();
   TestSgmm2AccsIO(sgmm, feats);
 }

 // Test driver: runs the randomized SGMM2 estimation test ten times, then
 // prints a success message and returns 0.
 int main() {
   const int kNumTrials = 10;
   int trial = 0;
   while (trial < kNumTrials) {
     UnitTestEstimateSgmm2();
     ++trial;
   }
   std::cout << "Test OK.\n";
   return 0;
 }
kaldi
This code computes Goodness of Pronunciation (GOP) and extracts phone-level pronunciation feature for...
Definition: chain.dox:20

kaldi::Exp
double Exp(double x)
Definition: kaldi-math.h:83

kaldi::AmSgmm2::Write
void Write(std::ostream &os, bool binary, SgmmWriteFlagsType write_params) const
Definition: am-sgmm2.cc:203

kaldi::AmSgmm2
Class for definition of the subspace Gmm acoustic model.
Definition: am-sgmm2.h:231

kaldi::Input
Definition: kaldi-io.h:190

kaldi::AmSgmm2::CopyFromSgmm2
void CopyFromSgmm2(const AmSgmm2 &other, bool copy_normalizers, bool copy_weights)
Used to copy models (useful in update)
Definition: am-sgmm2.cc:415

kaldi::RandUniform
float RandUniform(struct RandomState *state=NULL)
Returns a random number strictly between 0 and 1.
Definition: kaldi-math.h:151

UnitTestEstimateSgmm2
void UnitTestEstimateSgmm2()
Definition: estimate-am-sgmm2-test.cc:126

kaldi::FullGmm
Definition for Gaussian Mixture Model with full covariances.
Definition: full-gmm.h:40

kaldi::MleAmSgmm2Accs::Read
void Read(std::istream &in_stream, bool binary, bool add)
Definition: estimate-am-sgmm2.cc:122

kaldi::AmSgmm2::InitializeFromFullGmm
void InitializeFromFullGmm(const FullGmm &gmm, const std::vector< int32 > &pdf2group, int32 phn_subspace_dim, int32 spk_subspace_dim, bool speaker_dependent_weights, BaseFloat self_weight)
Initializes the SGMM parameters from a full-covariance UBM.
Definition: am-sgmm2.cc:381

model-test-common.h

kaldi::RandGauss
float RandGauss(struct RandomState *state=NULL)
Definition: kaldi-math.h:155

kaldi::int32
kaldi::int32 int32
Definition: online-tcp-source.cc:27

kaldi::Matrix< BaseFloat >

TestSgmm2AccsIO
void TestSgmm2AccsIO(const AmSgmm2 &sgmm, const kaldi::Matrix< BaseFloat > &feats)
Definition: estimate-am-sgmm2-test.cc:38

kaldi-math.h

kaldi::AmSgmm2::PhoneSpaceDim
int32 PhoneSpaceDim() const
Definition: am-sgmm2.h:361

kaldi::MleAmSgmm2Options::full_row_cov
bool full_row_cov
Estimate row covariance instead of using I.
Definition: estimate-am-sgmm2.h:63

kaldi::MleAmSgmm2Updater::Update
void Update(const MleAmSgmm2Accs &accs, AmSgmm2 *model, SgmmUpdateFlagsType flags)
Definition: estimate-am-sgmm2.cc:612

kaldi::AmSgmm2::FeatureDim
int32 FeatureDim() const
Definition: am-sgmm2.h:363

kaldi::Input::Stream
std::istream & Stream()
Definition: kaldi-io.cc:826

kaldi::AmSgmm2::NumGroups
int32 NumGroups() const
Definition: am-sgmm2.h:351

kaldi::kSgmmSpeakerWeightProjections
t .. not really part of SGMM.
Definition: model-common.h:55

kaldi::BaseFloat
float BaseFloat
Definition: kaldi-types.h:29

kaldi::AmSgmm2::LogLikelihood
BaseFloat LogLikelihood(const Sgmm2PerFrameDerivedVars &per_frame_vars, int32 j2, Sgmm2LikelihoodCache *cache, Sgmm2PerSpkDerivedVars *spk_vars, BaseFloat log_prune=0.0) const
This does a likelihood computation for a given state using the pre-selected Gaussian components (in p...
Definition: am-sgmm2.cc:517

kaldi::SgmmUpdateFlagsType
uint16 SgmmUpdateFlagsType
Bitwise OR of the above flags.
Definition: model-common.h:59

kaldi::MleAmSgmm2Options::full_col_cov
bool full_col_cov
Estimate col covariance instead of using I.
Definition: estimate-am-sgmm2.h:64

kaldi::MatrixBase::Row
const SubVector< Real > Row(MatrixIndexT i) const
Return specific row of matrix [const].
Definition: kaldi-matrix.h:188

main
int main()
Definition: estimate-am-sgmm2-test.cc:162

kaldi-io.h

kaldi::AmSgmm2::GaussianSelection
BaseFloat GaussianSelection(const Sgmm2GselectConfig &config, const VectorBase< BaseFloat > &data, std::vector< int32 > *gselect) const
Computes the top-scoring Gaussian indices (used for pruning of later stages of computation).
Definition: am-sgmm2.cc:1406

kaldi::AmSgmm2::NumPdfs
int32 NumPdfs() const
Various model dimensions.
Definition: am-sgmm2.h:350

kaldi::Sgmm2GselectConfig::full_gmm_nbest
int32 full_gmm_nbest
Number of highest-scoring full-covariance Gaussians per frame.
Definition: am-sgmm2.h:120

am-sgmm2.h

kaldi::AmSgmm2::ComputePerFrameVars
void ComputePerFrameVars(const VectorBase< BaseFloat > &data, const std::vector< int32 > &gselect, const Sgmm2PerSpkDerivedVars &spk_vars, Sgmm2PerFrameDerivedVars *per_frame_vars) const
This needs to be called with each new frame of data, prior to accumulation or likelihood evaluation: ...
Definition: am-sgmm2.cc:442

kaldi::Sgmm2PerFrameDerivedVars::Resize
void Resize(int32 ngauss, int32 feat_dim, int32 phn_dim)
Definition: am-sgmm2.h:151

kaldi::AmSgmm2::NumGauss
int32 NumGauss() const
Definition: am-sgmm2.h:360

kaldi::Sgmm2GselectConfig
Definition: am-sgmm2.h:118

estimate-am-sgmm2.h

kaldi::MleAmSgmm2Accs::Write
void Write(std::ostream &out_stream, bool binary) const
Definition: estimate-am-sgmm2.cc:34

rnnlm::i
int i
Definition: mikolov-rnnlm-lib.cc:66

kaldi::unittest::InitRandFullGmm
void InitRandFullGmm(int32 dim, int32 num_comp, FullGmm *gmm)
Definition: model-test-common.cc:110

kaldi::MatrixBase::NumRows
MatrixIndexT NumRows() const
Returns number of rows (or zero for empty matrix).
Definition: kaldi-matrix.h:64

kaldi::Sgmm2PerSpkDerivedVars
Definition: am-sgmm2.h:165

kaldi::AmSgmm2::ComputeDerivedVars
void ComputeDerivedVars()
Computes (and initializes if necessary) derived vars...
Definition: am-sgmm2.cc:810

kaldi::AmSgmm2::ComputeNormalizers
void ComputeNormalizers()
Computes the data-independent terms in the log-likelihood computation for each Gaussian component and...
Definition: am-sgmm2.cc:857

kaldi::AssertEqual
static void AssertEqual(float a, float b, float relative_tolerance=0.001)
assert abs(a - b) <= relative_tolerance * (abs(a)+abs(b))
Definition: kaldi-math.h:276

kaldi::Sgmm2LikelihoodCache
Sgmm2LikelihoodCache caches SGMM likelihoods at two levels: the final pdf likelihoods, and the sub-state level likelihoods, which means that with the SCTM system we can avoid redundant computation.
Definition: am-sgmm2.h:199

kaldi::MleAmSgmm2Options::tau_map_M
BaseFloat tau_map_M
For MAP update of the phonetic subspace M.
Definition: estimate-am-sgmm2.h:61

kaldi::unittest::RandDiagGaussFeatures
void RandDiagGaussFeatures(int32 num_samples, const VectorBase< BaseFloat > &mean, const VectorBase< BaseFloat > &sqrt_var, MatrixBase< BaseFloat > *feats)
Definition: model-test-common.cc:52

kaldi::Output
Definition: kaldi-io.h:124

kaldi::Matrix::Resize
void Resize(const MatrixIndexT r, const MatrixIndexT c, MatrixResizeType resize_type=kSetZero, MatrixStrideType stride_type=kDefaultStride)
Sets matrix to a specified size (zero is OK as long as both r and c are zero).
Definition: kaldi-matrix.cc:819

kaldi::MleAmSgmm2Accs::Check
void Check(const AmSgmm2 &model, bool show_properties=true) const
Checks the various accumulators for correct sizes given a model.
Definition: estimate-am-sgmm2.cc:213

kaldi::MleAmSgmm2Options
Configuration variables needed in the SGMM estimation process.
Definition: estimate-am-sgmm2.h:40

kaldi::unittest
Definition: model-test-common.cc:28

kaldi::MleAmSgmm2Accs
Class for the accumulators associated with the phonetic-subspace model parameters.
Definition: estimate-am-sgmm2.h:119

kaldi::Sgmm2PerFrameDerivedVars
Holds the per-frame precomputed quantities x(t), x_{i}(t), z_{i}(t), and n_{i}(t) (cf...
Definition: am-sgmm2.h:142

kaldi::SubMatrix
Sub-matrix representation.
Definition: kaldi-matrix.h:988

kaldi::MleAmSgmm2Updater
Definition: estimate-am-sgmm2.h:246

rnnlm::d
double d
Definition: mikolov-rnnlm-lib.cc:64

kaldi::RandInt
int32 RandInt(int32 min_val, int32 max_val, struct RandomState *state)
Definition: kaldi-math.cc:95

kaldi::kSgmmAll
u [ for SSGMM ]
Definition: model-common.h:56