doc/fmllr-raw-test_8cc_source.html

 // transform/fmllr-raw-test.cc

 // Copyright  2009-2011 Microsoft Corporation
 //            2013  Johns Hopkins University (author: Daniel Povey)

 // See ../../COPYING for clarification regarding multiple authors
 //
 // Licensed under the Apache License, Version 2.0 (the "License");
 // you may not use this file except in compliance with the License.
 // You may obtain a copy of the License at
 //
 //  http://www.apache.org/licenses/LICENSE-2.0
 //
 // THIS CODE IS PROVIDED *AS IS* BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY
 // KIND, EITHER EXPRESS OR IMPLIED, INCLUDING WITHOUT LIMITATION ANY IMPLIED
 // WARRANTIES OR CONDITIONS OF TITLE, FITNESS FOR A PARTICULAR PURPOSE,
 // MERCHANTABLITY OR NON-INFRINGEMENT.
 // See the Apache 2 License for the specific language governing permissions and
 // limitations under the License.

 #include "util/common-utils.h"
 #include "gmm/diag-gmm.h"
 #include "transform/fmllr-diag-gmm.h"
 #include "transform/fmllr-raw.h"

 namespace kaldi {


 // Fills *gmm_in with a randomly sized, randomly parameterized diagonal GMM.
 //
 // The number of Gaussians is drawn from [5, 8] and the feature dimension
 // from [6, 10].  For each Gaussian i and dimension j:
 //   - the inverse variance is exp(g / (1 + j)), hence always positive;
 //   - the mean is g / (1 + j);
 // where g is a fresh RandGauss() sample each time.  The mixture weights are
 // exp(RandGauss()) values rescaled to sum to one.  Gconsts are computed
 // before returning.
 //
 // gmm_in must be non-NULL; its previous contents are discarded by Resize().
 void InitRandomGmm(DiagGmm *gmm_in) {
   // Both sizes go through Kaldi's Rand() wrapper, rather than mixing the raw
   // C rand() with Rand(), so the test uses one source of randomness.
   int32 num_gauss = 5 + Rand() % 4;
   int32 dim = 6 + Rand() % 5;
   DiagGmm &gmm(*gmm_in);
   gmm.Resize(num_gauss, dim);
   Matrix<BaseFloat> inv_vars(num_gauss, dim),
       means(num_gauss, dim);
   Vector<BaseFloat> weights(num_gauss);
   for (int32 i = 0; i < num_gauss; i++) {
     for (int32 j = 0; j < dim; j++) {
       // The 1 / (1 + j) factor shrinks the spread of the random parameters
       // for higher-numbered dimensions.
       inv_vars(i, j) = Exp(RandGauss() * (1.0 / (1 + j)));
       means(i, j) = RandGauss() * (1.0 / (1 + j));
     }
     weights(i) = Exp(RandGauss());
   }
   // Normalize so that the weights form a proper distribution.
   weights.Scale(1.0 / weights.Sum());
   gmm.SetWeights(weights);
   gmm.SetInvVarsAndMeans(inv_vars, means);
   gmm.ComputeGconsts();
 }

 // Exercises FmllrRawAccs on random data.
 //
 // A random diagonal GMM is created, together with random spliced features of
 // dimension num_splice * raw_dim and a random LDA+MLLT matrix.  Over four
 // iterations the test accumulates statistics for every point, estimates a
 // raw-feature fMLLR transform, checks the reported objective-function
 // improvement, and then applies the transform to the raw features in place.
 //
 // use_offset: if true, the LDA+MLLT matrix gets one extra column (the offset
 //             term); otherwise it is square.
 void UnitTestFmllrRaw(bool use_offset) {
   DiagGmm gmm;
   InitRandomGmm(&gmm);
   int32 model_dim =  gmm.Dim();

   int32 raw_dim = 5 + Rand() % 3;
   int32 num_splice = 1 + Rand() % 5;
   // Grow the splicing context until the spliced dimension is at least the
   // model dimension.
   while (num_splice * raw_dim < model_dim) {
     num_splice++;
   }

   int32 full_dim = num_splice * raw_dim;
   int32 npoints = raw_dim*(raw_dim+1)*10;

   Matrix<BaseFloat> rand_points(npoints, full_dim);
   rand_points.SetRandn();

   // This is the full LDA+MLLT matrix; it carries an additional offset column
   // when use_offset is true.
   Matrix<BaseFloat> lda_mllt(full_dim, full_dim + (use_offset ? 1 : 0));
   lda_mllt.SetRandn();

   FmllrRawAccs accs(raw_dim, model_dim, lda_mllt);

   // Only read from the second iteration onwards, but initialized anyway so
   // that it never holds an indeterminate value.
   BaseFloat prev_objf_impr = 0.0;
   for (int32 iter = 0; iter < 4; iter++) {

     // Accumulate stats for every point with unit weight; the returned
     // log-likelihood is not needed here.
     for (int32 i = 0; i < npoints; i++) {
       SubVector<BaseFloat> sample(rand_points, i);
       accs.AccumulateForGmm(gmm, sample, 1.0);
     }

     // Update() expects a correctly sized matrix with reasonable values at
     // entry, so start each iteration from the unit transform.
     Matrix<BaseFloat> fmllr_mat(raw_dim, raw_dim + 1);
     fmllr_mat.SetUnit(); // sets diagonal elements to one.

     FmllrRawOptions opts;
     BaseFloat objf_impr, count;
     accs.Update(opts, &fmllr_mat, &objf_impr, &count);

     KALDI_ASSERT(objf_impr > 0.0);

     if (iter != 0) {
       // This is not something provable, but is always true
       // in practice.
       KALDI_ASSERT(objf_impr < prev_objf_impr);
     }
     prev_objf_impr = objf_impr;


     // Now transform the raw features: each row of rand_points consists of
     // num_splice blocks of raw_dim values, and every block is transformed
     // in place by the same fMLLR matrix.
     for (int32 splice = 0; splice < num_splice; splice++) {
       SubMatrix<BaseFloat> raw_feats(rand_points,
                                      0, npoints,
                                      splice * raw_dim, raw_dim);
       for (int32 t = 0; t < npoints; t++) {
         SubVector<BaseFloat> this_feat(raw_feats, t);
         ApplyAffineTransform(fmllr_mat, &this_feat);
       }
     }
     // Start the next iteration from empty statistics.
     accs.SetZero();
   }
 }


 }  // namespace kaldi ends here

 // Test driver: runs the raw-fMLLR unit test once with an offset column in
 // the LDA+MLLT matrix and once without, then reports success.
 int main() {
   kaldi::g_kaldi_verbose_level = 5;

   // Two runs only (more were used when the test was first written); even
   // runs enable the offset, odd runs disable it.
   for (int run = 0; run < 2; ++run) {
     const bool use_offset = (run % 2 == 0);
     kaldi::UnitTestFmllrRaw(use_offset);
   }
   std::cout << "Test OK.\n";
 }
kaldi::InitRandomGmm
void InitRandomGmm(DiagGmm *gmm_in)
Definition: diag-gmm-test.cc:27

kaldi
This code computes Goodness of Pronunciation (GOP) and extracts phone-level pronunciation feature for...
Definition: chain.dox:20

kaldi::Exp
double Exp(double x)
Definition: kaldi-math.h:83

kaldi::DiagGmm::Dim
int32 Dim() const
Returns the dimensionality of the Gaussian mean vectors.
Definition: diag-gmm.h:74

diag-gmm.h

rnnlm::j
int j
Definition: mikolov-rnnlm-lib.cc:66

kaldi::FmllrRawAccs::Update
void Update(const FmllrRawOptions &opts, MatrixBase< BaseFloat > *raw_fmllr_mat, BaseFloat *objf_impr, BaseFloat *count)
Update "raw_fmllr_mat"; it should have the correct dimension and reasonable values at entry (see the ...
Definition: fmllr-raw.cc:299

kaldi::RandGauss
float RandGauss(struct RandomState *state=NULL)
Definition: kaldi-math.h:155

kaldi::int32
kaldi::int32 int32
Definition: online-tcp-source.cc:27

common-utils.h

kaldi::Matrix< BaseFloat >

kaldi::FmllrRawAccs::SetZero
void SetZero()
Definition: fmllr-raw.cc:402

kaldi::MatrixBase::SetUnit
void SetUnit()
Sets to zero, except ones along diagonal [for non-square matrices too].
Definition: kaldi-matrix.cc:1348

count
const size_t count
Definition: arpa-file-parser-test.cc:66

kaldi::UnitTestFmllrRaw
void UnitTestFmllrRaw(bool use_offset)
Definition: fmllr-raw-test.cc:50

float

kaldi::FmllrRawOptions
Definition: fmllr-raw.h:69

kaldi::MatrixBase::SetRandn
void SetRandn()
Sets to random values of a normal distribution.
Definition: kaldi-matrix.cc:1355

kaldi::Rand
int Rand(struct RandomState *state)
Definition: kaldi-math.cc:45

fmllr-raw.h

rnnlm::i
int i
Definition: mikolov-rnnlm-lib.cc:66

KALDI_ASSERT
#define KALDI_ASSERT(cond)
Definition: kaldi-error.h:185

kaldi::g_kaldi_verbose_level
int32 g_kaldi_verbose_level
This is set by util/parse-options.
Definition: kaldi-error.cc:46

kaldi::FmllrRawAccs
Definition: fmllr-raw.h:81

kaldi::DiagGmm
Definition for Gaussian Mixture Model with diagonal covariances.
Definition: diag-gmm.h:42

kaldi::FmllrRawAccs::AccumulateForGmm
BaseFloat AccumulateForGmm(const DiagGmm &gmm, const VectorBase< BaseFloat > &data, BaseFloat weight)
Accumulate stats for a single GMM in the model; returns log likelihood.
Definition: fmllr-raw.cc:107

fmllr-diag-gmm.h

kaldi::ApplyAffineTransform
void ApplyAffineTransform(const MatrixBase< BaseFloat > &xform, VectorBase< BaseFloat > *vec)
Applies the affine transform 'xform' to the vector 'vec' and overwrites the contents of 'vec'...
Definition: transform-common.cc:168

kaldi::SubMatrix
Sub-matrix representation.
Definition: kaldi-matrix.h:988

kaldi::SubVector
Represents a non-allocating general vector which can be defined as a sub-vector of higher-level vecto...
Definition: kaldi-vector.h:501

main
int main()
Definition: fmllr-raw-test.cc:116