doc/gmm-init-model-flat_8cc_source.html

 // gmmbin/gmm-init-model-flat.cc

 // Copyright 2012  Johns Hopkins University (Author: Daniel Povey)

 // See ../../COPYING for clarification regarding multiple authors
 //
 // Licensed under the Apache License, Version 2.0 (the "License");
 // you may not use this file except in compliance with the License.
 // You may obtain a copy of the License at
 //
 //  http://www.apache.org/licenses/LICENSE-2.0
 //
 // THIS CODE IS PROVIDED *AS IS* BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY
 // KIND, EITHER EXPRESS OR IMPLIED, INCLUDING WITHOUT LIMITATION ANY IMPLIED
 // WARRANTIES OR CONDITIONS OF TITLE, FITNESS FOR A PARTICULAR PURPOSE,
 // MERCHANTABLITY OR NON-INFRINGEMENT.
 // See the Apache 2 License for the specific language governing permissions and
 // limitations under the License.


 #include "base/kaldi-common.h"
 #include "util/common-utils.h"
 #include "gmm/am-diag-gmm.h"
 #include "hmm/transition-model.h"
 #include "gmm/mle-am-diag-gmm.h"
 #include "tree/build-tree-utils.h"
 #include "tree/context-dep.h"
 #include "tree/clusterable-classes.h"
 #include "util/text-utils.h"

 namespace kaldi {

 // Computes the global per-dimension mean and inverse variance of all feature
 // frames (matrix rows) read from feat_rspecifier.
 //
 //   feat_rspecifier  rspecifier of the feature matrices; they are read as
 //                    double-precision matrices.
 //   inv_var_out      resized to the feature dimension and set, element-wise,
 //                    to 1 / (E[x^2] - E[x]^2).
 //   mean_out         resized to the feature dimension and set to E[x].
 //
 // Reports an error through KALDI_ERR if no frames are read, if two matrices
 // disagree on the number of columns, or if any variance is not strictly
 // positive.
 void GetFeatureMeanAndVariance(const std::string &feat_rspecifier,
                                Vector<BaseFloat> *inv_var_out,
                                Vector<BaseFloat> *mean_out) {
   double count = 0.0;
   // Running sums of x and x^2 over all frames, kept in double precision.
   Vector<double> x_stats, x2_stats;

   SequentialDoubleMatrixReader feat_reader(feat_rspecifier);
   for (; !feat_reader.Done(); feat_reader.Next()) {
     const Matrix<double> &mat = feat_reader.Value();
     // A matrix without rows contributes no frames; skipping it also keeps it
     // from being compared against the established feature dimension.
     if (mat.NumRows() == 0) continue;
     if (x_stats.Dim() == 0) {
       // First non-empty matrix fixes the feature dimension.
       int32 dim = mat.NumCols();
       x_stats.Resize(dim);
       x2_stats.Resize(dim);
     } else if (mat.NumCols() != x_stats.Dim()) {
       // Fail with a clear message instead of relying on the dimension
       // assertions inside AddVec()/AddVec2().
       KALDI_ERR << "Feature dimension mismatch for key " << feat_reader.Key()
                 << ": expected " << x_stats.Dim() << ", got "
                 << mat.NumCols();
     }
     for (int32 i = 0; i < mat.NumRows(); i++) {
       count += 1.0;
       x_stats.AddVec(1.0, mat.Row(i));
       x2_stats.AddVec2(1.0, mat.Row(i));
     }
   }
   if (count == 0) { KALDI_ERR << "No features were read!"; }
   // Turn the sums into E[x] and E[x^2] ...
   x_stats.Scale(1.0/count);
   x2_stats.Scale(1.0/count);
   // ... then subtract E[x]^2 so that x2_stats holds the variance.
   x2_stats.AddVec2(-1.0, x_stats);
   if (x2_stats.Min() <= 0.0)
     KALDI_ERR << "Variance is zero or negative!";
   x2_stats.InvertElements();  // variance -> inverse variance
   int32 dim = x_stats.Dim();
   inv_var_out->Resize(dim);
   mean_out->Resize(dim);
   inv_var_out->CopyFromVec(x2_stats);
   mean_out->CopyFromVec(x_stats);
 }


 }

 int main(int argc, char *argv[]) {
   using namespace kaldi;
   try {
     using namespace kaldi;
     typedef kaldi::int32 int32;

     const char *usage =
         "Initialize GMM, with Gaussians initialized to mean and variance\n"
         "of some provided example data (or to 0,1 if not provided: in that\n"
         "case, provide --dim option)\n"
         "Usage:  gmm-init-model-flat [options] <tree-in> <topo-file> <model-out> [<features-rspecifier>]\n"
         "e.g.: \n"
         "  gmm-init-model-flat tree topo 1.mdl ark:feats.scp\n";

     bool binary = true;
     int32 dim = 40;

     ParseOptions po(usage);
     po.Register("binary", &binary, "Write output in binary mode");
     po.Register("dim", &dim, "Dimension of model (this matters only if not providing features).");

     po.Read(argc, argv);

     if (po.NumArgs() < 3 || po.NumArgs() > 4) {
       po.PrintUsage();
       exit(1);
     }

     std::string
         tree_filename = po.GetArg(1),
         topo_filename = po.GetArg(2),
         model_out_filename = po.GetArg(3),
         feats_rspecifier = po.GetOptArg(4);

     ContextDependency ctx_dep;
     ReadKaldiObject(tree_filename, &ctx_dep);

     HmmTopology topo;
     ReadKaldiObject(topo_filename, &topo);

     Vector<BaseFloat> global_inverse_var, global_mean;
     if (po.NumArgs() == 4) {
       GetFeatureMeanAndVariance(feats_rspecifier,
                                 &global_inverse_var,
                                 &global_mean);
       dim = global_mean.Dim();
     } else {
       global_inverse_var.Resize(dim);
       global_inverse_var.Set(1.0);
       global_mean.Resize(dim); // leave it at zero.
     }

     int32 num_pdfs = ctx_dep.NumPdfs();

     AmDiagGmm am_gmm;
     DiagGmm gmm;
     gmm.Resize(1, dim);
     {  // Initialize the gmm.
       Matrix<BaseFloat> inv_var(1, dim);
       inv_var.Row(0).CopyFromVec(global_inverse_var);
       Matrix<BaseFloat> mu(1, dim);
       mu.Row(0).CopyFromVec(global_mean);
       Vector<BaseFloat> weights(1);
       weights.Set(1.0);
       gmm.SetInvVarsAndMeans(inv_var, mu);
       gmm.SetWeights(weights);
       gmm.ComputeGconsts();
     }
     for (int i = 0; i < num_pdfs; i++)
       am_gmm.AddPdf(gmm);

     TransitionModel trans_model(ctx_dep, topo);

     {
       Output ko(model_out_filename, binary);
       trans_model.Write(ko.Stream(), binary);
       am_gmm.Write(ko.Stream(), binary);
     }
     KALDI_LOG << "Wrote model.";
   } catch(const std::exception &e) {
     std::cerr << e.what();
     return -1;
   }
 }
am-diag-gmm.h

kaldi
This code computes Goodness of Pronunciation (GOP) and extracts phone-level pronunciation feature for...
Definition: chain.dox:20

kaldi::AmDiagGmm::AddPdf
void AddPdf(const DiagGmm &gmm)
Adds a GMM to the model, and increments the total number of PDFs.
Definition: am-diag-gmm.cc:57

mle-am-diag-gmm.h

kaldi::DiagGmm::SetInvVarsAndMeans
void SetInvVarsAndMeans(const MatrixBase< Real > &invvars, const MatrixBase< Real > &means)
Use SetInvVarsAndMeans if updating both means and (inverse) variances.
Definition: diag-gmm-inl.h:63

kaldi::HmmTopology
A class for storing topology information for phones.
Definition: hmm-topology.h:93

kaldi::MatrixBase::NumCols
MatrixIndexT NumCols() const
Returns number of columns (or zero for empty matrix).
Definition: kaldi-matrix.h:67

kaldi::ParseOptions::PrintUsage
void PrintUsage(bool print_command_line=false)
Prints the usage documentation [provided in the constructor].
Definition: parse-options.cc:393

kaldi::DiagGmm::Resize
void Resize(int32 nMix, int32 dim)
Resizes arrays to this dim. Does not initialize data.
Definition: diag-gmm.cc:66

kaldi::DiagGmm::ComputeGconsts
int32 ComputeGconsts()
Sets the gconsts.
Definition: diag-gmm.cc:114

kaldi::int32
kaldi::int32 int32
Definition: online-tcp-source.cc:27

common-utils.h

kaldi::Matrix< double >

kaldi::Vector::Resize
void Resize(MatrixIndexT length, MatrixResizeType resize_type=kSetZero)
Set vector to a specified size (can be zero).
Definition: kaldi-vector.cc:190

kaldi::VectorBase::Min
Real Min() const
Returns the minimum value of any element, or +infinity for the empty vector.
Definition: kaldi-vector.cc:614

kaldi::ContextDependency
Definition: context-dep.h:59

kaldi::ParseOptions::Register
void Register(const std::string &name, bool *ptr, const std::string &doc)
Definition: parse-options.cc:56

kaldi::AmDiagGmm
Definition: am-diag-gmm.h:36

kaldi::TransitionModel
Definition: transition-model.h:123

kaldi::ReadKaldiObject
void ReadKaldiObject(const std::string &filename, Matrix< float > *m)
Definition: kaldi-io.cc:832

text-utils.h

kaldi::VectorBase::AddVec2
void AddVec2(const Real alpha, const VectorBase< Real > &v)
Add vector : *this = *this + alpha * rv^2 [element-wise squaring].
Definition: kaldi-vector.cc:1255

kaldi::ContextDependency::NumPdfs
virtual int32 NumPdfs() const
NumPdfs() returns the number of acoustic pdfs (they are numbered 0.. NumPdfs()-1).
Definition: context-dep.h:71

kaldi::VectorBase::CopyFromVec
void CopyFromVec(const VectorBase< Real > &v)
Copy data from another vector (must match own size).
Definition: kaldi-vector.cc:228

count
const size_t count
Definition: arpa-file-parser-test.cc:66

kaldi::ParseOptions
The class ParseOptions is for parsing command-line options; see Parsing command-line options for more...
Definition: parse-options.h:36

kaldi::Output::Stream
std::ostream & Stream()
Definition: kaldi-io.cc:701

kaldi::MatrixBase::Row
const SubVector< Real > Row(MatrixIndexT i) const
Return specific row of matrix [const].
Definition: kaldi-matrix.h:188

transition-model.h

kaldi::SequentialTableReader
A templated class for reading objects sequentially from an archive or script file; see The Table conc...
Definition: kaldi-table.h:287

kaldi::ParseOptions::Read
int Read(int argc, const char *const *argv)
Parses the command line options and fills the ParseOptions-registered variables.
Definition: parse-options.cc:311

kaldi::SequentialTableReader::Done
bool Done()
Definition: kaldi-table-inl.h:948

KALDI_ERR
#define KALDI_ERR
Definition: kaldi-error.h:147

kaldi::ParseOptions::GetArg
std::string GetArg(int param) const
Returns one of the positional parameters; 1-based indexing for argc/argv compatibility.
Definition: parse-options.cc:202

kaldi::SequentialTableReader::Next
void Next()
Definition: kaldi-table-inl.h:942

kaldi::VectorBase::Dim
MatrixIndexT Dim() const
Returns the dimension of the vector.
Definition: kaldi-vector.h:64

kaldi::VectorBase::Scale
void Scale(Real alpha)
Multiplies all elements by this constant.
Definition: kaldi-vector.cc:963

build-tree-utils.h

rnnlm::i
int i
Definition: mikolov-rnnlm-lib.cc:66

kaldi::ParseOptions::NumArgs
int NumArgs() const
Number of positional parameters (c.f. argc-1).
Definition: parse-options.cc:198

kaldi::TransitionModel::Write
void Write(std::ostream &os, bool binary) const
Definition: transition-model.cc:422

kaldi::Vector
A class representing a vector.
Definition: kaldi-vector.h:406

kaldi::VectorBase::InvertElements
void InvertElements()
Invert all elements.
Definition: kaldi-vector.cc:776

kaldi::SequentialTableReader::Value
T & Value()
Definition: kaldi-table-inl.h:934

kaldi::MatrixBase::NumRows
MatrixIndexT NumRows() const
Returns number of rows (or zero for empty matrix).
Definition: kaldi-matrix.h:64

kaldi::VectorBase::Set
void Set(Real f)
Set all members of a vector to a specified value.
Definition: kaldi-vector.cc:336

kaldi::AmDiagGmm::Write
void Write(std::ostream &out_stream, bool binary) const
Definition: am-diag-gmm.cc:163

kaldi::DiagGmm
Definition for Gaussian Mixture Model with diagonal covariances.
Definition: diag-gmm.h:42

clusterable-classes.h

kaldi::Output
Definition: kaldi-io.h:124

kaldi::DiagGmm::SetWeights
void SetWeights(const VectorBase< Real > &w)
Mutators for both float or double.
Definition: diag-gmm-inl.h:28

main
int main(int argc, char *argv[])
Definition: gmm-init-model-flat.cc:70

KALDI_LOG
#define KALDI_LOG
Definition: kaldi-error.h:153

kaldi::VectorBase::AddVec
void AddVec(const Real alpha, const VectorBase< OtherReal > &v)
Add vector : *this = *this + alpha * rv (with casting between floats and doubles) ...
Definition: kaldi-vector.cc:1044

context-dep.h

kaldi-common.h

kaldi::GetFeatureMeanAndVariance
void GetFeatureMeanAndVariance(const std::string &feat_rspecifier, Vector< BaseFloat > *inv_var_out, Vector< BaseFloat > *mean_out)
Definition: gmm-init-model-flat.cc:33

kaldi::ParseOptions::GetOptArg
std::string GetOptArg(int param) const
Definition: parse-options.h:127