doc/mle-diag-gmm_8cc_source.html

 // gmm/mle-diag-gmm.cc

 // Copyright 2009-2013  Saarland University;  Georg Stemmer;  Jan Silovsky;
 //                      Microsoft Corporation; Yanmin Qian;
 //                      Johns Hopkins University (author: Daniel Povey);
 //                      Cisco Systems (author: Neha Agrawal)

 // See ../../COPYING for clarification regarding multiple authors
 //
 // Licensed under the Apache License, Version 2.0 (the "License");
 // you may not use this file except in compliance with the License.
 // You may obtain a copy of the License at
 //
 //  http://www.apache.org/licenses/LICENSE-2.0
 //
 // THIS CODE IS PROVIDED *AS IS* BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY
 // KIND, EITHER EXPRESS OR IMPLIED, INCLUDING WITHOUT LIMITATION ANY IMPLIED
 // WARRANTIES OR CONDITIONS OF TITLE, FITNESS FOR A PARTICULAR PURPOSE,
 // MERCHANTABLITY OR NON-INFRINGEMENT.
 // See the Apache 2 License for the specific language governing permissions and
 // limitations under the License.

 #include <algorithm>  // for std::max
 #include <string>
 #include <vector>

 #include "gmm/diag-gmm.h"
 #include "gmm/mle-diag-gmm.h"
 #include "util/kaldi-thread.h"

 namespace kaldi {

 // Reads accumulators from "in_stream" (text or binary according to "binary")
 // in the layout emitted by Write(): a header holding the feature dimension,
 // the number of components and the flags, followed by any of the
 // <OCCUPANCY>, <MEANACCS> and <DIAGVARACCS> sections, up to </GMMACCS>.
 //
 // If "add" is true and this object is already set up (non-zero number of
 // Gaussians, dimension or flags), the header must match the current sizes and
 // flags exactly; otherwise the object is resized according to the header.
 // "add" is passed through to the per-section reads.
 //
 // Raises KALDI_ERR on a header mismatch or on an unrecognized section token.
 void AccumDiagGmm::Read(std::istream &in_stream, bool binary, bool add) {
   int32 dimension, num_components;
   GmmFlagsType flags;
   std::string token;

   ExpectToken(in_stream, binary, "<GMMACCS>");
   ExpectToken(in_stream, binary, "<VECSIZE>");
   ReadBasicType(in_stream, binary, &dimension);
   ExpectToken(in_stream, binary, "<NUMCOMPONENTS>");
   ReadBasicType(in_stream, binary, &num_components);
   ExpectToken(in_stream, binary, "<FLAGS>");
   ReadBasicType(in_stream, binary, &flags);

   const bool already_set_up = (NumGauss() != 0 || Dim() != 0 || Flags() != 0);
   if (add && already_set_up) {
     // Adding to existing stats only makes sense if both sets of stats have
     // the same shape and store the same kinds of statistics.
     if (num_components != NumGauss() || dimension != Dim()
         || flags != Flags())
       KALDI_ERR << "AccumDiagGmm::Read, dimension or flags mismatch, "
                 << NumGauss() << ", " << Dim() << ", "
                 << GmmFlagsToString(Flags()) << " vs. " << num_components << ", "
                 << dimension << ", " << GmmFlagsToString(flags)
                 << " (mixing accs from different models?)";
   } else {
     Resize(num_components, dimension, flags);
   }

   // The sections may come in any order; loop until the closing token.
   ReadToken(in_stream, binary, &token);
   while (token != "</GMMACCS>") {
     if (token == "<OCCUPANCY>") {
       occupancy_.Read(in_stream, binary, add);
     } else if (token == "<MEANACCS>") {
       mean_accumulator_.Read(in_stream, binary, add);
     } else if (token == "<DIAGVARACCS>") {
       variance_accumulator_.Read(in_stream, binary, add);
     } else {
       KALDI_ERR << "Unexpected token '" << token
                 << "' in GMM accumulator file ";
     }
     ReadToken(in_stream, binary, &token);
   }
 }

 void AccumDiagGmm::Write(std::ostream &out_stream, bool binary) const {
   WriteToken(out_stream, binary, "<GMMACCS>");
   WriteToken(out_stream, binary, "<VECSIZE>");
   WriteBasicType(out_stream, binary, dim_);
   WriteToken(out_stream, binary, "<NUMCOMPONENTS>");
   WriteBasicType(out_stream, binary, num_comp_);
   WriteToken(out_stream, binary, "<FLAGS>");
   WriteBasicType(out_stream, binary, flags_);

   // convert into BaseFloat before writing things
   Vector<BaseFloat> occupancy_bf(occupancy_.Dim());
   Matrix<BaseFloat> mean_accumulator_bf(mean_accumulator_.NumRows(),
                                         mean_accumulator_.NumCols());
   Matrix<BaseFloat> variance_accumulator_bf(variance_accumulator_.NumRows(),
                                             variance_accumulator_.NumCols());
   occupancy_bf.CopyFromVec(occupancy_);
   mean_accumulator_bf.CopyFromMat(mean_accumulator_);
   variance_accumulator_bf.CopyFromMat(variance_accumulator_);

   WriteToken(out_stream, binary, "<OCCUPANCY>");
   occupancy_bf.Write(out_stream, binary);
   WriteToken(out_stream, binary, "<MEANACCS>");
   mean_accumulator_bf.Write(out_stream, binary);
   WriteToken(out_stream, binary, "<DIAGVARACCS>");
   variance_accumulator_bf.Write(out_stream, binary);
   WriteToken(out_stream, binary, "</GMMACCS>");
 }


 // Sets the accumulator up for "num_comp" Gaussians of dimension "dim".
 // The stored flags are AugmentGmmFlags(flags).  The occupancy vector is
 // always sized; the mean / variance accumulators are sized only when the
 // corresponding bit is present in the stored flags, and are emptied (0 x 0)
 // otherwise.
 void AccumDiagGmm::Resize(int32 num_comp, int32 dim, GmmFlagsType flags) {
   KALDI_ASSERT(num_comp > 0 && dim > 0);

   num_comp_ = num_comp;
   dim_ = dim;
   flags_ = AugmentGmmFlags(flags);

   occupancy_.Resize(num_comp);

   const bool store_means = (flags_ & kGmmMeans) != 0;
   if (store_means) {
     mean_accumulator_.Resize(num_comp, dim);
   } else {
     mean_accumulator_.Resize(0, 0);
   }

   const bool store_vars = (flags_ & kGmmVariances) != 0;
   if (store_vars) {
     variance_accumulator_.Resize(num_comp, dim);
   } else {
     variance_accumulator_.Resize(0, 0);
   }
 }

 // Zeroes the statistics selected by "flags" (weights -> occupancies,
 // means -> first-order stats, variances -> second-order stats).
 // Raises KALDI_ERR if "flags" contains a bit that is not set in flags_.
 void AccumDiagGmm::SetZero(GmmFlagsType flags) {
   const bool asks_for_inactive = (flags & ~flags_) != 0;
   if (asks_for_inactive)
     KALDI_ERR << "Flags in argument do not match the active accumulators";

   if (flags & kGmmWeights) {
     occupancy_.SetZero();
   }
   if (flags & kGmmMeans) {
     mean_accumulator_.SetZero();
   }
   if (flags & kGmmVariances) {
     variance_accumulator_.SetZero();
   }
 }


 // Multiplies the statistics selected by "flags" by the factor "f".
 // Raises KALDI_ERR if "flags" contains a bit that is not set in flags_.
 void AccumDiagGmm::Scale(BaseFloat f, GmmFlagsType flags) {
   const bool asks_for_inactive = (flags & ~flags_) != 0;
   if (asks_for_inactive)
     KALDI_ERR << "Flags in argument do not match the active accumulators";

   // The stats are stored as double, so scale in double precision.
   const double factor = static_cast<double>(f);
   if (flags & kGmmWeights) {
     occupancy_.Scale(factor);
   }
   if (flags & kGmmMeans) {
     mean_accumulator_.Scale(factor);
   }
   if (flags & kGmmVariances) {
     variance_accumulator_.Scale(factor);
   }
 }

 // Accumulates the frame "data" for the single component "comp_index" with
 // weight "weight": the occupancy is always incremented; the first-order
 // stats are incremented when means are stored, and the second-order stats
 // (element-wise squared data) when, in addition, variances are stored.
 // "comp_index" must lie in [0, NumGauss()).
 void AccumDiagGmm::AccumulateForComponent(const VectorBase<BaseFloat> &data,
                                           int32 comp_index, BaseFloat weight) {
   if (flags_ & kGmmMeans)
     KALDI_ASSERT(data.Dim() == Dim());
   double wt = static_cast<double>(weight);
   // Reject negative indices as well as too-large ones before indexing.
   KALDI_ASSERT(comp_index >= 0 && comp_index < NumGauss());
   // accumulate
   occupancy_(comp_index) += wt;
   if (flags_ & kGmmMeans) {
     Vector<double> data_d(data);  // Copy with type-conversion
     mean_accumulator_.Row(comp_index).AddVec(wt, data_d);
     if (flags_ & kGmmVariances) {
       data_d.ApplyPow(2.0);  // data_d now holds the squared data.
       variance_accumulator_.Row(comp_index).AddVec(wt, data_d);
     }
   }
 }

 // Adds pre-computed statistics to component "g": "occ" to its occupancy,
 // "x_stats" to its first-order stats (if means are stored) and "x2_stats"
 // to its second-order stats (if variances are stored).
 // "g" must lie in [0, NumGauss()).
 void AccumDiagGmm::AddStatsForComponent(int32 g,
                                         double occ,
                                         const VectorBase<double> &x_stats,
                                         const VectorBase<double> &x2_stats) {
   // Reject negative indices as well as too-large ones before indexing.
   KALDI_ASSERT(g >= 0 && g < NumGauss());
   occupancy_(g) += occ;
   if (flags_ & kGmmMeans)
     mean_accumulator_.Row(g).AddVec(1.0, x_stats);
   if (flags_ & kGmmVariances)
     variance_accumulator_.Row(g).AddVec(1.0, x2_stats);
 }


 void AccumDiagGmm::AccumulateFromPosteriors(
     const VectorBase<BaseFloat> &data,
     const VectorBase<BaseFloat> &posteriors) {
   if (flags_ & kGmmMeans)
     KALDI_ASSERT(static_cast<int32>(data.Dim()) == Dim());
   KALDI_ASSERT(static_cast<int32>(posteriors.Dim()) == NumGauss());
   Vector<double> post_d(posteriors);  // Copy with type-conversion

   // accumulate
   occupancy_.AddVec(1.0, post_d);
   if (flags_ & kGmmMeans) {
     Vector<double> data_d(data);  // Copy with type-conversion
     mean_accumulator_.AddVecVec(1.0, post_d, data_d);
     if (flags_ & kGmmVariances) {
       data_d.ApplyPow(2.0);
       variance_accumulator_.AddVecVec(1.0, post_d, data_d);
     }
   }
 }

 // Computes the component posteriors of "data" under "gmm", scales them by
 // "frame_posterior" and accumulates the frame with those scaled posteriors.
 // Returns the value returned by gmm.ComponentPosteriors() for this frame
 // (not scaled by "frame_posterior").
 BaseFloat AccumDiagGmm::AccumulateFromDiag(const DiagGmm &gmm,
                                            const VectorBase<BaseFloat> &data,
                                            BaseFloat frame_posterior) {
   // Model, accumulator and data must all agree in size.
   KALDI_ASSERT(gmm.NumGauss() == NumGauss());
   KALDI_ASSERT(gmm.Dim() == Dim());
   KALDI_ASSERT(static_cast<int32>(data.Dim()) == Dim());

   Vector<BaseFloat> scaled_post(NumGauss());
   const BaseFloat frame_log_like =
       gmm.ComponentPosteriors(data, &scaled_post);
   scaled_post.Scale(frame_posterior);
   AccumulateFromPosteriors(data, scaled_post);

   return frame_log_like;
 }

 // Smooths the stats with "tau": each component's first- and second-order
 // stats are multiplied by (tau + occ) / occ, and tau is added to every
 // occupancy.
 // Careful: this wouldn't be valid if it were used to update the
 // Gaussian weights.
 // NOTE(review): the factor is built by inverting the occupancies, so a
 // component with zero occupancy presumably gets a non-finite factor --
 // confirm that callers never pass such stats.
 void AccumDiagGmm::SmoothStats(BaseFloat tau) {
   const double tau_d = static_cast<double>(tau);

   // Build the per-component factor 1 + tau / occ == (tau + occ) / occ.
   Vector<double> row_scale(occupancy_);
   row_scale.InvertElements();
   row_scale.Scale(tau_d);
   row_scale.Add(1.0);

   // Scale row i of each accumulator by row_scale(i).
   mean_accumulator_.MulRowsVec(row_scale);
   variance_accumulator_.MulRowsVec(row_scale);

   occupancy_.Add(tau_d);
 }


 // Adds tau "virtual counts" to each Gaussian of this accumulator, taken from
 // the matching Gaussian of "src_acc": the source first- and second-order
 // stats are added after scaling by tau / (source occupancy).  Gaussians whose
 // source occupancy is zero are left untouched and a warning is logged.
 // Careful: this wouldn't be valid if it were used to update the
 // Gaussian weights.
 void AccumDiagGmm::SmoothWithAccum(BaseFloat tau, const AccumDiagGmm &src_acc) {
   KALDI_ASSERT(src_acc.NumGauss() == num_comp_ && src_acc.Dim() == dim_);
   for (int32 g = 0; g < num_comp_; g++) {
     const double src_occ = src_acc.occupancy_(g);
     if (src_occ == 0.0) {
       // Nothing to normalize by, so this Gaussian cannot be smoothed.
       KALDI_WARN << "Could not smooth since source acc had zero occupancy.";
       continue;
     }
     // Scaling by tau / src_occ turns the source stats into "tau" counts.
     const double src_scale = tau / src_occ;
     occupancy_(g) += tau;
     mean_accumulator_.Row(g).AddVec(src_scale,
                                     src_acc.mean_accumulator_.Row(g));
     variance_accumulator_.Row(g).AddVec(src_scale,
                                         src_acc.variance_accumulator_.Row(g));
   }
 }


 // Adds "tau" virtual counts per Gaussian, with statistics derived from the
 // parameters of "gmm": tau * mean goes to the first-order stats,
 // tau * (var + mean^2) to the second-order stats, and tau to each occupancy.
 void AccumDiagGmm::SmoothWithModel(BaseFloat tau, const DiagGmm &gmm) {
   KALDI_ASSERT(gmm.NumGauss() == num_comp_ && gmm.Dim() == dim_);

   Matrix<double> model_means(num_comp_, dim_);
   Matrix<double> second_moments(num_comp_, dim_);
   gmm.GetMeans(&model_means);
   gmm.GetVars(&second_moments);  // holds the variances for the moment

   // First-order stats: tau * mean.
   mean_accumulator_.AddMat(tau, model_means);

   // Second-order stats: tau * E[x^2], where E[x^2] = var + mean^2.
   model_means.ApplyPow(2.0);
   second_moments.AddMat(1.0, model_means, kNoTrans);
   variance_accumulator_.AddMat(tau, second_moments);

   occupancy_.Add(tau);
 }

 // Copy constructor: duplicates the sizes, the flags and all three sets of
 // statistics of "other".
 AccumDiagGmm::AccumDiagGmm(const AccumDiagGmm &other)
     : dim_(other.dim_),
       num_comp_(other.num_comp_),
       flags_(other.flags_),
       occupancy_(other.occupancy_),
       mean_accumulator_(other.mean_accumulator_),
       variance_accumulator_(other.variance_accumulator_) {
 }

 // Returns the objective function value of "gmm" on the statistics in
 // "diag_gmm_acc", computed in BaseFloat precision from the model's gconsts,
 // means_invvars and inv_vars:
 //   occ . gconsts + tr(mean_accs^T means_invvars)
 //                 - 0.5 * tr(var_accs^T inv_vars)
 // where the mean / variance terms are included only if the accumulator
 // stores the corresponding stats.  The gconsts of "gmm" must be up to date.
 BaseFloat MlObjective(const DiagGmm &gmm,
                       const AccumDiagGmm &diag_gmm_acc) {
   const GmmFlagsType stored = diag_gmm_acc.Flags();

   // Convert the double-precision stats to the precision of the model.
   Vector<BaseFloat> occupancies(diag_gmm_acc.occupancy());
   Matrix<BaseFloat> first_order(diag_gmm_acc.mean_accumulator());
   Matrix<BaseFloat> second_order(diag_gmm_acc.variance_accumulator());

   BaseFloat objective = VecVec(occupancies, gmm.gconsts());
   if (stored & kGmmMeans) {
     objective += TraceMatMat(first_order, gmm.means_invvars(), kTrans);
   }
   if (stored & kGmmVariances) {
     objective -= 0.5 * TraceMatMat(second_order, gmm.inv_vars(), kTrans);
   }
   return objective;
 }

 // Maximum-likelihood re-estimation of "gmm" from the statistics in
 // "diag_gmm_acc".
 //
 //   config       - occupancy / weight thresholds, variance floors and the
 //                  remove_low_count_gaussians switch.
 //   diag_gmm_acc - statistics; must have the same number of Gaussians and
 //                  dimension as "gmm".
 //   flags        - which parameters to transfer back to "gmm"; must be a
 //                  subset of the accumulator's flags (KALDI_ERR otherwise).
 //   gmm          - model to update in place; must not be NULL.
 //   obj_change_out, count_out, floored_elements_out, floored_gaussians_out,
 //   removed_gaussians_out
 //                - optional outputs (each may be NULL): objective change,
 //                  total occupancy, number of floored variance elements,
 //                  number of Gaussians with at least one floored element,
 //                  and number of Gaussians removed.
 //
 // Gaussians whose occupancy or relative weight does not exceed the
 // configured minimum are not re-estimated; they are removed if
 // config.remove_low_count_gaussians is set (but never all of them).
 // The objective change is measured before any Gaussian is removed.
 void MleDiagGmmUpdate(const MleDiagGmmOptions &config,
                       const AccumDiagGmm &diag_gmm_acc,
                       GmmFlagsType flags,
                       DiagGmm *gmm,
                       BaseFloat *obj_change_out,
                       BaseFloat *count_out,
                       int32 *floored_elements_out,
                       int32 *floored_gaussians_out,
                       int32 *removed_gaussians_out) {
   KALDI_ASSERT(gmm != NULL);

   if (flags & ~diag_gmm_acc.Flags())
     KALDI_ERR << "Flags in argument do not match the active accumulators";

   KALDI_ASSERT(diag_gmm_acc.NumGauss() == gmm->NumGauss() &&
                diag_gmm_acc.Dim() == gmm->Dim());

   int32 num_gauss = gmm->NumGauss();
   double occ_sum = diag_gmm_acc.occupancy().Sum();

   int32 elements_floored = 0, gauss_floored = 0;

   // remember old objective value
   gmm->ComputeGconsts();
   BaseFloat obj_old = MlObjective(*gmm, diag_gmm_acc);

   // First get the gmm in "normal" representation (not the exponential-model
   // form).
   DiagGmmNormal ngmm(*gmm);

   std::vector<int32> to_remove;
   for (int32 i = 0; i < num_gauss; i++) {
     double occ = diag_gmm_acc.occupancy()(i);
     // Relative weight of this Gaussian; uniform if there is no data at all.
     double prob;
     if (occ_sum > 0.0)
       prob = occ / occ_sum;
     else
       prob = 1.0 / num_gauss;

     if (occ > static_cast<double>(config.min_gaussian_occupancy)
         && prob > static_cast<double>(config.min_gaussian_weight)) {

       ngmm.weights_(i) = prob;

       // copy old mean for later normalizations
       Vector<double> old_mean(ngmm.means_.Row(i));

       // update mean, then variance, as far as there are accumulators
       if (diag_gmm_acc.Flags() & (kGmmMeans|kGmmVariances)) {
         Vector<double> mean(diag_gmm_acc.mean_accumulator().Row(i));
         mean.Scale(1.0 / occ);
         // transfer to estimate
         ngmm.means_.CopyRowFromVec(mean, i);
       }

       if (diag_gmm_acc.Flags() & kGmmVariances) {
         KALDI_ASSERT(diag_gmm_acc.Flags() & kGmmMeans);
         Vector<double> var(diag_gmm_acc.variance_accumulator().Row(i));
         var.Scale(1.0 / occ);
         var.AddVec2(-1.0, ngmm.means_.Row(i));  // subtract squared means.

         // if we intend to only update the variances, we need to compensate by
         // adding the difference between the new and old mean
         if (!(flags & kGmmMeans)) {
           old_mean.AddVec(-1.0, ngmm.means_.Row(i));
           var.AddVec2(1.0, old_mean);
         }
         // Floor the variance, either per dimension or with a global minimum.
         int32 floored;
         if (config.variance_floor_vector.Dim() != 0) {
           floored = var.ApplyFloor(config.variance_floor_vector);
         } else {
           var.ApplyFloor(config.min_variance, &floored);
         }
         if (floored != 0) {
           elements_floored += floored;
           gauss_floored++;
         }
         // transfer to estimate
         ngmm.vars_.CopyRowFromVec(var, i);
       }
     } else {  // Insufficient occupancy.
       if (config.remove_low_count_gaussians &&
           static_cast<int32>(to_remove.size()) < num_gauss-1) {
         // remove the component, unless it is the last one.
         KALDI_WARN << "Too little data - removing Gaussian (weight "
                    << std::fixed << prob
                    << ", occupation count " << std::fixed << diag_gmm_acc.occupancy()(i)
                    << ", vector size " << gmm->Dim() << ")";
         to_remove.push_back(i);
       } else {
         KALDI_WARN << "Gaussian has too little data but not removing it because"
                    << (config.remove_low_count_gaussians ?
                        " it is the last Gaussian: i = "
                        : " remove-low-count-gaussians == false: g = ") << i
                    << ", occ = " << diag_gmm_acc.occupancy()(i) << ", weight = " << prob;
         // Keep the old mean and variance; only make sure the weight does not
         // fall below the configured minimum.
         ngmm.weights_(i) =
             std::max(prob, static_cast<double>(config.min_gaussian_weight));
       }
     }
   }

   // copy to natural representation according to flags
   ngmm.CopyToDiagGmm(gmm, flags);

   gmm->ComputeGconsts();  // or MlObjective will fail.
   BaseFloat obj_new = MlObjective(*gmm, diag_gmm_acc);

   if (obj_change_out)
     *obj_change_out = (obj_new - obj_old);
   if (count_out) *count_out = occ_sum;
   if (floored_elements_out) *floored_elements_out = elements_floored;
   if (floored_gaussians_out) *floored_gaussians_out = gauss_floored;

   // Removal happens last: the objective above needs the model and the
   // accumulator to have the same number of Gaussians.
   if (to_remove.size() > 0) {
     gmm->RemoveComponents(to_remove, true /*renormalize weights*/);
     gmm->ComputeGconsts();
   }
   if (removed_gaussians_out != NULL)
     *removed_gaussians_out = static_cast<int32>(to_remove.size());

   // Report the number of floored variance elements, not the Gaussian count
   // twice.
   if (gauss_floored > 0)
     KALDI_VLOG(2) << elements_floored << " variances floored in "
                   << gauss_floored << " Gaussians.";
 }

 // Adds "scale" times the statistics of "acc" to this accumulator.  The
 // occupancies are always added; first- / second-order stats are added only
 // if this accumulator stores them.  No explicit compatibility check is made
 // here: per the original note, the functions called will crash if the
 // dimensions etc. or the flags don't match.
 void AccumDiagGmm::Add(double scale, const AccumDiagGmm &acc) {
   const bool store_means = (flags_ & kGmmMeans) != 0;
   const bool store_vars = (flags_ & kGmmVariances) != 0;

   occupancy_.AddVec(scale, acc.occupancy_);
   if (store_means) {
     mean_accumulator_.AddMat(scale, acc.mean_accumulator_);
   }
   if (store_vars) {
     variance_accumulator_.AddMat(scale, acc.variance_accumulator_);
   }
 }


 void MapDiagGmmUpdate(const MapDiagGmmOptions &config,
                       const AccumDiagGmm &diag_gmm_acc,
                       GmmFlagsType flags,
                       DiagGmm *gmm,
                       BaseFloat *obj_change_out,
                       BaseFloat *count_out) {
   KALDI_ASSERT(gmm != NULL);

   if (flags & ~diag_gmm_acc.Flags())
     KALDI_ERR << "Flags in argument do not match the active accumulators";

   KALDI_ASSERT(diag_gmm_acc.NumGauss() == gmm->NumGauss() &&
                diag_gmm_acc.Dim() == gmm->Dim());

   int32 num_gauss = gmm->NumGauss();
   double occ_sum = diag_gmm_acc.occupancy().Sum();

   // remember the old objective function value
   gmm->ComputeGconsts();
   BaseFloat obj_old = MlObjective(*gmm, diag_gmm_acc);

   // allocate the gmm in normal representation; all parameters of this will be
   // updated, but only the flagged ones will be transferred back to gmm
   DiagGmmNormal ngmm(*gmm);

   for (int32 i = 0; i < num_gauss; i++) {
     double occ = diag_gmm_acc.occupancy()(i);

     // First update the weight.  The weight_tau is a tau for the
     // whole state.
     ngmm.weights_(i) = (occ + ngmm.weights_(i) * config.weight_tau) /
         (occ_sum + config.weight_tau);


     if (occ > 0.0 && (flags & kGmmMeans)) {
       // Update the Gaussian mean.
       Vector<double> old_mean(ngmm.means_.Row(i));
       Vector<double> mean(diag_gmm_acc.mean_accumulator().Row(i));
       mean.Scale(1.0 / (occ + config.mean_tau));
       mean.AddVec(config.mean_tau / (occ + config.mean_tau), old_mean);
       ngmm.means_.CopyRowFromVec(mean, i);
     }

     if (occ > 0.0 && (flags & kGmmVariances)) {
       // Computing the variance around the updated mean; this is:
       // E( (x - mu)^2 ) = E( x^2 - 2 x mu + mu^2 ) =
       // E(x^2) + mu^2 - 2 mu E(x).
       Vector<double> old_var(ngmm.vars_.Row(i));
       Vector<double> var(diag_gmm_acc.variance_accumulator().Row(i));
       var.Scale(1.0 / occ);
       var.AddVec2(1.0, ngmm.means_.Row(i));
       SubVector<double> mean_acc(diag_gmm_acc.mean_accumulator(), i),
           mean(ngmm.means_, i);
       var.AddVecVec(-2.0 / occ, mean_acc, mean, 1.0);
       // now var is E(x^2) + m^2 - 2 mu E(x).
       // Next we do the appropriate weighting usnig the tau value.
       var.Scale(occ / (config.variance_tau + occ));
       var.AddVec(config.variance_tau / (config.variance_tau + occ), old_var);
       // Now write to the model.
       ngmm.vars_.Row(i).CopyFromVec(var);
     }
   }

   // Copy to natural/exponential representation.
   ngmm.CopyToDiagGmm(gmm, flags);

   gmm->ComputeGconsts();  // or MlObjective will fail.
   BaseFloat obj_new = MlObjective(*gmm, diag_gmm_acc);

   if (obj_change_out)
     *obj_change_out = (obj_new - obj_old);

   if (count_out) *count_out = occ_sum;
 }


 class AccumulateMultiThreadedClass: public MultiThreadable {
  public:
   AccumulateMultiThreadedClass(const DiagGmm &diag_gmm,
                                const MatrixBase<BaseFloat> &data,
                                const VectorBase<BaseFloat> &frame_weights,
                                AccumDiagGmm *accum,
                                double *tot_like):
       diag_gmm_(diag_gmm), data_(data),
       frame_weights_(frame_weights), dest_accum_(accum),
       tot_like_ptr_(tot_like), tot_like_(0.0) { }
   AccumulateMultiThreadedClass(const AccumulateMultiThreadedClass &other):
     MultiThreadable(other),
     diag_gmm_(other.diag_gmm_), data_(other.data_),
     frame_weights_(other.frame_weights_), dest_accum_(other.dest_accum_),
     accum_(diag_gmm_, dest_accum_->Flags()), tot_like_ptr_(other.tot_like_ptr_),
     tot_like_(0.0) {
     KALDI_ASSERT(data_.NumRows() == frame_weights_.Dim());
   }
   void operator () () {
     int32 num_frames = data_.NumRows(), num_threads = num_threads_,
         block_size = (num_frames + num_threads - 1) / num_threads,
         block_start = block_size * thread_id_,
         block_end = std::min(num_frames, block_start + block_size);
     tot_like_ = 0.0;
     double tot_weight = 0.0;
     for (int32 t = block_start; t < block_end; t++) {
       tot_like_ += frame_weights_(t) *
           accum_.AccumulateFromDiag(diag_gmm_, data_.Row(t), frame_weights_(t));
       tot_weight += frame_weights_(t);
     }
     KALDI_VLOG(3) << "Thread " << thread_id_ << " saw average likeliood/frame "
                   << (tot_like_ / tot_weight) << " over " << tot_weight
                   << " (weighted) frames.";
   }
   ~AccumulateMultiThreadedClass() {
     if (accum_.Dim() != 0) { // if our accumulator is set up (this is not true
       // for the single object we use to initialize the others)
       dest_accum_->Add(1.0, accum_);
       *tot_like_ptr_ += tot_like_;
     }
   }
  private:
   const DiagGmm &diag_gmm_;
   const MatrixBase<BaseFloat> &data_;
   const VectorBase<BaseFloat> &frame_weights_;
   AccumDiagGmm *dest_accum_;
   AccumDiagGmm accum_;
   double *tot_like_ptr_;
   double tot_like_;
 };


 // Accumulates all rows of "data" (weighted by "frame_weights") under "gmm"
 // into this accumulator using "num_threads" threads, and returns the total
 // weighted log-likelihood gathered by the workers.
 BaseFloat AccumDiagGmm::AccumulateFromDiagMultiThreaded(
     const DiagGmm &gmm,
     const MatrixBase<BaseFloat> &data,
     const VectorBase<BaseFloat> &frame_weights,
     int32 num_threads) {

   double total_log_like = 0.0;

   // This object only serves as the template the workers are copied from.
   AccumulateMultiThreadedClass prototype(gmm, data, frame_weights,
                                          this, &total_log_like);
   {
     // All the work is done by the constructor and destructor of "runner".
     // The enclosing scope makes sure it is destroyed before the total is
     // read below.
     MultiThreader<AccumulateMultiThreadedClass> runner(num_threads,
                                                        prototype);
   }
   return total_log_like;
 }

 // Asserts that "other" holds the same statistics as this accumulator:
 // dimension, number of components and flags must be identical, while the
 // occupancies and both accumulators only need to be approximately equal
 // (ApproxEqual with its default tolerance).
 void AccumDiagGmm::AssertEqual(const AccumDiagGmm &other) {
   // Sizes and flags: exact match required.
   KALDI_ASSERT(dim_ == other.dim_ && num_comp_ == other.num_comp_ &&
                flags_ == other.flags_);
   // Statistics: compared up to a relative tolerance.
   KALDI_ASSERT(occupancy_.ApproxEqual(other.occupancy_));
   KALDI_ASSERT(mean_accumulator_.ApproxEqual(other.mean_accumulator_));
   KALDI_ASSERT(variance_accumulator_.ApproxEqual(other.variance_accumulator_));
 }


 }  // End of namespace kaldi
kaldi::VectorBase::ApproxEqual
bool ApproxEqual(const VectorBase< Real > &other, float tol=0.01) const
Returns true if ((*this)-other).Norm(2.0) <= tol * (*this).Norm(2.0).
Definition: kaldi-vector.cc:556

kaldi
This code computes Goodness of Pronunciation (GOP) and extracts phone-level pronunciation feature for...
Definition: chain.dox:20

kaldi::DiagGmm::Dim
int32 Dim() const
Returns the dimensionality of the Gaussian mean vectors.
Definition: diag-gmm.h:74

kaldi::MapDiagGmmUpdate
void MapDiagGmmUpdate(const MapDiagGmmOptions &config, const AccumDiagGmm &diag_gmm_acc, GmmFlagsType flags, DiagGmm *gmm, BaseFloat *obj_change_out, BaseFloat *count_out)
Maximum A Posteriori estimation of the model.
Definition: mle-diag-gmm.cc:410

kaldi::MleDiagGmmOptions::remove_low_count_gaussians
bool remove_low_count_gaussians
Definition: mle-diag-gmm.h:51

kaldi::AugmentGmmFlags
GmmFlagsType AugmentGmmFlags(GmmFlagsType f)
Returns "augmented" version of flags: e.g.
Definition: model-common.cc:52

kaldi::MapDiagGmmOptions::weight_tau
BaseFloat weight_tau
Tau value for the weights -- this tau value is applied per state, not per Gaussian.
Definition: mle-diag-gmm.h:87

diag-gmm.h

kaldi::AccumDiagGmm::AccumulateFromDiagMultiThreaded
BaseFloat AccumulateFromDiagMultiThreaded(const DiagGmm &gmm, const MatrixBase< BaseFloat > &data, const VectorBase< BaseFloat > &frame_weights, int32 num_threads)
This does the same job as AccumulateFromDiag, but using multiple threads.
Definition: mle-diag-gmm.cc:538

kaldi-thread.h

kaldi::DiagGmmNormal
Definition for Gaussian Mixture Model with diagonal covariances in normal mode: where the parameters ...
Definition: diag-gmm-normal.h:45

kaldi::MatrixBase::NumCols
MatrixIndexT NumCols() const
Returns number of columns (or zero for empty matrix).
Definition: kaldi-matrix.h:67

kaldi::MatrixBase
Base class which provides matrix operations not involving resizing or allocation. ...
Definition: kaldi-matrix.h:49

kaldi::DiagGmm::means_invvars
const Matrix< BaseFloat > & means_invvars() const
Definition: diag-gmm.h:179

kaldi::ReadBasicType
void ReadBasicType(std::istream &is, bool binary, T *t)
ReadBasicType is the name of the read function for bool, integer types, and floating-point types...
Definition: io-funcs-inl.h:55

kaldi::MleDiagGmmOptions::min_gaussian_occupancy
BaseFloat min_gaussian_occupancy
Minimum count below which a Gaussian is not updated (and is removed, if remove_low_count_gaussians ==...
Definition: mle-diag-gmm.h:47

kaldi::MleDiagGmmUpdate
void MleDiagGmmUpdate(const MleDiagGmmOptions &config, const AccumDiagGmm &diag_gmm_acc, GmmFlagsType flags, DiagGmm *gmm, BaseFloat *obj_change_out, BaseFloat *count_out, int32 *floored_elements_out, int32 *floored_gaussians_out, int32 *removed_gaussians_out)
for computing the maximum-likelihood estimates of the parameters of a Gaussian mixture model...
Definition: mle-diag-gmm.cc:275

kaldi::MultiThreader
Definition: kaldi-thread.h:117

mle-diag-gmm.h

kaldi::MatrixBase::ApproxEqual
bool ApproxEqual(const MatrixBase< Real > &other, float tol=0.01) const
Returns true if ((*this)-other).FrobeniusNorm() <= tol * (*this).FrobeniusNorm(). ...
Definition: kaldi-matrix.cc:1915

kaldi::AccumDiagGmm
Definition: mle-diag-gmm.h:106

kaldi::AccumDiagGmm::dim_
int32 dim_
Definition: mle-diag-gmm.h:190

kaldi::MlObjective
BaseFloat MlObjective(const DiagGmm &gmm, const AccumDiagGmm &diag_gmm_acc)
Calc using the DiagGMM exponential form.
Definition: mle-diag-gmm.cc:261

kaldi::DiagGmm::gconsts
const Vector< BaseFloat > & gconsts() const
Const accessors.
Definition: diag-gmm.h:174

kaldi::MatrixBase::AddMat
void AddMat(const Real alpha, const MatrixBase< Real > &M, MatrixTransposeType transA=kNoTrans)
*this += alpha * M [or M^T]
Definition: kaldi-matrix.cc:356

kaldi::AccumDiagGmm::mean_accumulator_
Matrix< double > mean_accumulator_
Definition: mle-diag-gmm.h:196

kaldi::DiagGmm::ComputeGconsts
int32 ComputeGconsts()
Sets the gconsts.
Definition: diag-gmm.cc:114

kaldi::AccumDiagGmm::occupancy
const VectorBase< double > & occupancy() const
Definition: mle-diag-gmm.h:183

kaldi::AccumulateMultiThreadedClass
Definition: mle-diag-gmm.cc:486

kaldi::int32
kaldi::int32 int32
Definition: online-tcp-source.cc:27

kaldi::ReadToken
void ReadToken(std::istream &is, bool binary, std::string *str)
ReadToken gets the next token and puts it in str (exception on failure).
Definition: io-funcs.cc:154

kaldi::Matrix< BaseFloat >

kaldi::GmmFlagsType
uint16 GmmFlagsType
Bitwise OR of the above flags.
Definition: model-common.h:35

kaldi::Vector::Resize
void Resize(MatrixIndexT length, MatrixResizeType resize_type=kSetZero)
Set vector to a specified size (can be zero).
Definition: kaldi-vector.cc:190

kaldi::AccumDiagGmm::num_comp_
int32 num_comp_
Definition: mle-diag-gmm.h:191

kaldi::MatrixBase::CopyFromMat
void CopyFromMat(const MatrixBase< OtherReal > &M, MatrixTransposeType trans=kNoTrans)
Copy given matrix. (no resize is done).
Definition: kaldi-matrix.cc:862

kaldi::MleDiagGmmOptions::min_variance
double min_variance
Minimum allowed variance in any dimension (if no variance floor) It is in double since the variance i...
Definition: mle-diag-gmm.h:50

kaldi::AccumDiagGmm::Scale
void Scale(BaseFloat f, GmmFlagsType flags)
Definition: mle-diag-gmm.cc:131

data_
uint64 data_
Definition: arpa-lm-compiler.cc:108

kaldi::AccumDiagGmm::SmoothWithModel
void SmoothWithModel(BaseFloat tau, const DiagGmm &src_gmm)
Smooths the accumulated counts using the parameters of a given model.
Definition: mle-diag-gmm.cc:240

kaldi::AccumulateMultiThreadedClass::diag_gmm_
const DiagGmm & diag_gmm_
Definition: mle-diag-gmm.cc:528

kaldi::AccumDiagGmm::flags_
GmmFlagsType flags_
Flags corresponding to the accumulators that are stored.
Definition: mle-diag-gmm.h:193

kaldi::kTrans
Definition: matrix-common.h:33

kaldi::DiagGmm::GetVars
void GetVars(Matrix< Real > *v) const
Accessor for covariances.
Definition: diag-gmm-inl.h:115

kaldi::Matrix::Read
void Read(std::istream &in, bool binary, bool add=false)
read from stream.
Definition: kaldi-matrix.cc:1450

kaldi::DiagGmm::ComponentPosteriors
BaseFloat ComponentPosteriors(const VectorBase< BaseFloat > &data, Vector< BaseFloat > *posteriors) const
Computes the posterior probabilities of all Gaussian components given a data point.
Definition: diag-gmm.cc:601

kaldi::BaseFloat
float BaseFloat
Definition: kaldi-types.h:29

kaldi::kGmmMeans
Definition: model-common.h:29

kaldi::MatrixBase::Row
const SubVector< Real > Row(MatrixIndexT i) const
Return specific row of matrix [const].
Definition: kaldi-matrix.h:188

kaldi::AccumulateMultiThreadedClass::data_
const MatrixBase< BaseFloat > & data_
Definition: mle-diag-gmm.cc:529

float

kaldi::kGmmVariances
Definition: model-common.h:30

kaldi::AccumDiagGmm::variance_accumulator
const MatrixBase< double > & variance_accumulator() const
Definition: mle-diag-gmm.h:185

kaldi::MatrixBase::Scale
void Scale(Real alpha)
Multiply each element with a scalar value.
Definition: kaldi-matrix.cc:1209

kaldi::AccumDiagGmm::AccumulateFromDiag
BaseFloat AccumulateFromDiag(const DiagGmm &gmm, const VectorBase< BaseFloat > &data, BaseFloat frame_posterior)
Accumulate for all components given a diagonal-covariance GMM.
Definition: mle-diag-gmm.cc:191

kaldi::AccumDiagGmm::mean_accumulator
const MatrixBase< double > & mean_accumulator() const
Definition: mle-diag-gmm.h:184

kaldi::ExpectToken
void ExpectToken(std::istream &is, bool binary, const char *token)
ExpectToken tries to read in the given token, and throws an exception on failure. ...
Definition: io-funcs.cc:191

kaldi::AccumDiagGmm::Flags
GmmFlagsType Flags() const
Definition: mle-diag-gmm.h:182

kaldi::AccumDiagGmm::AddStatsForComponent
void AddStatsForComponent(int32 comp_id, double occ, const VectorBase< double > &x_stats, const VectorBase< double > &x2_stats)
Increment the stats for this component by the specified amount (not all parts may be taken...
Definition: mle-diag-gmm.cc:158

kaldi::DiagGmm::GetMeans
void GetMeans(Matrix< Real > *m) const
Accessor for means.
Definition: diag-gmm-inl.h:123

kaldi::AccumDiagGmm::Write
void Write(std::ostream &out_stream, bool binary) const
Definition: mle-diag-gmm.cc:77

kaldi::DiagGmm::RemoveComponents
void RemoveComponents(const std::vector< int32 > &gauss, bool renorm_weights)
Removes multiple components from model; "gauss" must not have dups.
Definition: diag-gmm.cc:632

kaldi::AccumDiagGmm::SmoothStats
void SmoothStats(BaseFloat tau)
Smooths the accumulated counts by adding 'tau' extra frames.
Definition: mle-diag-gmm.cc:208

kaldi::AccumDiagGmm::AccumulateForComponent
void AccumulateForComponent(const VectorBase< BaseFloat > &data, int32 comp_index, BaseFloat weight)
Accumulate for a single component, given the posterior.
Definition: mle-diag-gmm.cc:140

KALDI_ERR
#define KALDI_ERR
Definition: kaldi-error.h:147

kaldi::kNoTrans
Definition: matrix-common.h:34

kaldi::AccumDiagGmm::Add
void Add(double scale, const AccumDiagGmm &acc)
Increment with stats from this other accumulator (times scale)
Definition: mle-diag-gmm.cc:399

kaldi::AccumulateMultiThreadedClass::dest_accum_
AccumDiagGmm * dest_accum_
Definition: mle-diag-gmm.cc:531

KALDI_WARN
#define KALDI_WARN
Definition: kaldi-error.h:150

kaldi::TraceMatMat
Real TraceMatMat(const MatrixBase< Real > &A, const MatrixBase< Real > &B, MatrixTransposeType trans)
We need to declare this here as it will be a friend function.
Definition: kaldi-matrix.cc:2692

kaldi::DiagGmmNormal::vars_
Matrix< double > vars_
diagonal variance
Definition: diag-gmm-normal.h:68

kaldi::WriteToken
void WriteToken(std::ostream &os, bool binary, const char *token)
The WriteToken functions are for writing nonempty sequences of non-space characters.
Definition: io-funcs.cc:134

kaldi::DiagGmm::NumGauss
int32 NumGauss() const
Returns the number of mixture components in the GMM.
Definition: diag-gmm.h:72

kaldi::VectorBase::Dim
MatrixIndexT Dim() const
Returns the dimension of the vector.
Definition: kaldi-vector.h:64

kaldi::MatrixBase::SetZero
void SetZero()
Sets matrix to zero.
Definition: kaldi-matrix.cc:1330

kaldi::MleDiagGmmOptions
Configuration variables like variance floor, minimum occupancy, etc.
Definition: mle-diag-gmm.h:38

kaldi::VectorBase::Scale
void Scale(Real alpha)
Multiplies all elements by this constant.
Definition: kaldi-vector.cc:963

kaldi::AccumDiagGmm::occupancy_
Vector< double > occupancy_
Definition: mle-diag-gmm.h:195

kaldi::AccumDiagGmm::Read
void Read(std::istream &in_stream, bool binary, bool add)
Definition: mle-diag-gmm.cc:33

kaldi::AccumDiagGmm::SmoothWithAccum
void SmoothWithAccum(BaseFloat tau, const AccumDiagGmm &src_acc)
Smooths the accumulated counts using some other accumulator.
Definition: mle-diag-gmm.cc:225

kaldi::AccumDiagGmm::SetZero
void SetZero(GmmFlagsType flags)
Definition: mle-diag-gmm.cc:122

kaldi::AccumulateMultiThreadedClass::~AccumulateMultiThreadedClass
~AccumulateMultiThreadedClass()
Definition: mle-diag-gmm.cc:520

kaldi::AccumulateMultiThreadedClass::AccumulateMultiThreadedClass
AccumulateMultiThreadedClass(const DiagGmm &diag_gmm, const MatrixBase< BaseFloat > &data, const VectorBase< BaseFloat > &frame_weights, AccumDiagGmm *accum, double *tot_like)
Definition: mle-diag-gmm.cc:488

kaldi::AccumDiagGmm::Dim
int32 Dim() const
Returns the dimensionality of the feature vectors.
Definition: mle-diag-gmm.h:126

kaldi::MatrixBase::MulRowsVec
void MulRowsVec(const VectorBase< Real > &scale)
Equivalent to (*this) = diag(scale) * (*this).
Definition: kaldi-matrix.cc:1224

rnnlm::i
int i
Definition: mikolov-rnnlm-lib.cc:66

kaldi::MleDiagGmmOptions::variance_floor_vector
Vector< double > variance_floor_vector
Variance floor for each dimension [empty if not supplied].
Definition: mle-diag-gmm.h:41

kaldi::MleDiagGmmOptions::min_gaussian_weight
BaseFloat min_gaussian_weight
Minimum weight below which a Gaussian is not updated (and is removed, if remove_low_count_gaussians == true).
Definition: mle-diag-gmm.h:44

kaldi::DiagGmmNormal::means_
Matrix< double > means_
Means.
Definition: diag-gmm-normal.h:67

kaldi::Vector
A class representing a vector.
Definition: kaldi-vector.h:406

kaldi::VectorBase::InvertElements
void InvertElements()
Invert all elements.
Definition: kaldi-vector.cc:776

kaldi::AccumDiagGmm::variance_accumulator_
Matrix< double > variance_accumulator_
Definition: mle-diag-gmm.h:197

KALDI_ASSERT
#define KALDI_ASSERT(cond)
Definition: kaldi-error.h:185

kaldi::MatrixBase::NumRows
MatrixIndexT NumRows() const
Returns number of rows (or zero for empty matrix).
Definition: kaldi-matrix.h:64

kaldi::VectorBase::ApplyPow
void ApplyPow(Real power)
Take all elements of vector to a power.
Definition: kaldi-vector.h:179

kaldi::MultiThreadable
Definition: kaldi-thread.h:67

kaldi::MatrixBase::AddVecVec
void AddVecVec(const Real alpha, const VectorBase< OtherReal > &a, const VectorBase< OtherReal > &b)
*this += alpha * a * b^T
Definition: kaldi-matrix.cc:129

KALDI_VLOG
#define KALDI_VLOG(v)
Definition: kaldi-error.h:156

kaldi::MatrixBase::CopyRowFromVec
void CopyRowFromVec(const VectorBase< Real > &v, const MatrixIndexT row)
Copy vector into specific row of matrix.
Definition: kaldi-matrix.cc:1081

kaldi::DiagGmm
Definition for Gaussian Mixture Model with diagonal covariances.
Definition: diag-gmm.h:42

kaldi::GmmFlagsToString
std::string GmmFlagsToString(GmmFlagsType flags)
Convert GMM flags to string.
Definition: model-common.cc:43

kaldi::WriteBasicType
void WriteBasicType(std::ostream &os, bool binary, T t)
WriteBasicType is the name of the write function for bool, integer types, and floating-point types...
Definition: io-funcs-inl.h:34

kaldi::Matrix::Resize
void Resize(const MatrixIndexT r, const MatrixIndexT c, MatrixResizeType resize_type=kSetZero, MatrixStrideType stride_type=kDefaultStride)
Sets matrix to a specified size (zero is OK as long as both r and c are zero).
Definition: kaldi-matrix.cc:819

kaldi::AccumulateMultiThreadedClass::frame_weights_
const VectorBase< BaseFloat > & frame_weights_
Definition: mle-diag-gmm.cc:530

kaldi::kGmmWeights
Definition: model-common.h:31

kaldi::AccumulateMultiThreadedClass::tot_like_
double tot_like_
Definition: mle-diag-gmm.cc:534

kaldi::DiagGmmNormal::weights_
Vector< double > weights_
weights (not log).
Definition: diag-gmm-normal.h:66

kaldi::AccumulateMultiThreadedClass::AccumulateMultiThreadedClass
AccumulateMultiThreadedClass(const AccumulateMultiThreadedClass &other)
Definition: mle-diag-gmm.cc:496

kaldi::VectorBase
Provides a vector abstraction class.
Definition: kaldi-vector.h:41

kaldi::VectorBase::Add
void Add(Real c)
Add a constant to each element of a vector.
Definition: kaldi-vector.cc:956

kaldi::VectorBase::SetZero
void SetZero()
Set vector to all zeros.
Definition: kaldi-vector.cc:288

kaldi::AccumDiagGmm::Resize
void Resize(int32 num_gauss, int32 dim, GmmFlagsType flags)
Allocates memory for accumulators.
Definition: mle-diag-gmm.cc:106

kaldi::VecVec
Real VecVec(const VectorBase< Real > &a, const VectorBase< Real > &b)
Returns dot product between a and b.
Definition: kaldi-vector.cc:37

kaldi::VectorBase::AddVec
void AddVec(const Real alpha, const VectorBase< OtherReal > &v)
Add vector : *this = *this + alpha * v (with casting between floats and doubles) ...
Definition: kaldi-vector.cc:1044

kaldi::AccumDiagGmm::AccumulateFromPosteriors
void AccumulateFromPosteriors(const VectorBase< BaseFloat > &data, const VectorBase< BaseFloat > &gauss_posteriors)
Accumulate for all components, given the posteriors.
Definition: mle-diag-gmm.cc:171

kaldi::AccumulateMultiThreadedClass::accum_
AccumDiagGmm accum_
Definition: mle-diag-gmm.cc:532

kaldi::MapDiagGmmOptions::variance_tau
BaseFloat variance_tau
Tau value for the variances.
Definition: mle-diag-gmm.h:83

kaldi::Vector::Read
void Read(std::istream &in, bool binary, bool add=false)
Read function using C++ streams.
Definition: kaldi-vector.cc:1109

kaldi::SubVector
Represents a non-allocating general vector which can be defined as a sub-vector of higher-level vector [or as the row of a matrix].
Definition: kaldi-vector.h:501

kaldi::MapDiagGmmOptions::mean_tau
BaseFloat mean_tau
Tau value for the means.
Definition: mle-diag-gmm.h:78

kaldi::AccumDiagGmm::AssertEqual
void AssertEqual(const AccumDiagGmm &other)
Definition: mle-diag-gmm.cc:558

rnnlm::d
double d
Definition: mikolov-rnnlm-lib.cc:64

kaldi::AccumDiagGmm::AccumDiagGmm
AccumDiagGmm()
Definition: mle-diag-gmm.h:108

kaldi::AccumDiagGmm::NumGauss
int32 NumGauss() const
Returns the number of mixture components.
Definition: mle-diag-gmm.h:124

kaldi::MapDiagGmmOptions
Configuration variables for Maximum A Posteriori (MAP) update.
Definition: mle-diag-gmm.h:76

kaldi::AccumulateMultiThreadedClass::tot_like_ptr_
double * tot_like_ptr_
Definition: mle-diag-gmm.cc:533

kaldi::DiagGmm::inv_vars
const Matrix< BaseFloat > & inv_vars() const
Definition: diag-gmm.h:180

kaldi::DiagGmmNormal::CopyToDiagGmm
void CopyToDiagGmm(DiagGmm *diaggmm, GmmFlagsType flags=kGmmAll) const
Copies to DiagGmm the requested parameters.
Definition: diag-gmm-normal.cc:57