doc/lda-estimate_8cc_source.html

 // transform/lda-estimate.cc

 // Copyright 2009-2011  Jan Silovsky
 //                2013  Johns Hopkins University

 // See ../../COPYING for clarification regarding multiple authors
 //
 // Licensed under the Apache License, Version 2.0 (the "License");
 // you may not use this file except in compliance with the License.
 // You may obtain a copy of the License at
 //
 //  http://www.apache.org/licenses/LICENSE-2.0
 //
 // THIS CODE IS PROVIDED *AS IS* BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY
 // KIND, EITHER EXPRESS OR IMPLIED, INCLUDING WITHOUT LIMITATION ANY IMPLIED
 // WARRANTIES OR CONDITIONS OF TITLE, FITNESS FOR A PARTICULAR PURPOSE,
 // MERCHANTABILITY OR NON-INFRINGEMENT.
 // See the Apache 2 License for the specific language governing permissions and
 // limitations under the License.


 #include "transform/lda-estimate.h"

 namespace kaldi {

 // Sizes the three accumulators for num_classes classes and feature vectors
 // of length dimension.  Each Resize() is called with its default resize type.
 void LdaEstimate::Init(int32 num_classes, int32 dimension) {
   // Second-order statistics: a single dimension x dimension symmetric matrix
   // shared by all classes.
   total_second_acc_.Resize(dimension);
   // First-order statistics: one row per class.
   first_acc_.Resize(num_classes, dimension);
   // Zeroth-order statistics: one entry per class.
   zero_acc_.Resize(num_classes);
 }

 // Clears all accumulated statistics; the accumulator sizes are left as-is.
 void LdaEstimate::ZeroAccumulators() {
   total_second_acc_.SetZero();
   first_acc_.SetZero();
   zero_acc_.SetZero();
 }

 // Multiplies every accumulator (zeroth-, first- and second-order) by f.
 void LdaEstimate::Scale(BaseFloat f) {
   // The accumulators are stored in double precision, so widen the factor once.
   const double factor = static_cast<double>(f);
   total_second_acc_.Scale(factor);
   first_acc_.Scale(factor);
   zero_acc_.Scale(factor);
 }

 void LdaEstimate::Accumulate(const VectorBase<BaseFloat> &data,
                              int32 class_id, BaseFloat weight) {
   KALDI_ASSERT(class_id >= 0);
   KALDI_ASSERT(class_id < NumClasses() && data.Dim() == Dim());

   Vector<double> data_d(data);

   zero_acc_(class_id) += weight;
   first_acc_.Row(class_id).AddVec(weight, data_d);
   total_second_acc_.AddVec2(weight, data_d);
 }

 // Converts the raw accumulators into normalized statistics.
 //   total_covar    output: (second-order stats / total count) minus the outer
 //                  product of the global mean with itself.
 //   between_covar  output: count-weighted sum of the outer products of the
 //                  class means, minus the outer product of the global mean.
 //   total_mean     output: sum of all first-order stats / total count.
 //   tot_count      output: sum of the zeroth-order stats.
 // All outputs are resized here.  Classes whose count is exactly zero are
 // skipped when forming between_covar.
 void LdaEstimate::GetStats(SpMatrix<double> *total_covar,
                            SpMatrix<double> *between_covar,
                            Vector<double> *total_mean,
                            double *tot_count) const {
   const int32 feat_dim = Dim();
   const int32 class_count = NumClasses();
   const double sum = zero_acc_.Sum();
   *tot_count = sum;

   // Global mean.
   total_mean->Resize(feat_dim);
   total_mean->AddRowSumMat(1.0, first_acc_);
   total_mean->Scale(1.0 / sum);

   // Total covariance: E[x x^T] - mean mean^T.
   total_covar->Resize(feat_dim);
   total_covar->CopyFromSp(total_second_acc_);
   total_covar->Scale(1.0 / sum);
   total_covar->AddVec2(-1.0, *total_mean);

   // Between-class covariance: sum_c p(c) mean_c mean_c^T - mean mean^T.
   between_covar->Resize(feat_dim);
   Vector<double> mean_c(feat_dim);
   for (int32 c = 0; c < class_count; c++) {
     if (zero_acc_(c) == 0.0)
       continue;  // class has no data, so it has no mean to contribute
     mean_c.CopyRowFromMat(first_acc_, c);
     mean_c.Scale(1.0 / zero_acc_(c));
     between_covar->AddVec2(zero_acc_(c) / sum, mean_c);
   }
   between_covar->AddVec2(-1.0, *total_mean);
 }


 void LdaEstimate::Estimate(const LdaEstimateOptions &opts,
                            Matrix<BaseFloat> *m,
                            Matrix<BaseFloat> *mfull) const {
   int32 target_dim = opts.dim;
   KALDI_ASSERT(target_dim > 0);
   // between-class covar is of most rank C-1
   KALDI_ASSERT(target_dim <= Dim() && (target_dim < NumClasses() || opts.allow_large_dim));
   int32 dim = Dim();

   double count;
   SpMatrix<double> total_covar, bc_covar;
   Vector<double> total_mean;
   GetStats(&total_covar, &bc_covar, &total_mean, &count);

   // within-class covariance
   SpMatrix<double> wc_covar(total_covar);
   wc_covar.AddSp(-1.0, bc_covar);
   TpMatrix<double> wc_covar_sqrt(dim);
   try {
     wc_covar_sqrt.Cholesky(wc_covar);
   } catch (...) {
     BaseFloat smooth = 1.0e-03 * wc_covar.Trace() / wc_covar.NumRows();
     KALDI_LOG << "Cholesky failed (possibly not +ve definite), so adding " << smooth
               << " to diagonal and trying again.\n";
     for (int32 i = 0; i < wc_covar.NumRows(); i++)
       wc_covar(i, i) += smooth;
     wc_covar_sqrt.Cholesky(wc_covar);
   }
   Matrix<double> wc_covar_sqrt_mat(wc_covar_sqrt);
   // copy wc_covar_sqrt to Matrix, because it facilitates further use
   wc_covar_sqrt_mat.Invert();

   SpMatrix<double> tmp_sp(dim);
   tmp_sp.AddMat2Sp(1.0, wc_covar_sqrt_mat, kNoTrans, bc_covar, 0.0);
   Matrix<double> tmp_mat(tmp_sp);

   Matrix<double> svd_u(dim, dim), svd_vt(dim, dim);
   Vector<double> svd_d(dim);
   tmp_mat.Svd(&svd_d, &svd_u, &svd_vt);
   SortSvd(&svd_d, &svd_u);

   KALDI_LOG << "Data count is " << count;
   KALDI_LOG << "LDA singular values are " << svd_d;

   KALDI_LOG << "Sum of all singular values is " << svd_d.Sum();
   KALDI_LOG << "Sum of selected singular values is " <<
       SubVector<double>(svd_d, 0, target_dim).Sum();

   Matrix<double> lda_mat(dim, dim);
   lda_mat.AddMatMat(1.0, svd_u, kTrans, wc_covar_sqrt_mat, kNoTrans, 0.0);

   // finally, copy first target_dim rows to m
   m->Resize(target_dim, dim);
   m->CopyFromMat(lda_mat.Range(0, target_dim, 0, dim));

   if (mfull != NULL) {
     mfull->Resize(dim, dim);
     mfull->CopyFromMat(lda_mat);
   }

   if (opts.within_class_factor != 1.0) { // This is not the normal code path;
     // it's intended for use in neural net inputs.
     for (int32 i = 0; i < svd_d.Dim(); i++) {
       BaseFloat old_var = 1.0 + svd_d(i), // the total variance of that dim..
           new_var = opts.within_class_factor + svd_d(i), // the variance we want..
           scale = sqrt(new_var / old_var);
       if (i < m->NumRows())
         m->Row(i).Scale(scale);
       if (mfull != NULL)
         mfull->Row(i).Scale(scale);
     }
   }

   if (opts.remove_offset) {
     AddMeanOffset(total_mean, m);
     if (mfull != NULL)
       AddMeanOffset(total_mean, mfull);
   }
 }

 // static
 void LdaEstimate::AddMeanOffset(const VectorBase<double> &mean_dbl,
                                 Matrix<BaseFloat> *projection) {
   Vector<BaseFloat> mean(mean_dbl);
   Vector<BaseFloat> neg_projected_mean(projection->NumRows());
   // the negative
   neg_projected_mean.AddMatVec(-1.0, *projection, kNoTrans, mean, 0.0);
   projection->Resize(projection->NumRows(),
                      projection->NumCols() + 1,
                      kCopyData);
   projection->CopyColFromVec(neg_projected_mean, projection->NumCols() - 1);
 }


 // Reads accumulators in the format produced by Write().
 //   in_stream  input stream; reading starts at the "<LDAACCS>" token.
 //   binary     passed through to the token, basic-type and matrix readers.
 //   add        if true, the statistics read are added to the current ones;
 //              the sizes in the stream must then match unless this object is
 //              still empty (NumClasses() == 0 and Dim() == 0), in which case
 //              it is initialized from the stream.  If false, the object is
 //              re-initialized and the stream contents replace the statistics.
 // Raises KALDI_ERR on a size mismatch in add mode, on an unexpected token,
 // and when "<SECOND_ACCS>" appears before zeroth- and first-order sections
 // of the expected size have been read.
 void LdaEstimate::Read(std::istream &in_stream, bool binary, bool add) {
   int32 num_classes, dim;
   std::string token;

   ExpectToken(in_stream, binary, "<LDAACCS>");
   ExpectToken(in_stream, binary, "<VECSIZE>");
   ReadBasicType(in_stream, binary, &dim);
   ExpectToken(in_stream, binary, "<NUMCLASSES>");
   ReadBasicType(in_stream, binary, &num_classes);

   // Only an add into an already-sized object keeps the existing accumulators;
   // every other case (re)allocates them from the sizes in the stream.
   const bool already_sized = (NumClasses() != 0 || Dim() != 0);
   if (add && already_sized) {
     if (num_classes != NumClasses() || dim != Dim()) {
       KALDI_ERR <<"LdaEstimate::Read, dimension or classes count mismatch, "
                 <<(NumClasses()) << ", " <<(Dim()) << ", "
                 << " vs. " <<(num_classes) << ", " << (dim);
     }
   } else {
     Init(num_classes, dim);
   }

   // The second-order stats are stored with sum_c (1/n_c) f_c f_c^T removed
   // (see Write()); the zeroth- and first-order stats read from this stream
   // are kept in these temporaries so that the term can be added back.
   Vector<double> tmp_zero_acc;
   Matrix<double> tmp_first_acc;
   SpMatrix<double> tmp_sec_acc;

   ReadToken(in_stream, binary, &token);
   while (token != "</LDAACCS>") {
     if (token == "<ZERO_ACCS>") {
       tmp_zero_acc.Read(in_stream, binary, false);
       if (!add) zero_acc_.SetZero();
       zero_acc_.AddVec(1.0, tmp_zero_acc);
     } else if (token == "<FIRST_ACCS>") {
       tmp_first_acc.Read(in_stream, binary, false);
       if (!add) first_acc_.SetZero();
       first_acc_.AddMat(1.0, tmp_first_acc);
     } else if (token == "<SECOND_ACCS>") {
       tmp_sec_acc.Read(in_stream, binary, false);
       // The loop below indexes the temporaries for every class, so they must
       // already hold this stream's zeroth- and first-order stats.  Without
       // this check a stream with the sections missing or out of order would
       // index empty temporaries.
       if (tmp_zero_acc.Dim() != NumClasses() ||
           tmp_first_acc.NumRows() != NumClasses()) {
         KALDI_ERR << "LdaEstimate::Read, <SECOND_ACCS> must be preceded by "
                   << "<ZERO_ACCS> and <FIRST_ACCS> with one entry per class";
       }
       for (int32 c = 0; c < NumClasses(); c++) {
         if (tmp_zero_acc(c) != 0)
           tmp_sec_acc.AddVec2(1.0 / tmp_zero_acc(c), tmp_first_acc.Row(c));
       }
       if (!add) total_second_acc_.SetZero();
       total_second_acc_.AddSp(1.0, tmp_sec_acc);
     } else {
       KALDI_ERR << "Unexpected token '" << token << "' in file ";
     }
     ReadToken(in_stream, binary, &token);
   }
 }

 void LdaEstimate::Write(std::ostream &out_stream, bool binary) const {
   WriteToken(out_stream, binary, "<LDAACCS>");
   WriteToken(out_stream, binary, "<VECSIZE>");
   WriteBasicType(out_stream, binary, static_cast<int32>(Dim()));
   WriteToken(out_stream, binary, "<NUMCLASSES>");
   WriteBasicType(out_stream, binary, static_cast<int32>(NumClasses()));

   WriteToken(out_stream, binary, "<ZERO_ACCS>");
   Vector<BaseFloat> zero_acc_bf(zero_acc_);
   zero_acc_bf.Write(out_stream, binary);
   WriteToken(out_stream, binary, "<FIRST_ACCS>");
   Matrix<BaseFloat> first_acc_bf(first_acc_);
   first_acc_bf.Write(out_stream, binary);
   WriteToken(out_stream, binary, "<SECOND_ACCS>");
   SpMatrix<double> tmp_sec_acc(total_second_acc_);
   for (int32 c = 0; c < static_cast<int32>(NumClasses()); c++) {
     if (zero_acc_(c) != 0)
       tmp_sec_acc.AddVec2(-1.0 / zero_acc_(c), first_acc_.Row(c));
   }
   SpMatrix<BaseFloat> tmp_sec_acc_bf(tmp_sec_acc);
   tmp_sec_acc_bf.Write(out_stream, binary);

   WriteToken(out_stream, binary, "</LDAACCS>");
 }


 }  // End of namespace kaldi
kaldi::LdaEstimate::Accumulate
void Accumulate(const VectorBase< BaseFloat > &data, int32 class_id, BaseFloat weight=1.0)
Accumulates data.
Definition: lda-estimate.cc:45

kaldi
This code computes Goodness of Pronunciation (GOP) and extracts phone-level pronunciation feature for...
Definition: chain.dox:20

kaldi::SpMatrix< double >

kaldi::MatrixBase::Write
void Write(std::ostream &out, bool binary) const
write to stream.
Definition: kaldi-matrix.cc:1379

kaldi::MatrixBase::CopyColFromVec
void CopyColFromVec(const VectorBase< Real > &v, const MatrixIndexT col)
Copy vector into specific column of matrix.
Definition: kaldi-matrix.cc:1102

kaldi::PackedMatrix::Scale
void Scale(Real c)
Definition: packed-matrix.cc:33

kaldi::PackedMatrix::Read
void Read(std::istream &in, bool binary, bool add=false)
Definition: packed-matrix.cc:298

kaldi::VectorBase::AddRowSumMat
void AddRowSumMat(Real alpha, const MatrixBase< Real > &M, Real beta=1.0)
Does *this = alpha * (sum of rows of M) + beta * *this.
Definition: kaldi-vector.cc:714

kaldi::PackedMatrix::Write
void Write(std::ostream &out, bool binary) const
Definition: packed-matrix.cc:236

kaldi::LdaEstimateOptions::allow_large_dim
bool allow_large_dim
Definition: lda-estimate.h:32

kaldi::MatrixBase::NumCols
MatrixIndexT NumCols() const
Returns number of columns (or zero for empty matrix).
Definition: kaldi-matrix.h:67

kaldi::LdaEstimate::Dim
int32 Dim() const
Returns the dimensionality of the feature vectors.
Definition: lda-estimate.h:66

kaldi::ReadBasicType
void ReadBasicType(std::istream &is, bool binary, T *t)
ReadBasicType is the name of the read function for bool, integer types, and floating-point types...
Definition: io-funcs-inl.h:55

kaldi::SpMatrix::Trace
Real Trace() const
Definition: sp-matrix.cc:171

kaldi::PackedMatrix::SetZero
void SetZero()
Definition: packed-matrix.cc:207

kaldi::VectorBase::Write
void Write(std::ostream &Out, bool binary) const
Writes to C++ stream (option to write in binary).
Definition: kaldi-vector.cc:1231

kaldi::LdaEstimateOptions::remove_offset
bool remove_offset
Definition: lda-estimate.h:30

kaldi::LdaEstimate::Scale
void Scale(BaseFloat f)
Scales all accumulators.
Definition: lda-estimate.cc:38

kaldi::LdaEstimate::first_acc_
Matrix< double > first_acc_
Definition: lda-estimate.h:94

kaldi::LdaEstimate::Write
void Write(std::ostream &out_stream, bool binary) const
Definition: lda-estimate.cc:237

kaldi::MatrixBase::AddMat
void AddMat(const Real alpha, const MatrixBase< Real > &M, MatrixTransposeType transA=kNoTrans)
*this += alpha * M [or M^T]
Definition: kaldi-matrix.cc:356

kaldi::int32
kaldi::int32 int32
Definition: online-tcp-source.cc:27

kaldi::ReadToken
void ReadToken(std::istream &is, bool binary, std::string *str)
ReadToken gets the next token and puts it in str (exception on failure).
Definition: io-funcs.cc:154

kaldi::Matrix< BaseFloat >

kaldi::Vector::Resize
void Resize(MatrixIndexT length, MatrixResizeType resize_type=kSetZero)
Set vector to a specified size (can be zero).
Definition: kaldi-vector.cc:190

kaldi::LdaEstimate::Init
void Init(int32 num_classes, int32 dimension)
Allocates memory for accumulators.
Definition: lda-estimate.cc:26

kaldi::MatrixBase::CopyFromMat
void CopyFromMat(const MatrixBase< OtherReal > &M, MatrixTransposeType trans=kNoTrans)
Copy given matrix. (no resize is done).
Definition: kaldi-matrix.cc:862

kaldi::PackedMatrix::NumRows
MatrixIndexT NumRows() const
Definition: packed-matrix.h:104

kaldi::LdaEstimate::zero_acc_
Vector< double > zero_acc_
Definition: lda-estimate.h:93

kaldi::SpMatrix::CopyFromSp
void CopyFromSp(const SpMatrix< Real > &other)
Definition: sp-matrix.h:85

kaldi::VectorBase::CopyRowFromMat
void CopyRowFromMat(const MatrixBase< Real > &M, MatrixIndexT row)
Extracts a row of the matrix M.
Definition: kaldi-vector.cc:407

kaldi::kTrans
Definition: matrix-common.h:33

count
const size_t count
Definition: arpa-file-parser-test.cc:66

kaldi::SpMatrix::AddVec2
void AddVec2(const Real alpha, const VectorBase< OtherReal > &v)
rank-one update, this <– this + alpha v v'
Definition: sp-matrix.cc:946

kaldi::Matrix::Read
void Read(std::istream &in, bool binary, bool add=false)
read from stream.
Definition: kaldi-matrix.cc:1450

kaldi::TpMatrix::Cholesky
void Cholesky(const SpMatrix< Real > &orig)
Definition: tp-matrix.cc:88

kaldi::LdaEstimate::Estimate
void Estimate(const LdaEstimateOptions &opts, Matrix< BaseFloat > *M, Matrix< BaseFloat > *Mfull=NULL) const
Estimates the LDA transform matrix m.
Definition: lda-estimate.cc:85

kaldi::MatrixBase::Row
const SubVector< Real > Row(MatrixIndexT i) const
Return specific row of matrix [const].
Definition: kaldi-matrix.h:188

float

lda-estimate.h

kaldi::LdaEstimate::Read
void Read(std::istream &in_stream, bool binary, bool add)
Definition: lda-estimate.cc:180

kaldi::MatrixBase::Scale
void Scale(Real alpha)
Multiply each element with a scalar value.
Definition: kaldi-matrix.cc:1209

kaldi::SpMatrix::AddSp
void AddSp(const Real alpha, const SpMatrix< Real > &Ma)
Definition: sp-matrix.h:211

kaldi::LdaEstimateOptions::dim
int32 dim
Definition: lda-estimate.h:31

kaldi::ExpectToken
void ExpectToken(std::istream &is, bool binary, const char *token)
ExpectToken tries to read in the given token, and throws an exception on failure. ...
Definition: io-funcs.cc:191

kaldi::LdaEstimate::AddMeanOffset
static void AddMeanOffset(const VectorBase< double > &total_mean, Matrix< BaseFloat > *projection)
This function modifies the LDA matrix so that it also subtracts the mean feature value.
Definition: lda-estimate.cc:166

kaldi::MatrixBase::AddMatMat
void AddMatMat(const Real alpha, const MatrixBase< Real > &A, MatrixTransposeType transA, const MatrixBase< Real > &B, MatrixTransposeType transB, const Real beta)
Definition: kaldi-matrix.cc:171

KALDI_ERR
#define KALDI_ERR
Definition: kaldi-error.h:147

kaldi::kNoTrans
Definition: matrix-common.h:34

kaldi::TpMatrix< double >

kaldi::LdaEstimateOptions::within_class_factor
BaseFloat within_class_factor
Definition: lda-estimate.h:33

kaldi::WriteToken
void WriteToken(std::ostream &os, bool binary, const char *token)
The WriteToken functions are for writing nonempty sequences of non-space characters.
Definition: io-funcs.cc:134

kaldi::VectorBase::Dim
MatrixIndexT Dim() const
Returns the dimension of the vector.
Definition: kaldi-vector.h:64

kaldi::MatrixBase::SetZero
void SetZero()
Sets matrix to zero.
Definition: kaldi-matrix.cc:1330

kaldi::VectorBase::Scale
void Scale(Real alpha)
Multiplies all elements by this constant.
Definition: kaldi-vector.cc:963

kaldi::VectorBase::AddMatVec
void AddMatVec(const Real alpha, const MatrixBase< Real > &M, const MatrixTransposeType trans, const VectorBase< Real > &v, const Real beta)
Add matrix times vector : this <– beta*this + alpha*M*v.
Definition: kaldi-vector.cc:92

kaldi::LdaEstimate::NumClasses
int32 NumClasses() const
Returns the number of classes.
Definition: lda-estimate.h:64

kaldi::LdaEstimate::GetStats
void GetStats(SpMatrix< double > *total_covar, SpMatrix< double > *between_covar, Vector< double > *total_mean, double *sum) const
Extract a more processed form of the stats.
Definition: lda-estimate.cc:57

kaldi::kCopyData
Definition: matrix-common.h:40

kaldi::VectorBase::Sum
Real Sum() const
Returns sum of the elements.
Definition: kaldi-vector.cc:688

rnnlm::i
int i
Definition: mikolov-rnnlm-lib.cc:66

kaldi::Vector< double >

KALDI_ASSERT
#define KALDI_ASSERT(cond)
Definition: kaldi-error.h:185

kaldi::MatrixBase::NumRows
MatrixIndexT NumRows() const
Returns number of rows (or zero for empty matrix).
Definition: kaldi-matrix.h:64

kaldi::SpMatrix::AddMat2Sp
void AddMat2Sp(const Real alpha, const MatrixBase< Real > &M, MatrixTransposeType transM, const SpMatrix< Real > &A, const Real beta=0.0)
Extension of rank-N update: this <– beta*this + alpha * M * A * M^T.
Definition: sp-matrix.cc:982

kaldi::LdaEstimate::total_second_acc_
SpMatrix< double > total_second_acc_
Definition: lda-estimate.h:95

kaldi::MatrixBase::Range
SubMatrix< Real > Range(const MatrixIndexT row_offset, const MatrixIndexT num_rows, const MatrixIndexT col_offset, const MatrixIndexT num_cols) const
Return a sub-part of matrix.
Definition: kaldi-matrix.h:202

kaldi::WriteBasicType
void WriteBasicType(std::ostream &os, bool binary, T t)
WriteBasicType is the name of the write function for bool, integer types, and floating-point types...
Definition: io-funcs-inl.h:34

kaldi::Matrix::Resize
void Resize(const MatrixIndexT r, const MatrixIndexT c, MatrixResizeType resize_type=kSetZero, MatrixStrideType stride_type=kDefaultStride)
Sets matrix to a specified size (zero is OK as long as both r and c are zero).
Definition: kaldi-matrix.cc:819

kaldi::MatrixBase::Svd
void Svd(VectorBase< Real > *s, MatrixBase< Real > *U, MatrixBase< Real > *Vt) const
Compute SVD (*this) = U diag(s) Vt.
Definition: kaldi-matrix.cc:1825

kaldi::LdaEstimate::ZeroAccumulators
void ZeroAccumulators()
Sets all accumulators to zero.
Definition: lda-estimate.cc:32

kaldi::SpMatrix::Resize
void Resize(MatrixIndexT nRows, MatrixResizeType resize_type=kSetZero)
Definition: sp-matrix.h:81

kaldi::MatrixBase::Invert
void Invert(Real *log_det=NULL, Real *det_sign=NULL, bool inverse_needed=true)
matrix inverse.
Definition: kaldi-matrix.cc:38

kaldi::VectorBase
Provides a vector abstraction class.
Definition: kaldi-vector.h:41

kaldi::LdaEstimateOptions
Definition: lda-estimate.h:29

kaldi::VectorBase::SetZero
void SetZero()
Set vector to all zeros.
Definition: kaldi-vector.cc:288

KALDI_LOG
#define KALDI_LOG
Definition: kaldi-error.h:153

kaldi::VectorBase::AddVec
void AddVec(const Real alpha, const VectorBase< OtherReal > &v)
Add vector : *this = *this + alpha * rv (with casting between floats and doubles) ...
Definition: kaldi-vector.cc:1044

kaldi::Vector::Read
void Read(std::istream &in, bool binary, bool add=false)
Read function using C++ streams.
Definition: kaldi-vector.cc:1109

kaldi::SubVector
Represents a non-allocating general vector which can be defined as a sub-vector of higher-level vecto...
Definition: kaldi-vector.h:501

kaldi::SortSvd
void SortSvd(VectorBase< Real > *s, MatrixBase< Real > *U, MatrixBase< Real > *Vt, bool sort_on_absolute_value)
Function to ensure that SVD is sorted.
Definition: kaldi-matrix.cc:2580

rnnlm::d
double d
Definition: mikolov-rnnlm-lib.cc:64