doc/nnet-kl-hmm_8h_source.html

 // nnet/nnet-kl-hmm.h

 // Copyright 2013  Idiap Research Institute (Author: David Imseng)
 //                 Karlsruhe Institute of Technology (Author: Ngoc Thang Vu)
 //                 Brno University of Technology (Author: Karel Vesely)

 // See ../../COPYING for clarification regarding multiple authors
 //
 // Licensed under the Apache License, Version 2.0 (the "License");
 // you may not use this file except in compliance with the License.
 // You may obtain a copy of the License at
 //
 //  http://www.apache.org/licenses/LICENSE-2.0
 //
 // THIS CODE IS PROVIDED *AS IS* BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY
 // KIND, EITHER EXPRESS OR IMPLIED, INCLUDING WITHOUT LIMITATION ANY IMPLIED
 // WARRANTIES OR CONDITIONS OF TITLE, FITNESS FOR A PARTICULAR PURPOSE,
 // MERCHANTABLITY OR NON-INFRINGEMENT.
 // See the Apache 2 License for the specific language governing permissions and
 // limitations under the License.


 #ifndef KALDI_NNET_NNET_KL_HMM_H_
 #define KALDI_NNET_NNET_KL_HMM_H_

 #include <vector>

 #include "nnet/nnet-component.h"
 #include "cudamatrix/cu-math.h"
 #include "cudamatrix/cu-rand.h"
 #include "matrix/kaldi-vector.h"
 #include "matrix/kaldi-matrix.h"

 namespace kaldi {
 namespace nnet1 {

 class KlHmm : public Component {
  public:
   KlHmm(int32 dim_in, int32 dim_out):
     Component(dim_in, dim_out),
     kl_stats_(dim_out, dim_in, kSetZero)
   { }

   ~KlHmm()
   { }

   Component* Copy() const { return new KlHmm(*this); }
   ComponentType GetType() const { return kKlHmm; }

   void PropagateFnc(const CuMatrixBase<BaseFloat> &in,
                     CuMatrixBase<BaseFloat> *out) {
     if (kl_inv_q_.NumRows() == 0) {
       // Copy the CudaMatrix to a Matrix
       Matrix<BaseFloat> in_tmp(in.NumRows(), in.NumCols());
       in.CopyToMat(&in_tmp);
       // Check if there are posteriors in the Matrix (check on first row),
       BaseFloat post_sum = in_tmp.Row(0).Sum();
       KALDI_ASSERT(ApproxEqual(post_sum, 1.0));
       // Get a tmp Matrix of the stats
       Matrix<BaseFloat> kl_stats_tmp(kl_stats_);
       // Init a vector to get the sum of the rows (for normalization)
       Vector<BaseFloat> row_sum(kl_stats_.NumRows(), kSetZero);
       // Get the sum of the posteriors for normalization
       row_sum.AddColSumMat(1, kl_stats_tmp);
       // Apply floor to make sure there is no zero
       row_sum.ApplyFloor(1e-20);
       // Invert the sum (to normalize)
       row_sum.InvertElements();
       // Normalizing the statistics vector
       kl_stats_tmp.MulRowsVec(row_sum);
       // Apply floor before inversion and logarithm
       kl_stats_tmp.ApplyFloor(1e-20);
       // Apply invesion
       kl_stats_tmp.InvertElements();
       // Apply logarithm
       kl_stats_tmp.ApplyLog();
       // Inverted and logged values
       kl_inv_q_.Resize(kl_stats_.NumRows(), kl_stats_.NumCols());
       // Holds now log (1/Q)
       kl_inv_q_.CopyFromMat(kl_stats_tmp);
     }
     // Get the logarithm of the features for the Entropy calculation
     // Copy the CudaMatrix to a Matrix
     Matrix<BaseFloat> in_log_tmp(in.NumRows(), in.NumCols());
     in.CopyToMat(&in_log_tmp);
     // Flooring and log
     in_log_tmp.ApplyFloor(1e-20);
     in_log_tmp.ApplyLog();
     CuMatrix<BaseFloat> log_in(in.NumRows(), in.NumCols());
     log_in.CopyFromMat(in_log_tmp);
     // P*logP
     CuMatrix<BaseFloat> tmp_entropy(in);
     tmp_entropy.MulElements(log_in);
     // Getting the entropy (sum P*logP)
     CuVector<BaseFloat> in_entropy(in.NumRows(), kSetZero);
     in_entropy.AddColSumMat(1, tmp_entropy);
     // sum P*log (1/Q)
     out->AddMatMat(1, in, kNoTrans, kl_inv_q_, kTrans, 0);
     // (sum P*logP) + (sum P*log(1/Q)
     out->AddVecToCols(1, in_entropy);
     // return the negative KL-divergence
     out->Scale(-1);
   }

   void BackpropagateFnc(const CuMatrixBase<BaseFloat> &in,
                         const CuMatrixBase<BaseFloat> &out,
                         const CuMatrixBase<BaseFloat> &out_diff,
                         CuMatrixBase<BaseFloat> *in_diff) {
     KALDI_ERR << "Unimplemented";
   }

   void ReadData(std::istream &is, bool binary) {
     kl_stats_.Read(is, binary);
     KALDI_ASSERT(kl_stats_.NumRows() == output_dim_);
     KALDI_ASSERT(kl_stats_.NumCols() == input_dim_);
   }

   void WriteData(std::ostream &os, bool binary) const {
     kl_stats_.Write(os, binary);
   }

   void SetStats(const Matrix<BaseFloat> mat) {
     KALDI_ASSERT(mat.NumRows() == output_dim_);
     KALDI_ASSERT(mat.NumCols() == input_dim_);
     kl_stats_.Resize(mat.NumRows(), mat.NumCols());
     kl_stats_.CopyFromMat(mat);
   }

   void Accumulate(const Matrix<BaseFloat> &posteriors,
                   const std::vector<int32> &alignment) {
     KALDI_ASSERT(posteriors.NumRows() == alignment.size());
     KALDI_ASSERT(posteriors.NumCols() == kl_stats_.NumCols());
     int32 num_frames = alignment.size();
     for (int32 i = 0; i < num_frames; i++) {
       // Casting float posterior to double (fixing numerical issue),
       Vector<double> temp(posteriors.Row(i));
       // Sum the postiors grouped by states from the alignment,
       kl_stats_.Row(alignment[i]).AddVec(1, temp);
     }
   }

  private:
   Matrix<double> kl_stats_;
   CuMatrix<BaseFloat> kl_inv_q_;
 };

 }  // namespace nnet1
 }  // namespace kaldi

 #endif  // KALDI_NNET_NNET_KL_HMM_H_

kaldi::MatrixBase::ApplyLog
void ApplyLog()
Definition: kaldi-matrix.h:374

kaldi::CuMatrixBase::CopyFromMat
void CopyFromMat(const MatrixBase< OtherReal > &src, MatrixTransposeType trans=kNoTrans)
Definition: cu-matrix.cc:344

kaldi
This code computes Goodness of Pronunciation (GOP) and extracts phone-level pronunciation feature for...
Definition: chain.dox:20

kaldi::nnet1::KlHmm::PropagateFnc
void PropagateFnc(const CuMatrixBase< BaseFloat > &in, CuMatrixBase< BaseFloat > *out)
Abstract interface for propagation/backpropagation.
Definition: nnet-kl-hmm.h:50

cu-rand.h

kaldi::MatrixBase::Write
void Write(std::ostream &out, bool binary) const
write to stream.
Definition: kaldi-matrix.cc:1379

kaldi::nnet1::KlHmm::SetStats
void SetStats(const Matrix< BaseFloat > mat)
Set the statistics matrix.
Definition: nnet-kl-hmm.h:125

kaldi::CuVector
Definition: matrix-common.h:74

kaldi::nnet1::Component::input_dim_
int32 input_dim_
Data members,.
Definition: nnet-component.h:190

kaldi::CuMatrixBase::CopyToMat
void CopyToMat(MatrixBase< OtherReal > *dst, MatrixTransposeType trans=kNoTrans) const
Definition: cu-matrix.cc:447

kaldi::MatrixBase::NumCols
MatrixIndexT NumCols() const
Returns number of columns (or zero for empty matrix).
Definition: kaldi-matrix.h:67

kaldi-matrix.h

kaldi::nnet1::KlHmm::kl_inv_q_
CuMatrix< BaseFloat > kl_inv_q_
Definition: nnet-kl-hmm.h:148

kaldi::CuMatrixBase::AddVecToCols
void AddVecToCols(Real alpha, const CuVectorBase< Real > &col, Real beta=1.0)
(for each column c of *this), c = alpha * col + beta * c
Definition: cu-matrix.cc:1232

kaldi::int32
kaldi::int32 int32
Definition: online-tcp-source.cc:27

kaldi::Matrix< BaseFloat >

kaldi::CuMatrix
This class represents a matrix that's stored on the GPU if we have one, and in memory if not...
Definition: matrix-common.h:71

nnet-component.h

kaldi::MatrixBase::CopyFromMat
void CopyFromMat(const MatrixBase< OtherReal > &M, MatrixTransposeType trans=kNoTrans)
Copy given matrix. (no resize is done).
Definition: kaldi-matrix.cc:862

kaldi::nnet1::KlHmm::GetType
ComponentType GetType() const
Get Type Identification of the component,.
Definition: nnet-kl-hmm.h:48

kaldi::nnet1::Component::ComponentType
ComponentType
Component type identification mechanism,.
Definition: nnet-component.h:47

kaldi::kTrans
Definition: matrix-common.h:33

kaldi::nnet1::KlHmm::ReadData
void ReadData(std::istream &is, bool binary)
Reads the component content.
Definition: nnet-kl-hmm.h:113

kaldi::CuMatrixBase::Scale
void Scale(Real value)
Definition: cu-matrix.cc:644

kaldi::Matrix::Read
void Read(std::istream &in, bool binary, bool add=false)
read from stream.
Definition: kaldi-matrix.cc:1450

kaldi::nnet1::KlHmm::~KlHmm
~KlHmm()
Definition: nnet-kl-hmm.h:44

kaldi::MatrixBase::Row
const SubVector< Real > Row(MatrixIndexT i) const
Return specific row of matrix [const].
Definition: kaldi-matrix.h:188

kaldi::nnet1::Component::kKlHmm
Definition: nnet-component.h:77

float

kaldi::CuVectorBase::AddColSumMat
void AddColSumMat(Real alpha, const CuMatrixBase< Real > &mat, Real beta=1.0)
Sum the columns of the matrix, add to vector.
Definition: cu-vector.cc:1298

kaldi-vector.h

kaldi::CuMatrixBase::MulElements
void MulElements(const CuMatrixBase< Real > &A)
Multiply two matrices elementwise: C = C .* A.
Definition: cu-matrix.cc:667

KALDI_ERR
#define KALDI_ERR
Definition: kaldi-error.h:147

kaldi::kNoTrans
Definition: matrix-common.h:34

kaldi::nnet1::KlHmm::Accumulate
void Accumulate(const Matrix< BaseFloat > &posteriors, const std::vector< int32 > &alignment)
Accumulate the statistics for KL-HMM parameter estimation.
Definition: nnet-kl-hmm.h:133

kaldi::CuMatrixBase::AddMatMat
void AddMatMat(Real alpha, const CuMatrixBase< Real > &A, MatrixTransposeType transA, const CuMatrixBase< Real > &B, MatrixTransposeType transB, Real beta)
C = alpha * A(^T)*B(^T) + beta * C.
Definition: cu-matrix.cc:1291

kaldi::nnet1::KlHmm
Definition: nnet-kl-hmm.h:37

kaldi::nnet1::Component::output_dim_
int32 output_dim_
Dimension of the output of the Component,.
Definition: nnet-component.h:191

kaldi::MatrixBase::MulRowsVec
void MulRowsVec(const VectorBase< Real > &scale)
Equivalent to (*this) = diag(scale) * (*this).
Definition: kaldi-matrix.cc:1224

rnnlm::i
int i
Definition: mikolov-rnnlm-lib.cc:66

cu-math.h

kaldi::CuMatrixBase
Matrix for CUDA computing.
Definition: matrix-common.h:69

kaldi::CuMatrixBase::NumCols
MatrixIndexT NumCols() const
Definition: cu-matrix.h:216

kaldi::MatrixBase::InvertElements
void InvertElements()
Inverts all the elements of the matrix.
Definition: kaldi-matrix.cc:2070

kaldi::Vector
A class representing a vector.
Definition: kaldi-vector.h:406

kaldi::kSetZero
Definition: matrix-common.h:38

KALDI_ASSERT
#define KALDI_ASSERT(cond)
Definition: kaldi-error.h:185

kaldi::nnet1::KlHmm::BackpropagateFnc
void BackpropagateFnc(const CuMatrixBase< BaseFloat > &in, const CuMatrixBase< BaseFloat > &out, const CuMatrixBase< BaseFloat > &out_diff, CuMatrixBase< BaseFloat > *in_diff)
Backward pass transformation (to be implemented by descending class...)
Definition: nnet-kl-hmm.h:105

kaldi::MatrixBase::NumRows
MatrixIndexT NumRows() const
Returns number of rows (or zero for empty matrix).
Definition: kaldi-matrix.h:64

kaldi::Matrix::Resize
void Resize(const MatrixIndexT r, const MatrixIndexT c, MatrixResizeType resize_type=kSetZero, MatrixStrideType stride_type=kDefaultStride)
Sets matrix to a specified size (zero is OK as long as both r and c are zero).
Definition: kaldi-matrix.cc:819

kaldi::nnet1::Component
Abstract class, building block of the network.
Definition: nnet-component.cc:51

kaldi::nnet1::KlHmm::KlHmm
KlHmm(int32 dim_in, int32 dim_out)
Definition: nnet-kl-hmm.h:39

kaldi::CuMatrixBase::NumRows
MatrixIndexT NumRows() const
Dimensions.
Definition: cu-matrix.h:215

kaldi::VectorBase::AddColSumMat
void AddColSumMat(Real alpha, const MatrixBase< Real > &M, Real beta=1.0)
Does *this = alpha * (sum of columns of M) + beta * *this.
Definition: kaldi-vector.cc:734

kaldi::MatrixBase::ApplyFloor
void ApplyFloor(Real floor_val)
Definition: kaldi-matrix.h:354

kaldi::ApproxEqual
static bool ApproxEqual(float a, float b, float relative_tolerance=0.001)
return abs(a - b) <= relative_tolerance * (abs(a)+abs(b)).
Definition: kaldi-math.h:265

kaldi::nnet1::KlHmm::WriteData
void WriteData(std::ostream &os, bool binary) const
Writes the component content.
Definition: nnet-kl-hmm.h:120

kaldi::nnet1::KlHmm::kl_stats_
Matrix< double > kl_stats_
Definition: nnet-kl-hmm.h:147

kaldi::nnet1::KlHmm::Copy
Component * Copy() const
Copy component (deep copy),.
Definition: nnet-kl-hmm.h:47