doc/nnet-utils_8h_source.html

 // nnet/nnet-utils.h

 // Copyright 2015  Brno University of Technology (author: Karel Vesely)

 // See ../../COPYING for clarification regarding multiple authors
 //
 // Licensed under the Apache License, Version 2.0 (the "License");
 // you may not use this file except in compliance with the License.
 // You may obtain a copy of the License at
 //
 //  http://www.apache.org/licenses/LICENSE-2.0
 //
 // THIS CODE IS PROVIDED *AS IS* BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY
 // KIND, EITHER EXPRESS OR IMPLIED, INCLUDING WITHOUT LIMITATION ANY IMPLIED
 // WARRANTIES OR CONDITIONS OF TITLE, FITNESS FOR A PARTICULAR PURPOSE,
 // MERCHANTABLITY OR NON-INFRINGEMENT.
 // See the Apache 2 License for the specific language governing permissions and
 // limitations under the License.


 #ifndef KALDI_NNET_NNET_UTILS_H_
 #define KALDI_NNET_NNET_UTILS_H_

 #include <string>
 #include <vector>
 #include <iterator>
 #include <algorithm>

 #include "base/kaldi-common.h"
 #include "cudamatrix/cu-matrix.h"
 #include "cudamatrix/cu-array.h"
 #include "hmm/posterior.h"
 #include "hmm/transition-model.h"

 namespace kaldi {
 namespace nnet1 {


 // Streams the elements of 'v' to 'os' in order, each one followed by a single
 // space (so a non-empty vector produces a trailing space, and an empty vector
 // produces no output). Returns 'os', so the calls can be chained.
 template <typename T>
 std::ostream& operator<<(std::ostream& os, const std::vector<T>& v) {
   typedef typename std::vector<T>::const_iterator ConstIter;
   // the iterator appends the " " delimiter after every written element,
   std::ostream_iterator<T> sink(os, " ");
   for (ConstIter it = v.begin(); it != v.end(); ++it) {
     *sink++ = *it;
   }
   return os;
 }

 // Converts 't' to a string by writing it to a string-stream with 'operator<<'
 // and returning the accumulated text.
 template <typename T>
 std::string ToString(const T& t) {
   std::ostringstream buffer;
   buffer << t;
   const std::string text = buffer.str();
   return text;
 }

 template <typename Real>
 std::string MomentStatistics(const VectorBase<Real> &vec) {
   // we use an auxiliary vector for the higher order powers
   Vector<Real> vec_aux(vec);
   Vector<Real> vec_no_mean(vec);  // vec with mean subtracted
   // mean
   Real mean = vec.Sum() / vec.Dim();
   // variance
   vec_aux.Add(-mean);
   vec_no_mean = vec_aux;
   vec_aux.MulElements(vec_no_mean);  // (vec-mean)^2
   Real variance = vec_aux.Sum() / vec.Dim();
   // skewness
   // - negative : left tail is longer,
   // - positive : right tail is longer,
   // - zero : symmetric
   vec_aux.MulElements(vec_no_mean);  // (vec-mean)^3
   Real skewness = vec_aux.Sum() / pow(variance, 3.0/2.0) / vec.Dim();
   // kurtosis (peakedness)
   // - makes sense for symmetric distributions (skewness is zero)
   // - positive : 'sharper peak' than Normal distribution
   // - negative : 'heavier tails' than Normal distribution
   // - zero : same peakedness as the Normal distribution
   vec_aux.MulElements(vec_no_mean);  // (vec-mean)^4
   Real kurtosis = vec_aux.Sum() / (variance * variance) / vec.Dim() - 3.0;
   // send the statistics to stream,
   std::ostringstream ostr;
   ostr << " ( min " << vec.Min() << ", max " << vec.Max()
        << ", mean " << mean
        << ", stddev " << sqrt(variance)
        << ", skewness " << skewness
        << ", kurtosis " << kurtosis
        << " ) ";
   return ostr.str();
 }

 template <typename Real>
 std::string MomentStatistics(const MatrixBase<Real> &mat) {
   Vector<Real> vec(mat.NumRows()*mat.NumCols());
   vec.CopyRowsFromMat(mat);
   return MomentStatistics(vec);
 }

 template <typename Real>
 std::string MomentStatistics(const CuVectorBase<Real> &vec) {
   Vector<Real> vec_host(vec.Dim());
   vec.CopyToVec(&vec_host);
   return MomentStatistics(vec_host);
 }

 template <typename Real>
 std::string MomentStatistics(const CuMatrixBase<Real> &mat) {
   Matrix<Real> mat_host(mat.NumRows(), mat.NumCols());
   mat.CopyToMat(&mat_host);
   return MomentStatistics(mat_host);
 }

 // Checks the matrix for 'inf' / 'nan' by inspecting the sum of its elements.
 // When the sum is 'inf' or 'nan', the problem is reported through KALDI_ERR
 // together with 'msg' (a caller-supplied description, empty by default).
 template <typename Real>
 void CheckNanInf(const CuMatrixBase<Real> &mat, const char *msg = "") {
   const Real total = mat.Sum();
   if (KALDI_ISINF(total)) {
     KALDI_ERR << "'inf' in " << msg;
   } else if (KALDI_ISNAN(total)) {
     KALDI_ERR << "'nan' in " << msg;
   }
 }

 template <typename Real>
 Real ComputeStdDev(const CuMatrixBase<Real> &mat) {
   int32 N = mat.NumRows() * mat.NumCols();
   Real mean = mat.Sum() / N;
   CuMatrix<Real> pow_2(mat);
   pow_2.MulElements(mat);
   Real var = pow_2.Sum() / N - mean * mean;
   if (var < 0.0) {
     KALDI_WARN << "Forcing the variance to be non-negative! " << var << "->0.0";
     var = 0.0;
   }
   return sqrt(var);
 }


 // Fills 'mat' with samples drawn by 'RandGauss(state)', scaled by 'sigma' and
 // shifted by 'mu'. The samples are generated row by row into a temporary
 // 'Matrix' which is then copied to 'mat' (the size of 'mat' is not changed).
 template <typename Real>
 void RandGauss(BaseFloat mu, BaseFloat sigma, CuMatrixBase<Real>* mat,
                struct RandomState* state = NULL) {
   const int32 num_rows = mat->NumRows();
   const int32 num_cols = mat->NumCols();
   // draw the raw samples into a temporary matrix,
   Matrix<Real> samples(num_rows, num_cols, kUndefined);
   for (int32 row = 0; row < num_rows; ++row) {
     for (int32 col = 0; col < num_cols; ++col) {
       samples(row, col) = RandGauss(state);
     }
   }
   // re-shape the distribution: x -> sigma * x + mu,
   samples.Scale(sigma);
   samples.Add(mu);
   // export to the output matrix,
   mat->CopyFromMat(samples);
 }

 // Fills 'mat' with uniformly distributed samples from the interval
 // mu-range/2 .. mu+range/2. The samples are generated row by row into
 // a temporary 'Matrix' which is then copied to 'mat'.
 template <typename Real>
 void RandUniform(BaseFloat mu, BaseFloat range, CuMatrixBase<Real>* mat,
                  struct RandomState* state = NULL) {
   const int32 num_rows = mat->NumRows();
   const int32 num_cols = mat->NumCols();
   // draw samples in '0..1' into a temporary matrix,
   Matrix<Real> samples(num_rows, num_cols, kUndefined);
   for (int32 row = 0; row < num_rows; ++row) {
     for (int32 col = 0; col < num_cols; ++col) {
       samples(row, col) = Rand(state) / static_cast<Real>(RAND_MAX);
     }
   }
   // re-shape the distribution,
   samples.Scale(range);  // 0..range,
   samples.Add(mu - (range / 2.0));  // mu-range/2 .. mu+range/2,
   // export to the output matrix,
   mat->CopyFromMat(samples);
 }

 // Fills 'vec' with uniformly distributed samples from the interval
 // mu-range/2 .. mu+range/2. The samples are generated into a temporary
 // 'Vector' which is then copied to 'vec'.
 template <typename Real>
 void RandUniform(BaseFloat mu, BaseFloat range, CuVectorBase<Real>* vec,
                  struct RandomState* state = NULL) {
   const int32 dim = vec->Dim();
   // draw samples in '0..1' into a temporary vector,
   Vector<Real> samples(dim, kUndefined);
   for (int32 idx = 0; idx < dim; ++idx) {
     samples(idx) = Rand(state) / static_cast<Real>(RAND_MAX);
   }
   // re-shape the distribution,
   samples.Scale(range);  // 0..range,
   samples.Add(mu - (range / 2.0));  // mu-range/2 .. mu+range/2,
   // export to the output vector,
   vec->CopyFromVec(samples);
 }


 inline void BuildIntegerVector(const std::vector<std::vector<int32> >& in,
                                std::vector<int32>* out) {
   // start with empty vector,
   out->clear();
   // loop over records,
   for (int32 i = 0; i < in.size(); i++) {
     // process i'th record,
     int32 beg = 0, end = 0, step = 1;
     switch (in[i].size()) {
       case 1:
         beg  = in[i][0];
         end  = in[i][0];
         step = 1;
         break;
       case 2:
         beg  = in[i][0];
         end  = in[i][1];
         step = 1;
         break;
       case 3:
         beg  = in[i][0];
         end  = in[i][2];
         step = in[i][1];
         break;
       default:
         KALDI_ERR << "Something is wrong! (should be 1-3) : "
                   << in[i].size();
     }
     // check the inputs,
     KALDI_ASSERT(beg <= end);
     KALDI_ASSERT(step > 0);  // positive,
     // append values to vector,
     for (int32 j = beg; j <= end; j += step) {
       out->push_back(j);
     }
   }
 }

 // CuArray overload: expands the records of 'in' into a temporary std::vector
 // (see the std::vector overload for the record format), and assigns
 // the result to 'out'.
 inline void BuildIntegerVector(const std::vector<std::vector<int32> >& in,
                                CuArray<int32>* out) {
   std::vector<int32> expanded;
   BuildIntegerVector(in, &expanded);
   *out = expanded;
 }


 template <typename Real>
 void PosteriorToMatrix(const Posterior &post,
                        const int32 post_dim, CuMatrix<Real> *mat) {
   Matrix<Real> m;
   PosteriorToMatrix(post, post_dim, &m);
   (*mat) = m;
 }


 template <typename Real>
 void PosteriorToPdfMatrix(const Posterior &post,
                           const TransitionModel &model,
                           CuMatrix<Real> *mat) {
   Matrix<BaseFloat> m;
   PosteriorToPdfMatrix(post, model, &m);
   // Copy to output GPU matrix,
   (*mat) = m;
 }


 }  // namespace nnet1
 }  // namespace kaldi

 #endif  // KALDI_NNET_NNET_UTILS_H_
kaldi::nnet1::ToString
std::string ToString(const T &t)
Convert basic type to a string (please don't overuse).
Definition: nnet-utils.h:52

kaldi::CuMatrixBase::CopyFromMat
void CopyFromMat(const MatrixBase< OtherReal > &src, MatrixTransposeType trans=kNoTrans)
Definition: cu-matrix.cc:344

kaldi
This code computes Goodness of Pronunciation (GOP) and extracts phone-level pronunciation feature for...
Definition: chain.dox:20

kaldi::nnet1::PosteriorToPdfMatrix
void PosteriorToPdfMatrix(const Posterior &post, const TransitionModel &model, CuMatrix< Real > *mat)
Wrapper of PosteriorToMatrixMapped with CuMatrix argument.
Definition: nnet-utils.h:304

kaldi::kUndefined
Definition: matrix-common.h:39

rnnlm::j
int j
Definition: mikolov-rnnlm-lib.cc:66

kaldi::nnet1::MomentStatistics
std::string MomentStatistics(const VectorBase< Real > &vec)
Get a string with statistics of the data in a vector, so we can print them easily.
Definition: nnet-utils.h:63

kaldi::CuMatrixBase::CopyToMat
void CopyToMat(MatrixBase< OtherReal > *dst, MatrixTransposeType trans=kNoTrans) const
Definition: cu-matrix.cc:447

kaldi::MatrixBase::NumCols
MatrixIndexT NumCols() const
Returns number of columns (or zero for empty matrix).
Definition: kaldi-matrix.h:67

kaldi::MatrixBase
Base class which provides matrix operations not involving resizing or allocation. ...
Definition: kaldi-matrix.h:49

KALDI_ISINF
#define KALDI_ISINF
Definition: kaldi-math.h:73

kaldi::CuMatrixBase::Sum
Real Sum() const
Definition: cu-matrix.cc:3012

kaldi::nnet1::RandUniform
void RandUniform(BaseFloat mu, BaseFloat range, CuMatrixBase< Real > *mat, struct RandomState *state=NULL)
Fill CuMatrix with random numbers (Uniform distribution): mu = the mean value, range = the 'width' of...
Definition: nnet-utils.h:188

kaldi::int32
kaldi::int32 int32
Definition: online-tcp-source.cc:27

cu-matrix.h

kaldi::Matrix
A class for storing matrices.
Definition: kaldi-matrix.h:823

kaldi::CuMatrix
This class represents a matrix that's stored on the GPU if we have one, and in memory if not...
Definition: matrix-common.h:71

kaldi::RandomState
Definition: kaldi-math.h:136

kaldi::nnet1::PosteriorToMatrix
void PosteriorToMatrix(const Posterior &post, const int32 post_dim, CuMatrix< Real > *mat)
Wrapper of PosteriorToMatrix with CuMatrix argument.
Definition: nnet-utils.h:292

kaldi::VectorBase::Min
Real Min() const
Returns the minimum value of any element, or +infinity for the empty vector.
Definition: kaldi-vector.cc:614

posterior.h

kaldi::TransitionModel
Definition: transition-model.h:123

kaldi::BaseFloat
float BaseFloat
Definition: kaldi-types.h:29

kaldi::Posterior
std::vector< std::vector< std::pair< int32, BaseFloat > > > Posterior
Posterior is a typedef for storing acoustic-state (actually, transition-id) posteriors over an uttera...
Definition: posterior.h:42

kaldi::CuVectorBase::CopyFromVec
void CopyFromVec(const CuVectorBase< Real > &src)
Copy functions; these will crash if the dimension do not match.
Definition: cu-vector.cc:1078

kaldi::nnet1::ComputeStdDev
Real ComputeStdDev(const CuMatrixBase< Real > &mat)
Get the standard deviation of values in the matrix.
Definition: nnet-utils.h:142

kaldi::VectorBase::MulElements
void MulElements(const VectorBase< Real > &v)
Multiply element-by-element by another vector.
Definition: kaldi-vector.cc:968

transition-model.h

kaldi::CuMatrixBase::MulElements
void MulElements(const CuMatrixBase< Real > &A)
Multiply two matrices elementwise: C = C .* A.
Definition: cu-matrix.cc:667

kaldi::nnet1::BuildIntegerVector
void BuildIntegerVector(const std::vector< std::vector< int32 > > &in, std::vector< int32 > *out)
Build 'integer vector' out of vector of 'matlab-like' representation: 'b, b:e, b:s:e'.
Definition: nnet-utils.h:239

KALDI_ERR
#define KALDI_ERR
Definition: kaldi-error.h:147

kaldi::VectorBase::Max
Real Max() const
Returns the maximum value of any element, or -infinity for the empty vector.
Definition: kaldi-vector.cc:574

kaldi::nnet1::RandGauss
void RandGauss(BaseFloat mu, BaseFloat sigma, CuMatrixBase< Real > *mat, struct RandomState *state=NULL)
Fill CuMatrix with random numbers (Gaussian distribution): mu = the mean value, sigma = standard devi...
Definition: nnet-utils.h:164

KALDI_WARN
#define KALDI_WARN
Definition: kaldi-error.h:150

kaldi::VectorBase::Dim
MatrixIndexT Dim() const
Returns the dimension of the vector.
Definition: kaldi-vector.h:64

kaldi::Rand
int Rand(struct RandomState *state)
Definition: kaldi-math.cc:45

kaldi::VectorBase::Sum
Real Sum() const
Returns sum of the elements.
Definition: kaldi-vector.cc:688

rnnlm::i
int i
Definition: mikolov-rnnlm-lib.cc:66

kaldi::CuMatrixBase
Matrix for CUDA computing.
Definition: matrix-common.h:69

kaldi::CuMatrixBase::NumCols
MatrixIndexT NumCols() const
Definition: cu-matrix.h:216

kaldi::Vector
A class representing a vector.
Definition: kaldi-vector.h:406

KALDI_ISNAN
#define KALDI_ISNAN
Definition: kaldi-math.h:72

kaldi::CuArray< int32 >

KALDI_ASSERT
#define KALDI_ASSERT(cond)
Definition: kaldi-error.h:185

kaldi::MatrixBase::NumRows
MatrixIndexT NumRows() const
Returns number of rows (or zero for empty matrix).
Definition: kaldi-matrix.h:64

kaldi::VectorBase::CopyRowsFromMat
void CopyRowsFromMat(const MatrixBase< Real > &M)
Performs a row stack of the matrix M.
Definition: kaldi-vector.cc:348

kaldi::CuMatrixBase::NumRows
MatrixIndexT NumRows() const
Dimensions.
Definition: cu-matrix.h:215

kaldi::VectorBase
Provides a vector abstraction class.
Definition: kaldi-vector.h:41

kaldi::VectorBase::Add
void Add(Real c)
Add a constant to each element of a vector.
Definition: kaldi-vector.cc:956

kaldi::CuVectorBase::CopyToVec
void CopyToVec(VectorBase< OtherReal > *dst) const
Definition: cu-vector.cc:938

kaldi-common.h

cu-array.h

kaldi::nnet1::CheckNanInf
void CheckNanInf(const CuMatrixBase< Real > &mat, const char *msg="")
Check that matrix contains no nan or inf.
Definition: nnet-utils.h:132

kaldi::CuVectorBase::Dim
MatrixIndexT Dim() const
Dimensions.
Definition: cu-vector.h:69

kaldi::CuVectorBase
Vector for CUDA computing.
Definition: matrix-common.h:72