nnet-linear-transform.h
// nnet/nnet-linear-transform.h

// Copyright 2011-2014 Brno University of Technology (author: Karel Vesely)

// See ../../COPYING for clarification regarding multiple authors
//
// Licensed under the Apache License, Version 2.0 (the "License");
// you may not use this file except in compliance with the License.
// You may obtain a copy of the License at
//
//  http://www.apache.org/licenses/LICENSE-2.0
//
// THIS CODE IS PROVIDED *AS IS* BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY
// KIND, EITHER EXPRESS OR IMPLIED, INCLUDING WITHOUT LIMITATION ANY IMPLIED
// WARRANTIES OR CONDITIONS OF TITLE, FITNESS FOR A PARTICULAR PURPOSE,
// MERCHANTABLITY OR NON-INFRINGEMENT.
// See the Apache 2 License for the specific language governing permissions and
// limitations under the License.

#ifndef KALDI_NNET_NNET_LINEAR_TRANSFORM_H_
#define KALDI_NNET_NNET_LINEAR_TRANSFORM_H_

#include <string>

#include "nnet/nnet-component.h"
#include "nnet/nnet-utils.h"
#include "cudamatrix/cu-math.h"

namespace kaldi {
namespace nnet1 {

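// LinearTransform is a bias-free linear layer: the forward pass computes
// out = in * linearity_^T (y = W x per frame), and the weight matrix W is
// trainable by SGD with momentum, L1 and L2 regularization (see Update()).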
class LinearTransform : public UpdatableComponent {
 public:
  LinearTransform(int32 dim_in, int32 dim_out):
    UpdatableComponent(dim_in, dim_out),
    linearity_(dim_out, dim_in),
    linearity_corr_(dim_out, dim_in)
  { }

  ~LinearTransform()
  { }

  Component* Copy() const { return new LinearTransform(*this); }
  ComponentType GetType() const { return kLinearTransform; }

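  // Initialize from a prototype line. Recognized tokens are <ParamStddev>,
  // <ReadMatrix> and <LearnRateCoef>, e.g. (hypothetical prototype line):
  //   <LinearTransform> <InputDim> 512 <OutputDim> 512 <ParamStddev> 0.1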
  void InitData(std::istream &is) {
    // define options
    float param_stddev = 0.1;
    std::string read_matrix_file;
    // parse config
    std::string token;
    while (is >> std::ws, !is.eof()) {
      ReadToken(is, false, &token);
      if (token == "<ParamStddev>") ReadBasicType(is, false, &param_stddev);
      else if (token == "<ReadMatrix>") ReadToken(is, false, &read_matrix_file);
      else if (token == "<LearnRateCoef>") ReadBasicType(is, false, &learn_rate_coef_);
      else KALDI_ERR << "Unknown token " << token << ", a typo in config?"
                     << " (ParamStddev|ReadMatrix|LearnRateCoef)";
    }

    if (read_matrix_file != "") {  // load from file,
      bool binary;
      Input in(read_matrix_file, &binary);
      linearity_.Read(in.Stream(), binary);
      in.Close();
      // check dims,
      if (OutputDim() != linearity_.NumRows() ||
          InputDim() != linearity_.NumCols()) {
        KALDI_ERR << "Dimensionality mismatch! Expected matrix"
                  << " r=" << OutputDim() << " c=" << InputDim()
                  << ", loaded matrix " << read_matrix_file
                  << " with r=" << linearity_.NumRows()
                  << " c=" << linearity_.NumCols();
      }
      KALDI_LOG << "Loaded <LinearTransform> matrix from file : "
                << read_matrix_file;
      return;
    }

    //
    // Initialize trainable parameters,
    //
    // Gaussian with given std_dev (mean = 0),
    linearity_.Resize(OutputDim(), InputDim());
    RandGauss(0.0, param_stddev, &linearity_);
  }

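  // On disk the component stores an optional '<LearnRateCoef> <value>' token
  // followed by the weight matrix (see WriteData() below).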
  void ReadData(std::istream &is, bool binary) {
    // Read all the '<Tokens>' in arbitrary order,
    while ('<' == Peek(is, binary)) {
      int first_char = PeekToken(is, binary);
      switch (first_char) {
        case 'L': ExpectToken(is, binary, "<LearnRateCoef>");
          ReadBasicType(is, binary, &learn_rate_coef_);
          break;
        default:
          std::string token;
          ReadToken(is, false, &token);
          KALDI_ERR << "Unknown token: " << token;
      }
    }
    // Read the data (data follow the tokens),

    // weights
    linearity_.Read(is, binary);

    KALDI_ASSERT(linearity_.NumRows() == output_dim_);
    KALDI_ASSERT(linearity_.NumCols() == input_dim_);
  }

  void WriteData(std::ostream &os, bool binary) const {
    WriteToken(os, binary, "<LearnRateCoef>");
    WriteBasicType(os, binary, learn_rate_coef_);
    if (!binary) os << "\n";
    linearity_.Write(os, binary);
  }

  int32 NumParams() const {
    return linearity_.NumRows()*linearity_.NumCols();
  }

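  // The gradient and the parameters are exported/imported as a row-stacked
  // (row-major) vector of length NumParams().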
  void GetGradient(VectorBase<BaseFloat>* gradient) const {
    KALDI_ASSERT(gradient->Dim() == NumParams());
    gradient->CopyRowsFromMat(linearity_corr_);
  }

  void GetParams(VectorBase<BaseFloat>* params) const {
    KALDI_ASSERT(params->Dim() == NumParams());
    params->CopyRowsFromMat(linearity_);
  }

  void SetParams(const VectorBase<BaseFloat>& params) {
    KALDI_ASSERT(params.Dim() == NumParams());
    linearity_.CopyRowsFromVec(params);
  }

  void SetLinearity(const MatrixBase<BaseFloat>& l) {
    KALDI_ASSERT(l.NumCols() == linearity_.NumCols());
    KALDI_ASSERT(l.NumRows() == linearity_.NumRows());
    linearity_.CopyFromMat(l);
  }

  std::string Info() const {
    return std::string("\n  linearity") +
      MomentStatistics(linearity_) +
      ", lr-coef " + ToString(learn_rate_coef_);
  }
  std::string InfoGradient() const {
    return std::string("\n  linearity_grad") +
      MomentStatistics(linearity_corr_) +
      ", lr-coef " + ToString(learn_rate_coef_);
  }

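  // Forward pass: out = in * linearity_^T, i.e. for each row (frame) x,
  // the output is y = W x.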
  void PropagateFnc(const CuMatrixBase<BaseFloat> &in,
                    CuMatrixBase<BaseFloat> *out) {
    // multiply by weights^t
    out->AddMatMat(1.0, in, kNoTrans, linearity_, kTrans, 0.0);
  }

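  // Backward pass: in_diff = out_diff * linearity_, i.e. per frame
  // dE/dx = W^T * dE/dy.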
  void BackpropagateFnc(const CuMatrixBase<BaseFloat> &in,
                        const CuMatrixBase<BaseFloat> &out,
                        const CuMatrixBase<BaseFloat> &out_diff,
                        CuMatrixBase<BaseFloat> *in_diff) {
    // multiply error derivative by weights
    in_diff->AddMatMat(1.0, out_diff, kNoTrans, linearity_, kNoTrans, 0.0);
  }

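  // One SGD step on a mini-batch:
  //   linearity_corr_ = diff^T * input + momentum * linearity_corr_
  //   linearity_     -= lr * l2 * num_frames * linearity_   (L2 weight decay)
  //   L1 is applied via cu::RegularizeL1,
  //   linearity_     -= lr * learn_rate_coef_ * linearity_corr_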
  void Update(const CuMatrixBase<BaseFloat> &input,
              const CuMatrixBase<BaseFloat> &diff) {
    // we use following hyperparameters from the option class
    const BaseFloat lr = opts_.learn_rate;
    const BaseFloat mmt = opts_.momentum;
    const BaseFloat l2 = opts_.l2_penalty;
    const BaseFloat l1 = opts_.l1_penalty;
    // we will also need the number of frames in the mini-batch
    const int32 num_frames = input.NumRows();
    // compute gradient (incl. momentum)
    linearity_corr_.AddMatMat(1.0, diff, kTrans, input, kNoTrans, mmt);
    // l2 regularization
    if (l2 != 0.0) {
      linearity_.AddMat(-lr*l2*num_frames, linearity_);
    }
    // l1 regularization
    if (l1 != 0.0) {
      cu::RegularizeL1(&linearity_, &linearity_corr_, lr*l1*num_frames, lr);
    }
    // update
    linearity_.AddMat(-lr*learn_rate_coef_, linearity_corr_);
  }

  /// Accessors to the component parameters,
  const CuMatrixBase<BaseFloat>& GetLinearity() { return linearity_; }

  void SetLinearity(const CuMatrixBase<BaseFloat>& linearity) {
    KALDI_ASSERT(linearity.NumRows() == linearity_.NumRows());
    KALDI_ASSERT(linearity.NumCols() == linearity_.NumCols());
    linearity_.CopyFromMat(linearity);
  }

  const CuMatrixBase<BaseFloat>& GetLinearityCorr() { return linearity_corr_; }

 private:
  CuMatrix<BaseFloat> linearity_;
  CuMatrix<BaseFloat> linearity_corr_;
};

}  // namespace nnet1
}  // namespace kaldi

#endif  // KALDI_NNET_NNET_LINEAR_TRANSFORM_H_