21 #ifndef KALDI_NNET_NNET_ACTIVATION_H_ 22 #define KALDI_NNET_NNET_ACTIVATION_H_ 103 diag_out_diff_out_.Resize(out.
NumRows());
104 diag_out_diff_out_.AddDiagMatMat(1.0, out_diff,
kNoTrans, out,
kTrans, 0.0);
129 while (is >> std::ws, !is.eof()) {
131 if (token ==
"<BlockDims>") is >> dims_str;
132 else KALDI_ERR <<
"Unknown token " << token <<
", a typo in config?" 137 KALDI_ERR <<
"Invalid block-dims " << dims_str;
140 for (
int32 i = 0;
i < block_dims.size();
i++) {
141 sum += block_dims[
i];
148 block_offset.resize(block_dims.size()+1, 0);
149 for (
int32 i = 0;
i < block_dims.size();
i++) {
150 block_offset[
i+1] = block_offset[
i] + block_dims[
i];
163 for (
int32 bl = 0; bl < block_dims.size(); bl++) {
166 in.
ColRange(block_offset[bl], block_dims[bl]);
168 out->
ColRange(block_offset[bl], block_dims[bl]);
184 for (
int32 bl = 0; bl < block_dims.size(); bl++) {
187 in_diff->
ColRange(block_offset[bl], block_dims[bl]);
193 row_diff_mask.
Scale(-1.0);
194 row_diff_mask.
Add(1.0);
201 return "\n softmax-dims " +
ToString(block_dims);
286 while (is >> std::ws, !is.eof()) {
288 if (token ==
"<DropoutRate>")
ReadBasicType(is,
false, &dropout_rate_);
289 else KALDI_ERR <<
"Unknown token " << token <<
", a typo in config?" 292 KALDI_ASSERT(dropout_rate_ >= 0.0 && dropout_rate_ < 1.0);
297 bool finished =
false;
298 while (
'<' ==
Peek(is, binary) && !finished) {
301 switch (first_char) {
303 if (token ==
"<DropoutRate>")
ReadBasicType(is, binary, &dropout_rate_);
304 else if (token ==
"<DropoutRetention>") {
307 dropout_rate_ = 1.0 - dropout_retention;
308 }
else KALDI_ERR <<
"Unknown token: " << token;
310 case '!':
ExpectToken(is, binary,
"<!EndOfComponent>");
317 KALDI_ASSERT(dropout_rate_ >= 0.0 && dropout_rate_ < 1.0);
326 return std::string(
"<DropoutRate> ") +
ToString(dropout_rate_);
334 rand_.RandUniform(&dropout_mask_);
335 dropout_mask_.Add(-dropout_rate_);
336 dropout_mask_.Heaviside(dropout_mask_);
339 out->
Scale(1.0 / (1.0 - dropout_rate_));
350 in_diff->
Scale(1.0 / (1.0 - dropout_rate_));
357 KALDI_ASSERT(dropout_rate_ >= 0.0 && dropout_rate_ < 1.0);
372 #endif // KALDI_NNET_NNET_ACTIVATION_H_ std::string ToString(const T &t)
Convert basic type to a string (please don't overuse).
ComponentType GetType() const
Get Type Identification of the component.
void CopyFromMat(const MatrixBase< OtherReal > &src, MatrixTransposeType trans=kNoTrans)
This code computes Goodness of Pronunciation (GOP) and extracts phone-level pronunciation feature for...
std::string Info() const
Print some additional info (after <ComponentName> and the dims).
void BackpropagateFnc(const CuMatrixBase< BaseFloat > &in, const CuMatrixBase< BaseFloat > &out, const CuMatrixBase< BaseFloat > &out_diff, CuMatrixBase< BaseFloat > *in_diff)
Backward pass transformation (to be implemented by descending class...)
void WriteData(std::ostream &os, bool binary) const
Writes the component content.
Component * Copy() const
Copy component (deep copy).
Component * Copy() const
Copy component (deep copy).
void InitData(std::istream &is)
Virtual interface for initialization and I/O.
Component * Copy() const
Copy component (deep copy).
Tanh(int32 dim_in, int32 dim_out)
BaseFloat GetDropoutRate()
ComponentType GetType() const
Get Type Identification of the component.
void BackpropagateFnc(const CuMatrixBase< BaseFloat > &in, const CuMatrixBase< BaseFloat > &out, const CuMatrixBase< BaseFloat > &out_diff, CuMatrixBase< BaseFloat > *in_diff)
Backward pass transformation (to be implemented by descending class...)
void ReadBasicType(std::istream &is, bool binary, T *t)
ReadBasicType is the name of the read function for bool, integer types, and floating-point types...
bool SplitStringToIntegers(const std::string &full, const char *delim, bool omit_empty_strings, std::vector< I > *out)
Split a string (e.g.
void InitData(std::istream &is)
Virtual interface for initialization and I/O.
CuRand< BaseFloat > rand_
generator of random numbers.
Sigmoid(int32 dim_in, int32 dim_out)
void BackpropagateFnc(const CuMatrixBase< BaseFloat > &in, const CuMatrixBase< BaseFloat > &out, const CuMatrixBase< BaseFloat > &out_diff, CuMatrixBase< BaseFloat > *in_diff)
Backward pass transformation (to be implemented by descending class...)
std::string Info() const
Print some additional info (after <ComponentName> and the dims).
CuMatrix< BaseFloat > dropout_mask_
void ReadToken(std::istream &is, bool binary, std::string *str)
ReadToken gets the next token and puts it in str (exception on failure).
This class represents a matrix that's stored on the GPU if we have one, and in memory if not...
std::vector< int32 > block_offset
Component * Copy() const
Copy component (deep copy).
BlockSoftmax(int32 dim_in, int32 dim_out)
int Peek(std::istream &is, bool binary)
Peek consumes whitespace (if binary == false) and then returns the peek() value of the stream...
Component * Copy() const
Copy component (deep copy).
ComponentType
Component type identification mechanism.
void BackpropagateFnc(const CuMatrixBase< BaseFloat > &in, const CuMatrixBase< BaseFloat > &out, const CuMatrixBase< BaseFloat > &out_diff, CuMatrixBase< BaseFloat > *in_diff)
Backward pass transformation (to be implemented by descending class...)
void PropagateFnc(const CuMatrixBase< BaseFloat > &in, CuMatrixBase< BaseFloat > *out)
Abstract interface for propagation/backpropagation.
void SetDropoutRate(BaseFloat dr)
void PropagateFnc(const CuMatrixBase< BaseFloat > &in, CuMatrixBase< BaseFloat > *out)
Abstract interface for propagation/backpropagation.
void ReadIntegerVector(std::istream &is, bool binary, std::vector< T > *v)
Function for reading STL vector of integer types.
Softmax(int32 dim_in, int32 dim_out)
void AddColSumMat(Real alpha, const CuMatrixBase< Real > &mat, Real beta=1.0)
Sum the columns of the matrix, add to vector.
void Sigmoid(const CuMatrixBase< Real > &src)
Set each element to the sigmoid of the corresponding element of "src": element by element...
BaseFloat dropout_rate_
probability that a neuron is dropped.
void ExpectToken(std::istream &is, bool binary, const char *token)
ExpectToken tries to read in the given token, and throws an exception on failure. ...
void SoftMaxPerRow(const CuMatrixBase< Real > &src)
Softmax nonlinearity Y = Softmax(X) : Yij = e^Xij / sum_k(e^Xik), done to each row, with attention to avoiding overflow or underflow.
void MulElements(const CuMatrixBase< Real > &A)
Multiply two matrices elementwise: C = C .* A.
ComponentType GetType() const
Get Type Identification of the component.
void BackpropagateFnc(const CuMatrixBase< BaseFloat > &in, const CuMatrixBase< BaseFloat > &out, const CuMatrixBase< BaseFloat > &out_diff, CuMatrixBase< BaseFloat > *in_diff)
Backward pass transformation (to be implemented by descending class...)
ComponentType GetType() const
Get Type Identification of the component.
This class is used for a piece of a CuMatrix.
void WriteData(std::ostream &os, bool binary) const
Writes the component content.
void WriteToken(std::ostream &os, bool binary, const char *token)
The WriteToken functions are for writing nonempty sequences of non-space characters.
void BackpropagateFnc(const CuMatrixBase< BaseFloat > &in, const CuMatrixBase< BaseFloat > &out, const CuMatrixBase< BaseFloat > &out_diff, CuMatrixBase< BaseFloat > *in_diff)
Backward pass transformation (to be implemented by descending class...)
int PeekToken(std::istream &is, bool binary)
PeekToken will return the first character of the next token, or -1 if end of file.
ComponentType GetType() const
Get Type Identification of the component.
Component * Copy() const
Copy component (deep copy).
ComponentType GetType() const
Get Type Identification of the component.
void DiffTanh(const CuMatrixBase< Real > &value, const CuMatrixBase< Real > &diff)
Differentiate backward through the tanh function.
std::vector< int32 > block_dims
void DiffSigmoid(const CuMatrixBase< Real > &value, const CuMatrixBase< Real > &diff)
Differentiate backward through the sigmoid function.
CuSubMatrix< Real > ColRange(const MatrixIndexT col_offset, const MatrixIndexT num_cols) const
void PropagateFnc(const CuMatrixBase< BaseFloat > &in, CuMatrixBase< BaseFloat > *out)
Abstract interface for propagation/backpropagation.
void PropagateFnc(const CuMatrixBase< BaseFloat > &in, CuMatrixBase< BaseFloat > *out)
Abstract interface for propagation/backpropagation.
Matrix for CUDA computing.
MatrixIndexT NumCols() const
Dropout(int32 dim_in, int32 dim_out)
void PropagateFnc(const CuMatrixBase< BaseFloat > &in, CuMatrixBase< BaseFloat > *out)
Abstract interface for propagation/backpropagation.
#define KALDI_ASSERT(cond)
CuVector< BaseFloat > diag_out_diff_out_
buffer for dot-products in BackpropagateFnc.
void WriteIntegerVector(std::ostream &os, bool binary, const std::vector< T > &v)
Function for writing STL vectors of integer types.
void ReadData(std::istream &is, bool binary)
Reads the component content.
void WriteBasicType(std::ostream &os, bool binary, T t)
WriteBasicType is the name of the write function for bool, integer types, and floating-point types...
Abstract class, building block of the network.
HiddenSoftmax(int32 dim_in, int32 dim_out)
int32 OutputDim() const
Get the dimension of the output,.
void PropagateFnc(const CuMatrixBase< BaseFloat > &in, CuMatrixBase< BaseFloat > *out)
Abstract interface for propagation/backpropagation.
MatrixIndexT NumRows() const
Dimensions.
void ReadData(std::istream &is, bool binary)
Reads the component content.
void Tanh(const CuMatrixBase< Real > &src)
Compute the hyperbolic tangent (tanh) function; element by element, *this = tanh(src).
void MulRowsVec(const CuVectorBase< Real > &scale)
scale i'th row by scale[i]
void AddDiagVecMat(const Real alpha, const CuVectorBase< Real > &v, const CuMatrixBase< Real > &M, MatrixTransposeType transM, Real beta=1.0)
*this = beta * *this + alpha * diag(v) * M [or M^T].