nnet-parametric-relu.h
// nnet/nnet-parametric-relu.h

// Copyright 2016  Brno University of Technology (author: Murali Karthick B)
//           2011-2014  Brno University of Technology (author: Karel Vesely)

// See ../../COPYING for clarification regarding multiple authors
//
// Licensed under the Apache License, Version 2.0 (the "License");
// you may not use this file except in compliance with the License.
// You may obtain a copy of the License at
//
//  http://www.apache.org/licenses/LICENSE-2.0
//
// THIS CODE IS PROVIDED *AS IS* BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY
// KIND, EITHER EXPRESS OR IMPLIED, INCLUDING WITHOUT LIMITATION ANY IMPLIED
// WARRANTIES OR CONDITIONS OF TITLE, FITNESS FOR A PARTICULAR PURPOSE,
// MERCHANTABLITY OR NON-INFRINGEMENT.
// See the Apache 2 License for the specific language governing permissions and
// limitations under the License.


#ifndef KALDI_NNET_NNET_PARAMETRIC_RELU_H_
#define KALDI_NNET_NNET_PARAMETRIC_RELU_H_

#include <string>

#include "nnet/nnet-component.h"
#include "nnet/nnet-utils.h"
#include "cudamatrix/cu-math.h"

namespace kaldi {
namespace nnet1 {

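/**
 * ParametricRelu (PReLU) : activation function with trainable per-neuron slopes,
 *   out = alpha * in,  if in > 0,
 *   out = beta  * in,  otherwise,
 * where 'alpha' and 'beta' are vectors with one element per output neuron.
 * Their SGD updates are scaled by <AlphaLearnRateCoef> and <BetaLearnRateCoef>
 * (a coefficient of 0.0 disables the learning of that parameter).
 */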
class ParametricRelu : public UpdatableComponent {
 public:
  ParametricRelu(int32 dim_in, int32 dim_out):
    UpdatableComponent(dim_in, dim_out),
    alpha_(dim_out),
    beta_(dim_out),
    alpha_corr_(dim_out),
    beta_corr_(dim_out),
    alpha_learn_rate_coef_(1.0),
    beta_learn_rate_coef_(1.0)
  { }

  ~ParametricRelu()
  { }

  Component* Copy() const { return new ParametricRelu(*this); }
  ComponentType GetType() const { return kParametricRelu; }

  void InitData(std::istream &is) {
    // define options
    BaseFloat alpha = 1.0, beta = 0.0;

    // parse config
    std::string token;
    while (is >> std::ws, !is.eof()) {
      ReadToken(is, false, &token);
      if (token == "<Alpha>") ReadBasicType(is, false, &alpha);
      else if (token == "<Beta>") ReadBasicType(is, false, &beta);
      else if (token == "<AlphaLearnRateCoef>") ReadBasicType(is, false, &alpha_learn_rate_coef_);
      else if (token == "<BetaLearnRateCoef>") ReadBasicType(is, false, &beta_learn_rate_coef_);
      else KALDI_ERR << "Unknown token " << token << ", a typo in config?"
                     << " (Alpha|Beta|AlphaLearnRateCoef|BetaLearnRateCoef)";
    }

    // Initialize trainable parameters,
    alpha_.Set(alpha);
    beta_.Set(beta);
  }

  void ReadData(std::istream &is, bool binary) {
    // Read all the '<Tokens>' in arbitrary order,
    while ('<' == Peek(is, binary)) {
      int first_char = PeekToken(is, binary);
      switch (first_char) {
        case 'A': ExpectToken(is, binary, "<AlphaLearnRateCoef>");
          ReadBasicType(is, binary, &alpha_learn_rate_coef_);
          break;
        case 'B': ExpectToken(is, binary, "<BetaLearnRateCoef>");
          ReadBasicType(is, binary, &beta_learn_rate_coef_);
          break;
        default:
          std::string token;
          ReadToken(is, false, &token);
          KALDI_ERR << "Unknown token: " << token;
      }
    }
    // ParametricRelu scaling parameters
    alpha_.Read(is, binary);
    beta_.Read(is, binary);
    KALDI_ASSERT(alpha_.Dim() == output_dim_);
    KALDI_ASSERT(beta_.Dim() == output_dim_);
  }

  void WriteData(std::ostream &os, bool binary) const {
    WriteToken(os, binary, "<AlphaLearnRateCoef>");
    WriteBasicType(os, binary, alpha_learn_rate_coef_);
    WriteToken(os, binary, "<BetaLearnRateCoef>");
    WriteBasicType(os, binary, beta_learn_rate_coef_);

    // ParametricRelu scales for each neuron,
    if (!binary) os << "\n";
    alpha_.Write(os, binary);
    beta_.Write(os, binary);
  }

  int32 NumParams() const {
    return alpha_.Dim() + beta_.Dim();
  }

  void GetGradient(VectorBase<BaseFloat>* gradient) const {
    KALDI_ASSERT(gradient->Dim() == NumParams());
    int32 alpha_num_elem = alpha_.Dim();
    int32 beta_num_elem = beta_.Dim();
    gradient->Range(0, alpha_num_elem).CopyFromVec(Vector<BaseFloat>(alpha_corr_));
    gradient->Range(alpha_num_elem, beta_num_elem).CopyFromVec(Vector<BaseFloat>(beta_corr_));
  }

  void GetParams(VectorBase<BaseFloat>* params) const {
    KALDI_ASSERT(params->Dim() == NumParams());
    int32 alpha_num_elem = alpha_.Dim();
    int32 beta_num_elem = beta_.Dim();
    params->Range(0, alpha_num_elem).CopyFromVec(Vector<BaseFloat>(alpha_));
    params->Range(alpha_num_elem, beta_num_elem).CopyFromVec(Vector<BaseFloat>(beta_));
  }

  void SetParams(const VectorBase<BaseFloat>& params) {
    KALDI_ASSERT(params.Dim() == NumParams());
    int32 alpha_num_elem = alpha_.Dim();
    int32 beta_num_elem = beta_.Dim();
    alpha_.CopyFromVec(params.Range(0, alpha_num_elem));
    beta_.CopyFromVec(params.Range(alpha_num_elem, beta_num_elem));
  }

  std::string Info() const {
    return std::string("\n  alpha") + MomentStatistics(alpha_) +
      ", alpha-lr-coef " + ToString(alpha_learn_rate_coef_) +
      "\n  beta" + MomentStatistics(beta_) +
      ", beta-lr-coef " + ToString(beta_learn_rate_coef_);
  }
  std::string InfoGradient() const {
    return std::string("\n  alpha_grad") + MomentStatistics(alpha_corr_) +
      ", alpha-lr-coef " + ToString(alpha_learn_rate_coef_) +
      "\n  beta_grad" + MomentStatistics(beta_corr_) +
      ", beta-lr-coef " + ToString(beta_learn_rate_coef_);
  }

  void PropagateFnc(const CuMatrixBase<BaseFloat> &in,
                    CuMatrixBase<BaseFloat> *out) {
    // out = (in > 0.0 ? alpha * in : beta * in)
    out->ParametricRelu(in, alpha_, beta_);
  }

  void BackpropagateFnc(const CuMatrixBase<BaseFloat> &in,
                        const CuMatrixBase<BaseFloat> &out,
                        const CuMatrixBase<BaseFloat> &out_diff,
                        CuMatrixBase<BaseFloat> *in_diff) {
    // in_diff = (in > 0 ? alpha * out_diff : beta * out_diff)
    in_diff->DiffParametricRelu(in, out_diff, alpha_, beta_);
  }

  void Update(const CuMatrixBase<BaseFloat> &input,
              const CuMatrixBase<BaseFloat> &diff) {
    // we use these hyperparameters,
    const BaseFloat alpha_lr = opts_.learn_rate * alpha_learn_rate_coef_;
    const BaseFloat beta_lr = opts_.learn_rate * beta_learn_rate_coef_;
    const BaseFloat mmt = opts_.momentum;

    if (alpha_learn_rate_coef_ > 0.0) {
      // get gradient: d(out)/d(alpha) is 'input' where input > 0, zero elsewhere,
      alpha_aux_ = input;
      alpha_aux_.ApplyFloor(0.0);  // keep the positive ReLU inputs,
      alpha_aux_.MulElements(diff);
      alpha_corr_.AddRowSumMat(1.0, alpha_aux_, mmt);
      // update,
      alpha_.AddVec(-alpha_lr, alpha_corr_);
    }
    if (beta_learn_rate_coef_ > 0.0) {
      // get gradient: d(out)/d(beta) is 'input' where input < 0, zero elsewhere,
      beta_aux_ = input;
      beta_aux_.ApplyCeiling(0.0);  // keep the negative ReLU inputs,
      beta_aux_.MulElements(diff);
      beta_corr_.AddRowSumMat(1.0, beta_aux_, mmt);
      beta_.AddVec(-beta_lr, beta_corr_);
    }
  }

 private:
  CuVector<BaseFloat> alpha_;  ///< Vector of 'alphas', one value per neuron,
  CuVector<BaseFloat> beta_;  ///< Vector of 'betas', one value per neuron,

  CuVector<BaseFloat> alpha_corr_;  ///< Vector of 'alpha' updates,
  CuVector<BaseFloat> beta_corr_;  ///< Vector of 'beta' updates,

  CuMatrix<BaseFloat> alpha_aux_;  ///< Auxiliary matrix for getting 'alpha' updates,
  CuMatrix<BaseFloat> beta_aux_;  ///< Auxiliary matrix for getting 'beta' updates,

  BaseFloat alpha_learn_rate_coef_;  ///< Controls learning rate for alpha (0.0 disables learning),
  BaseFloat beta_learn_rate_coef_;  ///< Controls learning rate for beta (0.0 disables learning),
};

}  // namespace nnet1
}  // namespace kaldi

#endif  // KALDI_NNET_NNET_PARAMETRIC_RELU_H_
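Below is a minimal usage sketch, not part of the header: it constructs the component, initializes it from a config string using the same tokens that InitData() parses, and runs a forward pass through the base-class Propagate() wrapper. The dimensions, the config values, and the file name parametric-relu-example.cc are illustrative assumptions, not code from the Kaldi sources.

// parametric-relu-example.cc (hypothetical, for illustration only)
#include <sstream>

#include "nnet/nnet-parametric-relu.h"

int main() {
  using namespace kaldi;
  using namespace kaldi::nnet1;

  // A 256 -> 256 ParametricRelu; the dimensions are arbitrary for this sketch.
  ParametricRelu prelu(256, 256);

  // Same tokens that InitData() parses; the values are illustrative.
  std::istringstream conf("<Alpha> 1.0 <Beta> 0.25 "
                          "<AlphaLearnRateCoef> 1.0 <BetaLearnRateCoef> 1.0");
  prelu.InitData(conf);

  // Forward pass on random data; Propagate() resizes 'out' and calls PropagateFnc().
  CuMatrix<BaseFloat> in(8, 256), out;
  in.SetRandn();
  prelu.Propagate(in, &out);

  KALDI_LOG << prelu.Info();  // per-neuron statistics of alpha/beta,
  return 0;
}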