doc/nnet-parallel-component_8h_source.html

 // nnet/nnet-parallel-component.h

 // Copyright 2014  Brno University of Technology (Author: Karel Vesely)

 // See ../../COPYING for clarification regarding multiple authors
 //
 // Licensed under the Apache License, Version 2.0 (the "License");
 // you may not use this file except in compliance with the License.
 // You may obtain a copy of the License at
 //
 //  http://www.apache.org/licenses/LICENSE-2.0
 //
 // THIS CODE IS PROVIDED *AS IS* BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY
 // KIND, EITHER EXPRESS OR IMPLIED, INCLUDING WITHOUT LIMITATION ANY IMPLIED
 // WARRANTIES OR CONDITIONS OF TITLE, FITNESS FOR A PARTICULAR PURPOSE,
 // MERCHANTABILITY OR NON-INFRINGEMENT.
 // See the Apache 2 License for the specific language governing permissions and
 // limitations under the License.


 #ifndef KALDI_NNET_NNET_PARALLEL_COMPONENT_H_
 #define KALDI_NNET_NNET_PARALLEL_COMPONENT_H_

 #include <string>
 #include <vector>
 #include <sstream>

 #include "nnet/nnet-component.h"
 #include "nnet/nnet-utils.h"
 #include "cudamatrix/cu-math.h"


 namespace kaldi {
 namespace nnet1 {

 class ParallelComponent : public MultistreamComponent {
  public:
   ParallelComponent(int32 dim_in, int32 dim_out):
     MultistreamComponent(dim_in, dim_out)
   { }

   ~ParallelComponent()
   { }

   Component* Copy() const { return new ParallelComponent(*this); }
   ComponentType GetType() const { return kParallelComponent; }

   const Nnet& GetNestedNnet(int32 id) const { return nnet_.at(id); }
   Nnet& GetNestedNnet(int32 id) { return nnet_.at(id); }

   void InitData(std::istream &is) {
     // define options
     std::vector<std::string> nested_nnet_proto;
     std::vector<std::string> nested_nnet_filename;
     // parse config
     std::string token;
     while (is >> std::ws, !is.eof()) {
       ReadToken(is, false, &token);
        if (token == "<NestedNnet>" || token == "<NestedNnetFilename>") {
         while (is >> std::ws, !is.eof()) {
           std::string file_or_end;
           ReadToken(is, false, &file_or_end);
           if (file_or_end == "</NestedNnet>" ||
               file_or_end == "</NestedNnetFilename>") break;
           nested_nnet_filename.push_back(file_or_end);
         }
       } else if (token == "<NestedNnetProto>") {
         while (is >> std::ws, !is.eof()) {
           std::string file_or_end;
           ReadToken(is, false, &file_or_end);
           if (file_or_end == "</NestedNnetProto>") break;
           nested_nnet_proto.push_back(file_or_end);
         }
       } else { KALDI_ERR << "Unknown token " << token << ", typo in config?"
                          << " (NestedNnet|NestedNnetFilename|NestedNnetProto)";
       }
     }
     // Initialize,
     // First, read nnets from files,
     if (nested_nnet_filename.size() > 0) {
       for (int32 i = 0; i < nested_nnet_filename.size(); i++) {
         Nnet nnet;
         nnet.Read(nested_nnet_filename[i]);
         nnet_.push_back(nnet);
         KALDI_LOG << "Loaded nested <Nnet> from file : "
                   << nested_nnet_filename[i];
       }
     }
     // Second, initialize nnets from prototypes,
     if (nested_nnet_proto.size() > 0) {
       for (int32 i = 0; i < nested_nnet_proto.size(); i++) {
         Nnet nnet;
         nnet.Init(nested_nnet_proto[i]);
         nnet_.push_back(nnet);
         KALDI_LOG << "Initialized nested <Nnet> from prototype : "
                   << nested_nnet_proto[i];
       }
     }
     // Check dim-sum of nested nnets,
     int32 nnet_input_sum = 0, nnet_output_sum = 0;
     for (int32 i = 0; i < nnet_.size(); i++) {
       nnet_input_sum += nnet_[i].InputDim();
       nnet_output_sum += nnet_[i].OutputDim();
     }
     KALDI_ASSERT(InputDim() == nnet_input_sum);
     KALDI_ASSERT(OutputDim() == nnet_output_sum);
   }

   void ReadData(std::istream &is, bool binary) {
     // read
     ExpectToken(is, binary, "<NestedNnetCount>");
     int32 nnet_count;
     ReadBasicType(is, binary, &nnet_count);
     for (int32 i = 0; i < nnet_count; i++) {
       ExpectToken(is, binary, "<NestedNnet>");
       int32 dummy;
       ReadBasicType(is, binary, &dummy);
       Nnet nnet;
       nnet.Read(is, binary);
       nnet_.push_back(nnet);
     }
     ExpectToken(is, binary, "</ParallelComponent>");

     // check dim-sum of nested nnets
     int32 nnet_input_sum = 0, nnet_output_sum = 0;
     for (int32 i = 0; i < nnet_.size(); i++) {
       nnet_input_sum += nnet_[i].InputDim();
       nnet_output_sum += nnet_[i].OutputDim();
     }
     KALDI_ASSERT(InputDim() == nnet_input_sum);
     KALDI_ASSERT(OutputDim() == nnet_output_sum);
   }

   void WriteData(std::ostream &os, bool binary) const {
     // useful dims
     int32 nnet_count = nnet_.size();
     //
     WriteToken(os, binary, "<NestedNnetCount>");
     WriteBasicType(os, binary, nnet_count);
     if (!binary) os << "\n";
     for (int32 i = 0; i < nnet_count; i++) {
       WriteToken(os, binary, "<NestedNnet>");
       WriteBasicType(os, binary, i+1);
       if (!binary) os << "\n";
       nnet_[i].Write(os, binary);
     }
     WriteToken(os, binary, "</ParallelComponent>");
   }

   int32 NumParams() const {
     int32 ans = 0;
     for (int32 i = 0; i < nnet_.size(); i++) {
       ans += nnet_[i].NumParams();
     }
     return ans;
   }

   void GetGradient(VectorBase<BaseFloat>* gradient) const {
     KALDI_ASSERT(gradient->Dim() == NumParams());
     int32 offset = 0;
     for (int32 i = 0; i < nnet_.size(); i++) {
       int32 n_params = nnet_[i].NumParams();
       Vector<BaseFloat> gradient_aux;  // we need 'Vector<>',
       nnet_[i].GetGradient(&gradient_aux);  // copy gradient from Nnet,
       gradient->Range(offset, n_params).CopyFromVec(gradient_aux);
       offset += n_params;
     }
     KALDI_ASSERT(offset == NumParams());
   }

   void GetParams(VectorBase<BaseFloat>* params) const {
     KALDI_ASSERT(params->Dim() == NumParams());
     int32 offset = 0;
     for (int32 i = 0; i < nnet_.size(); i++) {
       int32 n_params = nnet_[i].NumParams();
       Vector<BaseFloat> params_aux;  // we need 'Vector<>',
       nnet_[i].GetParams(&params_aux);  // copy params from Nnet,
       params->Range(offset, n_params).CopyFromVec(params_aux);
       offset += n_params;
     }
     KALDI_ASSERT(offset == NumParams());
   }

   void SetParams(const VectorBase<BaseFloat>& params) {
     KALDI_ASSERT(params.Dim() == NumParams());
     int32 offset = 0;
     for (int32 i = 0; i < nnet_.size(); i++) {
       int32 n_params = nnet_[i].NumParams();
       nnet_[i].SetParams(params.Range(offset, n_params));
       offset += n_params;
     }
     KALDI_ASSERT(offset == NumParams());
   }

   std::string Info() const {
     std::ostringstream os;
     os << "\n";
     for (int32 i = 0; i < nnet_.size(); i++) {
       os << "nested_network #" << i+1 << " {\n"
          << nnet_[i].Info()
          << "}\n";
     }
     std::string s(os.str());
     s.erase(s.end() -1);  // removing last '\n'
     return s;
   }

   std::string InfoGradient() const {
     std::ostringstream os;
     os << "\n";
     for (int32 i = 0; i < nnet_.size(); i++) {
       os << "nested_gradient #" << i+1 << " {\n"
          << nnet_[i].InfoGradient(false)
          << "}\n";
     }
     std::string s(os.str());
     s.erase(s.end() -1);  // removing last '\n'
     return s;
   }

   std::string InfoPropagate() const {
     std::ostringstream os;
     for (int32 i = 0; i < nnet_.size(); i++) {
       os << "nested_propagate #" << i+1 << " {\n"
          << nnet_[i].InfoPropagate(false)
          << "}\n";
     }
     return os.str();
   }

   std::string InfoBackPropagate() const {
     std::ostringstream os;
     for (int32 i = 0; i < nnet_.size(); i++) {
       os << "nested_backpropagate #" << i+1 << " {\n"
          << nnet_[i].InfoBackPropagate(false)
          << "}\n";
     }
     return os.str();
   }

   void PropagateFnc(const CuMatrixBase<BaseFloat> &in,
                     CuMatrixBase<BaseFloat> *out) {
     // column-offsets for data buffers 'in,out',
     int32 input_offset = 0, output_offset = 0;
     // loop over nnets,
     for (int32 i = 0; i < nnet_.size(); i++) {
       // get the data 'windows',
       CuSubMatrix<BaseFloat> src(
         in.ColRange(input_offset, nnet_[i].InputDim())
       );
       CuSubMatrix<BaseFloat> tgt(
         out->ColRange(output_offset, nnet_[i].OutputDim())
       );
       // forward through auxiliary matrix, as 'Propagate' requires 'CuMatrix',
       CuMatrix<BaseFloat> tgt_aux;
       nnet_[i].Propagate(src, &tgt_aux);
       tgt.CopyFromMat(tgt_aux);
       // advance the offsets,
       input_offset += nnet_[i].InputDim();
       output_offset += nnet_[i].OutputDim();
     }
   }

   void BackpropagateFnc(const CuMatrixBase<BaseFloat> &in,
                         const CuMatrixBase<BaseFloat> &out,
                         const CuMatrixBase<BaseFloat> &out_diff,
                         CuMatrixBase<BaseFloat> *in_diff) {
     // column-offsets for data buffers 'in,out',
     int32 input_offset = 0, output_offset = 0;
     // loop over nnets,
     for (int32 i = 0; i < nnet_.size(); i++) {
       // get the data 'windows',
       CuSubMatrix<BaseFloat> src(
         out_diff.ColRange(output_offset, nnet_[i].OutputDim())
       );
       CuSubMatrix<BaseFloat> tgt(
         in_diff->ColRange(input_offset, nnet_[i].InputDim())
       );
       // ::Backpropagate through auxiliary matrix (CuMatrix in the interface),
       CuMatrix<BaseFloat> tgt_aux;
       nnet_[i].Backpropagate(src, &tgt_aux);
       tgt.CopyFromMat(tgt_aux);
       // advance the offsets,
       input_offset += nnet_[i].InputDim();
       output_offset += nnet_[i].OutputDim();
     }
   }

   void Update(const CuMatrixBase<BaseFloat> &input,
               const CuMatrixBase<BaseFloat> &diff) {
     { }  // do nothing
   }

   void SetTrainOptions(const NnetTrainOptions &opts) {
     for (int32 i = 0; i < nnet_.size(); i++) {
       nnet_[i].SetTrainOptions(opts);
     }
   }

   void SetLearnRateCoef(BaseFloat val) {
     // loop over nnets,
     for (int32 i = 0; i < nnet_.size(); i++) {
       // loop over components,
       for (int32 j = 0; j < nnet_[i].NumComponents(); j++) {
         if (nnet_[i].GetComponent(j).IsUpdatable()) {
           UpdatableComponent& comp =
             dynamic_cast<UpdatableComponent&>(nnet_[i].GetComponent(j));
           // set the value,
           comp.SetLearnRateCoef(val);
         }
       }
     }
   }

   void SetBiasLearnRateCoef(BaseFloat val) {
     // loop over nnets,
     for (int32 i = 0; i < nnet_.size(); i++) {
       // loop over components,
       for (int32 j = 0; j < nnet_[i].NumComponents(); j++) {
         if (nnet_[i].GetComponent(j).IsUpdatable()) {
           UpdatableComponent& comp =
             dynamic_cast<UpdatableComponent&>(nnet_[i].GetComponent(j));
           // set the value,
           comp.SetBiasLearnRateCoef(val);
         }
       }
     }
   }

   void SetSeqLengths(const std::vector<int32> &sequence_lengths) {
     sequence_lengths_ = sequence_lengths;
     // loop over nnets,
     for (int32 i = 0; i < nnet_.size(); i++) {
       nnet_[i].SetSeqLengths(sequence_lengths);
     }
   }

  private:
   std::vector<Nnet> nnet_;
 };

 }  // namespace nnet1
 }  // namespace kaldi

 #endif  // KALDI_NNET_NNET_PARALLEL_COMPONENT_H_
kaldi::nnet1::ParallelComponent::WriteData
void WriteData(std::ostream &os, bool binary) const
Writes the component content.
Definition: nnet-parallel-component.h:134

kaldi::CuMatrixBase::CopyFromMat
void CopyFromMat(const MatrixBase< OtherReal > &src, MatrixTransposeType trans=kNoTrans)
Definition: cu-matrix.cc:344

kaldi
This code computes Goodness of Pronunciation (GOP) and extracts phone-level pronunciation feature for...
Definition: chain.dox:20

kaldi::nnet1::ParallelComponent::PropagateFnc
void PropagateFnc(const CuMatrixBase< BaseFloat > &in, CuMatrixBase< BaseFloat > *out)
Abstract interface for propagation/backpropagation.
Definition: nnet-parallel-component.h:241

kaldi::nnet1::ParallelComponent::Info
std::string Info() const
Print some additional info (after <ComponentName> and the dims),.
Definition: nnet-parallel-component.h:195

rnnlm::j
int j
Definition: mikolov-rnnlm-lib.cc:66

kaldi::nnet1::ParallelComponent::InfoBackPropagate
std::string InfoBackPropagate() const
Definition: nnet-parallel-component.h:231

kaldi::ReadBasicType
void ReadBasicType(std::istream &is, bool binary, T *t)
ReadBasicType is the name of the read function for bool, integer types, and floating-point types...
Definition: io-funcs-inl.h:55

kaldi::nnet1::UpdatableComponent
Class UpdatableComponent is a Component which has trainable parameters, it contains SGD training hype...
Definition: nnet-component.h:208

kaldi::nnet1::ParallelComponent::NumParams
int32 NumParams() const
Number of trainable parameters,.
Definition: nnet-parallel-component.h:150

kaldi::int32
kaldi::int32 int32
Definition: online-tcp-source.cc:27

kaldi::ReadToken
void ReadToken(std::istream &is, bool binary, std::string *str)
ReadToken gets the next token and puts it in str (exception on failure).
Definition: io-funcs.cc:154

kaldi::nnet1::ParallelComponent::SetTrainOptions
void SetTrainOptions(const NnetTrainOptions &opts)
Overriding the default, which was UpdatableComponent::SetTrainOptions(...)
Definition: nnet-parallel-component.h:298

kaldi::CuMatrix
This class represents a matrix that's stored on the GPU if we have one, and in memory if not...
Definition: matrix-common.h:71

nnet-component.h

kaldi::nnet1::ParallelComponent::GetNestedNnet
const Nnet & GetNestedNnet(int32 id) const
Definition: nnet-parallel-component.h:48

kaldi::nnet1::ParallelComponent::GetNestedNnet
Nnet & GetNestedNnet(int32 id)
Definition: nnet-parallel-component.h:49

kaldi::nnet1::ParallelComponent::GetType
ComponentType GetType() const
Get Type Identification of the component,.
Definition: nnet-parallel-component.h:46

kaldi::nnet1::UpdatableComponent::SetLearnRateCoef
virtual void SetLearnRateCoef(BaseFloat val)
Set the learn-rate coefficient,.
Definition: nnet-component.h:251

kaldi::nnet1::Component::ComponentType
ComponentType
Component type identification mechanism,.
Definition: nnet-component.h:47

kaldi::nnet1::ParallelComponent::SetParams
void SetParams(const VectorBase< BaseFloat > &params)
Set the trainable parameters from, reshaped as a vector,.
Definition: nnet-parallel-component.h:184

kaldi::nnet1::ParallelComponent
Definition: nnet-parallel-component.h:36

kaldi::nnet1::ParallelComponent::SetSeqLengths
void SetSeqLengths(const std::vector< int32 > &sequence_lengths)
Overriding the default, which was MultistreamComponent::SetSeqLengths(...)
Definition: nnet-parallel-component.h:346

kaldi::nnet1::ParallelComponent::SetBiasLearnRateCoef
void SetBiasLearnRateCoef(BaseFloat val)
Overriding the default, which was UpdatableComponent::SetBiasLearnRateCoef(...)
Definition: nnet-parallel-component.h:327

kaldi::nnet1::ParallelComponent::~ParallelComponent
~ParallelComponent()
Definition: nnet-parallel-component.h:42

kaldi::nnet1::ParallelComponent::ReadData
void ReadData(std::istream &is, bool binary)
Reads the component content.
Definition: nnet-parallel-component.h:109

kaldi::nnet1::ParallelComponent::InfoPropagate
std::string InfoPropagate() const
Definition: nnet-parallel-component.h:221

kaldi::nnet1::UpdatableComponent::SetBiasLearnRateCoef
virtual void SetBiasLearnRateCoef(BaseFloat val)
Set the learn-rate coefficient for bias,.
Definition: nnet-component.h:256

float

kaldi::ExpectToken
void ExpectToken(std::istream &is, bool binary, const char *token)
ExpectToken tries to read in the given token, and throws an exception on failure. ...
Definition: io-funcs.cc:191

kaldi::nnet1::Component::InputDim
int32 InputDim() const
Get the dimension of the input,.
Definition: nnet-component.h:130

kaldi::nnet1::Nnet
Definition: nnet-nnet.h:37

KALDI_ERR
#define KALDI_ERR
Definition: kaldi-error.h:147

kaldi::nnet1::Nnet::Read
void Read(const std::string &rxfilename)
Read Nnet from 'rxfilename',.
Definition: nnet-nnet.cc:333

kaldi::CuSubMatrix
This class is used for a piece of a CuMatrix.
Definition: matrix-common.h:70

kaldi::WriteToken
void WriteToken(std::ostream &os, bool binary, const char *token)
The WriteToken functions are for writing nonempty sequences of non-space characters.
Definition: io-funcs.cc:134

kaldi::VectorBase::Dim
MatrixIndexT Dim() const
Returns the dimension of the vector.
Definition: kaldi-vector.h:64

kaldi::nnet1::MultistreamComponent
Class MultistreamComponent is an extension of UpdatableComponent for recurrent networks, which are trained with parallel sequences.
Definition: nnet-component.h:281

kaldi::nnet1::ParallelComponent::InfoGradient
std::string InfoGradient() const
Print some additional info about gradient (after <...> and dims),.
Definition: nnet-parallel-component.h:208

kaldi::nnet1::ParallelComponent::ParallelComponent
ParallelComponent(int32 dim_in, int32 dim_out)
Definition: nnet-parallel-component.h:38

kaldi::nnet1::NnetTrainOptions
Definition: nnet-trnopts.h:30

rnnlm::i
int i
Definition: mikolov-rnnlm-lib.cc:66

kaldi::CuMatrixBase::ColRange
CuSubMatrix< Real > ColRange(const MatrixIndexT col_offset, const MatrixIndexT num_cols) const
Definition: cu-matrix.h:665

cu-math.h

kaldi::nnet1::ParallelComponent::InitData
void InitData(std::istream &is)
Initialize the content of the component by the 'line' from the prototype,.
Definition: nnet-parallel-component.h:51

kaldi::nnet1::Component::kParallelComponent
Definition: nnet-component.h:83

kaldi::CuMatrixBase
Matrix for CUDA computing.
Definition: matrix-common.h:69

kaldi::nnet1::Nnet::Init
void Init(const std::string &proto_file)
Initialize the Nnet from the prototype,.
Definition: nnet-nnet.cc:301

kaldi::nnet1::ParallelComponent::Copy
Component * Copy() const
Copy component (deep copy),.
Definition: nnet-parallel-component.h:45

kaldi::nnet1::ParallelComponent::GetParams
void GetParams(VectorBase< BaseFloat > *params) const
Get the trainable parameters reshaped as a vector,.
Definition: nnet-parallel-component.h:171

kaldi::Vector
A class representing a vector.
Definition: kaldi-vector.h:406

KALDI_ASSERT
#define KALDI_ASSERT(cond)
Definition: kaldi-error.h:185

kaldi::nnet1::ParallelComponent::BackpropagateFnc
void BackpropagateFnc(const CuMatrixBase< BaseFloat > &in, const CuMatrixBase< BaseFloat > &out, const CuMatrixBase< BaseFloat > &out_diff, CuMatrixBase< BaseFloat > *in_diff)
Backward pass transformation (to be implemented by descending class...)
Definition: nnet-parallel-component.h:264

kaldi::WriteBasicType
void WriteBasicType(std::ostream &os, bool binary, T t)
WriteBasicType is the name of the write function for bool, integer types, and floating-point types...
Definition: io-funcs-inl.h:34

kaldi::nnet1::Component
Abstract class, building block of the network.
Definition: nnet-component.cc:51

kaldi::nnet1::ParallelComponent::nnet_
std::vector< Nnet > nnet_
Definition: nnet-parallel-component.h:355

kaldi::nnet1::MultistreamComponent::sequence_lengths_
std::vector< int32 > sequence_lengths_
Definition: nnet-component.h:304

kaldi::nnet1::Component::OutputDim
int32 OutputDim() const
Get the dimension of the output,.
Definition: nnet-component.h:135

kaldi::nnet1::ParallelComponent::Update
void Update(const CuMatrixBase< BaseFloat > &input, const CuMatrixBase< BaseFloat > &diff)
Compute gradient and update parameters,.
Definition: nnet-parallel-component.h:289

kaldi::VectorBase
Provides a vector abstraction class.
Definition: kaldi-vector.h:41

KALDI_LOG
#define KALDI_LOG
Definition: kaldi-error.h:153

nnet-utils.h

kaldi::nnet1::ParallelComponent::GetGradient
void GetGradient(VectorBase< BaseFloat > *gradient) const
Get gradient reshaped as a vector,.
Definition: nnet-parallel-component.h:158

kaldi::nnet1::ParallelComponent::SetLearnRateCoef
void SetLearnRateCoef(BaseFloat val)
Overriding the default, which was UpdatableComponent::SetLearnRateCoef(...)
Definition: nnet-parallel-component.h:308

kaldi::VectorBase::Range
SubVector< Real > Range(const MatrixIndexT o, const MatrixIndexT l)
Returns a sub-vector of a vector (a range of elements).
Definition: kaldi-vector.h:94