doc/nnet-rbm_8h_source.html

 // nnet/nnet-rbm.h

 // Copyright 2012-2013  Brno University of Technology (Author: Karel Vesely)

 // See ../../COPYING for clarification regarding multiple authors
 //
 // Licensed under the Apache License, Version 2.0 (the "License");
 // you may not use this file except in compliance with the License.
 // You may obtain a copy of the License at
 //
 //  http://www.apache.org/licenses/LICENSE-2.0
 //
 // THIS CODE IS PROVIDED *AS IS* BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY
 // KIND, EITHER EXPRESS OR IMPLIED, INCLUDING WITHOUT LIMITATION ANY IMPLIED
 // WARRANTIES OR CONDITIONS OF TITLE, FITNESS FOR A PARTICULAR PURPOSE,
 // MERCHANTABLITY OR NON-INFRINGEMENT.
 // See the Apache 2 License for the specific language governing permissions and
 // limitations under the License.


 #ifndef KALDI_NNET_NNET_RBM_H_
 #define KALDI_NNET_NNET_RBM_H_

 #include <string>

 #include "nnet/nnet-component.h"
 #include "nnet/nnet-nnet.h"
 #include "nnet/nnet-utils.h"
 #include "nnet/nnet-various.h"
 #include "cudamatrix/cu-math.h"

 namespace kaldi {
 namespace nnet1 {

 /// Abstract base class of RBM components.  On top of the Component
 /// interface it declares the RBM-training entry points (Reconstruct,
 /// RbmUpdate), the node-type queries and the export through WriteAsNnet,
 /// and it stores the RbmTrainOptions.
 class RbmBase : public Component {
  public:
   /// Type of the units on the visible or the hidden side.
   enum RbmNodeType {
     Bernoulli,
     Gaussian
   };

   RbmBase(int32 dim_in, int32 dim_out) : Component(dim_in, dim_out) { }

   // From Component we inherit:
   //   void Propagate(...)
   //   virtual void PropagateFnc(...) = 0

   /// Computes the visible-layer reconstruction 'vis_probs' from 'hid_state'.
   virtual void Reconstruct(const CuMatrixBase<BaseFloat> &hid_state,
                            CuMatrix<BaseFloat> *vis_probs) = 0;

   /// Updates the parameters from the positive ('pos_*') and the negative
   /// ('neg_*') visible/hidden statistics.
   virtual void RbmUpdate(const CuMatrixBase<BaseFloat> &pos_vis,
                          const CuMatrixBase<BaseFloat> &pos_hid,
                          const CuMatrixBase<BaseFloat> &neg_vis,
                          const CuMatrixBase<BaseFloat> &neg_hid) = 0;

   /// Node type of the visible layer.
   virtual RbmNodeType VisType() const = 0;
   /// Node type of the hidden layer.
   virtual RbmNodeType HidType() const = 0;

   /// Writes the RBM to 'os' in the form of ordinary network components.
   virtual void WriteAsNnet(std::ostream& os, bool binary) const = 0;

   /// Stores a copy of the training hyper-parameters.
   void SetRbmTrainOptions(const RbmTrainOptions& opts) { rbm_opts_ = opts; }

   /// Returns the training hyper-parameters stored in this object.
   const RbmTrainOptions& GetRbmTrainOptions() const { return rbm_opts_; }

  protected:
   RbmTrainOptions rbm_opts_;  // hyper-parameters, readable by sub-classes

  private:
   // RBMs go through Reconstruct(.) instead of back-propagation, so both
   // back-propagation entry points are hidden here as private no-ops.
   void Backpropagate(const CuMatrixBase<BaseFloat> &in,
                      const CuMatrixBase<BaseFloat> &out,
                      const CuMatrixBase<BaseFloat> &out_diff,
                      CuMatrix<BaseFloat> *in_diff) { }

   void BackpropagateFnc(const CuMatrixBase<BaseFloat> &in,
                         const CuMatrixBase<BaseFloat> &out,
                         const CuMatrixBase<BaseFloat> &out_diff,
                         CuMatrixBase<BaseFloat> *in_diff) { }
 };


 class Rbm : public RbmBase {
  public:
   /// Stores the input/output dimensions; the trainable parameters are
   /// filled in later by InitData() or ReadData().
   ///
   /// Both node types start as Bernoulli, so that VisType(), HidType(),
   /// WriteData() and Copy() never read an indeterminate enum value on an
   /// object that has not been initialized or read yet.
   Rbm(int32 dim_in, int32 dim_out):
     RbmBase(dim_in, dim_out),
     vis_type_(RbmBase::Bernoulli),
     hid_type_(RbmBase::Bernoulli)
   { }

   /// Empty destructor body; there is nothing to release by hand.
   ~Rbm() { }

   /// Returns a new heap-allocated Rbm created with the copy constructor;
   /// the raw pointer is handed to the caller.
   Component* Copy() const {
     Rbm *clone = new Rbm(*this);
     return clone;
   }

   /// Identifies this component as kRbm.
   ComponentType GetType() const { return kRbm; }

   void InitData(std::istream &is) {
     // define options,
     std::string vis_type;
     std::string hid_type;
     float vis_bias_mean = 0.0, vis_bias_range = 0.0,
           hid_bias_mean = 0.0, hid_bias_range = 0.0,
           param_stddev = 0.1;
     std::string vis_bias_cmvn_file;  // initialize biases to logit(p_active)
     // parse config,
     std::string token;
     while (is >> std::ws, !is.eof()) {
       ReadToken(is, false, &token);
        if (token == "<VisibleType>") ReadToken(is, false, &vis_type);
       else if (token == "<HiddenType>") ReadToken(is, false, &hid_type);
       else if (token == "<VisibleBiasMean>") ReadBasicType(is, false, &vis_bias_mean);
       else if (token == "<VisibleBiasRange>") ReadBasicType(is, false, &vis_bias_range);
       else if (token == "<HiddenBiasMean>") ReadBasicType(is, false, &hid_bias_mean);
       else if (token == "<HiddenBiasRange>") ReadBasicType(is, false, &hid_bias_range);
       else if (token == "<ParamStddev>") ReadBasicType(is, false, &param_stddev);
       else if (token == "<VisibleBiasCmvnFilename>") ReadToken(is, false, &vis_bias_cmvn_file);
       else KALDI_ERR << "Unknown token " << token << " Typo in config?";
     }

     // Translate the 'node' types,
     if (vis_type == "bern" || vis_type == "Bernoulli") vis_type_ = RbmBase::Bernoulli;
     else if (vis_type == "gauss" || vis_type == "Gaussian") vis_type_ = RbmBase::Gaussian;
     else KALDI_ERR << "Wrong <VisibleType>" << vis_type;
     //
     if (hid_type == "bern" || hid_type == "Bernoulli") hid_type_ = RbmBase::Bernoulli;
     else if (hid_type == "gauss" || hid_type == "Gaussian") hid_type_ = RbmBase::Gaussian;
     else KALDI_ERR << "Wrong <HiddenType>" << hid_type;

     //
     // Initialize trainable parameters,
     //
     // visible-hidden connections,
     vis_hid_.Resize(OutputDim(), InputDim());
     RandGauss(0.0, param_stddev, &vis_hid_);
     // hidden-bias,
     hid_bias_.Resize(OutputDim());
     RandUniform(hid_bias_mean, hid_bias_range, &hid_bias_);
     // visible-bias,
     if (vis_bias_cmvn_file == "") {
       vis_bias_.Resize(InputDim());
       RandUniform(vis_bias_mean, vis_bias_range, &vis_bias_);
     } else {
       KALDI_LOG << "Initializing from <VisibleBiasCmvnFilename> "
                 << vis_bias_cmvn_file;
       // Reading Nnet with 'global-cmvn' components,
       Nnet cmvn;
       cmvn.Read(vis_bias_cmvn_file);
       KALDI_ASSERT(InputDim() == cmvn.InputDim());
       // The parameters from <AddShift> correspond to 'negative' mean values,
       Vector<BaseFloat> p(cmvn.InputDim());
       dynamic_cast<AddShift&>(cmvn.GetComponent(0)).GetParams(&p);
       p.Scale(-1.0);  // 'un-do' negation of mean values,
       p.ApplyFloor(0.0001);
       p.ApplyCeiling(0.9999);
       // Getting the logit,
       Vector<BaseFloat> logit_p(p.Dim());
       for (int32 d = 0; d < p.Dim(); d++) {
         logit_p(d) = Log(p(d)) - Log(1.0 - p(d));
       }
       vis_bias_ = logit_p;
       KALDI_ASSERT(vis_bias_.Dim() == InputDim());
     }
   }


   void ReadData(std::istream &is, bool binary) {
     std::string vis_node_type, hid_node_type;
     ReadToken(is, binary, &vis_node_type);
     ReadToken(is, binary, &hid_node_type);

     if (vis_node_type == "bern") {
       vis_type_ = RbmBase::Bernoulli;
     } else if (vis_node_type == "gauss") {
       vis_type_ = RbmBase::Gaussian;
     }
     if (hid_node_type == "bern") {
       hid_type_ = RbmBase::Bernoulli;
     } else if (hid_node_type == "gauss") {
       hid_type_ = RbmBase::Gaussian;
     }

     vis_hid_.Read(is, binary);
     vis_bias_.Read(is, binary);
     hid_bias_.Read(is, binary);

     KALDI_ASSERT(vis_hid_.NumRows() == output_dim_);
     KALDI_ASSERT(vis_hid_.NumCols() == input_dim_);
     KALDI_ASSERT(vis_bias_.Dim() == input_dim_);
     KALDI_ASSERT(hid_bias_.Dim() == output_dim_);
   }

   /// Writes the component content in the order in which ReadData() reads
   /// it: visible node type, hidden node type, vis_hid_, vis_bias_,
   /// hid_bias_.  A node type outside of the enum is reported through
   /// KALDI_ERR.
   void WriteData(std::ostream &os, bool binary) const {
     // visible node type,
     if (vis_type_ == Bernoulli) {
       WriteToken(os, binary, "bern");
     } else if (vis_type_ == Gaussian) {
       WriteToken(os, binary, "gauss");
     } else {
       KALDI_ERR << "Unknown type " << vis_type_;
     }
     // hidden node type,
     if (hid_type_ == Bernoulli) {
       WriteToken(os, binary, "bern");
     } else if (hid_type_ == Gaussian) {
       WriteToken(os, binary, "gauss");
     } else {
       KALDI_ERR << "Unknown type " << hid_type_;
     }
     // trainable parameters,
     vis_hid_.Write(os, binary);
     vis_bias_.Write(os, binary);
     hid_bias_.Write(os, binary);
   }


   // Component API
   /// Forward pass: out = in * vis_hid_^T + hid_bias_ (the bias is added to
   /// every row), followed by an element-wise sigmoid when the hidden nodes
   /// are Bernoulli.
   void PropagateFnc(const CuMatrixBase<BaseFloat> &in,
                     CuMatrixBase<BaseFloat> *out) {
     // beta = 0.0 : every row of 'out' is overwritten with the bias,
     out->AddVecToRows(1.0, hid_bias_, 0.0);
     // beta = 1.0 : the product with the transposed weights is added on top,
     out->AddMatMat(1.0, in, kNoTrans, vis_hid_, kTrans, 1.0);
     // only the Bernoulli hidden nodes get the sigmoid,
     if (hid_type_ != RbmBase::Bernoulli) return;
     out->Sigmoid(*out);
   }

   // RBM training API
   /// Reconstructs the visible layer from the hidden states:
   /// vis_probs = hid_state * vis_hid_ + vis_bias_ (the bias is added to
   /// every row), followed by an element-wise sigmoid when the visible nodes
   /// are Bernoulli.  'vis_probs' is resized when its shape does not match,
   /// a wrong number of columns in 'hid_state' is reported through KALDI_ERR.
   void Reconstruct(const CuMatrixBase<BaseFloat> &hid_state,
                    CuMatrix<BaseFloat> *vis_probs) {
     // the hidden states need 'output_dim_' columns,
     if (hid_state.NumCols() != output_dim_) {
       KALDI_ERR << "Nonmatching dims, component:" << output_dim_
                 << " data:" << hid_state.NumCols();
     }

     // (re)allocate the output buffer only when its shape differs,
     const bool shape_ok = (vis_probs->NumCols() == input_dim_ &&
                            vis_probs->NumRows() == hid_state.NumRows());
     if (!shape_ok) {
       vis_probs->Resize(hid_state.NumRows(), input_dim_);
     }

     // beta = 0.0 : every row is overwritten with the bias,
     vis_probs->AddVecToRows(1.0, vis_bias_, 0.0);
     // beta = 1.0 : the product with the weights is added on top,
     vis_probs->AddMatMat(1.0, hid_state, kNoTrans, vis_hid_, kNoTrans, 1.0);
     // only the Bernoulli visible nodes get the sigmoid,
     if (vis_type_ != RbmBase::Bernoulli) return;
     vis_probs->Sigmoid(*vis_probs);
   }

   /// Updates vis_hid_, vis_bias_ and hid_bias_ from one mini-batch.
   ///
   /// \param pos_vis  input mini-batch, one row per example, input_dim_ columns
   /// \param pos_hid  hidden values that belong to 'pos_vis', output_dim_ columns
   /// \param neg_vis  reconstruction, same shape as 'pos_vis'
   /// \param neg_hid  hidden values that belong to 'neg_vis', same shape as
   ///                 'pos_hid'
   ///
   /// The learning rate, momentum and L2 penalty are taken from rbm_opts_.
   /// For Gaussian visible nodes the call may return without an update,
   /// after scaling down the parameters, see the weight-explosion comment
   /// in the body.
   void RbmUpdate(const CuMatrixBase<BaseFloat> &pos_vis,
                  const CuMatrixBase<BaseFloat> &pos_hid,
                  const CuMatrixBase<BaseFloat> &neg_vis,
                  const CuMatrixBase<BaseFloat> &neg_hid) {
     // dims
     KALDI_ASSERT(pos_vis.NumRows() == pos_hid.NumRows() &&
            pos_vis.NumRows() == neg_vis.NumRows() &&
            pos_vis.NumRows() == neg_hid.NumRows() &&
            pos_vis.NumCols() == neg_vis.NumCols() &&
            pos_hid.NumCols() == neg_hid.NumCols() &&
            pos_vis.NumCols() == input_dim_ &&
            pos_hid.NumCols() == output_dim_);

     // lazy initialization of buffers
     if ( vis_hid_corr_.NumRows() != vis_hid_.NumRows() ||
          vis_hid_corr_.NumCols() != vis_hid_.NumCols() ||
          vis_bias_corr_.Dim()    != vis_bias_.Dim()    ||
          hid_bias_corr_.Dim()    != hid_bias_.Dim()     ) {
       vis_hid_corr_.Resize(vis_hid_.NumRows(), vis_hid_.NumCols(), kSetZero);
       vis_bias_corr_.Resize(vis_bias_.Dim(), kSetZero);
       hid_bias_corr_.Resize(hid_bias_.Dim(), kSetZero);
     }

     // ANTI-WEIGHT-EXPLOSION PROTECTION (Gaussian-Bernoulli RBM)
     //
     // in the following section we detect that the weights in
     // Gaussian-Bernoulli RBM are almost exploding. The weight
     // explosion is caused by large variance of the reconstructed data,
     // which causes a feed-back loop that keeps increasing the weights.
     //
     // To avoid explosion, the standard-deviation of the visible-data
     // and reconstructed-data should be about the same.
     // The model is particularly sensitive at the very
     // beginning of the CD-1 training.
     //
     // We compute the standard deviations on
     // * 'A' : input mini-batch
     // * 'B' : reconstruction.
     // When 'B > 2*A', we stabilize the training in this way:
     // 1. we scale down the weights and biases by 'A/B',
     // 2. we shrink learning rate by 0.9x,
     // 3. we reset the momentum buffer,
     //
     // A warning message is put to the log. In later stage
     // the learning-rate returns back to its original value.
     //
     // To avoid the issue, we make sure that the weight-matrix
     // is sensibly initialized.
     //
     if (vis_type_ == RbmBase::Gaussian) {
       // check the data have no nan/inf, the 2nd argument names the
       // matrix in the message:
       CheckNanInf(pos_vis, "pos_vis");
       CheckNanInf(pos_hid, "pos_hid");
       CheckNanInf(neg_vis, "neg_vis");
       CheckNanInf(neg_hid, "neg_hid");

       // get standard deviations of pos_vis and neg_vis:
       BaseFloat pos_vis_std = ComputeStdDev(pos_vis);
       BaseFloat neg_vis_std = ComputeStdDev(neg_vis);

       // monitor the standard deviation mismatch : data vs. reconstruction
       if (pos_vis_std * 2 < neg_vis_std) {
         // 1) scale-down the weights and biases
         BaseFloat scale = pos_vis_std / neg_vis_std;
         vis_hid_.Scale(scale);
         vis_bias_.Scale(scale);
         hid_bias_.Scale(scale);
         // 2) reduce the learning rate
         rbm_opts_.learn_rate *= 0.9;
         // 3) reset the momentum buffers
         vis_hid_corr_.SetZero();
         vis_bias_corr_.SetZero();
         hid_bias_corr_.SetZero();

         KALDI_WARN << "Mismatch between pos_vis and neg_vis variances, "
                    << "danger of weight explosion."
                    << " a) Reducing weights with scale " << scale
                    << " b) Lowering learning rate to " << rbm_opts_.learn_rate
                    << " [pos_vis_std:" << pos_vis_std
                    << ",neg_vis_std:" << neg_vis_std << "]";
         return; /* i.e. don't update now, the update would be too BIG */
       }
     }
     //
     // End of weight-explosion check


     //  We use these training hyper-parameters
     //
     const BaseFloat lr = rbm_opts_.learn_rate;
     const BaseFloat mmt = rbm_opts_.momentum;
     const BaseFloat l2 = rbm_opts_.l2_penalty;

     //  UPDATE vishid matrix
     //
     //  vishidinc = momentum*vishidinc + ...
     //              epsilonw*( (posprods-negprods)/numcases - weightcost*vishid)
     //
     //  vishidinc[t] = -(epsilonw/numcases)*negprods + momentum*vishidinc[t-1]
     //                 +(epsilonw/numcases)*posprods
     //                 -(epsilonw*weightcost)*vishid[t-1]
     //
     BaseFloat N = static_cast<BaseFloat>(pos_vis.NumRows());
     // the 1st call scales the old increment by the momentum (beta = mmt),
     // the following calls accumulate on top of it,
     vis_hid_corr_.AddMatMat(-lr/N, neg_hid, kTrans, neg_vis, kNoTrans, mmt);
     vis_hid_corr_.AddMatMat(+lr/N, pos_hid, kTrans, pos_vis, kNoTrans, 1.0);
     vis_hid_corr_.AddMat(-lr*l2, vis_hid_);
     vis_hid_.AddMat(1.0, vis_hid_corr_);

     //  UPDATE visbias vector
     //
     //  visbiasinc = momentum*visbiasinc +
     //               (epsilonvb/numcases)*(posvisact-negvisact);
     //
     vis_bias_corr_.AddRowSumMat(-lr/N, neg_vis, mmt);
     vis_bias_corr_.AddRowSumMat(+lr/N, pos_vis, 1.0);
     vis_bias_.AddVec(1.0, vis_bias_corr_, 1.0);

     //  UPDATE hidbias vector
     //
     // hidbiasinc = momentum*hidbiasinc +
     //              (epsilonhb/numcases)*(poshidact-neghidact);
     //
     hid_bias_corr_.AddRowSumMat(-lr/N, neg_hid, mmt);
     hid_bias_corr_.AddRowSumMat(+lr/N, pos_hid, 1.0);
     hid_bias_.AddVec(1.0, hid_bias_corr_, 1.0);
   }

   /// Node type of the visible layer.
   RbmNodeType VisType() const { return vis_type_; }

   /// Node type of the hidden layer.
   RbmNodeType HidType() const { return hid_type_; }

   /// Writes the forward direction of the RBM as ordinary components:
   /// the kAffineTransform marker with the output and input dimensions,
   /// then vis_hid_ and hid_bias_, and, for Bernoulli hidden nodes, the
   /// kSigmoid marker with the output dimension written twice.
   /// vis_bias_ is not written.
   void WriteAsNnet(std::ostream& os, bool binary) const {
     const bool text_mode = !binary;

     // header of the affine part,
     const char *affine_marker =
       Component::TypeToMarker(Component::kAffineTransform);
     WriteToken(os, binary, affine_marker);
     WriteBasicType(os, binary, OutputDim());
     WriteBasicType(os, binary, InputDim());
     if (text_mode) os << "\n";

     // weights and hidden biases,
     vis_hid_.Write(os, binary);
     hid_bias_.Write(os, binary);

     // the sigmoid is emitted only for the Bernoulli hidden nodes,
     if (HidType() == Bernoulli) {
       const char *sigmoid_marker =
         Component::TypeToMarker(Component::kSigmoid);
       WriteToken(os, binary, sigmoid_marker);
       WriteBasicType(os, binary, OutputDim());
       WriteBasicType(os, binary, OutputDim());
     }
     if (text_mode) os << "\n";
   }

  protected:
   // Trainable parameters:
   // matrix with neuron weights, [OutputDim() x InputDim()],
   CuMatrix<BaseFloat> vis_hid_;
   // vector with biases of the visible nodes, dim InputDim(),
   CuVector<BaseFloat> vis_bias_;
   // vector with biases of the hidden nodes, dim OutputDim(),
   CuVector<BaseFloat> hid_bias_;

   // Update (momentum) buffers, sized lazily in RbmUpdate():
   // matrix for linearity updates,
   CuMatrix<BaseFloat> vis_hid_corr_;
   // vectors for bias updates,
   CuVector<BaseFloat> vis_bias_corr_;
   CuVector<BaseFloat> hid_bias_corr_;

   // Node types of the visible and the hidden layer, set by InitData()
   // or ReadData(),
   RbmNodeType vis_type_;
   RbmNodeType hid_type_;
 };


 }  // namespace nnet1
 }  // namespace kaldi

 #endif  // KALDI_NNET_NNET_RBM_H_
kaldi
This code computes Goodness of Pronunciation (GOP) and extracts phone-level pronunciation feature for...
Definition: chain.dox:20

kaldi::nnet1::Rbm::InitData
void InitData(std::istream &is)
Virtual interface for initialization and I/O,.
Definition: nnet-rbm.h:113

kaldi::nnet1::Rbm::WriteAsNnet
void WriteAsNnet(std::ostream &os, bool binary) const
Definition: nnet-rbm.h:397

kaldi::nnet1::Rbm::hid_bias_
CuVector< BaseFloat > hid_bias_
Vector with biases.
Definition: nnet-rbm.h:418

kaldi::nnet1::Rbm::Copy
Component * Copy() const
Copy component (deep copy),.
Definition: nnet-rbm.h:105

kaldi::nnet1::Rbm::PropagateFnc
void PropagateFnc(const CuMatrixBase< BaseFloat > &in, CuMatrixBase< BaseFloat > *out)
Abstract interface for propagation/backpropagation.
Definition: nnet-rbm.h:226

kaldi::CuVector
Definition: matrix-common.h:74

kaldi::nnet1::Rbm::hid_bias_corr_
CuVector< BaseFloat > hid_bias_corr_
Vector for bias updates.
Definition: nnet-rbm.h:422

kaldi::nnet1::Component::input_dim_
int32 input_dim_
Data members,.
Definition: nnet-component.h:190

kaldi::nnet1::Rbm::hid_type_
RbmNodeType hid_type_
Definition: nnet-rbm.h:425

kaldi::nnet1::RbmTrainOptions::learn_rate
BaseFloat learn_rate
Definition: nnet-trnopts.h:67

kaldi::ReadBasicType
void ReadBasicType(std::istream &is, bool binary, T *t)
ReadBasicType is the name of the read function for bool, integer types, and floating-point types...
Definition: io-funcs-inl.h:55

kaldi::nnet1::RbmBase::rbm_opts_
RbmTrainOptions rbm_opts_
Definition: nnet-rbm.h:76

kaldi::nnet1::Rbm::vis_type_
RbmNodeType vis_type_
Definition: nnet-rbm.h:424

kaldi::nnet1::Nnet::InputDim
int32 InputDim() const
Dimensionality on network input (input feature dim.),.
Definition: nnet-nnet.cc:148

kaldi::nnet1::Rbm::vis_hid_
CuMatrix< BaseFloat > vis_hid_
Matrix with neuron weights.
Definition: nnet-rbm.h:416

kaldi::nnet1::RbmTrainOptions::momentum
BaseFloat momentum
Definition: nnet-trnopts.h:68

kaldi::nnet1::Rbm::VisType
RbmNodeType VisType() const
Definition: nnet-rbm.h:389

kaldi::nnet1::Rbm::RbmUpdate
void RbmUpdate(const CuMatrixBase< BaseFloat > &pos_vis, const CuMatrixBase< BaseFloat > &pos_hid, const CuMatrixBase< BaseFloat > &neg_vis, const CuMatrixBase< BaseFloat > &neg_hid)
Definition: nnet-rbm.h:262

kaldi::nnet1::Component::kSigmoid
Definition: nnet-component.h:62

kaldi::nnet1::RandUniform
void RandUniform(BaseFloat mu, BaseFloat range, CuMatrixBase< Real > *mat, struct RandomState *state=NULL)
Fill CuMatrix with random numbers (Uniform distribution): mu = the mean value, range = the 'width' of...
Definition: nnet-utils.h:188

kaldi::int32
kaldi::int32 int32
Definition: online-tcp-source.cc:27

kaldi::nnet1::Rbm
Definition: nnet-rbm.h:96

kaldi::ReadToken
void ReadToken(std::istream &is, bool binary, std::string *str)
ReadToken gets the next token and puts it in str (exception on failure).
Definition: io-funcs.cc:154

kaldi::nnet1::RbmTrainOptions
Definition: nnet-trnopts.h:65

kaldi::CuMatrix
This class represents a matrix that's stored on the GPU if we have one, and in memory if not...
Definition: matrix-common.h:71

nnet-component.h

kaldi::nnet1::RbmBase::BackpropagateFnc
void BackpropagateFnc(const CuMatrixBase< BaseFloat > &in, const CuMatrixBase< BaseFloat > &out, const CuMatrixBase< BaseFloat > &out_diff, CuMatrixBase< BaseFloat > *in_diff)
Backward pass transformation (to be implemented by descending class...)
Definition: nnet-rbm.h:86

kaldi::nnet1::Component::ComponentType
ComponentType
Component type identification mechanism,.
Definition: nnet-component.h:47

kaldi::nnet1::RbmBase::Bernoulli
Definition: nnet-rbm.h:38

kaldi::kTrans
Definition: matrix-common.h:33

kaldi::nnet1::Component::TypeToMarker
static const char * TypeToMarker(ComponentType t)
Converts component type to marker,.
Definition: nnet-component.cc:84

kaldi::nnet1::RbmTrainOptions::l2_penalty
BaseFloat l2_penalty
Definition: nnet-trnopts.h:72

nnet-various.h

kaldi::nnet1::Rbm::Reconstruct
void Reconstruct(const CuMatrixBase< BaseFloat > &hid_state, CuMatrix< BaseFloat > *vis_probs)
Definition: nnet-rbm.h:239

kaldi::nnet1::AddShift
Adds shift to all the lines of the matrix (can be used for global mean normalization) ...
Definition: nnet-various.h:291

kaldi::nnet1::ComputeStdDev
Real ComputeStdDev(const CuMatrixBase< Real > &mat)
Get the standard deviation of values in the matrix.
Definition: nnet-utils.h:142

kaldi::nnet1::Rbm::GetType
ComponentType GetType() const
Get Type Identification of the component,.
Definition: nnet-rbm.h:109

kaldi::CuMatrixBase::AddVecToRows
void AddVecToRows(Real alpha, const CuVectorBase< Real > &row, Real beta=1.0)
(for each row r of *this), r = alpha * row + beta * r
Definition: cu-matrix.cc:1261

kaldi::Log
double Log(double x)
Definition: kaldi-math.h:100

float

kaldi::CuMatrixBase::Sigmoid
void Sigmoid(const CuMatrixBase< Real > &src)
Set each element to the sigmoid of the corresponding element of "src": element by element...
Definition: cu-matrix.cc:1534

kaldi::nnet1::RbmBase::RbmBase
RbmBase(int32 dim_in, int32 dim_out)
Definition: nnet-rbm.h:42

kaldi::nnet1::RbmBase::VisType
virtual RbmNodeType VisType() const =0

kaldi::nnet1::Rbm::WriteData
void WriteData(std::ostream &os, bool binary) const
Writes the component content.
Definition: nnet-rbm.h:208

kaldi::nnet1::Rbm::HidType
RbmNodeType HidType() const
Definition: nnet-rbm.h:393

kaldi::nnet1::RbmBase
Definition: nnet-rbm.h:35

kaldi::nnet1::RbmBase::HidType
virtual RbmNodeType HidType() const =0

kaldi::nnet1::Component::InputDim
int32 InputDim() const
Get the dimension of the input,.
Definition: nnet-component.h:130

kaldi::nnet1::Component::kAffineTransform
Definition: nnet-component.h:51

kaldi::nnet1::Nnet
Definition: nnet-nnet.h:37

KALDI_ERR
#define KALDI_ERR
Definition: kaldi-error.h:147

kaldi::kNoTrans
Definition: matrix-common.h:34

kaldi::nnet1::RandGauss
void RandGauss(BaseFloat mu, BaseFloat sigma, CuMatrixBase< Real > *mat, struct RandomState *state=NULL)
Fill CuMatrix with random numbers (Gaussian distribution): mu = the mean value, sigma = standard devi...
Definition: nnet-utils.h:164

kaldi::nnet1::Nnet::Read
void Read(const std::string &rxfilename)
Read Nnet from 'rxfilename',.
Definition: nnet-nnet.cc:333

kaldi::nnet1::Component::kRbm
Definition: nnet-component.h:69

kaldi::CuMatrixBase::AddMatMat
void AddMatMat(Real alpha, const CuMatrixBase< Real > &A, MatrixTransposeType transA, const CuMatrixBase< Real > &B, MatrixTransposeType transB, Real beta)
C = alpha * A(^T)*B(^T) + beta * C.
Definition: cu-matrix.cc:1291

KALDI_WARN
#define KALDI_WARN
Definition: kaldi-error.h:150

kaldi::nnet1::RbmBase::GetRbmTrainOptions
const RbmTrainOptions & GetRbmTrainOptions() const
Get training hyper-parameters from the network.
Definition: nnet-rbm.h:71

kaldi::WriteToken
void WriteToken(std::ostream &os, bool binary, const char *token)
The WriteToken functions are for writing nonempty sequences of non-space characters.
Definition: io-funcs.cc:134

kaldi::nnet1::RbmBase::RbmUpdate
virtual void RbmUpdate(const CuMatrixBase< BaseFloat > &pos_vis, const CuMatrixBase< BaseFloat > &pos_hid, const CuMatrixBase< BaseFloat > &neg_vis, const CuMatrixBase< BaseFloat > &neg_hid)=0

kaldi::nnet1::RbmBase::WriteAsNnet
virtual void WriteAsNnet(std::ostream &os, bool binary) const =0

kaldi::nnet1::Component::output_dim_
int32 output_dim_
Dimension of the output of the Component,.
Definition: nnet-component.h:191

cu-math.h

kaldi::CuMatrixBase
Matrix for CUDA computing.
Definition: matrix-common.h:69

kaldi::CuMatrixBase::NumCols
MatrixIndexT NumCols() const
Definition: cu-matrix.h:216

nnet-nnet.h

kaldi::nnet1::RbmBase::Backpropagate
void Backpropagate(const CuMatrixBase< BaseFloat > &in, const CuMatrixBase< BaseFloat > &out, const CuMatrixBase< BaseFloat > &out_diff, CuMatrix< BaseFloat > *in_diff)
Definition: nnet-rbm.h:81

kaldi::Vector
A class representing a vector.
Definition: kaldi-vector.h:406

kaldi::kSetZero
Definition: matrix-common.h:38

KALDI_ASSERT
#define KALDI_ASSERT(cond)
Definition: kaldi-error.h:185

kaldi::nnet1::Rbm::Rbm
Rbm(int32 dim_in, int32 dim_out)
Definition: nnet-rbm.h:98

kaldi::nnet1::RbmBase::Gaussian
Definition: nnet-rbm.h:39

kaldi::nnet1::Rbm::vis_bias_
CuVector< BaseFloat > vis_bias_
Vector with biases.
Definition: nnet-rbm.h:417

kaldi::nnet1::Nnet::GetComponent
const Component & GetComponent(int32 c) const
Component accessor,.
Definition: nnet-nnet.cc:153

kaldi::nnet1::Rbm::vis_bias_corr_
CuVector< BaseFloat > vis_bias_corr_
Vector for bias updates.
Definition: nnet-rbm.h:421

kaldi::WriteBasicType
void WriteBasicType(std::ostream &os, bool binary, T t)
WriteBasicType is the name of the write function for bool, integer types, and floating-point types...
Definition: io-funcs-inl.h:34

kaldi::nnet1::Component
Abstract class, building block of the network.
Definition: nnet-component.cc:51

kaldi::nnet1::RbmBase::SetRbmTrainOptions
void SetRbmTrainOptions(const RbmTrainOptions &opts)
Set training hyper-parameters to the network and its UpdatableComponent(s)
Definition: nnet-rbm.h:67

kaldi::nnet1::Rbm::vis_hid_corr_
CuMatrix< BaseFloat > vis_hid_corr_
Matrix for linearity updates.
Definition: nnet-rbm.h:420

kaldi::nnet1::Component::OutputDim
int32 OutputDim() const
Get the dimension of the output,.
Definition: nnet-component.h:135

kaldi::CuMatrixBase::NumRows
MatrixIndexT NumRows() const
Dimensions.
Definition: cu-matrix.h:215

KALDI_LOG
#define KALDI_LOG
Definition: kaldi-error.h:153

nnet-utils.h

kaldi::nnet1::RbmBase::Reconstruct
virtual void Reconstruct(const CuMatrixBase< BaseFloat > &hid_state, CuMatrix< BaseFloat > *vis_probs)=0

kaldi::nnet1::Rbm::~Rbm
~Rbm()
Definition: nnet-rbm.h:102

kaldi::CuMatrix::Resize
void Resize(MatrixIndexT rows, MatrixIndexT cols, MatrixResizeType resize_type=kSetZero, MatrixStrideType stride_type=kDefaultStride)
Allocate the memory.
Definition: cu-matrix.cc:50

kaldi::nnet1::CheckNanInf
void CheckNanInf(const CuMatrixBase< Real > &mat, const char *msg="")
Check that matrix contains no nan or inf.
Definition: nnet-utils.h:132

rnnlm::d
double d
Definition: mikolov-rnnlm-lib.cc:64

kaldi::nnet1::Rbm::ReadData
void ReadData(std::istream &is, bool binary)
Reads the component content.
Definition: nnet-rbm.h:182

kaldi::nnet1::RbmBase::RbmNodeType
RbmNodeType
Definition: nnet-rbm.h:37