// From the declaration of class NnetComputer:
NnetComputer(const Nnet &nnet,
             const CuMatrixBase<BaseFloat> &input_feats,
             bool pad,
             Nnet *nnet_to_update = NULL);

// The constructor checks the feature dimension and, if pad == true, pads the
// input with copies of the first and last frames:
NnetComputer::NnetComputer(const Nnet &nnet,
                           const CuMatrixBase<BaseFloat> &input_feats,
                           bool pad,
                           Nnet *nnet_to_update):
    nnet_(nnet), nnet_to_update_(nnet_to_update) {
  int32 dim = input_feats.NumCols();
  if (dim != nnet.InputDim())
    KALDI_ERR << "Feature dimension is " << dim << " but network expects "
              << nnet.InputDim();
  int32 left_context = (pad ? nnet_.LeftContext() : 0),
      right_context = (pad ? nnet_.RightContext() : 0);
  int32 num_rows = left_context + input_feats.NumRows() + right_context;
  // ... (forward_data_ is allocated; "input" aliases forward_data_[0]) ...
  input.Resize(num_rows, dim);
  input.Range(left_context, input_feats.NumRows(),
              0, dim).CopyFromMat(input_feats);
  for (int32 i = 0; i < left_context; i++)
    input.Row(i).CopyFromVec(input_feats.Row(0));
  int32 last_row = input_feats.NumRows() - 1;
  for (int32 i = 0; i < right_context; i++)
    input.Row(num_rows - i - 1).CopyFromVec(input_feats.Row(last_row));
}
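// Editorial sketch, not in the original file: with left_context == 2,
// right_context == 1 and T input frames, the padded matrix built above is
//
//   rows 0..1      copies of input_feats.Row(0)
//   rows 2..T+1    input_feats rows 0..T-1
//   row  T+2       copy of input_feats.Row(T-1)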
// In NnetComputer::Propagate(): after computing component c's output, free
// the stored input matrix if the backward pass will not need it.
bool will_do_backprop = (nnet_to_update_ != NULL),
    keep_last_output = will_do_backprop &&
      ((c > 0 && prev_component->BackpropNeedsOutput()) ||
       component.BackpropNeedsInput());
if (!keep_last_output)
  forward_data_[c].Resize(0, 0);  // Save memory.
BaseFloat NnetComputer::ComputeLastLayerDeriv(const Posterior &pdf_post,
                                              CuMatrix<BaseFloat> *deriv) const {
  double tot_objf = 0.0, tot_weight = 0.0;
  const CuMatrix<BaseFloat> &last_layer_output = forward_data_.back();
  int32 num_frames = last_layer_output.NumRows(),
      num_pdfs = last_layer_output.NumCols();
  KALDI_ASSERT(pdf_post.size() == static_cast<size_t>(num_frames));
  deriv->Resize(num_frames, num_pdfs);  // Resize() zeroes the matrix.
  for (int32 i = 0; i < num_frames; i++) {
    for (size_t j = 0; j < pdf_post[i].size(); j++) {
      int32 label = pdf_post[i][j].first;
      BaseFloat weight = pdf_post[i][j].second;
      BaseFloat this_prob = last_layer_output(i, label);
      tot_objf += weight * Log(this_prob);
      tot_weight += weight;
      (*deriv)(i, label) += weight / this_prob;
    }
  }
  KALDI_VLOG(4) << "Objective function is " << (tot_objf / tot_weight)
                << " per frame over " << tot_weight << " samples.";
  return tot_objf;
}
152 &output_deriv = *tmp_deriv;
155 component_to_update, &input_deriv);
156 *tmp_deriv = input_deriv;
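// Editorial note, not in the original file: each iteration consumes the
// derivative w.r.t. a component's output and produces the derivative w.r.t.
// its input, so *tmp_deriv walks the chain rule backward through the layers,
// while component_to_update (taken from nnet_to_update_) accumulates the
// parameter gradient as a side effect.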
// In NnetComputation(): forward pass only, so nnet_to_update is NULL.
NnetComputer nnet_computer(nnet, input, pad_input, NULL);
void NnetComputationChunked(const Nnet &nnet,
                            const CuMatrixBase<BaseFloat> &input,
                            int32 chunk_size,
                            CuMatrixBase<BaseFloat> *output) {
  // ... (dim, num_chunks, left_context and right_context are set up here) ...
  int32 num_rows = left_context + input.NumRows() + right_context;
  CuMatrix<BaseFloat> full_input;
  full_input.Resize(num_rows, dim);
  full_input.Range(left_context, input.NumRows(),
                   0, dim).CopyFromMat(input);
  for (int32 i = 0; i < left_context; i++)
    full_input.Row(i).CopyFromVec(input.Row(0));
  int32 last_row = input.NumRows() - 1;
  for (int32 i = 0; i < right_context; i++)
    full_input.Row(num_rows - i - 1).CopyFromVec(input.Row(last_row));

  for (int32 i = 0; i < num_chunks; i++) {
    int32 index = i * chunk_size,
        offset = std::min(num_rows - chunk_size * i,
                          left_context + chunk_size + right_context);
    // ... (cu_chunk_input holds rows [index, index + offset) of full_input)
    NnetComputer nnet_computer(nnet, cu_chunk_input, false, NULL);
    // ... (propagate; cu_chunk_output is the computer's output) ...
    CuSubMatrix<BaseFloat> chunk_out(*output, i * chunk_size,
                                     cu_chunk_output.NumRows(), 0,
                                     cu_chunk_output.NumCols());
    chunk_out.CopyFromMat(cu_chunk_output);
  }
}
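// Editorial note, not in the original file: each chunk is sliced from the
// already-padded full_input with its left and right context attached, which is
// why the per-chunk NnetComputer is constructed with pad == false. The chunk
// outputs therefore line up with what a single unchunked NnetComputation()
// would produce, while bounding the size of any one matrix held on the GPU.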
BaseFloat NnetGradientComputation(const Nnet &nnet,
                                  const CuMatrixBase<BaseFloat> &input,
                                  bool pad_input,
                                  const Posterior &pdf_post,
                                  Nnet *nnet_to_update) {
  NnetComputer nnet_computer(nnet, input, pad_input, nnet_to_update);
  // ... (Propagate, ComputeLastLayerDeriv, Backprop; returns the objf) ...
}
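// A minimal usage sketch (editorial, not from the original file). It assumes
// a trained nnet plus features already on the GPU; "feats", "post", and the
// function name ExampleUsage are placeholder names for illustration.
void ExampleUsage(const Nnet &nnet, const CuMatrixBase<BaseFloat> &feats,
                  const Posterior &post) {
  // Forward pass with padding, so the output has one row per input frame:
  CuMatrix<BaseFloat> output(feats.NumRows(), nnet.OutputDim());
  NnetComputation(nnet, feats, true, &output);

  // Forward + backward pass, accumulating the gradient into a zeroed copy
  // of the network; the return value is the total log-prob objective:
  Nnet gradient(nnet);
  gradient.SetZero(true);  // true == treat the copy as a gradient
  BaseFloat objf = NnetGradientComputation(nnet, feats, true, post, &gradient);
  KALDI_LOG << "Objective function: " << objf;
}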