doc/nnet-convolutional-component-temp_8h_source.html

 // nnet3/nnet-convolutional-component.h

 // Copyright      2017  Johns Hopkins University (author: Daniel Povey)

 // See ../../COPYING for clarification regarding multiple authors
 //
 // Licensed under the Apache License, Version 2.0 (the "License");
 // you may not use this file except in compliance with the License.
 // You may obtain a copy of the License at
 //
 //  http://www.apache.org/licenses/LICENSE-2.0
 //
 // THIS CODE IS PROVIDED *AS IS* BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY
 // KIND, EITHER EXPRESS OR IMPLIED, INCLUDING WITHOUT LIMITATION ANY IMPLIED
 // WARRANTIES OR CONDITIONS OF TITLE, FITNESS FOR A PARTICULAR PURPOSE,
 // MERCHANTABLITY OR NON-INFRINGEMENT.
 // See the Apache 2 License for the specific language governing permissions and
 // limitations under the License.

 #ifndef KALDI_NNET3_NNET_CONVOLUTIONAL_COMPONENT_H_
 #define KALDI_NNET3_NNET_CONVOLUTIONAL_COMPONENT_H_

 #include "nnet3/nnet-common.h"
 #include "nnet3/nnet-component-itf.h"
 #include "nnet3/natural-gradient-online.h"
 #include "nnet3/convolution.h"
 #include <iostream>

 namespace kaldi {
 namespace nnet3 {


 // TimeHeightConvolutionComponent is an UpdatableComponent whose trainable
 // parameters are a matrix (linear_params_) and a bias vector (bias_params_),
 // and whose convolution structure is described by a
 // time_height_convolution::ConvolutionModel (model_).  Most member functions
 // are only declared here and are defined out of line.
 class TimeHeightConvolutionComponent: public UpdatableComponent {
  public:

   // The use of this constructor should only precede InitFromConfig()
   TimeHeightConvolutionComponent();

   // Copy constructor
   TimeHeightConvolutionComponent(const TimeHeightConvolutionComponent &other);

   // Input and output dimensions of the component (defined out of line).
   virtual int32 InputDim() const;
   virtual int32 OutputDim() const;

   // Returns a human-readable description of the component.
   virtual std::string Info() const;
   // Initializes the component from a parsed config line.
   virtual void InitFromConfig(ConfigLine *cfl);
   // Type name of this component.
   virtual std::string Type() const { return "TimeHeightConvolutionComponent"; }
   // Bitmask of component properties: the component is updatable, reorders
   // indexes, adds to (rather than sets) its backprop output, needs the input
   // in backprop, and requires contiguous input and output matrices.
   virtual int32 Properties() const {
     return kUpdatableComponent|kReordersIndexes|kBackpropAdds|
         kBackpropNeedsInput|kInputContiguous|kOutputContiguous;
   }
   // Forward computation: reads 'in', writes '*out'.  The returned void*
   // corresponds to the 'memo' argument of Backprop().
   virtual void* Propagate(const ComponentPrecomputedIndexes *indexes,
                          const CuMatrixBase<BaseFloat> &in,
                          CuMatrixBase<BaseFloat> *out) const;
   // Backward computation.  'to_update' is the component whose parameters
   // get updated and 'in_deriv' receives the derivative w.r.t. the input.
   virtual void Backprop(const std::string &debug_info,
                         const ComponentPrecomputedIndexes *indexes,
                         const CuMatrixBase<BaseFloat> &in_value,
                         const CuMatrixBase<BaseFloat> &out_value,
                         const CuMatrixBase<BaseFloat> &out_deriv,
                         void *memo,
                         Component *to_update,
                         CuMatrixBase<BaseFloat> *in_deriv) const;

   // Serialization of the component from/to a stream.
   virtual void Read(std::istream &is, bool binary);
   virtual void Write(std::ostream &os, bool binary) const;
   // Returns a copy of this object, allocated with 'new' via the copy
   // constructor.
   virtual Component* Copy() const {
     return new TimeHeightConvolutionComponent(*this);
   }


   // Some functions that are only to be reimplemented for GeneralComponents.

   // This ReorderIndexes function may insert 'blank' indexes (indexes with
   // t == kNoTime) as well as reordering the indexes.  This is allowed
   // behavior of ReorderIndexes functions.
   virtual void ReorderIndexes(std::vector<Index> *input_indexes,
                               std::vector<Index> *output_indexes) const;

   // Outputs to 'desired_indexes' the input indexes associated with
   // 'output_index'.
   virtual void GetInputIndexes(const MiscComputationInfo &misc_info,
                                const Index &output_index,
                                std::vector<Index> *desired_indexes) const;

   // This function returns true if at least one of the input indexes used to
   // compute this output index is computable.
   virtual bool IsComputable(const MiscComputationInfo &misc_info,
                             const Index &output_index,
                             const IndexSet &input_index_set,
                             std::vector<Index> *used_inputs) const;

   // Returns an indexes object for the given input and output indexes
   // (see class PrecomputedIndexes below).
   virtual ComponentPrecomputedIndexes* PrecomputeIndexes(
       const MiscComputationInfo &misc_info,
       const std::vector<Index> &input_indexes,
       const std::vector<Index> &output_indexes,
       bool need_backprop) const;

   // Some functions from base-class UpdatableComponent.
   virtual void Scale(BaseFloat scale);
   virtual void Add(BaseFloat alpha, const Component &other);
   virtual void PerturbParams(BaseFloat stddev);
   virtual BaseFloat DotProduct(const UpdatableComponent &other) const;
   virtual int32 NumParameters() const;
   virtual void Vectorize(VectorBase<BaseFloat> *params) const;
   virtual void UnVectorize(const VectorBase<BaseFloat> &params);
   virtual void FreezeNaturalGradient(bool freeze);


   // The precomputed-indexes type for this component; it simply wraps a
   // time_height_convolution::ConvolutionComputation.
   class PrecomputedIndexes: public ComponentPrecomputedIndexes {
    public:
     PrecomputedIndexes() { }
     PrecomputedIndexes(const PrecomputedIndexes &other):
         computation(other.computation) { }
     virtual PrecomputedIndexes *Copy() const;
     virtual void Write(std::ostream &os, bool binary) const;
     // The stream parameter is named 'is' (it is an input stream), matching
     // TimeHeightConvolutionComponent::Read().
     virtual void Read(std::istream &is, bool binary);
     virtual std::string Type() const {
       return "TimeHeightConvolutionComponentPrecomputedIndexes";
     }
     virtual ~PrecomputedIndexes() { }

     // The convolution computation that this object carries.
     time_height_convolution::ConvolutionComputation computation;
   };

   // Scales linear_params_ (only; not bias_params_) by 'alpha'.
   void ScaleLinearParams(BaseFloat alpha) { linear_params_.Scale(alpha); }

   void ConsolidateMemory();
  private:

   // Self-consistency check of this object (defined out of line).
   void Check() const;

   // Computes the derived member variables (all_time_offsets_ and
   // time_offset_required_, going by the descriptions of those members below).
   void ComputeDerived();

   // Function that updates linear_params_ and bias_params_, which
   // uses the natural gradient code.
   void UpdateNaturalGradient(
       const PrecomputedIndexes &indexes,
       const CuMatrixBase<BaseFloat> &in_value,
       const CuMatrixBase<BaseFloat> &out_deriv);

   // Function that updates linear_params_ and bias_params_, which
   // does not use the natural gradient code.
   void UpdateSimple(
       const PrecomputedIndexes &indexes,
       const CuMatrixBase<BaseFloat> &in_value,
       const CuMatrixBase<BaseFloat> &out_deriv);

   // Function called to initialize linear_params_ if init-unit=true in the config
   // line.
   void InitUnit();

   // Describes the structure of the convolution.
   time_height_convolution::ConvolutionModel model_;

   // all_time_offsets_ is a copy of the corresponding variable in
   // model_, stored as a vector instead of as a set for efficiency.
   std::vector<int32> all_time_offsets_;
   // time_offset_required_ is a vector with the same dimension as
   // 'all_time_offsets_', which is true if the corresponding time-offset
   // is a member of model_.required_time_offsets_.
   std::vector<bool> time_offset_required_;

   // the linear parameters of the convolution.
   // dimension is model_.ParamRows() by model_.ParamCols(),
   // which equals num-filters-out by
   // (num-filters-in * patch-rows * patch-cols),
   // a.k.a.
   // (num-filters-in * num-time-offsets * num-height-offset).
   CuMatrix<BaseFloat> linear_params_;
   // the bias parameters of the convolution, dimension is
   // model_.num_filters_out.
   CuVector<BaseFloat> bias_params_;


   // Maximum amount of temporary memory in megabytes that is allowed to be used
   // in the convolution computation.  (this is per computation, but it's
   // released immediately after it's used, so it doesn't matter how many there
   // are).
   BaseFloat max_memory_mb_;

   // Controls whether or not the natural-gradient is used.
   // Note: even if this is true, if is_gradient_ (from the
   // UpdatableComponent base class) is true, we'll do the 'simple'
   // update that doesn't include natural gradient.
   bool use_natural_gradient_;

   // Preconditioner for the input space, of dimension linear_params_.NumCols() +
   // 1 (the 1 is for the bias).  As with other natural-gradient objects, it's
   // not stored with the model on disk but is reinitialized each time we start
   // up.
   OnlineNaturalGradient preconditioner_in_;

   // Preconditioner for the output space, of dimension
   // linear_params_.NumRows().
   OnlineNaturalGradient preconditioner_out_;
 };


 // TdnnComponent is an UpdatableComponent that appends together the input at
 // several time offsets (time_offsets_) and applies a linear transform
 // (linear_params_), plus a bias (bias_params_) when one is present.  Most
 // member functions are only declared here and are defined out of line.
 class TdnnComponent: public UpdatableComponent {
  public:

   // The use of this constructor should only precede InitFromConfig()
   TdnnComponent();

   // Copy constructor
   TdnnComponent(const TdnnComponent &other);

   // Input dimension: the num-cols of linear_params_ divided by the number of
   // time offsets.  Returns 0 while time_offsets_ is still empty (e.g. on a
   // default-constructed object), which avoids an integer division by zero
   // and agrees with OutputDim(), which reads the num-rows of the same
   // parameter matrix.
   virtual int32 InputDim() const {
     if (time_offsets_.empty())
       return 0;
     return linear_params_.NumCols() / static_cast<int32>(time_offsets_.size());
   }
   // Output dimension: the num-rows of linear_params_.
   virtual int32 OutputDim() const { return linear_params_.NumRows(); }

   // Returns a human-readable description of the component.
   virtual std::string Info() const;
   // Initializes the component from a parsed config line.
   virtual void InitFromConfig(ConfigLine *cfl);
   // Type name of this component.
   virtual std::string Type() const { return "TdnnComponent"; }
   // Bitmask of component properties.  kPropagateAdds is only included when
   // there is no bias (bias_params_ is empty).
   virtual int32 Properties() const {
     return kUpdatableComponent|kReordersIndexes|kBackpropAdds|
         (bias_params_.Dim() == 0 ? kPropagateAdds : 0)|
         kBackpropNeedsInput;
   }
   // Forward computation: reads 'in', writes '*out'.  The returned void*
   // corresponds to the 'memo' argument of Backprop().
   virtual void* Propagate(const ComponentPrecomputedIndexes *indexes,
                          const CuMatrixBase<BaseFloat> &in,
                          CuMatrixBase<BaseFloat> *out) const;
   // Backward computation.  'to_update' is the component whose parameters
   // get updated and 'in_deriv' receives the derivative w.r.t. the input.
   virtual void Backprop(const std::string &debug_info,
                         const ComponentPrecomputedIndexes *indexes,
                         const CuMatrixBase<BaseFloat> &in_value,
                         const CuMatrixBase<BaseFloat> &out_value,
                         const CuMatrixBase<BaseFloat> &out_deriv,
                         void *memo,
                         Component *to_update,
                         CuMatrixBase<BaseFloat> *in_deriv) const;

   // Serialization of the component from/to a stream.
   virtual void Read(std::istream &is, bool binary);
   virtual void Write(std::ostream &os, bool binary) const;
   // Returns a copy of this object, allocated with 'new' via the copy
   // constructor.
   virtual Component* Copy() const {
     return new TdnnComponent(*this);
   }


   // Some functions that are only to be reimplemented for GeneralComponents.

   // This ReorderIndexes function may insert 'blank' indexes (indexes with
   // t == kNoTime) as well as reordering the indexes.  This is allowed
   // behavior of ReorderIndexes functions.
   virtual void ReorderIndexes(std::vector<Index> *input_indexes,
                               std::vector<Index> *output_indexes) const;

   // Outputs to 'desired_indexes' the input indexes associated with
   // 'output_index'.
   virtual void GetInputIndexes(const MiscComputationInfo &misc_info,
                                const Index &output_index,
                                std::vector<Index> *desired_indexes) const;

   // This function returns true if at least one of the input indexes used to
   // compute this output index is computable.
   virtual bool IsComputable(const MiscComputationInfo &misc_info,
                             const Index &output_index,
                             const IndexSet &input_index_set,
                             std::vector<Index> *used_inputs) const;

   // Returns an indexes object for the given input and output indexes
   // (see class PrecomputedIndexes below).
   virtual ComponentPrecomputedIndexes* PrecomputeIndexes(
       const MiscComputationInfo &misc_info,
       const std::vector<Index> &input_indexes,
       const std::vector<Index> &output_indexes,
       bool need_backprop) const;

   // Some functions from base-class UpdatableComponent.
   virtual void Scale(BaseFloat scale);
   virtual void Add(BaseFloat alpha, const Component &other);
   virtual void PerturbParams(BaseFloat stddev);
   virtual BaseFloat DotProduct(const UpdatableComponent &other) const;
   virtual int32 NumParameters() const;
   virtual void Vectorize(VectorBase<BaseFloat> *params) const;
   virtual void UnVectorize(const VectorBase<BaseFloat> &params);
   virtual void FreezeNaturalGradient(bool freeze);


   // The precomputed-indexes type for this component: a row stride plus one
   // row offset per time offset.
   class PrecomputedIndexes: public ComponentPrecomputedIndexes {
    public:
     PrecomputedIndexes() { }
     PrecomputedIndexes(const PrecomputedIndexes &other):
         row_stride(other.row_stride), row_offsets(other.row_offsets) { }
     virtual PrecomputedIndexes *Copy() const;
     virtual void Write(std::ostream &os, bool binary) const;
     // The stream parameter is named 'is' (it is an input stream), matching
     // TdnnComponent::Read().
     virtual void Read(std::istream &is, bool binary);
     virtual std::string Type() const {
       return "TdnnComponentPrecomputedIndexes";
     }
     virtual ~PrecomputedIndexes() { }


     // row_stride is the stride (in number of rows) we have to take in the
     // input matrix each time we form a sub-matrix that will be part of the
     // input to the tdnn operation.  Normally this will be 1, but it may be,
     // for example, 3 in layers where we do subsampling.
     // Note: the default constructor above leaves this member uninitialized.
     int32 row_stride;

     // 'row_offsets' is of the same dimension as time_offsets_.  Each element
     // describes the row offset (in the input matrix) of a sub-matrix.
     // We will append together these sub-matrices (row-wise) to be the input to
     // the affine or linear transform.
     std::vector<int32> row_offsets;
   };

   // Gives mutable access to the linear parameters.
   CuMatrixBase<BaseFloat> &LinearParams() { return linear_params_; }

   // This allows you to resize the vector in order to add a bias where
   // there previously was none-- obviously this should be done carefully.
   CuVector<BaseFloat> &BiasParams() { return bias_params_; }

   // Returns the stored orthonormal-constraint value (see the comment on
   // orthonormal_constraint_ below).
   BaseFloat OrthonormalConstraint() const { return orthonormal_constraint_; }

   void ConsolidateMemory();
  private:

   // This static function is a utility function that extracts a CuSubMatrix
   // representing a subset of rows of 'input_matrix'.
   // The numpy syntax would be:
   //   return input_matrix[row_offset:row_stride:num_output_rows*row_stride,:]
   // NOTE(review): numpy slices are written start:stop:step, so the line
   // above presumably means
   //   input_matrix[row_offset:row_offset+num_output_rows*row_stride:row_stride,:]
   // -- confirm against the definition.
   static CuSubMatrix<BaseFloat> GetInputPart(
       const CuMatrixBase<BaseFloat> &input_matrix,
       int32 num_output_rows,
       int32 row_stride,
       int32 row_offset);

   // see the definition for more explanation.
   static void ModifyComputationIo(time_height_convolution::ConvolutionComputationIo *io);

   // Self-consistency check of this object (defined out of line).
   void Check() const;

   // Function that updates linear_params_, and bias_params_ if present, which
   // uses the natural gradient code.
   void UpdateNaturalGradient(
       const PrecomputedIndexes &indexes,
       const CuMatrixBase<BaseFloat> &in_value,
       const CuMatrixBase<BaseFloat> &out_deriv);

   // Function that updates linear_params_, and bias_params_ if present, which
   // does not use the natural gradient code.
   void UpdateSimple(
       const PrecomputedIndexes &indexes,
       const CuMatrixBase<BaseFloat> &in_value,
       const CuMatrixBase<BaseFloat> &out_deriv);


   // time_offsets_ is the list of time-offsets of the input that
   // we append together; it will typically be (-1,0,1) or (-3,0,3).
   std::vector<int32> time_offsets_;

   // the linear parameters of the network; its NumRows() is the output
   // dim, and its NumCols() equals the input dim times time_offsets_.size().
   CuMatrix<BaseFloat> linear_params_;

   // the bias parameters if this is an affine transform, or the empty vector if
   // this is a linear operation (i.e. use-bias == false in the config).
   CuVector<BaseFloat> bias_params_;

   // If nonzero, this controls how we apply an orthonormal constraint to the
   // parameter matrix; see docs for ConstrainOrthonormal() in nnet-utils.h.
   // This class just returns the value via the OrthonormalConstraint() function;
   // it doesn't actually do anything with it directly.
   BaseFloat orthonormal_constraint_;

   // Controls whether or not the natural-gradient is used.  Note: even if this
   // is true, if is_gradient_ (from the UpdatableComponent base class) is true,
   // we'll do the 'simple' update that doesn't include natural gradient.
   bool use_natural_gradient_;

   // Preconditioner for the input space, of dimension linear_params_.NumCols() +
   // 1 (the 1 is for the bias).  As with other natural-gradient objects, it's
   // not stored with the model on disk but is reinitialized each time we start
   // up.
   OnlineNaturalGradient preconditioner_in_;

   // Preconditioner for the output space, of dimension
   // linear_params_.NumRows().
   OnlineNaturalGradient preconditioner_out_;
 };


 // BlockFactorizedTdnnComponent derives from TdnnComponent.  Per the member
 // comments below, the linear parameters inherited from TdnnComponent are
 // underlain by two smaller matrices, reduced_linear_params_ and
 // block_params_.
 //
 // NOTE(review): this class was visibly left unfinished.  InputBlockDim()
 // and OutputBlockDim() had empty/partial bodies and one member declaration
 // was truncated.  The bodies below are reconstructed from the adjacent
 // comments and must be confirmed by the author.
 class BlockFactorizedTdnnComponent: public TdnnComponent {
  public:

   // Mutable access to the two underlying parameter matrices.  (These
   // accessors preceded any access specifier, which made them private;
   // they are made public here so that they are usable.)
   CuMatrixBase<BaseFloat> &ReducedLinearParams() { return reduced_linear_params_; }
   CuMatrixBase<BaseFloat> &BlockParams() { return block_params_; }
  private:

   // Returns the num-cols of each block of parameters in linear_params_.
   // NOTE(review): reconstructed as (num-cols of the inherited linear
   // parameters) / NumInputBlocks(); returns 0 if there are no blocks, to
   // avoid dividing by zero -- confirm.
   inline int32 InputBlockDim() {
     int32 num_input_blocks = NumInputBlocks();
     if (num_input_blocks == 0)
       return 0;
     return LinearParams().NumCols() / num_input_blocks;
   }

   // Returns the num-cols of block_params_.
   inline int32 ParamsPerBlock() { return block_params_.NumCols(); }

   // Returns the num-rows of each block of parameters in linear_params_.
   // NOTE(review): reconstructed as (num-rows of the inherited linear
   // parameters) / NumOutputBlocks(); returns 0 if there are no blocks, to
   // avoid dividing by zero -- confirm.
   inline int32 OutputBlockDim() {
     int32 num_output_blocks = NumOutputBlocks();
     if (num_output_blocks == 0)
       return 0;
     return LinearParams().NumRows() / num_output_blocks;
   }
   // The number of input blocks is the num-cols of reduced_linear_params_,
   // and the number of output blocks is its num-rows.
   inline int32 NumInputBlocks() { return reduced_linear_params_.NumCols(); }
   inline int32 NumOutputBlocks() { return reduced_linear_params_.NumRows(); }

   // This function converts from 'standard' form of the linear transform
   // (i.e. the form linear_params_ is in) to 'intermediate' (reordered) form,
   // which is a matrix of dimension
   //        NumInputBlocks()  by
   //        NumOutputBlocks() * OutputBlockDim() * InputBlockDim()
   // where the 3 factors above are displayed in order of greatest to least stride.
   // This is just a call to CopyCols(), done as its own function for documentation
   // and error checking.
   void ConvertToIntermediate(const CuMatrixBase<BaseFloat> &linear_params,
                              CuMatrixBase<BaseFloat> *intermediate_params);

   // This does the inverse transformation to ConvertToIntermediate();
   // see its documentation for details on the input and output formats.
   void ConvertToStandard(const CuMatrixBase<BaseFloat> &intermediate_params,
                          CuMatrixBase<BaseFloat> *linear_params);

   // TODO: a declaration beginning 'void DecomposeInterm' was left truncated
   // here (no complete name, parameter list or semicolon); it is kept only as
   // this comment until its intended signature is known.


   // Sets up the arrays to_standard_indexes_ and to_intermediate_indexes_.
   void CreateIndexes();

   // Used in ConvertToStandard(), set up by CreateIndexes();
   CuArray<int32> to_standard_indexes_;

   // Used in ConvertToIntermediate(), set up by CreateIndexes().
   CuArray<int32> to_intermediate_indexes_;


   // reduced_linear_params_ and block_params_ are the 'real' parameters
   // underlying linear_params_.

   // reduced_linear_params_ is of dimension NumOutputBlocks() by
   // NumInputBlocks(), i.e. rows by columns, as implied by those two
   // functions.  (This definition is circular, but it helps document the
   // meaning).
   // NOTE(review): this comment previously gave the dimension as
   // NumInputBlocks() by NumOutputBlocks(), the opposite of what the
   // accessors return -- confirm which was intended.
   CuMatrix<BaseFloat> reduced_linear_params_;

   // block_params_ is of dimension
   //    (OutputBlockDim() * InputBlockDim())  by  ParamsPerBlock().
   // It contains the mapping from compressed vector form of each block,
   // to full matrix form.
   // The OutputBlockDim() and InputBlockDim() factors are in order of larger
   // to smaller stride (i.e. the input blocks are on consecutive rows).
   CuMatrix<BaseFloat> block_params_;
 };


 } // namespace nnet3
 } // namespace kaldi


 #endif
kaldi::nnet3::kOutputContiguous
Definition: nnet-component-itf.h:77

kaldi
This code computes Goodness of Pronunciation (GOP) and extracts phone-level pronunciation feature for...
Definition: chain.dox:20

kaldi::nnet3::TimeHeightConvolutionComponent::PrecomputedIndexes
Definition: nnet-convolutional-component-temp.h:286

kaldi::CuVector
Definition: matrix-common.h:74

kaldi::nnet3::TimeHeightConvolutionComponent::Check
void Check() const
Definition: nnet-convolutional-component.cc:50

kaldi::nnet3::TimeHeightConvolutionComponent::Vectorize
virtual void Vectorize(VectorBase< BaseFloat > *params) const
Turns the parameters into vector form.
Definition: nnet-convolutional-component.cc:624

kaldi::nnet3::TdnnComponent::PrecomputedIndexes::row_stride
int32 row_stride
Definition: nnet-convolutional-component-temp.h:545

nnet-component-itf.h

nnet-common.h

kaldi::nnet3::TdnnComponent::OrthonormalConstraint
BaseFloat OrthonormalConstraint() const
Definition: nnet-convolutional-component-temp.h:560

kaldi::nnet3::Component
Abstract base-class for neural-net components.
Definition: nnet-component-itf.h:114

kaldi::nnet3::TdnnComponent::time_offsets_
std::vector< int32 > time_offsets_
Definition: nnet-convolutional-component-temp.h:599

kaldi::nnet3::IndexSet
An abstract representation of a set of Indexes.
Definition: nnet-computation-graph.h:322

kaldi::nnet3::TdnnComponent
TdnnComponent is a more memory-efficient alternative to manually splicing several frames of input and...
Definition: nnet-convolutional-component-temp.h:450

kaldi::nnet3::kUpdatableComponent
Definition: nnet-component-itf.h:42

kaldi::nnet3::TimeHeightConvolutionComponent::ScaleLinearParams
void ScaleLinearParams(BaseFloat alpha)
Definition: nnet-convolutional-component-temp.h:302

kaldi::nnet3::time_height_convolution::ConvolutionModel
This comment explains the basic framework used for everything related to time-height convolution...
Definition: convolution.h:125

kaldi::nnet3::TdnnComponent::Copy
virtual Component * Copy() const
Copies component (deep copy).
Definition: nnet-convolutional-component-temp.h:486

kaldi::nnet3::TimeHeightConvolutionComponent::PrecomputedIndexes::~PrecomputedIndexes
virtual ~PrecomputedIndexes()
Definition: nnet-convolutional-component-temp.h:297

kaldi::nnet3::time_height_convolution::CreateIndexes
static void CreateIndexes(const std::vector< std::pair< int32, int32 > > &n_x_pairs, int32 t_start, int32 t_step, int32 num_t_values, int32 reorder_t, std::vector< Index > *indexes)
Creates a vector of indexes with a regular structure, according to these specifications.
Definition: convolution.cc:1470

kaldi::nnet3::TimeHeightConvolutionComponent::PrecomputedIndexes::Type
virtual std::string Type() const
Definition: nnet-convolutional-component-temp.h:294

kaldi::int32
kaldi::int32 int32
Definition: online-tcp-source.cc:27

kaldi::nnet3::OnlineNaturalGradient
Keywords for search: natural gradient, naturalgradient, NG-SGD.
Definition: natural-gradient-online.h:414

kaldi::CuMatrix
This class represents a matrix that's stored on the GPU if we have one, and in memory if not...
Definition: matrix-common.h:71

kaldi::nnet3::TimeHeightConvolutionComponent::PrecomputedIndexes::PrecomputedIndexes
PrecomputedIndexes()
Definition: nnet-convolutional-component-temp.h:288

kaldi::nnet3::TimeHeightConvolutionComponent::FreezeNaturalGradient
virtual void FreezeNaturalGradient(bool freeze)
freezes/unfreezes NaturalGradient updates, if applicable (to be overridden by components that use Natu...
Definition: nnet-convolutional-component.cc:642

kaldi::nnet3::TimeHeightConvolutionComponent::GetInputIndexes
virtual void GetInputIndexes(const MiscComputationInfo &misc_info, const Index &output_index, std::vector< Index > *desired_indexes) const
This function only does something interesting for non-simple Components.
Definition: nnet-convolutional-component.cc:504

kaldi::nnet3::MiscComputationInfo
Definition: nnet-computation.h:55

kaldi::nnet3::TimeHeightConvolutionComponent::UnVectorize
virtual void UnVectorize(const VectorBase< BaseFloat > &params)
Converts the parameters from vector form.
Definition: nnet-convolutional-component.cc:633

kaldi::nnet3::TimeHeightConvolutionComponent::IsComputable
virtual bool IsComputable(const MiscComputationInfo &misc_info, const Index &output_index, const IndexSet &input_index_set, std::vector< Index > *used_inputs) const
This function only does something interesting for non-simple Components, and it exists to make it pos...
Definition: nnet-convolutional-component.cc:519

kaldi::nnet3::TimeHeightConvolutionComponent::linear_params_
CuMatrix< BaseFloat > linear_params_
Definition: nnet-convolutional-component-temp.h:346

kaldi::nnet3::BlockFactorizedTdnnComponent::block_params_
CuMatrix< BaseFloat > block_params_
Definition: nnet-convolutional-component-temp.h:791

kaldi::nnet3::BlockFactorizedTdnnComponent::BlockParams
CuMatrixBase< BaseFloat > & BlockParams()
Definition: nnet-convolutional-component-temp.h:733

kaldi::nnet3::TimeHeightConvolutionComponent::UpdateNaturalGradient
void UpdateNaturalGradient(const PrecomputedIndexes &indexes, const CuMatrixBase< BaseFloat > &in_value, const CuMatrixBase< BaseFloat > &out_deriv)
Definition: nnet-convolutional-component.cc:354

kaldi::nnet3::TdnnComponent::Type
virtual std::string Type() const
Returns a string such as "SigmoidComponent", describing the type of the object.
Definition: nnet-convolutional-component-temp.h:466

kaldi::nnet3::TdnnComponent::PrecomputedIndexes::PrecomputedIndexes
PrecomputedIndexes()
Definition: nnet-convolutional-component-temp.h:529

kaldi::nnet3::TimeHeightConvolutionComponent::InitFromConfig
virtual void InitFromConfig(ConfigLine *cfl)
Initialize, from a ConfigLine object.
Definition: nnet-convolutional-component.cc:114

kaldi::nnet3::TimeHeightConvolutionComponent::Propagate
virtual void * Propagate(const ComponentPrecomputedIndexes *indexes, const CuMatrixBase< BaseFloat > &in, CuMatrixBase< BaseFloat > *out) const
Propagate function.
Definition: nnet-convolutional-component.cc:282

kaldi::nnet3::Index
struct Index is intended to represent the various indexes by which we number the rows of the matrices...
Definition: nnet-common.h:44

kaldi::nnet3::TimeHeightConvolutionComponent::PrecomputeIndexes
virtual ComponentPrecomputedIndexes * PrecomputeIndexes(const MiscComputationInfo &misc_info, const std::vector< Index > &input_indexes, const std::vector< Index > &output_indexes, bool need_backprop) const
This function must return NULL for simple Components.
Definition: nnet-convolutional-component.cc:560

kaldi::nnet3::TimeHeightConvolutionComponent::preconditioner_out_
OnlineNaturalGradient preconditioner_out_
Definition: nnet-convolutional-component-temp.h:372

kaldi::nnet3::TdnnComponent::PrecomputedIndexes::Type
virtual std::string Type() const
Definition: nnet-convolutional-component-temp.h:535

kaldi::nnet3::TimeHeightConvolutionComponent::all_time_offsets_
std::vector< int32 > all_time_offsets_
Definition: nnet-convolutional-component-temp.h:334

kaldi::nnet3::TimeHeightConvolutionComponent::PrecomputedIndexes::Copy
virtual PrecomputedIndexes * Copy() const
Definition: nnet-convolutional-component.cc:648

convolution.h
This file contains some fairly low-level utilities for implementing convolutional neural networks and...

kaldi::nnet3::TdnnComponent::LinearParams
CuMatrixBase< BaseFloat > & LinearParams()
Definition: nnet-convolutional-component-temp.h:554

kaldi::nnet3::TimeHeightConvolutionComponent::Scale
virtual void Scale(BaseFloat scale)
This virtual function, when called on an UpdatableComponent, scales the parameters by "scale" when c...
Definition: nnet-convolutional-component.cc:581

kaldi::nnet3::TimeHeightConvolutionComponent::Read
virtual void Read(std::istream &is, bool binary)
Read function (used after we know the type of the Component); accepts input that is missing the token...
Definition: nnet-convolutional-component.cc:452

kaldi::nnet3::TimeHeightConvolutionComponent::TimeHeightConvolutionComponent
TimeHeightConvolutionComponent()
Definition: nnet-convolutional-component.cc:31

kaldi::nnet3::BlockFactorizedTdnnComponent::OutputBlockDim
int32 OutputBlockDim()
Definition: nnet-convolutional-component-temp.h:742

kaldi::nnet3::TdnnComponent::linear_params_
CuMatrix< BaseFloat > linear_params_
Definition: nnet-convolutional-component-temp.h:603

float

kaldi::nnet3::TdnnComponent::InputDim
virtual int32 InputDim() const
Returns input-dimension of this component.
Definition: nnet-convolutional-component-temp.h:459

kaldi::nnet3::TimeHeightConvolutionComponent::Add
virtual void Add(BaseFloat alpha, const Component &other)
This virtual function, when called by an UpdatableComponent, adds the parameters of another updatabl...
Definition: nnet-convolutional-component.cc:591

natural-gradient-online.h

kaldi::nnet3::TimeHeightConvolutionComponent::ComputeDerived
void ComputeDerived()
Definition: nnet-convolutional-component.cc:491

kaldi::nnet3::TdnnComponent::PrecomputedIndexes::PrecomputedIndexes
PrecomputedIndexes(const PrecomputedIndexes &other)
Definition: nnet-convolutional-component-temp.h:530

kaldi::nnet3::TimeHeightConvolutionComponent::PrecomputedIndexes::Write
virtual void Write(std::ostream &os, bool binary) const
Definition: nnet-convolutional-component.cc:652

kaldi::nnet3::TdnnComponent::Properties
virtual int32 Properties() const
Return bitmask of the component's properties.
Definition: nnet-convolutional-component-temp.h:467

kaldi::nnet3::TimeHeightConvolutionComponent::ReorderIndexes
virtual void ReorderIndexes(std::vector< Index > *input_indexes, std::vector< Index > *output_indexes) const
This function only does something interesting for non-simple Components.
Definition: nnet-convolutional-component.cc:408

kaldi::nnet3::TdnnComponent::BiasParams
CuVector< BaseFloat > & BiasParams()
Definition: nnet-convolutional-component-temp.h:558

kaldi::nnet3::BlockFactorizedTdnnComponent::NumInputBlocks
int32 NumInputBlocks()
Definition: nnet-convolutional-component-temp.h:743

kaldi::nnet3::TimeHeightConvolutionComponent::model_
time_height_convolution::ConvolutionModel model_
Definition: nnet-convolutional-component-temp.h:330

kaldi::nnet3::TimeHeightConvolutionComponent::Properties
virtual int32 Properties() const
Return bitmask of the component's properties.
Definition: nnet-convolutional-component-temp.h:227

kaldi::nnet3::TimeHeightConvolutionComponent::Backprop
virtual void Backprop(const std::string &debug_info, const ComponentPrecomputedIndexes *indexes, const CuMatrixBase< BaseFloat > &in_value, const CuMatrixBase< BaseFloat > &out_value, const CuMatrixBase< BaseFloat > &out_deriv, void *memo, Component *to_update, CuMatrixBase< BaseFloat > *in_deriv) const
Backprop function; depending on which of the arguments 'to_update' and 'in_deriv' are non-NULL...
Definition: nnet-convolutional-component.cc:301

kaldi::nnet3::TimeHeightConvolutionComponent::UpdateSimple
void UpdateSimple(const PrecomputedIndexes &indexes, const CuMatrixBase< BaseFloat > &in_value, const CuMatrixBase< BaseFloat > &out_deriv)
Definition: nnet-convolutional-component.cc:334

kaldi::nnet3::TimeHeightConvolutionComponent::InitUnit
void InitUnit()
Definition: nnet-convolutional-component.cc:88

kaldi::nnet3::TimeHeightConvolutionComponent::OutputDim
virtual int32 OutputDim() const
Returns output-dimension of this component.
Definition: nnet-convolutional-component.cc:61

kaldi::nnet3::TdnnComponent::PrecomputedIndexes
Definition: nnet-convolutional-component-temp.h:527

kaldi::nnet3::kBackpropNeedsInput
Definition: nnet-component-itf.h:65

kaldi::CuSubMatrix
This class is used for a piece of a CuMatrix.
Definition: matrix-common.h:70

kaldi::nnet3::kPropagateAdds
Definition: nnet-component-itf.h:53

kaldi::nnet3::TimeHeightConvolutionComponent::Copy
virtual Component * Copy() const
Copies component (deep copy).
Definition: nnet-convolutional-component-temp.h:245

kaldi::nnet3::BlockFactorizedTdnnComponent
BlockFactorizedTdnnComponent is a modified form of TdnnComponent (which inherits from TdnnComponent) ...
Definition: nnet-convolutional-component-temp.h:727

kaldi::nnet3::TimeHeightConvolutionComponent::DotProduct
virtual BaseFloat DotProduct(const UpdatableComponent &other) const
Computes dot-product between parameters of two instances of a Component.
Definition: nnet-convolutional-component.cc:610

kaldi::nnet3::TimeHeightConvolutionComponent::Write
virtual void Write(std::ostream &os, bool binary) const
Write component to stream.
Definition: nnet-convolutional-component.cc:424

kaldi::nnet3::TimeHeightConvolutionComponent::InputDim
virtual int32 InputDim() const
Returns input-dimension of this component.
Definition: nnet-convolutional-component.cc:57

kaldi::nnet3::kInputContiguous
Definition: nnet-component-itf.h:75

kaldi::nnet3::TimeHeightConvolutionComponent::PrecomputedIndexes::PrecomputedIndexes
PrecomputedIndexes(const PrecomputedIndexes &other)
Definition: nnet-convolutional-component-temp.h:289

kaldi::nnet3::UpdatableComponent
Class UpdatableComponent is a Component which has trainable parameters; it extends the interface of C...
Definition: nnet-component-itf.h:455

kaldi::nnet3::TdnnComponent::use_natural_gradient_
bool use_natural_gradient_
Definition: nnet-convolutional-component-temp.h:618

kaldi::nnet3::TdnnComponent::preconditioner_out_
OnlineNaturalGradient preconditioner_out_
Definition: nnet-convolutional-component-temp.h:628

kaldi::nnet3::TdnnComponent::PrecomputedIndexes::row_offsets
std::vector< int32 > row_offsets
Definition: nnet-convolutional-component-temp.h:551

kaldi::nnet3::time_height_convolution::ConvolutionComputationIo
Definition: convolution.h:380

kaldi::nnet3::TdnnComponent::OutputDim
virtual int32 OutputDim() const
Returns output-dimension of this component.
Definition: nnet-convolutional-component-temp.h:462

kaldi::nnet3::time_height_convolution::ConvolutionComputation
This struct represents the structure of a convolution computation.
Definition: convolution.h:252

kaldi::nnet3::kReordersIndexes
Definition: nnet-component-itf.h:58

kaldi::nnet3::BlockFactorizedTdnnComponent::NumOutputBlocks
int32 NumOutputBlocks()
Definition: nnet-convolutional-component-temp.h:744

kaldi::CuMatrixBase
Matrix for CUDA computing.
Definition: matrix-common.h:69

kaldi::nnet3::kBackpropAdds
Definition: nnet-component-itf.h:61

kaldi::nnet3::TdnnComponent::preconditioner_in_
OnlineNaturalGradient preconditioner_in_
Definition: nnet-convolutional-component-temp.h:624

kaldi::nnet3::ComponentPrecomputedIndexes
Definition: nnet-component-itf.h:97

kaldi::ConfigLine
This class is responsible for parsing input like hi-there xx=yyy a=b c empty= f-oo=Append(bar, sss) ba_z=123 bing='a b c' baz="a b c d='a b' e" and giving you access to the fields, in this case.
Definition: text-utils.h:205

kaldi::CuArray< int32 >

kaldi::nnet3::TimeHeightConvolutionComponent::PerturbParams
virtual void PerturbParams(BaseFloat stddev)
This function is to be used in testing.
Definition: nnet-convolutional-component.cc:600

kaldi::nnet3::TimeHeightConvolutionComponent::bias_params_
CuVector< BaseFloat > bias_params_
Definition: nnet-convolutional-component-temp.h:349

kaldi::nnet3::TimeHeightConvolutionComponent::PrecomputedIndexes::Read
virtual void Read(std::istream &os, bool binary)
Definition: nnet-convolutional-component.cc:660

kaldi::nnet3::TimeHeightConvolutionComponent::NumParameters
virtual int32 NumParameters() const
The following new virtual function returns the total dimension of the parameters in this class...
Definition: nnet-convolutional-component.cc:619

kaldi::nnet3::BlockFactorizedTdnnComponent::InputBlockDim
int32 InputBlockDim()
Definition: nnet-convolutional-component-temp.h:737

kaldi::nnet3::BlockFactorizedTdnnComponent::ParamsPerBlock
int32 ParamsPerBlock()
Definition: nnet-convolutional-component-temp.h:739

kaldi::nnet3::TimeHeightConvolutionComponent::ConsolidateMemory
void ConsolidateMemory()
This virtual function relates to memory management, and avoiding fragmentation.
Definition: nnet-convolutional-component.cc:669

kaldi::nnet3::BlockFactorizedTdnnComponent::ReducedLinearParams
CuMatrixBase< BaseFloat > & ReducedLinearParams()
Definition: nnet-convolutional-component-temp.h:732

kaldi::nnet3::BlockFactorizedTdnnComponent::to_standard_indexes_
CuArray< int32 > to_standard_indexes_
Definition: nnet-convolutional-component-temp.h:771

kaldi::nnet3::BlockFactorizedTdnnComponent::to_intermediate_indexes_
CuArray< int32 > to_intermediate_indexes_
Definition: nnet-convolutional-component-temp.h:774

kaldi::VectorBase
Provides a vector abstraction class.
Definition: kaldi-vector.h:41

kaldi::nnet3::TimeHeightConvolutionComponent::use_natural_gradient_
bool use_natural_gradient_
Definition: nnet-convolutional-component-temp.h:362

kaldi::nnet3::TimeHeightConvolutionComponent::preconditioner_in_
OnlineNaturalGradient preconditioner_in_
Definition: nnet-convolutional-component-temp.h:368

kaldi::nnet3::TimeHeightConvolutionComponent::time_offset_required_
std::vector< bool > time_offset_required_
Definition: nnet-convolutional-component-temp.h:338

kaldi::nnet3::TdnnComponent::PrecomputedIndexes::~PrecomputedIndexes
virtual ~PrecomputedIndexes()
Definition: nnet-convolutional-component-temp.h:538

kaldi::nnet3::TimeHeightConvolutionComponent
TimeHeightConvolutionComponent implements 2-dimensional convolution where one of the dimensions of co...
Definition: nnet-convolutional-component-temp.h:212

kaldi::nnet3::TimeHeightConvolutionComponent::max_memory_mb_
BaseFloat max_memory_mb_
Definition: nnet-convolutional-component-temp.h:356

kaldi::nnet3::TimeHeightConvolutionComponent::Type
virtual std::string Type() const
Returns a string such as "SigmoidComponent", describing the type of the object.
Definition: nnet-convolutional-component-temp.h:226

kaldi::nnet3::TimeHeightConvolutionComponent::Info
virtual std::string Info() const
Returns some text-form information about this component, for diagnostics.
Definition: nnet-convolutional-component.cc:65

kaldi::nnet3::TdnnComponent::bias_params_
CuVector< BaseFloat > bias_params_
Definition: nnet-convolutional-component-temp.h:607

kaldi::nnet3::BlockFactorizedTdnnComponent::reduced_linear_params_
CuMatrix< BaseFloat > reduced_linear_params_
Definition: nnet-convolutional-component-temp.h:783

kaldi::nnet3::TdnnComponent::orthonormal_constraint_
BaseFloat orthonormal_constraint_
Definition: nnet-convolutional-component-temp.h:613

kaldi::nnet3::TimeHeightConvolutionComponent::PrecomputedIndexes::computation
time_height_convolution::ConvolutionComputation computation
Definition: nnet-convolutional-component-temp.h:299