doc/nnet-general-component_8cc_source.html

 // nnet3/nnet-general-component.cc

 // Copyright      2015  Johns Hopkins University (author: Daniel Povey)

 // See ../../COPYING for clarification regarding multiple authors
 //
 // Licensed under the Apache License, Version 2.0 (the "License");
 // you may not use this file except in compliance with the License.
 // You may obtain a copy of the License at
 //
 //  http://www.apache.org/licenses/LICENSE-2.0
 //
 // THIS CODE IS PROVIDED *AS IS* BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY
 // KIND, EITHER EXPRESS OR IMPLIED, INCLUDING WITHOUT LIMITATION ANY IMPLIED
 // WARRANTIES OR CONDITIONS OF TITLE, FITNESS FOR A PARTICULAR PURPOSE,
 // MERCHANTABLITY OR NON-INFRINGEMENT.
 // See the Apache 2 License for the specific language governing permissions and
 // limitations under the License.

 #include <iterator>
 #include <sstream>
 #include <iomanip>
 #include "nnet3/nnet-general-component.h"
 #include "nnet3/nnet-computation-graph.h"
 #include "nnet3/nnet-parse.h"

 namespace kaldi {
 namespace nnet3 {

 // used in I/O
 static void CopyPairVector(const CuArray<Int32Pair> &in,
                         std::vector<std::pair<int32, int32> > *out) {
   in.CopyToVec(reinterpret_cast<std::vector<Int32Pair>*>(out));
 }
 // used in I/O
 static void CopyPairVector(const std::vector<std::pair<int32, int32> > &in,
                         CuArray<Int32Pair> *out) {
   const std::vector<Int32Pair> *in_cast =
       reinterpret_cast<const std::vector<Int32Pair>*>(&in);
   out->CopyFromVec(*in_cast);
 }


 //inline
 void DistributeComponent::ComputeInputIndexAndBlock(const Index &output_index,
                                                     Index *input_index,
                                                     int32 *block) const {
   int32 num_blocks = input_dim_ / output_dim_;
   *input_index = output_index;
   int32 output_x = output_index.x, input_x;
   if (output_x >= 0) {
     input_x = output_x / num_blocks;
   } else {
     input_x = (output_x - num_blocks + 1) / num_blocks;
   }
   input_index->x = input_x;
   if (block)
     *block = output_x - (input_x * num_blocks);
 }

 //virtual
 void DistributeComponent::GetInputIndexes(
     const MiscComputationInfo &misc_info,
     const Index &output_index,
     std::vector<Index> *desired_indexes) const {
   desired_indexes->resize(1);
   ComputeInputIndexAndBlock(output_index, &((*desired_indexes)[0]), NULL);
 }

 //virtual
 bool DistributeComponent::IsComputable(
     const MiscComputationInfo &misc_info,
     const Index &output_index,
     const IndexSet &input_index_set,
     std::vector<Index> *used_inputs) const {
   Index input_index;
   ComputeInputIndexAndBlock(output_index, &input_index, NULL);
   if (!input_index_set(input_index))
     return false;
   if (used_inputs) {
     used_inputs->clear();
     used_inputs->push_back(input_index);
   }
   return true;
 }

 // Serializes this object to 'ostream' (binary or text according to 'binary'):
 // an opening class token, the "<Pairs>" token followed by the 'pairs' vector,
 // and a closing class token.  Read() expects the same sequence.
 void DistributeComponentPrecomputedIndexes::Write(std::ostream &ostream, bool binary) const {
   WriteToken(ostream, binary, "<DistributeComponentPrecomputedIndexes>");
   WriteToken(ostream, binary, "<Pairs>");
   WriteIntegerPairVector(ostream, binary, pairs);
   WriteToken(ostream, binary, "</DistributeComponentPrecomputedIndexes>");
 }

 // Deserializes this object from 'istream', mirroring Write(): reads the
 // 'pairs' vector and then requires the closing class token.
 void DistributeComponentPrecomputedIndexes::Read(std::istream &istream, bool binary) {
   // NOTE(review): presumably tolerates the opening class token having already
   // been consumed by the caller -- confirm against ExpectOneOrTwoTokens().
   ExpectOneOrTwoTokens(istream, binary, "<DistributeComponentPrecomputedIndexes>", "<Pairs>");
   ReadIntegerPairVector(istream, binary, &pairs);
   ExpectToken(istream, binary, "</DistributeComponentPrecomputedIndexes>");
 }

 // virtual
 // Builds, for every output Index, the pair (input row, column offset) telling
 // where its data starts inside the input matrix.
 //   input_indexes:  Indexes of the input rows, in row order.
 //   output_indexes: Indexes of the output rows, in row order.
 // Returns a newly allocated DistributeComponentPrecomputedIndexes whose
 // 'pairs' member has one entry per output index.  Raises an error via
 // KALDI_ERR if an output index needs an input index that is not present.
 // The two unnamed parameters (misc_info, need_backprop) are unused.
 ComponentPrecomputedIndexes* DistributeComponent::PrecomputeIndexes(
     const MiscComputationInfo &, // misc_info
     const std::vector<Index> &input_indexes,
     const std::vector<Index> &output_indexes,
     bool) const {  // the bool is 'need_backprop'- unused.
   const int32 num_input_indexes = input_indexes.size(),
       num_output_indexes = output_indexes.size();

   // Maps each input Index to its row number in the input matrix.
   unordered_map<Index, int32, IndexHasher> index_to_input_row;
   for (int32 i = 0; i < num_input_indexes; i++)
     index_to_input_row[input_indexes[i]] = i;

   const int32 num_blocks = input_dim_ / output_dim_,
       block_size = input_dim_ / num_blocks;

   // Fill a local vector first and allocate the result object only once the
   // loop has succeeded, so that nothing is leaked if KALDI_ERR throws.
   std::vector<std::pair<int32, int32> > pairs(num_output_indexes);
   for (int32 i = 0; i < num_output_indexes; i++) {
     Index input_index;
     int32 block_index;
     ComputeInputIndexAndBlock(output_indexes[i], &input_index, &block_index);
     unordered_map<Index, int32, IndexHasher>::iterator iter =
         index_to_input_row.find(input_index);
     if (iter == index_to_input_row.end())
       KALDI_ERR << "Input index not found (code error)";
     // .first is the input row, .second the column where the block starts.
     pairs[i] = std::pair<int32, int32>(iter->second,
                                        block_index * block_size);
   }

   DistributeComponentPrecomputedIndexes *ans = new
       DistributeComponentPrecomputedIndexes;
   ans->pairs.swap(pairs);
   return ans;
 }


 void DistributeComponent::ComputeInputPointers(
     const ComponentPrecomputedIndexes *indexes_in,
     const CuMatrixBase<BaseFloat> &in,
     int32 num_output_rows,
     std::vector<const BaseFloat*> *input_pointers) const {
   const DistributeComponentPrecomputedIndexes *indexes =
       dynamic_cast<const DistributeComponentPrecomputedIndexes*>(indexes_in);
   KALDI_ASSERT(indexes != NULL && "Invalid pointer type");
   KALDI_ASSERT(num_output_rows == static_cast<int32>(indexes->pairs.size()));
   input_pointers->resize(num_output_rows);

   const BaseFloat *input_data = in.Data();
   int32 input_stride = in.Stride();
   const BaseFloat **input_pointers_data = &((*input_pointers)[0]);
   const std::pair<int32, int32> *pairs_data = &(indexes->pairs[0]);
   for (int32 i = 0; i < num_output_rows; i++) {
     input_pointers_data[i] = input_data +
         pairs_data[i].first * input_stride +
         pairs_data[i].second;
   }
 }

 void DistributeComponent::ComputeInputPointers(
     const ComponentPrecomputedIndexes *indexes_in,
     int32 num_output_rows,
     CuMatrixBase<BaseFloat> *in,
     std::vector<BaseFloat*> *input_pointers) const {
   const DistributeComponentPrecomputedIndexes *indexes =
       dynamic_cast<const DistributeComponentPrecomputedIndexes*>(indexes_in);
   KALDI_ASSERT(indexes != NULL && "Invalid pointer type");
   KALDI_ASSERT(num_output_rows == static_cast<int32>(indexes->pairs.size()));
   input_pointers->resize(num_output_rows);

   BaseFloat *input_data = in->Data();
   int32 input_stride = in->Stride();
   BaseFloat **input_pointers_data = &((*input_pointers)[0]);
   const std::pair<int32, int32> *pairs_data = &(indexes->pairs[0]);
   for (int32 i = 0; i < num_output_rows; i++) {
     input_pointers_data[i] = input_data +
         pairs_data[i].first * input_stride +
         pairs_data[i].second;
   }
 }


 // virtual
 void* DistributeComponent::Propagate(const ComponentPrecomputedIndexes *indexes,
                                     const CuMatrixBase<BaseFloat> &in,
                                     CuMatrixBase<BaseFloat> *out) const {
   KALDI_ASSERT(indexes != NULL &&
                in.NumCols() == input_dim_ && out->NumCols() == output_dim_);
   int32 num_output_rows = out->NumRows();
   std::vector<const BaseFloat*> input_pointers;
   ComputeInputPointers(indexes, in, num_output_rows, &input_pointers);
   CuArray<const BaseFloat*> input_pointers_cuda(input_pointers);
   out->CopyRows(input_pointers_cuda);
   return NULL;
 }

 // virtual
 void DistributeComponent::Backprop(const std::string &debug_info,
                                    const ComponentPrecomputedIndexes *indexes,
                                    const CuMatrixBase<BaseFloat> &, // in_value,
                                    const CuMatrixBase<BaseFloat> &, // out_value
                                    const CuMatrixBase<BaseFloat> &out_deriv,
                                    void *memo,
                                    Component *, // to_update,
                                    CuMatrixBase<BaseFloat> *in_deriv) const {
   NVTX_RANGE("DistributeComponent::Backprop");
   if (in_deriv == NULL) return;

   int32 num_blocks = input_dim_ / output_dim_,
       num_output_rows = out_deriv.NumRows();
   if (num_output_rows != in_deriv->NumRows() * num_blocks) {
     // there could be some 'gaps', i.e. some input values that are not ever
     // referred to.  So we need to zero the input.  This would't happen in the
     // setups I plan to use this for.
     in_deriv->SetZero();
   }

   std::vector<BaseFloat*> input_pointers;
   ComputeInputPointers(indexes, num_output_rows, in_deriv, &input_pointers);
   CuArray<BaseFloat*> input_pointers_cuda(input_pointers);
   out_deriv.CopyToRows(input_pointers_cuda);
 }


 // Sets the input and output dimensions of the component.
 //   input_dim:  must be positive and a multiple of 'output_dim'.
 //   output_dim: must be positive.
 // The members are assigned first and the constraints asserted afterwards.
 void DistributeComponent::Init(int32 input_dim, int32 output_dim) {
   input_dim_ = input_dim;
   output_dim_ = output_dim;
   // input_dim / output_dim is the number of blocks per input row, so it has
   // to divide exactly.
   KALDI_ASSERT(input_dim > 0 && output_dim > 0 && input_dim % output_dim == 0);
 }

 // virtual
 // Initializes the component from a config line.  Both "input-dim" and
 // "output-dim" are required and no other values may be present; otherwise an
 // error is raised via KALDI_ERR.  On success the dimensions are passed to
 // Init(), which validates them.
 void DistributeComponent::InitFromConfig(ConfigLine *cfl) {
   int32 input_dim, output_dim;
   const bool have_both_dims = cfl->GetValue("input-dim", &input_dim) &&
       cfl->GetValue("output-dim", &output_dim);
   // Unused values are only checked for once both dimensions were found.
   const bool line_is_valid = have_both_dims && !cfl->HasUnusedValues();
   if (line_is_valid) {
     Init(input_dim, output_dim);
   } else {
     KALDI_ERR << "Invalid initializer for layer of type "
               << Type() << ": \"" << cfl->WholeLine() << "\"";
   }
 }

 // Serializes the component to 'os' (binary or text according to 'binary'):
 // opening token, "<InputDim>" + input_dim_, "<OutputDim>" + output_dim_,
 // closing token.  Read() expects the same sequence.
 void DistributeComponent::Write(std::ostream &os, bool binary) const {
   WriteToken(os, binary, "<DistributeComponent>");
   WriteToken(os, binary, "<InputDim>");
   WriteBasicType(os, binary, input_dim_);
   WriteToken(os, binary, "<OutputDim>");
   WriteBasicType(os, binary, output_dim_);
   WriteToken(os, binary, "</DistributeComponent>");
 }

 void DistributeComponent::Read(std::istream &is, bool binary) {
   ExpectOneOrTwoTokens(is, binary, "<DistributeComponent>", "<InputDim>");
   ReadBasicType(is, binary, &input_dim_);
   ExpectToken(is, binary, "<OutputDim>");
   ReadBasicType(is, binary, &output_dim_);
   ExpectToken(is, binary, "</DistributeComponent>");
 }


 void StatisticsExtractionComponentPrecomputedIndexes::Write(std::ostream &os, bool binary) const {
   WriteToken(os, binary, "<StatisticsExtractionComponentPrecomputedIndexes>");
   WriteToken(os, binary, "<ForwardIndexes>");
   std::vector<std::pair<int32, int32> > pairs_cpu;
   CopyPairVector(forward_indexes, &pairs_cpu);
   WriteIntegerPairVector(os, binary, pairs_cpu);
   WriteToken(os, binary, "<Counts>");
   counts.Write(os, binary);
   WriteToken(os, binary, "<BackwardIndexes>");
   std::vector<int32> backward_indexes_cpu;
   backward_indexes.CopyToVec(&backward_indexes_cpu);
   WriteIntegerVector(os, binary, backward_indexes_cpu);
   WriteToken(os, binary, "</StatisticsExtractionComponentPrecomputedIndexes>");
 }

 void StatisticsExtractionComponentPrecomputedIndexes::Read(std::istream &is, bool binary) {
   ExpectOneOrTwoTokens(is, binary,
                        "<StatisticsExtractionComponentPrecomputedIndexes>",
                        "<ForwardIndexes>");
   std::vector<std::pair<int32, int32> > pairs_cpu;
   ReadIntegerPairVector(is, binary, &pairs_cpu);
   CopyPairVector(pairs_cpu, &forward_indexes);
   ExpectToken(is, binary, "<Counts>");
   counts.Read(is, binary);
   ExpectToken(is, binary, "<BackwardIndexes>");
   std::vector<int32> backward_indexes_cpu;
   ReadIntegerVector(is, binary, &backward_indexes_cpu);
   backward_indexes.CopyFromVec(backward_indexes_cpu);
   ExpectToken(is, binary, "</StatisticsExtractionComponentPrecomputedIndexes>");
 }

 // Precomputes the row mappings used by Propagate() and Backprop().
 //   input_indexes / output_indexes: Indexes of the input and output rows;
 //       both are assumed to be sorted first on n and x, then on t.
 //   need_backprop: if true, the backward mapping is stored as well.
 // For output row i, forward_indexes[i] is the half-open range [begin, end)
 // of input rows summed into it and counts(i) is the size of that range; for
 // input row j, backward_indexes[j] is the single output row it feeds.
 // Asserts that each output row has at least one input, that each input row
 // feeds exactly one output row, and that every range is contiguous.
 // Returns a newly allocated object.  'misc_info' is not used.
 ComponentPrecomputedIndexes*
 StatisticsExtractionComponent::PrecomputeIndexes(
     const MiscComputationInfo &misc_info,
     const std::vector<Index> &input_indexes,
     const std::vector<Index> &output_indexes,
     bool need_backprop) const {
   const int32 num_input_indexes = input_indexes.size(),
       num_output_indexes = output_indexes.size();
   StatisticsExtractionComponentPrecomputedIndexes *ans = new
       StatisticsExtractionComponentPrecomputedIndexes();

   // (-1, -1) marks an output row for which no input has been seen yet.
   Int32Pair invalid_pair;
   invalid_pair.first = -1;
   invalid_pair.second = -1;
   std::vector<Int32Pair> forward_indexes_cpu(num_output_indexes,
                                              invalid_pair);
   std::vector<int32> backward_indexes_cpu(num_input_indexes, -1);
   Vector<BaseFloat> counts_cpu(num_output_indexes);

   // Position of every input Index within 'input_indexes'.
   unordered_map<Index, int32, IndexHasher> position_of_input;
   for (int32 pos = 0; pos < num_input_indexes; pos++)
     position_of_input[input_indexes[pos]] = pos;

   for (int32 i = 0; i < num_output_indexes; i++) {
     const Index &output_index = output_indexes[i];
     const int32 out_t = output_index.t;
     // Round out_t down to a multiple of output_period_.  Integer division
     // truncates toward zero, so a negative out_t needs the correction below.
     int32 window_begin = output_period_ * (out_t / output_period_);
     if (window_begin > out_t)
       window_begin -= output_period_;
     const int32 window_end = window_begin + output_period_;

     Index input_index(output_index);
     for (int32 in_t = window_begin; in_t < window_end; in_t += input_period_) {
       input_index.t = in_t;
       unordered_map<Index, int32, IndexHasher>::iterator found =
           position_of_input.find(input_index);
       if (found == position_of_input.end())
         continue;  // this frame is not available at the input.
       const int32 input_pos = found->second;
       if (forward_indexes_cpu[i].first == -1) {
         // first input row contributing to this output row.
         forward_indexes_cpu[i].first = input_pos;
         forward_indexes_cpu[i].second = input_pos + 1;
         counts_cpu(i) = 1.0;
       } else {
         // the following might fail, for instance, if the sorting
         // of the input or output indexes was not as expected.
         KALDI_ASSERT(forward_indexes_cpu[i].second == input_pos);
         forward_indexes_cpu[i].second++;
         counts_cpu(i) += 1.0;
       }
       KALDI_ASSERT(backward_indexes_cpu[input_pos] == -1);
       backward_indexes_cpu[input_pos] = i;
     }
     KALDI_ASSERT(counts_cpu(i) != 0.0);
   }
   // every input row must have been assigned to some output row.
   for (int32 i = 0; i < num_input_indexes; i++) {
     KALDI_ASSERT(backward_indexes_cpu[i] != -1);
   }

   ans->forward_indexes = forward_indexes_cpu;
   ans->counts = counts_cpu;
   if (need_backprop)
     ans->backward_indexes = backward_indexes_cpu;
   return ans;
 }

 // Default constructor.  input_dim_ starts at -1, which Check() rejects, so
 // the object must be configured (InitFromConfig() or Read()) before use; the
 // periods default to 1 and variance stats are included by default.
 StatisticsExtractionComponent::StatisticsExtractionComponent():
     input_dim_(-1), input_period_(1), output_period_(1),
     include_variance_(true) { }

 // Copy constructor: copies all four configuration members from 'other' and
 // then runs Check(), so copying an unconfigured component raises an error.
 StatisticsExtractionComponent::StatisticsExtractionComponent(
     const StatisticsExtractionComponent &other):
     input_dim_(other.input_dim_),
     input_period_(other.input_period_),
     output_period_(other.output_period_),
     include_variance_(other.include_variance_) {
   Check();
 }

 // Initializes the component from a config line.  "input-dim" is required;
 // "input-period", "output-period" and "include-variance" are optional and
 // keep their current values when absent.  Raises an error via KALDI_ERR if
 // the line has unrecognized values, if input-dim is missing or non-positive,
 // if either period is non-positive, or if output-period is not a multiple of
 // input-period.  Ends by calling Check().
 void StatisticsExtractionComponent::InitFromConfig(ConfigLine *cfl) {
   const bool have_input_dim = cfl->GetValue("input-dim", &input_dim_);
   // optional values.
   cfl->GetValue("input-period", &input_period_);
   cfl->GetValue("output-period", &output_period_);
   cfl->GetValue("include-variance", &include_variance_);

   if (cfl->HasUnusedValues()) {
     KALDI_ERR << "Could not process these elements in initializer: "
               << cfl->UnusedValues();
   }

   // The modulus is only evaluated once input_period_ is known to be positive.
   const bool values_ok = have_input_dim && input_dim_ > 0 &&
       input_period_ > 0 && output_period_ > 0 &&
       (output_period_ % input_period_ == 0);
   if (!values_ok) {
     KALDI_ERR << "Invalid initializer for layer of type "
               << Type() << ": \"" << cfl->WholeLine() << "\"";
   }
   Check();
 }

 // Validates the configuration: input_dim_ and both periods must be positive
 // and output_period_ must be a multiple of input_period_.  Raises an error
 // via KALDI_ERR otherwise.
 void StatisticsExtractionComponent::Check() const {
   const bool dim_ok = (input_dim_ > 0);
   // the modulus is only evaluated when input_period_ is positive.
   const bool periods_ok = (input_period_ > 0 && output_period_ > 0 &&
                            (output_period_ % input_period_) == 0);
   if (dim_ok && periods_ok)
     return;
   KALDI_ERR << "Invalid configuration of StatisticsExtractionComponent";
 }

 void StatisticsExtractionComponent::ReorderIndexes(
     std::vector<Index> *input_indexes,
     std::vector<Index> *output_indexes) const {
     std::sort(input_indexes->begin(), input_indexes->end(),
               IndexLessNxt());
     std::sort(output_indexes->begin(), output_indexes->end(),
               IndexLessNxt());
 }

 bool StatisticsExtractionComponent::IsComputable(
     const MiscComputationInfo &misc_info,
     const Index &output_index,
     const IndexSet &input_index_set,
     std::vector<Index> *used_inputs) const {
   Index input_index(output_index);
   int32 t = output_index.t,
       t_start = output_period_ * (t / output_period_);
   if (t_start > t)                // could happen for negative t_start due to
     t_start -= output_period_;    // the way modulus works in C.
   int32 t_end = t_start + output_period_;
   if (!used_inputs) {
     for (int32 t = t_start; t < t_end; t += input_period_) {
       input_index.t = t;
       if (input_index_set(input_index))
         return true;
     }
     return false;
   } else {
     used_inputs->clear();
     bool ans = false;
     for (int32 t = t_start; t < t_end; t += input_period_) {
       input_index.t = t;
       if (input_index_set(input_index)) {
         ans = true;
         used_inputs->push_back(input_index);
       }
     }
     return ans;
   }
 }

 void StatisticsExtractionComponent::GetInputIndexes(
     const MiscComputationInfo &misc_info,
     const Index &output_index,
     std::vector<Index> *desired_indexes) const {
   desired_indexes->clear();
   Index input_index(output_index);
   int32 t = output_index.t,
       t_start = output_period_ * (t / output_period_);
   if (t_start > t)                // could happen for negative t due to
     t_start -= output_period_;    // the way modulus works in C
   int32 t_end = t_start + output_period_;
   for (int32 t = t_start; t < t_end; t += input_period_) {
     input_index.t = t;
     desired_indexes->push_back(input_index);
   }
 }


 void* StatisticsExtractionComponent::Propagate(
     const ComponentPrecomputedIndexes *indexes_in,
     const CuMatrixBase<BaseFloat> &in,
     CuMatrixBase<BaseFloat> *out) const {
   KALDI_ASSERT(indexes_in != NULL);
   const StatisticsExtractionComponentPrecomputedIndexes *indexes =
      dynamic_cast<const StatisticsExtractionComponentPrecomputedIndexes*>(
          indexes_in);
   int32 num_rows_out = out->NumRows();
   KALDI_ASSERT(indexes != NULL &&
                indexes->forward_indexes.Dim() == num_rows_out &&
                in.NumCols() == input_dim_ &&
                out->NumCols() == OutputDim());
   out->SetZero();
   // store the counts.
   out->CopyColFromVec(indexes->counts, 0);
   // store the mean stats
   out->ColRange(1, input_dim_).AddRowRanges(in, indexes->forward_indexes);
   if (include_variance_) {
     // store the variance (sum-squared) stats.
     CuMatrix<BaseFloat> in_squared(in);
     in_squared.ApplyPow(2.0);
     out->ColRange(input_dim_ + 1,
                   input_dim_).AddRowRanges(in_squared,
                                            indexes->forward_indexes);
   }
   return NULL;
 }

 // Backward pass for the statistics extraction.
 //   indexes_in: must be a StatisticsExtractionComponentPrecomputedIndexes
 //               (asserted); its backward_indexes give, for each input row,
 //               the output row that it contributed to.
 //   in_value:   the input of the forward pass (needed for the variance
 //               term).
 //   out_deriv:  derivative w.r.t. the output; column 0 (the counts) is not
 //               used, columns [1, 1 + input_dim_) are the derivatives of the
 //               sum stats and, if include_variance_, the following
 //               input_dim_ columns are those of the sum-of-squares stats.
 //   in_deriv:   receives the derivative w.r.t. the input; if NULL nothing is
 //               computed (as in DistributeComponent::Backprop).
 // 'debug_info', 'memo' and the unnamed parameters are not used.
 void StatisticsExtractionComponent::Backprop(
     const std::string &debug_info,
     const ComponentPrecomputedIndexes *indexes_in,
     const CuMatrixBase<BaseFloat> &in_value,
     const CuMatrixBase<BaseFloat> &, // out_value,
     const CuMatrixBase<BaseFloat> &out_deriv,
     void *memo,
     Component *, // to_update,
     CuMatrixBase<BaseFloat> *in_deriv) const {
   NVTX_RANGE("StatisticsExtractionComponent::Backprop");
   KALDI_ASSERT(indexes_in != NULL);
   const StatisticsExtractionComponentPrecomputedIndexes *indexes =
       dynamic_cast<const StatisticsExtractionComponentPrecomputedIndexes*>(indexes_in);
   // The cast yields NULL if the wrong kind of indexes object was supplied;
   // fail with a clear message rather than dereferencing a null pointer.
   KALDI_ASSERT(indexes != NULL && "Invalid pointer type");
   if (in_deriv == NULL)
     return;  // no input derivative requested.

   // d(sum)/d(x) = 1: each input row receives the derivative of the output
   // row it was summed into.
   in_deriv->SetZero();
   in_deriv->AddRows(1.0, out_deriv.ColRange(1, input_dim_),
                     indexes->backward_indexes);
   if (include_variance_) {
     // d(sum of x^2)/d(x) = 2 x: gather the sum-of-squares derivative for
     // each input row, then add 2 * (that derivative) .* in_value.
     CuMatrix<BaseFloat> variance_deriv(in_value.NumRows(),
                                        in_value.NumCols(),
                                        kUndefined);
     variance_deriv.CopyRows(out_deriv.ColRange(1 + input_dim_, input_dim_),
                             indexes->backward_indexes);
     in_deriv->AddMatMatElements(2.0, variance_deriv, in_value, 1.0);
   }
 }

 // Deserializes the component from 'is', mirroring Write(): input_dim_,
 // input_period_, output_period_ and include_variance_, each preceded by its
 // token, then the closing token.  Finishes by validating with Check().
 void StatisticsExtractionComponent::Read(std::istream &is, bool binary) {
   ExpectOneOrTwoTokens(is, binary, "<StatisticsExtractionComponent>",
                        "<InputDim>");
   ReadBasicType(is, binary, &input_dim_);
   ExpectToken(is, binary, "<InputPeriod>");
   ReadBasicType(is, binary, &input_period_);
   ExpectToken(is, binary, "<OutputPeriod>");
   ReadBasicType(is, binary, &output_period_);
   // The token really is spelled "IncludeVarinance"; it must match what
   // Write() emits, so do not "correct" it here.
   ExpectToken(is, binary, "<IncludeVarinance>");
   ReadBasicType(is, binary, &include_variance_);
   ExpectToken(is, binary, "</StatisticsExtractionComponent>");
   Check();
 }

 // Serializes the component to 'os' (binary or text according to 'binary'):
 // input_dim_, input_period_, output_period_ and include_variance_, each
 // preceded by its token and all enclosed in the opening and closing tokens.
 void StatisticsExtractionComponent::Write(std::ostream &os, bool binary) const {
   WriteToken(os, binary, "<StatisticsExtractionComponent>");
   WriteToken(os, binary, "<InputDim>");
   WriteBasicType(os, binary, input_dim_);
   WriteToken(os, binary, "<InputPeriod>");
   WriteBasicType(os, binary, input_period_);
   WriteToken(os, binary, "<OutputPeriod>");
   WriteBasicType(os, binary, output_period_);
   // The token really is spelled "IncludeVarinance"; Read() expects exactly
   // this spelling, so changing it would break reading of existing files.
   WriteToken(os, binary, "<IncludeVarinance>");
   WriteBasicType(os, binary, include_variance_);
   WriteToken(os, binary, "</StatisticsExtractionComponent>");
 }

 // Serializes this object to 'os': the forward index pairs followed by the
 // backward index pairs, each preceded by its token and all enclosed in the
 // class's opening and closing tokens.  A single host-side buffer is reused
 // for both arrays.
 void StatisticsPoolingComponentPrecomputedIndexes::Write(std::ostream &os, bool binary) const {
   std::vector<std::pair<int32, int32> > host_buffer;

   WriteToken(os, binary, "<StatisticsPoolingComponentPrecomputedIndexes>");

   WriteToken(os, binary, "<ForwardIndexes>");
   CopyPairVector(forward_indexes, &host_buffer);
   WriteIntegerPairVector(os, binary, host_buffer);

   WriteToken(os, binary, "<BackwardIndexes>");
   CopyPairVector(backward_indexes, &host_buffer);
   WriteIntegerPairVector(os, binary, host_buffer);

   WriteToken(os, binary, "</StatisticsPoolingComponentPrecomputedIndexes>");
 }

 // Deserializes this object from 'is', mirroring Write(): forward index
 // pairs, then backward index pairs, then the closing token.  A single
 // host-side buffer is reused for both arrays.
 void StatisticsPoolingComponentPrecomputedIndexes::Read(std::istream &is, bool binary) {
   std::vector<std::pair<int32, int32> > host_buffer;

   ExpectOneOrTwoTokens(is, binary,
                        "<StatisticsPoolingComponentPrecomputedIndexes>",
                        "<ForwardIndexes>");
   ReadIntegerPairVector(is, binary, &host_buffer);
   CopyPairVector(host_buffer, &forward_indexes);

   ExpectToken(is, binary, "<BackwardIndexes>");
   ReadIntegerPairVector(is, binary, &host_buffer);
   CopyPairVector(host_buffer, &backward_indexes);

   ExpectToken(is, binary, "</StatisticsPoolingComponentPrecomputedIndexes>");
 }

 // Initializes the component from a config line.  "input-dim" is required;
 // "input-period", "left-context", "right-context", "num-log-count-features",
 // "output-stddevs" and "variance-floor" are optional and keep their current
 // values when absent.  Raises an error via KALDI_ERR for unrecognized values
 // or when the basic sanity checks below fail; Check() then performs the
 // complete validation.
 void StatisticsPoolingComponent::InitFromConfig(ConfigLine *cfl) {
   const bool have_input_dim = cfl->GetValue("input-dim", &input_dim_);
   // optional values.
   cfl->GetValue("input-period", &input_period_);
   cfl->GetValue("left-context", &left_context_);
   cfl->GetValue("right-context", &right_context_);
   cfl->GetValue("num-log-count-features", &num_log_count_features_);
   cfl->GetValue("output-stddevs", &output_stddevs_);
   cfl->GetValue("variance-floor", &variance_floor_);

   if (cfl->HasUnusedValues()) {
     KALDI_ERR << "Could not process these elements in initializer: "
               << cfl->UnusedValues();
   }

   // Only basic checks here; Check() is more thorough.
   const bool basics_ok = have_input_dim && input_dim_ > 0 &&
       left_context_ + right_context_ > 0 &&
       num_log_count_features_ >= 0;
   if (!basics_ok) {
     KALDI_ERR << "Invalid initializer for layer of type "
               << Type() << ": \"" << cfl->WholeLine() << "\"";
   }
   Check();
 }

 // Default constructor.  input_dim_ and both contexts start at -1, values
 // that Check() rejects, so the object must be configured (InitFromConfig()
 // or Read()) before use.  Other defaults: input period 1, no log-count
 // features, no standard-deviation output, variance floor 1.0e-10, and
 // require_direct_input_ false.
 StatisticsPoolingComponent::StatisticsPoolingComponent():
     input_dim_(-1), input_period_(1), left_context_(-1), right_context_(-1),
     num_log_count_features_(0), output_stddevs_(false),
     variance_floor_(1.0e-10), require_direct_input_(false) { }


 // Copy constructor: copies every configuration member from 'other'
 // (including require_direct_input_) and then runs Check(), which asserts
 // that the copied configuration is valid.
 StatisticsPoolingComponent::StatisticsPoolingComponent(
     const StatisticsPoolingComponent &other):
     input_dim_(other.input_dim_), input_period_(other.input_period_),
     left_context_(other.left_context_), right_context_(other.right_context_),
     num_log_count_features_(other.num_log_count_features_),
     output_stddevs_(other.output_stddevs_),
     variance_floor_(other.variance_floor_),
     require_direct_input_(other.require_direct_input_) {
   Check();
 }

 // Asserts that the configuration is self-consistent.
 void StatisticsPoolingComponent::Check() const {
   KALDI_ASSERT(input_dim_ > 0);
   KALDI_ASSERT(input_period_ > 0);
   // contexts are non-negative and the pooling window is not a single frame.
   KALDI_ASSERT(left_context_ >= 0 && right_context_ >= 0 &&
                left_context_ + right_context_ > 0);
   // the window is stepped through in units of input_period_, so both
   // contexts have to be multiples of it.
   KALDI_ASSERT(left_context_ % input_period_ == 0 &&
                right_context_ % input_period_ == 0);
   // the floor must lie strictly between 0 and 1.
   KALDI_ASSERT(variance_floor_ > 0.0 && variance_floor_ < 1.0);
   // for standard deviations the input, after its count column, must split
   // evenly into x stats and x^2 stats (see Propagate()).
   KALDI_ASSERT(!output_stddevs_ || (input_dim_ - 1) % 2 == 0);
 }

 // Deserializes the component from 'is', mirroring Write(): each member is
 // read after its token, in the order input dim, input period, left context,
 // right context, number of log-count features, output-stddevs flag and
 // variance floor, followed by the closing token.  require_direct_input_ is
 // reset to false since it is not stored, and the result is validated with
 // Check().
 void StatisticsPoolingComponent::Read(std::istream &is, bool binary) {
   ExpectOneOrTwoTokens(is, binary, "<StatisticsPoolingComponent>",
                        "<InputDim>");
   ReadBasicType(is, binary, &input_dim_);
   ExpectToken(is, binary, "<InputPeriod>");
   ReadBasicType(is, binary, &input_period_);
   ExpectToken(is, binary, "<LeftContext>");
   ReadBasicType(is, binary, &left_context_);
   ExpectToken(is, binary, "<RightContext>");
   ReadBasicType(is, binary, &right_context_);
   ExpectToken(is, binary, "<NumLogCountFeatures>");
   ReadBasicType(is, binary, &num_log_count_features_);
   ExpectToken(is, binary, "<OutputStddevs>");
   ReadBasicType(is, binary, &output_stddevs_);
   ExpectToken(is, binary, "<VarianceFloor>");
   ReadBasicType(is, binary, &variance_floor_);
   ExpectToken(is, binary, "</StatisticsPoolingComponent>");
   require_direct_input_ = false;  // This is not written to disk, it's only used
                                   // temporarily, in memory (see
                                   // nnet3-xvector-compute-batched.cc).
   Check();
 }

 // Serializes the component to 'os' (binary or text according to 'binary').
 // Each member is written after its token, in the order that Read() expects.
 // require_direct_input_ is deliberately not written; Read() resets it to
 // false.
 void StatisticsPoolingComponent::Write(std::ostream &os, bool binary) const {
   WriteToken(os, binary, "<StatisticsPoolingComponent>");
   WriteToken(os, binary, "<InputDim>");
   WriteBasicType(os, binary, input_dim_);
   WriteToken(os, binary, "<InputPeriod>");
   WriteBasicType(os, binary, input_period_);
   WriteToken(os, binary, "<LeftContext>");
   WriteBasicType(os, binary, left_context_);
   WriteToken(os, binary, "<RightContext>");
   WriteBasicType(os, binary, right_context_);
   WriteToken(os, binary, "<NumLogCountFeatures>");
   WriteBasicType(os, binary, num_log_count_features_);
   WriteToken(os, binary, "<OutputStddevs>");
   WriteBasicType(os, binary, output_stddevs_);
   WriteToken(os, binary, "<VarianceFloor>");
   WriteBasicType(os, binary, variance_floor_);
   WriteToken(os, binary, "</StatisticsPoolingComponent>");
 }

 void StatisticsPoolingComponent::ReorderIndexes(
     std::vector<Index> *input_indexes,
     std::vector<Index> *output_indexes) const {
     std::sort(input_indexes->begin(), input_indexes->end(),
               IndexLessNxt());
     std::sort(output_indexes->begin(), output_indexes->end(),
               IndexLessNxt());
 }

 void StatisticsPoolingComponent::GetInputIndexes(
     const MiscComputationInfo &misc_info,
     const Index &output_index,
     std::vector<Index> *desired_indexes) const {
   desired_indexes->clear();
   Index input_index(output_index);
   int32 middle_t = output_index.t,
       t_start = middle_t - left_context_,
       t_last = middle_t + right_context_;
   KALDI_ASSERT(middle_t % input_period_ == 0);
   for (int32 t = t_start; t <= t_last; t += input_period_) {
     input_index.t = t;
     desired_indexes->push_back(input_index);
   }
 }

 bool StatisticsPoolingComponent::IsComputable(
     const MiscComputationInfo &misc_info,
     const Index &output_index,
     const IndexSet &input_index_set,
     std::vector<Index> *used_inputs) const {
   if (used_inputs)
     used_inputs->clear();
   // you are not supposed to access the output of this component other than at
   // multiples of the input period.  We could make this an error but decided to
   // just have it return false.
   if (output_index.t % input_period_ != 0)
     return false;

   Index input_index(output_index);
   int32 output_t = output_index.t,
       t_start = output_t - left_context_,
       t_last = output_t + right_context_;
   if (!used_inputs) {
     for (int32 t = t_start; t <= t_last; t += input_period_) {
       input_index.t = t;
       if (input_index_set(input_index))
         return true;
     }
     return false;
   } else {
     bool ans = false;
     for (int32 t = t_start; t <= t_last; t += input_period_) {
       input_index.t = t;
       if (input_index_set(input_index)) {
         ans = true;
         used_inputs->push_back(input_index);
       }
     }
     return ans;
   }
 }

 // Precomputes the row mappings used by Propagate() and Backprop().
 //   input_indexes / output_indexes: Indexes of the input and output rows.
 //   need_backprop: if true, the backward mapping is stored as well.
 // forward_indexes[i] is the half-open range [begin, end) of input rows that
 // are pooled into output row i; backward_indexes[j] is the half-open range
 // of output rows that input row j takes part in.  Asserts that both kinds of
 // range are contiguous and non-empty.
 // Returns a newly allocated object.  'misc_info' is not used.
 ComponentPrecomputedIndexes*
 StatisticsPoolingComponent::PrecomputeIndexes(
     const MiscComputationInfo &misc_info,
     const std::vector<Index> &input_indexes,
     const std::vector<Index> &output_indexes,
     bool need_backprop) const {
   const int32 num_input_indexes = input_indexes.size(),
       num_output_indexes = output_indexes.size();
   StatisticsPoolingComponentPrecomputedIndexes *ans = new
       StatisticsPoolingComponentPrecomputedIndexes();

   // (-1, -1) marks a range that has not been started yet.
   Int32Pair invalid_pair;
   invalid_pair.first = -1;
   invalid_pair.second = -1;
   // (begin, end) of the input rows included in the sum for each output row.
   std::vector<Int32Pair> forward_indexes_cpu(num_output_indexes,
                                              invalid_pair);
   // (begin, end) of the output rows that each input row participates in.
   // Because of the way the indexes are sorted (and the fact that only
   // required indexes are present at the input), these sets have no gaps.
   std::vector<Int32Pair> backward_indexes_cpu(num_input_indexes,
                                               invalid_pair);

   // Position of every input Index within 'input_indexes'.
   unordered_map<Index, int32, IndexHasher> position_of_input;
   for (int32 pos = 0; pos < num_input_indexes; pos++)
     position_of_input[input_indexes[pos]] = pos;

   for (int32 i = 0; i < num_output_indexes; i++) {
     Index input_index(output_indexes[i]);
     const int32 center_t = input_index.t,
         first_t = center_t - left_context_,
         last_t = center_t + right_context_;
     for (int32 in_t = first_t; in_t <= last_t; in_t += input_period_) {
       input_index.t = in_t;
       unordered_map<Index, int32, IndexHasher>::iterator found =
           position_of_input.find(input_index);
       if (found == position_of_input.end())
         continue;  // this frame is not available at the input.
       const int32 input_pos = found->second;

       // extend (or start) the range of inputs for output row i.
       if (forward_indexes_cpu[i].first == -1) {
         forward_indexes_cpu[i].first = input_pos;
         forward_indexes_cpu[i].second = input_pos + 1;
       } else {
         KALDI_ASSERT(forward_indexes_cpu[i].second == input_pos);
         forward_indexes_cpu[i].second++;
       }

       // extend (or start) the range of outputs for this input row.
       if (backward_indexes_cpu[input_pos].first == -1) {
         backward_indexes_cpu[input_pos].first = i;
         backward_indexes_cpu[input_pos].second = i + 1;
       } else {
         KALDI_ASSERT(backward_indexes_cpu[input_pos].second == i);
         backward_indexes_cpu[input_pos].second++;
       }
     }
     KALDI_ASSERT(forward_indexes_cpu[i].first != -1);
   }
   // every input row must take part in at least one output row.
   for (int32 i = 0; i < num_input_indexes; i++) {
     KALDI_ASSERT(backward_indexes_cpu[i].first != -1);
   }

   ans->forward_indexes = forward_indexes_cpu;
   if (need_backprop)
     ans->backward_indexes = backward_indexes_cpu;
   return ans;
 }

 // Forward pass of statistics pooling.  For each output row, the rows of 'in'
 // selected by the corresponding entry of the precomputed forward_indexes are
 // summed.  Column 0 of 'in' is summed into a per-row count; the remaining
 // (input_dim_ - 1) columns are summed, divided by that count, and written to
 // 'out' starting at column num_log_count_features_.  If
 // num_log_count_features_ > 0, each of the first num_log_count_features_
 // columns of 'out' is set to the log of the count.  If output_stddevs_ is
 // true, the second half of the averaged stats is converted in place to a
 // floored standard deviation.  Always returns NULL.
 void* StatisticsPoolingComponent::Propagate(
     const ComponentPrecomputedIndexes *indexes_in,
     const CuMatrixBase<BaseFloat> &in,
     CuMatrixBase<BaseFloat> *out) const {
   // 'out' is accumulated into below, so it has to start from zero.
   out->SetZero();
   KALDI_ASSERT(indexes_in != NULL);
   const StatisticsPoolingComponentPrecomputedIndexes *indexes =
       dynamic_cast<const StatisticsPoolingComponentPrecomputedIndexes*>(indexes_in);
   int32 num_rows_out = out->NumRows();
   KALDI_ASSERT(indexes != NULL &&
                indexes->forward_indexes.Dim() == num_rows_out &&
                in.NumCols() == input_dim_ &&
                out->NumCols() == OutputDim());
   CuVector<BaseFloat> counts(num_rows_out);
   // counts_mat is a fake matrix with one column, containing the counts.
   CuSubMatrix<BaseFloat> counts_mat(counts.Data(), num_rows_out, 1, 1);
   counts_mat.AddRowRanges(in.ColRange(0, 1), indexes->forward_indexes);

   // out_non_count is the part of 'out' after the log-count columns; it
   // receives the summed stats, which are then normalized by the counts.
   CuSubMatrix<BaseFloat> out_non_count(*out, 0, num_rows_out,
                                        num_log_count_features_, input_dim_ - 1);
   out_non_count.AddRowRanges(in.ColRange(1, input_dim_ - 1),
                              indexes->forward_indexes);
   out_non_count.DivRowsVec(counts);

   if (num_log_count_features_ > 0) {
     // 'counts' is overwritten with log-counts here; the outer product with a
     // vector of ones copies the log-count into each log-count column.
     counts.ApplyLog();
     CuVector<BaseFloat> ones(num_log_count_features_, kUndefined);
     ones.Set(1.0);
     out->ColRange(0, num_log_count_features_).AddVecVec(1.0, counts, ones);
   }

   if (output_stddevs_) {
     // if this is true, then we assume the input contains x^2 stats as well as x
     // stats, and we want to process them into a standard deviation.
     KALDI_ASSERT((input_dim_ - 1) % 2 == 0);
     int32 feature_dim = (input_dim_ - 1) / 2;
     CuSubMatrix<BaseFloat> mean(*out, 0, num_rows_out,
                                 num_log_count_features_, feature_dim),
         variance(*out, 0, num_rows_out,
                  num_log_count_features_ + feature_dim, feature_dim);
     // subtract mean-squared from average of x^2 to get the variance.
     variance.AddMatMatElements(-1.0, mean, mean, 1.0);
     variance.ApplyFloor(variance_floor_);
     // compute the standard deviation via square root.
     variance.ApplyPow(0.5);
   }
   return NULL;
 }

 // Backward pass of statistics pooling.  Takes the derivative w.r.t. the
 // output ('out_deriv_in'), undoes the stddev and count normalization applied
 // in Propagate(), and adds the result to columns 1 .. input_dim_ - 1 of
 // 'in_deriv' using the precomputed backward_indexes.  Column 0 of 'in_deriv'
 // (the count) is left untouched.  'debug_info', 'memo' and the to_update
 // argument are not used.
 void StatisticsPoolingComponent::Backprop(
     const std::string &debug_info,
     const ComponentPrecomputedIndexes *indexes_in,
     const CuMatrixBase<BaseFloat> &in_value,
     const CuMatrixBase<BaseFloat> &out_value,
     const CuMatrixBase<BaseFloat> &out_deriv_in,
     void *memo,
     Component *, // to_update,
     CuMatrixBase<BaseFloat> *in_deriv) const {
   NVTX_RANGE("StatisticsPoolingComponent::Backprop");
   KALDI_ASSERT(indexes_in != NULL);
   const StatisticsPoolingComponentPrecomputedIndexes *indexes =
       dynamic_cast<const StatisticsPoolingComponentPrecomputedIndexes*>(
           indexes_in);
   // The cast yields NULL if indexes_in has an unexpected dynamic type; check
   // it here (as Propagate() does) rather than dereferencing it blindly below.
   KALDI_ASSERT(indexes != NULL);
   int32 num_rows_out = out_deriv_in.NumRows();
   // Work on a copy, since the derivative is modified in place below.
   CuMatrix<BaseFloat> out_deriv(out_deriv_in);
   if (output_stddevs_) {
     // for now we actually ignore the covariance flooring in the backprop- this
     // is an approximation.  Typically the derivatives computed will be quite
     // tiny for floored variances (they should be zero), so it won't affect the
     // derivatives much.
     int32 feature_dim = (input_dim_ - 1) / 2;
     CuSubMatrix<BaseFloat> mean_deriv(out_deriv, 0, num_rows_out,
                                       num_log_count_features_, feature_dim),
         variance_deriv(out_deriv, 0, num_rows_out,
                        num_log_count_features_ + feature_dim, feature_dim),
         mean_value(out_value, 0, num_rows_out,
                    num_log_count_features_, feature_dim),
         stddev_value(out_value, 0, num_rows_out,
                      num_log_count_features_ + feature_dim, feature_dim);
     // we currently have the deriv w.r.t. the stddev.  step 1 is to get it
     // w.r.t. the centered variance.  If the centered variance is s,
     // and the stddev is sqrt(s), then d/ds sqrt(s) = 0.5 / sqrt(s),
     // so we need to multiply variance_deriv by 0.5 / the stddev.
     variance_deriv.DivElements(stddev_value);
     variance_deriv.Scale(0.5);

     // the deriv w.r.t. the uncentered variance is the same as w.r.t. the
     // centered variance (since they differ only by the term -(mean * mean)),
     // but we need to add to dF/dmean the value -2.0 * mean * dF/dvariance.
     mean_deriv.AddMatMatElements(-2.0, mean_value, variance_deriv, 1.0);
   }
   // now we have to account for the effect of division by the count, on
   // the derivative.
   CuVector<BaseFloat> counts(num_rows_out, kUndefined);
   if (num_log_count_features_ > 0) {
     // column 0 of the output holds log(count), so exponentiate to recover it.
     counts.CopyColFromMat(out_value, 0);
     counts.ApplyExp();
   } else {
     counts.SetZero();
     // we need to recompute the counts from the input since they are not in the
     // output.  The submatrix initializer below takes num-rows, num-cols,
     // stride;  num-cols and stride are 1.
     CuSubMatrix<BaseFloat> counts_mat(counts.Data(), num_rows_out, 1, 1);
     counts_mat.AddRowRanges(in_value.ColRange(0, 1), indexes->forward_indexes);
   }
   // Divide the output derivative by the counts.  This is what we want as it
   // concerns the mean and x^2 stats.  As for the counts themselves, the
   // derivative will end up being discarded when we backprop to the
   // StatisticsExtractionComponent (as the count is not differentiable) so it
   // doesn't really matter.
   out_deriv.DivRowsVec(counts);

   // Now propagate the derivative back to the input.  we don't propagate it
   // back for the count's column since it's non-differentiable.
   in_deriv->ColRange(1, input_dim_ - 1).
       AddRowRanges(out_deriv.ColRange(num_log_count_features_, input_dim_ - 1),
                    indexes->backward_indexes);
 }

 // virtual
 void BackpropTruncationComponent::Read(std::istream &is, bool binary) {
   // might not see the "<NaturalGradientAffineComponent>" part because
   // of how ReadNew() works.
   ExpectOneOrTwoTokens(is, binary, "<BackpropTruncationComponent>",
                        "<Dim>");
   ReadBasicType(is, binary, &dim_);
   std::string tok;
   ReadToken(is, binary, &tok);
   if (tok == "<Scale>") {
     ReadBasicType(is, binary, &scale_);
     ReadToken(is, binary, &tok);
   } else {
     scale_ = 1.0;
   }
   KALDI_ASSERT(tok == "<ClippingThreshold>");
   ReadBasicType(is, binary, &clipping_threshold_);
   ExpectToken(is, binary, "<ZeroingThreshold>");
   ReadBasicType(is, binary, &zeroing_threshold_);
   ExpectToken(is, binary, "<ZeroingInterval>");
   ReadBasicType(is, binary, &zeroing_interval_);
   ExpectToken(is, binary, "<RecurrenceInterval>");
   ReadBasicType(is, binary, &recurrence_interval_);
   ExpectToken(is, binary, "<NumElementsClipped>");
   ReadBasicType(is, binary, &num_clipped_);
   ExpectToken(is, binary, "<NumElementsZeroed>");
   ReadBasicType(is, binary, &num_zeroed_);
   ExpectToken(is, binary, "<NumElementsProcessed>");
   ReadBasicType(is, binary, &count_);
   ExpectToken(is, binary, "<NumZeroingBoundaries>");
   ReadBasicType(is, binary, &count_zeroing_boundaries_);
   ExpectToken(is, binary, "</BackpropTruncationComponent>");
 }

 // virtual
 // Writes the component to 'os' as a sequence of token/value pairs enclosed in
 // <BackpropTruncationComponent> ... </BackpropTruncationComponent>: the
 // configuration (dim, scale, thresholds, intervals) followed by the
 // accumulated statistics.  Read() expects the fields in this same order.
 void BackpropTruncationComponent::Write(std::ostream &os, bool binary) const {
   WriteToken(os, binary, "<BackpropTruncationComponent>");
   WriteToken(os, binary, "<Dim>");
   WriteBasicType(os, binary, dim_);
   WriteToken(os, binary, "<Scale>");
   WriteBasicType(os, binary, scale_);
   WriteToken(os, binary, "<ClippingThreshold>");
   WriteBasicType(os, binary, clipping_threshold_);
   WriteToken(os, binary, "<ZeroingThreshold>");
   WriteBasicType(os, binary, zeroing_threshold_);
   WriteToken(os, binary, "<ZeroingInterval>");
   WriteBasicType(os, binary, zeroing_interval_);
   WriteToken(os, binary, "<RecurrenceInterval>");
   WriteBasicType(os, binary, recurrence_interval_);
   WriteToken(os, binary, "<NumElementsClipped>");
   WriteBasicType(os, binary, num_clipped_);
   WriteToken(os, binary, "<NumElementsZeroed>");
   WriteBasicType(os, binary, num_zeroed_);
   WriteToken(os, binary, "<NumElementsProcessed>");
   WriteBasicType(os, binary, count_);
   WriteToken(os, binary, "<NumZeroingBoundaries>");
   WriteBasicType(os, binary, count_zeroing_boundaries_);
   WriteToken(os, binary, "</BackpropTruncationComponent>");
 }

 // Writes the precomputed indexes to 'ostream': the 'zeroing' vector followed
 // by the scalar 'zeroing_sum', enclosed in opening and closing
 // BackpropTruncationComponentPrecomputedIndexes tokens.
 void BackpropTruncationComponentPrecomputedIndexes::Write(std::ostream &ostream,
     bool binary) const {
   WriteToken(ostream, binary,
              "<BackpropTruncationComponentPrecomputedIndexes>");
   WriteToken(ostream, binary, "<Zeroing>");
   zeroing.Write(ostream, binary);
   WriteToken(ostream, binary, "<ZeroingSum>");
   WriteBasicType(ostream, binary, zeroing_sum);
   WriteToken(ostream, binary,
              "</BackpropTruncationComponentPrecomputedIndexes>");
 }

 // Reads the precomputed indexes from 'istream' in the format produced by
 // Write().  The opening token is accepted whether or not it is still present
 // in the stream (see ExpectOneOrTwoTokens).
 void BackpropTruncationComponentPrecomputedIndexes::Read(std::istream &istream,
     bool binary) {
   ExpectOneOrTwoTokens(istream, binary,
                        "<BackpropTruncationComponentPrecomputedIndexes>",
                        "<Zeroing>");
   zeroing.Read(istream, binary);
   ExpectToken(istream, binary, "<ZeroingSum>");
   ReadBasicType(istream, binary, &zeroing_sum);
   ExpectToken(istream, binary,
               "</BackpropTruncationComponentPrecomputedIndexes>");
 }

 // Returns a one-line, human-readable summary of the component's configuration
 // and of the clipping/zeroing statistics accumulated so far.
 std::string BackpropTruncationComponent::Info() const {
   std::ostringstream os;
   os << Type() << ", dim=" << dim_ << ", scale=" << scale_;

   // The count is printed with 3 significant digits; the precision is then
   // put back to 6 for the fields that follow.
   os << ", count=" << std::setprecision(3) << count_ << std::setprecision(6);

   os << ", recurrence-interval=" << recurrence_interval_;
   os << ", clipping-threshold=" << clipping_threshold_;

   // Proportions are reported as 0 when their denominator is not positive.
   os << ", clipped-proportion=";
   if (count_ > 0.0) {
     os << (num_clipped_ / count_);
   } else {
     os << 0;
   }

   os << ", zeroing-threshold=" << zeroing_threshold_;
   os << ", zeroing-interval=" << zeroing_interval_;

   os << ", zeroed-proportion=";
   if (count_zeroing_boundaries_ > 0.0) {
     os << (num_zeroed_ / count_zeroing_boundaries_);
   } else {
     os << 0;
   }

   os << ", count-zeroing-boundaries="
      << static_cast<int32>(count_zeroing_boundaries_);
   return os.str();
 }

 // Sets the configuration from the given values and resets all accumulated
 // statistics to zero.  The thresholds must be non-negative; scale, both
 // intervals and dim must be strictly positive (checked by assertion).
 void BackpropTruncationComponent::Init(
     int32 dim, BaseFloat scale, BaseFloat clipping_threshold,
     BaseFloat zeroing_threshold, int32 zeroing_interval,
     int32 recurrence_interval) {
   KALDI_ASSERT(clipping_threshold >= 0 && zeroing_threshold >= 0 &&
                scale > 0.0 && zeroing_interval > 0 &&
                recurrence_interval > 0 && dim > 0);

   // Configuration.
   dim_ = dim;
   scale_ = scale;
   recurrence_interval_ = recurrence_interval;
   clipping_threshold_ = clipping_threshold;
   zeroing_threshold_ = zeroing_threshold;
   zeroing_interval_ = zeroing_interval;

   // Statistics start from scratch.
   count_ = 0.0;
   count_zeroing_boundaries_ = 0.0;
   num_clipped_ = 0.0;
   num_zeroed_ = 0.0;
 }

 // virtual
 // Initializes the component from a config line.  "dim" is required; the
 // other values are optional and default to scale=1.0,
 // clipping-threshold=30.0, zeroing-threshold=15.0, zeroing-interval=20 and
 // recurrence-interval=1.  A missing "dim", an unrecognized key, or an
 // out-of-range value is reported through KALDI_ERR.
 void BackpropTruncationComponent::InitFromConfig(ConfigLine *cfl) {
   int32 dim = 0;
   bool ok = cfl->GetValue("dim", &dim);
   BaseFloat scale = 1.0,
       clipping_threshold = 30.0,
       zeroing_threshold = 15.0;
   int32 zeroing_interval = 20, recurrence_interval = 1;
   cfl->GetValue("scale", &scale);
   cfl->GetValue("clipping-threshold", &clipping_threshold);
   cfl->GetValue("zeroing-threshold", &zeroing_threshold);
   cfl->GetValue("zeroing-interval", &zeroing_interval);
   cfl->GetValue("recurrence-interval", &recurrence_interval);
   // Init() asserts scale > 0.0, so a non-positive scale is rejected here
   // with a proper error message, like the other invalid values.
   if (!ok || cfl->HasUnusedValues() || scale <= 0.0 ||
       clipping_threshold < 0 || zeroing_threshold < 0 || zeroing_interval < 1 ||
       recurrence_interval < 1 || dim <= 0)
     KALDI_ERR << "Invalid initializer for layer of type "
               << Type() << ": \"" << cfl->WholeLine() << "\"";
   Init(dim, scale, clipping_threshold, zeroing_threshold,
       zeroing_interval, recurrence_interval);
 }

 // virtual
 // Returns a newly allocated component carrying the same configuration and
 // the same accumulated statistics as this one.
 Component* BackpropTruncationComponent::Copy() const {
   BackpropTruncationComponent *copy = new BackpropTruncationComponent();

   // Configuration.
   copy->dim_ = dim_;
   copy->scale_ = scale_;
   copy->recurrence_interval_ = recurrence_interval_;
   copy->clipping_threshold_ = clipping_threshold_;
   copy->zeroing_threshold_ = zeroing_threshold_;
   copy->zeroing_interval_ = zeroing_interval_;

   // Statistics.
   copy->count_ = count_;
   copy->count_zeroing_boundaries_ = count_zeroing_boundaries_;
   copy->num_clipped_ = num_clipped_;
   copy->num_zeroed_ = num_zeroed_;
   return copy;
 }

 // virtual
 // Builds the per-row 'zeroing' vector used by Backprop(): entry i is -1.0 if
 // output index i crosses a zeroing boundary and 0.0 otherwise.  Also stores
 // the number of such rows in 'zeroing_sum'.  'misc_info' and 'need_backprop'
 // are not used.
 ComponentPrecomputedIndexes*
 BackpropTruncationComponent::PrecomputeIndexes(
     const MiscComputationInfo &misc_info,
     const std::vector<Index> &input_indexes,
     const std::vector<Index> &output_indexes,
     bool need_backprop) const {
   int32 num_input_indexes = input_indexes.size(),
       num_output_indexes = output_indexes.size();
   KALDI_ASSERT(num_input_indexes == num_output_indexes);

   // Zero-initialized; only the boundary rows are overwritten below.
   Vector<BaseFloat> zeroing_cpu(num_output_indexes);
   for (int32 row = 0; row < num_output_indexes; ++row) {
     const Index &out_index = output_indexes[row];
     // Frame (t - recurrence_interval_) is the one right before frame t in an
     // RNN.  If the range [t - recurrence_interval_, t] contains a multiple of
     // zeroing_interval_, frame t crosses a boundary.  Subtracting n shifts
     // where the boundary falls, so that gradients are not always zeroed on
     // frame 0; this helps avoid learning utterance-boundary effects.
     const int32 this_block =
         DivideRoundingDown(out_index.t - out_index.n, zeroing_interval_);
     const int32 prev_block =
         DivideRoundingDown(out_index.t - recurrence_interval_ - out_index.n,
                            zeroing_interval_);
     if (this_block != prev_block) {
       zeroing_cpu(row) = -1.0;
     }
   }

   BackpropTruncationComponentPrecomputedIndexes *result =
       new BackpropTruncationComponentPrecomputedIndexes();
   result->zeroing = zeroing_cpu;
   // The entries are 0 or -1, so the negated sum counts the boundary rows.
   result->zeroing_sum = -zeroing_cpu.Sum();
   return result;
 }

 // virtual
 // Forward pass: copies 'in' to 'out' and multiplies it by scale_ (the
 // multiplication is skipped when scale_ is exactly 1.0).  'indexes' is not
 // used.  Always returns NULL.
 void* BackpropTruncationComponent::Propagate(
     const ComponentPrecomputedIndexes *indexes,
     const CuMatrixBase<BaseFloat> &in,
     CuMatrixBase<BaseFloat> *out) const {
   out->CopyFromMat(in);
   if (scale_ == 1.0) {
     return NULL;
   }
   out->Scale(scale_);
   return NULL;
 }

 // virtual
 // Backward pass.  Copies 'out_deriv' to 'in_deriv', multiplies it by scale_,
 // and then multiplies each row by a factor that (a) scales the row down so
 // its norm does not exceed the clipping threshold, and (b) is zero for rows
 // that lie on a zeroing boundary (see PrecomputeIndexes()) and whose norm
 // exceeds the zeroing threshold.  If 'to_update_in' is a
 // BackpropTruncationComponent, its clipping/zeroing statistics are updated.
 // 'debug_info', 'memo' and the in/out values are not used.
 void BackpropTruncationComponent::Backprop(const std::string &debug_info,
                              const ComponentPrecomputedIndexes *indexes_in,
                              const CuMatrixBase<BaseFloat> &, //in_value
                              const CuMatrixBase<BaseFloat> &,
                              const CuMatrixBase<BaseFloat> &out_deriv,
                              void *memo,
                              Component *to_update_in, // may be NULL; may be
                              // identical to "this" or different.
                              CuMatrixBase<BaseFloat> *in_deriv) const {
   NVTX_RANGE("BackpropTruncationComponent::Backprop");
   const BackpropTruncationComponentPrecomputedIndexes *indexes =
       dynamic_cast<const BackpropTruncationComponentPrecomputedIndexes*>(
           indexes_in);
   // The cast yields NULL if indexes_in is NULL or has an unexpected dynamic
   // type; check that before dereferencing it.
   KALDI_ASSERT(indexes != NULL);
   KALDI_ASSERT(indexes->zeroing.Dim() == out_deriv.NumRows());
   // the following statement will do nothing if in_deriv and out_deriv have same
   // memory.
   in_deriv->CopyFromMat(out_deriv);
   if (scale_ != 1.0)
     in_deriv->Scale(scale_);

   BackpropTruncationComponent *to_update =
       dynamic_cast<BackpropTruncationComponent*>(to_update_in);

   // computes clipping_scales.  A non-positive threshold is replaced by a
   // very large one, which effectively disables clipping.
   BaseFloat clipping_threshold =
       (clipping_threshold_ <= 0.0 ? 1.0e+10 : clipping_threshold_);
   // each row in the derivative matrix, which corresponds to one sample in
   // the mini-batch, is scaled so that its norm is at most clipping_threshold
   CuVector<BaseFloat> clipping_scales(in_deriv->NumRows());
   clipping_scales.AddDiagMat2(pow(clipping_threshold, -2), *in_deriv,
                               kNoTrans, 0.0);
   // now clipping_scales contains the squared (norm of each row divided by
   //  clipping_threshold)
   int32 num_not_scaled;
   clipping_scales.ApplyFloor(1.0, &num_not_scaled);
   // now clipping_scales contains max(1, squared-(norm/clipping_threshold));
   // num_not_scaled is used below as the number of rows that are not clipped.
   clipping_scales.ApplyPow(-0.5);
   // now clipping_scales contains min(1, clipping_threshold/vector_norm)
   if (to_update != NULL) {
     to_update->num_clipped_ += (clipping_scales.Dim() - num_not_scaled);
     to_update->count_ += clipping_scales.Dim();
   }

   // computes zeroing_scales.  As above, a non-positive threshold is replaced
   // by a very large one.
   BaseFloat zeroing_threshold =
       (zeroing_threshold_ <= 0.0 ? 1.0e+10 : zeroing_threshold_);
   // zeroing_scales_vec is actually a 1-row matrix.  (the ApplyHeaviside
   // function isn't defined for vectors).
   CuMatrix<BaseFloat> zeroing_scales(1, in_deriv->NumRows());
   CuSubVector<BaseFloat> zeroing_scales_vec(zeroing_scales, 0);
   zeroing_scales_vec.Set(-pow(zeroing_threshold, 2));
   // now zeroing_scales_vec contains -(squared zeroing_threshold)
   zeroing_scales_vec.AddDiagMat2(1.0, *in_deriv, kNoTrans, 1.0);
   // now zeroing_scales_vec contains squared norm of each row -
   // squared zeroing_threshold
   zeroing_scales.ApplyHeaviside();
   // now the element of zeroing_scales_vec is 1.0 if its corresponding
   // sample's norm exceeds zeroing_threshold, and 0.0 otherwise
   zeroing_scales_vec.MulElements(indexes->zeroing);
   // now the element of zeroing_scales_vec is -1.0 if we want to zero its
   // corresponding sample's gradient, and 0.0 otherwise
   if (to_update != NULL) {
     to_update->num_zeroed_ -= zeroing_scales_vec.Sum(); // since it is negative
     to_update->count_zeroing_boundaries_ += indexes->zeroing_sum;
   }
   zeroing_scales_vec.Add(1.0);
   // now the element of zeroing_scales_vec is 0.0 if we want to zero its
   // corresponding sample's gradient, and 1.0 otherwise

   // combines clipping_scales and zeroing_scales and applies combined_scales
   // to in_deriv all at once
   CuVector<BaseFloat> combined_scales(clipping_scales);
   combined_scales.MulElements(zeroing_scales_vec);
   in_deriv->MulRowsVec(combined_scales);
 }

 // virtual
 // Resets all accumulated clipping/zeroing statistics to zero.
 void BackpropTruncationComponent::ZeroStats()  {
   num_clipped_ = 0.0;
   num_zeroed_ = 0.0;
   count_ = 0.0;
   count_zeroing_boundaries_ = 0.0;
 }

 // virtual
 // Multiplies every accumulated statistic by 'scale'.  The configuration
 // (including scale_) is not touched.
 void BackpropTruncationComponent::Scale(BaseFloat scale) {
   num_clipped_ *= scale;
   num_zeroed_ *= scale;
   count_ *= scale;
   count_zeroing_boundaries_ *= scale;
 }

 // virtual
 // Adds 'alpha' times the statistics of 'other_in' to this component's
 // statistics.  'other_in' must be a BackpropTruncationComponent.
 void BackpropTruncationComponent::Add(BaseFloat alpha,
                                       const Component &other_in) {
   const BackpropTruncationComponent *other =
       dynamic_cast<const BackpropTruncationComponent*>(&other_in);
   KALDI_ASSERT(other != NULL);
   num_clipped_ += alpha * other->num_clipped_;
   num_zeroed_ += alpha * other->num_zeroed_;
   count_ += alpha * other->count_;
   count_zeroing_boundaries_ += alpha * other->count_zeroing_boundaries_;
 }


 // Returns a human-readable summary: the base-class info, the type, the
 // output dimension, the two boolean flags (printed as true/false) and
 // statistics of the 'output' parameter vector.
 std::string ConstantComponent::Info() const {
   std::ostringstream os;
   os << UpdatableComponent::Info() << ", " << Type();
   os << ", output-dim=" << OutputDim();
   // boolalpha stays set on the stream, so both flags print as words.
   os << std::boolalpha;
   os << ", is-updatable=" << is_updatable_;
   os << ", use-natural-gradient=" << use_natural_gradient_;
   PrintParameterStats(os, "output", output_, true);
   return os.str();
 }

 // Default constructor: the component starts out updatable and using the
 // natural gradient; the output vector is left default-constructed.
 ConstantComponent::ConstantComponent()
     : UpdatableComponent(),
       is_updatable_(true),
       use_natural_gradient_(true) {
 }

 // Copy constructor: copies the base-class state, the output vector, both
 // flags and the preconditioner from 'other'.
 ConstantComponent::ConstantComponent(const ConstantComponent &other)
     : UpdatableComponent(other),
       output_(other.output_),
       is_updatable_(other.is_updatable_),
       use_natural_gradient_(other.use_natural_gradient_),
       preconditioner_(other.preconditioner_) {
 }

 // Forward pass: sets every row of 'out' to the stored output vector.
 // Neither 'indexes' nor 'in' is read.  Always returns NULL.
 void* ConstantComponent::Propagate(const ComponentPrecomputedIndexes *indexes,
                                    const CuMatrixBase<BaseFloat> &in,
                                    CuMatrixBase<BaseFloat> *out) const {
   out->CopyRowsFromVec(output_);

   return NULL;
 }

 // Backward pass.  The output does not depend on the input, so 'in_deriv' is
 // never touched.  If 'to_update_in' is non-NULL and refers to an updatable
 // ConstantComponent, the row-sum of 'out_deriv' (optionally preconditioned
 // with the natural gradient) is added to its output vector, scaled by the
 // learning rate.  'debug_info', 'indexes' and 'memo' are not used.
 void ConstantComponent::Backprop(
     const std::string &debug_info,
     const ComponentPrecomputedIndexes *indexes,
     const CuMatrixBase<BaseFloat> &, // in_value
     const CuMatrixBase<BaseFloat> &, // out_value
     const CuMatrixBase<BaseFloat> &out_deriv,
     void *memo,
     Component *to_update_in,
     CuMatrixBase<BaseFloat> *in_deriv) const {
   NVTX_RANGE("ConstantComponent::Backprop");
   // we don't update in_deriv, since we set the flag
   // kBackpropAdds, and the output doesn't depend on the
   // input, so the input-derivative is zero.
   if (to_update_in == NULL)
     return;

   ConstantComponent *to_update =
       dynamic_cast<ConstantComponent*>(to_update_in);
   // The cast yields NULL if to_update_in is not a ConstantComponent; verify
   // it *before* reading any member through the pointer.
   KALDI_ASSERT(to_update != NULL);

   // only do the update if the is_updatable_ flag is set.
   if (!to_update->is_updatable_)
     return;

   if (to_update->use_natural_gradient_ && !to_update->is_gradient_) {
     // Precondition a copy, since out_deriv itself is const.
     CuMatrix<BaseFloat> out_deriv_copy(out_deriv);
     BaseFloat scale = 1.0;
     to_update->preconditioner_.PreconditionDirections(&out_deriv_copy,
                                                       &scale);
     to_update->output_.AddRowSumMat(scale * to_update->learning_rate_,
                                     out_deriv_copy);
   } else {
     to_update->output_.AddRowSumMat(to_update->learning_rate_,
                                     out_deriv);
   }
 }

 // Reads the component from 'is'.  The opening "<ConstantComponent>" token
 // and the fields <LearningRateFactor>, <IsGradient>, <MaxChange> and
 // <LearningRate> are each optional; when a field is absent its member is
 // set to the default shown in the corresponding else-branch below.  The
 // <Output>, <IsUpdatable> and <UseNaturalGradient> fields are required.
 void ConstantComponent::Read(std::istream &is, bool binary) {
   std::string token;
   ReadToken(is, binary, &token);
   if (token == "<ConstantComponent>") {
     // Skip the opening tag and move on to the first real field.
     ReadToken(is, binary, &token);
   }
   if (token == "<LearningRateFactor>") {
     ReadBasicType(is, binary, &learning_rate_factor_);
     ReadToken(is, binary, &token);
   } else {
     learning_rate_factor_ = 1.0;
   }
   if (token == "<IsGradient>") {
     ReadBasicType(is, binary, &is_gradient_);
     ReadToken(is, binary, &token);
   } else {
     is_gradient_ = false;
   }
   if (token == "<MaxChange>") {
     ReadBasicType(is, binary, &max_change_);
     ReadToken(is, binary, &token);
   } else {
     max_change_ = 0.0;
   }
   if (token == "<LearningRate>") {
     ReadBasicType(is, binary, &learning_rate_);
     ReadToken(is, binary, &token);
   } else {
     learning_rate_ = 0.001;
   }
   // Whatever token is current at this point must introduce the output vector.
   if (token != "<Output>") {
     KALDI_ERR << "Expected token <Output>, got " << token;
   }
   output_.Read(is, binary);
   ExpectToken(is, binary, "<IsUpdatable>");
   ReadBasicType(is, binary, &is_updatable_);
   ExpectToken(is, binary, "<UseNaturalGradient>");
   ReadBasicType(is, binary, &use_natural_gradient_);
   ExpectToken(is, binary, "</ConstantComponent>");
 }

 // Writes the component to 'os': the common updatable-component header,
 // then the output vector and the two boolean flags, then the closing token.
 void ConstantComponent::Write(std::ostream &os, bool binary) const {
   WriteUpdatableCommon(os, binary);  // Write the opening tag and learning rate
   WriteToken(os, binary, "<Output>");
   output_.Write(os, binary);
   WriteToken(os, binary, "<IsUpdatable>");
   WriteBasicType(os, binary, is_updatable_);
   WriteToken(os, binary, "<UseNaturalGradient>");
   WriteBasicType(os, binary, use_natural_gradient_);
   WriteToken(os, binary, "</ConstantComponent>");
 }

 // Returns a newly allocated copy of this component, made with the copy
 // constructor.
 Component* ConstantComponent::Copy() const {
   ConstantComponent *copy = new ConstantComponent(*this);
   return copy;
 }

 // Scales the output vector by 'scale'; does nothing if the component is not
 // updatable.  A scale of exactly zero sets the vector to zero instead of
 // multiplying it.
 void ConstantComponent::Scale(BaseFloat scale) {
   if (!is_updatable_)
     return;
   if (scale != 0.0)
     output_.Scale(scale);
   else
     output_.SetZero();
 }

 // Adds 'alpha' times the output vector of 'other_in' to this component's
 // output vector; does nothing if this component is not updatable.
 // 'other_in' must be a ConstantComponent.
 void ConstantComponent::Add(BaseFloat alpha, const Component &other_in) {
   if (!is_updatable_)
     return;
   const ConstantComponent *other =
       dynamic_cast<const ConstantComponent*>(&other_in);
   KALDI_ASSERT(other != NULL);
   output_.AddVec(alpha, other->output_);
 }

 // Adds random noise to the output vector: a vector filled by SetRandn(),
 // scaled by 'stddev'.
 void ConstantComponent::PerturbParams(BaseFloat stddev) {
   CuVector<BaseFloat> noise(output_.Dim(), kUndefined);
   noise.SetRandn();
   output_.AddVec(stddev, noise);
 }

 // Returns the dot product of this component's output vector with that of
 // 'other_in', which must be a ConstantComponent.  This component must be
 // updatable.
 BaseFloat ConstantComponent::DotProduct(
     const UpdatableComponent &other_in) const {
   KALDI_ASSERT(is_updatable_);
   const ConstantComponent *other =
       dynamic_cast<const ConstantComponent*>(&other_in);
   KALDI_ASSERT(other != NULL);
   const BaseFloat dot = VecVec(output_, other->output_);
   return dot;
 }

 // Initializes the component from a config line.  "output-dim" is required
 // and must be positive.  "is-updatable", "use-natural-gradient",
 // "output-mean" (default 0.0) and "output-stddev" (default 0.0) are
 // optional.  The output vector is set to output-mean plus output-stddev
 // times random values from SetRandn().
 void ConstantComponent::InitFromConfig(ConfigLine *cfl) {
   int32 output_dim = 0;
   InitLearningRatesFromConfig(cfl);
   bool ok = cfl->GetValue("output-dim", &output_dim);
   cfl->GetValue("is-updatable", &is_updatable_);
   cfl->GetValue("use-natural-gradient", &use_natural_gradient_);

   BaseFloat output_mean = 0.0;
   BaseFloat output_stddev = 0.0;
   cfl->GetValue("output-mean", &output_mean);
   cfl->GetValue("output-stddev", &output_stddev);

   if (!ok || cfl->HasUnusedValues() || output_dim <= 0) {
     KALDI_ERR << "Bad initializer " << cfl->WholeLine();
   }

   // Build the initial value in a temporary vector, then assign it.
   Vector<BaseFloat> init_output(output_dim);
   init_output.SetRandn();
   init_output.Scale(output_stddev);
   init_output.Add(output_mean);
   output_ = init_output;
 }

 // Returns the number of parameters, i.e. the dimension of the output
 // vector.  The component must be updatable.
 int32 ConstantComponent::NumParameters() const {
   KALDI_ASSERT(is_updatable_);
   const int32 num_params = output_.Dim();
   return num_params;
 }

 // Copies the output vector (the component's parameters) into 'params'.
 void ConstantComponent::Vectorize(VectorBase<BaseFloat> *params) const {
   params->CopyFromVec(output_);
 }

 // Overwrites the output vector (the component's parameters) with 'params'.
 void ConstantComponent::UnVectorize(const VectorBase<BaseFloat> &params) {
   output_.CopyFromVec(params);
 }

 void ConstantComponent::ConsolidateMemory() {
   OnlineNaturalGradient temp(preconditioner_);
   preconditioner_.Swap(&temp);
 }

 // Returns a one-line summary of the component: type, output dimension,
 // dropout proportion and, only when set, the 'continuous' flag.
 std::string DropoutMaskComponent::Info() const {
   std::ostringstream os;
   os << Type();
   os << ", output-dim=" << output_dim_;
   os << ", dropout-proportion=" << dropout_proportion_;
   if (continuous_) {
     os << ", continuous=true";
   }
   return os.str();
 }

 // Default constructor: output dimension -1 (not yet set), dropout
 // proportion 0.5, binary (non-continuous) masks.
 DropoutMaskComponent::DropoutMaskComponent()
     : output_dim_(-1),
       dropout_proportion_(0.5),
       continuous_(false) {
 }

 // Copy constructor: copies the output dimension, the dropout proportion,
 // the 'continuous' flag and the test-mode flag from 'other'.
 DropoutMaskComponent::DropoutMaskComponent(
     const DropoutMaskComponent &other):
     output_dim_(other.output_dim_),
     dropout_proportion_(other.dropout_proportion_),
     continuous_(other.continuous_) {
   // test_mode_ changes what Propagate() produces and is serialized by
   // Write(), so a copy has to carry it over; it is not covered by the
   // initializer list above.
   test_mode_ = other.test_mode_;
 }

 // Fills 'out' with a dropout mask; 'in' must have no rows.  Always returns
 // NULL.  The cases, in the order they are checked:
 //  - dropout proportion of zero: all ones;
 //  - continuous mode: all ones in test mode, otherwise uniform random
 //    values scaled and shifted so that their expected value is 1.0;
 //  - test mode (non-continuous): every element is (1 - dropout_proportion);
 //  - otherwise: a random 0/1 mask, with special handling of the first two
 //    columns when 'out' has 2 or 3 columns.
 void* DropoutMaskComponent::Propagate(
     const ComponentPrecomputedIndexes *indexes,
     const CuMatrixBase<BaseFloat> &in,
     CuMatrixBase<BaseFloat> *out) const {
   KALDI_ASSERT(in.NumRows() == 0 && out->NumCols() == output_dim_);
   BaseFloat dropout_proportion = dropout_proportion_;
   KALDI_ASSERT(dropout_proportion >= 0.0 && dropout_proportion <= 1.0);

   if (dropout_proportion == 0) {
     out->Set(1.0);
     return NULL;
   }

   if (continuous_) {
     if (test_mode_) {
       out->Set(1.0);
     } else {
       // This method is const, so the generator is accessed via const_cast.
       const_cast<CuRand<BaseFloat>&>(random_generator_).RandUniform(out);
       out->Scale(dropout_proportion * 4.0);
       // make the expected value 1.0.
       out->Add(1.0 - (2.0 * dropout_proportion));
     }
     return NULL;
   }

   if (test_mode_) {
     out->Set(1.0 - dropout_proportion);
     return NULL;
   }

   // Binary mask: shift uniform values down by dropout_proportion, then map
   // them to 0/1 with ApplyHeaviside().
   const_cast<CuRand<BaseFloat>&>(random_generator_).RandUniform(out);
   out->Add(-dropout_proportion);
   out->ApplyHeaviside();

   if (out->NumCols() == 2 || out->NumCols() == 3) {
     // This is a kind of special case relevant to LSTMs.
     // To generate data where it's never the case that both of the dimensions
     // for a row are zero, we generate uniformly distributed data (call this u_i),
     // and for row i, set (*out)(i, 0) = (0 if u_i < dropout_proportion else 1)
     //                and (*out)(i, 1) = (0 if u_i > 1-dropout_proportion else 1)
     int32 num_rows = out->NumRows();
     // later we may make this a bit more efficient.
     CuVector<BaseFloat> temp(num_rows, kUndefined);
     const_cast<CuRand<BaseFloat>&>(random_generator_).RandUniform(&temp);
     temp.Add(-dropout_proportion);
     out->CopyColFromVec(temp, 0);
     temp.Add(-1.0 + (2.0 * dropout_proportion));
     // Now, 'temp' contains the original uniformly-distributed data plus
     // -(1 - dropout_proportion).
     temp.Scale(-1.0);
     out->CopyColFromVec(temp, 1);
     // Columns 0 and 1 are overwritten above; ApplyHeaviside() is applied
     // to the whole matrix again to turn them into 0/1 values.
     out->ApplyHeaviside();
   }
   return NULL;
 }


 // Reads the component from 'is' in the format produced by Write().  The
 // <TestMode> field is optional (test_mode_ defaults to false); the presence
 // of a <Continuous> token sets continuous_ to true, its absence to false.
 void DropoutMaskComponent::Read(std::istream &is, bool binary) {
   ExpectOneOrTwoTokens(is, binary, "<DropoutMaskComponent>", "<OutputDim>");
   ReadBasicType(is, binary, &output_dim_);
   ExpectToken(is, binary, "<DropoutProportion>");
   ReadBasicType(is, binary, &dropout_proportion_);
   // Optional fields are detected by peeking at the next token.
   if (PeekToken(is, binary) == 'T') {
     ExpectToken(is, binary, "<TestMode>");
     ReadBasicType(is, binary, &test_mode_);  // read test mode
   } else {
     test_mode_ = false;
   }
   if (PeekToken(is, binary) == 'C') {
     ExpectToken(is, binary, "<Continuous>");
     continuous_ = true;
   } else {
     continuous_ = false;
   }
   ExpectToken(is, binary, "</DropoutMaskComponent>");
 }


 // Writes the component to 'os': output dimension, dropout proportion and
 // test-mode flag, followed by a bare <Continuous> token only when
 // continuous_ is true, then the closing token.
 void DropoutMaskComponent::Write(std::ostream &os, bool binary) const {
   WriteToken(os, binary, "<DropoutMaskComponent>");
   WriteToken(os, binary, "<OutputDim>");
   WriteBasicType(os, binary, output_dim_);
   WriteToken(os, binary, "<DropoutProportion>");
   WriteBasicType(os, binary, dropout_proportion_);
   WriteToken(os, binary, "<TestMode>");
   WriteBasicType(os, binary, test_mode_);
   // The token carries no value; its presence alone means "continuous".
   if (continuous_)
     WriteToken(os, binary, "<Continuous>");
   WriteToken(os, binary, "</DropoutMaskComponent>");
 }

 // Returns a newly allocated copy of this component, made with the copy
 // constructor.
 Component* DropoutMaskComponent::Copy() const {
   DropoutMaskComponent *copy = new DropoutMaskComponent(*this);
   return copy;
 }

 // Initializes the component from a config line.  "output-dim" is required
 // and must be positive (checked by assertion).  "dropout-proportion"
 // (default 0.5), "continuous" (default false) and "test-mode" (default
 // false) are optional.
 void DropoutMaskComponent::InitFromConfig(ConfigLine *cfl) {
   // Defaults for the optional settings; overridden below if present.
   dropout_proportion_ = 0.5;
   continuous_ = false;
   test_mode_ = false;

   output_dim_ = 0;
   bool ok = cfl->GetValue("output-dim", &output_dim_);
   KALDI_ASSERT(ok && output_dim_ > 0);

   cfl->GetValue("dropout-proportion", &dropout_proportion_);
   cfl->GetValue("continuous", &continuous_);
   cfl->GetValue("test-mode", &test_mode_);
 }


 // Returns a one-line summary of the component.  The 'continuous',
 // specaugment and time-period fields are included only when they are set
 // to something other than their off/zero value.
 std::string GeneralDropoutComponent::Info() const {
   std::ostringstream os;
   os << Type();
   os << ", dim=" << dim_;
   os << ", block-dim=" << block_dim_;
   os << ", dropout-proportion=" << dropout_proportion_;
   if (continuous_) {
     os << ", continuous=true";
   }
   if (specaugment_max_proportion_ != 0) {
     os << ", specaugment-max-proportion=" << specaugment_max_proportion_;
     os << ", specaugment-max-regions=" << specaugment_max_regions_;
   }
   if (time_period_ > 0) {
     os << ", time-period=" << time_period_;
   }
   return os.str();
 }

 // Default constructor: dimensions are -1 (not yet set), time period 0,
 // dropout proportion 0.5, specaugment off (max proportion 0.0, one region),
 // binary (non-continuous) masks.
 GeneralDropoutComponent::GeneralDropoutComponent()
     : dim_(-1),
       block_dim_(-1),
       time_period_(0),
       dropout_proportion_(0.5),
       specaugment_max_proportion_(0.0),
       specaugment_max_regions_(1),
       continuous_(false) {
 }

 // Copy constructor: copies the dimensions, time period, dropout and
 // specaugment settings, the 'continuous' flag and the test-mode flag from
 // 'other'.
 GeneralDropoutComponent::GeneralDropoutComponent(
     const GeneralDropoutComponent &other):
     dim_(other.dim_),
     block_dim_(other.block_dim_),
     time_period_(other.time_period_),
     dropout_proportion_(other.dropout_proportion_),
     specaugment_max_proportion_(other.specaugment_max_proportion_),
     specaugment_max_regions_(other.specaugment_max_regions_),
     continuous_(other.continuous_) {
   // test_mode_ decides whether Propagate() and Backprop() apply a mask at
   // all, so a copy has to carry it over; it is not covered by the
   // initializer list above.
   test_mode_ = other.test_mode_;
 }

 void* GeneralDropoutComponent::Propagate(
     const ComponentPrecomputedIndexes *indexes_in,
     const CuMatrixBase<BaseFloat> &in,
     CuMatrixBase<BaseFloat> *out) const {

   KALDI_ASSERT(SameDim(in, *out));

   // The following will do nothing if 'out' and 'in' refer to the same data.
   out->CopyFromMat(in);

   if (test_mode_ ||
       (dropout_proportion_ == 0.0 && specaugment_max_proportion_ == 0.0))
     return NULL;

   const GeneralDropoutComponentPrecomputedIndexes *indexes =
     dynamic_cast<const GeneralDropoutComponentPrecomputedIndexes*>(indexes_in);
   KALDI_ASSERT(indexes != NULL);

   CuMatrix<BaseFloat> *mask = GetMemo(indexes->num_mask_rows);

   if (block_dim_ < dim_) {
     KALDI_ASSERT(out->Stride() == out->NumCols());
     int32 num_rows = out->NumRows(),
         dim_multiple = dim_  / block_dim_,
         num_rows_reshaped = num_rows * dim_multiple;
     CuSubMatrix<BaseFloat> out_reshaped(out->Data(), num_rows_reshaped,
                                         block_dim_, block_dim_);
     out_reshaped.MulRows(*mask, indexes->indexes);
   } else {
     out->MulRows(*mask, indexes->indexes);
   }
   return mask;
 }

 void GeneralDropoutComponent::Backprop(
     const std::string &debug_info,
     const ComponentPrecomputedIndexes *indexes_in,
     const CuMatrixBase<BaseFloat> &, // in_value
     const CuMatrixBase<BaseFloat> &, // out_value
     const CuMatrixBase<BaseFloat> &out_deriv,
     void *memo,
     Component *to_update,
     CuMatrixBase<BaseFloat> *in_deriv) const {
   NVTX_RANGE("GeneralDropoutComponent::Backprop");
   KALDI_ASSERT(in_deriv != NULL && SameDim(*in_deriv, out_deriv));

   // The following will do no work if in_deriv->Data() == out_deriv.Data().
   in_deriv->CopyFromMat(out_deriv);

   if (test_mode_ ||
       (dropout_proportion_ == 0.0 && specaugment_max_proportion_ == 0.0)) {
     KALDI_ASSERT(memo == NULL);
     return;
   }

   const GeneralDropoutComponentPrecomputedIndexes *indexes =
      dynamic_cast<const GeneralDropoutComponentPrecomputedIndexes*>(indexes_in);
   KALDI_ASSERT(indexes != NULL && memo != NULL);
   CuMatrix<BaseFloat> *mask = reinterpret_cast<CuMatrix<BaseFloat>*>(memo);

   if (block_dim_ < dim_) {
     KALDI_ASSERT(in_deriv->Stride() == in_deriv->NumCols());
     int32 num_rows = in_deriv->NumRows(),
         dim_multiple = dim_  / block_dim_,
         num_rows_reshaped = num_rows * dim_multiple;
     CuSubMatrix<BaseFloat> in_deriv_reshaped(in_deriv->Data(),
                                              num_rows_reshaped,
                                              block_dim_, block_dim_);
     in_deriv_reshaped.MulRows(*mask, indexes->indexes);
   } else {
     in_deriv->MulRows(*mask, indexes->indexes);
   }
 }

 // Reads the component from 'is' in the format produced by Write().  The
 // opening <GeneralDropoutComponent> token may be absent.  The SpecAugment
 // fields and the <TestMode> / <Continuous> flags are optional; their presence
 // is detected by peeking at the next token, and absent fields take their
 // default values.
 void GeneralDropoutComponent::Read(std::istream &is, bool binary) {
   ExpectOneOrTwoTokens(is, binary, "<GeneralDropoutComponent>", "<Dim>");
   ReadBasicType(is, binary, &dim_);

   ExpectToken(is, binary, "<BlockDim>");
   ReadBasicType(is, binary, &block_dim_);

   ExpectToken(is, binary, "<TimePeriod>");
   ReadBasicType(is, binary, &time_period_);

   ExpectToken(is, binary, "<DropoutProportion>");
   ReadBasicType(is, binary, &dropout_proportion_);

   if (PeekToken(is, binary) != 'S') {
     // No SpecAugment section at all.
     specaugment_max_proportion_ = 0.0;
     specaugment_max_regions_ = 1;
   } else {
     ExpectToken(is, binary, "<SpecAugmentMaxProportion>");
     ReadBasicType(is, binary, &specaugment_max_proportion_);
     if (PeekToken(is, binary) != 'S') {
       specaugment_max_regions_ = 1;
     } else {
       ExpectToken(is, binary, "<SpecAugmentMaxRegions>");
       ReadBasicType(is, binary, &specaugment_max_regions_);
     }
   }

   // The boolean flags are encoded by the mere presence of their token.
   test_mode_ = (PeekToken(is, binary) == 'T');
   if (test_mode_)
     ExpectToken(is, binary, "<TestMode>");

   continuous_ = (PeekToken(is, binary) == 'C');
   if (continuous_)
     ExpectToken(is, binary, "<Continuous>");

   ExpectToken(is, binary, "</GeneralDropoutComponent>");
 }


 // Writes the component to 'os'.  The SpecAugment fields are written only when
 // specaugment_max_proportion_ is nonzero (and the region count only when it
 // differs from 1); <TestMode> and <Continuous> are written only when set.
 void GeneralDropoutComponent::Write(std::ostream &os, bool binary) const {
   WriteToken(os, binary, "<GeneralDropoutComponent>");

   WriteToken(os, binary, "<Dim>");
   WriteBasicType(os, binary, dim_);

   WriteToken(os, binary, "<BlockDim>");
   WriteBasicType(os, binary, block_dim_);

   WriteToken(os, binary, "<TimePeriod>");
   WriteBasicType(os, binary, time_period_);

   WriteToken(os, binary, "<DropoutProportion>");
   WriteBasicType(os, binary, dropout_proportion_);

   const bool have_specaugment = (specaugment_max_proportion_ != 0.0);
   if (have_specaugment) {
     WriteToken(os, binary, "<SpecAugmentMaxProportion>");
     WriteBasicType(os, binary, specaugment_max_proportion_);
     const bool default_regions = (specaugment_max_regions_ == 1);
     if (!default_regions) {
       WriteToken(os, binary, "<SpecAugmentMaxRegions>");
       WriteBasicType(os, binary, specaugment_max_regions_);
     }
   }

   if (test_mode_) {
     WriteToken(os, binary, "<TestMode>");
   }
   if (continuous_) {
     WriteToken(os, binary, "<Continuous>");
   }

   WriteToken(os, binary, "</GeneralDropoutComponent>");
 }

 // Returns a newly allocated copy of this component, made with the copy
 // constructor.
 Component* GeneralDropoutComponent::Copy() const {
   GeneralDropoutComponent *duplicate = new GeneralDropoutComponent(*this);
   return duplicate;
 }

 // Initializes the component from a config line.  Recognized keys and their
 // defaults:
 //   dim                         (required, must be > 0)
 //   block-dim                   (default: dim; must be > 0 and divide dim)
 //   time-period                 (default: 0)
 //   dropout-proportion          (default: 0.5)
 //   specaugment-max-proportion  (default: 0.0)
 //   specaugment-max-regions     (default: 1)
 //   continuous                  (default: false)
 //   test-mode                   (default: false)
 // When specaugment-max-proportion is nonzero it must lie in [0, 1],
 // 'continuous' must be false and specaugment-max-regions must be >= 1.
 void GeneralDropoutComponent::InitFromConfig(ConfigLine *cfl) {
   dim_ = 0;
   const bool have_dim = cfl->GetValue("dim", &dim_);
   KALDI_ASSERT(have_dim && dim_ > 0);

   block_dim_ = dim_;
   cfl->GetValue("block-dim", &block_dim_);
   if (block_dim_ <= 0 || dim_ % block_dim_ != 0) {
     KALDI_ERR << "Invalid configuration dim=" << dim_
               << ", block-dim=" << block_dim_;
   }

   time_period_ = 0;
   cfl->GetValue("time-period", &time_period_);

   dropout_proportion_ = 0.5;
   cfl->GetValue("dropout-proportion", &dropout_proportion_);

   specaugment_max_proportion_ = 0.0;
   cfl->GetValue("specaugment-max-proportion", &specaugment_max_proportion_);

   specaugment_max_regions_ = 1;
   cfl->GetValue("specaugment-max-regions", &specaugment_max_regions_);

   continuous_ = false;
   cfl->GetValue("continuous", &continuous_);

   test_mode_ = false;
   cfl->GetValue("test-mode", &test_mode_);

   // The SpecAugment options are only validated when SpecAugment is enabled.
   const bool specaugment_enabled = (specaugment_max_proportion_ != 0.0);
   const bool specaugment_invalid =
       (specaugment_max_proportion_ < 0.0 ||
        specaugment_max_proportion_ > 1.0 || continuous_ ||
        specaugment_max_regions_ < 1);
   if (specaugment_enabled && specaugment_invalid) {
     KALDI_ERR << "Invalid config values: specaugment-max-proportion = "
               << specaugment_max_proportion_ << ", continuous = "
               << std::boolalpha << continuous_
               << ", specaugment-max-regions = " << specaugment_max_regions_;
   }
 }


 // Creates and returns a newly allocated (with 'new') mask matrix of dimension
 // num_mask_rows by block_dim_.  Must only be called outside test mode and
 // when at least one of dropout / SpecAugment is enabled (see the assert).
 //
 // If specaugment_max_proportion_ is nonzero, the mask is a 0/1 SpecAugment
 // frequency mask built on the CPU and the function returns early, so
 // dropout_proportion_ and continuous_ are not used in that case.  Otherwise
 // the mask is a dropout mask derived from uniform random numbers: either
 // {0, 1/(1-p)}-valued (continuous_ == false) or uniformly distributed on
 // [1-2p, 1+2p] (continuous_ == true), where p is dropout_proportion_.
 //
 // NOTE(review): ownership of the returned pointer is not visible here;
 // presumably the caller's memo-deletion code frees it -- confirm.
 CuMatrix<BaseFloat>* GeneralDropoutComponent::GetMemo(
     int32 num_mask_rows) const {
   KALDI_ASSERT(num_mask_rows > 0 && !test_mode_ &&
                (dropout_proportion_ > 0.0 ||
                 specaugment_max_proportion_ != 0.0));
   CuMatrix<BaseFloat> *ans = new CuMatrix<BaseFloat>(num_mask_rows, block_dim_,
                                                      kUndefined);

   if (specaugment_max_proportion_ != 0.0) {
     // This block takes care of the case where we are doing SpecAugment.
     int32 num_freq_bins = block_dim_;
     Matrix<BaseFloat> mask(num_mask_rows, block_dim_);
     mask.Set(1.0);
     // Maximum number of bins zeroed per row, rounded to the nearest integer.
     int32 specaugment_max_zeroed = static_cast<int32>(
         num_freq_bins * specaugment_max_proportion_  +  0.5);
     for (int32 seq = 0; seq < num_mask_rows; seq++) {
       // actually seq is more like a sub-part of a sequence, in the case where
       // time_period_ is not zero.
       SubVector<BaseFloat> this_mask(mask, seq);  // will be all ones, right now.
       int32 num_bins_zeroed = RandInt(0, specaugment_max_zeroed);
       if (num_bins_zeroed != 0) {
         // This is not quite the same as the paper, it is allowed to "wrap around"
         // from the top to the bottom of the frequency spectrum.
         int32 start_bin = RandInt(0, num_freq_bins - 1);
         for (int32 i = start_bin; i < start_bin + num_bins_zeroed; i++)
           this_mask(i % num_freq_bins) = 0.0;

         // if specaugment_max_regions_ is not 1 (e.g. if it's 2 or 3), we want
         // to (possibly) split up the zeroed region into more segments.
         // The way we do this is a bit odd, but it was hard to think of
         // an elegant way to do it.  We just choose a random half of the spectrum
         // (viewing it as a circle, so choosing a random half of the circle)
         // and swap around that half, i.e. flip it on its head.
         for (int32 n = 1; n < specaugment_max_regions_; n++) {
           // Note: this 'start_bin' shadows the one declared above.
           int32 half_bin_size = num_freq_bins / 2,
               quarter_bin_size = half_bin_size / 2,
               start_bin = RandInt(0, num_freq_bins - 1),
               end_bin = start_bin + half_bin_size;
           // Swapping only permutes entries, so the number of zeroed bins in
           // this row is unchanged.
           for (int32 i = 0; i < quarter_bin_size; i++) {
             BaseFloat &a = this_mask((start_bin + i) % num_freq_bins),
                 &b = this_mask((end_bin - i) % num_freq_bins);
             std::swap(a, b);
           }
         }
       }
     }
     // Copy the CPU-side mask into the returned CuMatrix.
     ans->CopyFromMat(mask);
     return ans;
   }

   BaseFloat dropout_proportion = dropout_proportion_;

   // This const_cast is only safe assuming you don't attempt
   // to use multi-threaded code with the GPU.
   const_cast<CuRand<BaseFloat>&>(random_generator_).RandUniform(ans);

   if (!continuous_) {
     ans->Add(-dropout_proportion);
     // now, a proportion "dropout_proportion" will be < 0.0. After applying the
     // function (x>0?1:0), a proportion "dropout_proportion" will be zero and (1 -
     // dropout_proportion) will be 1.0.
     ans->ApplyHeaviside();
     // Rescale the surviving entries so that the expected mask value is 1.0.
     // NOTE(review): dropout_proportion == 1.0 would make this scale infinite;
     // no check for that is visible in this function -- confirm it is excluded
     // elsewhere.
     ans->Scale(1.0 / (1.0 - dropout_proportion));
   } else {
     ans->Scale(dropout_proportion * 4.0);
     // make the expected value 1.0.
     ans->Add(1.0 - (2.0 * dropout_proportion));
   }
   return ans;
 }

 // Builds the precomputed indexes for a computation: for each row of the
 // input/output (which must have identical Indexes), the row of the mask
 // matrix that it should be multiplied by.  Rows share a mask row when they
 // have the same 'n' and the same time group, where the time group is 0 if
 // time_period_ == 0 and otherwise t divided by time_period_, rounding down.
 // Mask rows are numbered in order of first appearance.  When dim_ is a
 // multiple (> 1) of block_dim_, each row's index is repeated that many times
 // (once per block) and num_mask_rows is multiplied by the same factor.
 ComponentPrecomputedIndexes* GeneralDropoutComponent::PrecomputeIndexes(
       const MiscComputationInfo &misc_info,
       const std::vector<Index> &input_indexes,
       const std::vector<Index> &output_indexes,
       bool need_backprop) const {
   KALDI_ASSERT(input_indexes == output_indexes);

   typedef std::unordered_map<std::pair<int32, int32>, int32,
                              PairHasher<int32> > KeyToRowMap;

   GeneralDropoutComponentPrecomputedIndexes *ans = new
       GeneralDropoutComponentPrecomputedIndexes;
   const int32 num_indexes = input_indexes.size();
   std::vector<int32> row_of_index(num_indexes);

   // Maps (n, time-group) to the mask row assigned to it.
   KeyToRowMap key_to_row;
   int32 num_distinct = 0;
   for (int32 i = 0; i < num_indexes; i++) {
     const Index &index = input_indexes[i];
     int32 time_group = 0;
     if (time_period_ != 0)
       time_group = DivideRoundingDown(index.t, time_period_);
     const std::pair<int32, int32> key(index.n, time_group);

     // insert() leaves an existing entry untouched, so a key seen before keeps
     // the row it was first given.
     std::pair<KeyToRowMap::iterator, bool> result =
         key_to_row.insert(std::make_pair(key, num_distinct));
     if (result.second)
       num_distinct++;
     row_of_index[i] = result.first->second;
   }

   const int32 blocks_per_row = dim_ / block_dim_;
   if (blocks_per_row == 1) {
     ans->num_mask_rows = num_distinct;
     ans->indexes.CopyFromVec(row_of_index);
     return ans;
   }

   ans->num_mask_rows = num_distinct * blocks_per_row;
   std::vector<int32> expanded;
   expanded.reserve(num_indexes * blocks_per_row);
   for (int32 i = 0; i < num_indexes; i++) {
     // Every block of row i refers to the same mask row.
     for (int32 block = 0; block < blocks_per_row; block++)
       expanded.push_back(row_of_index[i]);
   }
   ans->indexes.CopyFromVec(expanded);
   return ans;
 }

 // Writes num_mask_rows and the index array, bracketed by the class's opening
 // and closing tokens.
 void GeneralDropoutComponentPrecomputedIndexes::Write(std::ostream &os,
     bool binary) const {
   const char *open_token = "<GeneralDropoutComponentPrecomputedIndexes>";
   const char *close_token = "</GeneralDropoutComponentPrecomputedIndexes>";

   WriteToken(os, binary, open_token);

   WriteToken(os, binary, "<NumMaskRows>");
   WriteBasicType(os, binary, num_mask_rows);

   WriteToken(os, binary, "<Indexes>");
   indexes.Write(os, binary);

   WriteToken(os, binary, close_token);
 }

 // Reads num_mask_rows and the index array in the format produced by Write();
 // the opening token may be absent.
 void GeneralDropoutComponentPrecomputedIndexes::Read(std::istream &is,
     bool binary) {
   const char *open_token = "<GeneralDropoutComponentPrecomputedIndexes>";
   const char *close_token = "</GeneralDropoutComponentPrecomputedIndexes>";

   ExpectOneOrTwoTokens(is, binary, open_token, "<NumMaskRows>");
   ReadBasicType(is, binary, &num_mask_rows);

   ExpectToken(is, binary, "<Indexes>");
   indexes.Read(is, binary);

   ExpectToken(is, binary, close_token);
 }

 // Returns a one-line, comma-separated description of this component: its
 // type followed by dim, zeroed-proportion and time-mask-max-frames.
 std::string SpecAugmentTimeMaskComponent::Info() const {
   std::ostringstream description;
   description << Type();
   description << ", dim=" << dim_;
   description << ", zeroed-proportion=" << zeroed_proportion_;
   description << ", time-mask-max-frames=" << time_mask_max_frames_;
   return description.str();
 }

 // Default constructor.  dim_ is set to -1 (not a valid dimension;
 // InitFromConfig() and Read() overwrite it); zeroed_proportion_ and
 // time_mask_max_frames_ get the same defaults that InitFromConfig() uses.
 SpecAugmentTimeMaskComponent::SpecAugmentTimeMaskComponent():
     dim_(-1), zeroed_proportion_(0.25),
     time_mask_max_frames_(10) { }

 // Copy constructor: copies dim_, zeroed_proportion_ and
 // time_mask_max_frames_ from 'other'.
 // NOTE(review): test_mode_ is not copied here; presumably a base-class
 // constructor handles it -- confirm.
 SpecAugmentTimeMaskComponent::SpecAugmentTimeMaskComponent(
     const SpecAugmentTimeMaskComponent &other):
     dim_(other.dim_),
     zeroed_proportion_(other.zeroed_proportion_),
     time_mask_max_frames_(other.time_mask_max_frames_) { }

 void* SpecAugmentTimeMaskComponent::Propagate(
     const ComponentPrecomputedIndexes *indexes_in,
     const CuMatrixBase<BaseFloat> &in,
     CuMatrixBase<BaseFloat> *out) const {

   KALDI_ASSERT(SameDim(in, *out));

   // The following will do nothing if 'out' and 'in' refer to the same data.
   out->CopyFromMat(in);

   if (test_mode_ ||
       zeroed_proportion_ == 0.0)
     return NULL;

   const SpecAugmentTimeMaskComponentPrecomputedIndexes *indexes =
     dynamic_cast<const SpecAugmentTimeMaskComponentPrecomputedIndexes*>(indexes_in);
   KALDI_ASSERT(indexes != NULL);

   CuVector<BaseFloat> *mask = GetMemo(*indexes);
   out->MulRowsVec(*mask);
   return mask;
 }

 void SpecAugmentTimeMaskComponent::Backprop(
     const std::string &debug_info,
     const ComponentPrecomputedIndexes *indexes_in,
     const CuMatrixBase<BaseFloat> &, // in_value
     const CuMatrixBase<BaseFloat> &, // out_value
     const CuMatrixBase<BaseFloat> &out_deriv,
     void *memo,
     Component *to_update,
     CuMatrixBase<BaseFloat> *in_deriv) const {
   NVTX_RANGE("SpecAugmentTimeMaskComponent::Backprop");
   KALDI_ASSERT(in_deriv != NULL && SameDim(*in_deriv, out_deriv));

   // The following will do no work if in_deriv->Data() == out_deriv.Data().
   in_deriv->CopyFromMat(out_deriv);

   if (test_mode_ || zeroed_proportion_ == 0.0) {
     KALDI_ASSERT(memo == NULL);
     return;
   }

   const SpecAugmentTimeMaskComponentPrecomputedIndexes *indexes =
     dynamic_cast<const SpecAugmentTimeMaskComponentPrecomputedIndexes*>(indexes_in);
   KALDI_ASSERT(indexes != NULL && memo != NULL);
   CuVector<BaseFloat> *mask = reinterpret_cast<CuVector<BaseFloat>*>(memo);

   in_deriv->MulRowsVec(*mask);
 }

 // Reads the component in the format produced by Write().  The opening
 // <SpecAugmentTimeMaskComponent> token may be absent; <TestMode> is optional
 // and its presence alone means test mode is on.
 void SpecAugmentTimeMaskComponent::Read(std::istream &is, bool binary) {
   ExpectOneOrTwoTokens(is, binary, "<SpecAugmentTimeMaskComponent>", "<Dim>");
   ReadBasicType(is, binary, &dim_);

   ExpectToken(is, binary, "<ZeroedProportion>");
   ReadBasicType(is, binary, &zeroed_proportion_);

   ExpectToken(is, binary, "<TimeMaskMaxFrames>");
   ReadBasicType(is, binary, &time_mask_max_frames_);

   test_mode_ = (PeekToken(is, binary) == 'T');
   if (test_mode_)
     ExpectToken(is, binary, "<TestMode>");

   ExpectToken(is, binary, "</SpecAugmentTimeMaskComponent>");
 }


 // Writes the component to 'os': dim, zeroed proportion, maximum time-mask
 // length and, only when test mode is on, the <TestMode> token.
 void SpecAugmentTimeMaskComponent::Write(std::ostream &os, bool binary) const {
   WriteToken(os, binary, "<SpecAugmentTimeMaskComponent>");

   WriteToken(os, binary, "<Dim>");
   WriteBasicType(os, binary, dim_);

   WriteToken(os, binary, "<ZeroedProportion>");
   WriteBasicType(os, binary, zeroed_proportion_);

   WriteToken(os, binary, "<TimeMaskMaxFrames>");
   WriteBasicType(os, binary, time_mask_max_frames_);

   if (test_mode_) {
     WriteToken(os, binary, "<TestMode>");
   }

   WriteToken(os, binary, "</SpecAugmentTimeMaskComponent>");
 }

 // Returns a newly allocated copy of this component, made with the copy
 // constructor.
 Component* SpecAugmentTimeMaskComponent::Copy() const {
   SpecAugmentTimeMaskComponent *duplicate =
       new SpecAugmentTimeMaskComponent(*this);
   return duplicate;
 }

 // Initializes the component from a config line.  Recognized keys and their
 // defaults:
 //   dim                   (required, must be > 0)
 //   zeroed-proportion     (default: 0.25; must be in [0, 1))
 //   time-mask-max-frames  (default: 10; must be > 1)
 //   test-mode             (default: false)
 // 'test-mode' is handled the same way as in
 // GeneralDropoutComponent::InitFromConfig().
 //
 // A nonzero zeroed-proportion must also leave room for at least one
 // non-zeroed frame per segment, i.e.
 //   time-mask-max-frames * (1 - z) / z >= 1,
 // because GetMemo() asserts on exactly this quantity; checking it here turns
 // a failure in the middle of training into an error at configuration time.
 void SpecAugmentTimeMaskComponent::InitFromConfig(ConfigLine *cfl) {
   dim_ = 0;
   bool ok = cfl->GetValue("dim", &dim_);
   KALDI_ASSERT(ok && dim_ > 0);
   zeroed_proportion_ = 0.25;
   cfl->GetValue("zeroed-proportion", &zeroed_proportion_);
   time_mask_max_frames_ = 10;
   cfl->GetValue("time-mask-max-frames", &time_mask_max_frames_);
   KALDI_ASSERT(time_mask_max_frames_ > 1);
   test_mode_ = false;
   cfl->GetValue("test-mode", &test_mode_);

   if (zeroed_proportion_ < 0.0 || zeroed_proportion_ >= 1.0) {
     KALDI_ERR << "Invalid config value: zeroed-proportion = "
               << zeroed_proportion_ << " (must be in [0, 1))";
   }
   if (zeroed_proportion_ > 0.0) {
     // Same expression as in GetMemo(), compared before truncation to int32:
     // a value below 1 truncates to 0 there and would fail its assertion.
     BaseFloat z = zeroed_proportion_,
         non_time_mask_max_frames = time_mask_max_frames_ * (1 - z) / z;
     if (non_time_mask_max_frames < 1.0) {
       KALDI_ERR << "Invalid config values: zeroed-proportion = "
                 << zeroed_proportion_ << " is too large for "
                 << "time-mask-max-frames = " << time_mask_max_frames_;
     }
   }
 }


 // Creates and returns a newly allocated (with 'new') 0/1 time mask with one
 // element per row of the input (indexes_in.tot_size elements).
 //
 // Each sequence in indexes_in.indexes is filled independently with
 // alternating non-zeroed (1.0) and zeroed (0.0) segments.  Zeroed segments
 // have a random length in [1, time_mask_max_frames_]; non-zeroed segments
 // have a random length in [1, non_time_mask_max_frames], where
 // non_time_mask_max_frames = time_mask_max_frames_ * (1 - z) / z and z is
 // zeroed_proportion_, so the two maximum lengths are in the ratio z : (1 - z).
 //
 // Must not be called with zeroed_proportion_ == 0 (that would divide by
 // zero); Propagate() returns before calling this function in that case.
 //
 // NOTE(review): ownership of the returned pointer is not visible here;
 // presumably the caller's memo-deletion code frees it -- confirm.
 CuVector<BaseFloat>* SpecAugmentTimeMaskComponent::GetMemo(
     const SpecAugmentTimeMaskComponentPrecomputedIndexes &indexes_in) const {

   const std::vector<std::vector<int32> > &indexes = indexes_in.indexes;
   int32 num_sequences = indexes.size();
   BaseFloat z = zeroed_proportion_;
   int32 time_mask_max_frames = time_mask_max_frames_,
       non_time_mask_max_frames = time_mask_max_frames * (1-z) / z;
   KALDI_ASSERT(time_mask_max_frames > 0 &&
                non_time_mask_max_frames > 0);
   // Left uninitialized: the loops below assign every element whose row index
   // appears in 'indexes'.
   Vector<BaseFloat> mask(indexes_in.tot_size, kUndefined);

   for (int32 s = 0; s < num_sequences; s++) {
     // this_row_indexes gives us, for a particular sequence, the ordered list of
     // row-indexes where we can find the successive 't' values of this sequence.
     // Bound by reference: the list is only read, so there is no need to copy
     // it for every sequence.
     const std::vector<int32> &this_row_indexes = indexes[s];
     int32 seq_length = this_row_indexes.size();
     KALDI_ASSERT(seq_length > 0);

     int32 t = 0;
     while (t < seq_length) {
       // add a non-zeroed, then a zeroed, segment, repeatedly until we have
       // filled the sequence.  The first time we choose randomly whether to add
       // a zeroed or a non-zeroed segment.
       // NOTE(review): as written, a sequence starts with a non-zeroed segment
       // with probability z (not 1 - z); confirm that this is intended.
       if (t > 0 || WithProb(z)) {
         int32 nonzeroed_length = RandInt(1, non_time_mask_max_frames);
         for (; t < seq_length && nonzeroed_length > 0; t++, nonzeroed_length--)
           mask(this_row_indexes[t]) = 1.0;
       }
       int32 zeroed_length = RandInt(1, time_mask_max_frames);
       for (; t < seq_length && zeroed_length > 0; t++, zeroed_length--)
         mask(this_row_indexes[t]) = 0.0;
     }
   }
   return new CuVector<BaseFloat>(mask);
 }

 // Builds the precomputed indexes for a computation.  The input and output
 // Indexes must be identical and non-empty.  In the result, 'indexes' has one
 // entry per distinct 'n' value (in increasing order of n), each listing the
 // row numbers of that sequence ordered by 't'; 'tot_size' is the total number
 // of rows.
 ComponentPrecomputedIndexes* SpecAugmentTimeMaskComponent::PrecomputeIndexes(
       const MiscComputationInfo &misc_info,
       const std::vector<Index> &input_indexes,
       const std::vector<Index> &output_indexes,
       bool need_backprop) const {
   KALDI_ASSERT(input_indexes == output_indexes);

   SpecAugmentTimeMaskComponentPrecomputedIndexes *ans = new
       SpecAugmentTimeMaskComponentPrecomputedIndexes;
   const int32 num_rows = input_indexes.size();
   KALDI_ASSERT(num_rows != 0);

   // Each entry is (n, t, row).  Sorting the tuples orders them by n first and
   // then by t, which is the order needed to fill ans->indexes.
   std::vector<std::tuple<int32, int32, int32> > keyed_rows(num_rows);
   // Used only to count the distinct n values.
   std::unordered_set<int32> distinct_n;
   for (int32 row = 0; row < num_rows; row++) {
     const Index &index = input_indexes[row];
     distinct_n.insert(index.n);
     keyed_rows[row] = std::make_tuple(index.n, index.t, row);
   }
   std::sort(keyed_rows.begin(), keyed_rows.end());

   // The n values are not assumed to start from zero or to be consecutive, so
   // a separate counter ('sequence') tracks which output list we are filling.
   const int32 num_sequences = distinct_n.size();
   ans->indexes.resize(num_sequences);
   int32 sequence = 0,
       current_n = std::get<0>(keyed_rows[0]);
   for (int32 i = 0; i < num_rows; i++) {
     const int32 n = std::get<0>(keyed_rows[i]),
         row = std::get<2>(keyed_rows[i]);
     KALDI_ASSERT(n >= current_n);
     if (n > current_n) {
       // Moved on to the next sequence.
       sequence++;
       KALDI_ASSERT(sequence < num_sequences);
       current_n = n;
     }
     ans->indexes[sequence].push_back(row);
   }
   sequence++;
   KALDI_ASSERT(sequence == num_sequences);
   ans->tot_size = num_rows;
   return ans;
 }

 void SpecAugmentTimeMaskComponentPrecomputedIndexes::Write(std::ostream &os,
     bool binary) const {
   WriteToken(os, binary,
              "<SpecAugmentTimeMaskComponentPrecomputedIndexes>");
   WriteToken(os, binary, "<Indexes>");
   int32 size = indexes.size();
   WriteBasicType(os, binary, size);
   for (int32 i = 0; i < size; i++) {
     WriteIntegerVector(os, binary, indexes[i]);
   }
   WriteToken(os, binary,
              "</SpecAugmentTimeMaskComponentPrecomputedIndexes>");
 }

 void SpecAugmentTimeMaskComponentPrecomputedIndexes::Read(std::istream &is,
     bool binary) {
   ExpectOneOrTwoTokens(is, binary,
                        "<SpecAugmentTimeMaskComponentPrecomputedIndexes>",
                        "<Indexes>");
   int32 size;
   ReadBasicType(is, binary, &size);
   indexes.clear();
   indexes.resize(size);
   for (int32 i = 0; i < size; i++)
     ReadIntegerVector(is, binary, &(indexes[i]));
   ExpectToken(is, binary,
               "</SpecAugmentTimeMaskComponentPrecomputedIndexes>");
   tot_size = 0;
   for (auto v : indexes) tot_size += v.size();
 }


 } // namespace nnet3
 } // namespace kaldi
kaldi::nnet3::StatisticsPoolingComponent::Check
void Check() const
Definition: nnet-general-component.cc:592

kaldi::nnet3::SpecAugmentTimeMaskComponentPrecomputedIndexes::indexes
std::vector< std::vector< int32 > > indexes
Definition: nnet-general-component.h:1093

kaldi::nnet3::BackpropTruncationComponent::scale_
BaseFloat scale_
Definition: nnet-general-component.h:533

kaldi::nnet3::BackpropTruncationComponent::PrecomputeIndexes
virtual ComponentPrecomputedIndexes * PrecomputeIndexes(const MiscComputationInfo &misc_info, const std::vector< Index > &input_indexes, const std::vector< Index > &output_indexes, bool need_backprop) const
This function must return NULL for simple Components.
Definition: nnet-general-component.cc:1059

kaldi::nnet3::DistributeComponent::IsComputable
virtual bool IsComputable(const MiscComputationInfo &misc_info, const Index &output_index, const IndexSet &input_index_set, std::vector< Index > *used_inputs) const
This function only does something interesting for non-simple Components, and it exists to make it pos...
Definition: nnet-general-component.cc:72

kaldi::nnet3::SpecAugmentTimeMaskComponent::PrecomputeIndexes
virtual ComponentPrecomputedIndexes * PrecomputeIndexes(const MiscComputationInfo &misc_info, const std::vector< Index > &input_indexes, const std::vector< Index > &output_indexes, bool need_backprop) const
This function must return NULL for simple Components.
Definition: nnet-general-component.cc:2042

kaldi::CuRand
Definition: cu-common.h:152

kaldi::nnet3::DropoutMaskComponent::Write
virtual void Write(std::ostream &os, bool binary) const
Write component to stream.
Definition: nnet-general-component.cc:1499

kaldi::CuVectorBase::MulElements
void MulElements(const CuVectorBase< Real > &v)
Definition: cu-vector.cc:838

kaldi::nnet3::StatisticsPoolingComponent::left_context_
int32 left_context_
Definition: nnet-general-component.h:415

kaldi::CuMatrixBase::CopyFromMat
void CopyFromMat(const MatrixBase< OtherReal > &src, MatrixTransposeType trans=kNoTrans)
Definition: cu-matrix.cc:344

kaldi
This code computes Goodness of Pronunciation (GOP) and extracts phone-level pronunciation feature for...
Definition: chain.dox:20

kaldi::CuMatrixBase::Stride
MatrixIndexT Stride() const
Definition: cu-matrix.h:217

kaldi::nnet3::StatisticsExtractionComponent::ReorderIndexes
virtual void ReorderIndexes(std::vector< Index > *input_indexes, std::vector< Index > *output_indexes) const
This function only does something interesting for non-simple Components.
Definition: nnet-general-component.cc:389

kaldi::nnet3::BackpropTruncationComponentPrecomputedIndexes::zeroing_sum
BaseFloat zeroing_sum
Definition: nnet-general-component.h:581

kaldi::nnet3::SpecAugmentTimeMaskComponentPrecomputedIndexes::Read
virtual void Read(std::istream &is, bool binary)
Definition: nnet-general-component.cc:2108

kaldi::nnet3::SpecAugmentTimeMaskComponent::Write
virtual void Write(std::ostream &os, bool binary) const
Write component to stream.
Definition: nnet-general-component.cc:1976

kaldi::nnet3::DistributeComponent::Backprop
virtual void Backprop(const std::string &debug_info, const ComponentPrecomputedIndexes *indexes, const CuMatrixBase< BaseFloat > &in_value, const CuMatrixBase< BaseFloat > &out_value, const CuMatrixBase< BaseFloat > &out_deriv, void *memo, Component *, CuMatrixBase< BaseFloat > *in_deriv) const
Backprop function; depending on which of the arguments 'to_update' and 'in_deriv' are non-NULL...
Definition: nnet-general-component.cc:194

kaldi::nnet3::BackpropTruncationComponentPrecomputedIndexes
Definition: nnet-general-component.h:569

kaldi::DivideRoundingDown
static int32 DivideRoundingDown(int32 a, int32 b)
Returns a / b, rounding towards negative infinity in all cases.
Definition: kaldi-math.h:287

kaldi::CuMatrixBase::ApplyPow
void ApplyPow(Real power)
Definition: cu-matrix.h:438

kaldi::ConfigLine::WholeLine
const std::string WholeLine()
Definition: text-utils.h:230

kaldi::nnet3::DistributeComponent::Type
virtual std::string Type() const
Returns a string such as "SigmoidComponent", describing the type of the object.
Definition: nnet-general-component.h:67

kaldi::kUndefined
Definition: matrix-common.h:39

kaldi::nnet3::SpecAugmentTimeMaskComponentPrecomputedIndexes
Definition: nnet-general-component.h:1084

kaldi::CuVectorBase::SetZero
void SetZero()
Math operations.
Definition: cu-vector.cc:1098

kaldi::nnet3::BackpropTruncationComponentPrecomputedIndexes::Read
virtual void Read(std::istream &istream, bool binary)
Definition: nnet-general-component.cc:969

kaldi::nnet3::SpecAugmentTimeMaskComponent::dim_
int32 dim_
Definition: nnet-general-component.h:1071

kaldi::nnet3::StatisticsPoolingComponent::Write
virtual void Write(std::ostream &os, bool binary) const
Write component to stream.
Definition: nnet-general-component.cc:626

kaldi::nnet3::BackpropTruncationComponent::zeroing_threshold_
BaseFloat zeroing_threshold_
Definition: nnet-general-component.h:539

kaldi::nnet3::DistributeComponent::ComputeInputIndexAndBlock
void ComputeInputIndexAndBlock(const Index &output_index, Index *input_index, int32 *block) const
Definition: nnet-general-component.cc:46

kaldi::WriteIntegerPairVector
void WriteIntegerPairVector(std::ostream &os, bool binary, const std::vector< std::pair< T, T > > &v)
Function for writing STL vectors of pairs of integer types.
Definition: io-funcs-inl.h:93

kaldi::CuArray::CopyFromVec
void CopyFromVec(const std::vector< T > &src)
This function resizes if needed.
Definition: cu-array-inl.h:120

kaldi::nnet3::GeneralDropoutComponent::dropout_proportion_
BaseFloat dropout_proportion_
Definition: nnet-general-component.h:945

kaldi::nnet3::StatisticsPoolingComponent::output_stddevs_
bool output_stddevs_
Definition: nnet-general-component.h:418

rnnlm::j
int j
Definition: mikolov-rnnlm-lib.cc:66

kaldi::nnet3::ConstantComponent::use_natural_gradient_
bool use_natural_gradient_
Definition: nnet-general-component.h:704

kaldi::CuVector
Definition: matrix-common.h:74

kaldi::nnet3::StatisticsExtractionComponent::include_variance_
bool include_variance_
Definition: nnet-general-component.h:273

kaldi::nnet3::BackpropTruncationComponent::count_
double count_
Definition: nnet-general-component.h:562

kaldi::nnet3::StatisticsPoolingComponent::OutputDim
virtual int32 OutputDim() const
Returns output-dimension of this component.
Definition: nnet-general-component.h:346

kaldi::RandUniform
float RandUniform(struct RandomState *state=NULL)
Returns a random number strictly between 0 and 1.
Definition: kaldi-math.h:151

kaldi::CuArrayBase::CopyToVec
void CopyToVec(std::vector< T > *dst) const
This function resizes *dst if needed.
Definition: cu-array-inl.h:177

kaldi::nnet3::BackpropTruncationComponent::recurrence_interval_
int32 recurrence_interval_
Definition: nnet-general-component.h:548

kaldi::nnet3::StatisticsExtractionComponent::output_period_
int32 output_period_
Definition: nnet-general-component.h:272

kaldi::nnet3::CopyPairVector
static void CopyPairVector(const CuArray< Int32Pair > &in, std::vector< std::pair< int32, int32 > > *out)
Definition: nnet-general-component.cc:31

kaldi::CuVectorBase::CopyColFromMat
void CopyColFromMat(const CuMatrixBase< Real > &mat, MatrixIndexT col)
Definition: cu-vector.cc:103

kaldi::nnet3::Component
Abstract base-class for neural-net components.
Definition: nnet-component-itf.h:114

kaldi::ReadBasicType
void ReadBasicType(std::istream &is, bool binary, T *t)
ReadBasicType is the name of the read function for bool, integer types, and floating-point types...
Definition: io-funcs-inl.h:55

kaldi::nnet3::SpecAugmentTimeMaskComponent::Read
virtual void Read(std::istream &is, bool binary)
Read function (used after we know the type of the Component); accepts input that is missing the token...
Definition: nnet-general-component.cc:1959

kaldi::nnet3::StatisticsPoolingComponentPrecomputedIndexes
Definition: nnet-general-component.h:429

kaldi::CuVectorBase::Add
void Add(Real value)
Definition: cu-vector.cc:1157

kaldi::nnet3::GeneralDropoutComponent::dim_
int32 dim_
Definition: nnet-general-component.h:934

kaldi::CuMatrixBase::AddRows
void AddRows(Real alpha, const CuMatrixBase< Real > &src, const CuArrayBase< MatrixIndexT > &indexes)
Does for each row r, this.Row(r) += alpha * src.row(indexes[r]).
Definition: cu-matrix.cc:2766

kaldi::nnet3::GeneralDropoutComponentPrecomputedIndexes::Read
virtual void Read(std::istream &is, bool binary)
Definition: nnet-general-component.cc:1877

kaldi::nnet3::StatisticsExtractionComponent::input_dim_
int32 input_dim_
Definition: nnet-general-component.h:270

kaldi::CuMatrixBase::AddRowRanges
void AddRowRanges(const CuMatrixBase< Real > &src, const CuArrayBase< Int32Pair > &indexes)
For each row r of this and for each column c, do (*this)(r, c) +=  src(j, c), where j ranges from ind...
Definition: cu-matrix.cc:2931

kaldi::nnet3::GeneralDropoutComponent::continuous_
bool continuous_
Definition: nnet-general-component.h:951

kaldi::nnet3::BackpropTruncationComponent::zeroing_interval_
int32 zeroing_interval_
Definition: nnet-general-component.h:543

kaldi::nnet3::GeneralDropoutComponentPrecomputedIndexes::indexes
CuArray< int32 > indexes
Definition: nnet-general-component.h:978

kaldi::nnet3::BackpropTruncationComponent::Init
void Init(int32 dim, BaseFloat scale, BaseFloat clipping_threshold, BaseFloat zeroing_threshold, int32 zeroing_interval, int32 recurrence_interval)
Definition: nnet-general-component.cc:1000

kaldi::nnet3::StatisticsExtractionComponent
Definition: nnet-general-component.h:201

kaldi::nnet3::ConstantComponent::Add
virtual void Add(BaseFloat alpha, const Component &other)
This virtual function when called by – an UpdatableComponent adds the parameters of another updatabl...
Definition: nnet-general-component.cc:1341

kaldi::nnet3::GeneralDropoutComponentPrecomputedIndexes
Definition: nnet-general-component.h:960

kaldi::nnet3::IndexSet
An abstract representation of a set of Indexes.
Definition: nnet-computation-graph.h:322

kaldi::WithProb
bool WithProb(BaseFloat prob, struct RandomState *state)
Definition: kaldi-math.cc:72

kaldi::nnet3::DistributeComponent::input_dim_
int32 input_dim_
Definition: nnet-general-component.h:128

kaldi::CuVectorBase::Set
void Set(Real value)
Definition: cu-vector.cc:1135

kaldi::nnet3::DropoutMaskComponent::Info
virtual std::string Info() const
Returns some text-form information about this component, for diagnostics.
Definition: nnet-general-component.cc:1402

kaldi::nnet3::SpecAugmentTimeMaskComponent::GetMemo
CuVector< BaseFloat > * GetMemo(const SpecAugmentTimeMaskComponentPrecomputedIndexes &indexes) const
Definition: nnet-general-component.cc:2005

kaldi::nnet3::UpdatableComponent::InitLearningRatesFromConfig
void InitLearningRatesFromConfig(ConfigLine *cfl)
Definition: nnet-component-itf.cc:248

kaldi::CuMatrixBase::Sum
Real Sum() const
Definition: cu-matrix.cc:3012

kaldi::nnet3::DropoutMaskComponent::dropout_proportion_
BaseFloat dropout_proportion_
Definition: nnet-general-component.h:792

kaldi::CuMatrixBase::ApplyHeaviside
void ApplyHeaviside()
Definition: cu-matrix.h:447

kaldi::CuMatrixBase::ApplyFloor
void ApplyFloor(Real floor_val)
Definition: cu-matrix.h:451

kaldi::CuVectorBase::AddDiagMat2
void AddDiagMat2(Real alpha, const CuMatrixBase< Real > &M, MatrixTransposeType trans, Real beta)
Add the diagonal of a matrix times itself: *this = diag(M M^T) + beta * *this (if trans == kNoTrans)...
Definition: cu-vector.cc:595

kaldi::nnet3::ConstantComponent::ConstantComponent
ConstantComponent()
Definition: nnet-general-component.cc:1222

kaldi::nnet3::SpecAugmentTimeMaskComponent::InitFromConfig
virtual void InitFromConfig(ConfigLine *cfl)
Initialize, from a ConfigLine object.
Definition: nnet-general-component.cc:1993

kaldi::nnet3::ConstantComponent::Copy
virtual Component * Copy() const
Copies component (deep copy).
Definition: nnet-general-component.cc:1327

kaldi::swap
void swap(basic_filebuf< CharT, Traits > &x, basic_filebuf< CharT, Traits > &y)
Definition: basic-filebuf.h:275

kaldi::int32
kaldi::int32 int32
Definition: online-tcp-source.cc:27

kaldi::ReadToken
void ReadToken(std::istream &is, bool binary, std::string *str)
ReadToken gets the next token and puts it in str (exception on failure).
Definition: io-funcs.cc:154

kaldi::nnet3::ConstantComponent::Vectorize
virtual void Vectorize(VectorBase< BaseFloat > *params) const
Turns the parameters into vector form.
Definition: nnet-general-component.cc:1389

kaldi::nnet3::GeneralDropoutComponent::Type
virtual std::string Type() const
Returns a string such as "SigmoidComponent", describing the type of the object.
Definition: nnet-general-component.h:889

kaldi::nnet3::SpecAugmentTimeMaskComponent::Propagate
virtual void * Propagate(const ComponentPrecomputedIndexes *indexes, const CuMatrixBase< BaseFloat > &in, CuMatrixBase< BaseFloat > *out) const
Propagate function.
Definition: nnet-general-component.cc:1908

kaldi::nnet3::DistributeComponent::Write
virtual void Write(std::ostream &os, bool binary) const
Write component to stream.
Definition: nnet-general-component.cc:239

kaldi::nnet3::OnlineNaturalGradient
Keywords for search: natural gradient, naturalgradient, NG-SGD.
Definition: natural-gradient-online.h:414

kaldi::CuMatrixBase::DivRowsVec
void DivRowsVec(const CuVectorBase< Real > &div)
divide i'th row by div[i]
Definition: cu-matrix.cc:899

kaldi::Matrix< BaseFloat >

kaldi::nnet3::StatisticsPoolingComponent::right_context_
int32 right_context_
Definition: nnet-general-component.h:416

kaldi::CuMatrixBase::AddMatMatElements
void AddMatMatElements(const Real alpha, const CuMatrixBase< Real > &A, const CuMatrixBase< Real > &B, const Real beta)
*this = beta * *this + alpha * A .* B (.* element by element multiplication)
Definition: cu-matrix.cc:1447

kaldi::CuMatrix
This class represents a matrix that's stored on the GPU if we have one, and in memory if not...
Definition: matrix-common.h:71

kaldi::CuMatrixBase::CopyRowsFromVec
void CopyRowsFromVec(const CuVectorBase< Real > &v)
This function has two modes of operation.
Definition: cu-matrix.cc:2301

kaldi::nnet3::DistributeComponent::InitFromConfig
virtual void InitFromConfig(ConfigLine *cfl)
Initialize, from a ConfigLine object.
Definition: nnet-general-component.cc:228

kaldi::nnet3::MiscComputationInfo
Definition: nnet-computation.h:55

kaldi::nnet3::UpdatableComponent::max_change_
BaseFloat max_change_
configuration value for imposing max-change
Definition: nnet-component-itf.h:570

kaldi::nnet3::StatisticsPoolingComponent::IsComputable
virtual bool IsComputable(const MiscComputationInfo &misc_info, const Index &output_index, const IndexSet &input_index_set, std::vector< Index > *used_inputs) const
This function only does something interesting for non-simple Components, and it exists to make it pos...
Definition: nnet-general-component.cc:670

kaldi::nnet3::StatisticsPoolingComponent::Read
virtual void Read(std::istream &is, bool binary)
Read function (used after we know the type of the Component); accepts input that is missing the token...
Definition: nnet-general-component.cc:603

kaldi::nnet3::StatisticsExtractionComponent::StatisticsExtractionComponent
StatisticsExtractionComponent()
Definition: nnet-general-component.cc:354

kaldi::ReadIntegerPairVector
void ReadIntegerPairVector(std::istream &is, bool binary, std::vector< std::pair< T, T > > *v)
Function for reading STL vector of pairs of integer types.
Definition: io-funcs-inl.h:131

kaldi::nnet3::ConstantComponent::InitFromConfig
virtual void InitFromConfig(ConfigLine *cfl)
Initialize, from a ConfigLine object.
Definition: nnet-general-component.cc:1365

kaldi::nnet3::BackpropTruncationComponent::ZeroStats
virtual void ZeroStats()
Components that provide an implementation of StoreStats should also provide an implementation of Zero...
Definition: nnet-general-component.cc:1182

kaldi::nnet3::BackpropTruncationComponent::Add
virtual void Add(BaseFloat alpha, const Component &other)
This virtual function when called by – an UpdatableComponent adds the parameters of another updatabl...
Definition: nnet-general-component.cc:1198

kaldi::nnet3::StatisticsExtractionComponentPrecomputedIndexes::backward_indexes
CuArray< int32 > backward_indexes
Definition: nnet-general-component.h:292

kaldi::nnet3::SpecAugmentTimeMaskComponentPrecomputedIndexes::tot_size
int32 tot_size
Definition: nnet-general-component.h:1097

kaldi::nnet3::GeneralDropoutComponent::Backprop
virtual void Backprop(const std::string &debug_info, const ComponentPrecomputedIndexes *indexes, const CuMatrixBase< BaseFloat > &, const CuMatrixBase< BaseFloat > &, const CuMatrixBase< BaseFloat > &out_deriv, void *memo, Component *to_update, CuMatrixBase< BaseFloat > *in_deriv) const
Backprop function; depending on which of the arguments 'to_update' and 'in_deriv' are non-NULL...
Definition: nnet-general-component.cc:1596

kaldi::CuSubVector
Definition: matrix-common.h:73

kaldi::nnet3::Index
struct Index is intended to represent the various indexes by which we number the rows of the matrices...
Definition: nnet-common.h:44

kaldi::nnet3::ConstantComponent::Propagate
virtual void * Propagate(const ComponentPrecomputedIndexes *indexes, const CuMatrixBase< BaseFloat > &in, CuMatrixBase< BaseFloat > *out) const
Propagate function.
Definition: nnet-general-component.cc:1233

kaldi::nnet3::GeneralDropoutComponent::Read
virtual void Read(std::istream &is, bool binary)
Read function (used after we know the type of the Component); accepts input that is missing the token...
Definition: nnet-general-component.cc:1636

kaldi::CuMatrixBase::CopyColFromVec
void CopyColFromVec(const CuVectorBase< Real > &v, const MatrixIndexT col)
Copy vector into specific column of matrix.
Definition: cu-matrix.cc:2414

kaldi::nnet3::ConstantComponent::PerturbParams
virtual void PerturbParams(BaseFloat stddev)
This function is to be used in testing.
Definition: nnet-general-component.cc:1350

kaldi::nnet3::BackpropTruncationComponent::InitFromConfig
virtual void InitFromConfig(ConfigLine *cfl)
Initialize, from a ConfigLine object.
Definition: nnet-general-component.cc:1020

kaldi::nnet3::SpecAugmentTimeMaskComponent
SpecAugmentTimeMaskComponent implements the time part of SpecAugment.
Definition: nnet-general-component.h:1017

kaldi::nnet3::StatisticsExtractionComponent::GetInputIndexes
virtual void GetInputIndexes(const MiscComputationInfo &misc_info, const Index &output_index, std::vector< Index > *desired_indexes) const
This function only does something interesting for non-simple Components.
Definition: nnet-general-component.cc:430

kaldi::ExpectOneOrTwoTokens
void ExpectOneOrTwoTokens(std::istream &is, bool binary, const std::string &token1, const std::string &token2)
This function is like ExpectToken but for two tokens, and it will either accept token1 and then token...
Definition: text-utils.cc:536

kaldi::nnet3::StatisticsPoolingComponent::Propagate
virtual void * Propagate(const ComponentPrecomputedIndexes *indexes, const CuMatrixBase< BaseFloat > &in, CuMatrixBase< BaseFloat > *out) const
Propagate function.
Definition: nnet-general-component.cc:777

kaldi::nnet3::SpecAugmentTimeMaskComponent::Backprop
virtual void Backprop(const std::string &debug_info, const ComponentPrecomputedIndexes *indexes, const CuMatrixBase< BaseFloat > &, const CuMatrixBase< BaseFloat > &, const CuMatrixBase< BaseFloat > &out_deriv, void *memo, Component *to_update, CuMatrixBase< BaseFloat > *in_deriv) const
Backprop function; depending on which of the arguments 'to_update' and 'in_deriv' are non-NULL...
Definition: nnet-general-component.cc:1931

kaldi::SameDim
bool SameDim(const MatrixBase< Real > &M, const MatrixBase< Real > &N)
Definition: kaldi-matrix.h:1111

kaldi::nnet3::Index::x
int32 x
Definition: nnet-common.h:47

kaldi::nnet3::SpecAugmentTimeMaskComponent::Copy
virtual Component * Copy() const
Copies component (deep copy).
Definition: nnet-general-component.cc:1989

kaldi::nnet3::GeneralDropoutComponent::GetMemo
CuMatrix< BaseFloat > * GetMemo(int32 num_mask_rows) const
Definition: nnet-general-component.cc:1739

kaldi::nnet3::StatisticsPoolingComponent::Type
virtual std::string Type() const
Returns a string such as "SigmoidComponent", describing the type of the object.
Definition: nnet-general-component.h:350

kaldi::CuMatrixBase::Scale
void Scale(Real value)
Definition: cu-matrix.cc:644

kaldi::nnet3::GeneralDropoutComponent::InitFromConfig
virtual void InitFromConfig(ConfigLine *cfl)
Initialize, from a ConfigLine object.
Definition: nnet-general-component.cc:1703

kaldi::nnet3::ConstantComponent::DotProduct
virtual BaseFloat DotProduct(const UpdatableComponent &other) const
Computes dot-product between parameters of two instances of a Component.
Definition: nnet-general-component.cc:1356

kaldi::nnet3::StatisticsPoolingComponent::InitFromConfig
virtual void InitFromConfig(ConfigLine *cfl)
Initialize, from a ConfigLine object.
Definition: nnet-general-component.cc:555

kaldi::ConfigLine::UnusedValues
std::string UnusedValues() const
returns e.g.
Definition: text-utils.cc:518

kaldi::VectorBase::CopyFromVec
void CopyFromVec(const VectorBase< Real > &v)
Copy data from another vector (must match own size).
Definition: kaldi-vector.cc:228

kaldi::nnet3::ConstantComponent
Definition: nnet-general-component.h:628

kaldi::nnet3::SpecAugmentTimeMaskComponent::SpecAugmentTimeMaskComponent
SpecAugmentTimeMaskComponent()
Definition: nnet-general-component.cc:1898

kaldi::nnet3::BackpropTruncationComponent::Read
virtual void Read(std::istream &is, bool binary)
Read function (used after we know the type of the Component); accepts input that is missing the token...
Definition: nnet-general-component.cc:898

kaldi::nnet3::BackpropTruncationComponent::Propagate
virtual void * Propagate(const ComponentPrecomputedIndexes *indexes, const CuMatrixBase< BaseFloat > &in, CuMatrixBase< BaseFloat > *out) const
Propagate function.
Definition: nnet-general-component.cc:1094

kaldi::ReadIntegerVector
void ReadIntegerVector(std::istream &is, bool binary, std::vector< T > *v)
Function for reading STL vector of integer types.
Definition: io-funcs-inl.h:232

kaldi::nnet3::ExpectToken
static void ExpectToken(const std::string &token, const std::string &what_we_are_parsing, const std::string **next_token)
Definition: nnet-descriptor.cc:45

kaldi::nnet3::BackpropTruncationComponentPrecomputedIndexes::Write
virtual void Write(std::ostream &ostream, bool binary) const
Definition: nnet-general-component.cc:957

kaldi::nnet3::StatisticsPoolingComponentPrecomputedIndexes::forward_indexes
CuArray< Int32Pair > forward_indexes
Definition: nnet-general-component.h:437

float

kaldi::nnet3::SpecAugmentTimeMaskComponent::zeroed_proportion_
BaseFloat zeroed_proportion_
Definition: nnet-general-component.h:1073

kaldi::nnet3::SpecAugmentTimeMaskComponent::time_mask_max_frames_
int32 time_mask_max_frames_
Definition: nnet-general-component.h:1075

kaldi::nnet3::StatisticsPoolingComponent::require_direct_input_
bool require_direct_input_
Definition: nnet-general-component.h:425

kaldi::nnet3::StatisticsPoolingComponentPrecomputedIndexes::backward_indexes
CuArray< Int32Pair > backward_indexes
Definition: nnet-general-component.h:446

kaldi::CuMatrixBase::Add
void Add(Real value)
Definition: cu-matrix.cc:582

kaldi::nnet3::StatisticsExtractionComponentPrecomputedIndexes::forward_indexes
CuArray< Int32Pair > forward_indexes
Definition: nnet-general-component.h:282

kaldi::nnet3::DropoutMaskComponent::continuous_
bool continuous_
Definition: nnet-general-component.h:794

kaldi::nnet3::DropoutMaskComponent::Type
virtual std::string Type() const
Returns a string such as "SigmoidComponent", describing the type of the object.
Definition: nnet-general-component.h:745

kaldi::nnet3::StatisticsPoolingComponent::num_log_count_features_
int32 num_log_count_features_
Definition: nnet-general-component.h:417

kaldi::nnet3::RandomComponent::test_mode_
bool test_mode_
Definition: nnet-component-itf.h:426

kaldi::CuMatrixBase::SetZero
void SetZero()
Math operations, some calling kernels.
Definition: cu-matrix.cc:509

kaldi::nnet3::BackpropTruncationComponent::Write
virtual void Write(std::ostream &os, bool binary) const
Write component to stream.
Definition: nnet-general-component.cc:932

kaldi::nnet3::SpecAugmentTimeMaskComponent::Info
virtual std::string Info() const
Returns some text-form information about this component, for diagnostics.
Definition: nnet-general-component.cc:1889

kaldi::nnet3::BackpropTruncationComponent::Backprop
virtual void Backprop(const std::string &debug_info, const ComponentPrecomputedIndexes *indexes, const CuMatrixBase< BaseFloat > &, const CuMatrixBase< BaseFloat > &, const CuMatrixBase< BaseFloat > &out_deriv, void *memo, Component *to_update, CuMatrixBase< BaseFloat > *in_deriv) const
Backprop function; depending on which of the arguments 'to_update' and 'in_deriv' are non-NULL...
Definition: nnet-general-component.cc:1105

kaldi::CuMatrixBase::MulRows
void MulRows(const CuMatrixBase< Real > &src, const CuArrayBase< MatrixIndexT > &indexes)
Does for each row r, this.Row(r) *= alpha * src.row(indexes[r]), where '*=' is elementwise multiplica...
Definition: cu-matrix.cc:2790

kaldi::CuMatrixBase::MulElements
void MulElements(const CuMatrixBase< Real > &A)
Multiply two matrices elementwise: C = C .* A.
Definition: cu-matrix.cc:667

nnet-computation-graph.h

kaldi::nnet3::BackpropTruncationComponent
Definition: nnet-general-component.h:466

kaldi::nnet3::GeneralDropoutComponent::PrecomputeIndexes
virtual ComponentPrecomputedIndexes * PrecomputeIndexes(const MiscComputationInfo &misc_info, const std::vector< Index > &input_indexes, const std::vector< Index > &output_indexes, bool need_backprop) const
This function must return NULL for simple Components.
Definition: nnet-general-component.cc:1810

kaldi::nnet3::BackpropTruncationComponent::Scale
virtual void Scale(BaseFloat scale)
This virtual function when called on – an UpdatableComponent scales the parameters by "scale" when c...
Definition: nnet-general-component.cc:1190

kaldi::CuMatrixBase::CopyRows
void CopyRows(const CuMatrixBase< Real > &src, const CuArrayBase< MatrixIndexT > &indexes)
Copies row r from row indexes[r] of src.
Definition: cu-matrix.cc:2678

kaldi::nnet3::UpdatableComponent::learning_rate_
BaseFloat learning_rate_
learning rate (typically 0.0..0.01)
Definition: nnet-component-itf.h:559

kaldi::nnet3::StatisticsPoolingComponent::variance_floor_
BaseFloat variance_floor_
Definition: nnet-general-component.h:419

rnnlm::n
struct rnnlm::@11::@12 n

kaldi::nnet3::StatisticsExtractionComponentPrecomputedIndexes::counts
CuVector< BaseFloat > counts
Definition: nnet-general-component.h:287

kaldi::nnet3::ConstantComponent::ConsolidateMemory
virtual void ConsolidateMemory()
This virtual function relates to memory management, and avoiding fragmentation.
Definition: nnet-general-component.cc:1397

kaldi::nnet3::DropoutMaskComponent
Definition: nnet-general-component.h:722

kaldi::nnet3::GeneralDropoutComponent::block_dim_
int32 block_dim_
Definition: nnet-general-component.h:937

KALDI_ERR
#define KALDI_ERR
Definition: kaldi-error.h:147

kaldi::kNoTrans
Definition: matrix-common.h:34

kaldi::nnet3::ConstantComponent::NumParameters
virtual int32 NumParameters() const
The following new virtual function returns the total dimension of the parameters in this class...
Definition: nnet-general-component.cc:1384

kaldi::nnet3::OnlineNaturalGradient::PreconditionDirections
void PreconditionDirections(CuMatrixBase< BaseFloat > *X, BaseFloat *scale)
This call implements the main functionality of this class.
Definition: natural-gradient-online.cc:159

kaldi::nnet3::ConstantComponent::Scale
virtual void Scale(BaseFloat scale)
This virtual function when called on – an UpdatableComponent scales the parameters by "scale" when c...
Definition: nnet-general-component.cc:1331

kaldi::nnet3::ConstantComponent::is_updatable_
bool is_updatable_
Definition: nnet-general-component.h:702

kaldi::nnet3::GeneralDropoutComponent::Info
virtual std::string Info() const
Returns some text-form information about this component, for diagnostics.
Definition: nnet-general-component.cc:1529

kaldi::nnet3::BackpropTruncationComponent::Info
virtual std::string Info() const
Returns some text-form information about this component, for diagnostics.
Definition: nnet-general-component.cc:981

kaldi::nnet3::UpdatableComponent::learning_rate_factor_
BaseFloat learning_rate_factor_
learning rate factor (normally 1.0, but can be set to another value so that when you call SetLear...
Definition: nnet-component-itf.h:560

kaldi::CuSubMatrix
This class is used for a piece of a CuMatrix.
Definition: matrix-common.h:70

kaldi::nnet3::StatisticsExtractionComponentPrecomputedIndexes::Read
virtual void Read(std::istream &is, bool binary)
Definition: nnet-general-component.cc:272

kaldi::CuVectorBase::ApplyExp
void ApplyExp()
Definition: cu-vector.cc:442

kaldi::WriteToken
void WriteToken(std::ostream &os, bool binary, const char *token)
The WriteToken functions are for writing nonempty sequences of non-space characters.
Definition: io-funcs.cc:134

kaldi::nnet3::IndexLessNxt
Definition: nnet-common.h:90

kaldi::nnet3::StatisticsExtractionComponentPrecomputedIndexes::Write
virtual void Write(std::ostream &os, bool binary) const
Definition: nnet-general-component.cc:257

nnet-parse.h

kaldi::VectorBase::Scale
void Scale(Real alpha)
Multiplies all elements by this constant.
Definition: kaldi-vector.cc:963

kaldi::PeekToken
int PeekToken(std::istream &is, bool binary)
PeekToken will return the first character of the next token, or -1 if end of file.
Definition: io-funcs.cc:170

kaldi::nnet3::OnlineNaturalGradient::Swap
void Swap(OnlineNaturalGradient *other)
Definition: natural-gradient-online.cc:628

kaldi::VectorBase::Sum
Real Sum() const
Returns sum of the elements.
Definition: kaldi-vector.cc:688

kaldi::VectorBase::SetRandn
void SetRandn()
Set vector to random normally-distributed noise.
Definition: kaldi-vector.cc:301

kaldi::nnet3::StatisticsPoolingComponent::StatisticsPoolingComponent
StatisticsPoolingComponent()
Definition: nnet-general-component.cc:575

kaldi::nnet3::StatisticsExtractionComponent::Read
virtual void Read(std::istream &is, bool binary)
Read function (used after we know the type of the Component); accepts input that is missing the token...
Definition: nnet-general-component.cc:503

kaldi::nnet3::BackpropTruncationComponent::count_zeroing_boundaries_
double count_zeroing_boundaries_
Definition: nnet-general-component.h:563

kaldi::nnet3::UpdatableComponent
Class UpdatableComponent is a Component which has trainable parameters; it extends the interface of C...
Definition: nnet-component-itf.h:455

kaldi::CuVectorBase::SetRandn
void SetRandn()
Definition: cu-vector.cc:281

kaldi::nnet3::SpecAugmentTimeMaskComponentPrecomputedIndexes::Write
virtual void Write(std::ostream &os, bool binary) const
Definition: nnet-general-component.cc:2094

kaldi::nnet3::GeneralDropoutComponent::specaugment_max_regions_
int32 specaugment_max_regions_
Definition: nnet-general-component.h:949

kaldi::nnet3::StatisticsExtractionComponent::IsComputable
virtual bool IsComputable(const MiscComputationInfo &misc_info, const Index &output_index, const IndexSet &input_index_set, std::vector< Index > *used_inputs) const
This function only does something interesting for non-simple Components, and it exists to make it pos...
Definition: nnet-general-component.cc:398

kaldi::nnet3::StatisticsPoolingComponentPrecomputedIndexes::Read
virtual void Read(std::istream &is, bool binary)
Definition: nnet-general-component.cc:542

kaldi::CuMatrixBase::Data
const Real * Data() const
Return data pointer (const).
Definition: cu-matrix.h:746

rnnlm::i
int i
Definition: mikolov-rnnlm-lib.cc:66

kaldi::nnet3::GeneralDropoutComponentPrecomputedIndexes::num_mask_rows
int32 num_mask_rows
Definition: nnet-general-component.h:970

kaldi::nnet3::DistributeComponentPrecomputedIndexes::Write
virtual void Write(std::ostream &ostream, bool binary) const
Definition: nnet-general-component.cc:88

kaldi::nnet3::StatisticsExtractionComponent::Propagate
virtual void * Propagate(const ComponentPrecomputedIndexes *indexes, const CuMatrixBase< BaseFloat > &in, CuMatrixBase< BaseFloat > *out) const
Propagate function.
Definition: nnet-general-component.cc:448

kaldi::CuMatrixBase::ColRange
CuSubMatrix< Real > ColRange(const MatrixIndexT col_offset, const MatrixIndexT num_cols) const
Definition: cu-matrix.h:665

kaldi::nnet3::StatisticsExtractionComponent::InitFromConfig
virtual void InitFromConfig(ConfigLine *cfl)
Initialize, from a ConfigLine object.
Definition: nnet-general-component.cc:367

kaldi::nnet3::BackpropTruncationComponent::num_zeroed_
double num_zeroed_
Definition: nnet-general-component.h:561

kaldi::nnet3::StatisticsPoolingComponent::input_period_
int32 input_period_
Definition: nnet-general-component.h:414

kaldi::nnet3::GeneralDropoutComponent
GeneralDropoutComponent implements dropout, including a continuous variant where the thing we multipl...
Definition: nnet-general-component.h:875

kaldi::nnet3::GeneralDropoutComponentPrecomputedIndexes::Write
virtual void Write(std::ostream &os, bool binary) const
Definition: nnet-general-component.cc:1865

kaldi::nnet3::StatisticsExtractionComponent::OutputDim
virtual int32 OutputDim() const
Returns output-dimension of this component.
Definition: nnet-general-component.h:210

kaldi::nnet3::ConstantComponent::UnVectorize
virtual void UnVectorize(const VectorBase< BaseFloat > &params)
Converts the parameters from vector form.
Definition: nnet-general-component.cc:1393

kaldi::nnet3::ConstantComponent::output_
CuVector< BaseFloat > output_
Definition: nnet-general-component.h:700

kaldi::CuMatrixBase
Matrix for CUDA computing.
Definition: matrix-common.h:69

kaldi::nnet3::StatisticsPoolingComponent::input_dim_
int32 input_dim_
Definition: nnet-general-component.h:413

kaldi::nnet3::DistributeComponent::Propagate
virtual void * Propagate(const ComponentPrecomputedIndexes *indexes, const CuMatrixBase< BaseFloat > &in, CuMatrixBase< BaseFloat > *out) const
Propagate function.
Definition: nnet-general-component.cc:180

kaldi::CuMatrixBase::NumCols
MatrixIndexT NumCols() const
Definition: cu-matrix.h:216

kaldi::nnet3::DropoutMaskComponent::Propagate
virtual void * Propagate(const ComponentPrecomputedIndexes *indexes, const CuMatrixBase< BaseFloat > &in, CuMatrixBase< BaseFloat > *out) const
Propagate function.
Definition: nnet-general-component.cc:1421

kaldi::nnet3::ComponentPrecomputedIndexes
Definition: nnet-component-itf.h:97

kaldi::nnet3::DistributeComponent::PrecomputeIndexes
virtual ComponentPrecomputedIndexes * PrecomputeIndexes(const MiscComputationInfo &misc_info, const std::vector< Index > &input_indexes, const std::vector< Index > &output_indexes, bool need_backprop) const
This function must return NULL for simple Components.
Definition: nnet-general-component.cc:102

kaldi::Vector
A class representing a vector.
Definition: kaldi-vector.h:406

kaldi::nnet3::StatisticsPoolingComponent::GetInputIndexes
virtual void GetInputIndexes(const MiscComputationInfo &misc_info, const Index &output_index, std::vector< Index > *desired_indexes) const
This function only does something interesting for non-simple Components.
Definition: nnet-general-component.cc:654

kaldi::nnet3::StatisticsPoolingComponent::ReorderIndexes
virtual void ReorderIndexes(std::vector< Index > *input_indexes, std::vector< Index > *output_indexes) const
This function only does something interesting for non-simple Components.
Definition: nnet-general-component.cc:645

kaldi::nnet3::DropoutMaskComponent::Read
virtual void Read(std::istream &is, bool binary)
Read function (used after we know the type of the Component); accepts input that is missing the token...
Definition: nnet-general-component.cc:1478

kaldi::ConfigLine
This class is responsible for parsing input like hi-there xx=yyy a=b c empty= f-oo=Append(bar, sss) ba_z=123 bing='a b c' baz="a b c d='a b' e" and giving you access to the fields, in this case.
Definition: text-utils.h:205

kaldi::nnet3::BackpropTruncationComponent::clipping_threshold_
BaseFloat clipping_threshold_
Definition: nnet-general-component.h:536

kaldi::nnet3::DistributeComponent::Read
virtual void Read(std::istream &is, bool binary)
Read function (used after we know the type of the Component); accepts input that is missing the token...
Definition: nnet-general-component.cc:248

kaldi::nnet3::UpdatableComponent::Info
virtual std::string Info() const
Returns some text-form information about this component, for diagnostics.
Definition: nnet-component-itf.cc:333

kaldi::nnet3::UpdatableComponent::is_gradient_
bool is_gradient_
True if this component is to be treated as a gradient rather than as parameters.
Definition: nnet-component-itf.h:566

kaldi::nnet3::StatisticsExtractionComponent::PrecomputeIndexes
virtual ComponentPrecomputedIndexes * PrecomputeIndexes(const MiscComputationInfo &misc_info, const std::vector< Index > &input_indexes, const std::vector< Index > &output_indexes, bool need_backprop) const
This function must return NULL for simple Components.
Definition: nnet-general-component.cc:289

kaldi::CuArray< Int32Pair >

KALDI_ASSERT
#define KALDI_ASSERT(cond)
Definition: kaldi-error.h:185

kaldi::nnet3::UpdatableComponent::WriteUpdatableCommon
void WriteUpdatableCommon(std::ostream &is, bool binary) const
Definition: nnet-component-itf.cc:306

kaldi::nnet3::DistributeComponent::GetInputIndexes
virtual void GetInputIndexes(const MiscComputationInfo &misc_info, const Index &output_index, std::vector< Index > *desired_indexes) const
This function only does something interesting for non-simple Components.
Definition: nnet-general-component.cc:63

kaldi::nnet3::DistributeComponent::Init
void Init(int32 input_dim, int32 output_dim)
Definition: nnet-general-component.cc:221

NVTX_RANGE
#define NVTX_RANGE(name)
Definition: cu-common.h:143

kaldi::nnet3::ConstantComponent::Read
virtual void Read(std::istream &is, bool binary)
Read function (used after we know the type of the Component); accepts input that is missing the token...
Definition: nnet-general-component.cc:1275

kaldi::CuVectorBase::Data
Real * Data()
Returns a pointer to the start of the vector's data.
Definition: cu-vector.h:72

kaldi::CuVectorBase::Scale
void Scale(Real value)
Definition: cu-vector.cc:1216

kaldi::WriteIntegerVector
void WriteIntegerVector(std::ostream &os, bool binary, const std::vector< T > &v)
Function for writing STL vectors of integer types.
Definition: io-funcs-inl.h:198

kaldi::ConfigLine::HasUnusedValues
bool HasUnusedValues() const
Definition: text-utils.cc:510

kaldi::ConfigLine::GetValue
bool GetValue(const std::string &key, std::string *value)
Definition: text-utils.cc:427

kaldi::nnet3::ConstantComponent::preconditioner_
OnlineNaturalGradient preconditioner_
Definition: nnet-general-component.h:705

kaldi::WriteBasicType
void WriteBasicType(std::ostream &os, bool binary, T t)
WriteBasicType is the name of the write function for bool, integer types, and floating-point types...
Definition: io-funcs-inl.h:34

kaldi::nnet3::ConstantComponent::Write
virtual void Write(std::ostream &os, bool binary) const
Write component to stream.
Definition: nnet-general-component.cc:1316

kaldi::nnet3::BackpropTruncationComponent::dim_
int32 dim_
Definition: nnet-general-component.h:527

kaldi::nnet3::DropoutMaskComponent::output_dim_
int32 output_dim_
Definition: nnet-general-component.h:790

Int32Pair
Definition: cu-matrixdim.h:78

kaldi::nnet3::GeneralDropoutComponent::Propagate
virtual void * Propagate(const ComponentPrecomputedIndexes *indexes, const CuMatrixBase< BaseFloat > &in, CuMatrixBase< BaseFloat > *out) const
Propagate function.
Definition: nnet-general-component.cc:1562

kaldi::nnet3::DistributeComponentPrecomputedIndexes::Read
virtual void Read(std::istream &istream, bool binary)
Definition: nnet-general-component.cc:95

kaldi::nnet3::DistributeComponent::output_dim_
int32 output_dim_
Definition: nnet-general-component.h:129

kaldi::nnet3::BackpropTruncationComponentPrecomputedIndexes::zeroing
CuVector< BaseFloat > zeroing
Definition: nnet-general-component.h:577

Int32Pair::second
int32_cuda second
Definition: cu-matrixdim.h:80

kaldi::CuMatrixBase::CopyToRows
void CopyToRows(const CuArrayBase< Real *> &dst) const
For each row r of this matrix, copies it to the array of floats at the location given by dst[r]...
Definition: cu-matrix.cc:2744

kaldi::nnet3::ConstantComponent::Backprop
virtual void Backprop(const std::string &debug_info, const ComponentPrecomputedIndexes *indexes, const CuMatrixBase< BaseFloat > &, const CuMatrixBase< BaseFloat > &, const CuMatrixBase< BaseFloat > &out_deriv, void *memo, Component *to_update, CuMatrixBase< BaseFloat > *in_deriv) const
Backprop function; depending on which of the arguments 'to_update' and 'in_deriv' are non-NULL...
Definition: nnet-general-component.cc:1241

kaldi::nnet3::DropoutMaskComponent::Copy
virtual Component * Copy() const
Copies component (deep copy).
Definition: nnet-general-component.cc:1512

kaldi::nnet3::PrintParameterStats
void PrintParameterStats(std::ostringstream &os, const std::string &name, const CuVectorBase< BaseFloat > &params, bool include_mean)
Print to 'os' some information about the mean and standard deviation of some parameters, used in Info() functions in nnet-simple-component.cc.
Definition: nnet-parse.cc:157

kaldi::nnet3::StatisticsPoolingComponent::PrecomputeIndexes
virtual ComponentPrecomputedIndexes * PrecomputeIndexes(const MiscComputationInfo &misc_info, const std::vector< Index > &input_indexes, const std::vector< Index > &output_indexes, bool need_backprop) const
This function must return NULL for simple Components.
Definition: nnet-general-component.cc:708

kaldi::nnet3::StatisticsExtractionComponent::Write
virtual void Write(std::ostream &os, bool binary) const
Write component to stream.
Definition: nnet-general-component.cc:517

kaldi::nnet3::Index::t
int32 t
Definition: nnet-common.h:46

kaldi::nnet3::StatisticsExtractionComponent::input_period_
int32 input_period_
Definition: nnet-general-component.h:271

kaldi::nnet3::BackpropTruncationComponent::Copy
virtual Component * Copy() const
Copies component (deep copy).
Definition: nnet-general-component.cc:1042

kaldi::nnet3::DropoutMaskComponent::DropoutMaskComponent
DropoutMaskComponent()
Definition: nnet-general-component.cc:1412

kaldi::CuMatrixBase::NumRows
MatrixIndexT NumRows() const
Dimensions.
Definition: cu-matrix.h:215

kaldi::VectorBase
Provides a vector abstraction class.
Definition: kaldi-vector.h:41

kaldi::VectorBase::Add
void Add(Real c)
Add a constant to each element of a vector.
Definition: kaldi-vector.cc:956

kaldi::CuArrayBase::Dim
MatrixIndexT Dim() const
Return the vector dimension.
Definition: cu-array.h:49

kaldi::nnet3::StatisticsPoolingComponent
Definition: nnet-general-component.h:337

kaldi::nnet3::ConstantComponent::Type
virtual std::string Type() const
Returns a string such as "SigmoidComponent", describing the type of the object.
Definition: nnet-general-component.h:647

kaldi::nnet3::DistributeComponentPrecomputedIndexes::pairs
std::vector< std::pair< int32, int32 > > pairs
Definition: nnet-general-component.h:140

kaldi::nnet3::GeneralDropoutComponent::specaugment_max_proportion_
BaseFloat specaugment_max_proportion_
Definition: nnet-general-component.h:947

kaldi::nnet3::DistributeComponentPrecomputedIndexes
Definition: nnet-general-component.h:133

kaldi::VecVec
Real VecVec(const VectorBase< Real > &a, const VectorBase< Real > &b)
Returns dot product between v1 and v2.
Definition: kaldi-vector.cc:37

kaldi::nnet3::ConstantComponent::Info
virtual std::string Info() const
Returns some text-form information about this component, for diagnostics.
Definition: nnet-general-component.cc:1210

kaldi::CuMatrixBase::Set
void Set(Real value)
Definition: cu-matrix.cc:531

kaldi::nnet3::RandomComponent::random_generator_
CuRand< BaseFloat > random_generator_
Definition: nnet-component-itf.h:422

kaldi::CuMatrixBase::MulRowsVec
void MulRowsVec(const CuVectorBase< Real > &scale)
scale i'th row by scale[i]
Definition: cu-matrix.cc:792

kaldi::nnet3::GeneralDropoutComponent::Copy
virtual Component * Copy() const
Copies component (deep copy).
Definition: nnet-general-component.cc:1699

kaldi::nnet3::GeneralDropoutComponent::Write
virtual void Write(std::ostream &os, bool binary) const
Write component to stream.
Definition: nnet-general-component.cc:1674

kaldi::nnet3::StatisticsExtractionComponent::Backprop
virtual void Backprop(const std::string &debug_info, const ComponentPrecomputedIndexes *indexes, const CuMatrixBase< BaseFloat > &in_value, const CuMatrixBase< BaseFloat > &out_value, const CuMatrixBase< BaseFloat > &out_deriv, void *memo, Component *, CuMatrixBase< BaseFloat > *in_deriv) const
Backprop function; depending on which of the arguments 'to_update' and 'in_deriv' are non-NULL...
Definition: nnet-general-component.cc:477

kaldi::SubVector
Represents a non-allocating general vector which can be defined as a sub-vector of higher-level vector...
Definition: kaldi-vector.h:501

kaldi::nnet3::DistributeComponent::ComputeInputPointers
void ComputeInputPointers(const ComponentPrecomputedIndexes *indexes, const CuMatrixBase< BaseFloat > &in, int32 num_output_rows, std::vector< const BaseFloat *> *input_pointers) const
Definition: nnet-general-component.cc:134

nnet-general-component.h
This file contains declarations of components that are not "simple", meaning they care about the indexes...

kaldi::nnet3::StatisticsPoolingComponentPrecomputedIndexes::Write
virtual void Write(std::ostream &os, bool binary) const
Definition: nnet-general-component.cc:530

kaldi::nnet3::StatisticsExtractionComponent::Check
void Check() const
Definition: nnet-general-component.cc:383

kaldi::nnet3::BackpropTruncationComponent::num_clipped_
double num_clipped_
Definition: nnet-general-component.h:560

kaldi::nnet3::DropoutMaskComponent::InitFromConfig
virtual void InitFromConfig(ConfigLine *cfl)
Initialize, from a ConfigLine object.
Definition: nnet-general-component.cc:1516

kaldi::nnet3::StatisticsExtractionComponent::Type
virtual std::string Type() const
Returns a string such as "SigmoidComponent", describing the type of the object.
Definition: nnet-general-component.h:215

kaldi::nnet3::StatisticsPoolingComponent::Backprop
virtual void Backprop(const std::string &debug_info, const ComponentPrecomputedIndexes *indexes, const CuMatrixBase< BaseFloat > &in_value, const CuMatrixBase< BaseFloat > &out_value, const CuMatrixBase< BaseFloat > &out_deriv, void *memo, Component *, CuMatrixBase< BaseFloat > *in_deriv) const
Backprop function; depending on which of the arguments 'to_update' and 'in_deriv' are non-NULL...
Definition: nnet-general-component.cc:826

kaldi::MatrixBase::Set
void Set(Real)
Sets all elements to a specific value.
Definition: kaldi-matrix.cc:1339

kaldi::RandInt
int32 RandInt(int32 min_val, int32 max_val, struct RandomState *state)
Definition: kaldi-math.cc:95

kaldi::nnet3::GeneralDropoutComponent::GeneralDropoutComponent
GeneralDropoutComponent()
Definition: nnet-general-component.cc:1545

kaldi::nnet3::GeneralDropoutComponent::time_period_
int32 time_period_
Definition: nnet-general-component.h:943

kaldi::PairHasher
A hashing function-object for pairs of ints.
Definition: stl-utils.h:235

kaldi::nnet3::StatisticsExtractionComponentPrecomputedIndexes
Definition: nnet-general-component.h:276

Int32Pair::first
int32_cuda first
Definition: cu-matrixdim.h:79