doc/nnet-convolutional-component_8cc_source.html

 // nnet3/nnet-convolutional-component.cc

 // Copyright      2017  Johns Hopkins University (author: Daniel Povey)

 // See ../../COPYING for clarification regarding multiple authors
 //
 // Licensed under the Apache License, Version 2.0 (the "License");
 // you may not use this file except in compliance with the License.
 // You may obtain a copy of the License at
 //
 //  http://www.apache.org/licenses/LICENSE-2.0
 //
 // THIS CODE IS PROVIDED *AS IS* BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY
 // KIND, EITHER EXPRESS OR IMPLIED, INCLUDING WITHOUT LIMITATION ANY IMPLIED
 // WARRANTIES OR CONDITIONS OF TITLE, FITNESS FOR A PARTICULAR PURPOSE,
 // MERCHANTABLITY OR NON-INFRINGEMENT.
 // See the Apache 2 License for the specific language governing permissions and
 // limitations under the License.

 #include <iterator>
 #include <sstream>
 #include <iomanip>
 #include "nnet3/nnet-convolutional-component.h"
 #include "nnet3/nnet-computation-graph.h"
 #include "nnet3/nnet-parse.h"

 namespace kaldi {
 namespace nnet3 {


 // Default constructor.  Only the scalar members are given values here; the
 // model description and the parameters are set later by InitFromConfig() or
 // Read().  max_memory_mb_ gets the same default that InitFromConfig() uses
 // (200.0) so that Info() and Write() never read an indeterminate value from
 // a default-constructed object.
 TimeHeightConvolutionComponent::TimeHeightConvolutionComponent():
     max_memory_mb_(200.0),
     use_natural_gradient_(true) { }

 // Copy constructor.  Duplicates the base-class state, the convolution model,
 // the derived time-offset tables, the parameters, the memory limit and both
 // preconditioner objects, and then runs Check() on the new object.
 TimeHeightConvolutionComponent::TimeHeightConvolutionComponent(
     const TimeHeightConvolutionComponent &other)
     : UpdatableComponent(other),
       // structural description and the quantities derived from it.
       model_(other.model_),
       all_time_offsets_(other.all_time_offsets_),
       time_offset_required_(other.time_offset_required_),
       // trainable parameters.
       linear_params_(other.linear_params_),
       bias_params_(other.bias_params_),
       // options.
       max_memory_mb_(other.max_memory_mb_),
       use_natural_gradient_(other.use_natural_gradient_),
       // natural-gradient state.
       preconditioner_in_(other.preconditioner_in_),
       preconditioner_out_(other.preconditioner_out_)
 {
   Check();
 }


 // Sanity check on this object: the convolution model must be valid, and the
 // shapes of the bias vector and the filter matrix must agree with it.  Fails
 // with an assertion otherwise.
 void TimeHeightConvolutionComponent::Check() const {
   // ConvolutionModel::Check() signals a problem through its boolean return
   // value, so the result must be tested rather than discarded.  The flags
   // (check_heights_used=false, allow_height_padding=true) are the ones
   // InitFromConfig() treats as a hard error; unused input heights only
   // produce a warning there, so they are not treated as fatal here either.
   KALDI_ASSERT(model_.Check(false, true));
   KALDI_ASSERT(bias_params_.Dim() == model_.num_filters_out &&
                linear_params_.NumRows() == model_.ParamRows() &&
                linear_params_.NumCols() == model_.ParamCols());
 }

 // Returns the input dimension, as reported by the convolution model.
 int32 TimeHeightConvolutionComponent::InputDim() const {
   const int32 input_dim = model_.InputDim();
   return input_dim;
 }

 // Returns the output dimension, as reported by the convolution model.
 int32 TimeHeightConvolutionComponent::OutputDim() const {
   const int32 output_dim = model_.OutputDim();
   return output_dim;
 }

 // Returns a one-line, human-readable summary of this component: the
 // base-class info, the model info, statistics of the parameters, and the
 // memory / natural-gradient settings.
 std::string TimeHeightConvolutionComponent::Info() const {
   std::ostringstream os;
   // model_.Info() is appended directly after the generic updatable-component
   // info, separated by a single space.
   os << UpdatableComponent::Info() << ' ' << model_.Info();
   PrintParameterStats(os, "filter-params", linear_params_);
   PrintParameterStats(os, "bias-params", bias_params_, true);
   os << ", num-params=" << NumParameters();
   os << ", max-memory-mb=" << max_memory_mb_;
   os << ", use-natural-gradient=" << use_natural_gradient_;
   if (!use_natural_gradient_)
     return os.str();

   // The natural-gradient settings are only reported when it is enabled.
   os << ", num-minibatches-history="
      << preconditioner_in_.GetNumMinibatchesHistory();
   os << ", rank-in=" << preconditioner_in_.GetRank();
   os << ", rank-out=" << preconditioner_out_.GetRank();
   os << ", alpha=" << preconditioner_in_.GetAlpha();
   return os.str();
 }


 void TimeHeightConvolutionComponent::InitUnit() {
   if (model_.num_filters_in != model_.num_filters_out) {
     KALDI_ERR << "You cannot specify init-unit if the num-filters-in "
               << "and num-filters-out differ.";
   }
   size_t i;
   int32 zero_offset = 0;
   for (i = 0; i < model_.offsets.size(); i++) {
     if (model_.offsets[i].time_offset == 0 &&
         model_.offsets[i].height_offset == 0) {
       zero_offset = i;
       break;
     }
   }
   if (i == model_.offsets.size())  // did not break.
     KALDI_ERR << "You cannot specify init-unit if the model does "
               << "not have the offset (0, 0).";

   CuSubMatrix<BaseFloat> zero_offset_block(
       linear_params_, 0, linear_params_.NumRows(),
       zero_offset * model_.num_filters_in, model_.num_filters_in);

   KALDI_ASSERT(zero_offset_block.NumRows() == zero_offset_block.NumCols());
   zero_offset_block.AddToDiag(1.0);  // set this block to the unit matrix.
 }

 // Initializes this component from a config line.
 //
 // Values read from 'cfl':
 //   required:  num-filters-in, num-filters-out, height-in, height-out, and
 //              either 'offsets' (e.g. "-1,-1;-1,0;...;1,1", pairs of
 //              time,height) or both 'height-offsets' and 'time-offsets'
 //              (comma-separated, sorted, unique);
 //   optional:  required-time-offsets (default: all time offsets used),
 //              height-subsample-out (default 1), max-memory-mb (default 200),
 //              param-stddev (default 1/sqrt(num-filters-in * num-offsets)),
 //              bias-stddev (default 0), init-unit (default false),
 //              use-natural-gradient (default true), rank-in, rank-out
 //              (default min(80, (dim + 1) / 2)), alpha-in, alpha-out
 //              (default 4), num-minibatches-history (default 4);
 //   plus whatever InitLearningRatesFromConfig() reads.
 //
 // Reports an error through KALDI_ERR if required values are missing or if
 // the values are malformed or inconsistent.
 void TimeHeightConvolutionComponent::InitFromConfig(ConfigLine *cfl) {
   // 1. Config values inherited from UpdatableComponent.
   InitLearningRatesFromConfig(cfl);

   // 2. convolution-related config values.
   model_.height_subsample_out = 1;  // default.
   max_memory_mb_ = 200.0;
   // "undef" is a sentinel meaning that required-time-offsets was not given.
   std::string height_offsets, time_offsets, required_time_offsets = "undef",
       offsets;

   bool ok = cfl->GetValue("num-filters-in", &model_.num_filters_in) &&
       cfl->GetValue("num-filters-out", &model_.num_filters_out) &&
       cfl->GetValue("height-in", &model_.height_in) &&
       cfl->GetValue("height-out", &model_.height_out);
   if (!ok) {
     KALDI_ERR << "Bad initializer: expected all the values "
         "num-filters-in, num-filters-out, height-in, height-out, "
         "to be defined: "
               << cfl->WholeLine();
   }
   // some optional structural configs.
   cfl->GetValue("required-time-offsets", &required_time_offsets);
   cfl->GetValue("height-subsample-out", &model_.height_subsample_out);
   cfl->GetValue("max-memory-mb", &max_memory_mb_);
   KALDI_ASSERT(max_memory_mb_ > 0.0);

   { // This block sets up model_.offsets.
     model_.offsets.clear();
     if (cfl->GetValue("offsets", &offsets)) {
       // init from offsets, like "-1,-1;-1,0;-1,1;0,-1;...;1,1"
       std::vector<std::string> splits;
       SplitStringToVector(offsets, ";", false, &splits);
       for (size_t i = 0; i < splits.size(); i++) {
         std::vector<int32> int_pair;
         if (!SplitStringToIntegers(splits[i], ",", false, &int_pair) ||
             int_pair.size() != 2)
           KALDI_ERR << "Bad config value offsets=" << offsets;
         time_height_convolution::ConvolutionModel::Offset offset;
         offset.time_offset = int_pair[0];
         offset.height_offset = int_pair[1];
         model_.offsets.push_back(offset);
       }
       // after sorting, any repeated offset shows up as adjacent duplicates.
       std::sort(model_.offsets.begin(), model_.offsets.end());
       if (!IsSortedAndUniq(model_.offsets) || model_.offsets.empty())
         KALDI_ERR << "Error in offsets: probably repeated offset.  "
             "offsets=" << offsets;
     } else if (cfl->GetValue("height-offsets", &height_offsets) &&
                cfl->GetValue("time-offsets", &time_offsets)) {
       std::vector<int32> height_offsets_vec,
           time_offsets_vec;
       if (!SplitStringToIntegers(height_offsets, ",", false,
                                  &height_offsets_vec) ||
           !SplitStringToIntegers(time_offsets, ",", false,
                                  &time_offsets_vec)) {
         KALDI_ERR << "Formatting problem in time-offsets or height-offsets: "
                   << cfl->WholeLine();
       }
       if (height_offsets_vec.empty() || !IsSortedAndUniq(height_offsets_vec) ||
           time_offsets_vec.empty() || !IsSortedAndUniq(time_offsets_vec)) {
         KALDI_ERR << "time-offsets and height-offsets must be nonempty, "
             "sorted and unique.";
       }
       // model_.offsets is still empty here (cleared at the top of this
       // block); fill it with the Cartesian product, time-major.
       for (size_t i = 0; i < time_offsets_vec.size(); i++) {
         for (size_t j = 0; j < height_offsets_vec.size(); j++) {
           time_height_convolution::ConvolutionModel::Offset offset;
           offset.time_offset = time_offsets_vec[i];
           offset.height_offset = height_offsets_vec[j];
           model_.offsets.push_back(offset);
         }
       }
     } else {
       KALDI_ERR << "Expected either 'offsets', or both 'height-offsets' and "
           "'time-offsets', to be defined: " << cfl->WholeLine();
     }
   }

   if (model_.offsets.empty())
     KALDI_ERR << "Something went wrong setting offsets: " << cfl->WholeLine();


   {  // This block sets model_.required_time_offsets.
     std::vector<int32> required_time_offsets_vec;
     if (required_time_offsets == "undef") {
       // it defaults to all the time offsets that were used.
       for (size_t i = 0; i < model_.offsets.size(); i++)
         required_time_offsets_vec.push_back(model_.offsets[i].time_offset);
       SortAndUniq(&required_time_offsets_vec);
     } else {
       if (!SplitStringToIntegers(required_time_offsets, ",", false,
                                  &required_time_offsets_vec) ||
           required_time_offsets_vec.empty() ||
           !IsSortedAndUniq(required_time_offsets_vec)) {
         KALDI_ERR << "Formatting problem in required-time-offsets: "
                 << cfl->WholeLine();
       }
     }
     model_.required_time_offsets.clear();
     model_.required_time_offsets.insert(
         required_time_offsets_vec.begin(),
         required_time_offsets_vec.end());
   }

   model_.ComputeDerived();
   // First a hard check that ignores unused input heights...
   if (!model_.Check(false, true)) {
     KALDI_ERR << "Parameters used to initialize TimeHeightConvolutionComponent "
               << "do not make sense,  line was: " << cfl->WholeLine();
   }
   // ... then a soft check that also looks at unused heights (warning only).
   if (!model_.Check(true, true)) {
     KALDI_WARN << "There are input heights unused in "
         "TimeHeightConvolutionComponent; consider increasing output "
         "height or decreasing height of preceding layer.  Line was: "
                << cfl->WholeLine();
   }

   // 3. Parameter-initialization configs.
   BaseFloat param_stddev = -1, bias_stddev = 0.0;
   bool init_unit = false;
   cfl->GetValue("param-stddev", &param_stddev);
   cfl->GetValue("bias-stddev", &bias_stddev);
   cfl->GetValue("init-unit", &init_unit);
   if (param_stddev < 0.0) {
     // a negative value (including the -1 default) selects the automatic
     // standard deviation.
     param_stddev = 1.0 / sqrt(model_.num_filters_in *
                               model_.offsets.size());
   }
   // initialize the parameters.
   linear_params_.Resize(model_.ParamRows(), model_.ParamCols());
   if (!init_unit) {
     linear_params_.SetRandn();
     linear_params_.Scale(param_stddev);
   } else {
     InitUnit();
   }
   bias_params_.Resize(model_.num_filters_out);
   bias_params_.SetRandn();
   bias_params_.Scale(bias_stddev);


   // 4. Natural-gradient related configs.
   use_natural_gradient_ = true;
   int32 rank_out = -1, rank_in = -1;
   BaseFloat alpha_out = 4.0, alpha_in = 4.0,
       num_minibatches_history = 4.0;
   cfl->GetValue("use-natural-gradient", &use_natural_gradient_);
   cfl->GetValue("rank-in", &rank_in);
   cfl->GetValue("rank-out", &rank_out);
   cfl->GetValue("alpha-in", &alpha_in);
   cfl->GetValue("alpha-out", &alpha_out);
   cfl->GetValue("num-minibatches-history", &num_minibatches_history);

   // the "+ 1" accounts for the bias, which UpdateNaturalGradient() appends
   // as an extra column of the parameter derivative.
   int32 dim_in = linear_params_.NumCols() + 1,
       dim_out = linear_params_.NumRows();
   if (rank_in < 0)
     rank_in = std::min<int32>(80, (dim_in + 1) / 2);
   preconditioner_in_.SetRank(rank_in);
   if (rank_out < 0)
     rank_out = std::min<int32>(80, (dim_out + 1) / 2);
   preconditioner_out_.SetRank(rank_out);
   preconditioner_in_.SetNumMinibatchesHistory(num_minibatches_history);
   preconditioner_out_.SetNumMinibatchesHistory(num_minibatches_history);

   preconditioner_in_.SetAlpha(alpha_in);
   preconditioner_out_.SetAlpha(alpha_out);

   ComputeDerived();
 }

 void* TimeHeightConvolutionComponent::Propagate(
     const ComponentPrecomputedIndexes *indexes_in,
     const CuMatrixBase<BaseFloat> &in,
     CuMatrixBase<BaseFloat> *out) const {
   const PrecomputedIndexes *indexes =
       dynamic_cast<const PrecomputedIndexes*>(indexes_in);
   KALDI_ASSERT(indexes != NULL);
   { // this block handles the bias term.
     KALDI_ASSERT(out->Stride() == out->NumCols() &&
                  out->NumCols() == model_.height_out * model_.num_filters_out);
     CuSubMatrix<BaseFloat> out_reshaped(
         out->Data(), out->NumRows() * model_.height_out,
         model_.num_filters_out, model_.num_filters_out);
     out_reshaped.CopyRowsFromVec(bias_params_);
   }
   ConvolveForward(indexes->computation, in, linear_params_, out);
   return NULL;
 }

 // Backward computation.  If 'in_deriv' is non-NULL the derivative w.r.t. the
 // input is computed with ConvolveBackwardData().  If 'to_update_in' is
 // non-NULL (it must then be a TimeHeightConvolutionComponent) and its
 // learning rate is nonzero, its parameters are updated, either with the
 // simple update or with the natural-gradient update.
 void TimeHeightConvolutionComponent::Backprop(
     const std::string &debug_info,
     const ComponentPrecomputedIndexes *indexes_in,
     const CuMatrixBase<BaseFloat> &in_value,
     const CuMatrixBase<BaseFloat> &, // out_value
     const CuMatrixBase<BaseFloat> &out_deriv,
     void*, // memo
     Component *to_update_in,
     CuMatrixBase<BaseFloat> *in_deriv) const {
   NVTX_RANGE("TimeHeightConvolutionComponent::Backprop");
   const PrecomputedIndexes *indexes =
       dynamic_cast<const PrecomputedIndexes*>(indexes_in);
   KALDI_ASSERT(indexes != NULL);

   // Part 1: derivative w.r.t. the input, if requested.
   if (in_deriv != NULL)
     ConvolveBackwardData(indexes->computation, linear_params_,
                          out_deriv, in_deriv);

   // Part 2: parameter update, if requested.
   if (to_update_in == NULL)
     return;

   TimeHeightConvolutionComponent *to_update =
       dynamic_cast<TimeHeightConvolutionComponent*>(to_update_in);
   KALDI_ASSERT(to_update != NULL);

   // with a zero learning rate there is nothing to do.
   if (to_update->learning_rate_ == 0.0)
     return;

   // The simple update is used when storing a gradient, or when natural
   // gradient is switched off.
   const bool simple_update =
       (to_update->is_gradient_ || !to_update->use_natural_gradient_);
   if (simple_update) {
     to_update->UpdateSimple(*indexes, in_value, out_deriv);
   } else {
     to_update->UpdateNaturalGradient(*indexes, in_value, out_deriv);
   }
 }

 void TimeHeightConvolutionComponent::UpdateSimple(
     const PrecomputedIndexes &indexes,
     const CuMatrixBase<BaseFloat> &in_value,
     const CuMatrixBase<BaseFloat> &out_deriv) {

   { // this block handles the bias term.
     KALDI_ASSERT(out_deriv.Stride() == out_deriv.NumCols() &&
                  out_deriv.NumCols() ==
                  model_.height_out * model_.num_filters_out);
     CuSubMatrix<BaseFloat> out_deriv_reshaped(
         out_deriv.Data(), out_deriv.NumRows() * model_.height_out,
         model_.num_filters_out, model_.num_filters_out);
     bias_params_.AddRowSumMat(learning_rate_, out_deriv_reshaped);
   }

   ConvolveBackwardParams(indexes.computation, in_value, out_deriv,
                          learning_rate_, &linear_params_);
 }


 void TimeHeightConvolutionComponent::UpdateNaturalGradient(
     const PrecomputedIndexes &indexes,
     const CuMatrixBase<BaseFloat> &in_value,
     const CuMatrixBase<BaseFloat> &out_deriv) {

   CuVector<BaseFloat> bias_deriv(bias_params_.Dim());

   { // this block computes 'bias_deriv', the derivative w.r.t. the bias.
     KALDI_ASSERT(out_deriv.Stride() == out_deriv.NumCols() &&
                  out_deriv.NumCols() ==
                  model_.height_out * model_.num_filters_out);
     CuSubMatrix<BaseFloat> out_deriv_reshaped(
         out_deriv.Data(), out_deriv.NumRows() * model_.height_out,
         model_.num_filters_out, model_.num_filters_out);
     bias_deriv.AddRowSumMat(1.0, out_deriv_reshaped);
   }

   CuMatrix<BaseFloat> params_deriv(linear_params_.NumRows(),
                                   linear_params_.NumCols() + 1);
   params_deriv.CopyColFromVec(bias_deriv, linear_params_.NumCols());


   CuSubMatrix<BaseFloat> linear_params_deriv(
       params_deriv, 0, linear_params_.NumRows(),
       0, linear_params_.NumCols());

   ConvolveBackwardParams(indexes.computation, in_value, out_deriv,
                          1.0, &linear_params_deriv);

   // the precondition-directions code outputs a scalar that
   // must be multiplied by its output (this saves one
   // CUDA operation internally).
   // We don't bother applying this scale before doing the other
   // dimenson of natural gradient, because although it's not
   // invariant to scalar multiplication of the input if the
   // scalars are different across iterations, the scalars
   // will be pretty similar on different iterations
   BaseFloat scale1, scale2;
   preconditioner_in_.PreconditionDirections(&params_deriv, &scale1);


   CuMatrix<BaseFloat> params_deriv_transpose(params_deriv, kTrans);
   preconditioner_out_.PreconditionDirections(&params_deriv_transpose, &scale2);

   linear_params_.AddMat(
       learning_rate_ * scale1 * scale2,
       params_deriv_transpose.RowRange(0, linear_params_.NumCols()),
       kTrans);

   bias_params_.AddVec(learning_rate_ * scale1 * scale2,
                       params_deriv_transpose.Row(linear_params_.NumCols()));
 }


 void TimeHeightConvolutionComponent::ReorderIndexes(
     std::vector<Index> *input_indexes,
     std::vector<Index> *output_indexes) const {
   using namespace time_height_convolution;
   ConvolutionComputationOptions opts;
   opts.max_memory_mb = max_memory_mb_;
   ConvolutionComputation computation_temp;
   std::vector<Index> input_indexes_modified,
       output_indexes_modified;
   CompileConvolutionComputation(
       model_, *input_indexes, *output_indexes, opts,
       &computation_temp, &input_indexes_modified, &output_indexes_modified);
   input_indexes->swap(input_indexes_modified);
   output_indexes->swap(output_indexes_modified);
 }

 void TimeHeightConvolutionComponent::Write(std::ostream &os, bool binary) const {
   WriteUpdatableCommon(os, binary);  // Write opening tag and learning rate.
   WriteToken(os, binary, "<Model>");
   model_.Write(os, binary);
   WriteToken(os, binary, "<LinearParams>");
   linear_params_.Write(os, binary);
   WriteToken(os, binary, "<BiasParams>");
   bias_params_.Write(os, binary);
   WriteToken(os, binary, "<MaxMemoryMb>");
   WriteBasicType(os, binary, max_memory_mb_);
   WriteToken(os, binary, "<UseNaturalGradient>");
   WriteBasicType(os, binary, use_natural_gradient_);
   int32 rank_in = preconditioner_in_.GetRank(),
       rank_out = preconditioner_out_.GetRank();
   BaseFloat alpha_in = preconditioner_in_.GetAlpha(),
       alpha_out = preconditioner_out_.GetAlpha(),
       num_minibatches_history = preconditioner_in_.GetNumMinibatchesHistory();
   WriteToken(os, binary, "<NumMinibatchesHistory>");
   WriteBasicType(os, binary, num_minibatches_history);
   WriteToken(os, binary, "<AlphaInOut>");
   WriteBasicType(os, binary, alpha_in);
   WriteBasicType(os, binary, alpha_out);
   WriteToken(os, binary, "<RankInOut>");
   WriteBasicType(os, binary, rank_in);
   WriteBasicType(os, binary, rank_out);
   WriteToken(os, binary, "</TimeHeightConvolutionComponent>");
 }

 void TimeHeightConvolutionComponent::Read(std::istream &is, bool binary) {
   std::string token = ReadUpdatableCommon(is, binary);
   // the next few lines are only for back compatibility.
   if (token != "") {
     KALDI_ASSERT(token == "<Model>");
   } else {
     ExpectToken(is, binary, "<Model>");
   }
   model_.Read(is, binary);
   ExpectToken(is, binary, "<LinearParams>");
   linear_params_.Read(is, binary);
   ExpectToken(is, binary, "<BiasParams>");
   bias_params_.Read(is, binary);
   ExpectToken(is, binary, "<MaxMemoryMb>");
   ReadBasicType(is, binary, &max_memory_mb_);
   ExpectToken(is, binary, "<UseNaturalGradient>");
   ReadBasicType(is, binary, &use_natural_gradient_);
   int32 rank_in,  rank_out;
   BaseFloat alpha_in, alpha_out,
       num_minibatches_history;
   ExpectToken(is, binary, "<NumMinibatchesHistory>");
   ReadBasicType(is, binary, &num_minibatches_history);
   ExpectToken(is, binary, "<AlphaInOut>");
   ReadBasicType(is, binary, &alpha_in);
   ReadBasicType(is, binary, &alpha_out);
   preconditioner_in_.SetAlpha(alpha_in);
   preconditioner_out_.SetAlpha(alpha_out);
   ExpectToken(is, binary, "<RankInOut>");
   ReadBasicType(is, binary, &rank_in);
   ReadBasicType(is, binary, &rank_out);
   preconditioner_in_.SetRank(rank_in);
   preconditioner_out_.SetRank(rank_out);
   preconditioner_in_.SetNumMinibatchesHistory(num_minibatches_history);
   preconditioner_out_.SetNumMinibatchesHistory(num_minibatches_history);
   ExpectToken(is, binary, "</TimeHeightConvolutionComponent>");
   ComputeDerived();
   Check();
 }

 void TimeHeightConvolutionComponent::ComputeDerived() {
   all_time_offsets_.clear();
   all_time_offsets_.insert(
       all_time_offsets_.end(),
       model_.all_time_offsets.begin(),
       model_.all_time_offsets.end());
   time_offset_required_.resize(all_time_offsets_.size());
   for (size_t i = 0; i < all_time_offsets_.size(); i++) {
     time_offset_required_[i] =
         (model_.required_time_offsets.count(all_time_offsets_[i]) > 0);
   }
 }

 void TimeHeightConvolutionComponent::GetInputIndexes(
     const MiscComputationInfo &misc_info,
     const Index &output_index,
     std::vector<Index> *desired_indexes) const {
   KALDI_ASSERT(output_index.t != kNoTime);
   size_t size = all_time_offsets_.size();
   desired_indexes->resize(size);
   for (size_t i = 0; i < size; i++) {
     (*desired_indexes)[i].n = output_index.n;
     (*desired_indexes)[i].t = output_index.t + all_time_offsets_[i];
     (*desired_indexes)[i].x = output_index.x;
   }
 }


 bool TimeHeightConvolutionComponent::IsComputable(
     const MiscComputationInfo &misc_info,
     const Index &output_index,
     const IndexSet &input_index_set,
     std::vector<Index> *used_inputs) const {
   KALDI_ASSERT(output_index.t != kNoTime);
   size_t size = all_time_offsets_.size();
   Index index(output_index);
   if (used_inputs != NULL) {
     used_inputs->clear();
     used_inputs->reserve(size);
     for (size_t i = 0; i < size; i++) {
       index.t = output_index.t + all_time_offsets_[i];
       if (input_index_set(index)) {
         // This input index is available.
         used_inputs->push_back(index);
       } else {
         // This input index is not available.
         if (time_offset_required_[i]) {
           // A required offset was not present -> this output index is not
           // computable.
           used_inputs->clear();
           return false;
         }
       }
     }
     // All required time-offsets of the output were computable. -> return true.
     return true;
   } else {
     for (size_t i = 0; i < size; i++) {
       if (time_offset_required_[i]) {
         index.t = output_index.t + all_time_offsets_[i];
         if (!input_index_set(index))
           return false;
       }
     }
     return true;
   }
 }


 // Compiles the convolution computation for the given input and output
 // indexes and returns it in a newly allocated PrecomputedIndexes object,
 // which the caller owns.  The indexes are expected to be in the order that
 // CompileConvolutionComputation() would output them (see ReorderIndexes());
 // if the compilation would change them, this is an error.  'misc_info' and
 // 'need_backprop' are not used.
 ComponentPrecomputedIndexes* TimeHeightConvolutionComponent::PrecomputeIndexes(
       const MiscComputationInfo &misc_info,
       const std::vector<Index> &input_indexes,
       const std::vector<Index> &output_indexes,
       bool need_backprop) const {
   using namespace time_height_convolution;
   ConvolutionComputationOptions opts;
   opts.max_memory_mb = max_memory_mb_;
   PrecomputedIndexes *ans = new PrecomputedIndexes();
   std::vector<Index> input_indexes_modified,
       output_indexes_modified;
   CompileConvolutionComputation(
       model_, input_indexes, output_indexes, opts,
       &(ans->computation), &input_indexes_modified, &output_indexes_modified);
   if (input_indexes_modified != input_indexes ||
       output_indexes_modified != output_indexes) {
     // Control does not come back from KALDI_ERR, so 'ans' would never reach
     // the caller; free it first to avoid leaking it.
     delete ans;
     KALDI_ERR << "Problem precomputing indexes";
   }
   return ans;
 }

 // Multiplies the filter and bias parameters by 'scale'.  A scale of exactly
 // zero is handled by setting the parameters to zero rather than by
 // multiplying.
 void TimeHeightConvolutionComponent::Scale(BaseFloat scale) {
   if (scale != 0.0) {
     linear_params_.Scale(scale);
     bias_params_.Scale(scale);
     return;
   }
   linear_params_.SetZero();
   bias_params_.SetZero();
 }

 // Adds 'alpha' times the parameters of 'other_in' to the parameters of this
 // component.  'other_in' must be a TimeHeightConvolutionComponent.
 void TimeHeightConvolutionComponent::Add(BaseFloat alpha,
                                          const Component &other_in) {
   const TimeHeightConvolutionComponent *other =
       dynamic_cast<const TimeHeightConvolutionComponent*>(&other_in);
   KALDI_ASSERT(other != NULL);

   const TimeHeightConvolutionComponent &src = *other;
   linear_params_.AddMat(alpha, src.linear_params_);
   bias_params_.AddVec(alpha, src.bias_params_);
 }

 // Adds random noise, generated with SetRandn() and scaled by 'stddev', to
 // the filter parameters and then to the bias parameters.
 void TimeHeightConvolutionComponent::PerturbParams(BaseFloat stddev) {
   // Filter parameters first (the order of the two SetRandn() calls is kept
   // as it was, since it determines which random numbers go where).
   const int32 num_rows = linear_params_.NumRows(),
       num_cols = linear_params_.NumCols();
   CuMatrix<BaseFloat> filter_noise(num_rows, num_cols, kUndefined);
   filter_noise.SetRandn();
   linear_params_.AddMat(stddev, filter_noise);

   // Then the bias.
   CuVector<BaseFloat> bias_noise(bias_params_.Dim(), kUndefined);
   bias_noise.SetRandn();
   bias_params_.AddVec(stddev, bias_noise);
 }

 // Returns the dot product between the parameters of this component and
 // those of 'other_in' (filter part plus bias part).  'other_in' must be a
 // TimeHeightConvolutionComponent.
 BaseFloat TimeHeightConvolutionComponent::DotProduct(
     const UpdatableComponent &other_in) const {
   const TimeHeightConvolutionComponent *other =
       dynamic_cast<const TimeHeightConvolutionComponent*>(&other_in);
   KALDI_ASSERT(other != NULL);

   // trace(A B^T) is the sum of the elementwise products of A and B.
   const BaseFloat filter_dot =
       TraceMatMat(linear_params_, other->linear_params_, kTrans);
   const BaseFloat bias_dot = VecVec(bias_params_, other->bias_params_);
   return filter_dot + bias_dot;
 }

 // Returns the total number of parameters: all elements of the filter matrix
 // plus all elements of the bias vector.
 int32 TimeHeightConvolutionComponent::NumParameters() const {
   const int32 num_filter_params =
       linear_params_.NumRows() * linear_params_.NumCols();
   const int32 num_bias_params = bias_params_.Dim();
   return num_filter_params + num_bias_params;
 }

 // Copies all parameters into 'params', whose dimension must equal
 // NumParameters(): first the filter matrix (via CopyRowsFromMat), then the
 // bias vector.
 void TimeHeightConvolutionComponent::Vectorize(
     VectorBase<BaseFloat> *params) const {
   KALDI_ASSERT(params->Dim() == NumParameters());
   const int32 num_filter_params =
       linear_params_.NumRows() * linear_params_.NumCols();
   const int32 num_bias_params = bias_params_.Dim();

   // [0, num_filter_params): the filter matrix.
   params->Range(0, num_filter_params).CopyRowsFromMat(linear_params_);
   // [num_filter_params, end): the bias.
   params->Range(num_filter_params, num_bias_params).CopyFromVec(bias_params_);
 }

 void TimeHeightConvolutionComponent::UnVectorize(
     const VectorBase<BaseFloat> &params) {
   KALDI_ASSERT(params.Dim() == NumParameters());
   int32 linear_size = linear_params_.NumRows() * linear_params_.NumCols(),
       bias_size = bias_params_.Dim();
   linear_params_.CopyRowsFromVec(params.Range(0, linear_size));
   bias_params_.CopyFromVec(params.Range(linear_size, bias_size));
 }

 // Passes 'freeze' on to Freeze() of both preconditioners (input side first,
 // then output side).
 void TimeHeightConvolutionComponent::FreezeNaturalGradient(bool freeze) {
   const bool frozen = freeze;
   preconditioner_in_.Freeze(frozen);
   preconditioner_out_.Freeze(frozen);
 }

 // Returns a newly allocated copy of this object, made with the copy
 // constructor; the caller takes ownership of it.
 TimeHeightConvolutionComponent::PrecomputedIndexes*
 TimeHeightConvolutionComponent::PrecomputedIndexes::Copy() const {
   PrecomputedIndexes *duplicate = new PrecomputedIndexes(*this);
   return duplicate;
 }

 // Writes this object to 'os': opening tag, <Computation>, the computation
 // itself, closing tag.
 void TimeHeightConvolutionComponent::PrecomputedIndexes::Write(
     std::ostream &os, bool binary) const {
   const char *open_tag =
       "<TimeHeightConvolutionComponentPrecomputedIndexes>";
   const char *close_tag =
       "</TimeHeightConvolutionComponentPrecomputedIndexes>";

   WriteToken(os, binary, open_tag);
   WriteToken(os, binary, "<Computation>");
   computation.Write(os, binary);
   WriteToken(os, binary, close_tag);
 }

 // Reads this object from 'is', in the format produced by Write().  The
 // opening part is consumed with ExpectOneOrTwoTokens(), given the opening
 // tag and <Computation>.
 void TimeHeightConvolutionComponent::PrecomputedIndexes::Read(
     std::istream &is, bool binary) {
   const char *open_tag =
       "<TimeHeightConvolutionComponentPrecomputedIndexes>";
   const char *close_tag =
       "</TimeHeightConvolutionComponentPrecomputedIndexes>";

   ExpectOneOrTwoTokens(is, binary, open_tag, "<Computation>");
   computation.Read(is, binary);
   ExpectToken(is, binary, close_tag);
 }

 void TimeHeightConvolutionComponent::ConsolidateMemory() {
   OnlineNaturalGradient temp_in(preconditioner_in_);
   preconditioner_in_.Swap(&temp_in);
   OnlineNaturalGradient temp_out(preconditioner_out_);
   preconditioner_out_.Swap(&temp_out);
 }

 } // namespace nnet3
 } // namespace kaldi
kaldi
This code computes Goodness of Pronunciation (GOP) and extracts phone-level pronunciation feature for...
Definition: chain.dox:20

kaldi::CuMatrixBase::Stride
MatrixIndexT Stride() const
Definition: cu-matrix.h:217

kaldi::nnet3::time_height_convolution::ConvolutionModel::height_subsample_out
int32 height_subsample_out
Definition: convolution.h:132

kaldi::nnet3::time_height_convolution::ConvolutionModel::Write
void Write(std::ostream &os, bool binary) const
Definition: convolution.cc:225

kaldi::ConfigLine::WholeLine
const std::string WholeLine()
Definition: text-utils.h:230

kaldi::nnet3::time_height_convolution::ConvolveBackwardParams
void ConvolveBackwardParams(const ConvolutionComputation &cc, const CuMatrixBase< BaseFloat > &input, const CuMatrixBase< BaseFloat > &output_deriv, BaseFloat alpha, CuMatrixBase< BaseFloat > *params_deriv)
This does the part of the backward derivative computation of convolution, that computes derivatives w...
Definition: convolution.cc:840

kaldi::kUndefined
Definition: matrix-common.h:39

kaldi::nnet3::time_height_convolution::ConvolutionModel::ParamCols
int32 ParamCols() const
Definition: convolution.h:208

kaldi::nnet3::TimeHeightConvolutionComponent::PrecomputedIndexes
Definition: nnet-convolutional-component-temp.h:286

kaldi::nnet3::OnlineNaturalGradient::Freeze
void Freeze(bool frozen)
Definition: natural-gradient-online.h:437

rnnlm::j
int j
Definition: mikolov-rnnlm-lib.cc:66

kaldi::nnet3::time_height_convolution::ConvolutionModel::height_in
int32 height_in
Definition: convolution.h:128

kaldi::CuVector
Definition: matrix-common.h:74

kaldi::CuMatrixBase::Row
const CuSubVector< Real > Row(MatrixIndexT i) const
Definition: cu-matrix.h:670

kaldi::nnet3::TimeHeightConvolutionComponent::Check
void Check() const
Definition: nnet-convolutional-component.cc:50

kaldi::nnet3::TimeHeightConvolutionComponent::Vectorize
virtual void Vectorize(VectorBase< BaseFloat > *params) const
Turns the parameters into vector form.
Definition: nnet-convolutional-component.cc:624

kaldi::nnet3::Component
Abstract base-class for neural-net components.
Definition: nnet-component-itf.h:114

kaldi::ReadBasicType
void ReadBasicType(std::istream &is, bool binary, T *t)
ReadBasicType is the name of the read function for bool, integer types, and floating-point types...
Definition: io-funcs-inl.h:55

kaldi::nnet3::time_height_convolution::ConvolutionModel::Check
bool Check(bool check_heights_used=true, bool allow_height_padding=true) const
Definition: convolution.cc:130

kaldi::SplitStringToIntegers
bool SplitStringToIntegers(const std::string &full, const char *delim, bool omit_empty_strings, std::vector< I > *out)
Split a string (e.g.
Definition: text-utils.h:68

kaldi::nnet3::time_height_convolution::ConvolutionModel::InputDim
int32 InputDim() const
Definition: convolution.h:203

kaldi::nnet3::time_height_convolution::ConvolutionModel::Info
std::string Info() const
Definition: convolution.cc:87

kaldi::nnet3::IndexSet
An abstract representation of a set of Indexes.
Definition: nnet-computation-graph.h:322

kaldi::nnet3::time_height_convolution::ConvolutionModel::num_filters_out
int32 num_filters_out
Definition: convolution.h:127

kaldi::nnet3::UpdatableComponent::InitLearningRatesFromConfig
void InitLearningRatesFromConfig(ConfigLine *cfl)
Definition: nnet-component-itf.cc:248

kaldi::nnet3::time_height_convolution::ConvolutionModel::num_filters_in
int32 num_filters_in
Definition: convolution.h:126

kaldi::nnet3::OnlineNaturalGradient::SetRank
void SetRank(int32 rank)
Definition: natural-gradient-online.cc:604

kaldi::nnet3::time_height_convolution::ConvolutionModel::Offset::height_offset
int32 height_offset
Definition: convolution.h:137

kaldi::CuMatrixBase::SetRandn
void SetRandn()
Definition: cu-matrix.cc:3132

nnet-convolutional-component.h

kaldi::int32
kaldi::int32 int32
Definition: online-tcp-source.cc:27

kaldi::nnet3::time_height_convolution::ConvolutionModel::ComputeDerived
void ComputeDerived()
Definition: convolution.cc:109

kaldi::nnet3::OnlineNaturalGradient
Keywords for search: natural gradient, naturalgradient, NG-SGD.
Definition: natural-gradient-online.h:414

kaldi::CuMatrix
This class represents a matrix that's stored on the GPU if we have one, and in memory if not...
Definition: matrix-common.h:71

kaldi::nnet3::TimeHeightConvolutionComponent::FreezeNaturalGradient
virtual void FreezeNaturalGradient(bool freeze)
freezes/unfreezes NaturalGradient updates, if applicable (to be overridden by components that use Natu...
Definition: nnet-convolutional-component.cc:642

kaldi::nnet3::TimeHeightConvolutionComponent::GetInputIndexes
virtual void GetInputIndexes(const MiscComputationInfo &misc_info, const Index &output_index, std::vector< Index > *desired_indexes) const
This function only does something interesting for non-simple Components.
Definition: nnet-convolutional-component.cc:504

kaldi::CuMatrixBase::CopyRowsFromVec
void CopyRowsFromVec(const CuVectorBase< Real > &v)
This function has two modes of operation.
Definition: cu-matrix.cc:2301

kaldi::nnet3::MiscComputationInfo
Definition: nnet-computation.h:55

kaldi::nnet3::TimeHeightConvolutionComponent::UnVectorize
virtual void UnVectorize(const VectorBase< BaseFloat > &params)
Converts the parameters from vector form.
Definition: nnet-convolutional-component.cc:633

kaldi::nnet3::TimeHeightConvolutionComponent::IsComputable
virtual bool IsComputable(const MiscComputationInfo &misc_info, const Index &output_index, const IndexSet &input_index_set, std::vector< Index > *used_inputs) const
This function only does something interesting for non-simple Components, and it exists to make it pos...
Definition: nnet-convolutional-component.cc:519

kaldi::SortAndUniq
void SortAndUniq(std::vector< T > *vec)
Sorts and uniq's (removes duplicates) from a vector.
Definition: stl-utils.h:39

kaldi::nnet3::TimeHeightConvolutionComponent::linear_params_
CuMatrix< BaseFloat > linear_params_
Definition: nnet-convolutional-component-temp.h:346

kaldi::nnet3::TimeHeightConvolutionComponent::UpdateNaturalGradient
void UpdateNaturalGradient(const PrecomputedIndexes &indexes, const CuMatrixBase< BaseFloat > &in_value, const CuMatrixBase< BaseFloat > &out_deriv)
Definition: nnet-convolutional-component.cc:354

kaldi::nnet3::TimeHeightConvolutionComponent::InitFromConfig
virtual void InitFromConfig(ConfigLine *cfl)
Initialize, from a ConfigLine object.
Definition: nnet-convolutional-component.cc:114

kaldi::nnet3::TimeHeightConvolutionComponent::Propagate
virtual void * Propagate(const ComponentPrecomputedIndexes *indexes, const CuMatrixBase< BaseFloat > &in, CuMatrixBase< BaseFloat > *out) const
Propagate function.
Definition: nnet-convolutional-component.cc:282

kaldi::nnet3::Index
struct Index is intended to represent the various indexes by which we number the rows of the matrices...
Definition: nnet-common.h:44

kaldi::nnet3::time_height_convolution::ConvolutionModel::all_time_offsets
std::set< int32 > all_time_offsets
Definition: convolution.h:173

kaldi::nnet3::TimeHeightConvolutionComponent::PrecomputeIndexes
virtual ComponentPrecomputedIndexes * PrecomputeIndexes(const MiscComputationInfo &misc_info, const std::vector< Index > &input_indexes, const std::vector< Index > &output_indexes, bool need_backprop) const
This function must return NULL for simple Components.
Definition: nnet-convolutional-component.cc:560

kaldi::CuMatrixBase::CopyColFromVec
void CopyColFromVec(const CuVectorBase< Real > &v, const MatrixIndexT col)
Copy vector into specific column of matrix.
Definition: cu-matrix.cc:2414

kaldi::nnet3::TimeHeightConvolutionComponent::preconditioner_out_
OnlineNaturalGradient preconditioner_out_
Definition: nnet-convolutional-component-temp.h:372

kaldi::ExpectOneOrTwoTokens
void ExpectOneOrTwoTokens(std::istream &is, bool binary, const std::string &token1, const std::string &token2)
This function is like ExpectToken but for two tokens, and it will either accept token1 and then token...
Definition: text-utils.cc:536

kaldi::nnet3::TimeHeightConvolutionComponent::all_time_offsets_
std::vector< int32 > all_time_offsets_
Definition: nnet-convolutional-component-temp.h:334

kaldi::kTrans
Definition: matrix-common.h:33

kaldi::nnet3::Index::x
int32 x
Definition: nnet-common.h:47

kaldi::nnet3::time_height_convolution::ConvolutionModel::Offset
Definition: convolution.h:135

kaldi::nnet3::time_height_convolution::ConvolutionModel::ParamRows
int32 ParamRows() const
Definition: convolution.h:206

kaldi::nnet3::TimeHeightConvolutionComponent::PrecomputedIndexes::Copy
virtual PrecomputedIndexes * Copy() const
Definition: nnet-convolutional-component.cc:648

kaldi::nnet3::Index::n
int32 n
Definition: nnet-common.h:45

kaldi::nnet3::time_height_convolution::ConvolutionModel::OutputDim
int32 OutputDim() const
Definition: convolution.h:204

kaldi::nnet3::TimeHeightConvolutionComponent::Scale
virtual void Scale(BaseFloat scale)
This virtual function when called on – an UpdatableComponent scales the parameters by "scale" when c...
Definition: nnet-convolutional-component.cc:581

kaldi::nnet3::TimeHeightConvolutionComponent::Read
virtual void Read(std::istream &is, bool binary)
Read function (used after we know the type of the Component); accepts input that is missing the token...
Definition: nnet-convolutional-component.cc:452

kaldi::nnet3::TimeHeightConvolutionComponent::TimeHeightConvolutionComponent
TimeHeightConvolutionComponent()
Definition: nnet-convolutional-component.cc:31

kaldi::nnet3::ExpectToken
static void ExpectToken(const std::string &token, const std::string &what_we_are_parsing, const std::string **next_token)
Definition: nnet-descriptor.cc:45

float

kaldi::nnet3::time_height_convolution::ConvolveBackwardData
void ConvolveBackwardData(const ConvolutionComputation &cc, const CuMatrixBase< BaseFloat > &params, const CuMatrixBase< BaseFloat > &output_deriv, CuMatrixBase< BaseFloat > *input_deriv)
This does the part of the backward derivative computation of convolution, that propagates derivatives...
Definition: convolution.cc:682

kaldi::nnet3::time_height_convolution::ConvolutionModel::Read
void Read(std::istream &is, bool binary)
Definition: convolution.cc:252

kaldi::nnet3::TimeHeightConvolutionComponent::Add
virtual void Add(BaseFloat alpha, const Component &other)
This virtual function when called by – an UpdatableComponent adds the parameters of another updatabl...
Definition: nnet-convolutional-component.cc:591

kaldi::nnet3::TimeHeightConvolutionComponent::ComputeDerived
void ComputeDerived()
Definition: nnet-convolutional-component.cc:491

kaldi::nnet3::TimeHeightConvolutionComponent::PrecomputedIndexes::Write
virtual void Write(std::ostream &os, bool binary) const
Definition: nnet-convolutional-component.cc:652

kaldi::nnet3::TimeHeightConvolutionComponent::ReorderIndexes
virtual void ReorderIndexes(std::vector< Index > *input_indexes, std::vector< Index > *output_indexes) const
This function only does something interesting for non-simple Components.
Definition: nnet-convolutional-component.cc:408

kaldi::nnet3::TimeHeightConvolutionComponent::model_
time_height_convolution::ConvolutionModel model_
Definition: nnet-convolutional-component-temp.h:330

kaldi::SplitStringToVector
void SplitStringToVector(const std::string &full, const char *delim, bool omit_empty_strings, std::vector< std::string > *out)
Split a string using any of the single character delimiters.
Definition: text-utils.cc:63

nnet-computation-graph.h

kaldi::nnet3::UpdatableComponent::learning_rate_
BaseFloat learning_rate_
learning rate (typically 0.0..0.01)
Definition: nnet-component-itf.h:559

kaldi::nnet3::TimeHeightConvolutionComponent::Backprop
virtual void Backprop(const std::string &debug_info, const ComponentPrecomputedIndexes *indexes, const CuMatrixBase< BaseFloat > &in_value, const CuMatrixBase< BaseFloat > &out_value, const CuMatrixBase< BaseFloat > &out_deriv, void *memo, Component *to_update, CuMatrixBase< BaseFloat > *in_deriv) const
Backprop function; depending on which of the arguments 'to_update' and 'in_deriv' are non-NULL...
Definition: nnet-convolutional-component.cc:301

kaldi::nnet3::UpdatableComponent::ReadUpdatableCommon
std::string ReadUpdatableCommon(std::istream &is, bool binary)
Definition: nnet-component-itf.cc:263

kaldi::nnet3::TimeHeightConvolutionComponent::UpdateSimple
void UpdateSimple(const PrecomputedIndexes &indexes, const CuMatrixBase< BaseFloat > &in_value, const CuMatrixBase< BaseFloat > &out_deriv)
Definition: nnet-convolutional-component.cc:334

kaldi::nnet3::TimeHeightConvolutionComponent::InitUnit
void InitUnit()
Definition: nnet-convolutional-component.cc:88

KALDI_ERR
#define KALDI_ERR
Definition: kaldi-error.h:147

kaldi::nnet3::TimeHeightConvolutionComponent::OutputDim
virtual int32 OutputDim() const
Returns output-dimension of this component.
Definition: nnet-convolutional-component.cc:61

kaldi::nnet3::OnlineNaturalGradient::PreconditionDirections
void PreconditionDirections(CuMatrixBase< BaseFloat > *X, BaseFloat *scale)
This call implements the main functionality of this class.
Definition: natural-gradient-online.cc:159

KALDI_WARN
#define KALDI_WARN
Definition: kaldi-error.h:150

kaldi::nnet3::time_height_convolution::CompileConvolutionComputation
void CompileConvolutionComputation(const ConvolutionModel &model, const std::vector< Index > &input_indexes, const std::vector< Index > &output_indexes, const ConvolutionComputationOptions &opts, ConvolutionComputation *computation, std::vector< Index > *input_indexes_modified, std::vector< Index > *output_indexes_modified)
This function does the compilation for a convolution computation; it's a wrapper for the functions be...
Definition: convolution.cc:1367

kaldi::TraceMatMat
Real TraceMatMat(const MatrixBase< Real > &A, const MatrixBase< Real > &B, MatrixTransposeType trans)
We need to declare this here as it will be a friend function.
Definition: kaldi-matrix.cc:2692

kaldi::CuSubMatrix
This class is used for a piece of a CuMatrix.
Definition: matrix-common.h:70

kaldi::WriteToken
void WriteToken(std::ostream &os, bool binary, const char *token)
The WriteToken functions are for writing nonempty sequences of non-space characters.
Definition: io-funcs.cc:134

kaldi::nnet3::time_height_convolution::ConvolutionModel::offsets
std::vector< Offset > offsets
Definition: convolution.h:157

kaldi::VectorBase::Dim
MatrixIndexT Dim() const
Returns the dimension of the vector.
Definition: kaldi-vector.h:64

nnet-parse.h

kaldi::CuMatrixBase::RowRange
CuSubMatrix< Real > RowRange(const MatrixIndexT row_offset, const MatrixIndexT num_rows) const
Definition: cu-matrix.h:660

kaldi::nnet3::OnlineNaturalGradient::Swap
void Swap(OnlineNaturalGradient *other)
Definition: natural-gradient-online.cc:628

kaldi::nnet3::TimeHeightConvolutionComponent::DotProduct
virtual BaseFloat DotProduct(const UpdatableComponent &other) const
Computes dot-product between parameters of two instances of a Component.
Definition: nnet-convolutional-component.cc:610

kaldi::nnet3::TimeHeightConvolutionComponent::Write
virtual void Write(std::ostream &os, bool binary) const
Write component to stream.
Definition: nnet-convolutional-component.cc:424

kaldi::nnet3::time_height_convolution::ConvolutionModel::height_out
int32 height_out
Definition: convolution.h:129

kaldi::nnet3::TimeHeightConvolutionComponent::InputDim
virtual int32 InputDim() const
Returns input-dimension of this component.
Definition: nnet-convolutional-component.cc:57

kaldi::nnet3::UpdatableComponent
Class UpdatableComponent is a Component which has trainable parameters; it extends the interface of C...
Definition: nnet-component-itf.h:455

kaldi::nnet3::OnlineNaturalGradient::SetAlpha
void SetAlpha(BaseFloat alpha)
Definition: natural-gradient-online.cc:623

kaldi::CuVectorBase::SetRandn
void SetRandn()
Definition: cu-vector.cc:281

kaldi::nnet3::OnlineNaturalGradient::GetNumMinibatchesHistory
BaseFloat GetNumMinibatchesHistory() const
Definition: natural-gradient-online.h:431

kaldi::CuMatrixBase::Data
const Real * Data() const
Return data pointer (const).
Definition: cu-matrix.h:746

rnnlm::i
int i
Definition: mikolov-rnnlm-lib.cc:66

kaldi::CuMatrixBase
Matrix for CUDA computing.
Definition: matrix-common.h:69

kaldi::CuMatrixBase::NumCols
MatrixIndexT NumCols() const
Definition: cu-matrix.h:216

kaldi::nnet3::ComponentPrecomputedIndexes
Definition: nnet-component-itf.h:97

kaldi::ConfigLine
This class is responsible for parsing input like hi-there xx=yyy a=b c empty= f-oo=Append(bar, sss) ba_z=123 bing='a b c' baz="a b c d='a b' e" and giving you access to the fields, in this case.
Definition: text-utils.h:205

kaldi::nnet3::UpdatableComponent::Info
virtual std::string Info() const
Returns some text-form information about this component, for diagnostics.
Definition: nnet-component-itf.cc:333

kaldi::nnet3::UpdatableComponent::is_gradient_
bool is_gradient_
True if this component is to be treated as a gradient rather than as parameters.
Definition: nnet-component-itf.h:566

kaldi::nnet3::TimeHeightConvolutionComponent::PerturbParams
virtual void PerturbParams(BaseFloat stddev)
This function is to be used in testing.
Definition: nnet-convolutional-component.cc:600

KALDI_ASSERT
#define KALDI_ASSERT(cond)
Definition: kaldi-error.h:185

kaldi::nnet3::UpdatableComponent::WriteUpdatableCommon
void WriteUpdatableCommon(std::ostream &is, bool binary) const
Definition: nnet-component-itf.cc:306

kaldi::nnet3::TimeHeightConvolutionComponent::bias_params_
CuVector< BaseFloat > bias_params_
Definition: nnet-convolutional-component-temp.h:349

kaldi::nnet3::TimeHeightConvolutionComponent::PrecomputedIndexes::Read
virtual void Read(std::istream &os, bool binary)
Definition: nnet-convolutional-component.cc:660

NVTX_RANGE
#define NVTX_RANGE(name)
Definition: cu-common.h:143

kaldi::nnet3::time_height_convolution::ConvolutionModel::required_time_offsets
std::set< int32 > required_time_offsets
Definition: convolution.h:169

kaldi::nnet3::TimeHeightConvolutionComponent::NumParameters
virtual int32 NumParameters() const
The following new virtual function returns the total dimension of the parameters in this class...
Definition: nnet-convolutional-component.cc:619

kaldi::ConfigLine::GetValue
bool GetValue(const std::string &key, std::string *value)
Definition: text-utils.cc:427

kaldi::nnet3::TimeHeightConvolutionComponent::ConsolidateMemory
void ConsolidateMemory()
This virtual function relates to memory management, and avoiding fragmentation.
Definition: nnet-convolutional-component.cc:669

kaldi::WriteBasicType
void WriteBasicType(std::ostream &os, bool binary, T t)
WriteBasicType is the name of the write function for bool, integer types, and floating-point types...
Definition: io-funcs-inl.h:34

kaldi::nnet3::OnlineNaturalGradient::SetNumMinibatchesHistory
void SetNumMinibatchesHistory(BaseFloat num_minibatches_history)
Definition: natural-gradient-online.cc:617

kaldi::nnet3::OnlineNaturalGradient::GetAlpha
BaseFloat GetAlpha() const
Definition: natural-gradient-online.h:432

kaldi::nnet3::PrintParameterStats
void PrintParameterStats(std::ostringstream &os, const std::string &name, const CuVectorBase< BaseFloat > &params, bool include_mean)
Print to 'os' some information about the mean and standard deviation of some parameters, used in Info() functions in nnet-simple-component.cc.
Definition: nnet-parse.cc:157

kaldi::nnet3::Index::t
int32 t
Definition: nnet-common.h:46

kaldi::CuMatrixBase::NumRows
MatrixIndexT NumRows() const
Dimensions.
Definition: cu-matrix.h:215

kaldi::VectorBase
Provides a vector abstraction class.
Definition: kaldi-vector.h:41

kaldi::nnet3::TimeHeightConvolutionComponent::use_natural_gradient_
bool use_natural_gradient_
Definition: nnet-convolutional-component-temp.h:362

kaldi::nnet3::TimeHeightConvolutionComponent::preconditioner_in_
OnlineNaturalGradient preconditioner_in_
Definition: nnet-convolutional-component-temp.h:368

kaldi::nnet3::TimeHeightConvolutionComponent::time_offset_required_
std::vector< bool > time_offset_required_
Definition: nnet-convolutional-component-temp.h:338

kaldi::IsSortedAndUniq
bool IsSortedAndUniq(const std::vector< T > &vec)
Returns true if the vector is sorted and contains each element only once.
Definition: stl-utils.h:63

kaldi::VecVec
Real VecVec(const VectorBase< Real > &a, const VectorBase< Real > &b)
Returns dot product between v1 and v2.
Definition: kaldi-vector.cc:37

kaldi::nnet3::TimeHeightConvolutionComponent
TimeHeightConvolutionComponent implements 2-dimensional convolution where one of the dimensions of co...
Definition: nnet-convolutional-component-temp.h:212

kaldi::nnet3::TimeHeightConvolutionComponent::max_memory_mb_
BaseFloat max_memory_mb_
Definition: nnet-convolutional-component-temp.h:356

kaldi::nnet3::time_height_convolution::ConvolveForward
void ConvolveForward(const ConvolutionComputation &cc, const CuMatrixBase< BaseFloat > &input, const CuMatrixBase< BaseFloat > &params, CuMatrixBase< BaseFloat > *output)
This does the forward computation of convolution.
Definition: convolution.cc:524

kaldi::nnet3::TimeHeightConvolutionComponent::Info
virtual std::string Info() const
Returns some text-form information about this component, for diagnostics.
Definition: nnet-convolutional-component.cc:65

kaldi::nnet3::time_height_convolution::ConvolutionModel::Offset::time_offset
int32 time_offset
Definition: convolution.h:136

kaldi::nnet3::kNoTime
const int kNoTime
Definition: nnet-common.cc:573

kaldi::nnet3::OnlineNaturalGradient::GetRank
int32 GetRank() const
Definition: natural-gradient-online.h:433

kaldi::VectorBase::Range
SubVector< Real > Range(const MatrixIndexT o, const MatrixIndexT l)
Returns a sub-vector of a vector (a range of elements).
Definition: kaldi-vector.h:94

kaldi::nnet3::TimeHeightConvolutionComponent::PrecomputedIndexes::computation
time_height_convolution::ConvolutionComputation computation
Definition: nnet-convolutional-component-temp.h:299