doc/nnet3_2nnet-compute_8cc_source.html

 // nnet3/nnet-compute.cc

 // Copyright      2015  Johns Hopkins University (author: Daniel Povey)

 // See ../../COPYING for clarification regarding multiple authors
 //
 // Licensed under the Apache License, Version 2.0 (the "License");
 // you may not use this file except in compliance with the License.
 // You may obtain a copy of the License at
 //
 //  http://www.apache.org/licenses/LICENSE-2.0
 //
 // THIS CODE IS PROVIDED *AS IS* BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY
 // KIND, EITHER EXPRESS OR IMPLIED, INCLUDING WITHOUT LIMITATION ANY IMPLIED
 // WARRANTIES OR CONDITIONS OF TITLE, FITNESS FOR A PARTICULAR PURPOSE,
 // MERCHANTABLITY OR NON-INFRINGEMENT.
 // See the Apache 2 License for the specific language governing permissions and
 // limitations under the License.

 #include <iterator>
 #include <sstream>
 #include "nnet3/nnet-compute.h"

 namespace kaldi {
 namespace nnet3 {


 // Constructor for the case where 'nnet' is read-only.  Because 'nnet' cannot
 // be modified, the network used for storing stats (nnet_to_store_stats_) is
 // the same one that receives model updates, i.e. 'nnet_to_update' (which may
 // be NULL).  Execution starts at command 0; Init() does the remaining setup.
 NnetComputer::NnetComputer(const NnetComputeOptions &options,
                            const NnetComputation &computation,
                            const Nnet &nnet,
                            Nnet *nnet_to_update):
     options_(options),
     computation_(computation),
     nnet_(nnet),
     program_counter_(0),
     nnet_to_store_stats_(nnet_to_update),
     nnet_to_update_(nnet_to_update) {
   Init();
 }

 // Constructor for the case where 'nnet' is writable.  Here stats are stored
 // in '*nnet' itself (nnet_to_store_stats_ == nnet), while model updates, if
 // any, go to 'nnet_to_update'.  Execution starts at command 0; Init() does
 // the remaining setup.
 NnetComputer::NnetComputer(const NnetComputeOptions &options,
                            const NnetComputation &computation,
                            Nnet *nnet,
                            Nnet *nnet_to_update):
     options_(options),
     computation_(computation),
     nnet_(*nnet),
     program_counter_(0),
     nnet_to_store_stats_(nnet),
     nnet_to_update_(nnet_to_update) {
   Init();
 }

 void NnetComputer::Init() {
   KALDI_ASSERT(computation_.indexes_cuda.size() == computation_.indexes.size() &&
  computation_.indexes_ranges_cuda.size() == computation_.indexes_ranges.size() &&
                "You must call NnetComputation::ComputeCudaIndexes() before "
                "executing the computation.");
   matrices_.resize(computation_.matrices.size());
   debug_ = (options_.debug || GetVerboseLevel() >= 5);
   if (debug_) {
     ComputationVariables variables;
     variables.Init(computation_);
     ComputeCommandAttributes(nnet_, computation_, variables,
                              &command_attributes_);
     std::string preamble;
     computation_.GetCommandStrings(nnet_, &preamble, &command_strings_);
     KALDI_LOG << preamble;
     computation_.GetSubmatrixStrings(nnet_, &submatrix_strings_);
   }
 }

 //static
 // Returns sqrt(TraceMatMat(m, m, kTrans) / number-of-elements) for 'm', or
 // zero if 'm' has no rows.  (Presumably the trace is the sum of squared
 // elements, making this a root-mean-square value rather than a
 // mean-subtracted standard deviation -- TODO confirm.)  Only used to produce
 // the debugging output.
 BaseFloat NnetComputer::MatrixStddev(const CuMatrixBase<BaseFloat> &m) {
   if (m.NumRows() == 0)
     return 0.0;
   // Form the element count in floating point: multiplying NumRows() by
   // NumCols() in integer arithmetic can overflow for very large matrices,
   // which would give a garbage (possibly negative) denominator.
   const double num_elements =
       static_cast<double>(m.NumRows()) * static_cast<double>(m.NumCols());
   return static_cast<BaseFloat>(
       std::sqrt(TraceMatMat(m, m, kTrans) / num_elements));
 }

 //static
 // Returns sqrt(DotProduct(c, c) / NumParameters(c)) for an updatable
 // component 'c'.  It is an error (assertion failure) to call this with a
 // component that is not an UpdatableComponent.
 BaseFloat NnetComputer::ParameterStddev(const Component &c) {
   const UpdatableComponent *uc = dynamic_cast<const UpdatableComponent*>(&c);
   KALDI_ASSERT(uc != NULL &&
                "Attempting to get parameter stddev of non-updatable component");
   const auto self_dot_product = uc->DotProduct(*uc);
   const auto num_params = uc->NumParameters();
   return std::sqrt(self_dot_product / num_params);
 }

 // Debug-mode hook called just before command number 'command' is executed.
 // Stores in 'info' the MatrixStddev() of every matrix and (non-whole-matrix)
 // submatrix the command is recorded as writing, and, for a kBackprop command
 // on an updatable component, the ParameterStddev() of that component, so
 // that DebugAfterExecute() can print "before -> after" values.
 void NnetComputer::DebugBeforeExecute(int32 command,
                                       CommandDebugInfo *info) {
   // Whole matrices written by this command.
   const std::vector<int32> &mats_written =
       command_attributes_[command].matrices_written;
   info->matrices_written_stddevs.resize(mats_written.size());
   for (size_t k = 0; k < mats_written.size(); ++k) {
     const int32 matrix_index = mats_written[k];
     info->matrices_written_stddevs[k] = MatrixStddev(matrices_[matrix_index]);
   }

   // Submatrices written by this command.  Entries that correspond to a whole
   // matrix are skipped, so their slot in the vector is not assigned here.
   const std::vector<int32> &submats_written =
       command_attributes_[command].submatrices_written;
   info->submatrices_written_stddevs.resize(submats_written.size());
   for (size_t k = 0; k < submats_written.size(); ++k) {
     const int32 submatrix_index = submats_written[k];
     if (computation_.IsWholeMatrix(submatrix_index))
       continue;
     const CuSubMatrix<BaseFloat> part(GetSubMatrix(submatrix_index));
     info->submatrices_written_stddevs[k] = MatrixStddev(part);
   }

   // Parameter statistics are only recorded for kBackprop commands whose
   // component is updatable.
   const NnetComputation::Command &cmd = computation_.commands[command];
   if (cmd.command_type != kBackprop)
     return;
   const Component *comp = nnet_.GetComponent(cmd.arg1);
   if (comp->Properties() & kUpdatableComponent)
     info->components_parameter_stddev = ParameterStddev(*comp);
 }


 // Debug-mode hook called just after a command has been executed.  Logs one
 // line consisting of the command's string form, then "old->new" stddev values
 // for each matrix / non-whole-matrix submatrix the command writes (the 'old'
 // values come from 'info', as filled in by DebugBeforeExecute()), then the
 // parameter stddev change for kBackprop on an updatable component, and
 // finally the time the command took ('command_exec_time', in seconds).
 void NnetComputer::DebugAfterExecute(int32 command,
                                      const CommandDebugInfo &info,
                                      double command_exec_time) {
   std::ostringstream line;
   line << command_strings_[command] << "\t|\t";

   {  // Whole matrices written by the command.
     const std::vector<int32> &written =
         command_attributes_[command].matrices_written;
     size_t size = written.size();
     KALDI_ASSERT(info.matrices_written_stddevs.size() == size);
     for (size_t k = 0; k != size; ++k) {
       const int32 m = written[k];
       const BaseFloat before = info.matrices_written_stddevs[k];
       const BaseFloat after = MatrixStddev(matrices_[m]);
       line << 'm' << m << ": " << before << "->" << after << " ";
     }
   }

   {  // Submatrices written by the command (whole-matrix ones are skipped).
     const std::vector<int32> &written =
         command_attributes_[command].submatrices_written;
     size_t size = written.size();
     KALDI_ASSERT(info.submatrices_written_stddevs.size() == size);
     for (size_t k = 0; k != size; ++k) {
       const int32 s = written[k];
       if (computation_.IsWholeMatrix(s))
         continue;
       const CuSubMatrix<BaseFloat> part(GetSubMatrix(s));
       const BaseFloat before = info.submatrices_written_stddevs[k];
       const BaseFloat after = MatrixStddev(part);
       line << submatrix_strings_[s] << ": " << before << "->"
            << after << " ";
     }
   }

   // Parameter change, for kBackprop on an updatable component only.
   const NnetComputation::Command &cmd = computation_.commands[command];
   if (cmd.command_type == kBackprop) {
     const Component *comp = nnet_.GetComponent(cmd.arg1);
     if (comp->Properties() & kUpdatableComponent) {
       const std::string &name = nnet_.GetComponentName(cmd.arg1);
       line << name << ": " << info.components_parameter_stddev
            << "->" << ParameterStddev(*comp) << " ";
     }
   }

   line << "\t|\t time: " << command_exec_time << " secs";
   KALDI_LOG << line.str();
 }


 // Stores 'memo' (as returned by a component's Propagate()) in slot
 // 'memo_index' of memos_, growing memos_ with NULLs if required.  A
 // memo_index <= 0 means nobody will ask for the memo later; in that case a
 // non-NULL memo is handed straight back to the component 'c' for deletion.
 void NnetComputer::SaveMemo(int32 memo_index,
                             const Component &c, void *memo) {
   if (memo_index > 0) {
     if (static_cast<size_t>(memo_index) >= memos_.size())
       memos_.resize(memo_index + 1, NULL);
     memos_[memo_index] = memo;
     return;
   }
   // The memo is not wanted; free it now if one was actually produced.
   if (memo != NULL)
     c.DeleteMemo(memo);
 }

 // Retrieves the memo stored in slot 'memo_index' and clears that slot (sets
 // it to NULL) so the caller becomes responsible for the returned pointer.
 // Index 0 means "no memo" and yields NULL.  Asking for a slot beyond the end
 // of memos_ is reported via KALDI_ERR.
 void* NnetComputer::GetMemo(int32 memo_index) {
   if (memo_index == 0)
     return NULL;
   if (static_cast<size_t>(memo_index) >= memos_.size())
     KALDI_ERR << "Memo requested that was not generated.";
   void *stored = memos_[memo_index];
   memos_[memo_index] = NULL;
   return stored;
 }


 // Copy constructor.  Copies, member by member, every member named in the
 // initializer list below.  Note that compressed_matrices_ is not in that
 // list, so the copy starts out with it default-constructed.  Copying is
 // refused (KALDI_ERR) if the source object currently holds any memos, since
 // memos_ contains raw pointers.
 NnetComputer::NnetComputer(const NnetComputer &other):
     options_(other.options_), computation_(other.computation_),
     nnet_(other.nnet_), program_counter_(other.program_counter_),
     pending_commands_(other.pending_commands_),
     nnet_to_store_stats_(other.nnet_to_store_stats_),
     nnet_to_update_(other.nnet_to_update_), debug_(other.debug_),
     command_attributes_(other.command_attributes_),
     submatrix_strings_(other.submatrix_strings_),
     command_strings_(other.command_strings_),
     matrices_(other.matrices_), memos_(other.memos_) {
   const bool memos_in_use = !memos_.empty();
   if (memos_in_use) {
     KALDI_ERR << "You cannot use the copy constructor of NnetComputer if "
         "memos are used.";
   }
 }

 // Executes the single command computation_.commands[program_counter_].
 //
 // The command's integer arguments (c.arg1 ... c.arg7) and its scalar c.alpha
 // are interpreted according to c.command_type; see the individual cases
 // below.  This function does not advance program_counter_ itself (that is
 // done by the loop in Run()), except that kGotoLabel overwrites it.
 //
 // Anything thrown while executing the command is caught; some context is
 // logged (all previously executed command strings, if debug mode had not
 // already printed them) and the error is raised again via KALDI_ERR.
 void NnetComputer::ExecuteCommand() {
   const NnetComputation::Command &c = computation_.commands[program_counter_];
   int32 m1, m2;
   try {
     switch (c.command_type) {
       case kAllocMatrix:
         // c.arg1 is a submatrix index; the matrix it belongs to is resized to
         // the dimensions and stride type recorded in computation_.matrices,
         // with undefined contents.
         m1 = computation_.submatrices[c.arg1].matrix_index;
         matrices_[m1].Resize(computation_.matrices[m1].num_rows,
                              computation_.matrices[m1].num_cols,
                              kUndefined,
                              computation_.matrices[m1].stride_type);
         break;
       case kDeallocMatrix:
         // Releases the matrix underlying submatrix c.arg1 by resizing to 0x0.
         m1 = computation_.submatrices[c.arg1].matrix_index;
         matrices_[m1].Resize(0, 0);
         break;
       case kSwapMatrix:
         // Swaps the matrices underlying submatrices c.arg1 and c.arg2.
         m1 = computation_.submatrices[c.arg1].matrix_index;
         m2 = computation_.submatrices[c.arg2].matrix_index;
         matrices_[m1].Swap(&(matrices_[m2]));
         break;
       case kSetConst: {
         // Sets every element of submatrix c.arg1 to c.alpha (SetZero() is
         // used for the special case alpha == 0).
         CuSubMatrix<BaseFloat> s(GetSubMatrix(c.arg1));
         if (c.alpha == 0.0) s.SetZero();
         else s.Set(c.alpha);
         break;
       }
       case kPropagate: {
         // arg1: component index; arg2: index into
         // component_precomputed_indexes; arg3/arg4: input/output submatrix;
         // arg5: memo index (see SaveMemo); arg6: nonzero if stats should be
         // stored.
         NVTX_RANGE("NnetComputer::ExecuteCommand::kPropagate");
         const Component *component = nnet_.GetComponent(c.arg1);
         ComponentPrecomputedIndexes *indexes =
             computation_.component_precomputed_indexes[c.arg2].data;
         const CuSubMatrix<BaseFloat> input(GetSubMatrix(c.arg3));
         CuSubMatrix<BaseFloat> output(GetSubMatrix(c.arg4));
         void *memo = component->Propagate(indexes, input, &output);
         if (c.arg6) {  // need to store stats.
           KALDI_ASSERT(nnet_to_store_stats_ != NULL);
           Component *stats_component = nnet_to_store_stats_->GetComponent(c.arg1);
           bool was_in_place = (c.arg3 == c.arg4);
           // if propagate was in-place, provide empty matrix and not 'input', as
           // input is no longer valid.
           const CuSubMatrix<BaseFloat> maybe_input(
               GetSubMatrix(was_in_place ? 0 : c.arg3));
           stats_component->StoreStats(maybe_input, output, memo);
         }
         // Either keeps the memo for the matching backprop command or, if
         // c.arg5 <= 0, lets the component delete it right away.
         SaveMemo(c.arg5, *component, memo);
         break;
       }
       case kBackprop:
       case kBackpropNoModelUpdate:  {
         // arg1: component index; arg2: index into
         // component_precomputed_indexes; arg3..arg6: submatrix indexes of
         // in-value, out-value, out-deriv and in-deriv (arg6 == 0 means no
         // input derivative is wanted); arg7: memo index (see GetMemo).
         // NOTE(review): the NVTX range below is labelled
         // "kBackpropNoModelUpdate" for both command types.
         NVTX_RANGE("NnetComputer::ExecuteCommand::kBackpropNoModelUpdate");
         std::ostringstream debug_str;
         KALDI_ASSERT(nnet_to_update_ != NULL);
         debug_str << nnet_.GetComponentName(c.arg1);
         const Component *component = nnet_.GetComponent(c.arg1);
         KALDI_ASSERT(!(computation_.need_model_derivative && !nnet_to_update_));
         // 'upd_component' stays NULL for kBackpropNoModelUpdate.
         Component *upd_component = NULL;
         if (c.command_type == kBackprop) {  // this block sets 'upd_component'
           Nnet *nnet_to_update;
           if (component->Properties()&kUpdatableComponent) {
             nnet_to_update = (computation_.need_model_derivative ?
                               nnet_to_update_ : NULL);
           } else {
             // Some non-updatable components, such as CompositeComponent, store
             // stats in the backprop.  For other types of non-updatable
             // component, this arg won't matter.
             nnet_to_update = nnet_to_store_stats_;
           }
           if (nnet_to_update)
             upd_component = nnet_to_update->GetComponent(c.arg1);
         }
         ComponentPrecomputedIndexes *indexes =
             computation_.component_precomputed_indexes[c.arg2].data;
         const CuSubMatrix<BaseFloat> in_value(GetSubMatrix(c.arg3));
         const CuSubMatrix<BaseFloat> out_value(GetSubMatrix(c.arg4));
         const CuSubMatrix<BaseFloat> out_deriv(GetSubMatrix(c.arg5));
         CuSubMatrix<BaseFloat> in_deriv(GetSubMatrix(c.arg6));
         // GetMemo() hands over ownership of the memo (its slot is cleared),
         // so it is deleted below once Backprop() has used it.
         void *memo = GetMemo(c.arg7);
         component->Backprop(debug_str.str(), indexes,
                             in_value, out_value, out_deriv,
                             memo, upd_component,
                             c.arg6 == 0 ? NULL : &in_deriv);
         if (memo != NULL)
           component->DeleteMemo(memo);
         break;
       }
       case kMatrixCopy: {
         // dest (arg1) = alpha * src (arg2), done as a copy followed by an
         // optional scale.
         CuSubMatrix<BaseFloat> dest(GetSubMatrix(c.arg1));
         const CuSubMatrix<BaseFloat> src(GetSubMatrix(c.arg2));
         dest.CopyFromMat(src);
         if (c.alpha != 1.0)
           dest.Scale(c.alpha);  // note: in principle in future we could write a
                                 // kernel which would do this in one operation.
         break;
       }
       case kMatrixAdd: {
         // dest (arg1) += alpha * src (arg2).
         CuSubMatrix<BaseFloat> dest(GetSubMatrix(c.arg1));
         const CuSubMatrix<BaseFloat> src(GetSubMatrix(c.arg2));
         dest.AddMat(c.alpha, src);
         break;
       }
       case kAddRows: {
         // Row-indexed add from src (arg2) into dest (arg1), scaled by alpha;
         // the row indexes are computation_.indexes_cuda[arg3].
         CuSubMatrix<BaseFloat> dest(GetSubMatrix(c.arg1));
         const CuSubMatrix<BaseFloat> src(GetSubMatrix(c.arg2));
         const CuArray<int32> &indexes = computation_.indexes_cuda[c.arg3];
         dest.AddRows(c.alpha, src, indexes);
         break;
       }
       case kCopyRows: {
         // Row-indexed copy from src (arg2) into dest (arg1) using
         // computation_.indexes_cuda[arg3].  A non-unit alpha is emulated by
         // scaling dest by 1/alpha, copying, then scaling by alpha.
         // NOTE(review): when alpha == 0 the command is skipped entirely, so
         // dest keeps its previous contents rather than being zeroed --
         // confirm that this is the intended meaning for a copy.
         CuSubMatrix<BaseFloat> dest(GetSubMatrix(c.arg1));
         const CuSubMatrix<BaseFloat> src(GetSubMatrix(c.arg2));
         const CuArray<int32> &indexes = computation_.indexes_cuda[c.arg3];
         BaseFloat alpha = c.alpha;
         if (alpha != 1.0) {            // for now we're faking the 'alpha' thing because the CopyRows
           if (alpha == 0.0) break;     // command doesn't take that argument.
           dest.Scale(1.0 / alpha);
           dest.CopyRows(src, indexes);
           dest.Scale(c.alpha);
         } else {
           dest.CopyRows(src, indexes);
         }
         break;
       }
       case kCopyRowsMulti: {
         // Like kCopyRows, but each destination row has its own source
         // pointer, built by GetPointers() from computation_.indexes_multi[arg2].
         // NOTE(review): same alpha == 0 behaviour as kCopyRows (dest is left
         // untouched) -- confirm.
         CuSubMatrix<BaseFloat> dest(GetSubMatrix(c.arg1));
         CuArray<const BaseFloat*> pointers;
         GetPointers(c.arg2, dest.NumCols(), &pointers);
         BaseFloat alpha = c.alpha;
         if (alpha != 1.0) {            // for now we're faking the 'alpha' thing because the CopyRows
           if (alpha == 0.0) break;     // command doesn't take that argument.
           dest.Scale(1.0 / alpha);
           dest.CopyRows(pointers);
           dest.Scale(c.alpha);
         } else {
           dest.CopyRows(pointers);
         }
         break;
       }
       case kCopyToRowsMulti: {
         // Copies rows of src (arg1) out to the per-row destination pointers
         // built from computation_.indexes_multi[arg2].
         // If c.alpha is not 1.0, this command is not supported.
         KALDI_ASSERT(c.alpha == 1.0);
         CuSubMatrix<BaseFloat> src(GetSubMatrix(c.arg1));
         CuArray<BaseFloat*> pointers;
         GetPointers(c.arg2, src.NumCols(), &pointers);
         src.CopyToRows(pointers);
         break;
       }
       case kAddRowsMulti: {
         // Adds alpha times the rows addressed by the per-row source pointers
         // (from computation_.indexes_multi[arg2]) into dest (arg1).
         CuSubMatrix<BaseFloat> dest(GetSubMatrix(c.arg1));
         CuArray<const BaseFloat*> pointers;
         GetPointers(c.arg2, dest.NumCols(), &pointers);
         dest.AddRows(c.alpha, pointers);
         break;
       }
       case kAddToRowsMulti: {
         // Adds alpha times the rows of src (arg1) to the rows addressed by the
         // per-row destination pointers (from computation_.indexes_multi[arg2]).
         CuSubMatrix<BaseFloat> src(GetSubMatrix(c.arg1));
         CuArray<BaseFloat*> pointers;
         GetPointers(c.arg2, src.NumCols(), &pointers);
         src.AddToRows(c.alpha, pointers);
         break;
       }
       case kAddRowRanges: {
         // Adds ranges of rows of src (arg2) into dest (arg1); the ranges are
         // computation_.indexes_ranges_cuda[arg3].  A non-unit alpha is
         // emulated by scaling dest by 1/alpha, adding, then scaling by alpha;
         // alpha == 0 makes the command a no-op.
         CuSubMatrix<BaseFloat> dest(GetSubMatrix(c.arg1));
         const CuSubMatrix<BaseFloat> src(GetSubMatrix(c.arg2));
         const CuArray<Int32Pair> &pairs = computation_.indexes_ranges_cuda[c.arg3];
         BaseFloat alpha = c.alpha;
         if (alpha != 1.0) {            // for now we're faking the 'alpha' thing
                                        // because the AddRowRanges
           if (alpha == 0.0) break;     // command doesn't take that argument.
           dest.Scale(1.0 / alpha);
           dest.AddRowRanges(src, pairs);
           dest.Scale(c.alpha);
         } else {
           dest.AddRowRanges(src, pairs);
         }
         break;
       }
       case kCompressMatrix:
         // Replaces the matrix underlying submatrix arg1 by a compressed copy
         // stored in compressed_matrices_ and frees the original.  arg2 is the
         // compressed-matrix type, alpha the range and arg3 (nonzero) the
         // 'truncate' flag passed to NewCuCompressedMatrix().
         // This does nothing if CUDA is not in use.
  #if HAVE_CUDA == 1
         if (CuDevice::Instantiate().Enabled()) {
           // compressed_matrices_ is sized lazily, on first use.
           if (compressed_matrices_.empty())
             compressed_matrices_.resize(matrices_.size(), NULL);
           int32 m = computation_.submatrices[c.arg1].matrix_index;
           KALDI_ASSERT(compressed_matrices_[m] == NULL &&
                        matrices_[m].NumRows() != 0);
           BaseFloat range = c.alpha;
           bool truncate = (c.arg3 != 0);
           compressed_matrices_[m] = NewCuCompressedMatrix(
               static_cast<CuCompressedMatrixType>(c.arg2),
               range, truncate);
           compressed_matrices_[m]->CopyFromMat(matrices_[m]);
           matrices_[m].Resize(0, 0);
         }
  #endif
         break;
       case kDecompressMatrix:
         // Inverse of kCompressMatrix: re-allocates the matrix underlying
         // submatrix arg1, fills it from the compressed copy, then deletes the
         // compressed copy.  Does nothing if CUDA is not in use.
  #if HAVE_CUDA == 1
         if (CuDevice::Instantiate().Enabled()) {
           int32 m = computation_.submatrices[c.arg1].matrix_index;
           CuCompressedMatrixBase *compressed_matrix =
               compressed_matrices_[m];
           KALDI_ASSERT(compressed_matrix != NULL &&
                        matrices_[m].NumRows() == 0);
           matrices_[m].Resize(compressed_matrix->NumRows(),
                               compressed_matrix->NumCols(),
                               kUndefined,
                               computation_.matrices[m].stride_type);
           compressed_matrix->CopyToMat(&(matrices_[m]));
           delete compressed_matrix;
           compressed_matrices_[m] = NULL;
         }
  #endif
         break;
       case kNoOperation: case kNoOperationPermanent: case kNoOperationMarker:
       case kNoOperationLabel:
         // Nothing to execute for any of the no-op command types.
         break;
       case kGotoLabel:
         // Jumps to command c.arg1, which must be a kNoOperationLabel.  The
         // loop in Run() increments program_counter_ after this returns, so
         // execution resumes at the command following the label.
         KALDI_ASSERT(computation_.commands[c.arg1].command_type == kNoOperationLabel);
         program_counter_ = c.arg1;
         break;
       default:
         KALDI_ERR << "Invalid command in computation";
     }
   } catch (...) {
     // In debug mode command_strings_ was already filled in by Init() and each
     // command was logged as it ran; otherwise compute the strings now and
     // print everything that led up to the failing command.
     if (!debug_) {
       std::string preamble;
       computation_.GetCommandStrings(nnet_, &preamble, &command_strings_);
       KALDI_WARN << "Printing some background info since error was detected";
       KALDI_LOG << preamble;
       for (int32 prev_c = 0; prev_c < program_counter_; prev_c++)
         KALDI_LOG << command_strings_[prev_c];
     }
     // the following will re-throw the error, but now we've printed more info
     // about what went wrong.
     KALDI_ERR << "Error running command " << command_strings_[program_counter_];
   }
 }

 // Returns a CuSubMatrix view onto the region of matrices_ described by
 // computation_.submatrices[submatrix_index] (parent matrix, row/column
 // offsets and row/column counts).  The index is range-checked only via
 // KALDI_PARANOID_ASSERT.
 CuSubMatrix<BaseFloat> NnetComputer::GetSubMatrix(int32 submatrix_index) {
   KALDI_PARANOID_ASSERT(static_cast<size_t>(submatrix_index) <
                         computation_.submatrices.size());
   const NnetComputation::SubMatrixInfo &region =
       computation_.submatrices[submatrix_index];
   const CuMatrix<BaseFloat> &parent = matrices_[region.matrix_index];
   CuSubMatrix<BaseFloat> view(parent,
                               region.row_offset, region.num_rows,
                               region.col_offset, region.num_cols);
   return view;
 }

 // Converts computation_.indexes_multi[indexes_multi_index], a list of
 // (submatrix-index, row) pairs, into an array of raw row pointers and copies
 // it to '*pointers'.  A pair whose submatrix index is -1 becomes a NULL
 // pointer.  'num_cols' is only consulted by the KALDI_PARANOID spot check,
 // which verifies that sampled rows are in range and that the submatrices have
 // that many columns.
 void NnetComputer::GetPointers(int32 indexes_multi_index,
                                int32 num_cols,
                                CuArray<BaseFloat*> *pointers) {
   KALDI_ASSERT(static_cast<size_t>(indexes_multi_index)
                < computation_.indexes_multi.size());
   const std::vector<std::pair<int32,int32> > &pairs =
       computation_.indexes_multi[indexes_multi_index];
   int32 size = pairs.size();
   std::vector<BaseFloat*> vec(size);

   // the map "lookup" maps from submatrix index to the Data()
   // pointer of that submatrix, and the corresponding Stride().
   // It caches these so GetSubMatrix() is called once per distinct submatrix
   // rather than once per row.
   unordered_map<int32, std::pair<BaseFloat*, int32> > lookup;

   for (int32 i = 0; i < size; i++) {
     int32 submatrix_index = pairs[i].first, row = pairs[i].second;
     if (submatrix_index != -1) {
       unordered_map<int32, std::pair<BaseFloat*, int32> >::iterator
           iter = lookup.find(submatrix_index);
       if (iter == lookup.end()) {
         CuSubMatrix<BaseFloat> m = GetSubMatrix(submatrix_index);
         lookup[submatrix_index] = std::pair<BaseFloat*, int32>(m.Data(),
                                                                m.Stride());
         iter = lookup.find(submatrix_index);
       }
       BaseFloat *data = iter->second.first;
       int32 stride = iter->second.second;
       // Widen before multiplying: 'row * stride' evaluated in 32 bits can
       // overflow for matrices with more than 2^31 elements, which would
       // produce a wrong pointer.  (Row indexes are expected to be
       // non-negative here; the paranoid check below asserts that.)
       vec[i] = data + static_cast<size_t>(row) * static_cast<size_t>(stride);
     } else {
       // -1 is a marker that will be translated to NULL.
       vec[i] = NULL;
     }
   }
 #ifdef KALDI_PARANOID
   for (int32 i = 0; i < size; i += 30 + RandInt(0, 9)) {
     // Do a pseudo-random spot check that the row-indexes are not out of range.
     int32 submatrix_index = pairs[i].first, row = pairs[i].second;
     if (submatrix_index != -1) {
       CuSubMatrix<BaseFloat> m = GetSubMatrix(submatrix_index);
       KALDI_ASSERT(row >= 0 && row < m.NumRows() && num_cols == m.NumCols());
     }
   }
 #endif
   pointers->CopyFromVec(vec);
 }

 // Const-pointer overload: identical to the CuArray<BaseFloat*> version, to
 // which it forwards after reinterpreting the output array's element type.
 void NnetComputer::GetPointers(int32 indexes_multi_index,
                                int32 num_cols,
                                CuArray<const BaseFloat*> *pointers) {
   CuArray<BaseFloat*> *as_mutable =
       reinterpret_cast<CuArray<BaseFloat*>*>(pointers);
   GetPointers(indexes_multi_index, num_cols, as_mutable);
 }

 void NnetComputer::Run() {
   NVTX_RANGE(__func__);
   const std::vector<NnetComputation::Command> &c = computation_.commands;
   int32 num_commands = c.size();

   if (program_counter_ >= num_commands) {
     computation_.Print(std::cerr, nnet_);
     KALDI_ERR << "Running computation that has finished: program-counter="
               << program_counter_;
   }
   CheckNoPendingIo();

   CommandDebugInfo info;
   Timer timer;
   double total_elapsed_previous = 0.0;

   for (; program_counter_ < num_commands; program_counter_++) {
     if (c[program_counter_].command_type == kAcceptInput ||
         c[program_counter_].command_type == kProvideOutput) {
       // We have hit a part of the computation that requires user
       // interaction, e.g. the end of the forward or backward phase.
       break;
     }
     if (debug_)
       DebugBeforeExecute(program_counter_, &info);
     ExecuteCommand();
     if (debug_) {
       double total_elapsed_now = timer.Elapsed();
       DebugAfterExecute(program_counter_, info,
                         total_elapsed_now - total_elapsed_previous);
       total_elapsed_previous = total_elapsed_now;
     }
   }
 }

 void NnetComputer::AcceptInput(const std::string &node_name,
                                CuMatrix<BaseFloat> *input) {
   bool is_output = false;
   int32 matrix_index = GetIoMatrixIndex(node_name, is_output);

   const NnetComputation::MatrixInfo &matrix_info =
       computation_.matrices[matrix_index];
   if (input->NumRows() != matrix_info.num_rows) {
     KALDI_ERR << "Num-rows mismatch for input '" << node_name
               << "': " << matrix_info.num_rows
               <<  " in computation-request, " << input->NumRows()
               << " provided.";
   }
   if (input->NumCols() != matrix_info.num_cols) {
     KALDI_ERR << "Num-cols mismatch for input '" << node_name
               << "': " << matrix_info.num_cols
               <<  " in computation-request, " << input->NumCols()
               << " provided.";
   }
   if (matrix_info.stride_type == kDefaultStride ||
       input->Stride() == input->NumCols()) {
     matrices_[matrix_index].Swap(input);
   } else {
     matrices_[matrix_index].Resize(matrix_info.num_rows,
                                    matrix_info.num_cols,
                                    kUndefined, kStrideEqualNumCols);
     matrices_[matrix_index].CopyFromMat(*input);
     input->Resize(0, 0);
   }
 }

 // Returns a reference to the internally held matrix for output node
 // 'node_name'.  The output must be expected at this point of the computation
 // (see GetIoMatrixIndex()) and the matrix must be non-empty.
 const CuMatrixBase<BaseFloat> &NnetComputer::GetOutput(
     const std::string &node_name) {
   const int32 matrix_index = GetIoMatrixIndex(node_name, true /*is_output*/);
   KALDI_ASSERT(matrices_[matrix_index].NumRows() != 0);
   const CuMatrix<BaseFloat> &result = matrices_[matrix_index];
   return result;
 }


 void NnetComputer::GetOutputDestructive(const std::string &node_name,
                                         CuMatrix<BaseFloat> *output) {
   bool is_output = true;
   int32 matrix_index = GetIoMatrixIndex(node_name, is_output);
   KALDI_ASSERT(matrices_[matrix_index].NumRows() != 0);
   matrices_[matrix_index].Swap(output);
   matrices_[matrix_index].Resize(0, 0);
 }


 void NnetComputer::CheckNoPendingIo() {
   const std::vector<NnetComputation::Command> &c = computation_.commands;
   while (program_counter_ < static_cast<int32>(c.size()) &&
          (c[program_counter_].command_type == kAcceptInput ||
           c[program_counter_].command_type == kProvideOutput)) {
     pending_commands_.push_back(program_counter_);
     program_counter_++;
   }
   for (size_t i = 0; i < pending_commands_.size(); i++) {
     // the order here doesn't really matter; we go from back to front
     // as it's more efficient, not that efficiency really matters here.
     int32 command = pending_commands_[i];
     if (c[command].command_type == kAcceptInput) {
       // we can't ignore if we needed input from the user that hasn't been
       // provided.
       int32 node = c[command].arg2;
       KALDI_ERR << "Cannot run computation-- we did not get input for node '"
                 << nnet_.GetNodeName(node) << "'";
     }
   }
   pending_commands_.clear();
 }

 // Finds the matrix that corresponds to input or output node 'node_name' at
 // the current point in the computation, and returns its index in matrices_.
 //
 // The I/O commands that come next (skipping over kNoOperationMarker) are
 // first moved into pending_commands_, advancing program_counter_.  The
 // pending list is then searched for a command of the requested direction
 // ('is_output') on the requested node.  A matching input command is removed
 // from the list; a matching output command is left there so the same output
 // can be requested again.  Errors are raised if the node name is unknown, if
 // the command's submatrix is not a whole matrix, or if no matching command
 // is pending.
 int32 NnetComputer::GetIoMatrixIndex(const std::string &node_name, bool is_output) {
   const std::vector<NnetComputation::Command> &commands = computation_.commands;
   const int32 node_index = nnet_.GetNodeIndex(node_name);
   if (node_index == -1)
     KALDI_ERR << "No node named '" << node_name << "'in network.";

   // first make sure all the I/O commands that we immediately expect, are listed
   // in 'pending_commands_'.
   const int32 num_commands = static_cast<int32>(computation_.commands.size());
   for (; program_counter_ < num_commands; program_counter_++) {
     const NnetComputation::Command &next = commands[program_counter_];
     if (next.command_type == kNoOperationMarker)
       continue;  // markers are stepped over but not recorded.
     if (next.command_type != kAcceptInput &&
         next.command_type != kProvideOutput)
       break;
     pending_commands_.push_back(program_counter_);
   }

   for (size_t pos = 0; pos < pending_commands_.size(); pos++) {
     const NnetComputation::Command &pending = commands[pending_commands_[pos]];
     const bool pending_is_output = (pending.command_type == kProvideOutput);
     if (pending_is_output != is_output || pending.arg2 != node_index)
       continue;

     const int32 submatrix_index = pending.arg1;
     if (!is_output) {
       // don't erase the command for outputs, as that would prevent things
       // from being output twice, which is an unnecessary restriction.
       pending_commands_.erase(pending_commands_.begin() + pos);
     }
     if (!(computation_.IsWholeMatrix(submatrix_index)))
       KALDI_ERR << "Getting input or output that is not a whole matrix "
                 << "(probably some optimization code needs to be changed)";
     return computation_.submatrices[submatrix_index].matrix_index;
   }

   // if you get the following error it will likely be a bug in the calling code,
   // or possibly due to giving the wrong egs.
   KALDI_ERR << "Could not "
             << (is_output ? "provide output " : "accept input ")
             << "for network node " << node_name
             << " (it is not expected at this point in the computation)";
   return 0;  // Suppress compiler warnings; this line will never be reached.
 }


 void NnetComputer::AcceptInputs(const Nnet &nnet,
                                 const std::vector<NnetIo> &io_vec) {
   for (size_t i = 0; i < io_vec.size(); i++) {
     const NnetIo &io = io_vec[i];
     int32 node_index = nnet.GetNodeIndex(io.name);
     if (node_index == -1)
       KALDI_ERR << "No node named '" << io.name << "' in nnet.";
     if (nnet.IsInputNode(node_index)) {
       CuMatrix<BaseFloat> cu_input(io.features.NumRows(),
                                    io.features.NumCols(),
                                    kUndefined);
       cu_input.CopyFromGeneralMat(io.features);
       this->AcceptInput(io.name, &cu_input);
     }
   }
 }

 // Destructor.  Frees any compressed matrices that are still held.  If the
 // computation was run to completion these should all have been deleted and
 // set to NULL already (see kDecompressMatrix); entries can remain if, for
 // example, someone ran the forward propagation but not the backprop.
 NnetComputer::~NnetComputer() {
   const size_t num_slots = compressed_matrices_.size();
   for (size_t slot = 0; slot != num_slots; ++slot) {
     // Deleting a NULL pointer is a no-op, so no check is needed.
     delete compressed_matrices_[slot];
   }
 }

 } // namespace nnet3
 } // namespace kaldi
kaldi::nnet3::NnetComputer::GetPointers
void GetPointers(int32 indexes_multi_index, int32 num_cols, CuArray< BaseFloat *> *pointers)
Definition: nnet-compute.cc:459

kaldi::nnet3::ComputationVariables::Init
void Init(const NnetComputation &computation)
Definition: nnet-analyze.cc:133

kaldi::nnet3::NnetComputation::Command::arg2
int32 arg2
Definition: nnet-computation.h:342

kaldi::CuMatrixBase::CopyFromMat
void CopyFromMat(const MatrixBase< OtherReal > &src, MatrixTransposeType trans=kNoTrans)
Definition: cu-matrix.cc:344

kaldi
This code computes Goodness of Pronunciation (GOP) and extracts phone-level pronunciation feature for...
Definition: chain.dox:20

kaldi::nnet3::NnetIo
Definition: nnet-example.h:33

nnet-compute.h

kaldi::CuMatrixBase::Stride
MatrixIndexT Stride() const
Definition: cu-matrix.h:217

kaldi::nnet3::kMatrixCopy
Definition: nnet-computation.h:291

kaldi::kUndefined
Definition: matrix-common.h:39

kaldi::nnet3::Component::Propagate
virtual void * Propagate(const ComponentPrecomputedIndexes *indexes, const CuMatrixBase< BaseFloat > &in, CuMatrixBase< BaseFloat > *out) const =0
Propagate function.

kaldi::CuArray::CopyFromVec
void CopyFromVec(const std::vector< T > &src)
This function resizes if needed.
Definition: cu-array-inl.h:120

kaldi::nnet3::NnetComputer::CommandDebugInfo::matrices_written_stddevs
std::vector< BaseFloat > matrices_written_stddevs
Definition: nnet-compute.h:209

kaldi::kStrideEqualNumCols
Definition: matrix-common.h:46

kaldi::nnet3::NnetComputer::program_counter_
int32 program_counter_
Definition: nnet-compute.h:136

kaldi::nnet3::NnetComputation::Command::arg7
int32 arg7
Definition: nnet-computation.h:347

kaldi::nnet3::Nnet::GetNodeName
const std::string & GetNodeName(int32 node_index) const
returns individual node name.
Definition: nnet-nnet.cc:684

kaldi::nnet3::kNoOperationPermanent
Definition: nnet-computation.h:295

kaldi::nnet3::kSwapMatrix
Definition: nnet-computation.h:289

kaldi::nnet3::Component
Abstract base-class for neural-net components.
Definition: nnet-component-itf.h:114

kaldi::CuMatrixBase::AddRows
void AddRows(Real alpha, const CuMatrixBase< Real > &src, const CuArrayBase< MatrixIndexT > &indexes)
Does for each row r, this.Row(r) += alpha * src.row(indexes[r]).
Definition: cu-matrix.cc:2766

kaldi::CuMatrixBase::AddRowRanges
void AddRowRanges(const CuMatrixBase< Real > &src, const CuArrayBase< Int32Pair > &indexes)
For each row r of this and for each column c, do (*this)(r, c) +=  src(j, c), where j ranges from ind...
Definition: cu-matrix.cc:2931

kaldi::GetVerboseLevel
int32 GetVerboseLevel()
Get verbosity level, usually set via command line '--verbose=' switch.
Definition: kaldi-error.h:60

kaldi::nnet3::kProvideOutput
Definition: nnet-computation.h:294

kaldi::nnet3::NnetComputer::options_
const NnetComputeOptions & options_
Definition: nnet-compute.h:132

kaldi::nnet3::kNoOperation
Definition: nnet-computation.h:295

kaldi::nnet3::kUpdatableComponent
Definition: nnet-component-itf.h:42

kaldi::nnet3::NnetComputer::Init
void Init()
Definition: nnet-compute.cc:48

kaldi::nnet3::UpdatableComponent::NumParameters
virtual int32 NumParameters() const
The following new virtual function returns the total dimension of the parameters in this class...
Definition: nnet-component-itf.h:530

kaldi::nnet3::NnetComputation::SubMatrixInfo
Definition: nnet-computation.h:323

kaldi::nnet3::NnetComputation::Print
void Print(std::ostream &os, const Nnet &nnet) const
Definition: nnet-computation.cc:717

kaldi::nnet3::NnetComputer::command_attributes_
std::vector< CommandAttributes > command_attributes_
Definition: nnet-compute.h:153

kaldi::nnet3::NnetComputeOptions::debug
bool debug
Definition: nnet-compute.h:40

kaldi::nnet3::NnetComputer::GetMemo
void * GetMemo(int32 memo_index)
Definition: nnet-compute.cc:176

kaldi::nnet3::Nnet::IsInputNode
bool IsInputNode(int32 node) const
Returns true if this is an input node, meaning that it is of type kInput.
Definition: nnet-nnet.cc:120

kaldi::nnet3::kCopyRowsMulti
Definition: nnet-computation.h:292

kaldi::int32
kaldi::int32 int32
Definition: online-tcp-source.cc:27

kaldi::nnet3::NnetComputation::Command::arg6
int32 arg6
Definition: nnet-computation.h:346

kaldi::nnet3::NnetIo::features
GeneralMatrix features
The features or labels.
Definition: nnet-example.h:46

kaldi::nnet3::kDeallocMatrix
Definition: nnet-computation.h:289

kaldi::CuMatrixBase::AddMat
void AddMat(Real alpha, const CuMatrixBase< Real > &A, MatrixTransposeType trans=kNoTrans)
*this += alpha * A
Definition: cu-matrix.cc:954

kaldi::nnet3::NnetComputation::matrices
std::vector< MatrixInfo > matrices
Definition: nnet-computation.h:390

kaldi::nnet3::kGotoLabel
Definition: nnet-computation.h:296

kaldi::CuMatrix
This class represents a matrix that's stored on the GPU if we have one, and in memory if not...
Definition: matrix-common.h:71

kaldi::nnet3::kCopyRows
Definition: nnet-computation.h:291

kaldi::nnet3::kAddRows
Definition: nnet-computation.h:291

kaldi::nnet3::NnetComputer::NnetComputer
NnetComputer(const NnetComputeOptions &options, const NnetComputation &computation, const Nnet &nnet, Nnet *nnet_to_update)
Constructor.
Definition: nnet-compute.cc:28

kaldi::nnet3::Component::DeleteMemo
virtual void DeleteMemo(void *memo) const
This virtual function only needs to be overwritten by Components that return a non-NULL memo from the...
Definition: nnet-component-itf.h:376

kaldi::nnet3::ComputeCommandAttributes
void ComputeCommandAttributes(const Nnet &nnet, const NnetComputation &computation, const ComputationVariables &vars, std::vector< CommandAttributes > *attributes)
Definition: nnet-analyze.cc:284

kaldi::nnet3::kAcceptInput
Definition: nnet-computation.h:294

kaldi::nnet3::kCompressMatrix
Definition: nnet-computation.h:293

kaldi::nnet3::NnetComputation::commands
std::vector< Command > commands
Definition: nnet-computation.h:439

kaldi::nnet3::kAllocMatrix
Definition: nnet-computation.h:289

kaldi::nnet3::NnetComputation::MatrixInfo::stride_type
MatrixStrideType stride_type
Definition: nnet-computation.h:307

kaldi::nnet3::NnetComputeOptions
Definition: nnet-compute.h:39

kaldi::nnet3::NnetComputer::CommandDebugInfo::submatrices_written_stddevs
std::vector< BaseFloat > submatrices_written_stddevs
Definition: nnet-compute.h:213

kaldi::nnet3::kSetConst
Definition: nnet-computation.h:289

kaldi::nnet3::Component::Backprop
virtual void Backprop(const std::string &debug_info, const ComponentPrecomputedIndexes *indexes, const CuMatrixBase< BaseFloat > &in_value, const CuMatrixBase< BaseFloat > &out_value, const CuMatrixBase< BaseFloat > &out_deriv, void *memo, Component *to_update, CuMatrixBase< BaseFloat > *in_deriv) const =0
Backprop function; depending on which of the arguments 'to_update' and 'in_deriv' are non-NULL...

kaldi::nnet3::NnetComputer::~NnetComputer
~NnetComputer()
Definition: nnet-compute.cc:680

kaldi::nnet3::kMatrixAdd
Definition: nnet-computation.h:291

kaldi::nnet3::NnetComputation::Command::arg4
int32 arg4
Definition: nnet-computation.h:344

kaldi::nnet3::NnetComputation::Command::arg1
int32 arg1
Definition: nnet-computation.h:341

kaldi::kTrans
Definition: matrix-common.h:33

kaldi::CuMatrixBase::Scale
void Scale(Real value)
Definition: cu-matrix.cc:644

kaldi::nnet3::kNoOperationMarker
Definition: nnet-computation.h:295

kaldi::nnet3::NnetComputer::AcceptInput
void AcceptInput(const std::string &node_name, CuMatrix< BaseFloat > *input)
e.g.
Definition: nnet-compute.cc:547

kaldi::GeneralMatrix::NumCols
MatrixIndexT NumCols() const
Definition: sparse-matrix.cc:791

kaldi::nnet3::kCopyToRowsMulti
Definition: nnet-computation.h:292

kaldi::nnet3::NnetComputer::pending_commands_
std::vector< int32 > pending_commands_
Definition: nnet-compute.h:141

kaldi::nnet3::NnetComputer::nnet_
const Nnet & nnet_
Definition: nnet-compute.h:134

kaldi::nnet3::NnetComputation::MatrixInfo
Definition: nnet-computation.h:304

kaldi::nnet3::NnetComputer::compressed_matrices_
std::vector< CuCompressedMatrixBase * > compressed_matrices_
Definition: nnet-compute.h:173

kaldi::nnet3::NnetComputation::GetCommandStrings
void GetCommandStrings(const Nnet &nnet, std::string *preamble, std::vector< std::string > *command_strings) const
Definition: nnet-computation.cc:944

kaldi::nnet3::NnetComputation::indexes_cuda
std::vector< CuArray< int32 > > indexes_cuda
Definition: nnet-computation.h:445

kaldi::nnet3::NnetComputer::ExecuteCommand
void ExecuteCommand()
Definition: nnet-compute.cc:210

kaldi::nnet3::ComputationVariables
This class relates the matrices and sub-matrices in the computation to imaginary "variables", such that we can think of the operations as operating on sets of individual variables, and we can then do analysis that lets us do optimization.
Definition: nnet-analyze.h:121

kaldi::nnet3::NnetComputation::need_model_derivative
bool need_model_derivative
Definition: nnet-computation.h:442

kaldi::nnet3::NnetComputation::MatrixInfo::num_cols
int32 num_cols
Definition: nnet-computation.h:306

kaldi::nnet3::NnetComputer::GetOutput
const CuMatrixBase< BaseFloat > & GetOutput(const std::string &node_name)
Definition: nnet-compute.cc:578

kaldi::nnet3::NnetComputer::DebugBeforeExecute
void DebugBeforeExecute(int32 command, CommandDebugInfo *info)
Definition: nnet-compute.cc:82

float

kaldi::nnet3::NnetComputation::indexes_multi
std::vector< std::vector< std::pair< int32, int32 > > > indexes_multi
Definition: nnet-computation.h:425

kaldi::nnet3::NnetComputer::nnet_to_store_stats_
Nnet * nnet_to_store_stats_
Definition: nnet-compute.h:146

kaldi::nnet3::NnetComputer::CheckNoPendingIo
void CheckNoPendingIo()
Definition: nnet-compute.cc:597

kaldi::nnet3::Component::StoreStats
virtual void StoreStats(const CuMatrixBase< BaseFloat > &in_value, const CuMatrixBase< BaseFloat > &out_value, void *memo)
This function may store stats on average activation values, and for some component types...
Definition: nnet-component-itf.h:186

kaldi::nnet3::UpdatableComponent::DotProduct
virtual BaseFloat DotProduct(const UpdatableComponent &other) const =0
Computes dot-product between parameters of two instances of a Component.

kaldi::nnet3::Component::Properties
virtual int32 Properties() const =0
Return bitmask of the component's properties.

kaldi::nnet3::NnetComputation::Command::alpha
BaseFloat alpha
Definition: nnet-computation.h:340

kaldi::CuMatrixBase::AddToRows
void AddToRows(Real alpha, const CuArrayBase< MatrixIndexT > &indexes, CuMatrixBase< Real > *dst) const
For each row i of *this, adds this->Row(i) to dst->Row(indexes(i)) if indexes(i) >= 0...
Definition: cu-matrix.cc:2869

kaldi::CuMatrixBase::SetZero
void SetZero()
Math operations, some calling kernels.
Definition: cu-matrix.cc:509

kaldi::nnet3::NnetComputer::AcceptInputs
void AcceptInputs(const Nnet &nnet, const std::vector< NnetIo > &io)
This convenience function calls AcceptInput() in turn on all the inputs in the training example...
Definition: nnet-compute.cc:663

kaldi::kDefaultStride
Definition: matrix-common.h:45

kaldi::nnet3::NnetComputer::ParameterStddev
static BaseFloat ParameterStddev(const Component &c)
Definition: nnet-compute.cc:75

kaldi::nnet3::NnetComputer::CommandDebugInfo::components_parameter_stddev
BaseFloat components_parameter_stddev
Definition: nnet-compute.h:217

kaldi::nnet3::NnetComputation::submatrices
std::vector< SubMatrixInfo > submatrices
Definition: nnet-computation.h:404

kaldi::CuMatrixBase::CopyRows
void CopyRows(const CuMatrixBase< Real > &src, const CuArrayBase< MatrixIndexT > &indexes)
Copies row r from row indexes[r] of src.
Definition: cu-matrix.cc:2678

kaldi::nnet3::NnetComputation::Command
Definition: nnet-computation.h:338

kaldi::nnet3::Nnet
Definition: nnet-nnet.h:115

KALDI_ERR
#define KALDI_ERR
Definition: kaldi-error.h:147

KALDI_PARANOID_ASSERT
#define KALDI_PARANOID_ASSERT(cond)
Definition: kaldi-error.h:206

kaldi::nnet3::NnetComputer::GetIoMatrixIndex
int32 GetIoMatrixIndex(const std::string &node_name, bool is_output)
Definition: nnet-compute.cc:620

KALDI_WARN
#define KALDI_WARN
Definition: kaldi-error.h:150

kaldi::nnet3::kAddRowsMulti
Definition: nnet-computation.h:292

kaldi::TraceMatMat
Real TraceMatMat(const MatrixBase< Real > &A, const MatrixBase< Real > &B, MatrixTransposeType trans)
We need to declare this here as it will be a friend function.
Definition: kaldi-matrix.cc:2692

kaldi::nnet3::NnetComputation::indexes_ranges_cuda
std::vector< CuArray< Int32Pair > > indexes_ranges_cuda
Definition: nnet-computation.h:448

kaldi::nnet3::Nnet::GetComponentName
const std::string & GetComponentName(int32 component_index) const
returns individual component name.
Definition: nnet-nnet.cc:689

kaldi::CuSubMatrix
This class is used for a piece of a CuMatrix.
Definition: matrix-common.h:70

kaldi::nnet3::NnetComputation::Command::command_type
CommandType command_type
Definition: nnet-computation.h:339

kaldi::nnet3::kBackpropNoModelUpdate
Definition: nnet-computation.h:290

kaldi::nnet3::NnetComputer::computation_
const NnetComputation & computation_
Definition: nnet-compute.h:133

kaldi::nnet3::Nnet::GetComponent
Component * GetComponent(int32 c)
Return component indexed c. Not a copy; not owned by caller.
Definition: nnet-nnet.cc:150

kaldi::Timer
Definition: timer.h:63

kaldi::nnet3::UpdatableComponent
Class UpdatableComponent is a Component which has trainable parameters; it extends the interface of C...
Definition: nnet-component-itf.h:455

kaldi::nnet3::NnetComputer::matrices_
std::vector< CuMatrix< BaseFloat > > matrices_
Definition: nnet-compute.h:160

kaldi::CuMatrixBase::CopyFromGeneralMat
void CopyFromGeneralMat(const GeneralMatrix &src, MatrixTransposeType trans=kNoTrans)
Definition: cu-matrix.cc:3096

kaldi::nnet3::NnetComputation::component_precomputed_indexes
std::vector< PrecomputedIndexesInfo > component_precomputed_indexes
Definition: nnet-computation.h:412

kaldi::nnet3::NnetComputer::CommandDebugInfo
Definition: nnet-compute.h:205

kaldi::CuMatrixBase::Data
const Real * Data() const
Return data pointer (const).
Definition: cu-matrix.h:746

rnnlm::i
int i
Definition: mikolov-rnnlm-lib.cc:66

kaldi::nnet3::NnetComputer::SaveMemo
void SaveMemo(int32 memo_index, const Component &c, void *memo)
Definition: nnet-compute.cc:163

kaldi::nnet3::kBackprop
Definition: nnet-computation.h:290

kaldi::CuMatrixBase
Matrix for CUDA computing.
Definition: matrix-common.h:69

kaldi::CuMatrixBase::NumCols
MatrixIndexT NumCols() const
Definition: cu-matrix.h:216

kaldi::nnet3::NnetComputer::submatrix_strings_
std::vector< std::string > submatrix_strings_
Definition: nnet-compute.h:155

kaldi::nnet3::ComponentPrecomputedIndexes
Definition: nnet-component-itf.h:97

kaldi::nnet3::NnetComputer
class NnetComputer is responsible for executing the computation described in the "computation" object...
Definition: nnet-compute.h:59

kaldi::nnet3::kNoOperationLabel
Definition: nnet-computation.h:295

kaldi::CuArray< int32 >

kaldi::nnet3::NnetComputation
Definition: nnet-computation.h:303

KALDI_ASSERT
#define KALDI_ASSERT(cond)
Definition: kaldi-error.h:185

kaldi::GeneralMatrix::NumRows
MatrixIndexT NumRows() const
Definition: sparse-matrix.cc:781

NVTX_RANGE
#define NVTX_RANGE(name)
Definition: cu-common.h:143

kaldi::nnet3::NnetComputation::Command::arg5
int32 arg5
Definition: nnet-computation.h:345

kaldi::nnet3::NnetIo::name
std::string name
the name of the input in the neural net; in simple setups it will just be "input".
Definition: nnet-example.h:36

kaldi::nnet3::kPropagate
Definition: nnet-computation.h:290

kaldi::nnet3::NnetComputer::command_strings_
std::vector< std::string > command_strings_
Definition: nnet-compute.h:157

kaldi::nnet3::NnetComputer::MatrixStddev
static BaseFloat MatrixStddev(const CuMatrixBase< BaseFloat > &m)
Definition: nnet-compute.cc:68

kaldi::nnet3::NnetComputation::indexes
std::vector< std::vector< int32 > > indexes
Definition: nnet-computation.h:419

kaldi::CuMatrixBase::CopyToRows
void CopyToRows(const CuArrayBase< Real *> &dst) const
For each row r of this matrix, copies it to the array of floats at the location given by dst[r]...
Definition: cu-matrix.cc:2744

kaldi::nnet3::NnetComputer::GetOutputDestructive
void GetOutputDestructive(const std::string &output_name, CuMatrix< BaseFloat > *output)
Definition: nnet-compute.cc:587

kaldi::nnet3::Nnet::GetNodeIndex
int32 GetNodeIndex(const std::string &node_name) const
returns index associated with this node name, or -1 if no such index.
Definition: nnet-nnet.cc:466

kaldi::nnet3::kAddToRowsMulti
Definition: nnet-computation.h:292

kaldi::CuMatrixBase::NumRows
MatrixIndexT NumRows() const
Dimensions.
Definition: cu-matrix.h:215

kaldi::nnet3::kDecompressMatrix
Definition: nnet-computation.h:293

kaldi::CuCompressedMatrixBase
Class CuCompressedMatrixBase is an abstract base class that allows you to compress a matrix of type C...
Definition: cu-compressed-matrix.h:35

kaldi::nnet3::NnetComputation::MatrixInfo::num_rows
int32 num_rows
Definition: nnet-computation.h:305

kaldi::nnet3::NnetComputer::nnet_to_update_
Nnet * nnet_to_update_
Definition: nnet-compute.h:150

KALDI_LOG
#define KALDI_LOG
Definition: kaldi-error.h:153

kaldi::Timer::Elapsed
double Elapsed() const
Returns time in seconds.
Definition: timer.h:74

kaldi::nnet3::NnetComputer::GetSubMatrix
CuSubMatrix< BaseFloat > GetSubMatrix(int32 submatrix_index)
Definition: nnet-compute.cc:449

kaldi::nnet3::kAddRowRanges
Definition: nnet-computation.h:293

kaldi::CuMatrixBase::Set
void Set(Real value)
Definition: cu-matrix.cc:531

kaldi::CuCompressedMatrixBase::NumRows
virtual int32 NumRows() const =0

kaldi::nnet3::NnetComputer::debug_
bool debug_
Definition: nnet-compute.h:151

kaldi::nnet3::NnetComputation::IsWholeMatrix
bool IsWholeMatrix(int32 submatrix_index) const
Definition: nnet-computation.cc:975

kaldi::NewCuCompressedMatrix
CuCompressedMatrixBase * NewCuCompressedMatrix(CuCompressedMatrixType t, BaseFloat range, bool truncat)
This function allocates a new CuCompressedMatrix with type determined by t, and with the 'range' and ...
Definition: cu-compressed-matrix.cc:119

kaldi::CuMatrix::Resize
void Resize(MatrixIndexT rows, MatrixIndexT cols, MatrixResizeType resize_type=kSetZero, MatrixStrideType stride_type=kDefaultStride)
Allocate the memory.
Definition: cu-matrix.cc:50

kaldi::nnet3::NnetComputation::Command::arg3
int32 arg3
Definition: nnet-computation.h:343

kaldi::RandInt
int32 RandInt(int32 min_val, int32 max_val, struct RandomState *state)
Definition: kaldi-math.cc:95

kaldi::nnet3::NnetComputer::memos_
std::vector< void * > memos_
Definition: nnet-compute.h:165

kaldi::CuCompressedMatrixBase::NumCols
virtual int32 NumCols() const =0

kaldi::CuCompressedMatrixBase::CopyToMat
virtual void CopyToMat(CuMatrixBase< BaseFloat > *mat) const =0
Copies the contents of *this to 'mat', which should be correctly sized beforehand.

kaldi::nnet3::NnetComputation::GetSubmatrixStrings
void GetSubmatrixStrings(const Nnet &nnet, std::vector< std::string > *submat_strings) const
Definition: nnet-computation.cc:424

kaldi::nnet3::NnetComputer::DebugAfterExecute
void DebugAfterExecute(int32 command, const CommandDebugInfo &info, double command_execution_time)
Definition: nnet-compute.cc:116

kaldi::nnet3::NnetComputer::Run
void Run()
This does either the forward or backward computation, depending when it is called (in a typical compu...
Definition: nnet-compute.cc:512

kaldi::nnet3::NnetComputation::indexes_ranges
std::vector< std::vector< std::pair< int32, int32 > > > indexes_ranges
Definition: nnet-computation.h:430