doc/nnet3-xvector-compute-batched_8cc_source.html

 // nnet3bin/nnet3-xvector-compute-batched.cc

 // Copyright 2019   Daniel Povey
 //           2017   Johns Hopkins University (author: Daniel Povey)
 //           2017   Johns Hopkins University (author: Daniel Garcia-Romero)
 //           2017   David Snyder

 // See ../../COPYING for clarification regarding multiple authors
 //
 // Licensed under the Apache License, Version 2.0 (the "License");
 // you may not use this file except in compliance with the License.
 // You may obtain a copy of the License at
 //
 //  http://www.apache.org/licenses/LICENSE-2.0
 //
 // THIS CODE IS PROVIDED *AS IS* BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY
 // KIND, EITHER EXPRESS OR IMPLIED, INCLUDING WITHOUT LIMITATION ANY IMPLIED
 // WARRANTIES OR CONDITIONS OF TITLE, FITNESS FOR A PARTICULAR PURPOSE,
 // MERCHANTABLITY OR NON-INFRINGEMENT.
 // See the Apache 2 License for the specific language governing permissions and
 // limitations under the License.


 #include "base/kaldi-common.h"
 #include "util/common-utils.h"
 #include "nnet3/nnet-am-decodable-simple.h"
 #include "base/timer.h"
 #include "nnet3/nnet-utils.h"

 namespace kaldi {
 namespace nnet3 {


 struct BatchedXvectorComputerOptions {
   int32 chunk_size { 150 };
   int32 batch_size { 32 };
   bool pad_input { true };
   NnetComputeOptions compute_config;
   NnetOptimizeOptions optimize_config;
   CachingOptimizingCompilerOptions compiler_config;


   void Register(OptionsItf *po) {
     po->Register("chunk-size", &chunk_size,
                  "Size of chunk, in input frames.  Includes the nnet "
                  "context, so the number of chunks will be more than "
                  "total-input-frames / chunk-size.");
     po->Register("batch-size", &batch_size,
                  "Size of the batches of chunks that we compute at once. ");
     po->Register("pad-input", &pad_input,
                  "If true, for utterances shorter than `chunk-size` frames "
                  "we will pad with repeats of the last frame.");
     compute_config.Register(po);
     optimize_config.Register(po);
     compiler_config.Register(po);
   }
 };


 // Splits the integer 'a' into 'b' integer pieces whose sum is 'a' and whose
 // magnitudes differ by at most one.  The pieces of smaller magnitude are
 // written first, and every piece carries the sign of 'a'.
 //   a:       the number to divide; may be negative.
 //   b:       the number of pieces; must be positive.
 //   pieces:  output; cleared and then filled with exactly 'b' values.
 void DivideIntoPieces(int32 a, int32 b, std::vector<int32> *pieces) {
   KALDI_ASSERT(b > 0);
   pieces->clear();
   pieces->reserve(b);
   // Do the integer division on the magnitude of 'a' and re-apply the sign
   // when the pieces are written out.
   const int32 sign = (a < 0 ? -1 : 1);
   const int32 magnitude = a * sign;
   const int32 small_piece = magnitude / b,
       large_piece = small_piece + 1,
       num_large = magnitude % b,
       num_small = b - num_large;
   KALDI_ASSERT(magnitude == num_small * small_piece +
                num_large * large_piece);

   // Growing the (empty) vector in two steps appends num_small copies of the
   // small piece followed by num_large copies of the large piece.
   pieces->resize(num_small, small_piece * sign);
   pieces->resize(num_small + num_large, large_piece * sign);
 }


 // Computes one xvector per utterance by cutting the utterance's features into
 // chunks of opts.chunk_size frames, evaluating the network on batches of
 // opts.batch_size chunks, and averaging the chunk-level network outputs.
 //
 // Typical use: call AcceptUtterance() for every utterance; after each call,
 // and again after a final Flush(), drain the results with
 //   while (XvectorReady()) OutputXvector(&utt, &xvector);
 // Xvectors are output in the order in which the utterances were accepted.
 class BatchedXvectorComputer {
  public:
   // opts:           configuration; stored by reference, so it must outlive
   //                 this object.
   // nnet:           the network to evaluate; stored by reference, so it must
   //                 outlive this object.
   // total_context:  value subtracted from the chunk size and from the
   //                 utterance length when deciding where chunks start (the
   //                 caller passes left-context + right-context).
   BatchedXvectorComputer(const BatchedXvectorComputerOptions &opts,
                          const Nnet &nnet,
                          int32 total_context);

   // Frees every task that is still queued on the results list (for example
   // utterances that were accepted but never output), so that destroying the
   // computer does not leak them.
   ~BatchedXvectorComputer() {
     while (results_head_ != NULL) {
       XvectorTask *next = results_head_->tail;
       delete results_head_;
       results_head_ = next;
     }
     results_tail_ = NULL;
   }

   // Not copyable: the object owns the raw-pointer list of pending results.
   BatchedXvectorComputer(const BatchedXvectorComputer &) = delete;
   BatchedXvectorComputer &operator=(const BatchedXvectorComputer &) = delete;

   // Splits 'input' into chunks and adds them to the current batch, running
   // the network each time a batch becomes full.
   //   utt:    the utterance-id that will be returned by OutputXvector().
   //   input:  feature matrix with one row per frame; its number of columns
   //           must equal the input dimension of the network.
   void AcceptUtterance(const std::string &utt,
                       const Matrix<BaseFloat> &input);


   // Returns true if the oldest pending utterance has had all of its chunks
   // computed, i.e. if OutputXvector() may be called.
   bool XvectorReady() const;

   // Outputs the utterance-id and xvector of the oldest pending utterance and
   // removes it from the queue.  Must only be called if XvectorReady()
   // returns true.
   void OutputXvector(std::string *utt,
                      Vector<BaseFloat> *xvector);


   // Computes any partially filled batch, so that all utterances accepted so
   // far become ready.  Does nothing if the current batch is empty.
   void Flush();


  private:

   // Bookkeeping for one utterance whose xvector is pending or ready.
   struct XvectorTask {
     std::string utt_id;
     // Number of chunks the utterance was split into.
     int32 num_chunks;
     // Number of those chunks whose output has been added to 'xvector'.
     int32 num_chunks_finished;
     // Running average of the chunk-level outputs.
     Vector<BaseFloat> xvector;
     // Next (more recently created) task in the results list, or NULL.
     XvectorTask *tail;
   };


   // Decides where the chunks of an utterance of 'num_frames' frames start;
   // the start frames are written to 'start_frames'.
   void SplitUtteranceIntoChunks(int32 num_frames,
                                 std::vector<int32> *start_frames);

   // Allocates a task for utterance 'utt' with 'num_chunks' chunks, appends
   // it to the tail of the results list and returns it.  The list owns it.
   XvectorTask* CreateTask(const std::string &utt, int32 num_chunks);


   // Runs the network on the current batch, adds each chunk's output to the
   // xvector of its task, and resets the batch.
   void ComputeOneBatch();

   // Copies opts_.chunk_size frames of 'input', starting at frame
   // 'chunk_start', into the next free slot of the current batch and records
   // 'task' as the owner of that slot.
   void AddChunkToBatch(XvectorTask *task,
                        const Matrix<BaseFloat> &input,
                        int32 chunk_start);

   const BatchedXvectorComputerOptions &opts_;
   int32 total_context_;
   const Nnet &nnet_;

   // Input and output dimensions of the network.
   int32 feature_dim_;
   int32 xvector_dim_;

   // Staging area for the input features of one batch.  It has
   // opts_.chunk_size * opts_.batch_size rows; row (t * batch_size + n) holds
   // frame t of the chunk in slot n.
   Matrix<BaseFloat> input_feats_;


   // The compiled computation; the same one is used for every batch.
   std::shared_ptr<const NnetComputation> computation_;


   // Number of chunks that have been placed in the current batch so far.
   int32 position_in_batch_;

   // Has opts_.batch_size elements; element n is the task that owns the chunk
   // in slot n of the current batch, or NULL if that slot is unused.
   std::vector<XvectorTask*> tasks_this_batch_;

   // results_head_ is the first element in the singly linked list of
   // pending tasks, or NULL if that list is empty.  Note:
   // utterances that are ready will appear here first; new utterances
   // get added to the tail.
   XvectorTask *results_head_;
   // results_tail_ is the last element in the singly linked list of
   // pending tasks, or NULL if the list is empty.
   XvectorTask *results_tail_;
 };

 // Allocates a new task for utterance 'utt' that expects 'num_chunks' chunks,
 // with a zeroed chunk counter and an xvector of dimension xvector_dim_, and
 // appends it to the tail of the results list.  Returns the new task; it is
 // freed later by OutputXvector().
 BatchedXvectorComputer::XvectorTask*
 BatchedXvectorComputer::CreateTask(
     const std::string &utt, int32 num_chunks) {
   XvectorTask *new_task = new XvectorTask;
   new_task->utt_id = utt;
   new_task->num_chunks = num_chunks;
   new_task->num_chunks_finished = 0;
   new_task->tail = NULL;
   new_task->xvector.Resize(xvector_dim_);

   if (results_tail_ == NULL) {
     // The list was empty, so the new task is also its head.
     results_head_ = new_task;
   } else {
     results_tail_->tail = new_task;
   }
   results_tail_ = new_task;
   return new_task;
 }

 // Sets up the per-batch staging buffers and compiles the single computation
 // that is reused for every batch.
 //   opts:           configuration; stored by reference.
 //   nnet:           the network to evaluate; stored by reference.
 //   total_context:  stored for use when splitting utterances into chunks.
 // Raises an error (KALDI_ERR) if the batch size or chunk size is not positive.
 BatchedXvectorComputer::BatchedXvectorComputer(
     const BatchedXvectorComputerOptions &opts,
     const Nnet &nnet,
     int32 total_context):
     opts_(opts),
     total_context_(total_context),
     nnet_(nnet),
     position_in_batch_(0),
     results_head_(NULL),
     results_tail_(NULL) {

   // Reject unusable sizes up front; otherwise they only show up as obscure
   // failures when the vectors and matrices below are resized.
   if (opts_.batch_size <= 0 || opts_.chunk_size <= 0) {
     KALDI_ERR << "The batch size and chunk size must both be positive; got "
               << "batch-size=" << opts_.batch_size
               << ", chunk-size=" << opts_.chunk_size;
   }

   // One slot per chunk in a batch; resize() leaves every slot as a null
   // pointer, which ComputeOneBatch() treats as "unused".
   tasks_this_batch_.resize(opts_.batch_size);

   feature_dim_ = nnet_.InputDim("input");
   xvector_dim_ = nnet_.OutputDim("output");
   // Zero input_feats_ in case there is only one batch, to avoid
   // NaN's being generated due to undefined data.
   input_feats_.Resize(opts_.chunk_size * opts_.batch_size,
                       feature_dim_);

   CachingOptimizingCompiler compiler(nnet_, opts_.optimize_config,
                                      opts_.compiler_config);

   {  // This block creates computation_.
     ComputationRequest request;
     request.need_model_derivative = false;
     request.store_component_stats = false;
     request.inputs.resize(1);
     IoSpecification &input(request.inputs[0]);
     input.name = "input";
     input.has_deriv = false;
     input.indexes.resize(opts_.batch_size * opts_.chunk_size);
     // Note: the sequences are interleaved in the input; this will save an extra
     // copy since it corresponds to how nnet3 stores things by default.  (Makes
     // TDNNs easier to implement.)
     for (int32 n = 0; n < opts_.batch_size; n++) {
       for (int32 t = 0; t < opts_.chunk_size; t++) {
         Index index;
         index.n = n;
         index.t = t;
         // index.x is 0 by default.
         input.indexes[n + opts_.batch_size * t] = index;
       }
     }
     // One output row is requested per chunk, at t = 0.
     IoSpecification output;
     output.name = "output";
     output.has_deriv = false;
     output.indexes.resize(opts_.batch_size);
     for (int32 n = 0; n < opts_.batch_size; n++) {
       Index index;
       index.n = n;
       index.t = 0;
       output.indexes[n] = index;
     }
     request.outputs.push_back(output);
     // computation_ is a shared_ptr, so the compiled computation stays alive
     // after the local 'compiler' goes out of scope.
     computation_ = compiler.Compile(request);
   }
 }

 // Places one chunk into the next free slot of the current batch.
 //   task:         the task that owns the chunk; recorded for this slot.
 //   input:        the utterance's features, one row per frame.
 //   chunk_start:  index of the first frame of the chunk within 'input'.
 // Frames that would lie beyond the end of 'input' are filled with its last
 // frame; this is only permitted when opts_.pad_input is true.
 void BatchedXvectorComputer::AddChunkToBatch(
     XvectorTask *task,
     const Matrix<BaseFloat> &input,
     int32 chunk_start) {
   const int32 slot = position_in_batch_;
   position_in_batch_++;
   KALDI_ASSERT(slot >= 0 && slot < opts_.batch_size);
   tasks_this_batch_[slot] = task;

   const int32 frames_per_chunk = opts_.chunk_size,
       last_row = input.NumRows() - 1;
   KALDI_ASSERT(input_feats_.NumRows() == frames_per_chunk * opts_.batch_size);
   if (input.NumCols() != feature_dim_) {
     KALDI_ERR << "Feature dimension mismatch: neural net expected "
               << feature_dim_ << ", got " << input.NumCols();
   }

   for (int32 t = 0; t < frames_per_chunk; t++) {
     int32 src_row = chunk_start + t;
     if (src_row > last_row) {
       KALDI_ASSERT(opts_.pad_input);
       src_row = last_row;  // Pad with repeats of the last frame.
     }
     SubVector<BaseFloat> src(input, src_row);
     // The chunks are interleaved: frame t of slot n is row t * batch_size + n.
     SubVector<BaseFloat> dest(input_feats_, t * opts_.batch_size + slot);
     dest.CopyFromVec(src);
   }
 }

 bool BatchedXvectorComputer::XvectorReady() const {
   if (results_head_ == NULL)
     return false;
   KALDI_ASSERT(results_head_->num_chunks_finished <= results_head_->num_chunks);
   return results_head_->num_chunks_finished == results_head_->num_chunks;
 }

 void BatchedXvectorComputer::OutputXvector(std::string *utt,
                                            Vector<BaseFloat> *xvector) {
   KALDI_ASSERT(XvectorReady());
   *utt = results_head_->utt_id;
   xvector->Swap(&(results_head_->xvector));
   XvectorTask *new_tail = results_head_->tail;
   delete results_head_;
   results_head_ = new_tail;
   if (new_tail == NULL)
     results_tail_ = NULL;
 }

 // Computes the current batch if at least one chunk has been added to it;
 // otherwise does nothing.
 void BatchedXvectorComputer::Flush() {
   if (position_in_batch_ != 0)
     ComputeOneBatch();
 }


 void BatchedXvectorComputer::ComputeOneBatch() {

   CuMatrix<BaseFloat> cu_input_feats(input_feats_);
   Nnet *nnet_to_update = NULL;  // we're not doing any update.
   NnetComputer computer(opts_.compute_config, *computation_,
                         nnet_, nnet_to_update);
   computer.AcceptInput("input", &cu_input_feats);
   computer.Run();
   CuMatrix<BaseFloat> cu_output;
   computer.GetOutputDestructive("output", &cu_output);
   KALDI_ASSERT(cu_output.NumRows() == opts_.batch_size);
   Matrix<BaseFloat> output(cu_output);
   for (int32 n = 0; n < opts_.batch_size; n++) {
     XvectorTask *task = tasks_this_batch_[n];
     if (task == NULL)
       continue;  // Would only happen for the last batch.
     task->num_chunks_finished++;
     task->xvector.AddVec(1.0 / task->num_chunks, output.Row(n));
   }
   position_in_batch_ = 0;
   std::fill(tasks_this_batch_.begin(), tasks_this_batch_.end(),
             (XvectorTask*)NULL);
 }

 void BatchedXvectorComputer::AcceptUtterance(
     const std::string &utt,
     const Matrix<BaseFloat> &input) {
   std::vector<int32> chunk_starts;
   int32 num_frames = input.NumRows();
   SplitUtteranceIntoChunks(num_frames, &chunk_starts);
   int32 num_chunks = chunk_starts.size();
   XvectorTask *task = CreateTask(utt, num_chunks);

   for (int32 i = 0; i < num_chunks; i++) {
     AddChunkToBatch(task, input, chunk_starts[i]);
     if (position_in_batch_ == opts_.batch_size) {
       ComputeOneBatch();
     }
   }
 }

 // Decides where the chunks of an utterance start.
 //   num_frames:    number of frames in the utterance.
 //   start_frames:  output; cleared, then filled with the index of the first
 //                  frame of each chunk, in increasing order.
 //
 // An utterance no longer than the chunk size gets a single chunk starting at
 // frame 0 if it is exactly one chunk long or if padding is enabled, and no
 // chunk otherwise.  A longer utterance is covered either by the largest number
 // of chunks that fit without overlapping (leaving evenly spread gaps) or by
 // one more chunk than that (with evenly spread overlaps), whichever has the
 // smaller variance estimate computed below.
 //
 // Raises an error (KALDI_ERR) if a longer utterance has to be split while the
 // chunk size does not exceed total_context_.
 void BatchedXvectorComputer::SplitUtteranceIntoChunks(
     int32 num_frames, std::vector<int32> *start_frames) {
   start_frames->clear();
   if (num_frames <= opts_.chunk_size) {
     if (num_frames == opts_.chunk_size || opts_.pad_input)
       start_frames->push_back(0);
     // if we leave start_frames empty, then we just won't compute anything for
     // this file.
   } else {
     // these modified quantities are to account for the context effects...  when
     // the chunks overlap by exactly total_context_, the frames that get
     // averaged by the respective chunks in their averaging layers would touch
     // but not overlap.  So the optimal separation between chunks would equal
     // opts_.chunk_size - total_context_.
     int32 modified_num_frames = num_frames - total_context_,
         modified_chunk_size = opts_.chunk_size - total_context_;
     if (modified_chunk_size <= 0) {
       // Without this check the divisions below would divide by zero or by a
       // negative number.
       KALDI_ERR << "The chunk size (" << opts_.chunk_size
                 << ") must be greater than the total context ("
                 << total_context_
                 << ") in order to split an utterance into chunks.";
     }
     KALDI_ASSERT(modified_num_frames > modified_chunk_size);
     // num_chunks1 is the largest number of chunks that fit without
     // overlapping; num_chunks2 is one more than that.  num_frames1 and
     // num_frames2 are the corresponding total lengths of the chunks.
     int32 num_chunks1 = modified_num_frames / modified_chunk_size,
         num_chunks2 = num_chunks1 + 1;
     int32 num_frames1 = num_chunks1 * modified_chunk_size,
         num_frames2 = num_chunks2 * modified_chunk_size;
     KALDI_ASSERT(num_frames2 > modified_chunk_size);
     // For the option with num_chunks2 chunks: M is the number of frames that
     // are covered by one chunk, and N the number of frames that are covered
     // by two chunks.  (Basically a solution of the equations:
     // M + 2N == num_frames2, M + N == modified_num_frames).
     // Note: by a "frame" above, I mean a specific "t" value in
     // the utterance.
     int32 N = num_frames2 - modified_num_frames,
         M = modified_num_frames - N;
     KALDI_ASSERT(M + 2*N == num_frames2 && M + N == modified_num_frames);

     // The variances below are proportional to the variance of our
     // estimate of the xvector under certain simplifying assumptions..
     // they help us choose whether to have gaps between the chunks
     // or overlaps between them.
     // variance1 is for the option with gaps, where num_frames1 frames are
     // each covered once; variance2 is for the option with overlaps.
     BaseFloat variance1 = 1.0 / num_frames1,
         variance2 = (M + 4.0*N) / ((M + 2.0*N)*(M + 2.0*N));
     if (variance1 <= variance2) {
       // We'll choose the smaller number of chunks.  There may be gaps.
       // Counting the positions at the ends, there are num_chunks+1 positions
       // where there might be gaps.
       // Note: "total_gap" is >= 0, it's the positive of the sum of the
       // sizes of those gaps.
       int32 num_chunks = num_chunks1,
           num_gaps = num_chunks + 1,
           total_gap = modified_num_frames - num_chunks * modified_chunk_size;
       KALDI_ASSERT(0 <= total_gap && total_gap < modified_chunk_size);
       std::vector<int32> gap_sizes;  // elements will be >= 0.
       DivideIntoPieces(total_gap, num_gaps, &gap_sizes);
       int32 pos = gap_sizes[0];
       for (int32 i = 0; i < num_chunks; i++) {
         start_frames->push_back(pos);
         pos += modified_chunk_size + gap_sizes[i + 1];
       }
       KALDI_ASSERT(pos == modified_num_frames);
     } else {
       // We'll choose the larger number of chunks.  Consecutive chunks
       // overlap; "total_overlap" is <= 0, it's the negative of the sum of the
       // sizes of the num_chunks - 1 overlaps.
       int32 num_chunks = num_chunks2,
           num_overlaps = num_chunks - 1,
           total_overlap = modified_num_frames - num_chunks * modified_chunk_size;
       KALDI_ASSERT( -modified_chunk_size < total_overlap && total_overlap <= 0 );
       std::vector<int32> overlap_sizes;  // elements will be <= 0.
       DivideIntoPieces(total_overlap, num_overlaps, &overlap_sizes);
       int32 pos = 0;
       for (int32 i = 0; i < num_chunks; i++) {
         start_frames->push_back(pos);
         pos += modified_chunk_size;
         if (i < num_overlaps)
           pos += overlap_sizes[i];
       }
       KALDI_ASSERT(pos == modified_num_frames);
     }
   }
 }


 } // namespace nnet3
 } // namespace kaldi

 int main(int argc, char *argv[]) {
   try {
     using namespace kaldi;
     using namespace kaldi::nnet3;
     typedef kaldi::int32 int32;
     typedef kaldi::int64 int64;

     const char *usage =
         "Propagate features through an xvector neural network model and write\n"
         "the output vectors.  \"Xvector\" is our term for a vector or\n"
         "embedding which is the output of a particular type of neural network\n"
         "architecture found in speaker recognition.  This architecture\n"
         "consists of several layers that operate on frames, a statistics\n"
         "pooling layer that aggregates over the frame-level representations\n"
         "and possibly additional layers that operate on segment-level\n"
         "representations.  The xvectors are generally extracted from an\n"
         "output layer after the statistics pooling layer.  By default, one\n"
         "xvector is extracted directly from the set of features for each\n"
         "utterance.  Optionally, xvectors are extracted from chunks of input\n"
         "features and averaged, to produce a single vector.\n"
         "\n"
         "Usage: nnet3-xvector-compute [options] <raw-nnet-in> "
         "<features-rspecifier> <vector-wspecifier>\n"
         "e.g.: nnet3-xvector-compute final.raw scp:feats.scp "
         "ark:nnet_prediction.ark\n"
         "See also: nnet3-compute\n";

     ParseOptions po(usage);
     Timer timer;

     BatchedXvectorComputerOptions opts;

     std::string use_gpu = "no";

     opts.Register(&po);

     po.Register("use-gpu", &use_gpu,
       "yes|no|optional|wait, only has effect if compiled with CUDA");

 #if HAVE_CUDA==1
     CuDevice::RegisterDeviceOptions(&po);
 #endif
     po.Read(argc, argv);

     if (po.NumArgs() != 3) {
       po.PrintUsage();
       exit(1);
     }

 #if HAVE_CUDA==1
     CuDevice::Instantiate().SelectGpuId(use_gpu);
 #endif

     std::string nnet_rxfilename = po.GetArg(1),
                 feature_rspecifier = po.GetArg(2),
                 vector_wspecifier = po.GetArg(3);

     Nnet nnet;
     ReadKaldiObject(nnet_rxfilename, &nnet);
     SetBatchnormTestMode(true, &nnet);
     SetDropoutTestMode(true, &nnet);
     CollapseModel(CollapseModelConfig(), &nnet);

     int32 total_context;
     {
       int32 left_context, right_context;
       // Compute left_context, right_context as the 'real' left/right context
       // of the network; they'll tell us how many frames on the chunk boundaries
       // won't really participate in the statistics averaging.
       // SetRequireDirectInput()  modifies how the StatisticsPoolingComponent
       // treats its dependences, so we'll get the 'real' left/right context.
       SetRequireDirectInput(true, &nnet);
       ComputeSimpleNnetContext(nnet, &left_context, &right_context);
       KALDI_LOG << "Left/right context is " << left_context << ", "
                 << right_context;
       SetRequireDirectInput(false, &nnet);
       total_context = left_context + right_context;
     }

     BatchedXvectorComputer computer(opts, nnet, total_context);
     BaseFloatVectorWriter vector_writer(vector_wspecifier);

     int32 num_utts_read = 0, num_xvectors_written = 0;
     int64 frame_count = 0;

     SequentialBaseFloatMatrixReader feature_reader(feature_rspecifier);

     for (; !feature_reader.Done(); feature_reader.Next()) {
       std::string utt = feature_reader.Key();
       const Matrix<BaseFloat> &features (feature_reader.Value());
       if (features.NumRows() == 0) {
         KALDI_WARN << "Zero-length utterance: " << utt;
         continue;
       }

       frame_count += features.NumRows();

       computer.AcceptUtterance(utt, features);
       num_utts_read++;

       while (computer.XvectorReady()) {
         std::string utt;
         Vector<BaseFloat> xvector;
         computer.OutputXvector(&utt, &xvector);
         vector_writer.Write(utt, xvector);
         num_xvectors_written++;
       }
     }

     computer.Flush();
     while (computer.XvectorReady()) {
       std::string utt;
       Vector<BaseFloat> xvector;
       computer.OutputXvector(&utt, &xvector);
       vector_writer.Write(utt, xvector);
       num_xvectors_written++;
     }


 #if HAVE_CUDA==1
     CuDevice::Instantiate().PrintProfile();
 #endif
     double elapsed = timer.Elapsed();
     KALDI_LOG << "Time taken "<< elapsed
               << "s: real-time factor assuming 100 frames/sec is "
               << (elapsed*100.0/frame_count);
     KALDI_LOG << "Read " << num_utts_read << " utterances, wrote "
               << num_xvectors_written << " xvectors.";

     // Note: the following rule does something reasonable even if there are 0, 1
     // or 2 utterances read.
     if (num_xvectors_written > num_utts_read / 2)
       return 0;
     else
       return 1;
   } catch(const std::exception &e) {
     std::cerr << e.what();
     return -1;
   }
 }
kaldi
This code computes Goodness of Pronunciation (GOP) and extracts phone-level pronunciation feature for...
Definition: chain.dox:20

kaldi::nnet3::NnetOptimizeOptions::Register
void Register(OptionsItf *opts)
Definition: nnet-optimize.h:84

kaldi::nnet3::Nnet::InputDim
int32 InputDim(const std::string &input_name) const
Definition: nnet-nnet.cc:669

kaldi::nnet3::CollapseModel
void CollapseModel(const CollapseModelConfig &config, Nnet *nnet)
This function modifies the neural net for efficiency, in a way that suitable to be done in test time...
Definition: nnet-utils.cc:2100

kaldi::nnet3::ComputationRequest::store_component_stats
bool store_component_stats
you should set need_component_stats to true if you need the average-activation and average-derivative...
Definition: nnet-computation.h:126

kaldi::nnet3::BatchedXvectorComputer::xvector_dim_
int32 xvector_dim_
Definition: nnet3-xvector-compute-batched.cc:235

kaldi::nnet3::BatchedXvectorComputer::Flush
void Flush()
Calling this will force any partial minibatch to be computed, so that any utterances that have previo...
Definition: nnet3-xvector-compute-batched.cc:397

kaldi::nnet3::ComputationRequest::need_model_derivative
bool need_model_derivative
if need_model_derivative is true, then we'll be doing either model training or model-derivative compu...
Definition: nnet-computation.h:121

kaldi::MatrixBase::NumCols
MatrixIndexT NumCols() const
Returns number of columns (or zero for empty matrix).
Definition: kaldi-matrix.h:67

kaldi::nnet3::DivideIntoPieces
void DivideIntoPieces(int32 a, int32 b, std::vector< int32 > *pieces)
This function divides the number 'a' into 'b' pieces, such that the sum of the pieces equals 'a' and ...
Definition: nnet3-xvector-compute-batched.cc:72

kaldi::nnet3::BatchedXvectorComputer::AddChunkToBatch
void AddChunkToBatch(XvectorTask *task, const Matrix< BaseFloat > &input, int32 chunk_start)
Adds a new chunk to a batch we are preparing.
Definition: nnet3-xvector-compute-batched.cc:352

kaldi::nnet3::BatchedXvectorComputer
Definition: nnet3-xvector-compute-batched.cc:99

kaldi::ParseOptions::PrintUsage
void PrintUsage(bool print_command_line=false)
Prints the usage documentation [provided in the constructor].
Definition: parse-options.cc:393

kaldi::nnet3::BatchedXvectorComputerOptions::compiler_config
CachingOptimizingCompilerOptions compiler_config
Definition: nnet3-xvector-compute-batched.cc:40

kaldi::SequentialTableReader::Key
std::string Key()
Definition: kaldi-table-inl.h:918

kaldi::nnet3::BatchedXvectorComputerOptions::optimize_config
NnetOptimizeOptions optimize_config
Definition: nnet3-xvector-compute-batched.cc:39

kaldi::nnet3::CachingOptimizingCompiler
This class enables you to do the compilation and optimization in one call, and also ensures that if t...
Definition: nnet-optimize.h:219

kaldi::nnet3::BatchedXvectorComputer::computation_
std::shared_ptr< const NnetComputation > computation_
The compiled computation (will be the same for every batch).
Definition: nnet3-xvector-compute-batched.cc:248

kaldi::nnet3::BatchedXvectorComputer::input_feats_
Matrix< BaseFloat > input_feats_
Staging area for the input features prior to copying them to GPU.
Definition: nnet3-xvector-compute-batched.cc:244

kaldi::nnet3::CachingOptimizingCompilerOptions::Register
void Register(OptionsItf *opts)
Definition: nnet-optimize.h:200

kaldi::nnet3::BatchedXvectorComputer::CreateTask
XvectorTask * CreateTask(const std::string &utt, int32 num_chunks)
This adds a newly created XvectorTask at the tail of the singly linked list whose (head...
Definition: nnet3-xvector-compute-batched.cc:275

kaldi::nnet3::SetBatchnormTestMode
void SetBatchnormTestMode(bool test_mode, Nnet *nnet)
This function affects only components of type BatchNormComponent.
Definition: nnet-utils.cc:564

kaldi::TableWriter
A templated class for writing objects to an archive or script file; see The Table concept...
Definition: kaldi-table.h:368

kaldi::int32
kaldi::int32 int32
Definition: online-tcp-source.cc:27

kaldi::nnet3::BatchedXvectorComputer::results_head_
XvectorTask * results_head_
Definition: nnet3-xvector-compute-batched.cc:268

common-utils.h

kaldi::Matrix< BaseFloat >

kaldi::nnet3::ComputationRequest::inputs
std::vector< IoSpecification > inputs
Definition: nnet-computation.h:115

kaldi::CuMatrix
This class represents a matrix that's stored on the GPU if we have one, and in memory if not...
Definition: matrix-common.h:71

kaldi::nnet3::BatchedXvectorComputerOptions::chunk_size
int32 chunk_size
Definition: nnet3-xvector-compute-batched.cc:35

kaldi::nnet3::IoSpecification::name
std::string name
Definition: nnet-computation.h:73

kaldi::nnet3::BatchedXvectorComputerOptions::pad_input
bool pad_input
Definition: nnet3-xvector-compute-batched.cc:37

timer.h

kaldi::nnet3::BatchedXvectorComputerOptions::batch_size
int32 batch_size
Definition: nnet3-xvector-compute-batched.cc:36

kaldi::TableWriter::Write
void Write(const std::string &key, const T &value) const
Definition: kaldi-table-inl.h:1511

kaldi::nnet3
Definition: dnn3_code_compilation.dox:22

kaldi::nnet3::Nnet::OutputDim
int32 OutputDim(const std::string &output_name) const
Definition: nnet-nnet.cc:677

kaldi::nnet3::BatchedXvectorComputer::nnet_
const Nnet & nnet_
Definition: nnet3-xvector-compute-batched.cc:232

kaldi::ParseOptions::Register
void Register(const std::string &name, bool *ptr, const std::string &doc)
Definition: parse-options.cc:56

kaldi::OptionsItf::Register
virtual void Register(const std::string &name, bool *ptr, const std::string &doc)=0

kaldi::nnet3::NnetComputeOptions
Definition: nnet-compute.h:39

kaldi::nnet3::Index
struct Index is intended to represent the various indexes by which we number the rows of the matrices...
Definition: nnet-common.h:44

kaldi::ReadKaldiObject
void ReadKaldiObject(const std::string &filename, Matrix< float > *m)
Definition: kaldi-io.cc:832

nnet-utils.h
This file contains some miscellaneous functions dealing with class Nnet.

kaldi::nnet3::CachingOptimizingCompilerOptions
Definition: nnet-optimize.h:192

kaldi::nnet3::SetDropoutTestMode
void SetDropoutTestMode(bool test_mode, Nnet *nnet)
This function affects components of child-classes of RandomComponent.
Definition: nnet-utils.cc:573

kaldi::nnet3::NnetComputer::AcceptInput
void AcceptInput(const std::string &node_name, CuMatrix< BaseFloat > *input)
e.g.
Definition: nnet-compute.cc:547

kaldi::VectorBase::CopyFromVec
void CopyFromVec(const VectorBase< Real > &v)
Copy data from another vector (must match own size).
Definition: kaldi-vector.cc:228

kaldi::nnet3::BatchedXvectorComputer::XvectorTask::utt_id
std::string utt_id
Definition: nnet3-xvector-compute-batched.cc:155

kaldi::nnet3::BatchedXvectorComputer::OutputXvector
void OutputXvector(std::string *utt, Vector< BaseFloat > *xvector)
This function, which must only be called if XvectorReady() has just returned true, outputs an xvector for an utterance.
Definition: nnet3-xvector-compute-batched.cc:385

kaldi::nnet3::Index::n
int32 n
Definition: nnet-common.h:45

kaldi::nnet3::ComputationRequest
Definition: nnet-computation.h:114

kaldi::nnet3::BatchedXvectorComputer::XvectorTask::xvector
Vector< BaseFloat > xvector
Definition: nnet3-xvector-compute-batched.cc:158

kaldi::nnet3::BatchedXvectorComputer::ComputeOneBatch
void ComputeOneBatch()
Does the nnet computation for one batch and distributes the computed x-vectors (of chunks) appropriat...
Definition: nnet3-xvector-compute-batched.cc:404

kaldi::nnet3::BatchedXvectorComputer::AcceptUtterance
void AcceptUtterance(const std::string &utt, const Matrix< BaseFloat > &input)
Accepts an utterance to process into an xvector, and, if one or more batches become full...
Definition: nnet3-xvector-compute-batched.cc:428

kaldi::ParseOptions
The class ParseOptions is for parsing command-line options; see Parsing command-line options for more...
Definition: parse-options.h:36

kaldi::nnet3::BatchedXvectorComputer::tasks_this_batch_
std::vector< XvectorTask * > tasks_this_batch_
tasks_this_batch_ is of dimension opts_.batch_size.
Definition: nnet3-xvector-compute-batched.cc:262

float

kaldi::nnet3::ComputeSimpleNnetContext
void ComputeSimpleNnetContext(const Nnet &nnet, int32 *left_context, int32 *right_context)
ComputeSimpleNnetContext computes the left-context and right-context of a nnet.
Definition: nnet-utils.cc:146

kaldi::nnet3::BatchedXvectorComputer::XvectorTask::num_chunks_finished
int32 num_chunks_finished
Definition: nnet3-xvector-compute-batched.cc:157

kaldi::Vector::Swap
void Swap(Vector< Real > *other)
Swaps the contents of *this and *other. Shallow swap.
Definition: kaldi-vector.cc:1297

rnnlm::n
struct rnnlm::@11::@12 n

kaldi::nnet3::NnetOptimizeOptions
Definition: nnet-optimize.h:35

kaldi::nnet3::Nnet
Definition: nnet-nnet.h:115

kaldi::SequentialTableReader
A templated class for reading objects sequentially from an archive or script file; see The Table conc...
Definition: kaldi-table.h:287

kaldi::ParseOptions::Read
int Read(int argc, const char *const *argv)
Parses the command line options and fills the ParseOptions-registered variables.
Definition: parse-options.cc:311

kaldi::SequentialTableReader::Done
bool Done()
Definition: kaldi-table-inl.h:948

KALDI_ERR
#define KALDI_ERR
Definition: kaldi-error.h:147

kaldi::nnet3::BatchedXvectorComputer::BatchedXvectorComputer
BatchedXvectorComputer(const BatchedXvectorComputerOptions &opts, const Nnet &nnet, int32 total_context)
Definition: nnet3-xvector-compute-batched.cc:293

KALDI_WARN
#define KALDI_WARN
Definition: kaldi-error.h:150

kaldi::ParseOptions::GetArg
std::string GetArg(int param) const
Returns one of the positional parameters; 1-based indexing for argc/argv compatibility.
Definition: parse-options.cc:202

kaldi::SequentialTableReader::Next
void Next()
Definition: kaldi-table-inl.h:942

kaldi::OptionsItf
Definition: options-itf.h:26

kaldi::nnet3::BatchedXvectorComputerOptions::Register
void Register(OptionsItf *po)
Definition: nnet3-xvector-compute-batched.cc:43

kaldi::nnet3::BatchedXvectorComputer::opts_
const BatchedXvectorComputerOptions & opts_
Definition: nnet3-xvector-compute-batched.cc:230

kaldi::Timer
Definition: timer.h:63

kaldi::nnet3::IoSpecification
Definition: nnet-computation.h:72

kaldi::nnet3::IoSpecification::has_deriv
bool has_deriv
Definition: nnet-computation.h:75

kaldi::nnet3::BatchedXvectorComputer::XvectorTask::num_chunks
int32 num_chunks
Definition: nnet3-xvector-compute-batched.cc:156

kaldi::nnet3::NnetComputeOptions::Register
void Register(OptionsItf *opts)
Definition: nnet-compute.h:42

rnnlm::i
int i
Definition: mikolov-rnnlm-lib.cc:66

kaldi::nnet3::CachingOptimizingCompiler::Compile
std::shared_ptr< const NnetComputation > Compile(const ComputationRequest &request)
Does the compilation and returns a const pointer to the result, which is owned by this class...
Definition: nnet-optimize.cc:716

kaldi::ParseOptions::NumArgs
int NumArgs() const
Number of positional parameters (c.f. argc-1).
Definition: parse-options.cc:198

kaldi::nnet3::IoSpecification::indexes
std::vector< Index > indexes
Definition: nnet-computation.h:74

kaldi::Vector
A class representing a vector.
Definition: kaldi-vector.h:406

kaldi::nnet3::NnetComputer
class NnetComputer is responsible for executing the computation described in the "computation" object...
Definition: nnet-compute.h:59

kaldi::SequentialTableReader::Value
T & Value()
Definition: kaldi-table-inl.h:934

kaldi::nnet3::BatchedXvectorComputer::position_in_batch_
int32 position_in_batch_
position_in_batch_ is the number of chunks that we have filled in in the input_feats_ matrix and task...
Definition: nnet3-xvector-compute-batched.cc:255

KALDI_ASSERT
#define KALDI_ASSERT(cond)
Definition: kaldi-error.h:185

kaldi::nnet3::ComputationRequest::outputs
std::vector< IoSpecification > outputs
Definition: nnet-computation.h:116

kaldi::MatrixBase::NumRows
MatrixIndexT NumRows() const
Returns number of rows (or zero for empty matrix).
Definition: kaldi-matrix.h:64

kaldi::nnet3::SetRequireDirectInput
void SetRequireDirectInput(bool b, Nnet *nnet)
Calls the corresponding function in any component of type StatisticsPoolingComponent; used as a way t...
Definition: nnet-utils.cc:303

kaldi::Matrix::Resize
void Resize(const MatrixIndexT r, const MatrixIndexT c, MatrixResizeType resize_type=kSetZero, MatrixStrideType stride_type=kDefaultStride)
Sets matrix to a specified size (zero is OK as long as both r and c are zero).
Definition: kaldi-matrix.cc:819

kaldi::nnet3::BatchedXvectorComputer::total_context_
int32 total_context_
Definition: nnet3-xvector-compute-batched.cc:231

kaldi::nnet3::BatchedXvectorComputerOptions::compute_config
NnetComputeOptions compute_config
Definition: nnet3-xvector-compute-batched.cc:38

kaldi::nnet3::Index::t
int32 t
Definition: nnet-common.h:46

kaldi::nnet3::NnetComputer::GetOutputDestructive
void GetOutputDestructive(const std::string &output_name, CuMatrix< BaseFloat > *output)
Definition: nnet-compute.cc:587

kaldi::CuMatrixBase::NumRows
MatrixIndexT NumRows() const
Dimensions.
Definition: cu-matrix.h:215

kaldi::nnet3::BatchedXvectorComputer::results_tail_
XvectorTask * results_tail_
Definition: nnet3-xvector-compute-batched.cc:271

kaldi::nnet3::BatchedXvectorComputerOptions
Definition: nnet3-xvector-compute-batched.cc:34

KALDI_LOG
#define KALDI_LOG
Definition: kaldi-error.h:153

kaldi::nnet3::BatchedXvectorComputer::feature_dim_
int32 feature_dim_
Definition: nnet3-xvector-compute-batched.cc:234

kaldi::Timer::Elapsed
double Elapsed() const
Returns time in seconds.
Definition: timer.h:74

kaldi-common.h

kaldi::SubVector
Represents a non-allocating general vector which can be defined as a sub-vector of higher-level vecto...
Definition: kaldi-vector.h:501

nnet-am-decodable-simple.h

kaldi::nnet3::BatchedXvectorComputer::SplitUtteranceIntoChunks
void SplitUtteranceIntoChunks(int32 num_frames, std::vector< int32 > *start_frames)
This decides how to split the utterance into chunks.
Definition: nnet3-xvector-compute-batched.cc:445

kaldi::nnet3::BatchedXvectorComputer::XvectorTask::tail
XvectorTask * tail
Definition: nnet3-xvector-compute-batched.cc:159

main
int main(int argc, char *argv[])
Definition: nnet3-xvector-compute-batched.cc:524

kaldi::nnet3::BatchedXvectorComputer::XvectorReady
bool XvectorReady() const
Returns true if at least one xvector is pending output (i.e.
Definition: nnet3-xvector-compute-batched.cc:378

kaldi::nnet3::CollapseModelConfig
Config class for the CollapseModel function.
Definition: nnet-utils.h:240

kaldi::nnet3::BatchedXvectorComputer::XvectorTask
Definition: nnet3-xvector-compute-batched.cc:154

kaldi::nnet3::NnetComputer::Run
void Run()
This does either the forward or backward computation, depending when it is called (in a typical compu...
Definition: nnet-compute.cc:512