doc/nnet-chain-example_8cc_source.html

 // nnet3/nnet-chain-example.cc

 // Copyright      2015    Johns Hopkins University (author: Daniel Povey)

 // See ../../COPYING for clarification regarding multiple authors
 //
 // Licensed under the Apache License, Version 2.0 (the "License");
 // you may not use this file except in compliance with the License.
 // You may obtain a copy of the License at
 //
 //  http://www.apache.org/licenses/LICENSE-2.0
 //
 // THIS CODE IS PROVIDED *AS IS* BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY
 // KIND, EITHER EXPRESS OR IMPLIED, INCLUDING WITHOUT LIMITATION ANY IMPLIED
 // WARRANTIES OR CONDITIONS OF TITLE, FITNESS FOR A PARTICULAR PURPOSE,
 // MERCHANTABLITY OR NON-INFRINGEMENT.
 // See the Apache 2 License for the specific language governing permissions and
 // limitations under the License.

 #include <cmath>
 #include "nnet3/nnet-chain-example.h"
 #include "nnet3/nnet-example-utils.h"

 namespace kaldi {
 namespace nnet3 {


 void NnetChainSupervision::Write(std::ostream &os, bool binary) const {
   CheckDim();
   WriteToken(os, binary, "<NnetChainSup>");
   WriteToken(os, binary, name);
   WriteIndexVector(os, binary, indexes);
   supervision.Write(os, binary);
   WriteToken(os, binary, "<DW2>");
   deriv_weights.Write(os, binary);
   WriteToken(os, binary, "</NnetChainSup>");
 }

 // Equality test.  'name', 'indexes' and 'supervision' are compared with
 // their own equality operators; 'deriv_weights' is compared with
 // ApproxEqual() rather than exactly.  The members are tested in that order
 // and the first mismatch ends the comparison.
 bool NnetChainSupervision::operator == (const NnetChainSupervision &other) const {
   if (!(name == other.name))
     return false;
   if (!(indexes == other.indexes))
     return false;
   if (!(supervision == other.supervision))
     return false;
   return deriv_weights.ApproxEqual(other.deriv_weights);
 }

 // Reads this object from 'is'; the counterpart of Write().  The deriv_weights
 // are optional in the stream: if the closing token directly follows the
 // supervision, 'deriv_weights' is not touched.  CheckDim() is run at the end.
 void NnetChainSupervision::Read(std::istream &is, bool binary) {
   ExpectToken(is, binary, "<NnetChainSup>");
   ReadToken(is, binary, &name);
   ReadIndexVector(is, binary, &indexes);
   supervision.Read(is, binary);

   std::string token;
   ReadToken(is, binary, &token);
   const bool weights_present = !(token == "</NnetChainSup>");
   if (weights_present) {
     // Back-compatibility: two markers are accepted for the weights.  "<DW>"
     // data is read via ReadVectorAsChar(); "<DW2>" (what Write() emits) is
     // read with the vector's own Read().
     KALDI_ASSERT(token == "<DW>" || token == "<DW2>");
     if (token == "<DW>") {
       ReadVectorAsChar(is, binary, &deriv_weights);
     } else {
       deriv_weights.Read(is, binary);
     }
     ExpectToken(is, binary, "</NnetChainSup>");
   }
   CheckDim();
 }


 void NnetChainSupervision::CheckDim() const {
   if (supervision.frames_per_sequence == -1) {
     // this object has not been set up.
     KALDI_ASSERT(indexes.empty());
     return;
   }
   KALDI_ASSERT(indexes.size() == supervision.num_sequences *
                supervision.frames_per_sequence && !indexes.empty() &&
                supervision.frames_per_sequence > 1);
   int32 first_frame = indexes[0].t,
       frame_skip = indexes[supervision.num_sequences].t - first_frame,
       num_sequences = supervision.num_sequences,
       frames_per_sequence = supervision.frames_per_sequence;
   int32 k = 0;
   for (int32 i = 0; i < frames_per_sequence; i++) {
     for (int32 j = 0; j < num_sequences; j++,k++) {
       int32 n = j, t = i * frame_skip + first_frame, x = 0;
       Index index(n, t, x);
       KALDI_ASSERT(indexes[k] == index);
     }
   }
   if (deriv_weights.Dim() != 0) {
     KALDI_ASSERT(deriv_weights.Dim() == indexes.size());
     KALDI_ASSERT(deriv_weights.Min() >= 0.0);
   }
 }

 // Copy constructor: copies each member from 'other' and then runs CheckDim()
 // on the newly constructed object.
 NnetChainSupervision::NnetChainSupervision(const NnetChainSupervision &other):
     name(other.name),
     indexes(other.indexes),
     supervision(other.supervision),
     deriv_weights(other.deriv_weights) {
   CheckDim();
 }

 // Exchanges the contents of this object with '*other', member by member.
 void NnetChainSupervision::Swap(NnetChainSupervision *other) {
   NnetChainSupervision &that = *other;
   name.swap(that.name);
   indexes.swap(that.indexes);
   supervision.Swap(&that.supervision);
   deriv_weights.Swap(&that.deriv_weights);

   // Only run the consistency check on a random subset of calls (when
   // RandInt(0, 5) returns 0).
   const bool do_check = (RandInt(0, 5) == 0);
   if (do_check)
     CheckDim();
 }

 // Constructs the object from a chain::Supervision and per-frame weights.
 //  - name: name of the output this supervision is for.
 //  - supervision: the supervision object (copied).
 //  - deriv_weights: the weights (copied); checked by CheckDim().
 //  - first_frame: the 't' value given to the first frame.
 //  - frame_skip: the step in 't' between consecutive frames.
 // 'indexes' is created with one entry per (frame, sequence) pair, ordered
 // frame by frame with the sequence index 'n' varying fastest.
 NnetChainSupervision::NnetChainSupervision(
     const std::string &name,
     const chain::Supervision &supervision,
     const VectorBase<BaseFloat> &deriv_weights,
     int32 first_frame,
     int32 frame_skip):
     name(name),
     supervision(supervision),
     deriv_weights(deriv_weights) {
   // Only 'n' and 't' are assigned below; 'x' keeps the value that resize()
   // gives a new Index (CheckDim() below asserts that it is zero).
   indexes.resize(supervision.num_sequences *
                  supervision.frames_per_sequence);
   const int32 num_sequences = supervision.num_sequences,
       frames_per_sequence = supervision.frames_per_sequence;
   int32 k = 0;
   for (int32 frame = 0; frame < frames_per_sequence; frame++) {
     const int32 t = frame * frame_skip + first_frame;
     for (int32 seq = 0; seq < num_sequences; seq++, k++) {
       Index &index = indexes[k];
       index.n = seq;
       index.t = t;
     }
   }
   KALDI_ASSERT(k == indexes.size());
   CheckDim();
 }


 void NnetChainExample::Write(std::ostream &os, bool binary) const {
   // Note: weight, label, input_frames and spk_info are members.  This is a
   // struct.
   WriteToken(os, binary, "<Nnet3ChainEg>");
   WriteToken(os, binary, "<NumInputs>");
   int32 size = inputs.size();
   WriteBasicType(os, binary, size);
   KALDI_ASSERT(size > 0 && "Attempting to write NnetChainExample with no inputs");
   if (!binary) os << '\n';
   for (int32 i = 0; i < size; i++) {
     inputs[i].Write(os, binary);
     if (!binary) os << '\n';
   }
   WriteToken(os, binary, "<NumOutputs>");
   size = outputs.size();
   WriteBasicType(os, binary, size);
   KALDI_ASSERT(size > 0 && "Attempting to write NnetChainExample with no outputs");
   if (!binary) os << '\n';
   for (int32 i = 0; i < size; i++) {
     outputs[i].Write(os, binary);
     if (!binary) os << '\n';
   }
   WriteToken(os, binary, "</Nnet3ChainEg>");
 }

 void NnetChainExample::Read(std::istream &is, bool binary) {
   ExpectToken(is, binary, "<Nnet3ChainEg>");
   ExpectToken(is, binary, "<NumInputs>");
   int32 size;
   ReadBasicType(is, binary, &size);
   if (size < 1 || size > 1000000)
     KALDI_ERR << "Invalid size " << size;
   inputs.resize(size);
   for (int32 i = 0; i < size; i++)
     inputs[i].Read(is, binary);
   ExpectToken(is, binary, "<NumOutputs>");
   ReadBasicType(is, binary, &size);
   if (size < 1 || size > 1000000)
     KALDI_ERR << "Invalid size " << size;
   outputs.resize(size);
   for (int32 i = 0; i < size; i++)
     outputs[i].Read(is, binary);
   ExpectToken(is, binary, "</Nnet3ChainEg>");
 }

 // Exchanges the inputs and the outputs of this example with those of
 // '*other'.
 void NnetChainExample::Swap(NnetChainExample *other) {
   NnetChainExample &that = *other;
   that.inputs.swap(inputs);
   that.outputs.swap(outputs);
 }

 void NnetChainExample::Compress() {
   std::vector<NnetIo>::iterator iter = inputs.begin(), end = inputs.end();
   // calling features.Compress() will do nothing if they are sparse or already
   // compressed.
   for (; iter != end; ++iter) iter->features.Compress();
 }

 // Copy constructor: copies the inputs and the outputs of 'other'.
 NnetChainExample::NnetChainExample(const NnetChainExample &other):
     inputs(other.inputs),
     outputs(other.outputs) {
 }


 // Called from MergeChainExamples(); merges the NnetChainSupervision objects
 // in 'inputs' into a single one, which is written to '*output'.  Requires
 // (and checks) that they all have the same name, and that every index of
 // every input has n == 0, i.e. that the inputs are not already merged.
 // 'inputs' must be nonempty.
 static void MergeSupervision(
     const std::vector<const NnetChainSupervision*> &inputs,
     NnetChainSupervision *output) {
   const int32 num_inputs = inputs.size();

   // One pass over the inputs: check that the names agree, count the indexes
   // and collect pointers to the underlying chain::Supervision objects.
   int32 num_indexes = 0;
   std::vector<const chain::Supervision*> input_supervision;
   input_supervision.reserve(inputs.size());
   for (int32 n = 0; n < num_inputs; n++) {
     KALDI_ASSERT(inputs[n]->name == inputs[0]->name);
     num_indexes += inputs[n]->indexes.size();
     input_supervision.push_back(&(inputs[n]->supervision));
   }
   output->name = inputs[0]->name;

   // Merge the chain::Supervision objects into a temporary and swap it into
   // place.  (The argument types select the overload of MergeSupervision that
   // works on chain::Supervision pointers, not this function.)
   chain::Supervision merged_supervision;
   MergeSupervision(input_supervision,
                    &merged_supervision);
   output->supervision.Swap(&merged_supervision);

   // Concatenate the indexes.  The 'n' value of each copied index is replaced
   // by the position of its example in 'inputs', so each example gets a
   // different 'n', starting from 0.
   std::vector<Index> &merged_indexes = output->indexes;
   merged_indexes.clear();
   merged_indexes.reserve(num_indexes);
   for (int32 n = 0; n < num_inputs; n++) {
     const std::vector<Index> &src_indexes = inputs[n]->indexes;
     const size_t first_new = merged_indexes.size();
     merged_indexes.insert(merged_indexes.end(),
                           src_indexes.begin(), src_indexes.end());
     for (size_t k = first_new; k < merged_indexes.size(); k++) {
       KALDI_ASSERT(merged_indexes[k].n == 0 &&
                    "Merging already-merged chain egs");
       merged_indexes[k].n = n;
     }
   }
   KALDI_ASSERT(output->indexes.size() == num_indexes);
   // OK, at this point the 'indexes' will be in the wrong order,
   // because they should be first sorted by 't' and next by 'n'.
   // 'sort' will fix this, due to the operator < on type Index.
   std::sort(merged_indexes.begin(), merged_indexes.end());

   // Merge the deriv_weights.  Whether there are any is decided by the first
   // input alone; every input is then required to have the same number.
   if (inputs[0]->deriv_weights.Dim() != 0) {
     const int32 frames_per_sequence = inputs[0]->deriv_weights.Dim();
     output->deriv_weights.Resize(output->indexes.size(), kUndefined);
     KALDI_ASSERT(output->deriv_weights.Dim() ==
                  frames_per_sequence * num_inputs);
     for (int32 n = 0; n < num_inputs; n++) {
       const Vector<BaseFloat> &src_weights = inputs[n]->deriv_weights;
       KALDI_ASSERT(src_weights.Dim() == frames_per_sequence);
       // the ordering of the deriv_weights corresponds to the ordering of the
       // Indexes, where the time dimension has the greater stride.
       for (int32 t = 0; t < frames_per_sequence; t++) {
         const int32 dest = t * num_inputs + n;
         output->deriv_weights(dest) = src_weights(t);
       }
     }
   }
   output->CheckDim();
 }


 void MergeChainExamples(bool compress,
                         std::vector<NnetChainExample> *input,
                         NnetChainExample *output) {
   int32 num_examples = input->size();
   KALDI_ASSERT(num_examples > 0);
   // we temporarily make the input-features in 'input' look like regular NnetExamples,
   // so that we can recycle the MergeExamples() function.
   std::vector<NnetExample> eg_inputs(num_examples);
   for (int32 i = 0; i < num_examples; i++)
     eg_inputs[i].io.swap((*input)[i].inputs);
   NnetExample eg_output;
   MergeExamples(eg_inputs, compress, &eg_output);
   // swap the inputs back so that they are not really changed.
   for (int32 i = 0; i < num_examples; i++)
     eg_inputs[i].io.swap((*input)[i].inputs);
   // write to 'output->inputs'
   eg_output.io.swap(output->inputs);

   // Now deal with the chain-supervision 'outputs'.  There will
   // normally be just one of these, with name "output", but we
   // handle the more general case.
   int32 num_output_names = (*input)[0].outputs.size();
   output->outputs.resize(num_output_names);
   for (int32 i = 0; i < num_output_names; i++) {
     std::vector<const NnetChainSupervision*> to_merge(num_examples);
     for (int32 j = 0; j < num_examples; j++) {
       KALDI_ASSERT((*input)[j].outputs.size() == num_output_names);
       to_merge[j] = &((*input)[j].outputs[i]);
     }
     MergeSupervision(to_merge,
                      &(output->outputs[i]));
   }
 }

 // Fills in '*request' with the ComputationRequest that corresponds to the
 // example 'eg' for the network 'nnet'.
 //  - nnet: used to check that each name in the example refers to a node of
 //    the right kind (input node for inputs, output node for outputs).
 //  - eg: the example; its inputs and outputs give the names and indexes.
 //  - need_model_derivative: copied into the request, and used as the
 //    'has_deriv' flag of every chain output.
 //  - store_component_stats: copied into the request.
 //  - use_xent_regularization: if true, each output "NAME" is followed by an
 //    extra output "NAME-xent" with the same indexes.
 //  - use_xent_derivative: the 'has_deriv' flag of the "-xent" outputs.
 //  - request: any existing inputs/outputs are discarded.
 // Raises an error (KALDI_ERR) if a name in the example is not a node of the
 // expected kind, or if the resulting request has no inputs or no outputs.
 void GetChainComputationRequest(const Nnet &nnet,
                                 const NnetChainExample &eg,
                                 bool need_model_derivative,
                                 bool store_component_stats,
                                 bool use_xent_regularization,
                                 bool use_xent_derivative,
                                 ComputationRequest *request) {
   request->inputs.clear();
   request->inputs.reserve(eg.inputs.size());
   request->outputs.clear();
   // Each output may be accompanied by a "-xent" output, hence the factor 2.
   request->outputs.reserve(eg.outputs.size() * 2);
   request->need_model_derivative = need_model_derivative;
   request->store_component_stats = store_component_stats;

   for (size_t i = 0; i < eg.inputs.size(); i++) {
     const NnetIo &io = eg.inputs[i];
     const std::string &name = io.name;
     int32 node_index = nnet.GetNodeIndex(name);
     if (node_index == -1 ||
         !nnet.IsInputNode(node_index))
       KALDI_ERR << "Nnet example has input named '" << name
                 << "', but no such input node is in the network.";

     IoSpecification io_spec;
     io_spec.name = name;
     io_spec.indexes = io.indexes;
     io_spec.has_deriv = false;
     request->inputs.push_back(io_spec);
   }

   for (size_t i = 0; i < eg.outputs.size(); i++) {
     // there will normally be exactly one output, named "output"
     const NnetChainSupervision &sup = eg.outputs[i];
     const std::string &name = sup.name;
     int32 node_index = nnet.GetNodeIndex(name);
     // This must be '||', as in the input check above: with '&&' a missing
     // node (-1) would be handed to IsOutputNode(), and a node that exists
     // but is not an output node would be accepted without any error.
     if (node_index == -1 ||
         !nnet.IsOutputNode(node_index))
       KALDI_ERR << "Nnet example has output named '" << name
                 << "', but no such output node is in the network.";

     // Build the specification locally and append copies of it, so that no
     // reference into 'request->outputs' is held while the vector grows.
     IoSpecification io_spec;
     io_spec.name = name;
     io_spec.indexes = sup.indexes;
     io_spec.has_deriv = need_model_derivative;
     request->outputs.push_back(io_spec);

     if (use_xent_regularization) {
       // the IoSpecification for the -xent output is the same
       // as for the regular output, except for its name which has
       // the -xent suffix (and the has_deriv member may differ).
       io_spec.name = name + "-xent";
       io_spec.has_deriv = use_xent_derivative;
       request->outputs.push_back(io_spec);
     }
   }

   // check to see if something went wrong.
   if (request->inputs.empty())
     KALDI_ERR << "No inputs in computation request.";
   if (request->outputs.empty())
     KALDI_ERR << "No outputs in computation request.";
 }

 // Shifts the time indexes 't' in the example '*eg'.
 //  - frame_shift: added to the 't' of every index of every input whose name
 //    is not listed in 'exclude_names'.
 //  - exclude_names: names of inputs that are left unchanged.
 //  - eg: the example, modified in place.
 // For each supervision output, the shift is rounded to the closest multiple
 // of the spacing in 't' between its first two indexes (which must share the
 // same 'n' and 'x'), and that rounded amount is added to all of its indexes.
 void ShiftChainExampleTimes(int32 frame_shift,
                             const std::vector<std::string> &exclude_names,
                             NnetChainExample *eg) {
   for (size_t i = 0; i < eg->inputs.size(); i++) {
     NnetIo &io = eg->inputs[i];
     bool must_exclude = false;
     for (size_t j = 0; j < exclude_names.size() && !must_exclude; j++)
       must_exclude = (io.name == exclude_names[j]);
     if (must_exclude)
       continue;
     for (size_t k = 0; k < io.indexes.size(); k++)
       io.indexes[k].t += frame_shift;
   }

   // note: we'll normally choose a small enough shift that the output-data
   // shift will be zero after dividing by frame_subsampling_factor
   // (e.g. frame_subsampling_factor == 3 and shift = 0 or 1).
   for (size_t i = 0; i < eg->outputs.size(); i++) {
     std::vector<Index> &indexes = eg->outputs[i].indexes;
     KALDI_ASSERT(indexes.size() >= 2 && indexes[0].n == indexes[1].n &&
                  indexes[0].x == indexes[1].x);
     int32 frame_subsampling_factor = indexes[1].t - indexes[0].t;
     KALDI_ASSERT(frame_subsampling_factor > 0);

     // We need to shift by a multiple of frame_subsampling_factor.
     // Round to the closest multiple.
     int32 supervision_frame_shift =
         frame_subsampling_factor *
         std::floor(0.5 + (frame_shift * 1.0 / frame_subsampling_factor));
     if (supervision_frame_shift != 0) {
       for (size_t k = 0; k < indexes.size(); k++)
         indexes[k].t += supervision_frame_shift;
     }
   }
 }


 // Hashes the structure of 'eg': the number of inputs, the structural hash of
 // each input (via NnetIoStructureHasher), and the name and indexes of each
 // output.  The supervision and deriv_weights of the outputs are not used.
 size_t NnetChainExampleStructureHasher::operator () (
     const NnetChainExample &eg) const noexcept {
   // these numbers were chosen at random from a list of primes.
   NnetIoStructureHasher io_hasher;
   StringHasher string_hasher;
   IndexVectorHasher indexes_hasher;

   const size_t num_inputs = eg.inputs.size();
   size_t ans = num_inputs * 35099;
   for (size_t i = 0; i < num_inputs; i++) {
     ans *= 19157;
     ans += io_hasher(eg.inputs[i]);
   }
   const size_t num_outputs = eg.outputs.size();
   for (size_t i = 0; i < num_outputs; i++) {
     const NnetChainSupervision &sup = eg.outputs[i];
     ans *= 17957;
     ans += string_hasher(sup.name);
     ans += indexes_hasher(sup.indexes);
   }
   return ans;
 }

 // Returns true if 'a' and 'b' have the same structure: the same number of
 // inputs and outputs, inputs that are pairwise equal according to
 // NnetIoStructureCompare, and outputs with pairwise equal names and indexes.
 bool NnetChainExampleStructureCompare::operator () (
     const NnetChainExample &a,
     const NnetChainExample &b) const {
   const size_t num_inputs = a.inputs.size(),
       num_outputs = a.outputs.size();
   if (num_inputs != b.inputs.size() ||
       num_outputs != b.outputs.size())
     return false;

   NnetIoStructureCompare io_compare;
   for (size_t i = 0; i < num_inputs; i++) {
     if (!io_compare(a.inputs[i], b.inputs[i]))
       return false;
   }
   for (size_t i = 0; i < num_outputs; i++) {
     const NnetChainSupervision &sup_a = a.outputs[i],
         &sup_b = b.outputs[i];
     if (sup_a.name != sup_b.name)
       return false;
     if (sup_a.indexes != sup_b.indexes)
       return false;
   }
   return true;
 }


 // Returns the largest number of indexes found in any single input or output
 // of 'a' (zero if it has neither inputs nor outputs).
 int32 GetNnetChainExampleSize(const NnetChainExample &a) {
   int32 largest = 0;
   for (std::vector<NnetIo>::const_iterator input_iter = a.inputs.begin();
        input_iter != a.inputs.end(); ++input_iter) {
     const int32 num_indexes = input_iter->indexes.size();
     largest = (num_indexes > largest ? num_indexes : largest);
   }
   for (std::vector<NnetChainSupervision>::const_iterator
            output_iter = a.outputs.begin();
        output_iter != a.outputs.end(); ++output_iter) {
     const int32 num_indexes = output_iter->indexes.size();
     largest = (num_indexes > largest ? num_indexes : largest);
   }
   return largest;
 }


 // Stores the merging configuration and the writer that merged examples are
 // sent to; starts in the not-finished state with no examples written.
 ChainExampleMerger::ChainExampleMerger(const ExampleMergingConfig &config,
                                        NnetChainExampleWriter *writer):
     finished_(false),
     num_egs_written_(0),
     config_(config),
     writer_(writer) {
 }


 // Accepts one example.  The pointer is deleted by this class once the
 // example has been merged (see the 'delete' below) or discarded in Finish().
 // The example is queued with the others of the same structure; if
 // config_.MinibatchSize() then asks for a minibatch, all queued examples of
 // that structure are merged and written out.  Must not be called after
 // Finish().
 void ChainExampleMerger::AcceptExample(NnetChainExample *eg) {
   KALDI_ASSERT(!finished_);
   // If an eg with the same structure as 'eg' is already a key in the
   // map, it won't be replaced, but if it's new it will be made
   // the key.  Also we remove the key before making the vector empty.
   // This way we ensure that the eg in the key is always the first
   // element of the vector.
   std::vector<NnetChainExample*> &vec = eg_to_egs_[eg];
   vec.push_back(eg);

   const int32 eg_size = GetNnetChainExampleSize(*eg),
       num_available = vec.size();
   const bool input_ended = false;
   const int32 minibatch_size = config_.MinibatchSize(eg_size, num_available,
                                                      input_ended);
   if (minibatch_size == 0)
     return;  // not enough examples of this structure yet.

   // we need to write out a merged eg.
   KALDI_ASSERT(minibatch_size == num_available);

   // Copy the pointers before erasing the map entry: 'vec' refers to storage
   // inside the map and must not be used after the erase.
   std::vector<NnetChainExample*> vec_copy(vec);
   eg_to_egs_.erase(eg);

   // MergeChainExamples() expects a vector of NnetChainExample, not of pointers,
   // so use swap to create that without doing any real work.
   std::vector<NnetChainExample> egs_to_merge(minibatch_size);
   for (int32 i = 0; i < minibatch_size; i++) {
     NnetChainExample *owned = vec_copy[i];
     egs_to_merge[i].Swap(owned);
     delete owned;  // we owned those pointers.
   }
   WriteMinibatch(&egs_to_merge);
 }

 void ChainExampleMerger::WriteMinibatch(
     std::vector<NnetChainExample> *egs) {
   KALDI_ASSERT(!egs->empty());
   int32 eg_size = GetNnetChainExampleSize((*egs)[0]);
   NnetChainExampleStructureHasher eg_hasher;
   size_t structure_hash = eg_hasher((*egs)[0]);
   int32 minibatch_size = egs->size();
   stats_.WroteExample(eg_size, structure_hash, minibatch_size);
   NnetChainExample merged_eg;
   MergeChainExamples(config_.compress, egs, &merged_eg);
   std::ostringstream key;
   key << "merged-" << (num_egs_written_++) << "-" << minibatch_size;
   writer_->Write(key.str(), merged_eg);
 }

 void ChainExampleMerger::Finish() {
   if (finished_) return;  // already finished.
   finished_ = true;

   // we'll convert the map eg_to_egs_ to a vector of vectors to avoid
   // iterator invalidation problems.
   std::vector<std::vector<NnetChainExample*> > all_egs;
   all_egs.reserve(eg_to_egs_.size());

   MapType::iterator iter = eg_to_egs_.begin(), end = eg_to_egs_.end();
   for (; iter != end; ++iter)
     all_egs.push_back(iter->second);
   eg_to_egs_.clear();

   for (size_t i = 0; i < all_egs.size(); i++) {
     int32 minibatch_size;
     std::vector<NnetChainExample*> &vec = all_egs[i];
     KALDI_ASSERT(!vec.empty());
     int32 eg_size = GetNnetChainExampleSize(*(vec[0]));
     bool input_ended = true;
     while (!vec.empty() &&
            (minibatch_size = config_.MinibatchSize(eg_size, vec.size(),
                                                    input_ended)) != 0) {
       // MergeChainExamples() expects a vector of
       // NnetChainExample, not of pointers, so use swap to create that
       // without doing any real work.
       std::vector<NnetChainExample> egs_to_merge(minibatch_size);
       for (int32 i = 0; i < minibatch_size; i++) {
         egs_to_merge[i].Swap(vec[i]);
         delete vec[i];  // we owned those pointers.
       }
       vec.erase(vec.begin(), vec.begin() + minibatch_size);
       WriteMinibatch(&egs_to_merge);
     }
     if (!vec.empty()) {
       int32 eg_size = GetNnetChainExampleSize(*(vec[0]));
       NnetChainExampleStructureHasher eg_hasher;
       size_t structure_hash = eg_hasher(*(vec[0]));
       int32 num_discarded = vec.size();
       stats_.DiscardedExamples(eg_size, structure_hash, num_discarded);
       for (int32 i = 0; i < num_discarded; i++)
         delete vec[i];
       vec.clear();
     }
   }
   stats_.PrintStats();
 }


 } // namespace nnet3
 } // namespace kaldi
kaldi::nnet3::NnetExample
NnetExample is the input data and corresponding label (or labels) for one or more frames of input...
Definition: nnet-example.h:111

kaldi
This code computes Goodness of Pronunciation (GOP) and extracts phone-level pronunciation feature for...
Definition: chain.dox:20

kaldi::nnet3::NnetIo
Definition: nnet-example.h:33

kaldi::nnet3::ExampleMergingConfig::compress
bool compress
Definition: nnet-example-utils.h:324

kaldi::nnet3::WriteIndexVector
void WriteIndexVector(std::ostream &os, bool binary, const std::vector< Index > &vec)
Definition: nnet-common.cc:126

kaldi::nnet3::NnetChainSupervision::deriv_weights
Vector< BaseFloat > deriv_weights
This is a vector of per-frame weights, required to be between 0 and 1, that is applied to the derivat...
Definition: nnet-chain-example.h:77

kaldi::nnet3::ExampleMergingStats::DiscardedExamples
void DiscardedExamples(int32 example_size, size_t structure_hash, int32 num_discarded)
Users call this function to inform this class that after processing all the data, for examples of ori...
Definition: nnet-example-utils.cc:1065

kaldi::kUndefined
Definition: matrix-common.h:39

kaldi::nnet3::ComputationRequest::store_component_stats
bool store_component_stats
you should set store_component_stats to true if you need the average-activation and average-derivative...
Definition: nnet-computation.h:126

rnnlm::j
int j
Definition: mikolov-rnnlm-lib.cc:66

kaldi::nnet3::ComputationRequest::need_model_derivative
bool need_model_derivative
if need_model_derivative is true, then we'll be doing either model training or model-derivative compu...
Definition: nnet-computation.h:121

kaldi::nnet3::IndexVectorHasher
Definition: nnet-common.h:131

kaldi::ReadBasicType
void ReadBasicType(std::istream &is, bool binary, T *t)
ReadBasicType is the name of the read function for bool, integer types, and floating-point types...
Definition: io-funcs-inl.h:55

kaldi::nnet3::NnetChainSupervision::supervision
chain::Supervision supervision
The supervision object, containing the FST.
Definition: nnet-chain-example.h:64

kaldi::nnet3::NnetChainExample::inputs
std::vector< NnetIo > inputs
'inputs' contains the input to the network – normally it has just one element called "input"...
Definition: nnet-chain-example.h:115

kaldi::nnet3::MergeChainExamples
void MergeChainExamples(bool compress, std::vector< NnetChainExample > *input, NnetChainExample *output)
This function merges a list of NnetChainExample objects into a single one– intended to be used when ...
Definition: nnet-chain-example.cc:256

kaldi::nnet3::ShiftChainExampleTimes
void ShiftChainExampleTimes(int32 frame_shift, const std::vector< std::string > &exclude_names, NnetChainExample *eg)
Shifts the time-index t of everything in the input of "eg" by adding "frame_shift" to all "t" values – b...
Definition: nnet-chain-example.cc:353

kaldi::nnet3::Nnet::IsInputNode
bool IsInputNode(int32 node) const
Returns true if this is an input node, meaning that it is of type kInput.
Definition: nnet-nnet.cc:120

kaldi::nnet3::MergeSupervision
static void MergeSupervision(const std::vector< const NnetChainSupervision *> &inputs, NnetChainSupervision *output)
Definition: nnet-chain-example.cc:195

kaldi::nnet3::ExampleMergingConfig::MinibatchSize
int32 MinibatchSize(int32 size_of_eg, int32 num_available_egs, bool input_ended) const
This function tells you what minibatch size should be used for this eg.
Definition: nnet-example-utils.cc:1017

kaldi::TableWriter
A templated class for writing objects to an archive or script file; see The Table concept...
Definition: kaldi-table.h:368

kaldi::int32
kaldi::int32 int32
Definition: online-tcp-source.cc:27

kaldi::ReadToken
void ReadToken(std::istream &is, bool binary, std::string *str)
ReadToken gets the next token and puts it in str (exception on failure).
Definition: io-funcs.cc:154

kaldi::nnet3::NnetChainExample::NnetChainExample
NnetChainExample()
Definition: nnet-chain-example.h:129

kaldi::nnet3::ComputationRequest::inputs
std::vector< IoSpecification > inputs
Definition: nnet-computation.h:115

kaldi::nnet3::NnetIo::indexes
std::vector< Index > indexes
"indexes" is a vector the same length as features.NumRows(), explaining the meaning of each row of th...
Definition: nnet-example.h:42

kaldi::nnet3::IoSpecification::name
std::string name
Definition: nnet-computation.h:73

kaldi::nnet3::NnetChainSupervision::Write
void Write(std::ostream &os, bool binary) const
Definition: nnet-chain-example.cc:28

kaldi::nnet3::NnetChainSupervision::Swap
void Swap(NnetChainSupervision *other)
Definition: nnet-chain-example.cc:98

kaldi::StringHasher
A hashing function object for strings.
Definition: stl-utils.h:248

kaldi::nnet3::NnetChainSupervision::name
std::string name
the name of the output in the neural net; in simple setups it will just be "output".
Definition: nnet-chain-example.h:46

kaldi::TableWriter::Write
void Write(const std::string &key, const T &value) const
Definition: kaldi-table-inl.h:1511

kaldi::nnet3::ChainExampleMerger::finished_
bool finished_
Definition: nnet-chain-example.h:262

kaldi::nnet3::Index
struct Index is intended to represent the various indexes by which we number the rows of the matrices...
Definition: nnet-common.h:44

kaldi::nnet3::ExampleMergingConfig
Definition: nnet-example-utils.h:321

kaldi::nnet3::GetNnetChainExampleSize
int32 GetNnetChainExampleSize(const NnetChainExample &a)
Definition: nnet-chain-example.cc:437

kaldi::nnet3::NnetChainExampleStructureCompare::operator()
bool operator()(const NnetChainExample &a, const NnetChainExample &b) const
Definition: nnet-chain-example.cc:417

kaldi::nnet3::ChainExampleMerger::Finish
void Finish()
Definition: nnet-chain-example.cc:505

kaldi::nnet3::NnetChainSupervision::NnetChainSupervision
NnetChainSupervision()
Definition: nnet-chain-example.h:81

kaldi::nnet3::ExampleMergingStats::PrintStats
void PrintStats() const
Calling this will cause a log message with information about the examples to be printed.
Definition: nnet-example-utils.cc:1073

kaldi::nnet3::ComputationRequest
Definition: nnet-computation.h:114

kaldi::nnet3::NnetChainExampleStructureHasher
This hashing object hashes just the structural aspects of the NnetExample without looking at the valu...
Definition: nnet-chain-example.h:141

kaldi::nnet3::NnetChainSupervision::CheckDim
void CheckDim() const
Definition: nnet-chain-example.cc:65

kaldi::nnet3::Nnet::IsOutputNode
bool IsOutputNode(int32 node) const
Returns true if this is an output node, meaning that it is of type kDescriptor and is not directly fo...
Definition: nnet-nnet.cc:112

kaldi::nnet3::ExpectToken
static void ExpectToken(const std::string &token, const std::string &what_we_are_parsing, const std::string **next_token)
Definition: nnet-descriptor.cc:45

kaldi::nnet3::NnetChainExample::outputs
std::vector< NnetChainSupervision > outputs
'outputs' contains the chain output supervision.
Definition: nnet-chain-example.h:119

kaldi::nnet3::ChainExampleMerger::ChainExampleMerger
ChainExampleMerger(const ExampleMergingConfig &config, NnetChainExampleWriter *writer)
Definition: nnet-chain-example.cc:453

rnnlm::n
struct rnnlm::@11::@12 n

kaldi::nnet3::NnetChainSupervision::Read
void Read(std::istream &is, bool binary)
Definition: nnet-chain-example.cc:45

kaldi::nnet3::NnetChainExample
NnetChainExample is like NnetExample, but specialized for lattice-free (chain) training.
Definition: nnet-chain-example.h:110

kaldi::nnet3::Nnet
Definition: nnet-nnet.h:115

nnet-example-utils.h

kaldi::nnet3::ChainExampleMerger::AcceptExample
void AcceptExample(NnetChainExample *a)
Definition: nnet-chain-example.cc:459

kaldi::nnet3::NnetChainExampleStructureHasher::operator()
size_t operator()(const NnetChainExample &eg) const noexcept
Definition: nnet-chain-example.cc:400

kaldi::nnet3::NnetChainExample::Swap
void Swap(NnetChainExample *other)
Definition: nnet-chain-example.cc:177

KALDI_ERR
#define KALDI_ERR
Definition: kaldi-error.h:147

kaldi::WriteToken
void WriteToken(std::ostream &os, bool binary, const char *token)
The WriteToken functions are for writing nonempty sequences of non-space characters.
Definition: io-funcs.cc:134

kaldi::VectorBase::Dim
MatrixIndexT Dim() const
Returns the dimension of the vector.
Definition: kaldi-vector.h:64

kaldi::nnet3::ReadIndexVector
void ReadIndexVector(std::istream &is, bool binary, std::vector< Index > *vec)
Definition: nnet-common.cc:143

kaldi::nnet3::NnetChainExample::Read
void Read(std::istream &is, bool binary)
Definition: nnet-chain-example.cc:157

kaldi::nnet3::ExampleMergingStats::WroteExample
void WroteExample(int32 example_size, size_t structure_hash, int32 minibatch_size)
Users call this function to inform this class that one minibatch has been written aggregating 'miniba...
Definition: nnet-example-utils.cc:1051

kaldi::nnet3::ChainExampleMerger::config_
const ExampleMergingConfig & config_
Definition: nnet-chain-example.h:264

kaldi::nnet3::IoSpecification
Definition: nnet-computation.h:72

kaldi::nnet3::ChainExampleMerger::writer_
NnetChainExampleWriter * writer_
Definition: nnet-chain-example.h:265

kaldi::nnet3::IoSpecification::has_deriv
bool has_deriv
Definition: nnet-computation.h:75

kaldi::nnet3::ChainExampleMerger::num_egs_written_
int32 num_egs_written_
Definition: nnet-chain-example.h:263

rnnlm::i
int i
Definition: mikolov-rnnlm-lib.cc:66

kaldi::nnet3::NnetChainSupervision::operator==
bool operator==(const NnetChainSupervision &other) const
Definition: nnet-chain-example.cc:39

kaldi::nnet3::IoSpecification::indexes
std::vector< Index > indexes
Definition: nnet-computation.h:74

kaldi::nnet3::NnetChainExample::Write
void Write(std::ostream &os, bool binary) const
Definition: nnet-chain-example.cc:132

kaldi::nnet3::ChainExampleMerger::stats_
ExampleMergingStats stats_
Definition: nnet-chain-example.h:266

kaldi::Vector
A class representing a vector.
Definition: kaldi-vector.h:406

KALDI_ASSERT
#define KALDI_ASSERT(cond)
Definition: kaldi-error.h:185

kaldi::nnet3::ComputationRequest::outputs
std::vector< IoSpecification > outputs
Definition: nnet-computation.h:116

kaldi::nnet3::NnetIoStructureCompare
This comparison object compares just the structural aspects of the NnetIo object (name, indexes, feature dimension) without looking at the value of features.
Definition: nnet-example.h:101

kaldi::nnet3::NnetChainSupervision
Definition: nnet-chain-example.h:43

kaldi::nnet3::NnetChainSupervision::indexes
std::vector< Index > indexes
The indexes that the output corresponds to.
Definition: nnet-chain-example.h:60

kaldi::nnet3::NnetIoStructureHasher
This hashing object hashes just the structural aspects of the NnetIo object (name, indexes, feature dimension) without looking at the value of features.
Definition: nnet-example.h:94

kaldi::nnet3::ReadVectorAsChar
void ReadVectorAsChar(std::istream &is, bool binary, Vector< BaseFloat > *vec)
Definition: nnet-example-utils.cc:258

kaldi::WriteBasicType
void WriteBasicType(std::ostream &os, bool binary, T t)
WriteBasicType is the name of the write function for bool, integer types, and floating-point types...
Definition: io-funcs-inl.h:34

kaldi::nnet3::NnetIo::name
std::string name
the name of the input in the neural net; in simple setups it will just be "input".
Definition: nnet-example.h:36

kaldi::nnet3::ChainExampleMerger::WriteMinibatch
void WriteMinibatch(std::vector< NnetChainExample > *egs)
Definition: nnet-chain-example.cc:490

kaldi::nnet3::Nnet::GetNodeIndex
int32 GetNodeIndex(const std::string &node_name) const
returns index associated with this node name, or -1 if no such index.
Definition: nnet-nnet.cc:466

kaldi::VectorBase
Provides a vector abstraction class.
Definition: kaldi-vector.h:41

kaldi::nnet3::GetChainComputationRequest
void GetChainComputationRequest(const Nnet &nnet, const NnetChainExample &eg, bool need_model_derivative, bool store_component_stats, bool use_xent_regularization, bool use_xent_derivative, ComputationRequest *request)
This function takes a NnetChainExample and produces a ComputationRequest.
Definition: nnet-chain-example.cc:290

kaldi::nnet3::NnetExample::io
std::vector< NnetIo > io
"io" contains the input and output.
Definition: nnet-example.h:116

kaldi::nnet3::NnetChainExample::Compress
void Compress()
Definition: nnet-chain-example.cc:182

nnet-chain-example.h

kaldi::RandInt
int32 RandInt(int32 min_val, int32 max_val, struct RandomState *state)
Definition: kaldi-math.cc:95

kaldi::nnet3::MergeExamples
void MergeExamples(const std::vector< NnetExample > &src, bool compress, NnetExample *merged_eg)
Merge a set of input examples into a single example (typically the size of "src" will be the minibatc...
Definition: nnet-example-utils.cc:162

kaldi::nnet3::ChainExampleMerger::eg_to_egs_
MapType eg_to_egs_
Definition: nnet-chain-example.h:273