doc/nnet-discriminative-example_8cc_source.html

 // nnet3/nnet-discriminative-example.cc

 // Copyright      2015    Johns Hopkins University (author: Daniel Povey)

 // See ../../COPYING for clarification regarding multiple authors
 //
 // Licensed under the Apache License, Version 2.0 (the "License");
 // you may not use this file except in compliance with the License.
 // You may obtain a copy of the License at
 //
 //  http://www.apache.org/licenses/LICENSE-2.0
 //
 // THIS CODE IS PROVIDED *AS IS* BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY
 // KIND, EITHER EXPRESS OR IMPLIED, INCLUDING WITHOUT LIMITATION ANY IMPLIED
 // WARRANTIES OR CONDITIONS OF TITLE, FITNESS FOR A PARTICULAR PURPOSE,
 // MERCHANTABLITY OR NON-INFRINGEMENT.
 // See the Apache 2 License for the specific language governing permissions and
 // limitations under the License.

 #include <cmath>
 #include "nnet3/nnet-discriminative-example.h"
 #include "nnet3/nnet-example-utils.h"

 namespace kaldi {
 namespace nnet3 {
 using std::string;

 // Serializes this object to 'os', in binary or text mode depending on
 // 'binary'.  The layout is: opening token, output name, index vector, the
 // wrapped discriminative supervision, a "<DW>" token followed by the
 // derivative weights, and finally the closing token.  CheckDim() runs first,
 // so an inconsistent object trips an assertion before anything is written.
 void NnetDiscriminativeSupervision::Write(std::ostream &os, bool binary) const {
   CheckDim();
   WriteToken(os, binary, "<NnetDiscriminativeSup>");
   WriteToken(os, binary, name);
   WriteIndexVector(os, binary, indexes);
   supervision.Write(os, binary);
   WriteToken(os, binary, "<DW>");  // for DerivWeights.  Want to save space.
   WriteVectorAsChar(os, binary, deriv_weights);
   WriteToken(os, binary, "</NnetDiscriminativeSup>");
 }

 // Equality test.  The name, the index list and the wrapped supervision must
 // compare equal; the derivative weights only have to be approximately equal
 // (as decided by ApproxEqual()).  The comparisons are made in that order and
 // stop at the first mismatch.
 bool NnetDiscriminativeSupervision::operator == (const NnetDiscriminativeSupervision &other) const {
   if (!(name == other.name))
     return false;
   if (!(indexes == other.indexes))
     return false;
   if (!(supervision == other.supervision))
     return false;
   return deriv_weights.ApproxEqual(other.deriv_weights);
 }

 // Deserializes this object from 'is', in binary or text mode depending on
 // 'binary'.  The expected layout mirrors Write(): opening token, output name,
 // index vector, the wrapped discriminative supervision, a "<DW>" token
 // followed by the derivative weights, and the closing token.  CheckDim() is
 // run on the result, so inconsistent data trips an assertion.
 void NnetDiscriminativeSupervision::Read(std::istream &is, bool binary) {
   ExpectToken(is, binary, "<NnetDiscriminativeSup>");
   ReadToken(is, binary, &name);
   ReadIndexVector(is, binary, &indexes);
   supervision.Read(is, binary);
   ExpectToken(is, binary, "<DW>");
   ReadVectorAsChar(is, binary, &deriv_weights);
   ExpectToken(is, binary, "</NnetDiscriminativeSup>");
   CheckDim();
 }


 void NnetDiscriminativeSupervision::CheckDim() const {
   if (supervision.frames_per_sequence == -1) {
     // this object has not been set up.
     KALDI_ASSERT(indexes.empty());
     return;
   }
   KALDI_ASSERT(indexes.size() == supervision.num_sequences *
                supervision.frames_per_sequence && !indexes.empty() &&
                supervision.frames_per_sequence > 1);
   int32 first_frame = indexes[0].t,
       frame_skip = indexes[supervision.num_sequences].t - first_frame,
       num_sequences = supervision.num_sequences,
       frames_per_sequence = supervision.frames_per_sequence;
   int32 k = 0;
   for (int32 i = 0; i < frames_per_sequence; i++) {
     for (int32 j = 0; j < num_sequences; j++,k++) {
       int32 n = j, t = i * frame_skip + first_frame, x = 0;
       Index index(n, t, x);
       KALDI_ASSERT(indexes[k] == index);
     }
   }
   if (deriv_weights.Dim() != 0) {
     KALDI_ASSERT(deriv_weights.Dim() == indexes.size());
     KALDI_ASSERT(deriv_weights.Min() >= 0.0 &&
                  deriv_weights.Max() <= 1.0);
   }
 }

 // Copy constructor: copies the name, indexes, supervision and derivative
 // weights from 'other', then runs CheckDim() on the new object so that an
 // inconsistent source is caught by an assertion.
 NnetDiscriminativeSupervision::NnetDiscriminativeSupervision(const NnetDiscriminativeSupervision &other):
     name(other.name),
     indexes(other.indexes),
     supervision(other.supervision),
     deriv_weights(other.deriv_weights) { CheckDim(); }

 // Builds a supervision object for the output called 'name'.
 //   name           name stored in this object.
 //   supervision    copied into this object; its num_sequences and
 //                  frames_per_sequence determine how many indexes are made.
 //   deriv_weights  copied into this object.
 //   first_frame    't' value given to the first frame.
 //   frame_skip     difference in 't' between consecutive frames.
 // The indexes are generated frame by frame, with the sequence number 'n'
 // varying fastest, and the result is validated with CheckDim().
 NnetDiscriminativeSupervision::NnetDiscriminativeSupervision(
     const std::string &name,
     const discriminative::DiscriminativeSupervision &supervision,
     const VectorBase<BaseFloat> &deriv_weights,
     int32 first_frame,
     int32 frame_skip):
     name(name),
     supervision(supervision),
     deriv_weights(deriv_weights) {
   const int32 num_sequences = supervision.num_sequences,
       frames_per_sequence = supervision.frames_per_sequence;
   // note: this will set the 'x' index to zero.
   indexes.resize(num_sequences * frames_per_sequence);
   int32 k = 0;
   for (int32 frame = 0; frame < frames_per_sequence; ++frame) {
     const int32 t = frame * frame_skip + first_frame;
     for (int32 seq = 0; seq < num_sequences; ++seq, ++k) {
       Index &cur = indexes[k];
       cur.n = seq;
       cur.t = t;
     }
   }
   KALDI_ASSERT(k == indexes.size());
   CheckDim();
 }

 // Exchanges every member of this object with the corresponding member of
 // '*other'.  Afterwards CheckDim() is run on this object, but only on the
 // calls where RandInt(0, 5) happens to return 0.
 void NnetDiscriminativeSupervision::Swap(NnetDiscriminativeSupervision *other) {
   deriv_weights.Swap(&(other->deriv_weights));
   supervision.Swap(&(other->supervision));
   indexes.swap(other->indexes);
   name.swap(other->name);
   const bool run_check = (RandInt(0, 5) == 0);
   if (run_check) {
     CheckDim();
   }
 }


 void NnetDiscriminativeExample::Write(std::ostream &os, bool binary) const {
   // Note: weight, label, input_frames and spk_info are members.  This is a
   // struct.
   WriteToken(os, binary, "<Nnet3DiscriminativeEg>");
   WriteToken(os, binary, "<NumInputs>");
   int32 size = inputs.size();
   WriteBasicType(os, binary, size);
   KALDI_ASSERT(size > 0 && "Attempting to write NnetDiscriminativeExample with no inputs");
   if (!binary) os << '\n';
   for (int32 i = 0; i < size; i++) {
     inputs[i].Write(os, binary);
     if (!binary) os << '\n';
   }
   WriteToken(os, binary, "<NumOutputs>");
   size = outputs.size();
   WriteBasicType(os, binary, size);
   KALDI_ASSERT(size > 0 && "Attempting to write NnetDiscriminativeExample with no outputs");
   if (!binary) os << '\n';
   for (int32 i = 0; i < size; i++) {
     outputs[i].Write(os, binary);
     if (!binary) os << '\n';
   }
   WriteToken(os, binary, "</Nnet3DiscriminativeEg>");
 }

 void NnetDiscriminativeExample::Read(std::istream &is, bool binary) {
   ExpectToken(is, binary, "<Nnet3DiscriminativeEg>");
   ExpectToken(is, binary, "<NumInputs>");
   int32 size;
   ReadBasicType(is, binary, &size);
   if (size < 1 || size > 1000000)
     KALDI_ERR << "Invalid size " << size;
   inputs.resize(size);
   for (int32 i = 0; i < size; i++)
     inputs[i].Read(is, binary);
   ExpectToken(is, binary, "<NumOutputs>");
   ReadBasicType(is, binary, &size);
   if (size < 1 || size > 1000000)
     KALDI_ERR << "Invalid size " << size;
   outputs.resize(size);
   for (int32 i = 0; i < size; i++)
     outputs[i].Read(is, binary);
   ExpectToken(is, binary, "</Nnet3DiscriminativeEg>");
 }

 // Exchanges the 'inputs' and 'outputs' vectors of this example with those of
 // '*other'.
 void NnetDiscriminativeExample::Swap(NnetDiscriminativeExample *other) {
   inputs.swap(other->inputs);
   outputs.swap(other->outputs);
 }

 void NnetDiscriminativeExample::Compress() {
   std::vector<NnetIo>::iterator iter = inputs.begin(), end = inputs.end();
   // calling features.Compress() will do nothing if they are sparse or already
   // compressed.
   for (; iter != end; ++iter) iter->features.Compress();
 }

 // Copy constructor: copies the 'inputs' and 'outputs' vectors of 'other'.
 NnetDiscriminativeExample::NnetDiscriminativeExample(const NnetDiscriminativeExample &other):
     inputs(other.inputs), outputs(other.outputs) { }

 // Merges several supervision objects, all for the same output name, into a
 // single object written to '*output'.
 //   inputs   the objects to merge; must be non-empty, must all share one name,
 //            and every index in them must have n == 0 (i.e. they must not
 //            already be merged).
 //   output   receives the merged name, supervision, indexes and deriv_weights;
 //            its previous contents are overwritten.
 // The i'th input is given n == i in the merged indexes, which are then sorted
 // so that they are ordered first by 't' and then by 'n'.  deriv_weights are
 // merged only when inputs[0] has them, in which case every input must supply
 // the same number of them; otherwise output->deriv_weights is emptied.
 // The result is validated with CheckDim().
 void MergeSupervision(
     const std::vector<const NnetDiscriminativeSupervision*> &inputs,
     NnetDiscriminativeSupervision *output) {
   // inputs[0] is dereferenced below, so an empty list is a caller error.
   KALDI_ASSERT(!inputs.empty());
   int32 num_inputs = inputs.size(),
       num_indexes = 0;
   for (int32 n = 0; n < num_inputs; n++) {
     KALDI_ASSERT(inputs[n]->name == inputs[0]->name);
     num_indexes += inputs[n]->indexes.size();
   }
   output->name = inputs[0]->name;
   std::vector<const discriminative::DiscriminativeSupervision*> input_supervision;
   input_supervision.reserve(inputs.size());
   for (int32 n = 0; n < num_inputs; n++)
     input_supervision.push_back(&(inputs[n]->supervision));
   discriminative::DiscriminativeSupervision output_supervision;
   discriminative::MergeSupervision(input_supervision,
                          &output_supervision);
   output->supervision.Swap(&(output_supervision));

   output->indexes.clear();
   output->indexes.reserve(num_indexes);
   for (int32 n = 0; n < num_inputs; n++) {
     const std::vector<Index> &src_indexes = inputs[n]->indexes;
     int32 cur_size = output->indexes.size();
     output->indexes.insert(output->indexes.end(),
                            src_indexes.begin(), src_indexes.end());
     std::vector<Index>::iterator iter = output->indexes.begin() + cur_size,
         end = output->indexes.end();
     // change the 'n' index to correspond to the index into 'input'.
     // Each example gets a different 'n' value, starting from 0.
     for (; iter != end; ++iter) {
       KALDI_ASSERT(iter->n == 0 && "Merging already-merged discriminative egs");
       iter->n = n;
     }
   }
   KALDI_ASSERT(output->indexes.size() == num_indexes);
   // OK, at this point the 'indexes' will be in the wrong order,
   // because they should be first sorted by 't' and next by 'n'.
   // 'sort' will fix this, due to the operator < on type Index.
   // TODO: Is this required?
   std::sort(output->indexes.begin(), output->indexes.end());

   // merge the deriv_weights.
   if (inputs[0]->deriv_weights.Dim() != 0) {
     int32 frames_per_sequence = inputs[0]->deriv_weights.Dim();
     output->deriv_weights.Resize(output->indexes.size(), kUndefined);
     KALDI_ASSERT(output->deriv_weights.Dim() ==
                  frames_per_sequence * num_inputs);
     for (int32 n = 0; n < num_inputs; n++) {
       const Vector<BaseFloat> &src_deriv_weights = inputs[n]->deriv_weights;
       KALDI_ASSERT(src_deriv_weights.Dim() == frames_per_sequence);
       // the ordering of the deriv_weights corresponds to the ordering of the
       // Indexes, where the time dimension has the greater stride.
       for (int32 t = 0; t < frames_per_sequence; t++) {
         output->deriv_weights(t * num_inputs + n) = src_deriv_weights(t);
       }
     }
   } else {
     // The inputs carry no deriv_weights: make sure a re-used 'output' does
     // not keep stale weights left over from an earlier use.
     output->deriv_weights.Resize(0);
   }
   output->CheckDim();
 }


 void MergeDiscriminativeExamples(
     bool compress,
     std::vector<NnetDiscriminativeExample> *input,
     NnetDiscriminativeExample *output) {
   int32 num_examples = input->size();
   KALDI_ASSERT(num_examples > 0);
   // we temporarily make the input-features in 'input' look like regular
   // NnetExamples, so that we can recycle the
   // MergeExamples() function.
   std::vector<NnetExample> eg_inputs(num_examples);
   for (int32 i = 0; i < num_examples; i++)
     eg_inputs[i].io.swap((*input)[i].inputs);
   NnetExample eg_output;
   MergeExamples(eg_inputs, compress, &eg_output);
   // swap the inputs back so that they are not really changed.
   for (int32 i = 0; i < num_examples; i++)
     eg_inputs[i].io.swap((*input)[i].inputs);
   // write to 'output->inputs'
   eg_output.io.swap(output->inputs);

   // Now deal with the discriminative-supervision 'outputs'.  There will
   // normally be just one of these, with name "output", but we
   // handle the more general case.
   int32 num_output_names = (*input)[0].outputs.size();
   output->outputs.resize(num_output_names);
   for (int32 i = 0; i < num_output_names; i++) {
     std::vector<const NnetDiscriminativeSupervision*> to_merge(num_examples);
     for (int32 j = 0; j < num_examples; j++) {
       KALDI_ASSERT((*input)[j].outputs.size() == num_output_names);
       to_merge[j] = &((*input)[j].outputs[i]);
     }
     MergeSupervision(to_merge,
                      &(output->outputs[i]));
   }
 }


 // Fills in '*request' with the computation needed to process 'eg' on 'nnet'.
 //   nnet                     network whose input/output nodes are looked up
 //                            by name.
 //   eg                       example supplying the input and output names and
 //                            indexes.
 //   need_model_derivative    copied to request->need_model_derivative and
 //                            used as has_deriv for each regular output.
 //   store_component_stats    copied to request->store_component_stats.
 //   use_xent_regularization  if true, each output "<name>" is followed by an
 //                            extra output "<name>-xent" with the same indexes.
 //   use_xent_derivative      has_deriv value for the "-xent" outputs.
 //   request                  overwritten with the resulting request.
 // Inputs never request derivatives.  KALDI_ERR is raised if an input (output)
 // name does not refer to an input (output) node of 'nnet', or if the
 // resulting request has no inputs or no outputs.
 void GetDiscriminativeComputationRequest(const Nnet &nnet,
                                          const NnetDiscriminativeExample &eg,
                                          bool need_model_derivative,
                                          bool store_component_stats,
                                          bool use_xent_regularization,
                                          bool use_xent_derivative,
                                          ComputationRequest *request) {
   request->inputs.clear();
   request->inputs.reserve(eg.inputs.size());
   request->outputs.clear();
   // each supervision yields one output, plus a "-xent" twin when requested.
   request->outputs.reserve(eg.outputs.size() *
                            (use_xent_regularization ? 2 : 1));
   request->need_model_derivative = need_model_derivative;
   request->store_component_stats = store_component_stats;
   for (size_t i = 0; i < eg.inputs.size(); i++) {
     const NnetIo &io = eg.inputs[i];
     const std::string &name = io.name;
     int32 node_index = nnet.GetNodeIndex(name);
     // This must be '||': a missing node (-1) has to be rejected *before* it
     // is used as an index, and an existing node of the wrong type has to be
     // rejected as well.
     if (node_index == -1 ||
         !nnet.IsInputNode(node_index))
       KALDI_ERR << "Nnet example has input named '" << name
                 << "', but no such input node is in the network.";

     request->inputs.resize(request->inputs.size() + 1);
     IoSpecification &io_spec = request->inputs.back();
     io_spec.name = name;
     io_spec.indexes = io.indexes;
     io_spec.has_deriv = false;
   }
   for (size_t i = 0; i < eg.outputs.size(); i++) {
     // there will normally be exactly one output , named "output"
     const NnetDiscriminativeSupervision &sup = eg.outputs[i];
     const std::string &name = sup.name;
     int32 node_index = nnet.GetNodeIndex(name);
     // Same reasoning as for the inputs: '||', not '&&'.
     if (node_index == -1 ||
         !nnet.IsOutputNode(node_index))
       KALDI_ERR << "Nnet example has output named '" << name
                 << "', but no such output node is in the network.";
     request->outputs.resize(request->outputs.size() + 1);
     IoSpecification &io_spec = request->outputs.back();
     io_spec.name = name;
     io_spec.indexes = sup.indexes;
     io_spec.has_deriv = need_model_derivative;

     if (use_xent_regularization) {
       size_t cur_size = request->outputs.size();
       request->outputs.resize(cur_size + 1);
       // re-fetch both references: growing the vector may have moved its
       // elements, so the reference taken above must not be used any more.
       IoSpecification &io_spec = request->outputs[cur_size - 1],
           &io_spec_xent = request->outputs[cur_size];
       // the IoSpecification for the -xent output is the same
       // as for the regular output, except for its name which has
       // the -xent suffix (and the has_deriv member may differ).
       io_spec_xent = io_spec;
       io_spec_xent.name = name + "-xent";
       io_spec_xent.has_deriv = use_xent_derivative;
     }
   }
   // check to see if something went wrong.
   if (request->inputs.empty())
     KALDI_ERR << "No inputs in computation request.";
   if (request->outputs.empty())
     KALDI_ERR << "No outputs in computation request.";
 }

 // Shifts the time indexes of '*eg'.
 //   frame_shift    amount added to the 't' of every index of every input
 //                  whose name is not listed in 'exclude_names'.
 //   exclude_names  names of inputs that must be left unshifted.
 //   eg             example modified in place.
 // Each output is shifted by 'frame_shift' rounded to the closest multiple of
 // that output's frame-subsampling factor, which is taken to be the difference
 // in 't' between its first two indexes.  Those two indexes must share 'n' and
 // 'x', and the difference must be positive; both are asserted.
 void ShiftDiscriminativeExampleTimes(int32 frame_shift,
                             const std::vector<std::string> &exclude_names,
                             NnetDiscriminativeExample *eg) {
   for (NnetIo &io : eg->inputs) {
     bool must_exclude = false;
     for (const std::string &excluded : exclude_names) {
       if (io.name == excluded) {
         must_exclude = true;
         break;
       }
     }
     if (must_exclude)
       continue;
     for (Index &index : io.indexes)
       index.t += frame_shift;
   }
   // note: we'll normally choose a small enough shift that the output-data
   // shift will be zero after dividing by frame_subsampling_factor
   // (e.g. frame_subsampling_factor == 3 and shift = 0 or 1).
   for (NnetDiscriminativeSupervision &sup : eg->outputs) {
     std::vector<Index> &indexes = sup.indexes;
     KALDI_ASSERT(indexes.size() >= 2 && indexes[0].n == indexes[1].n &&
                  indexes[0].x == indexes[1].x);
     int32 frame_subsampling_factor = indexes[1].t - indexes[0].t;
     KALDI_ASSERT(frame_subsampling_factor > 0);

     // We need to shift by a multiple of frame_subsampling_factor.
     // Round to the closest multiple.
     const double num_steps =
         std::floor(0.5 + (frame_shift * 1.0 / frame_subsampling_factor));
     int32 supervision_frame_shift = frame_subsampling_factor * num_steps;
     if (supervision_frame_shift != 0) {
       for (Index &index : indexes)
         index.t += supervision_frame_shift;
     }
   }
 }

 // Hashes the structure of 'eg': the number of inputs, the structural hash of
 // each input (via NnetIoStructureHasher), and the name and indexes of each
 // output.  The supervision contents and the derivative weights of the outputs
 // do not contribute to the hash.
 size_t NnetDiscriminativeExampleStructureHasher::operator () (
     const NnetDiscriminativeExample &eg) const noexcept {
   NnetIoStructureHasher io_hasher;
   StringHasher string_hasher;
   IndexVectorHasher indexes_hasher;
   // these numbers were chosen at random from a list of primes.
   size_t ans = eg.inputs.size() * 35099;
   for (const NnetIo &io : eg.inputs)
     ans = ans * 19157 + io_hasher(io);
   for (const NnetDiscriminativeSupervision &sup : eg.outputs) {
     ans = ans * 17957 +
         string_hasher(sup.name) + indexes_hasher(sup.indexes);
   }
   return ans;
 }

 // Returns true when 'a' and 'b' have the same structure: the same number of
 // inputs and outputs, inputs that pairwise compare equal under
 // NnetIoStructureCompare, and outputs whose names and indexes are pairwise
 // identical.  The supervision contents and the derivative weights of the
 // outputs are not compared.
 bool NnetDiscriminativeExampleStructureCompare::operator () (
     const NnetDiscriminativeExample &a,
     const NnetDiscriminativeExample &b) const {
   const size_t num_inputs = a.inputs.size(),
       num_outputs = a.outputs.size();
   if (num_inputs != b.inputs.size())
     return false;
   if (num_outputs != b.outputs.size())
     return false;

   NnetIoStructureCompare io_compare;
   for (size_t i = 0; i < num_inputs; ++i) {
     if (!io_compare(a.inputs[i], b.inputs[i]))
       return false;
   }
   for (size_t i = 0; i < num_outputs; ++i) {
     const NnetDiscriminativeSupervision &sup_a = a.outputs[i],
         &sup_b = b.outputs[i];
     const bool same_structure = (sup_a.name == sup_b.name &&
                                  sup_a.indexes == sup_b.indexes);
     if (!same_structure)
       return false;
   }
   return true;
 }


 // Returns the "size" of example 'a', defined here as the largest number of
 // indexes found in any single input or output (0 if there are none).
 int32 GetNnetDiscriminativeExampleSize(const NnetDiscriminativeExample &a) {
   int32 largest = 0;
   for (const NnetIo &io : a.inputs) {
     const int32 count = io.indexes.size();
     largest = (count > largest ? count : largest);
   }
   for (const NnetDiscriminativeSupervision &sup : a.outputs) {
     const int32 count = sup.indexes.size();
     largest = (count > largest ? count : largest);
   }
   return largest;
 }


 // Constructs a merger in the "not finished" state with zero examples written.
 //   config  copied into config_.
 //   writer  pointer stored in writer_ and used to write the merged examples.
 //           NOTE(review): the pointer is only stored here; presumably the
 //           caller keeps ownership and must keep it alive -- confirm.
 DiscriminativeExampleMerger::DiscriminativeExampleMerger(const ExampleMergingConfig &config,
                              NnetDiscriminativeExampleWriter *writer):
     finished_(false), num_egs_written_(0),
     config_(config), writer_(writer) { }


 // Takes ownership of 'eg' and files it with the other pending examples of
 // the same structure.  If config_.MinibatchSize() then returns a nonzero
 // size, all pending examples of that structure are merged and written out
 // and their storage is freed.  Must not be called after Finish().
 void DiscriminativeExampleMerger::AcceptExample(NnetDiscriminativeExample *eg) {
   KALDI_ASSERT(!finished_);
   // If an eg with the same structure as 'eg' is already a key in the
   // map, it won't be replaced, but if it's new it will be made
   // the key.  Also we remove the key before making the vector empty.
   // This way we ensure that the eg in the key is always the first
   // element of the vector.
   std::vector<NnetDiscriminativeExample*> &pending = eg_to_egs_[eg];
   pending.push_back(eg);
   int32 num_available = pending.size();
   int32 minibatch_size = config_.MinibatchSize(
       GetNnetDiscriminativeExampleSize(*eg), num_available,
       false /* the input has not ended */);
   if (minibatch_size == 0)
     return;  // nothing to write out for now.

   // we need to write out a merged eg.
   KALDI_ASSERT(minibatch_size == num_available);

   // Copy the pointers and drop the map entry first: the map key is one of
   // these pointers, so it must be gone from the map before it is deleted.
   std::vector<NnetDiscriminativeExample*> owned(pending);
   eg_to_egs_.erase(eg);

   // MergeDiscriminativeExamples() expects a vector of
   // NnetDiscriminativeExample, not of pointers, so use swap to create that
   // without doing any real work.
   std::vector<NnetDiscriminativeExample> egs_to_merge(minibatch_size);
   for (int32 i = 0; i < minibatch_size; i++) {
     NnetDiscriminativeExample *cur = owned[i];
     egs_to_merge[i].Swap(cur);
     delete cur;  // we owned those pointers.
   }
   WriteMinibatch(&egs_to_merge);
 }

 void DiscriminativeExampleMerger::WriteMinibatch(
     std::vector<NnetDiscriminativeExample> *egs) {
   KALDI_ASSERT(!egs->empty());
   int32 eg_size = GetNnetDiscriminativeExampleSize((*egs)[0]);
   NnetDiscriminativeExampleStructureHasher eg_hasher;
   size_t structure_hash = eg_hasher((*egs)[0]);
   int32 minibatch_size = egs->size();
   stats_.WroteExample(eg_size, structure_hash, minibatch_size);
   NnetDiscriminativeExample merged_eg;
   MergeDiscriminativeExamples(config_.compress, egs, &merged_eg);
   std::ostringstream key;
   key << "merged-" << (num_egs_written_++) << "-" << minibatch_size;
   writer_->Write(key.str(), merged_eg);
 }

 void DiscriminativeExampleMerger::Finish() {
   if (finished_) return;  // already finished.
   finished_ = true;

   // we'll convert the map eg_to_egs_ to a vector of vectors to avoid
   // iterator invalidation problems.
   std::vector<std::vector<NnetDiscriminativeExample*> > all_egs;
   all_egs.reserve(eg_to_egs_.size());

   MapType::iterator iter = eg_to_egs_.begin(), end = eg_to_egs_.end();
   for (; iter != end; ++iter)
     all_egs.push_back(iter->second);
   eg_to_egs_.clear();

   for (size_t i = 0; i < all_egs.size(); i++) {
     int32 minibatch_size;
     std::vector<NnetDiscriminativeExample*> &vec = all_egs[i];
     KALDI_ASSERT(!vec.empty());
     int32 eg_size = GetNnetDiscriminativeExampleSize(*(vec[0]));
     bool input_ended = true;
     while (!vec.empty() &&
            (minibatch_size = config_.MinibatchSize(eg_size, vec.size(),
                                                    input_ended)) != 0) {
       // MergeDiscriminativeExamples() expects a vector of
       // NnetDiscriminativeExample, not of pointers, so use swap to create that
       // without doing any real work.
       std::vector<NnetDiscriminativeExample> egs_to_merge(minibatch_size);
       for (int32 i = 0; i < minibatch_size; i++) {
         egs_to_merge[i].Swap(vec[i]);
         delete vec[i];  // we owned those pointers.
       }
       vec.erase(vec.begin(), vec.begin() + minibatch_size);
       WriteMinibatch(&egs_to_merge);
     }
     if (!vec.empty()) {
       int32 eg_size = GetNnetDiscriminativeExampleSize(*(vec[0]));
       NnetDiscriminativeExampleStructureHasher eg_hasher;
       size_t structure_hash = eg_hasher(*(vec[0]));
       int32 num_discarded = vec.size();
       stats_.DiscardedExamples(eg_size, structure_hash, num_discarded);
       for (int32 i = 0; i < num_discarded; i++)
         delete vec[i];
       vec.clear();
     }
   }
   stats_.PrintStats();
 }


 } // namespace nnet3
 } // namespace kaldi
kaldi::nnet3::NnetExample
NnetExample is the input data and corresponding label (or labels) for one or more frames of input...
Definition: nnet-example.h:111

kaldi::nnet3::ShiftDiscriminativeExampleTimes
void ShiftDiscriminativeExampleTimes(int32 frame_shift, const std::vector< std::string > &exclude_names, NnetDiscriminativeExample *eg)
Shifts the time-index t of everything in the input of "eg" by adding "frame_shift" to all "t" values– b...
Definition: nnet-discriminative-example.cc:347

kaldi
This code computes Goodness of Pronunciation (GOP) and extracts phone-level pronunciation feature for...
Definition: chain.dox:20

kaldi::nnet3::NnetIo
Definition: nnet-example.h:33

kaldi::nnet3::ExampleMergingConfig::compress
bool compress
Definition: nnet-example-utils.h:324

kaldi::nnet3::WriteIndexVector
void WriteIndexVector(std::ostream &os, bool binary, const std::vector< Index > &vec)
Definition: nnet-common.cc:126

kaldi::nnet3::ExampleMergingStats::DiscardedExamples
void DiscardedExamples(int32 example_size, size_t structure_hash, int32 num_discarded)
Users call this function to inform this class that after processing all the data, for examples of ori...
Definition: nnet-example-utils.cc:1065

kaldi::nnet3::DiscriminativeExampleMerger::AcceptExample
void AcceptExample(NnetDiscriminativeExample *a)
Definition: nnet-discriminative-example.cc:452

kaldi::kUndefined
Definition: matrix-common.h:39

kaldi::nnet3::ComputationRequest::store_component_stats
bool store_component_stats
you should set store_component_stats to true if you need the average-activation and average-derivative...
Definition: nnet-computation.h:126

rnnlm::j
int j
Definition: mikolov-rnnlm-lib.cc:66

kaldi::nnet3::NnetDiscriminativeSupervision::CheckDim
void CheckDim() const
Definition: nnet-discriminative-example.cc:57

kaldi::nnet3::ComputationRequest::need_model_derivative
bool need_model_derivative
if need_model_derivative is true, then we'll be doing either model training or model-derivative compu...
Definition: nnet-computation.h:121

kaldi::nnet3::DiscriminativeExampleMerger::writer_
NnetDiscriminativeExampleWriter * writer_
Definition: nnet-discriminative-example.h:259

kaldi::nnet3::IndexVectorHasher
Definition: nnet-common.h:131

kaldi::discriminative::DiscriminativeSupervision::Write
void Write(std::ostream &os, bool binary) const
Definition: discriminative-supervision.cc:51

kaldi::ReadBasicType
void ReadBasicType(std::istream &is, bool binary, T *t)
ReadBasicType is the name of the read function for bool, integer types, and floating-point types...
Definition: io-funcs-inl.h:55

kaldi::nnet3::NnetDiscriminativeSupervision::name
std::string name
Definition: nnet-discriminative-example.h:45

kaldi::nnet3::Nnet::IsInputNode
bool IsInputNode(int32 node) const
Returns true if this is an input node, meaning that it is of type kInput.
Definition: nnet-nnet.cc:120

kaldi::nnet3::MergeSupervision
static void MergeSupervision(const std::vector< const NnetChainSupervision *> &inputs, NnetChainSupervision *output)
Definition: nnet-chain-example.cc:195

kaldi::nnet3::ExampleMergingConfig::MinibatchSize
int32 MinibatchSize(int32 size_of_eg, int32 num_available_egs, bool input_ended) const
This function tells you what minibatch size should be used for this eg.
Definition: nnet-example-utils.cc:1017

kaldi::TableWriter
A templated class for writing objects to an archive or script file; see The Table concept...
Definition: kaldi-table.h:368

kaldi::int32
kaldi::int32 int32
Definition: online-tcp-source.cc:27

kaldi::ReadToken
void ReadToken(std::istream &is, bool binary, std::string *str)
ReadToken gets the next token and puts it in str (exception on failure).
Definition: io-funcs.cc:154

kaldi::nnet3::ComputationRequest::inputs
std::vector< IoSpecification > inputs
Definition: nnet-computation.h:115

kaldi::discriminative::MergeSupervision
void MergeSupervision(const std::vector< const DiscriminativeSupervision *> &input, DiscriminativeSupervision *output_supervision)
This function appends a list of supervision objects to create what will usually be a single such obje...
Definition: discriminative-supervision.cc:402

kaldi::nnet3::NnetIo::indexes
std::vector< Index > indexes
"indexes" is a vector the same length as features.NumRows(), explaining the meaning of each row of th...
Definition: nnet-example.h:42

kaldi::nnet3::IoSpecification::name
std::string name
Definition: nnet-computation.h:73

kaldi::StringHasher
A hashing function object for strings.
Definition: stl-utils.h:248

kaldi::nnet3::NnetDiscriminativeExampleStructureCompare::operator()
bool operator()(const NnetDiscriminativeExample &a, const NnetDiscriminativeExample &b) const
Definition: nnet-discriminative-example.cc:410

kaldi::nnet3::DiscriminativeExampleMerger::eg_to_egs_
MapType eg_to_egs_
Definition: nnet-discriminative-example.h:267

kaldi::nnet3::NnetDiscriminativeExampleStructureHasher
This hashing object hashes just the structural aspects of the NnetExample without looking at the valu...
Definition: nnet-discriminative-example.h:136

kaldi::TableWriter::Write
void Write(const std::string &key, const T &value) const
Definition: kaldi-table-inl.h:1511

kaldi::nnet3::Index
struct Index is intended to represent the various indexes by which we number the rows of the matrices...
Definition: nnet-common.h:44

kaldi::nnet3::ExampleMergingConfig
Definition: nnet-example-utils.h:321

kaldi::discriminative::DiscriminativeSupervision::Swap
void Swap(DiscriminativeSupervision *other)
Definition: discriminative-supervision.cc:34

kaldi::nnet3::ExampleMergingStats::PrintStats
void PrintStats() const
Calling this will cause a log message with information about the examples to be printed.
Definition: nnet-example-utils.cc:1073

kaldi::nnet3::WriteVectorAsChar
void WriteVectorAsChar(std::ostream &os, bool binary, const VectorBase< BaseFloat > &vec)
Definition: nnet-example-utils.cc:237

kaldi::nnet3::ComputationRequest
Definition: nnet-computation.h:114

kaldi::nnet3::NnetDiscriminativeExample::Read
void Read(std::istream &is, bool binary)
Definition: nnet-discriminative-example.cc:150

kaldi::nnet3::DiscriminativeExampleMerger::WriteMinibatch
void WriteMinibatch(std::vector< NnetDiscriminativeExample > *egs)
Definition: nnet-discriminative-example.cc:483

kaldi::nnet3::NnetDiscriminativeSupervision::NnetDiscriminativeSupervision
NnetDiscriminativeSupervision()
Definition: nnet-discriminative-example.h:74

kaldi::nnet3::Nnet::IsOutputNode
bool IsOutputNode(int32 node) const
Returns true if this is an output node, meaning that it is of type kDescriptor and is not directly fo...
Definition: nnet-nnet.cc:112

kaldi::nnet3::ExpectToken
static void ExpectToken(const std::string &token, const std::string &what_we_are_parsing, const std::string **next_token)
Definition: nnet-descriptor.cc:45

kaldi::nnet3::NnetDiscriminativeExampleStructureHasher::operator()
size_t operator()(const NnetDiscriminativeExample &eg) const noexcept
Definition: nnet-discriminative-example.cc:393

kaldi::nnet3::NnetDiscriminativeExample::Compress
void Compress()
Definition: nnet-discriminative-example.cc:175

rnnlm::n
struct rnnlm::@11::@12 n

kaldi::nnet3::NnetDiscriminativeSupervision::Write
void Write(std::ostream &os, bool binary) const
Definition: nnet-discriminative-example.cc:28

kaldi::nnet3::Nnet
Definition: nnet-nnet.h:115

kaldi::discriminative::DiscriminativeSupervision::num_sequences
int32 num_sequences
Definition: discriminative-supervision.h:85

nnet-example-utils.h

kaldi::discriminative::DiscriminativeSupervision::Read
void Read(std::istream &is, bool binary)
Definition: discriminative-supervision.cc:75

kaldi::discriminative::DiscriminativeSupervision::frames_per_sequence
int32 frames_per_sequence
Definition: discriminative-supervision.h:91

KALDI_ERR
#define KALDI_ERR
Definition: kaldi-error.h:147

kaldi::WriteToken
void WriteToken(std::ostream &os, bool binary, const char *token)
The WriteToken functions are for writing nonempty sequences of non-space characters.
Definition: io-funcs.cc:134

kaldi::VectorBase::Dim
MatrixIndexT Dim() const
Returns the dimension of the vector.
Definition: kaldi-vector.h:64

kaldi::nnet3::NnetDiscriminativeSupervision::Swap
void Swap(NnetDiscriminativeSupervision *other)
Definition: nnet-discriminative-example.cc:115

kaldi::nnet3::ReadIndexVector
void ReadIndexVector(std::istream &is, bool binary, std::vector< Index > *vec)
Definition: nnet-common.cc:143

kaldi::nnet3::ExampleMergingStats::WroteExample
void WroteExample(int32 example_size, size_t structure_hash, int32 minibatch_size)
Users call this function to inform this class that one minibatch has been written aggregating 'miniba...
Definition: nnet-example-utils.cc:1051

kaldi::nnet3::IoSpecification
Definition: nnet-computation.h:72

kaldi::discriminative::DiscriminativeSupervision
Definition: discriminative-supervision.h:75

kaldi::nnet3::IoSpecification::has_deriv
bool has_deriv
Definition: nnet-computation.h:75

kaldi::nnet3::DiscriminativeExampleMerger::stats_
ExampleMergingStats stats_
Definition: nnet-discriminative-example.h:260

kaldi::nnet3::DiscriminativeExampleMerger::DiscriminativeExampleMerger
DiscriminativeExampleMerger(const ExampleMergingConfig &config, NnetDiscriminativeExampleWriter *writer)
Definition: nnet-discriminative-example.cc:446

kaldi::nnet3::DiscriminativeExampleMerger::finished_
bool finished_
Definition: nnet-discriminative-example.h:256

kaldi::nnet3::NnetDiscriminativeExample::NnetDiscriminativeExample
NnetDiscriminativeExample()
Definition: nnet-discriminative-example.h:123

rnnlm::i
int i
Definition: mikolov-rnnlm-lib.cc:66

nnet-discriminative-example.h

kaldi::nnet3::IoSpecification::indexes
std::vector< Index > indexes
Definition: nnet-computation.h:74

kaldi::nnet3::NnetDiscriminativeSupervision::indexes
std::vector< Index > indexes
Definition: nnet-discriminative-example.h:54

kaldi::Vector
A class representing a vector.
Definition: kaldi-vector.h:406

KALDI_ASSERT
#define KALDI_ASSERT(cond)
Definition: kaldi-error.h:185

kaldi::nnet3::NnetDiscriminativeExample::Swap
void Swap(NnetDiscriminativeExample *other)
Definition: nnet-discriminative-example.cc:170

kaldi::nnet3::ComputationRequest::outputs
std::vector< IoSpecification > outputs
Definition: nnet-computation.h:116

kaldi::nnet3::NnetIoStructureCompare
This comparison object compares just the structural aspects of the NnetIo object (name, indexes, feature dimension) without looking at the value of features.
Definition: nnet-example.h:101

kaldi::nnet3::NnetDiscriminativeSupervision::deriv_weights
Vector< BaseFloat > deriv_weights
Definition: nnet-discriminative-example.h:71

kaldi::nnet3::NnetDiscriminativeExample::inputs
std::vector< NnetIo > inputs
'inputs' contains the input to the network -- normally it has just one element called "input"...
Definition: nnet-discriminative-example.h:108

kaldi::nnet3::NnetDiscriminativeExample::outputs
std::vector< NnetDiscriminativeSupervision > outputs
'outputs' contains the sequence output supervision.
Definition: nnet-discriminative-example.h:112

kaldi::nnet3::NnetIoStructureHasher
This hashing object hashes just the structural aspects of the NnetIo object (name, indexes, feature dimension) without looking at the value of features.
Definition: nnet-example.h:94

kaldi::nnet3::ReadVectorAsChar
void ReadVectorAsChar(std::istream &is, bool binary, Vector< BaseFloat > *vec)
Definition: nnet-example-utils.cc:258

kaldi::nnet3::DiscriminativeExampleMerger::Finish
void Finish()
Definition: nnet-discriminative-example.cc:498

kaldi::nnet3::MergeDiscriminativeExamples
void MergeDiscriminativeExamples(bool compress, std::vector< NnetDiscriminativeExample > *input, NnetDiscriminativeExample *output)
Definition: nnet-discriminative-example.cc:247

kaldi::nnet3::GetNnetDiscriminativeExampleSize
int32 GetNnetDiscriminativeExampleSize(const NnetDiscriminativeExample &a)
Definition: nnet-discriminative-example.cc:430

kaldi::nnet3::GetDiscriminativeComputationRequest
void GetDiscriminativeComputationRequest(const Nnet &nnet, const NnetDiscriminativeExample &eg, bool need_model_derivative, bool store_component_stats, bool use_xent_regularization, bool use_xent_derivative, ComputationRequest *request)
This function takes a NnetDiscriminativeExample and produces a ComputationRequest.
Definition: nnet-discriminative-example.cc:284

kaldi::WriteBasicType
void WriteBasicType(std::ostream &os, bool binary, T t)
WriteBasicType is the name of the write function for bool, integer types, and floating-point types...
Definition: io-funcs-inl.h:34

kaldi::nnet3::NnetIo::name
std::string name
the name of the input in the neural net; in simple setups it will just be "input".
Definition: nnet-example.h:36

kaldi::nnet3::NnetDiscriminativeSupervision::operator==
bool operator==(const NnetDiscriminativeSupervision &other) const
Definition: nnet-discriminative-example.cc:39

kaldi::nnet3::DiscriminativeExampleMerger::config_
const ExampleMergingConfig & config_
Definition: nnet-discriminative-example.h:258

kaldi::nnet3::Nnet::GetNodeIndex
int32 GetNodeIndex(const std::string &node_name) const
returns index associated with this node name, or -1 if no such index.
Definition: nnet-nnet.cc:466

kaldi::VectorBase
Provides a vector abstraction class.
Definition: kaldi-vector.h:41

kaldi::nnet3::NnetDiscriminativeSupervision::supervision
discriminative::DiscriminativeSupervision supervision
Definition: nnet-discriminative-example.h:58

kaldi::nnet3::NnetExample::io
std::vector< NnetIo > io
"io" contains the input and output.
Definition: nnet-example.h:116

kaldi::nnet3::DiscriminativeExampleMerger::num_egs_written_
int32 num_egs_written_
Definition: nnet-discriminative-example.h:257

kaldi::nnet3::NnetDiscriminativeSupervision
Definition: nnet-discriminative-example.h:42

kaldi::nnet3::NnetDiscriminativeExample::Write
void Write(std::ostream &os, bool binary) const
Definition: nnet-discriminative-example.cc:125

kaldi::nnet3::NnetDiscriminativeExample
NnetDiscriminativeExample is like NnetExample, but specialized for sequence training.
Definition: nnet-discriminative-example.h:103

kaldi::RandInt
int32 RandInt(int32 min_val, int32 max_val, struct RandomState *state)
Definition: kaldi-math.cc:95

kaldi::nnet3::NnetDiscriminativeSupervision::Read
void Read(std::istream &is, bool binary)
Definition: nnet-discriminative-example.cc:45

kaldi::nnet3::MergeExamples
void MergeExamples(const std::vector< NnetExample > &src, bool compress, NnetExample *merged_eg)
Merge a set of input examples into a single example (typically the size of "src" will be the minibatc...
Definition: nnet-example-utils.cc:162