doc/nnet-computation-graph_8h_source.html

 // nnet3/nnet-computation-graph.h

 // Copyright 2015    Johns Hopkins University (author: Daniel Povey)

 // See ../../COPYING for clarification regarding multiple authors
 //
 // Licensed under the Apache License, Version 2.0 (the "License");
 // you may not use this file except in compliance with the License.
 // You may obtain a copy of the License at
 //
 //  http://www.apache.org/licenses/LICENSE-2.0
 //
 // THIS CODE IS PROVIDED *AS IS* BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY
 // KIND, EITHER EXPRESS OR IMPLIED, INCLUDING WITHOUT LIMITATION ANY IMPLIED
 // WARRANTIES OR CONDITIONS OF TITLE, FITNESS FOR A PARTICULAR PURPOSE,
 // MERCHANTABLITY OR NON-INFRINGEMENT.
 // See the Apache 2 License for the specific language governing permissions and
 // limitations under the License.

 #ifndef KALDI_NNET3_NNET_COMPUTATION_GRAPH_H_
 #define KALDI_NNET3_NNET_COMPUTATION_GRAPH_H_

 #include "nnet3/nnet-component-itf.h"
 #include "nnet3/nnet-nnet.h"
 #include "nnet3/nnet-computation.h"

 #include <iostream>
 #include <deque>

 namespace kaldi {
 namespace nnet3 {

 // The graph used in the first step of compilation: for each Cindex
 // (identified by an integer cindex_id) it stores the list of other Cindexes
 // that it depends on.
 struct ComputationGraph {

   // The mapping of cindex_id to Cindex.
   std::vector<Cindex> cindexes;

   // For each Cindex (indexed by cindex_id), tells us whether it was provided
   // as an input to the network.
   std::vector<bool> is_input;

   // dependencies[cindex_id] gives the list of other cindex_ids that this
   // particular cindex_id directly depends on.
   std::vector<std::vector<int32> > dependencies;

   // Only of particular interest in 'multi-segment' computations.
   // NOTE(review): presumably records, per segment, the cindex_id at which
   // that segment ends -- confirm against the .cc file.
   std::vector<int32> segment_ends;

   // Maps a Cindex to an integer cindex_id.
   // NOTE(review): presumably adds 'cindex' (recording 'is_input') when it is
   // not yet present, and reports via *is_new whether it was added -- confirm.
   int32 GetCindexId(const Cindex &cindex, bool is_input, bool *is_new);

   // Const version: maps a Cindex to its integer cindex_id without modifying
   // the graph.
   // NOTE(review): the value returned for an absent Cindex is not visible
   // here (presumably -1) -- confirm.
   int32 GetCindexId(const Cindex &cindex) const;

   // Renumbers the cindex_ids (but only those with index c >=
   // start_cindex_id), keeping only those for which
   // keep[c - start_cindex_id] is true.
   void Renumber(int32 start_cindex_id,
                 const std::vector<bool> &keep);


   // Useful for debugging/visualization purposes: prints a summary of the
   // computation graph to 'os'.
   // NOTE(review): 'node_names' is presumably indexed by network-node index
   // -- confirm.
   void Print(std::ostream &os, const std::vector<std::string> &node_names);

  private:
   // Maps each Cindex to an integer cindex_id: the reverse mapping of
   // "cindexes".
   unordered_map<Cindex, int32, CindexHasher> cindex_to_cindex_id_;
 };


 // Builds a ComputationGraph for a ComputationRequest: Compute() populates the
 // graph and works out which cindex_ids are computable, and Prune() then
 // removes the cindex_ids that are not used.
 class ComputationGraphBuilder {
  public:
   // 'graph' is the graph that this class populates.
   // NOTE(review): 'nnet' is held by reference and 'graph' by pointer (see
   // nnet_ and graph_), so both presumably must outlive this object --
   // confirm.
   ComputationGraphBuilder(const Nnet &nnet,
                           ComputationGraph *graph);

   // Does the initial computation (populating the graph and computing whether
   // each required cindex_id is computable), without the pruning.  In the normal
   // case you call this just once with one 'request', but in the 'online' case
   // you call Compute() [then maybe check AllOutputsAreComputable()] then
   // Prune() multiple times, with a sequence of different requests for
   // increasing time values.
   // Note: it sets the class member request_ to the address of 'request', so
   // you should not let 'request' go out of scope while this class might
   // still use it (e.g. until you call Compute() with a different request).
   void Compute(const ComputationRequest &request);

   // Returns true if all requested outputs are computable.  To be called after
   // Compute() but before Prune().
   bool AllOutputsAreComputable() const;

   // Prints logging info to explain why all outputs are not computable.
   // To be called only if AllOutputsAreComputable() returned false.
   void ExplainWhyAllOutputsNotComputable() const;

   // This function outputs to "computable" information about whether each
   // requested element of each output was computable.  "computable" will have
   // the same size as request_->outputs, and each element will have the same
   // size as request_->outputs[i].indexes.size().  May only be called after
   // Compute() but before Prune().  If you have already called Prune(), you can
   // just assume everything was computable, or else Prune() would have crashed.
   void GetComputableInfo(std::vector<std::vector<bool> > *computable) const;

   // To be called after Compute(), this prunes away unused cindex_ids.
   // If not all the outputs are computable, this will die;
   // you can check the return status of AllOutputsAreComputable() first if
   // you want to avoid this.
   void Prune();

   // This enum says for each cindex_id, whether we can compute it from the given
   // inputs or not.  Note that there may be situations where before adding
   // dependencies of a particular cindex_id we realize that we won't be able to
   // use this cindex_id (i.e. it may be computable but it's not used) because
   // its usable_count is zero, and in those cases we change the status to
   // kWillNotCompute even though the cindex-id may be computable.  For most
   // purposes this status is treated the same as kNotComputable.
   enum ComputableInfo {
     kUnknown = 0,
     kComputable = 1,
     kNotComputable = 2,
     kWillNotCompute = 3
   };

   // Per-cindex_id bookkeeping used while building the graph; see
   // cindex_info_, which holds one of these for each cindex_id.
   struct CindexInfo {
     // One of kUnknown, kComputable, kNotComputable or kWillNotCompute.
     ComputableInfo computable;
     // The usable_count of a cindex_id i is defined as 1 if i is a requested
     // output, and otherwise as the number of other cindex_ids j such that
     // cindex_info_[j].computable is not kNotComputable AND
     // cindex_info_[j].usable_count > 0 AND i is a member of
     // graph->dependencies[j].  A cindex_id is termed "usable" (meaning it
     // could potentially participate in the computation of the output) if its
     // usable_count is > 0.  This quantity is designed to be easy to keep
     // updated as we add cindex_ids.
     int32 usable_count;

     // True if in current_queue_ or next_queue_.
     bool queued;

     // True if we have created the cindexes that this cindex depends on.
     bool dependencies_computed;

     CindexInfo(const CindexInfo &other) = default;
     // Default state: status unknown, not usable, not queued, and with
     // dependencies not yet computed.
     CindexInfo(): computable(kUnknown),
                   usable_count(0),
                   queued(false),
                   dependencies_computed(false) { }
   };

  private:
   // This function, called from ExplainWhyNotComputable(), prints to "os"
   // a human-readable form of a given cindex_id, that looks like
   // some_network_node(n, t, x), e.g. "final_logsoftmax(0, -4, 0)".
   void PrintCindexId(std::ostream &os, int32 cindex_id) const;

   // This function, typically to be called just before dying, prints logging
   // information to explain why the given cindex_id is not computable.
   void ExplainWhyNotComputable(int32 cindex_id) const;

   // Called at the start of Compute(), this populates the graph (and member
   // variables) for all the inputs specified in the computation request.
   void AddInputs();

   // Called at the start of Compute(), this populates the graph (and member
   // variables, including current_queue_) with all the outputs specified in the
   // computation request.
   void AddOutputs();

   // This does one iteration of building the graph, and increases
   // current_distance_ by one, i.e. it searches at one more remove from
   // the output.
   void BuildGraphOneIter();

   // (Called from BuildGraphOneIter()); makes sure the computable status for
   // cindex_id is up to date.  Has side effects: may update usable_count
   // values and add things to next_queue_.
   void UpdateComputableInfo(int32 cindex_id);

   // (Called from BuildGraphOneIter()), this function sets the cindex_id to
   // status kWillNotCompute and places members of depend_on_this_ into the
   // computable queue if needed.
   void SetAsWillNotCompute(int32 cindex_id);

   // Computes and returns the ComputableInfo for this cindex_id (kUnknown,
   // kComputable or kNotComputable).
   ComputableInfo ComputeComputableInfo(int32 cindex_id) const;

   // To be called when this cindex_id has just been newly added to graph_, this
   // function adds a couple default variables associated with it, to *this.
   inline void AddCindexId(int32 cindex_id);

   // Adds the cindex_ids that this cindex_id depends on.
   void AddDependencies(int32 cindex_id);

   // Increments the usable_count of this cindex_id.
   void IncrementUsableCount(int32 cindex_id);

   // Decrements the usable_count of this cindex_id.
   void DecrementUsableCount(int32 cindex_id);

   // This function, called from Prune(), modifies the members of
   // graph_->dependencies-- it removes those cindexes that are not used in the
   // computation for the current cindex_id.  This will only do something
   // interesting in cases where there are optional dependencies.
   // It also clears the dependencies of those cindexes that are not computable.
   void PruneDependencies(int32 cindex_id);

   // This function, called from Prune(), computes an array "required", with an
   // element for each cindex_id that says whether it is required to compute the
   // requested outputs.  This is similar in function to the usable_count
   // values, but it's more exact because it's computed after we have done
   // PruneDependencies() to remove unused dependencies, so it will only say
   // something is required if it is really accessed in the computation.
   // We'll later use this to remove unnecessary cindexes.
   // 'start_cindex_id' is the cindex_id from which the 'required' array is
   // to start (normally zero, but may be nonzero in multi-segment computations);
   // so 'required' is indexed by cindex_id - start_cindex_id.
   void ComputeRequiredArray(int32 start_cindex_id,
                             std::vector<bool> *required) const;

   // This function, to be called from Compute(), does some sanity checks to
   // verify that the internal state is consistent.  It only does this for the
   // current 'segment' of the computation, starting from 'start_cindex_id' (this
   // will be 0 in normal, single-segment computations).
   void Check(int32 start_cindex_id) const;

   // The network the graph is being built for.
   const Nnet &nnet_;
   // The request most recently passed to Compute(); not owned (see the note
   // on Compute() about its lifetime).
   const ComputationRequest *request_;
   // The graph being populated; passed in to the constructor.
   ComputationGraph *graph_;

   // This is the transpose of graph_->dependencies; it tells us
   // for each cindex_id, which other cindex_ids depend on it.
   std::vector<std::vector<int32> > depend_on_this_;


   // This vector is indexed by cindex_id.
   std::vector<CindexInfo> cindex_info_;

   // current_distance_ >= 0 is the distance to the output, of the cindex_ids in
   // current_queue_.
   int32 current_distance_;
   // The cindex_ids in current_queue_ are at no more than distance
   // current_distance_ to the output.
   std::vector<int32> current_queue_;
   // The cindex_ids in next_queue_ are at no more than distance
   // current_distance_ + 1 to the output.
   std::vector<int32> next_queue_;
 };

 // Stream-output operator for ComputationGraphBuilder::ComputableInfo; writes
 // 'info' to 'os' and returns the stream.
 // NOTE(review): the exact text printed for each enum value is defined in the
 // .cc file and is not visible here.
 std::ostream& operator << (std::ostream &os,
                            const ComputationGraphBuilder::ComputableInfo &info);


 // A function object over Cindexes, backed by a ComputationGraph and,
 // optionally, per-cindex_id computability info.
 // NOTE(review): presumably an abstract representation of a set of Cindexes,
 // analogous to IndexSet -- confirm against the original header comments.
 class CindexSet {
  public:
   // NOTE(review): presumably returns true if 'cindex' is a member of the
   // set -- confirm against the .cc file.
   bool operator () (const Cindex &cindex) const;

   // Constructs the set from the graph alone, with no computability info.
   // NOTE(review): presumably every Cindex present in 'graph' is then
   // treated as a member -- confirm.
   CindexSet(const ComputationGraph &graph);

   // Constructs the set from the graph plus per-cindex_id info.
   // NOTE(review): presumably membership then depends on the 'computable'
   // status in 'info', with kUnknown counted as computable iff
   // 'treat_unknown_as_computable' is true -- confirm.
   CindexSet(const ComputationGraph &graph,
             const std::vector<ComputationGraphBuilder::CindexInfo> &info,
             bool treat_unknown_as_computable);
  private:
   const ComputationGraph &graph_;
   // Held as a pointer rather than a reference because one of the
   // constructors takes no 'info' argument.
   const std::vector<ComputationGraphBuilder::CindexInfo> *info_;
   bool treat_unknown_as_computable_;
 };


 // An abstract representation of a set of Indexes.
 class IndexSet {
  public:
   // NOTE(review): presumably returns true if 'index' is a member of the
   // set, i.e. if the Cindex (node_id_, index) is in the graph and counts as
   // computable according to 'info' -- confirm against the .cc file.
   bool operator () (const Index &index) const;

   // 'node_id' is the network node whose Indexes this set describes.
   // NOTE(review): presumably kUnknown entries in 'info' count as members
   // iff 'treat_unknown_as_computable' is true -- confirm.  'graph' and
   // 'info' are held by reference, so they must outlive this object.
   IndexSet(const ComputationGraph &graph,
            const std::vector<ComputationGraphBuilder::CindexInfo> &info,
            int32 node_id,
            bool treat_unknown_as_computable);
  private:
   const ComputationGraph &graph_;
   const std::vector<ComputationGraphBuilder::CindexInfo> &info_;
   int32 node_id_;
   bool treat_unknown_as_computable_;
 };


 // Divides a computation into 'phases', where a 'phase' is a collection of
 // cindexes, and writes the result to 'phases_per_segment'.
 // NOTE(review): the output is presumably indexed first by segment, then by
 // phase, with each phase being a list of cindex_ids -- confirm against the
 // .cc file.
 void ComputeComputationPhases(
     const Nnet &nnet,
     const ComputationGraph &computation_graph,
     std::vector<std::vector<std::vector<int32> > > *phases_per_segment);


 // This class arranges the cindex_ids of the computation into a sequence of
 // lists called "steps".
 class ComputationStepsComputer {
  public:
   // 'steps' and 'locations' are outputs that this class fills in (see the
   // members steps_ and locations_).  All four arguments are held by
   // reference or pointer, so they must outlive this object.
   ComputationStepsComputer(const Nnet &nnet,
                            ComputationGraph *graph,
                            std::vector<std::vector<int32> > *steps,
                            std::vector<std::pair<int32, int32> > *locations);

   // NOTE(review): presumably creates the steps for one segment of the
   // computation, given that segment's request and its phases (each phase a
   // list of cindex_ids) -- confirm against the .cc file.
   void ComputeForSegment(const ComputationRequest &request,
                          const std::vector<std::vector<int32> > &phases);

   // NOTE(review): presumably a sanity check on the computed steps and
   // locations -- confirm against the .cc file.
   void Check() const;
  private:

   // Adds step(s) for one "sub-phase".  A sub-phase is the set of cindex_ids from
   // one phase that have the same node index.  Note: for nodes that are
   // component-input descriptors, we don't actually create the step here, we
   // create it just before creating the step for its component, and we recreate
   // the list of cindexes from those from the component.  The reason is that
   // there are situations where doing it directly from the raw_step would not do
   // the right thing (especially with non-simple components, it's possible that
   // the cindexes component-input descriptors could be used twice by two
   // different components).
   void ProcessSubPhase(const ComputationRequest &request,
                        const std::vector<Cindex> &sub_phase);

   // Called from ProcessSubPhase- for the case where it's a DimRangeNode.
   void ProcessDimRangeSubPhase(const std::vector<Cindex> &sub_phase);

   // Called from ProcessSubPhase- for the case where it's an input or output node.
   void ProcessInputOrOutputStep(const ComputationRequest &request,
                                 bool is_output,
                                 const std::vector<Cindex> &sub_phase);

   // Called from ProcessSubPhase- for the case where it's a component node.
   void ProcessComponentStep(const std::vector<Cindex> &step);


   // Splits a phase up into multiple "sub-phases", which are just the cindexes
   // from a phase that are from a single node, sorted.  At this point we
   // represent them as Cindexes, not cindex_ids.  For efficiency and because it
   // would be discarded anyway, it discards any raw steps that correspond to
   // component-input descriptors because these are not processed inside
   // ProcessSubPhase().
   void SplitIntoSubPhases(const std::vector<int32> &phase,
                           std::vector<std::vector<Cindex> > *sub_phase) const;

   // This low-level function used by functions like ProcessComponentStep,
   // ProcessInputOrOutputStep and so on, adds one step to 'steps_' (converting
   // from Cindex to cindex_ids), and updates 'locations_' appropriately.  It
   // returns the step index that we just added (== size of steps_ at entry).
   // If you specify add_if_absent = true, it will add any Cindexes that were
   // not already present, to the graph.  [This option is only to be used
   // in processing dim-range nodes.]
   int32 AddStep(const std::vector<Cindex> &cindexes,
                 bool add_if_absent = false);

   // This is an alternative interface to AddStep() that takes a list of
   // cindex_ids instead of cindexes (it's destructive of that list).
   int32 AddStep(std::vector<int32> *cindex_ids);


   // This utility function uses graph_ to convert a vector of cindex_ids into
   // Cindexes.
   void ConvertToCindexes(const std::vector<int32> &cindex_ids,
                          std::vector<Cindex> *cindexes) const;

   // Converts a vector of Cindexes to a vector of Indexes, by
   // stripping out the node index.
   static void ConvertToIndexes(const std::vector<Cindex> &cindexes,
                                std::vector<Index> *indexes);

   // Converts a vector of Indexes to Cindexes, using a supplied
   // node index.
   static void ConvertToCindexes(const std::vector<Index> &indexes,
                                 int32 node_index,
                                 std::vector<Cindex> *cindexes);


   // This utility function uses graph_ to convert a vector of Cindexes into
   // cindex_ids.  It will crash if the cindexes were not present in the graph.
   void ConvertToCindexIds(const std::vector<Cindex> &cindexes,
                           std::vector<int32> *cindex_ids) const;

   // This utility function uses the 'locations_' array to convert the cindex_ids
   // in 'cindex_ids' into an array (of the same length) of locations, i.e. of
   // pairs (step, index-into-step), so that if cindex_ids[i] = c, then
   // (*locations)[i] will be set to (*locations_)[c].  It will die if
   // one of the locations was not defined, i.e. was the pair (-1, -1).
   void ConvertToLocations(
       const std::vector<int32> &cindex_ids,
       std::vector<std::pair<int32, int32> > *locations) const;


   // The network the steps are being computed for.
   const Nnet &nnet_;
   // The computation graph; non-const because AddStep() may add Cindexes to
   // it (see add_if_absent).
   ComputationGraph *graph_;
   // steps_ is a pointer to an output that's passed in to the constructor.
   std::vector<std::vector<int32> > *steps_;
   // locations_ is a map from cindex_id to the pair of indexes into steps_
   // where that cindex_id resides, i.e. (step, index-into-step); an undefined
   // location is the pair (-1, -1).
   std::vector<std::pair<int32, int32> > *locations_;


   // dim_range_nodes_ is used when allocating steps for nodes of type
   // kDimRangeNode.
   // NOTE(review): the meaning of the two int32s in each pair is not visible
   // here -- confirm against the .cc file.
   std::unordered_set<std::pair<int32, int32>, PairHasher<int32> > dim_range_nodes_;
 };


 } // namespace nnet3
 } // namespace kaldi


 #endif
kaldi
This code computes Goodness of Pronunciation (GOP) and extracts phone-level pronunciation feature for...
Definition: chain.dox:20

kaldi::nnet3::ComputationStepsComputer::graph_
ComputationGraph * graph_
Definition: nnet-computation-graph.h:543

nnet-nnet.h

nnet-component-itf.h

kaldi::nnet3::ComputationGraphBuilder::graph_
ComputationGraph * graph_
Definition: nnet-computation-graph.h:271

kaldi::nnet3::ConvertToIndexes
bool ConvertToIndexes(const std::vector< std::pair< int32, int32 > > &location_vector, int32 *first_value, std::vector< int32 > *second_values)
If it is the case for some i >= 0 that all the .first elements of "location_vector" are either i or -...
Definition: nnet-compile-utils.cc:190

kaldi::nnet3::IndexSet::treat_unknown_as_computable_
bool treat_unknown_as_computable_
Definition: nnet-computation-graph.h:340

kaldi::nnet3::IndexSet
An abstract representation of a set of Indexes.
Definition: nnet-computation-graph.h:322

kaldi::nnet3::ComputationStepsComputer::locations_
std::vector< std::pair< int32, int32 > > * locations_
locations_ is a map from cindex_id to the pair of indexes into steps_ where that cindex_id resides...
Definition: nnet-computation-graph.h:550

kaldi::nnet3::CindexSet::info_
const std::vector< ComputationGraphBuilder::CindexInfo > * info_
Definition: nnet-computation-graph.h:316

kaldi::int32
kaldi::int32 int32
Definition: online-tcp-source.cc:27

kaldi::nnet3::operator<<
std::ostream & operator<<(std::ostream &ostream, const Index &index)
Definition: nnet-common.cc:424

kaldi::nnet3::ComputationGraphBuilder::ComputableInfo
ComputableInfo
Definition: nnet-computation-graph.h:162

kaldi::nnet3::CindexSet::treat_unknown_as_computable_
bool treat_unknown_as_computable_
Definition: nnet-computation-graph.h:317

kaldi::nnet3::IndexSet::node_id_
int32 node_id_
Definition: nnet-computation-graph.h:339

kaldi::nnet3::Index
struct Index is intended to represent the various indexes by which we number the rows of the matrices...
Definition: nnet-common.h:44

kaldi::nnet3::ComputationGraphBuilder::current_distance_
int32 current_distance_
Definition: nnet-computation-graph.h:283

nnet-computation.h
The two main classes defined in this header are struct ComputationRequest, which basically defines a ...

kaldi::nnet3::ComputationGraphBuilder::CindexInfo::CindexInfo
CindexInfo()
Definition: nnet-computation-graph.h:186

kaldi::nnet3::IndexSet::graph_
const ComputationGraph & graph_
Definition: nnet-computation-graph.h:337

kaldi::nnet3::Cindex
std::pair< int32, Index > Cindex
Definition: nnet-common.h:115

kaldi::nnet3::ComputationGraph::cindexes
std::vector< Cindex > cindexes
The mapping of cindex_id to Cindex.
Definition: nnet-computation-graph.h:46

kaldi::nnet3::ComputationRequest
Definition: nnet-computation.h:114

kaldi::nnet3::CindexSet
Definition: nnet-computation-graph.h:297

kaldi::nnet3::ComputationGraph::dependencies
std::vector< std::vector< int32 > > dependencies
dependencies[cindex_id] gives you the list of other cindex_ids that this particular cindex_id directl...
Definition: nnet-computation-graph.h:63

kaldi::nnet3::ComputationGraphBuilder::CindexInfo::dependencies_computed
bool dependencies_computed
Definition: nnet-computation-graph.h:183

kaldi::nnet3::ComputationGraph::GetCindexId
int32 GetCindexId(const Cindex &cindex, bool is_input, bool *is_new)
Maps a Cindex to an integer cindex_id.
Definition: nnet-computation-graph.cc:28

kaldi::nnet3::ComputationGraph::cindex_to_cindex_id_
unordered_map< Cindex, int32, CindexHasher > cindex_to_cindex_id_
Maps each Cindex to an integer cindex_id: reverse mapping of "cindexes".
Definition: nnet-computation-graph.h:111

kaldi::nnet3::ComputeComputationPhases
void ComputeComputationPhases(const Nnet &nnet, const ComputationGraph &graph, std::vector< std::vector< std::vector< int32 > > > *phases_per_segment)
This function divides a computation into 'phases', where a 'phase' is a collection of cindexes which ...
Definition: nnet-computation-graph.cc:1406

kaldi::nnet3::ComputationGraphBuilder::CindexInfo::queued
bool queued
Definition: nnet-computation-graph.h:180

kaldi::nnet3::ComputationGraphBuilder::cindex_info_
std::vector< CindexInfo > cindex_info_
Definition: nnet-computation-graph.h:279

kaldi::nnet3::ComputationGraph::is_input
std::vector< bool > is_input
For each Cindex this tells us whether it was provided as an input to the network. ...
Definition: nnet-computation-graph.h:55

kaldi::nnet3::ComputationGraphBuilder::depend_on_this_
std::vector< std::vector< int32 > > depend_on_this_
Definition: nnet-computation-graph.h:275

kaldi::nnet3::ComputationGraph::segment_ends
std::vector< int32 > segment_ends
This variable is only of particular interest in a 'multi-segment' computation, which is used while cr...
Definition: nnet-computation-graph.h:80

kaldi::nnet3::Nnet
Definition: nnet-nnet.h:115

kaldi::nnet3::ComputationStepsComputer::steps_
std::vector< std::vector< int32 > > * steps_
steps_ is a pointer to an output that's passed in to the constructor.
Definition: nnet-computation-graph.h:545

kaldi::nnet3::ComputationGraphBuilder::CindexInfo::usable_count
int32 usable_count
Definition: nnet-computation-graph.h:171

kaldi::nnet3::ComputationGraphBuilder::nnet_
const Nnet & nnet_
Definition: nnet-computation-graph.h:269

kaldi::nnet3::ComputationGraphBuilder::CindexInfo
Definition: nnet-computation-graph.h:169

kaldi::nnet3::ComputationGraph::Renumber
void Renumber(int32 start_cindex_id, const std::vector< bool > &keep)
This function renumbers the cindex-ids (but only those with index c >= start_cindex_id), keeping only those for which keep[c - start_cindex_id] is true.
Definition: nnet-computation-graph.cc:57

kaldi::nnet3::ComputationGraphBuilder::current_queue_
std::vector< int32 > current_queue_
Definition: nnet-computation-graph.h:286

kaldi::nnet3::ComputationGraphBuilder::CindexInfo::computable
ComputableInfo computable
Definition: nnet-computation-graph.h:170

kaldi::nnet3::ComputationStepsComputer::dim_range_nodes_
std::unordered_set< std::pair< int32, int32 >, PairHasher< int32 > > dim_range_nodes_
dim_range_nodes_ is used when allocating steps for nodes of type kDimRangeNode.
Definition: nnet-computation-graph.h:559

kaldi::nnet3::IndexSet::info_
const std::vector< ComputationGraphBuilder::CindexInfo > & info_
Definition: nnet-computation-graph.h:338

kaldi::nnet3::CindexSet::graph_
const ComputationGraph & graph_
Definition: nnet-computation-graph.h:315

kaldi::nnet3::ComputationStepsComputer
This class arranges the cindex_ids of the computation into a sequence of lists called "steps"...
Definition: nnet-computation-graph.h:415

kaldi::nnet3::ComputationGraph::Print
void Print(std::ostream &os, const std::vector< std::string > &node_names)
This function, useful for debugging/visualization purposes, prints out a summary of the computation g...
Definition: nnet-computation-graph.cc:176

kaldi::nnet3::ComputationGraphBuilder::request_
const ComputationRequest * request_
Definition: nnet-computation-graph.h:270

kaldi::nnet3::ComputationGraph
The first step in compilation is to turn the ComputationSpecification into a ComputationGraph, where for each Cindex we have a list of other Cindexes that it depends on.
Definition: nnet-computation-graph.h:43

kaldi::nnet3::ComputationGraphBuilder
Builds a ComputationGraph from a ComputationRequest: works out which cindex_ids are computable and prunes away the unused ones.
Definition: nnet-computation-graph.h:117

kaldi::nnet3::ComputationStepsComputer::nnet_
const Nnet & nnet_
Definition: nnet-computation-graph.h:542

kaldi::PairHasher
A hashing function-object for pairs of ints.
Definition: stl-utils.h:235

kaldi::nnet3::ComputationGraphBuilder::next_queue_
std::vector< int32 > next_queue_
Definition: nnet-computation-graph.h:289