doc/faster-decoder_8h_source.html

 // decoder/faster-decoder.h

 // Copyright 2009-2011  Microsoft Corporation
 //                2013  Johns Hopkins University (author: Daniel Povey)

 // See ../../COPYING for clarification regarding multiple authors
 //
 // Licensed under the Apache License, Version 2.0 (the "License");
 // you may not use this file except in compliance with the License.
 // You may obtain a copy of the License at
 //
 //  http://www.apache.org/licenses/LICENSE-2.0
 //
 // THIS CODE IS PROVIDED *AS IS* BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY
 // KIND, EITHER EXPRESS OR IMPLIED, INCLUDING WITHOUT LIMITATION ANY IMPLIED
 // WARRANTIES OR CONDITIONS OF TITLE, FITNESS FOR A PARTICULAR PURPOSE,
 // MERCHANTABLITY OR NON-INFRINGEMENT.
 // See the Apache 2 License for the specific language governing permissions and
 // limitations under the License.

 #ifndef KALDI_DECODER_FASTER_DECODER_H_
 #define KALDI_DECODER_FASTER_DECODER_H_

 #include "util/stl-utils.h"
 #include "itf/options-itf.h"
 #include "util/hash-list.h"
 #include "fst/fstlib.h"
 #include "itf/decodable-itf.h"
 #include "lat/kaldi-lattice.h" // for CompactLatticeArc

 namespace kaldi {

 // Configuration values for FasterDecoder.  Each field is exposed as a
 // command-line style option through Register().
 struct FasterDecoderOptions {
   BaseFloat beam;        // option "beam"
   int32 max_active;      // option "max-active"
   int32 min_active;      // option "min-active"
   BaseFloat beam_delta;  // option "beam-delta" (registered only if full)
   BaseFloat hash_ratio;  // option "hash-ratio" (registered only if full)

   // Defaults: max_active is effectively unlimited, while min_active is kept
   // small because this decoder is mostly used for alignment.
   FasterDecoderOptions()
       : beam(16.0),
         max_active(std::numeric_limits<int32>::max()),
         min_active(20),
         beam_delta(0.5),
         hash_ratio(2.0) { }

   // Registers the options with `opts`.  The three main options are always
   // registered; the two obscure ones are added only when `full` is true.
   void Register(OptionsItf *opts, bool full) {
     opts->Register("beam", &beam,
                    "Decoding beam.  Larger->slower, more accurate.");
     opts->Register("max-active", &max_active,
                    "Decoder max active states.  Larger->slower; more accurate");
     opts->Register("min-active", &min_active,
                    "Decoder min active states (don't prune if #active less than this).");

     if (!full) return;  // caller asked for the basic option set only.

     opts->Register("beam-delta", &beam_delta,
                    "Increment used in decoder [obscure setting]");
     opts->Register("hash-ratio", &hash_ratio,
                    "Setting used in decoder to control hash behavior");
   }
 };

 // Decoder that operates on a graph of type fst::Fst<fst::StdArc>.  Only the
 // interface and the Token bookkeeping are defined in this header; the decoding
 // routines themselves are declared here and defined elsewhere.
 class FasterDecoder {
  public:
   typedef fst::StdArc Arc;
   typedef Arc::Label Label;
   typedef Arc::StateId StateId;
   typedef Arc::Weight Weight;

   // NOTE(review): the graph is held by reference in fst_, so presumably `fst`
   // must outlive this object -- confirm against the constructor definition.
   FasterDecoder(const fst::Fst<fst::StdArc> &fst,
                 const FasterDecoderOptions &config);

   // Replaces the stored options with a copy of `config`.
   void SetOptions(const FasterDecoderOptions &config) { config_ = config; }

   // Empties the hash and hands the resulting list to ClearToks(); see the
   // comment on ClearToks() below for why both steps are needed.
   ~FasterDecoder() { ClearToks(toks_.Clear()); }

   // NOTE(review): defined out of line; presumably decodes all frames that
   // `decodable` provides -- confirm in the implementation file.
   void Decode(DecodableInterface *decodable);

   // NOTE(review): defined out of line; presumably reports whether a final
   // state of the graph was reached -- confirm in the implementation file.
   bool ReachedFinal() const;

   // NOTE(review): defined out of line; presumably writes the best path into
   // `fst_out`, with `use_final_probs` controlling whether final-probs are
   // taken into account -- confirm in the implementation file.
   bool GetBestPath(fst::MutableFst<LatticeArc> *fst_out,
                    bool use_final_probs = true);

   // NOTE(review): defined out of line; presumably resets the decoder state so
   // that AdvanceDecoding() can be called -- confirm in the implementation file.
   void InitDecoding();


   // NOTE(review): defined out of line; the default of -1 for `max_num_frames`
   // presumably means "no limit" -- confirm in the implementation file.
   void AdvanceDecoding(DecodableInterface *decodable,
                        int32 max_num_frames = -1);

   // Returns the number of frames already decoded.
   int32 NumFramesDecoded() const { return num_frames_decoded_; }

  protected:

   // A reference-counted node in a backward-linked chain of tokens.  Each token
   // points at its predecessor via prev_ and holds one reference on it.
   class Token {
    public:
     Arc arc_; // contains only the graph part of the cost;
     // we can work out the acoustic part from difference between
     // "cost_" and prev->cost_.
     Token *prev_;
     int32 ref_count_;
     // if you are looking for weight_ here, it was removed and now we just have
     // cost_, which corresponds to ConvertToCost(weight_).
     double cost_;

     // Creates a token with reference count 1.  If `prev` is non-NULL its
     // reference count is incremented and its cost is added in, so that
     // cost_ = prev->cost_ + arc.weight.Value() + ac_cost.
     inline Token(const Arc &arc, BaseFloat ac_cost, Token *prev):
         arc_(arc), prev_(prev), ref_count_(1) {
       if (prev) {
         prev->ref_count_++;
         cost_ = prev->cost_ + arc.weight.Value() + ac_cost;
       } else {
         cost_ = arc.weight.Value() + ac_cost;
       }
     }

     // Same as the constructor above, but with no acoustic cost term.
     inline Token(const Arc &arc, Token *prev):
         arc_(arc), prev_(prev), ref_count_(1) {
       if (prev) {
         prev->ref_count_++;
         cost_ = prev->cost_ + arc.weight.Value();
       } else {
         cost_ = arc.weight.Value();
       }
     }

     // Note the inverted sense: a token compares "less" when its cost is
     // HIGHER than the other's.  Declared const because it only reads cost_,
     // which lets it be used on const Tokens.
     inline bool operator < (const Token &other) const {
       return cost_ > other.cost_;
     }

     // Drops one reference from `tok`.  Whenever a reference count reaches
     // zero the token is deleted and the reference it held on its predecessor
     // is dropped in turn; the walk stops at the first token that is still
     // referenced, or once the token with no predecessor has been deleted.
     // `tok` must not be NULL (it is dereferenced unconditionally).
     inline static void TokenDelete(Token *tok) {
       while (--tok->ref_count_ == 0) {
         Token *prev = tok->prev_;
         delete tok;
         if (prev == NULL) return;
         else tok = prev;
       }
 #ifdef KALDI_PARANOID
       KALDI_ASSERT(tok->ref_count_ > 0);
 #endif
     }
   };
   typedef HashList<StateId, Token*>::Elem Elem;


   // NOTE(review): defined out of line; the pointer arguments look like
   // outputs (token count, adaptive beam, best element) -- confirm in the
   // implementation file.
   double GetCutoff(Elem *list_head, size_t *tok_count,
                    BaseFloat *adaptive_beam, Elem **best_elem);

   // NOTE(review): defined out of line; presumably resizes the hash in toks_
   // based on `num_toks` and config_.hash_ratio -- confirm in the
   // implementation file.
   void PossiblyResizeHash(size_t num_toks);

   // ProcessEmitting returns the likelihood cutoff used.
   // It decodes the frame num_frames_decoded_ of the decodable object
   // and then increments num_frames_decoded_
   double ProcessEmitting(DecodableInterface *decodable);

   // TODO: first time we go through this, could avoid using the queue.
   void ProcessNonemitting(double cutoff);

   // HashList defined in ../util/hash-list.h.  It actually allows us to maintain
   // more than one list (e.g. for current and previous frames), but only one of
   // them at a time can be indexed by StateId.
   HashList<StateId, Token*> toks_;
   const fst::Fst<fst::StdArc> &fst_;
   FasterDecoderOptions config_;
   // Scratch buffers, kept as class members to avoid internal new/delete:
   // queue_ is a temp variable used in ProcessNonemitting, and tmp_array_ is
   // used in GetCutoff.
   std::vector<const Elem* > queue_;
   std::vector<BaseFloat> tmp_array_;

   // Keep track of the number of frames decoded in the current file.
   int32 num_frames_decoded_;

   // It might seem unclear why we call ClearToks(toks_.Clear()).
   // There are two separate cleanup tasks we need to do when we start a new
   // file: one is to delete the Token objects in the list; the other is to
   // delete the Elem objects.  toks_.Clear() just clears them from the hash and
   // gives ownership to the caller, who then has to call toks_.Delete(e) for
   // each one.  It was designed this way for convenience in propagating tokens
   // from one frame to the next.
   void ClearToks(Elem *list);

   KALDI_DISALLOW_COPY_AND_ASSIGN(FasterDecoder);
 };


 } // end namespace kaldi.


 #endif
kaldi::FasterDecoderOptions::beam
BaseFloat beam
Definition: faster-decoder.h:34

fst::StateId
fst::StdArc::StateId StateId
Definition: deterministic-fst-test.cc:58

kaldi
This code computes Goodness of Pronunciation (GOP) and extracts phone-level pronunciation feature for...
Definition: chain.dox:20

kaldi::FasterDecoderOptions::min_active
int32 min_active
Definition: faster-decoder.h:36

stl-utils.h

kaldi::FasterDecoder::Label
Arc::Label Label
Definition: faster-decoder.h:65

kaldi::FasterDecoder::Token::Token
Token(const Arc &arc, BaseFloat ac_cost, Token *prev)
Definition: faster-decoder.h:116

kaldi::DecodableInterface
DecodableInterface provides a link between the (acoustic-modeling and feature-processing) code and th...
Definition: decodable-itf.h:82

kaldi::FasterDecoder::SetOptions
void SetOptions(const FasterDecoderOptions &config)
Definition: faster-decoder.h:72

kaldi::FasterDecoder::config_
FasterDecoderOptions config_
Definition: faster-decoder.h:172

fst
For an extended explanation of the framework of which grammar-fsts are a part, please see Support for...
Definition: graph.dox:21

fst::StdArc
fst::StdArc StdArc
Definition: deterministic-fst-test.cc:56

kaldi::FasterDecoderOptions::max_active
int32 max_active
Definition: faster-decoder.h:35

kaldi::FasterDecoder::Token::Token
Token(const Arc &arc, Token *prev)
Definition: faster-decoder.h:125

kaldi::full
Definition: regtree-fmllr-diag-gmm-test.cc:59

kaldi::FasterDecoderOptions::beam_delta
BaseFloat beam_delta
Definition: faster-decoder.h:37

hash-list.h

kaldi::FasterDecoderOptions::hash_ratio
BaseFloat hash_ratio
Definition: faster-decoder.h:38

kaldi::FasterDecoder::Arc
fst::StdArc Arc
Definition: faster-decoder.h:64

kaldi::int32
kaldi::int32 int32
Definition: online-tcp-source.cc:27

KALDI_DISALLOW_COPY_AND_ASSIGN
#define KALDI_DISALLOW_COPY_AND_ASSIGN(type)
Definition: kaldi-utils.h:121

kaldi::FasterDecoder::Token::ref_count_
int32 ref_count_
Definition: faster-decoder.h:112

kaldi::OptionsItf::Register
virtual void Register(const std::string &name, bool *ptr, const std::string &doc)=0

kaldi-lattice.h

options-itf.h

kaldi::FasterDecoder::Token::TokenDelete
static void TokenDelete(Token *tok)
Definition: faster-decoder.h:138

kaldi::FasterDecoder::fst_
const fst::Fst< fst::StdArc > & fst_
Definition: faster-decoder.h:171

kaldi::FasterDecoder
Definition: faster-decoder.h:62

float

kaldi::HashList
Definition: hash-list.h:50

kaldi::FasterDecoder::Token
Definition: faster-decoder.h:106

kaldi::FasterDecoder::Token::prev_
Token * prev_
Definition: faster-decoder.h:111

decodable-itf.h

kaldi::FasterDecoderOptions::Register
void Register(OptionsItf *opts, bool full)
Definition: faster-decoder.h:45

kaldi::OptionsItf
Definition: options-itf.h:26

kaldi::FasterDecoder::toks_
HashList< StateId, Token * > toks_
Definition: faster-decoder.h:170

fst::Label
fst::StdArc::Label Label
Definition: deterministic-fst-test.cc:57

fst::Weight
fst::StdArc::Weight Weight
Definition: deterministic-fst-test.cc:60

kaldi::FasterDecoder::NumFramesDecoded
int32 NumFramesDecoded() const
Returns the number of frames already decoded.
Definition: faster-decoder.h:102

operator<
bool operator<(const Int32Pair &a, const Int32Pair &b)
Definition: cu-matrixdim.h:83

kaldi::FasterDecoderOptions::FasterDecoderOptions
FasterDecoderOptions()
Definition: faster-decoder.h:39

kaldi::FasterDecoder::Token::cost_
double cost_
Definition: faster-decoder.h:115

kaldi::FasterDecoder::Elem
HashList< StateId, Token * >::Elem Elem
Definition: faster-decoder.h:150

kaldi::FasterDecoder::Token::arc_
Arc arc_
Definition: faster-decoder.h:108

KALDI_ASSERT
#define KALDI_ASSERT(cond)
Definition: kaldi-error.h:185

kaldi::FasterDecoderOptions
Definition: faster-decoder.h:33

kaldi::FasterDecoder::num_frames_decoded_
int32 num_frames_decoded_
Definition: faster-decoder.h:178

kaldi::HashList::Elem
Definition: hash-list.h:52

kaldi::FasterDecoder::tmp_array_
std::vector< BaseFloat > tmp_array_
Definition: faster-decoder.h:174

kaldi::FasterDecoder::StateId
Arc::StateId StateId
Definition: faster-decoder.h:66

kaldi::FasterDecoder::Weight
Arc::Weight Weight
Definition: faster-decoder.h:67

kaldi::FasterDecoder::~FasterDecoder
~FasterDecoder()
Definition: faster-decoder.h:74

kaldi::FasterDecoder::queue_
std::vector< const Elem *> queue_
Definition: faster-decoder.h:173