doc/online-nnet3-incremental-decoding_8h_source.html

 // online2/online-nnet3-incremental-decoding.h

 // Copyright      2019  Zhehuai Chen

 // See ../../COPYING for clarification regarding multiple authors
 //
 // Licensed under the Apache License, Version 2.0 (the "License");
 // you may not use this file except in compliance with the License.
 // You may obtain a copy of the License at
 //
 //  http://www.apache.org/licenses/LICENSE-2.0
 //
 // THIS CODE IS PROVIDED *AS IS* BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY
 // KIND, EITHER EXPRESS OR IMPLIED, INCLUDING WITHOUT LIMITATION ANY IMPLIED
 // WARRANTIES OR CONDITIONS OF TITLE, FITNESS FOR A PARTICULAR PURPOSE,
 // MERCHANTABLITY OR NON-INFRINGEMENT.
 // See the Apache 2 License for the specific language governing permissions and
 // limitations under the License.


 #ifndef KALDI_ONLINE2_ONLINE_NNET3_INCREMENTAL_DECODING_H_
 #define KALDI_ONLINE2_ONLINE_NNET3_INCREMENTAL_DECODING_H_

 #include <string>
 #include <vector>
 #include <deque>

 #include "nnet3/decodable-online-looped.h"
 #include "matrix/matrix-lib.h"
 #include "util/common-utils.h"
 #include "base/kaldi-error.h"
 #include "itf/online-feature-itf.h"
 #include "online2/online-endpoint.h"
 #include "online2/online-nnet2-feature-pipeline.h"
 #include "decoder/lattice-incremental-online-decoder.h"
 #include "hmm/transition-model.h"
 #include "hmm/posterior.h"

 namespace kaldi {


 /// Decodes a single utterance online, pairing an nnet3 looped decodable
 /// object (DecodableAmNnetLoopedOnline) with an incremental lattice decoder
 /// (LatticeIncrementalOnlineDecoderTpl).
 ///
 /// @tparam FST  The decoding-graph type handed to the underlying decoder.
 template <typename FST>
 class SingleUtteranceNnet3IncrementalDecoderTpl {
  public:
   /// Constructor.  Note that 'features' is borrowed, not owned: this class
   /// never deallocates it, so the caller remains responsible for it.
   SingleUtteranceNnet3IncrementalDecoderTpl(
       const LatticeIncrementalDecoderConfig &decoder_opts,
       const TransitionModel &trans_model,
       const nnet3::DecodableNnetSimpleLoopedInfo &info,
       const FST &fst,
       OnlineNnet2FeaturePipeline *features);

   ~SingleUtteranceNnet3IncrementalDecoderTpl() { }

   /// Initializes the decoding and sets the frame offset of the underlying
   /// decodable object.
   void InitDecoding(int32 frame_offset = 0);

   /// Advances the decoding as far as we can.
   void AdvanceDecoding();

   /// Finalizes the decoding; simply forwards to the wrapped decoder.
   void FinalizeDecoding() {
     decoder_.FinalizeDecoding();
   }

   /// Number of frames decoded so far, as reported by the wrapped decoder.
   int32 NumFramesDecoded() const {
     return decoder_.NumFramesDecoded();
   }

   /// Number of frames currently in the lattice, as reported by the wrapped
   /// decoder.
   int32 NumFramesInLattice() const {
     return decoder_.NumFramesInLattice();
   }

   /// Gets the lattice.  Any acoustic scaling is left in the output lattice
   /// (typically what you want in an online-decoding context); to obtain an
   /// un-scaled lattice, apply ScaleLattice() with the inverse of the
   /// acoustic weight.
   ///
   /// @param [in] num_frames_to_include  How many frames the returned lattice
   ///              should cover.  Must lie in the range
   ///              [NumFramesInLattice() .. NumFramesDecoded()].  Choosing a
   ///              value a few frames below NumFramesDecoded() saves
   ///              significant computation.
   /// @param [in] use_final_probs  True if the lattice should contain
   ///              final-probs (when at least one state was final on the most
   ///              recently decoded frame).  Must be false if
   ///              num_frames_to_include < NumFramesDecoded(); must be true
   ///              if FinalizeDecoding() has already been called.
   /// @return  Whatever the wrapped decoder's GetLattice() returns for the
   ///          same arguments.
   const CompactLattice &GetLattice(int32 num_frames_to_include,
                                    bool use_final_probs = false) {
     return decoder_.GetLattice(num_frames_to_include,
                                use_final_probs);
   }

   /// Outputs an FST corresponding to the single best path through the
   /// current lattice.
   void GetBestPath(bool end_of_utterance, Lattice *best_path) const;

   /// Calls EndpointDetected() from online-endpoint.h with the required
   /// arguments.
   bool EndpointDetected(const OnlineEndpointConfig &config);

   /// Read-only access to the wrapped decoder.
   const LatticeIncrementalOnlineDecoderTpl<FST> &Decoder() const {
     return decoder_;
   }

  private:
   // Held by reference, not copied.  NOTE(review): presumably bound to the
   // constructor's 'decoder_opts' argument, in which case that object must
   // outlive this one -- confirm against the .cc file.
   const LatticeIncrementalDecoderConfig &decoder_opts_;

   // Remembered from the constructor; ultimately obtained by calling
   // FrameShiftInSeconds() on the feature pipeline.
   BaseFloat input_feature_frame_shift_in_seconds_;

   // The only reason a reference to the transition model is kept is that the
   // endpointing code needs it.
   const TransitionModel &trans_model_;

   // Decodable object and the decoder that consumes it.  Declaration order of
   // the data members is significant (it fixes their initialization order),
   // so do not reorder them.
   nnet3::DecodableAmNnetLoopedOnline decodable_;

   LatticeIncrementalOnlineDecoderTpl<FST> decoder_;
 };


 // Convenience name for the decoder instantiated on the generic
 // fst::Fst<fst::StdArc> graph type.
 using SingleUtteranceNnet3IncrementalDecoder =
     SingleUtteranceNnet3IncrementalDecoderTpl<fst::Fst<fst::StdArc> >;


 }  // namespace kaldi


 #endif  // KALDI_ONLINE2_ONLINE_NNET3_INCREMENTAL_DECODING_H_
kaldi
This code computes Goodness of Pronunciation (GOP) and extracts phone-level pronunciation feature for...
Definition: chain.dox:20

matrix-lib.h

kaldi::SingleUtteranceNnet3IncrementalDecoderTpl::~SingleUtteranceNnet3IncrementalDecoderTpl
~SingleUtteranceNnet3IncrementalDecoderTpl()
Definition: online-nnet3-incremental-decoding.h:120

kaldi::SingleUtteranceNnet3IncrementalDecoderTpl::SingleUtteranceNnet3IncrementalDecoderTpl
SingleUtteranceNnet3IncrementalDecoderTpl(const LatticeIncrementalDecoderConfig &decoder_opts, const TransitionModel &trans_model, const nnet3::DecodableNnetSimpleLoopedInfo &info, const FST &fst, OnlineNnet2FeaturePipeline *features)
Definition: online-nnet3-incremental-decoding.cc:28

kaldi::SingleUtteranceNnet3IncrementalDecoderTpl::GetLattice
const CompactLattice & GetLattice(int32 num_frames_to_include, bool use_final_probs=false)
Definition: online-nnet3-incremental-decoding.h:97

kaldi::LatticeIncrementalOnlineDecoderTpl
LatticeIncrementalOnlineDecoderTpl is as LatticeIncrementalDecoderTpl but also supports an efficient ...
Definition: lattice-incremental-online-decoder.h:51

fst
For an extended explanation of the framework of which grammar-fsts are a part, please see Support for...
Definition: graph.dox:21

kaldi::nnet3::DecodableAmNnetLoopedOnline
Definition: decodable-online-looped.h:183

kaldi::SingleUtteranceNnet3IncrementalDecoderTpl::NumFramesInLattice
int32 NumFramesInLattice() const
Definition: online-nnet3-incremental-decoding.h:78

kaldi::OnlineEndpointConfig
Definition: online-endpoint.h:127

kaldi::int32
kaldi::int32 int32
Definition: online-tcp-source.cc:27

common-utils.h

kaldi::SingleUtteranceNnet3IncrementalDecoderTpl::decoder_opts_
const LatticeIncrementalDecoderConfig & decoder_opts_
Definition: online-nnet3-incremental-decoding.h:123

posterior.h

online-nnet2-feature-pipeline.h
This file contains a different version of the feature-extraction pipeline in online-feature-pipeline...

kaldi::SingleUtteranceNnet3IncrementalDecoderTpl::decodable_
nnet3::DecodableAmNnetLoopedOnline decodable_
Definition: online-nnet3-incremental-decoding.h:133

kaldi::TransitionModel
Definition: transition-model.h:123

kaldi::SingleUtteranceNnet3IncrementalDecoderTpl::decoder_
LatticeIncrementalOnlineDecoderTpl< FST > decoder_
Definition: online-nnet3-incremental-decoding.h:135

decodable-online-looped.h

kaldi::SingleUtteranceNnet3IncrementalDecoderTpl::InitDecoding
void InitDecoding(int32 frame_offset=0)
Initializes the decoding and sets the frame offset of the underlying decodable object.
Definition: online-nnet3-incremental-decoding.cc:44

float

transition-model.h

kaldi::SingleUtteranceNnet3IncrementalDecoderTpl::AdvanceDecoding
void AdvanceDecoding()
Advances the decoding as far as we can.
Definition: online-nnet3-incremental-decoding.cc:50

kaldi::SingleUtteranceNnet3IncrementalDecoder
SingleUtteranceNnet3IncrementalDecoderTpl< fst::Fst< fst::StdArc > > SingleUtteranceNnet3IncrementalDecoder
Definition: online-nnet3-incremental-decoding.h:140

kaldi::Lattice
fst::VectorFst< LatticeArc > Lattice
Definition: kaldi-lattice.h:44

lattice-incremental-online-decoder.h

kaldi::SingleUtteranceNnet3IncrementalDecoderTpl::input_feature_frame_shift_in_seconds_
BaseFloat input_feature_frame_shift_in_seconds_
Definition: online-nnet3-incremental-decoding.h:127

kaldi::CompactLattice
fst::VectorFst< CompactLatticeArc > CompactLattice
Definition: kaldi-lattice.h:46

kaldi::SingleUtteranceNnet3IncrementalDecoderTpl::Decoder
const LatticeIncrementalOnlineDecoderTpl< FST > & Decoder() const
Definition: online-nnet3-incremental-decoding.h:118

online-feature-itf.h

kaldi::LatticeIncrementalDecoderConfig
The normal decoder, lattice-faster-decoder.h, sometimes has an issue when doing real-time application...
Definition: lattice-incremental-decoder.h:106

kaldi::SingleUtteranceNnet3IncrementalDecoderTpl::FinalizeDecoding
void FinalizeDecoding()
Finalizes the decoding.
Definition: online-nnet3-incremental-decoding.h:74

kaldi::SingleUtteranceNnet3IncrementalDecoderTpl::EndpointDetected
bool EndpointDetected(const OnlineEndpointConfig &config)
This function calls EndpointDetected from online-endpoint.h, with the required arguments.
Definition: online-nnet3-incremental-decoding.cc:61

kaldi::SingleUtteranceNnet3IncrementalDecoderTpl
You will instantiate this class when you want to decode a single utterance using the online-decoding ...
Definition: online-nnet3-incremental-decoding.h:51

kaldi::OnlineNnet2FeaturePipeline
OnlineNnet2FeaturePipeline is a class that's responsible for putting together the various parts of th...
Definition: online-nnet2-feature-pipeline.h:198

online-endpoint.h

kaldi::SingleUtteranceNnet3IncrementalDecoderTpl::trans_model_
const TransitionModel & trans_model_
Definition: online-nnet3-incremental-decoding.h:131

kaldi::nnet3::DecodableNnetSimpleLoopedInfo
When you instantiate class DecodableNnetSimpleLooped, you should give it a const reference to this cl...
Definition: decodable-simple-looped.h:102

kaldi::SingleUtteranceNnet3IncrementalDecoderTpl::NumFramesDecoded
int32 NumFramesDecoded() const
Definition: online-nnet3-incremental-decoding.h:76

kaldi::SingleUtteranceNnet3IncrementalDecoderTpl::GetBestPath
void GetBestPath(bool end_of_utterance, Lattice *best_path) const
Outputs an FST corresponding to the single best path through the current lattice. ...
Definition: online-nnet3-incremental-decoding.cc:55

kaldi-error.h