doc/hmm-utils_8h_source.html

 // hmm/hmm-utils.h

 // Copyright 2009-2011  Microsoft Corporation

 // See ../../COPYING for clarification regarding multiple authors
 //
 // Licensed under the Apache License, Version 2.0 (the "License");
 // you may not use this file except in compliance with the License.
 // You may obtain a copy of the License at
 //
 //  http://www.apache.org/licenses/LICENSE-2.0
 //
 // THIS CODE IS PROVIDED *AS IS* BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY
 // KIND, EITHER EXPRESS OR IMPLIED, INCLUDING WITHOUT LIMITATION ANY IMPLIED
 // WARRANTIES OR CONDITIONS OF TITLE, FITNESS FOR A PARTICULAR PURPOSE,
 // MERCHANTABLITY OR NON-INFRINGEMENT.
 // See the Apache 2 License for the specific language governing permissions and
 // limitations under the License.

 #ifndef KALDI_HMM_HMM_UTILS_H_
 #define KALDI_HMM_HMM_UTILS_H_

 #include "hmm/hmm-topology.h"
 #include "hmm/transition-model.h"
 #include "lat/kaldi-lattice.h"

 namespace kaldi {


 struct HTransducerConfig {
   BaseFloat transition_scale;
   int32 nonterm_phones_offset;

   HTransducerConfig():
       transition_scale(1.0),
       nonterm_phones_offset(-1) { }

   void Register (OptionsItf *opts) {
     opts->Register("transition-scale", &transition_scale,
                    "Scale of transition probs (relative to LM)");
     opts->Register("nonterm-phones-offset", &nonterm_phones_offset,
                    "The integer id of #nonterm_bos in phones.txt, if present. "
                    "Only needs to be set if you are doing grammar decoding, "
                    "see doc/grammar.dox.");
   }
 };


 // Hash function-object for the keys of HmmCacheType, i.e. pairs of
 // (int32, vector<int32>).  Combines the first element, multiplied by a
 // prime, with the VectorHasher hash of the vector.
 struct HmmCacheHash {
   int operator () (const std::pair<int32, std::vector<int32> >&p) const {
     VectorHasher<int32> v;
     const unsigned int prime = 103049;
     // Do the multiplication in unsigned arithmetic: a signed int32 product
     // would be undefined behaviour on overflow (large p.first), whereas
     // unsigned wrap-around is well defined.  The sum is then narrowed to
     // int exactly as before, so results are unchanged wherever the signed
     // product did not overflow.
     return static_cast<int>(prime * static_cast<unsigned int>(p.first) +
                             v(p.second));
   }
 };

 // HmmCacheType is a map from (central-phone, sequence of pdf-ids) to an FST
 // pointer, hashed with HmmCacheHash.  It is the type of the optional "cache"
 // argument of GetHmmAsFsa().
 typedef unordered_map<std::pair<int32, std::vector<int32> >,
                       fst::VectorFst<fst::StdArc>*,
                       HmmCacheHash> HmmCacheType;


 // Called by GetHTransducer() and probably will not need to be called
 // directly.  Creates and returns an FST (StdArc) for the given context
 // window.
 //   context_window: taken by value (the definition in hmm-utils.cc names this
 //                   parameter "phone_window").
 //   config:         options, see HTransducerConfig.
 //   cache:          optional, may be NULL (the default); a map of type
 //                   HmmCacheType.
 // NOTE(review): ownership of the returned pointer when a cache is supplied is
 // not visible from this header -- confirm against hmm-utils.cc.
 fst::VectorFst<fst::StdArc> *GetHmmAsFsa(
     std::vector<int32> context_window,
     const ContextDependencyInterface &ctx_dep,
     const TransitionModel &trans_model,
     const HTransducerConfig &config,
     HmmCacheType *cache = NULL);


 // Included mainly as a form of documentation; not used in any other code
 // currently.  Takes a single scale "prob_scale" instead of an
 // HTransducerConfig and has no cache argument.
 // (The definition in hmm-utils.cc names the first parameter "phone_window".)
 fst::VectorFst<fst::StdArc>*
 GetHmmAsFsaSimple(std::vector<int32> context_window,
                   const ContextDependencyInterface &ctx_dep,
                   const TransitionModel &trans_model,
                   BaseFloat prob_scale);


 // Returns the H transducer; the result is owned by the caller.
 //   config:             options, see HTransducerConfig.
 //   disambig_syms_left: non-const pointer, presumably an output list of
 //                       disambiguation symbols -- confirm in hmm-utils.cc.
 fst::VectorFst<fst::StdArc>*
 GetHTransducer(const std::vector<std::vector<int32> > &ilabel_info,
                const ContextDependencyInterface &ctx_dep,
                const TransitionModel &trans_model,
                const HTransducerConfig &config,
                std::vector<int32> *disambig_syms_left);

 // GetIlabelMapping produces a mapping that's similar to HTK's
 // logical-to-physical model mapping.  The function returns void; the only
 // non-const argument is "old2new_map", which receives the mapping.
 void GetIlabelMapping(const std::vector<std::vector<int32> > &ilabel_info_old,
                       const ContextDependencyInterface &ctx_dep,
                       const TransitionModel &trans_model,
                       std::vector<int32> *old2new_map);


 // Adds self-loops to the FST pointed to by "fst" (the only non-const
 // argument), using the supplied transition model and self-loop scale.
 // "disambig_syms" is used as a check only.
 // NOTE(review): the exact meaning of "reorder" and "check_no_self_loops" is
 // defined in hmm-utils.cc and is not visible from this header.
 void AddSelfLoops(const TransitionModel &trans_model,
                   const std::vector<int32> &disambig_syms,  // used as a check only.
                   BaseFloat self_loop_scale,
                   bool reorder,
                   bool check_no_self_loops,
                   fst::VectorFst<fst::StdArc> *fst);

 // Adds transition-probs, with the supplied scales ("transition_scale" and
 // "self_loop_scale"), to the FST pointed to by "fst".  This overload works on
 // a VectorFst<StdArc> and additionally takes the list of disambiguation
 // symbols.
 void AddTransitionProbs(const TransitionModel &trans_model,
                         const std::vector<int32> &disambig_syms,
                         BaseFloat transition_scale,
                         BaseFloat self_loop_scale,
                         fst::VectorFst<fst::StdArc> *fst);

 // Overload of AddTransitionProbs() that operates on a Lattice (declared in
 // lat/kaldi-lattice.h) and takes no disambiguation-symbol list.  The
 // lattice pointed to by "lat" is the only non-const argument.
 void AddTransitionProbs(const TransitionModel &trans_model,
                         BaseFloat transition_scale,
                         BaseFloat self_loop_scale,
                         Lattice *lat);


 // Returns a transducer from pdfs plus one (input) to transition-ids (output).
 // NOTE(review): returns a raw pointer; presumably owned by the caller --
 // confirm in hmm-utils.cc.
 fst::VectorFst<fst::StdArc>*
 GetPdfToTransitionIdTransducer(const TransitionModel &trans_model);

 // Converts all transition-ids in the FST to pdfs plus one.  The FST pointed
 // to by "fst" is the only non-const argument.
 // NOTE(review): "disambig_syms" are presumably left unconverted -- confirm in
 // hmm-utils.cc.
 void ConvertTransitionIdsToPdfs(const TransitionModel &trans_model,
                                 const std::vector<int32> &disambig_syms,
                                 fst::VectorFst<fst::StdArc> *fst);


 // SplitToPhones splits up the TransitionIds in "alignment" into their
 // individual phones; the pieces are written to "split_alignment".
 // NOTE(review): the bool return presumably signals success -- the exact
 // failure conditions are defined in hmm-utils.cc.
 bool SplitToPhones(const TransitionModel &trans_model,
                    const std::vector<int32> &alignment,
                    std::vector<std::vector<int32> > *split_alignment);

 // ConvertAlignment converts an alignment that was created using one model
 // ("old_trans_model") to another model ("new_trans_model" / "new_ctx_dep").
 // The converted alignment is written to "new_alignment".
 //   subsample_factor: 1 in the normal case, meaning no subsampling.
 //   reorder:          the definition in hmm-utils.cc names this parameter
 //                     "new_is_reordered".
 //   phone_map:        optional, may be NULL.
 // NOTE(review): the bool return presumably signals success -- confirm the
 // failure conditions in hmm-utils.cc.
 bool ConvertAlignment(const TransitionModel &old_trans_model,
                       const TransitionModel &new_trans_model,
                       const ContextDependencyInterface &new_ctx_dep,
                       const std::vector<int32> &old_alignment,
                       int32 subsample_factor,  // 1 in the normal case -> no subsampling.
                       bool repeat_frames,
                       bool reorder,
                       const std::vector<int32> *phone_map,  // may be NULL
                       std::vector<int32> *new_alignment);

 // ConvertPhnxToProns is only needed in bin/phones-to-prons.cc and
 // isn't closely related to HMMs, but we put it here as there isn't
 // any other obvious place for it and it needs to be tested.
 // This function takes a phone-sequence "phnx" with word-start and word-end
 // markers ("word_start_sym", "word_end_sym") in it, and a word-sequence
 // "words", and outputs the pronunciations "prons".  Each element of
 // "prons" is a vector whose first element is the word (or zero meaning
 // no word, e.g. for optional silence introduced by the lexicon), and whose
 // remaining elements are the phones in the word's pronunciation.
 // It returns false if it encounters a problem of some kind, e.g.
 // if the phone-sequence doesn't seem to have the right number of
 // words in it.
 bool ConvertPhnxToProns(const std::vector<int32> &phnx,
                         const std::vector<int32> &words,
                         int32 word_start_sym,
                         int32 word_end_sym,
                         std::vector<std::vector<int32> > *prons);


 /* Generates a random alignment for this phone, of length equal to
    alignment->size(), which is required to be at least the MinLength() of the
    topology for this phone, or this function will crash.
    The caller therefore sizes *alignment before the call; its elements are
    overwritten with the generated alignment.
    The alignment will be without 'reordering'.
 */
 void GetRandomAlignmentForPhone(const ContextDependencyInterface &ctx_dep,
                                 const TransitionModel &trans_model,
                                 const std::vector<int32> &phone_window,
                                 std::vector<int32> *alignment);

 /*
   If the alignment was non-reordered makes it reordered, and vice versa.
   The alignment is modified in place through the "alignment" pointer.
 */
 void ChangeReorderingOfAlignment(const TransitionModel &trans_model,
                                  std::vector<int32> *alignment);


 // GetPdfToPhonesMap creates a map which maps each pdf-id into its
 // corresponding monophones.  The result is written to "pdf2phones", a vector
 // of sets of phone ids.
 // NOTE(review): the vector is presumably indexed by pdf-id -- confirm in
 // hmm-utils.cc.
 void GetPdfToPhonesMap(const TransitionModel &trans_model,
                        std::vector<std::set<int32> > *pdf2phones);


 } // end namespace kaldi


 #endif
words
int32 words[kMaxOrder]
Definition: arpa-file-parser-test.cc:43

kaldi
This code computes Goodness of Pronunciation (GOP) and extracts phone-level pronunciation feature for...
Definition: chain.dox:20

kaldi::VectorHasher
A hashing function-object for vectors.
Definition: stl-utils.h:216

kaldi::HTransducerConfig::Register
void Register(OptionsItf *opts)
Definition: hmm-utils.h:47

kaldi::GetRandomAlignmentForPhone
void GetRandomAlignmentForPhone(const ContextDependencyInterface &ctx_dep, const TransitionModel &trans_model, const std::vector< int32 > &phone_window, std::vector< int32 > *alignment)
Definition: hmm-utils.cc:1207

kaldi::ConvertPhnxToProns
bool ConvertPhnxToProns(const std::vector< int32 > &phnx, const std::vector< int32 > &words, int32 word_start_sym, int32 word_end_sym, std::vector< std::vector< int32 > > *prons)
Definition: hmm-utils.cc:1161

fst
For an extended explanation of the framework of which grammar-fsts are a part, please see Support for...
Definition: graph.dox:21

kaldi::AddSelfLoops
void AddSelfLoops(const TransitionModel &trans_model, const std::vector< int32 > &disambig_syms, BaseFloat self_loop_scale, bool reorder, bool check_no_self_loops, fst::VectorFst< fst::StdArc > *fst)
For context, see AddSelfLoops().
Definition: hmm-utils.cc:602

kaldi::GetIlabelMapping
void GetIlabelMapping(const std::vector< std::vector< int32 > > &ilabel_info_old, const ContextDependencyInterface &ctx_dep, const TransitionModel &trans_model, std::vector< int32 > *old2new_map)
GetIlabelMapping produces a mapping that's similar to HTK's logical-to-physical model mapping (i...
Definition: hmm-utils.cc:335

kaldi::HmmCacheType
unordered_map< std::pair< int32, std::vector< int32 > >, fst::VectorFst< fst::StdArc > *, HmmCacheHash > HmmCacheType
HmmCacheType is a map from (central-phone, sequence of pdf-ids) to FST, used as cache in GetHmmAsFsa...
Definition: hmm-utils.h:70

kaldi::int32
kaldi::int32 int32
Definition: online-tcp-source.cc:27

kaldi::HTransducerConfig::nonterm_phones_offset
int32 nonterm_phones_offset
Definition: hmm-utils.h:41

kaldi::OptionsItf::Register
virtual void Register(const std::string &name, bool *ptr, const std::string &doc)=0

kaldi::TransitionModel
Definition: transition-model.h:123

kaldi-lattice.h

kaldi::SplitToPhones
bool SplitToPhones(const TransitionModel &trans_model, const std::vector< int32 > &alignment, std::vector< std::vector< int32 > > *split_alignment)
SplitToPhones splits up the TransitionIds in "alignment" into their individual phones (one vector per...
Definition: hmm-utils.cc:723

kaldi::HTransducerConfig
Configuration class for the GetHTransducer() function; see The HTransducerConfig configuration class ...
Definition: hmm-utils.h:36

kaldi::AddTransitionProbs
void AddTransitionProbs(const TransitionModel &trans_model, const std::vector< int32 > &disambig_syms, BaseFloat transition_scale, BaseFloat self_loop_scale, fst::VectorFst< fst::StdArc > *fst)
Adds transition-probs, with the supplied scales (see Scaling of transition and acoustic probabilities...
Definition: hmm-utils.cc:1088

kaldi::BaseFloat
float BaseFloat
Definition: kaldi-types.h:29

kaldi::GetPdfToPhonesMap
void GetPdfToPhonesMap(const TransitionModel &trans_model, std::vector< std::set< int32 > > *pdf2phones)
Definition: hmm-utils.cc:1292

float

transition-model.h

kaldi::Lattice
fst::VectorFst< LatticeArc > Lattice
Definition: kaldi-lattice.h:44

kaldi::OptionsItf
Definition: options-itf.h:26

kaldi::GetHTransducer
fst::VectorFst< fst::StdArc > * GetHTransducer(const std::vector< std::vector< int32 > > &ilabel_info, const ContextDependencyInterface &ctx_dep, const TransitionModel &trans_model, const HTransducerConfig &config, std::vector< int32 > *disambig_syms_left)
Returns the H transducer; result owned by caller.
Definition: hmm-utils.cc:254

kaldi::HmmCacheHash
Definition: hmm-utils.h:58

kaldi::ContextDependencyInterface
context-dep-itf.h provides a link between the tree-building code in ../tree/, and the FST code in ...
Definition: context-dep-itf.h:34

kaldi::HTransducerConfig::transition_scale
BaseFloat transition_scale
Transition log-prob scale, see Scaling of transition and acoustic probabilities.
Definition: hmm-utils.h:40

kaldi::GetHmmAsFsa
fst::VectorFst< fst::StdArc > * GetHmmAsFsa(std::vector< int32 > phone_window, const ContextDependencyInterface &ctx_dep, const TransitionModel &trans_model, const HTransducerConfig &config, HmmCacheType *cache)
Called by GetHTransducer() and probably will not need to be called directly; it creates and returns t...
Definition: hmm-utils.cc:32

kaldi::ConvertTransitionIdsToPdfs
void ConvertTransitionIdsToPdfs(const TransitionModel &trans_model, const std::vector< int32 > &disambig_syms, fst::VectorFst< fst::StdArc > *fst)
Converts all transition-ids in the FST to pdfs plus one.

hmm-topology.h

kaldi::ChangeReorderingOfAlignment
void ChangeReorderingOfAlignment(const TransitionModel &trans_model, std::vector< int32 > *alignment)
Definition: hmm-utils.cc:1260

kaldi::HTransducerConfig::HTransducerConfig
HTransducerConfig()
Definition: hmm-utils.h:43

kaldi::ConvertAlignment
bool ConvertAlignment(const TransitionModel &old_trans_model, const TransitionModel &new_trans_model, const ContextDependencyInterface &new_ctx_dep, const std::vector< int32 > &old_alignment, int32 subsample_factor, bool repeat_frames, bool new_is_reordered, const std::vector< int32 > *phone_map, std::vector< int32 > *new_alignment)
ConvertAlignment converts an alignment that was created using one model, to another model...
Definition: hmm-utils.cc:1013

kaldi::GetHmmAsFsaSimple
fst::VectorFst< fst::StdArc > * GetHmmAsFsaSimple(std::vector< int32 > phone_window, const ContextDependencyInterface &ctx_dep, const TransitionModel &trans_model, BaseFloat prob_scale)
Included mainly as a form of documentation, not used in any other code currently. ...
Definition: hmm-utils.cc:155

kaldi::GetPdfToTransitionIdTransducer
fst::VectorFst< fst::StdArc > * GetPdfToTransitionIdTransducer(const TransitionModel &trans_model)
Returns a transducer from pdfs plus one (input) to transition-ids (output).
Definition: hmm-utils.cc:407