doc/prob-to-post_8cc_source.html

 // bin/prob-to-post.cc

 // Copyright 2012  Johns Hopkins University (author: Daniel Povey)

 // See ../../COPYING for clarification regarding multiple authors
 //
 // Licensed under the Apache License, Version 2.0 (the "License");
 // you may not use this file except in compliance with the License.
 // You may obtain a copy of the License at
 //
 //  http://www.apache.org/licenses/LICENSE-2.0
 //
 // THIS CODE IS PROVIDED *AS IS* BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY
 // KIND, EITHER EXPRESS OR IMPLIED, INCLUDING WITHOUT LIMITATION ANY IMPLIED
 // WARRANTIES OR CONDITIONS OF TITLE, FITNESS FOR A PARTICULAR PURPOSE,
 // MERCHANTABLITY OR NON-INFRINGEMENT.
 // See the Apache 2 License for the specific language governing permissions and
 // limitations under the License.


 #include "base/kaldi-common.h"
 #include "util/common-utils.h"
 #include "gmm/am-diag-gmm.h"
 #include "hmm/transition-model.h"
 #include "hmm/hmm-utils.h"
 #include "hmm/posterior.h"

 /* Convert a matrix of probabilities
    to something of type Posterior, i.e. for each utterance, a
    vector<vector<pair<int32, BaseFloat> > >, which is a sparse representation
    of the probabilities.
    To avoid getting very tiny values making it non-sparse, we support
    thresholding, and this can either be done as a simple threshold, or (the
    default) a pseudo-random thing where you preserve the expectation, e.g.
    if the threshold is 0.01 and the value is 0.001, it will be zero with
    probability 0.9 and 0.01 with probability 0.1.
 */

 int main(int argc, char *argv[]) {
   using namespace kaldi;
   typedef kaldi::int32 int32;
   try {
     const char *usage =
         "Convert a matrix of probabilities (e.g. from nnet-logprob2) to posteriors\n"
         "Usage:  prob-to-post [options] <prob-matrix-rspecifier> <posteriors-wspecifier>\n"
         "e.g.:\n"
         " nnet-logprob2 [args] | prob-to-post ark:- ark:1.post\n"
         "Caution: in this particular example, the output would be posteriors of pdf-ids,\n"
         "rather than transition-ids (c.f. post-to-pdf-post)\n";

     ParseOptions po(usage);

     BaseFloat min_post = 0.01;
     bool random_prune = true; // preserve expectations.

     po.Register("min-post", &min_post, "Minimum posterior we will output (smaller "
                 "ones are pruned).  Also see --random-prune");
     po.Register("random-prune", &random_prune, "If true, prune posteriors with a "
                 "randomized method that preserves expectations.");

     po.Read(argc, argv);

     if (po.NumArgs() != 2) {
       po.PrintUsage();
       exit(1);
     }

     std::string prob_rspecifier = po.GetArg(1);
     std::string posteriors_wspecifier = po.GetArg(2);

     int32 num_done = 0;
     SequentialBaseFloatMatrixReader prob_reader(prob_rspecifier);
     PosteriorWriter posterior_writer(posteriors_wspecifier);

     for (; !prob_reader.Done(); prob_reader.Next()) {
       num_done++;
       const Matrix<BaseFloat> &probs = prob_reader.Value();
       // Posterior is vector<vector<pair<int32, BaseFloat> > >
       Posterior post(probs.NumRows());
       for (int32 i = 0; i < probs.NumRows(); i++) {
         SubVector<BaseFloat> row(probs, i);
         for (int32 j = 0; j < row.Dim(); j++) {
           BaseFloat p = row(j);
           if (p >= min_post) {
             post[i].push_back(std::make_pair(j, p));
           } else if (random_prune && (p / min_post) >= RandUniform()) {
             post[i].push_back(std::make_pair(j, min_post));
           }
         }
       }
       posterior_writer.Write(prob_reader.Key(), post);
     }
     KALDI_LOG << "Converted " << num_done << " log-prob matrices to posteriors.";
     return (num_done != 0 ? 0 : 1);
   } catch(const std::exception &e) {
     std::cerr << e.what();
     return -1;
   }
 }


am-diag-gmm.h

kaldi
This code computes Goodness of Pronunciation (GOP) and extracts phone-level pronunciation feature for...
Definition: chain.dox:20

rnnlm::j
int j
Definition: mikolov-rnnlm-lib.cc:66

kaldi::RandUniform
float RandUniform(struct RandomState *state=NULL)
Returns a random number strictly between 0 and 1.
Definition: kaldi-math.h:151

kaldi::ParseOptions::PrintUsage
void PrintUsage(bool print_command_line=false)
Prints the usage documentation [provided in the constructor].
Definition: parse-options.cc:393

kaldi::SequentialTableReader::Key
std::string Key()
Definition: kaldi-table-inl.h:918

hmm-utils.h

kaldi::TableWriter
A templated class for writing objects to an archive or script file; see The Table concept...
Definition: kaldi-table.h:368

kaldi::int32
kaldi::int32 int32
Definition: online-tcp-source.cc:27

common-utils.h

kaldi::Matrix< BaseFloat >

posterior.h

kaldi::TableWriter::Write
void Write(const std::string &key, const T &value) const
Definition: kaldi-table-inl.h:1511

kaldi::ParseOptions::Register
void Register(const std::string &name, bool *ptr, const std::string &doc)
Definition: parse-options.cc:56

kaldi::BaseFloat
float BaseFloat
Definition: kaldi-types.h:29

kaldi::Posterior
std::vector< std::vector< std::pair< int32, BaseFloat > > > Posterior
Posterior is a typedef for storing acoustic-state (actually, transition-id) posteriors over an uttera...
Definition: posterior.h:42

kaldi::ParseOptions
The class ParseOptions is for parsing command-line options; see Parsing command-line options for more...
Definition: parse-options.h:36

transition-model.h

kaldi::SequentialTableReader
A templated class for reading objects sequentially from an archive or script file; see The Table conc...
Definition: kaldi-table.h:287

kaldi::ParseOptions::Read
int Read(int argc, const char *const *argv)
Parses the command line options and fills the ParseOptions-registered variables.
Definition: parse-options.cc:311

kaldi::SequentialTableReader::Done
bool Done()
Definition: kaldi-table-inl.h:948

kaldi::ParseOptions::GetArg
std::string GetArg(int param) const
Returns one of the positional parameters; 1-based indexing for argc/argv compatibility.
Definition: parse-options.cc:202

kaldi::SequentialTableReader::Next
void Next()
Definition: kaldi-table-inl.h:942

kaldi::VectorBase::Dim
MatrixIndexT Dim() const
Returns the dimension of the vector.
Definition: kaldi-vector.h:64

rnnlm::i
int i
Definition: mikolov-rnnlm-lib.cc:66

kaldi::ParseOptions::NumArgs
int NumArgs() const
Number of positional parameters (c.f. argc-1).
Definition: parse-options.cc:198

kaldi::SequentialTableReader::Value
T & Value()
Definition: kaldi-table-inl.h:934

main
int main(int argc, char *argv[])
Definition: prob-to-post.cc:39

kaldi::MatrixBase::NumRows
MatrixIndexT NumRows() const
Returns number of rows (or zero for empty matrix).
Definition: kaldi-matrix.h:64

KALDI_LOG
#define KALDI_LOG
Definition: kaldi-error.h:153

kaldi-common.h

kaldi::SubVector
Represents a non-allocating general vector which can be defined as a sub-vector of higher-level vecto...
Definition: kaldi-vector.h:501