doc/online-nnet2-decodable-test_8cc_source.html

 // nnet2/online-nnet2-decodable-test.cc

 // Copyright 2014  Johns Hopkins University (author:  Daniel Povey)

 // See ../../COPYING for clarification regarding multiple authors
 //
 // Licensed under the Apache License, Version 2.0 (the "License");
 // you may not use this file except in compliance with the License.
 // You may obtain a copy of the License at
 //
 //  http://www.apache.org/licenses/LICENSE-2.0
 //
 // THIS CODE IS PROVIDED *AS IS* BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY
 // KIND, EITHER EXPRESS OR IMPLIED, INCLUDING WITHOUT LIMITATION ANY IMPLIED
 // WARRANTIES OR CONDITIONS OF TITLE, FITNESS FOR A PARTICULAR PURPOSE,
 // MERCHANTABLITY OR NON-INFRINGEMENT.
 // See the Apache 2 License for the specific language governing permissions and
 // limitations under the License.

 #include "hmm/transition-model.h"
 #include "nnet2/nnet-component.h"
 #include "nnet2/decodable-am-nnet.h"
 #include "nnet2/online-nnet2-decodable.h"
 #include "feat/online-feature.h"
 #include "hmm/hmm-test-utils.h"

 namespace kaldi {
 namespace nnet2 {


 void UnitTestNnetDecodable() {
   std::vector<int32> phones;
   phones.push_back(1);
   for (int32 i = 2; i < 20; i++)
     if (rand() % 2 == 0)
       phones.push_back(i);
   int32 N = 2 + rand() % 2, // context-size N is 2 or 3.
       P = rand() % N;  // Central-phone is random on [0, N)

   std::vector<int32> num_pdf_classes;

   ContextDependency *ctx_dep =
       GenRandContextDependencyLarge(phones, N, P,
                                     true, &num_pdf_classes);

   HmmTopology topo = GetDefaultTopology(phones);

   TransitionModel trans_model(*ctx_dep, topo);

   delete ctx_dep; // We won't need this further.
   ctx_dep = NULL;

   int32 input_dim = 40, output_dim = trans_model.NumPdfs();
   Nnet *nnet = GenRandomNnet(input_dim, output_dim);

   AmNnet am_nnet(*nnet);
   delete nnet;
   nnet = NULL;
   Vector<BaseFloat> priors(output_dim);
   priors.SetRandn();
   priors.ApplyExp();
   priors.Scale(1.0 / priors.Sum());

   am_nnet.SetPriors(priors);

   DecodableNnet2OnlineOptions opts;
   opts.max_nnet_batch_size = 20;
   opts.acoustic_scale = 0.1;

   opts.pad_input = (rand() % 2 == 0);

   int32 num_input_frames = 400;
   Matrix<BaseFloat> input_feats(num_input_frames, input_dim);
   input_feats.SetRandn();

   OnlineMatrixFeature matrix_feature(input_feats);

   DecodableNnet2Online online_decodable(am_nnet, trans_model,
                                         opts, &matrix_feature);

   DecodableAmNnet offline_decodable(trans_model, am_nnet,
                                     CuMatrix<BaseFloat>(input_feats),
                                     opts.pad_input,
                                     opts.acoustic_scale);

   KALDI_ASSERT(online_decodable.NumFramesReady() ==
                offline_decodable.NumFramesReady());
   int32 num_frames = online_decodable.NumFramesReady(),
       num_tids = trans_model.NumTransitionIds();

   for (int32 i = 0; i < 50; i++) {

     int32 t = rand() % num_frames, tid = 1 + rand() % num_tids;
     BaseFloat l1 = online_decodable.LogLikelihood(t, tid),
         l2 = offline_decodable.LogLikelihood(t, tid);
     KALDI_ASSERT(ApproxEqual(l1, l2));
   }
 }

 } // namespace nnet2
 } // namespace kaldi


 int main() {
   using namespace kaldi;
   using namespace kaldi::nnet2;
   using kaldi::int32;

   for (int32 i = 0; i < 3; i++)
     UnitTestNnetDecodable();
   return 0;
 }


kaldi::OnlineMatrixFeature
This class takes a Matrix<BaseFloat> and wraps it as an OnlineFeatureInterface: this can be useful wh...
Definition: online-feature.h:167

kaldi
This code computes Goodness of Pronunciation (GOP) and extracts phone-level pronunciation feature for...
Definition: chain.dox:20

kaldi::VectorBase::ApplyExp
void ApplyExp()
Apply exponential to each value in vector.
Definition: kaldi-vector.cc:800

kaldi::GetDefaultTopology
HmmTopology GetDefaultTopology(const std::vector< int32 > &phones_in)
This function returns a HmmTopology object giving a normal 3-state topology, covering all phones in t...
Definition: hmm-test-utils.cc:50

decodable-am-nnet.h

kaldi::GenRandContextDependencyLarge
ContextDependency * GenRandContextDependencyLarge(const std::vector< int32 > &phone_ids, int N, int P, bool ensure_all_covered, std::vector< int32 > *hmm_lengths)
GenRandContextDependencyLarge is like GenRandContextDependency but generates a larger tree with speci...
Definition: context-dep.cc:97

kaldi::HmmTopology
A class for storing topology information for phones.
Definition: hmm-topology.h:93

kaldi::nnet2::AmNnet
Definition: am-nnet.h:38

kaldi::nnet2::GenRandomNnet
Nnet * GenRandomNnet(int32 input_dim, int32 output_dim)
This function generates a random neural net, for testing purposes.
Definition: nnet-nnet.cc:772

kaldi::nnet2::DecodableNnet2OnlineOptions::pad_input
bool pad_input
Definition: online-nnet2-decodable.h:39

online-feature.h

kaldi::int32
kaldi::int32 int32
Definition: online-tcp-source.cc:27

kaldi::Matrix< BaseFloat >

kaldi::CuMatrix
This class represents a matrix that's stored on the GPU if we have one, and in memory if not...
Definition: matrix-common.h:71

kaldi::nnet2::DecodableNnet2Online::NumFramesReady
virtual int32 NumFramesReady() const
The call NumFramesReady() will return the number of frames currently available for this decodable obj...
Definition: online-nnet2-decodable.cc:66

kaldi::ContextDependency
Definition: context-dep.h:59

nnet-component.h

kaldi::TransitionModel
Definition: transition-model.h:123

main
int main()
Definition: online-nnet2-decodable-test.cc:104

online-nnet2-decodable.h

float

transition-model.h

kaldi::TransitionModel::NumTransitionIds
int32 NumTransitionIds() const
Returns the total number of transition-ids (note, these are one-based).
Definition: transition-model.h:175

kaldi::MatrixBase::SetRandn
void SetRandn()
Sets to random values of a normal distribution.
Definition: kaldi-matrix.cc:1355

kaldi::nnet2::Nnet
Definition: nnet-nnet.h:63

kaldi::nnet2::DecodableAmNnet::LogLikelihood
virtual BaseFloat LogLikelihood(int32 frame, int32 transition_id)
Returns the log likelihood, which will be negated in the decoder.
Definition: decodable-am-nnet.h:77

kaldi::nnet2::DecodableNnet2OnlineOptions
Definition: online-nnet2-decodable.h:37

kaldi::nnet2::DecodableNnet2Online
This Decodable object for class nnet2::AmNnet takes feature input from class OnlineFeatureInterface, unlike, say, class DecodableAmNnet which takes feature input from a matrix.
Definition: online-nnet2-decodable.h:68

kaldi::VectorBase::Scale
void Scale(Real alpha)
Multiplies all elements by this constant.
Definition: kaldi-vector.cc:963

kaldi::nnet2::DecodableAmNnet::NumFramesReady
virtual int32 NumFramesReady() const
The call NumFramesReady() will return the number of frames currently available for this decodable obj...
Definition: decodable-am-nnet.h:82

kaldi::VectorBase::Sum
Real Sum() const
Returns sum of the elements.
Definition: kaldi-vector.cc:688

kaldi::VectorBase::SetRandn
void SetRandn()
Set vector to random normally-distributed noise.
Definition: kaldi-vector.cc:301

rnnlm::i
int i
Definition: mikolov-rnnlm-lib.cc:66

kaldi::nnet2::UnitTestNnetDecodable
void UnitTestNnetDecodable()
Definition: online-nnet2-decodable-test.cc:31

kaldi::nnet2::DecodableNnet2Online::LogLikelihood
virtual BaseFloat LogLikelihood(int32 frame, int32 index)
Returns the scaled log likelihood.
Definition: online-nnet2-decodable.cc:49

kaldi::Vector
A class representing a vector.
Definition: kaldi-vector.h:406

KALDI_ASSERT
#define KALDI_ASSERT(cond)
Definition: kaldi-error.h:185

kaldi::nnet2::DecodableAmNnet
DecodableAmNnet is a decodable object that decodes with a neural net acoustic model of type AmNnet...
Definition: decodable-am-nnet.h:37

hmm-test-utils.h

kaldi::nnet2
Definition: am-nnet-test.cc:26

kaldi::nnet2::DecodableNnet2OnlineOptions::acoustic_scale
BaseFloat acoustic_scale
Definition: online-nnet2-decodable.h:38

kaldi::nnet2::AmNnet::SetPriors
void SetPriors(const VectorBase< BaseFloat > &priors)
Definition: am-nnet.cc:44

kaldi::nnet2::DecodableNnet2OnlineOptions::max_nnet_batch_size
int32 max_nnet_batch_size
Definition: online-nnet2-decodable.h:40

kaldi::ApproxEqual
static bool ApproxEqual(float a, float b, float relative_tolerance=0.001)
return abs(a - b) <= relative_tolerance * (abs(a)+abs(b)).
Definition: kaldi-math.h:265

kaldi::TransitionModel::NumPdfs
int32 NumPdfs() const
Definition: transition-model.h:190