doc/decodable-matrix_8h_source.html

 // decoder/decodable-matrix.h

 // Copyright 2009-2011  Microsoft Corporation
 //                2013  Johns Hopkins University (author: Daniel Povey)

 // See ../../COPYING for clarification regarding multiple authors
 //
 // Licensed under the Apache License, Version 2.0 (the "License");
 // you may not use this file except in compliance with the License.
 // You may obtain a copy of the License at
 //
 //  http://www.apache.org/licenses/LICENSE-2.0
 //
 // THIS CODE IS PROVIDED *AS IS* BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY
 // KIND, EITHER EXPRESS OR IMPLIED, INCLUDING WITHOUT LIMITATION ANY IMPLIED
 // WARRANTIES OR CONDITIONS OF TITLE, FITNESS FOR A PARTICULAR PURPOSE,
 // MERCHANTABLITY OR NON-INFRINGEMENT.
 // See the Apache 2 License for the specific language governing permissions and
 // limitations under the License.

 #ifndef KALDI_DECODER_DECODABLE_MATRIX_H_
 #define KALDI_DECODER_DECODABLE_MATRIX_H_

 #include <cstddef>
 #include <vector>

 #include "base/kaldi-common.h"
 #include "hmm/transition-model.h"
 #include "itf/decodable-itf.h"
 #include "matrix/kaldi-matrix.h"

 namespace kaldi {


 class DecodableMatrixScaledMapped: public DecodableInterface {
  public:
   // This constructor creates an object that will not delete "likes" when done.
   DecodableMatrixScaledMapped(const TransitionModel &tm,
                               const Matrix<BaseFloat> &likes,
                               BaseFloat scale): trans_model_(tm), likes_(&likes),
                                                 scale_(scale), delete_likes_(false) {
     if (likes.NumCols() != tm.NumPdfs())
       KALDI_ERR << "DecodableMatrixScaledMapped: mismatch, matrix has "
                 << likes.NumCols() << " cols but transition-model has "
                 << tm.NumPdfs() << " pdf-ids.";
   }

   // This constructor creates an object that will delete "likes"
   // when done.
   DecodableMatrixScaledMapped(const TransitionModel &tm,
                               BaseFloat scale,
                               const Matrix<BaseFloat> *likes):
       trans_model_(tm), likes_(likes),
       scale_(scale), delete_likes_(true) {
     if (likes->NumCols() != tm.NumPdfs())
       KALDI_ERR << "DecodableMatrixScaledMapped: mismatch, matrix has "
                 << likes->NumCols() << " cols but transition-model has "
                 << tm.NumPdfs() << " pdf-ids.";
   }

   virtual int32 NumFramesReady() const { return likes_->NumRows(); }

   virtual bool IsLastFrame(int32 frame) const {
     KALDI_ASSERT(frame < NumFramesReady());
     return (frame == NumFramesReady() - 1);
   }

   // Note, frames are numbered from zero.
   virtual BaseFloat LogLikelihood(int32 frame, int32 tid) {
     return scale_ * (*likes_)(frame, trans_model_.TransitionIdToPdfFast(tid));
   }

   // Indices are one-based!  This is for compatibility with OpenFst.
   virtual int32 NumIndices() const { return trans_model_.NumTransitionIds(); }

   virtual ~DecodableMatrixScaledMapped() {
     if (delete_likes_) delete likes_;
   }
  private:
   const TransitionModel &trans_model_;  // for tid to pdf mapping
   const Matrix<BaseFloat> *likes_;
   BaseFloat scale_;
   bool delete_likes_;
   KALDI_DISALLOW_COPY_AND_ASSIGN(DecodableMatrixScaledMapped);
 };

 // Decodable object that reads log-likelihoods from a matrix, mapping
 // transition-ids to pdf-ids through the transition model.  It is like
 // DecodableMatrixScaledMapped, but it doesn't support an acoustic scale, and
 // it does support a frame offset, whereby row 0 of 'likes' can stand for a
 // later frame.  The member functions are only declared here; their
 // definitions are not in this header.
 class DecodableMatrixMapped: public DecodableInterface {
  public:
   // This constructor creates an object that will not delete "likes" when done.
   // 'frame_offset' is the frame that row 0 of 'likes' corresponds to; it would
   // be greater than zero if this is not the first chunk of likelihoods.
   DecodableMatrixMapped(const TransitionModel &tm,
                         const MatrixBase<BaseFloat> &likes,
                         int32 frame_offset = 0);

   // This constructor creates an object that will delete "likes"
   // when done.  'frame_offset' has the same meaning as in the constructor
   // above.
   DecodableMatrixMapped(const TransitionModel &tm,
                         const Matrix<BaseFloat> *likes,
                         int32 frame_offset = 0);

   // Number of frames currently available.
   // NOTE(review): presumably this counts the frames before 'frame_offset'
   // too; confirm against the definition.
   virtual int32 NumFramesReady() const;

   // Returns true if 'frame' is the last frame.
   virtual bool IsLastFrame(int32 frame) const;

   // Returns the log-likelihood for the given frame and transition-id 'tid'.
   virtual BaseFloat LogLikelihood(int32 frame, int32 tid);

   // Note: these indices are 1-based.
   virtual int32 NumIndices() const;

   virtual ~DecodableMatrixMapped();

  private:
   const TransitionModel &trans_model_;  // for tid to pdf mapping
   const MatrixBase<BaseFloat> *likes_;  // the log-likelihood matrix
   // NOTE(review): presumably set only by the owning constructor and deleted
   // in the destructor; confirm against the definitions.
   const Matrix<BaseFloat> *likes_to_delete_;
   int32 frame_offset_;  // frame that row 0 of 'likes_' corresponds to

   // raw_data_ and stride_ are a kind of fast look-aside for 'likes_', to be
   // used when KALDI_PARANOID is false.
   const BaseFloat *raw_data_;
   int32 stride_;

   KALDI_DISALLOW_COPY_AND_ASSIGN(DecodableMatrixMapped);
 };


 class DecodableMatrixMappedOffset: public DecodableInterface {
  public:
   DecodableMatrixMappedOffset(const TransitionModel &tm):
       trans_model_(tm), frame_offset_(0), input_is_finished_(false) { }

   // this is not part of the generic Decodable interface.
   int32 FirstAvailableFrame() const { return frame_offset_; }

   // Logically, this function appends 'loglikes' (interpreted as newly available
   // frames) to the log-likelihoods stored in the class.
   //
   // This function is destructive of the input "loglikes" because it may
   // under some circumstances do a shallow copy using Swap().  This function
   // appends loglikes to any existing likelihoods you've previously supplied.
   void AcceptLoglikes(Matrix<BaseFloat> *loglikes,
                       int32 frames_to_discard);

   void InputIsFinished() { input_is_finished_ = true; }

   virtual int32 NumFramesReady() const {
     return loglikes_.NumRows() + frame_offset_;
   }

   virtual bool IsLastFrame(int32 frame) const {
     KALDI_ASSERT(frame < NumFramesReady());
     return (frame == NumFramesReady() - 1 && input_is_finished_);
   }

   virtual BaseFloat LogLikelihood(int32 frame, int32 tid) {
     int32 pdf_id = trans_model_.TransitionIdToPdfFast(tid);
 #ifdef KALDI_PARANOID
     return loglikes_(frame - frame_offset_, pdf_id);
 #else
     // This does no checking, so will be faster.
     return raw_data_[frame * stride_ + pdf_id];
 #endif
   }

   virtual int32 NumIndices() const { return trans_model_.NumTransitionIds(); }

   // nothing special to do in destructor.
   virtual ~DecodableMatrixMappedOffset() { }
  private:
   const TransitionModel &trans_model_;  // for tid to pdf mapping
   Matrix<BaseFloat> loglikes_;
   int32 frame_offset_;
   bool input_is_finished_;

   // 'raw_data_' and 'stride_' are intended as a fast look-aside which is an
   // alternative to accessing data_.  raw_data_ is a faked version of
   // data_->Data() as if it started from frame zero rather than frame_offset_.
   // This simplifies the code of LogLikelihood(), in cases where KALDI_PARANOID
   // is not defined.
   BaseFloat *raw_data_;
   int32 stride_;

   KALDI_DISALLOW_COPY_AND_ASSIGN(DecodableMatrixMappedOffset);
 };


 class DecodableMatrixScaled: public DecodableInterface {
  public:
   DecodableMatrixScaled(const Matrix<BaseFloat> &likes,
                         BaseFloat scale):
     likes_(likes), scale_(scale) { }

   virtual int32 NumFramesReady() const { return likes_.NumRows(); }

   virtual bool IsLastFrame(int32 frame) const {
     KALDI_ASSERT(frame < NumFramesReady());
     return (frame == NumFramesReady() - 1);
   }

   // Note, frames are numbered from zero.
   virtual BaseFloat LogLikelihood(int32 frame, int32 index) {
     if (index > likes_.NumCols() || index <= 0 ||
         frame < 0 || frame >= likes_.NumRows())
       KALDI_ERR << "Invalid (frame, index - 1) = ("
                 << frame << ", " << index - 1 << ") for matrix of size "
                 << likes_.NumRows() << " x " << likes_.NumCols();
     return scale_ * likes_(frame, index - 1);
   }

   // Indices are one-based!  This is for compatibility with OpenFst.
   virtual int32 NumIndices() const { return likes_.NumCols(); }

  private:
   const Matrix<BaseFloat> &likes_;
   BaseFloat scale_;
   KALDI_DISALLOW_COPY_AND_ASSIGN(DecodableMatrixScaled);
 };
 }  // namespace kaldi

 #endif  // KALDI_DECODER_DECODABLE_MATRIX_H_
kaldi::DecodableMatrixMapped::trans_model_
const TransitionModel & trans_model_
Definition: decodable-matrix.h:125

kaldi
This code computes Goodness of Pronunciation (GOP) and extracts phone-level pronunciation feature for...
Definition: chain.dox:20

kaldi::DecodableMatrixMappedOffset::NumFramesReady
virtual int32 NumFramesReady() const
The call NumFramesReady() will return the number of frames currently available for this decodable obj...
Definition: decodable-matrix.h:171

kaldi::DecodableMatrixScaledMapped::NumFramesReady
virtual int32 NumFramesReady() const
The call NumFramesReady() will return the number of frames currently available for this decodable obj...
Definition: decodable-matrix.h:60

kaldi::DecodableMatrixScaled::LogLikelihood
virtual BaseFloat LogLikelihood(int32 frame, int32 index)
Returns the log likelihood, which will be negated in the decoder.
Definition: decodable-matrix.h:226

kaldi::DecodableMatrixScaledMapped::KALDI_DISALLOW_COPY_AND_ASSIGN
KALDI_DISALLOW_COPY_AND_ASSIGN(DecodableMatrixScaledMapped)

kaldi::DecodableInterface
DecodableInterface provides a link between the (acoustic-modeling and feature-processing) code and th...
Definition: decodable-itf.h:82

kaldi::DecodableMatrixMappedOffset::NumIndices
virtual int32 NumIndices() const
Returns the number of states in the acoustic model (they will be indexed one-based, i.e.
Definition: decodable-matrix.h:190

kaldi::DecodableMatrixScaled::DecodableMatrixScaled
DecodableMatrixScaled(const Matrix< BaseFloat > &likes, BaseFloat scale)
Definition: decodable-matrix.h:214

kaldi::DecodableMatrixScaledMapped::trans_model_
const TransitionModel & trans_model_
Definition: decodable-matrix.h:79

kaldi::MatrixBase::NumCols
MatrixIndexT NumCols() const
Returns number of columns (or zero for empty matrix).
Definition: kaldi-matrix.h:67

kaldi::DecodableMatrixMappedOffset::InputIsFinished
void InputIsFinished()
Definition: decodable-matrix.h:169

kaldi::TransitionModel::TransitionIdToPdfFast
int32 TransitionIdToPdfFast(int32 trans_id) const
Definition: transition-model.h:334

kaldi::MatrixBase
Base class which provides matrix operations not involving resizing or allocation. ...
Definition: kaldi-matrix.h:49

kaldi::DecodableMatrixMapped::frame_offset_
int32 frame_offset_
Definition: decodable-matrix.h:128

kaldi-matrix.h

kaldi::DecodableMatrixMappedOffset::~DecodableMatrixMappedOffset
virtual ~DecodableMatrixMappedOffset()
Definition: decodable-matrix.h:193

kaldi::DecodableMatrixMapped::raw_data_
const BaseFloat * raw_data_
Definition: decodable-matrix.h:132

kaldi::DecodableMatrixScaledMapped::~DecodableMatrixScaledMapped
virtual ~DecodableMatrixScaledMapped()
Definition: decodable-matrix.h:75

kaldi::int32
kaldi::int32 int32
Definition: online-tcp-source.cc:27

kaldi::Matrix< BaseFloat >

kaldi::DecodableMatrixMapped::likes_to_delete_
const Matrix< BaseFloat > * likes_to_delete_
Definition: decodable-matrix.h:127

kaldi::DecodableMatrixScaled::IsLastFrame
virtual bool IsLastFrame(int32 frame) const
Returns true if this is the last frame.
Definition: decodable-matrix.h:220

kaldi::DecodableMatrixMappedOffset::raw_data_
BaseFloat * raw_data_
Definition: decodable-matrix.h:205

kaldi::DecodableMatrixMappedOffset
This decodable class returns log-likes stored in a matrix; it supports repeatedly writing to the matr...
Definition: decodable-matrix.h:152

kaldi::TransitionModel
Definition: transition-model.h:123

kaldi::DecodableMatrixMappedOffset::input_is_finished_
bool input_is_finished_
Definition: decodable-matrix.h:198

kaldi::DecodableMatrixScaledMapped::scale_
BaseFloat scale_
Definition: decodable-matrix.h:81

kaldi::DecodableMatrixMappedOffset::frame_offset_
int32 frame_offset_
Definition: decodable-matrix.h:197

kaldi::DecodableMatrixScaledMapped::DecodableMatrixScaledMapped
DecodableMatrixScaledMapped(const TransitionModel &tm, BaseFloat scale, const Matrix< BaseFloat > *likes)
Definition: decodable-matrix.h:49

kaldi::DecodableMatrixScaledMapped::DecodableMatrixScaledMapped
DecodableMatrixScaledMapped(const TransitionModel &tm, const Matrix< BaseFloat > &likes, BaseFloat scale)
Definition: decodable-matrix.h:37

float

transition-model.h

kaldi::TransitionModel::NumTransitionIds
int32 NumTransitionIds() const
Returns the total number of transition-ids (note, these are one-based).
Definition: transition-model.h:175

kaldi::DecodableMatrixScaledMapped::delete_likes_
bool delete_likes_
Definition: decodable-matrix.h:82

kaldi::DecodableMatrixScaled::scale_
BaseFloat scale_
Definition: decodable-matrix.h:240

kaldi::DecodableMatrixScaled::likes_
const Matrix< BaseFloat > & likes_
Definition: decodable-matrix.h:239

kaldi::DecodableMatrixMapped::stride_
int32 stride_
Definition: decodable-matrix.h:133

KALDI_ERR
#define KALDI_ERR
Definition: kaldi-error.h:147

kaldi::DecodableMatrixMappedOffset::FirstAvailableFrame
int32 FirstAvailableFrame() const
Definition: decodable-matrix.h:158

kaldi::DecodableMatrixScaled::NumIndices
virtual int32 NumIndices() const
Returns the number of states in the acoustic model (they will be indexed one-based, i.e.
Definition: decodable-matrix.h:236

decodable-itf.h

kaldi::DecodableMatrixScaledMapped::IsLastFrame
virtual bool IsLastFrame(int32 frame) const
Returns true if this is the last frame.
Definition: decodable-matrix.h:62

kaldi::DecodableMatrixScaledMapped::LogLikelihood
virtual BaseFloat LogLikelihood(int32 frame, int32 tid)
Returns the log likelihood, which will be negated in the decoder.
Definition: decodable-matrix.h:68

kaldi::DecodableMatrixScaledMapped::likes_
const Matrix< BaseFloat > * likes_
Definition: decodable-matrix.h:80

kaldi::DecodableMatrixScaled
Definition: decodable-matrix.h:212

KALDI_ASSERT
#define KALDI_ASSERT(cond)
Definition: kaldi-error.h:185

kaldi::MatrixBase::NumRows
MatrixIndexT NumRows() const
Returns number of rows (or zero for empty matrix).
Definition: kaldi-matrix.h:64

kaldi::DecodableMatrixMapped::likes_
const MatrixBase< BaseFloat > * likes_
Definition: decodable-matrix.h:126

kaldi::DecodableMatrixMappedOffset::IsLastFrame
virtual bool IsLastFrame(int32 frame) const
Returns true if this is the last frame.
Definition: decodable-matrix.h:175

kaldi::DecodableMatrixMappedOffset::trans_model_
const TransitionModel & trans_model_
Definition: decodable-matrix.h:195

kaldi::DecodableMatrixMapped
This is like DecodableMatrixScaledMapped, but it doesn't support an acoustic scale, and it does support a frame offset, whereby you can state that the first row of 'likes' is actually the n'th row of the matrix of available log-likelihoods.
Definition: decodable-matrix.h:98

kaldi::DecodableMatrixScaledMapped
Definition: decodable-matrix.h:34

kaldi::DecodableMatrixMappedOffset::DecodableMatrixMappedOffset
DecodableMatrixMappedOffset(const TransitionModel &tm)
Definition: decodable-matrix.h:154

kaldi::DecodableMatrixScaled::NumFramesReady
virtual int32 NumFramesReady() const
The call NumFramesReady() will return the number of frames currently available for this decodable obj...
Definition: decodable-matrix.h:218

kaldi-common.h

kaldi::DecodableMatrixMappedOffset::LogLikelihood
virtual BaseFloat LogLikelihood(int32 frame, int32 tid)
Returns the log likelihood, which will be negated in the decoder.
Definition: decodable-matrix.h:180

kaldi::TransitionModel::NumPdfs
int32 NumPdfs() const
Definition: transition-model.h:190

kaldi::DecodableMatrixScaledMapped::NumIndices
virtual int32 NumIndices() const
Returns the number of states in the acoustic model (they will be indexed one-based, i.e.
Definition: decodable-matrix.h:73

kaldi::DecodableMatrixMappedOffset::loglikes_
Matrix< BaseFloat > loglikes_
Definition: decodable-matrix.h:196

kaldi::DecodableMatrixMappedOffset::stride_
int32 stride_
Definition: decodable-matrix.h:206