22 #ifndef KALDI_TRANSFORM_DECODABLE_AM_DIAG_GMM_REGTREE_H_ 23 #define KALDI_TRANSFORM_DECODABLE_AM_DIAG_GMM_REGTREE_H_ 141 #endif // KALDI_TRANSFORM_DECODABLE_AM_DIAG_GMM_REGTREE_H_
This code computes Goodness of Pronunciation (GOP) and extracts phone-level pronunciation feature for...
KALDI_DISALLOW_COPY_AND_ASSIGN(DecodableAmDiagGmmRegtreeFmllr)
DecodableAmDiagGmmUnmapped is a decodable object that takes indices that correspond to pdf-id's plus ...
std::vector< Vector< BaseFloat > > xformed_data_
An MLLR mean transformation is an affine transformation of Gaussian means.
virtual int32 NumIndices() const
Returns the number of states in the acoustic model (they will be indexed one-based, i.e. from 1 to NumIndices(); this is for compatibility with OpenFst).
int32 TransitionIdToPdfFast(int32 trans_id) const
virtual BaseFloat LogLikelihood(int32 frame, int32 tid)
Returns the log likelihood, which will be negated in the decoder.
Vector< BaseFloat > logdets_
const RegressionTree & regtree_
Vector< BaseFloat > data_squared_
Cache for fast likelihood calculation.
const TransitionModel & trans_model_
std::vector< Vector< BaseFloat > *> xformed_gconsts_
Cache of transformed gconsts for each state.
const TransitionModel * TransModel()
const RegtreeFmllrDiagGmm & fmllr_xform_
An FMLLR (feature-space MLLR) transformation, also called CMLLR (constrained MLLR) is an affine trans...
Vector< BaseFloat > data_squared_
Cached for fast likelihood calculation.
DecodableAmDiagGmmRegtreeFmllr(const AmDiagGmm &am, const TransitionModel &tm, const Matrix< BaseFloat > &feats, const RegtreeFmllrDiagGmm &fmllr_xform, const RegressionTree &regtree, BaseFloat scale, BaseFloat log_sum_exp_prune=-1.0)
int32 NumTransitionIds() const
Returns the total number of transition-ids (note, these are one-based).
std::vector< Vector< BaseFloat > > xformed_data_squared_
virtual int32 NumIndices() const
Returns the number of states in the acoustic model (they will be indexed one-based, i.e. from 1 to NumIndices(); this is for compatibility with OpenFst).
A regression tree is a clustering of Gaussian densities in an acoustic model, such that the group of ...
std::vector< Matrix< BaseFloat > *> xformed_mean_invvars_
Cache of transformed means times inverse variances for each state.
const RegtreeMllrDiagGmm & mllr_xform_
virtual BaseFloat LogLikelihood(int32 frame, int32 tid)
Returns the log likelihood, which will be negated in the decoder.
const Matrix< BaseFloat > & feature_matrix_
virtual int32 NumFramesReady() const
The call NumFramesReady() will return the number of frames currently available for this decodable obj...
const TransitionModel * TransModel()
A class representing a vector.
MatrixIndexT NumRows() const
Returns number of rows (or zero for empty matrix).
DecodableAmDiagGmmRegtreeMllr(const AmDiagGmm &am, const TransitionModel &tm, const Matrix< BaseFloat > &feats, const RegtreeMllrDiagGmm &mllr_xform, const RegressionTree &regtree, BaseFloat scale, BaseFloat log_sum_exp_prune=-1.0)
virtual int32 NumFramesReady() const
The call NumFramesReady() will return the number of frames currently available for this decodable obj...
virtual BaseFloat LogLikelihoodZeroBased(int32 frame, int32 state_index)
const RegressionTree & regtree_
std::vector< bool > is_cached_
Boolean variable per state to indicate whether the transformed means for that state are cached...
const TransitionModel & trans_model_