doc/feature-mfcc_8h_source.html

 // feat/feature-mfcc.h

 // Copyright 2009-2011  Karel Vesely;  Petr Motlicek;  Saarland University
 //           2014-2016  Johns Hopkins University (author: Daniel Povey)

 // See ../../COPYING for clarification regarding multiple authors
 //
 // Licensed under the Apache License, Version 2.0 (the "License");
 // you may not use this file except in compliance with the License.
 // You may obtain a copy of the License at
 //
 //  http://www.apache.org/licenses/LICENSE-2.0
 //
 // THIS CODE IS PROVIDED *AS IS* BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY
 // KIND, EITHER EXPRESS OR IMPLIED, INCLUDING WITHOUT LIMITATION ANY IMPLIED
 // WARRANTIES OR CONDITIONS OF TITLE, FITNESS FOR A PARTICULAR PURPOSE,
 // MERCHANTABILITY OR NON-INFRINGEMENT.
 // See the Apache 2 License for the specific language governing permissions and
 // limitations under the License.

 #ifndef KALDI_FEAT_FEATURE_MFCC_H_
 #define KALDI_FEAT_FEATURE_MFCC_H_

 #include <map>
 #include <string>

 #include "feat/feature-common.h"
 #include "feat/feature-functions.h"
 #include "feat/feature-window.h"
 #include "feat/mel-computations.h"

 namespace kaldi {


 // Configuration for MFCC feature computation.  Bundles the frame-extraction
 // and mel-filterbank option groups with the MFCC-specific settings, and knows
 // how to register all of them with an OptionsItf.
 struct MfccOptions {
   // Nested option groups; both are registered from Register() below.
   FrameExtractionOptions frame_opts;
   MelBanksOptions mel_opts;

   // Number of cepstral coefficients, counting the zeroth one (e.g. 13).
   int32 num_ceps;

   // If true, use energy; otherwise C0 is used.
   bool use_energy;

   // Floor on the energy.  0 by default; set to a value like 1.0 or 0.1 if
   // you disable dithering.
   BaseFloat energy_floor;

   // If true, compute energy before preemphasis and windowing.
   bool raw_energy;

   // Scaling factor on cepstra for HTK compatibility.  If 0.0, no liftering
   // is done.
   BaseFloat cepstral_lifter;

   // If true, put energy/C0 last and introduce a factor of sqrt(2) on C0 to
   // be the same as HTK.
   bool htk_compat;

   // Default configuration.  The number of mel banks defaults to 23 for the
   // MFCC computations; this seems to be common for 16khz-sampled data, but
   // for 8khz-sampled data, 15 may be better.
   MfccOptions()
       : mel_opts(23),
         num_ceps(13),
         use_energy(true),
         energy_floor(0.0),
         raw_energy(true),
         cepstral_lifter(22.0),
         htk_compat(false) {
   }

   // Registers every option with `opts`: first the two nested groups, then
   // the MFCC-specific options declared in this struct.
   void Register(OptionsItf *opts) {
     // Nested groups.
     frame_opts.Register(opts);
     mel_opts.Register(opts);

     // MFCC-specific options.
     opts->Register(
         "num-ceps", &num_ceps,
         "Number of cepstra in MFCC computation (including C0)");
     opts->Register(
         "use-energy", &use_energy,
         "Use energy (not C0) in MFCC computation");
     opts->Register(
         "energy-floor", &energy_floor,
         "Floor on energy (absolute, not relative) in MFCC computation. "
         "Only makes a difference if --use-energy=true; only necessary if "
         "--dither=0.0.  Suggested values: 0.1 or 1.0");
     opts->Register(
         "raw-energy", &raw_energy,
         "If true, compute energy before preemphasis and windowing");
     opts->Register(
         "cepstral-lifter", &cepstral_lifter,
         "Constant that controls scaling of MFCCs");
     opts->Register(
         "htk-compat", &htk_compat,
         "If true, put energy or C0 last and use a factor of sqrt(2) on "
         "C0.  Warning: not sufficient to get HTK compatible features "
         "(need to change other parameters).");
   }
 };


 // New-style interface to the MFCC computation.  The class exposes its
 // option type as `Options` and is used as the template argument of
 // OfflineFeatureTpl (see the Mfcc typedef in this file).
 // NOTE(review): the constructor, destructor, Compute() and GetMelBanks()
 // are only declared here; their behaviour must be checked against the
 // implementation file.
 class MfccComputer {
  public:
   typedef MfccOptions Options;

   // Construction, copy-construction and destruction are all user-declared.
   explicit MfccComputer(const MfccOptions &opts);
   MfccComputer(const MfccComputer &other);
   ~MfccComputer();

   // Returns the frame-extraction options held inside the stored MfccOptions.
   const FrameExtractionOptions &GetFrameOptions() const {
     return opts_.frame_opts;
   }

   // Feature dimension: the configured number of cepstral coefficients.
   int32 Dim() const {
     return opts_.num_ceps;
   }

   // True only when energy is used (use_energy) and it is to be computed
   // before preemphasis and windowing (raw_energy).
   bool NeedRawLogEnergy() const {
     if (!opts_.use_energy) return false;
     return opts_.raw_energy;
   }

   // Computes the features for one frame and writes them to `feature`.
   // `signal_frame` is passed as a non-const pointer, so the implementation
   // may modify it.
   // NOTE(review): presumably `signal_raw_log_energy` is only meaningful when
   // NeedRawLogEnergy() is true, `vtln_warp` selects the mel banks via
   // GetMelBanks(), and `feature` has dimension Dim() -- confirm against the
   // implementation.
   void Compute(BaseFloat signal_raw_log_energy,
                BaseFloat vtln_warp,
                VectorBase<BaseFloat> *signal_frame,
                VectorBase<BaseFloat> *feature);

  protected:
   // Returns the MelBanks object to use for the given VTLN warp factor.
   // NOTE(review): presumably looks up / populates mel_banks_ -- confirm.
   const MelBanks *GetMelBanks(BaseFloat vtln_warp);

   MfccOptions opts_;
   Vector<BaseFloat> lifter_coeffs_;
   // Matrix we left-multiply by to perform the DCT.
   Matrix<BaseFloat> dct_matrix_;
   BaseFloat log_energy_floor_;
   // Keyed on the VTLN coefficient.  The mapped values are raw pointers;
   // NOTE(review): ownership is not visible in this header -- presumably
   // released by the destructor, confirm.
   std::map<BaseFloat, MelBanks*> mel_banks_;
   // Raw pointer to the FFT object; NOTE(review): ownership/lifetime is not
   // visible in this header.
   SplitRadixRealFft<BaseFloat> *srfft_;

   // Temporary workspace: mel_energies_ is specific to the frame currently
   // being processed.
   Vector<BaseFloat> mel_energies_;

  private:
   // Assignment is disallowed: declared private here.
   MfccComputer &operator = (const MfccComputer &in);
 };

 // Convenience name for OfflineFeatureTpl instantiated with MfccComputer.
 typedef OfflineFeatureTpl<MfccComputer> Mfcc;


 }  // namespace kaldi


 #endif  // KALDI_FEAT_FEATURE_MFCC_H_
kaldi
This code computes Goodness of Pronunciation (GOP) and extracts phone-level pronunciation feature for...
Definition: chain.dox:20

kaldi::Mfcc
OfflineFeatureTpl< MfccComputer > Mfcc
Definition: feature-mfcc.h:147

feature-functions.h

kaldi::MelBanksOptions::Register
void Register(OptionsItf *opts)
Definition: mel-computations.h:60

kaldi::MfccOptions
MfccOptions contains basic options for computing MFCC features.
Definition: feature-mfcc.h:38

feature-window.h

kaldi::MfccOptions::num_ceps
int32 num_ceps
Definition: feature-mfcc.h:41

kaldi::MfccComputer
Definition: feature-mfcc.h:87

kaldi::int32
kaldi::int32 int32
Definition: online-tcp-source.cc:27

kaldi::Matrix< BaseFloat >

kaldi::MelBanks
Definition: mel-computations.h:78

kaldi::FrameExtractionOptions
Definition: feature-window.h:35

kaldi::OptionsItf::Register
virtual void Register(const std::string &name, bool *ptr, const std::string &doc)=0

kaldi::MfccComputer::mel_energies_
Vector< BaseFloat > mel_energies_
Definition: feature-mfcc.h:144

kaldi::MfccOptions::energy_floor
BaseFloat energy_floor
Definition: feature-mfcc.h:43

kaldi::MfccOptions::cepstral_lifter
BaseFloat cepstral_lifter
Definition: feature-mfcc.h:46

kaldi::MfccComputer::log_energy_floor_
BaseFloat log_energy_floor_
Definition: feature-mfcc.h:138

kaldi::MfccComputer::mel_banks_
std::map< BaseFloat, MelBanks * > mel_banks_
Definition: feature-mfcc.h:139

kaldi::MelBanksOptions
Definition: mel-computations.h:43

kaldi::MfccOptions::mel_opts
MelBanksOptions mel_opts
Definition: feature-mfcc.h:40

kaldi::MfccOptions::use_energy
bool use_energy
Definition: feature-mfcc.h:42

float

kaldi::MfccOptions::frame_opts
FrameExtractionOptions frame_opts
Definition: feature-mfcc.h:39

kaldi::MfccComputer::dct_matrix_
Matrix< BaseFloat > dct_matrix_
Definition: feature-mfcc.h:137

kaldi::MfccOptions::htk_compat
bool htk_compat
Definition: feature-mfcc.h:48

kaldi::MfccComputer::GetFrameOptions
const FrameExtractionOptions & GetFrameOptions() const
Definition: feature-mfcc.h:93

kaldi::FrameExtractionOptions::Register
void Register(OptionsItf *opts)
Definition: feature-window.h:69

kaldi::MfccOptions::raw_energy
bool raw_energy
Definition: feature-mfcc.h:45

kaldi::OptionsItf
Definition: options-itf.h:26

kaldi::SplitRadixRealFft
Definition: srfft.h:105

kaldi::MfccComputer::opts_
MfccOptions opts_
Definition: feature-mfcc.h:135

kaldi::MfccComputer::Options
MfccOptions Options
Definition: feature-mfcc.h:89

kaldi::Vector
A class representing a vector.
Definition: kaldi-vector.h:406

kaldi::MfccComputer::lifter_coeffs_
Vector< BaseFloat > lifter_coeffs_
Definition: feature-mfcc.h:136

kaldi::MfccComputer::NeedRawLogEnergy
bool NeedRawLogEnergy() const
Definition: feature-mfcc.h:99

kaldi::MfccOptions::Register
void Register(OptionsItf *opts)
Definition: feature-mfcc.h:62

kaldi::OfflineFeatureTpl
This templated class is intended for offline feature extraction, i.e.
Definition: feature-common.h:111

kaldi::VectorBase
Provides a vector abstraction class.
Definition: kaldi-vector.h:41

mel-computations.h

feature-common.h

kaldi::MfccComputer::srfft_
SplitRadixRealFft< BaseFloat > * srfft_
Definition: feature-mfcc.h:140

kaldi::MfccOptions::MfccOptions
MfccOptions()
Definition: feature-mfcc.h:51

kaldi::MfccComputer::Dim
int32 Dim() const
Definition: feature-mfcc.h:97