    producer_waiting_(false),
    consumer_waiting_(false),
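The two flags above belong to ThreadSynchronizer, which coordinates the producer thread (the one supplying waveform or log-likelihoods) with the consumer thread. A minimal illustrative analogue of the "record that you are waiting before you block" idea follows; it is an assumption for explanation only, since Kaldi's actual ThreadSynchronizer is built on a pair of semaphores (producer_semaphore_, consumer_semaphore_).

#include <condition_variable>
#include <mutex>

// Illustrative only, not Kaldi's implementation: the consumer announces that it
// is about to block, so the producer knows a wake-up is needed.
struct MiniSynchronizer {
  std::mutex mu;
  std::condition_variable cv;
  bool consumer_waiting = false;
  bool data_available = false;

  void ConsumerWaitForData() {               // consumer side
    std::unique_lock<std::mutex> lock(mu);
    consumer_waiting = true;
    cv.wait(lock, [this] { return data_available; });
    consumer_waiting = false;
    data_available = false;
  }
  void ProducerAnnounceData() {              // producer side
    std::lock_guard<std::mutex> lock(mu);
    data_available = true;
    if (consumer_waiting) cv.notify_one();   // only wake a consumer that is asleep
  }
};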
    const fst::Fst<fst::StdArc> &fst,
    config_(config), am_nnet_(am_nnet), tmodel_(tmodel), sampling_rate_(0.0),
    num_samples_received_(0), input_finished_(false),
    feature_pipeline_(feature_info),
    num_samples_discarded_(0),
    silence_weighting_(tmodel, feature_info.silence_weighting_config),
    num_frames_decoded_(0), decoder_(fst, config_.decoder_opts),
    abort_(false), error_(false) {
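The initializer list above is from the SingleUtteranceNnet2DecoderThreaded constructor. A usage sketch based on the class's public interface follows; the audio source GetNextChunk and the 16 kHz sample rate are hypothetical, not part of Kaldi.

#include "online2/online-nnet2-decoding-threaded.h"

using namespace kaldi;

bool GetNextChunk(Vector<BaseFloat> *chunk);   // hypothetical audio source, not part of Kaldi

// Hedged usage sketch: feed audio in chunks, signal end of input, wait for the
// background threads to finish, then read the result.
void DecodeOneUtterance(SingleUtteranceNnet2DecoderThreaded *decoder) {
  Vector<BaseFloat> chunk;
  while (GetNextChunk(&chunk))
    decoder->AcceptWaveform(16000.0, chunk);          // sample rate assumed to be 16 kHz
  decoder->InputFinished();                           // no more waveform will arrive
  decoder->Wait();                                    // block until all data is decoded
  decoder->FinalizeDecoding();                        // only legal after Wait()
  CompactLattice clat;
  BaseFloat final_relative_cost;
  decoder->GetLattice(true, &clat, &final_relative_cost);  // end_of_utterance == true
}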
  if (wave_part.Dim() == 0) return;
  KALDI_ERR << "Failure locking mutex: decoding aborted.";
  KALDI_ERR << "Failure locking mutex: decoding aborted.";
  KALDI_ERR << "Failure locking mutex: decoding aborted.";
  KALDI_ERR << "You cannot call Wait() before calling either InputFinished() "
            << "or TerminateDecoding().";
  KALDI_ERR << "It is an error to call FinalizeDecoding before Wait().";
  KALDI_ERR << "It is an error to call GetRemainingWaveform before Wait().";
  int64 num_samples_stored = 0;  // total samples still held in the stored pieces.
  std::vector< Vector<BaseFloat>* > all_pieces;
  std::deque< Vector<BaseFloat>* >::const_iterator iter;
  for (iter = processed_waveform_.begin(); iter != processed_waveform_.end(); ++iter) {
    num_samples_stored += (*iter)->Dim();
    all_pieces.push_back(*iter);
  }
  for (iter = input_waveform_.begin(); iter != input_waveform_.end(); ++iter) {
    num_samples_stored += (*iter)->Dim();
    all_pieces.push_back(*iter);
  }
  int64 samples_shift_per_frame =
      static_cast<int64>(sampling_rate_ * feature_pipeline_.FrameShiftInSeconds());
  // Samples accounted for by decoded frames, minus those already dropped:
  int64 num_samp_discard = samples_shift_per_frame * num_frames_decoded_ -
                           num_samples_discarded_,
        num_samp_keep = num_samples_stored - num_samp_discard;
  KALDI_ASSERT(num_samp_discard <= num_samples_stored && num_samp_keep >= 0);
  waveform->Resize(num_samp_keep, kUndefined);
  int32 offset = 0;  // offset into the output waveform.
  for (size_t i = 0; i < all_pieces.size(); i++) {
    Vector<BaseFloat> *this_piece = all_pieces[i];
    int32 this_dim = this_piece->Dim();
    if (num_samp_discard >= this_dim) {
      num_samp_discard -= this_dim;  // this whole piece is discarded.
    } else {
      int32 this_dim_keep = this_dim - num_samp_discard;
      waveform->Range(offset, this_dim_keep).CopyFromVec(
          this_piece->Range(num_samp_discard, this_dim_keep));
      offset += this_dim_keep;
      num_samp_discard = 0;
    }
  }
  KALDI_ASSERT(offset == num_samp_keep && num_samp_discard == 0);
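The assertion above closes the sample bookkeeping in GetRemainingWaveform(). A worked example with made-up numbers:

// Hypothetical numbers: 16 kHz audio, 10 ms frame shift, 200 frames decoded,
// and 30400 samples already dropped from the stored pieces.
int64 samples_shift_per_frame = static_cast<int64>(16000.0 * 0.010);  // = 160
int64 num_samples_used = samples_shift_per_frame * 200;               // = 32000
int64 num_samp_discard = num_samples_used - 30400;                    // = 1600 samples to skip
// Everything after those 1600 samples, across the stored pieces, is copied out.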
    bool end_of_utterance,
  clat->DeleteStates();
  if (final_relative_cost != NULL)
    *final_relative_cost = decoder_.FinalRelativeCost();
  // when no frames have been decoded yet, a trivial one-state lattice is returned:
  clat->SetFinal(clat->AddState(),
                 CompactLatticeWeight::One());
  KALDI_ERR << "--determinize-lattice=false option is not supported at the moment";
    bool end_of_utterance,
  // when no frames have been decoded yet, a trivial one-state path is returned:
  best_path->DeleteStates();
  best_path->SetFinal(best_path->AddState(),
                      LatticeWeight::One());
  if (final_relative_cost != NULL)
    *final_relative_cost = std::numeric_limits<BaseFloat>::infinity();
  // otherwise the decoder's own final-cost information is reported:
  if (final_relative_cost != NULL)
    *final_relative_cost = decoder_.FinalRelativeCost();
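GetBestPath() mirrors GetLattice() but returns a state-level Lattice, and final_relative_cost is infinity when nothing has been decoded. A hedged sketch of how a caller might interpret it; the 5.0 threshold is illustrative only.

#include <limits>

Lattice best_path;
BaseFloat final_relative_cost;
decoder->GetBestPath(true, &best_path, &final_relative_cost);
if (final_relative_cost == std::numeric_limits<BaseFloat>::infinity()) {
  // Nothing decoded yet: best_path is a trivial one-state FST.
} else if (final_relative_cost > 5.0) {
  // Best path ended far from a final state; treat the hypothesis with caution.
}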
      KALDI_ERR << "Returned abnormally and abort was not called";
  } catch(const std::exception &e) {
    KALDI_WARN << "Caught exception: " << e.what();
      KALDI_ERR << "Returned abnormally and abort was not called";
  } catch(const std::exception &e) {
    KALDI_WARN << "Caught exception: " << e.what();
  KALDI_ERR << "Error encountered during decoding. See above.";
  if (cu_loglikes->NumRows() != 0) {
    int32 num_frames_consumed) {
  num_frames_usable = num_frames_ready - num_frames_consumed;
  // the same quantity is recomputed further down, after more input has arrived:
  num_frames_usable = num_frames_ready - num_frames_consumed;
  int32 samples_shift_per_frame =
      sampling_rate_ * feature_pipeline_.FrameShiftInSeconds();
  bool pad_input = true;
  log_inv_prior.ApplyLog();
  log_inv_prior.Scale(-1.0);
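ApplyLog() followed by Scale(-1.0) turns the prior vector into log(1/prior). A hedged sketch of how that vector converts the nnet's posteriors into scaled pseudo-log-likelihoods; the flooring constant and acoustic_scale value are assumptions, not taken from this file.

// For each pdf s:  log p(x|s) + const  =  log p(s|x) - log p(s)
//                                       =  log p(s|x) + log_inv_prior(s).
CuVector<BaseFloat> log_inv_prior(am_nnet.Priors());
log_inv_prior.ApplyFloor(1.0e-20);          // keep log() finite (floor value assumed)
log_inv_prior.ApplyLog();
log_inv_prior.Scale(-1.0);                  // now holds -log p(s)

BaseFloat acoustic_scale = 0.1;             // assumed value
CuMatrix<BaseFloat> loglikes;               // rows = frames, cols = pdfs
// (assume the nnet has already written posterior probabilities into 'loglikes')
loglikes.ApplyFloor(1.0e-20);
loglikes.ApplyLog();                        // log p(s|x)
loglikes.AddVecToRows(1.0, log_inv_prior);  // subtract the log-priors row-wise
loglikes.Scale(acoustic_scale);             // acoustic scaling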
  int32 num_frames_consumed = 0, num_frames_output = 0;
  bool last_time = false;
  std::vector<std::pair<int32, BaseFloat> > delta_weights;
  num_frames_usable = num_frames_ready - num_frames_consumed;
  int32 num_frames_evaluate = std::min<int32>(num_frames_usable,
                                              config_.nnet_batch_size);  // field name assumed
  if (num_frames_evaluate > 0) {
    for (int32 i = 0; i < num_frames_evaluate; i++) {
      int32 t = num_frames_consumed + i;
  if (feats.NumRows() == 0) {
    computer.Flush(&cu_loglikes);
    cu_feats.Swap(&feats);
    computer.Compute(cu_feats, &cu_loglikes);
    num_frames_consumed += cu_feats.NumRows();
    loglikes.Swap(&cu_loglikes);
  if (num_loglike_frames != 0) {
    num_frames_output += num_loglike_frames;
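The delta_weights vector declared above carries per-frame weight updates from the silence-weighting object to the iVector extractor. A hedged sketch of that hand-off, using the two-argument GetDeltaWeights call; exact signatures and the locking done by the real code are simplified here.

// Sketch (assumed): after the decoder has advanced, down-weight frames that the
// current traceback labels as silence, and feed the changes to the iVector
// estimator inside the feature pipeline.
if (silence_weighting_.Active() && feature_pipeline_.IvectorFeature() != NULL) {
  silence_weighting_.ComputeCurrentTraceback(decoder_);
  silence_weighting_.GetDeltaWeights(feature_pipeline_.NumFramesReady(),
                                     &delta_weights);
  feature_pipeline_.IvectorFeature()->UpdateFrameWeights(delta_weights);
}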
  int32 num_frames_decoded = 0;
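This counter opens RunDecoderSearchInternal(), the consumer-side loop. A hedged sketch of its overall shape; the real loop also takes decoder_mutex_ and limits how many frames it decodes per iteration via the config.

// Sketch (assumed): advance the decoder whenever the decodable object has new
// frames; otherwise report "no progress" so the synchronizer blocks until the
// nnet-evaluation thread produces more log-likelihoods.
decoder_.InitDecoding();
while (true) {
  if (!decodable_synchronizer_.Lock(ThreadSynchronizer::kConsumer))
    return false;                                       // decoding was aborted
  if (decodable_.NumFramesReady() <= num_frames_decoded) {
    if (!decodable_synchronizer_.UnlockFailure(ThreadSynchronizer::kConsumer))
      return false;                                     // next Lock() will wait
  } else {
    decoder_.AdvanceDecoding(&decodable_);
    num_frames_decoded = decoder_.NumFramesDecoded();
    bool done = decodable_.IsLastFrame(num_frames_decoded - 1);
    if (!decodable_synchronizer_.UnlockSuccess(ThreadSynchronizer::kConsumer))
      return false;
    if (done) return true;                              // all input has been decoded
  }
}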