shrink-nnet.cc
// nnet2/shrink-nnet.cc

// Copyright 2012 Johns Hopkins University (author: Daniel Povey)

// See ../../COPYING for clarification regarding multiple authors
//
// Licensed under the Apache License, Version 2.0 (the "License");
// you may not use this file except in compliance with the License.
// You may obtain a copy of the License at
//
//  http://www.apache.org/licenses/LICENSE-2.0
//
// THIS CODE IS PROVIDED *AS IS* BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY
// KIND, EITHER EXPRESS OR IMPLIED, INCLUDING WITHOUT LIMITATION ANY IMPLIED
// WARRANTIES OR CONDITIONS OF TITLE, FITNESS FOR A PARTICULAR PURPOSE,
// MERCHANTABLITY OR NON-INFRINGEMENT.
// See the Apache 2 License for the specific language governing permissions and
// limitations under the License.

#include "nnet2/shrink-nnet.h"

namespace kaldi {
namespace nnet2 {

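// Computes the objective function of "nnet" on the validation set, per frame,
// after scaling each updatable component i by exp(log_scale_params(i)); also
// writes to "gradient" the derivative of that objective w.r.t. each of the
// log scale factors.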
static BaseFloat ComputeObjfAndGradient(
    const std::vector<NnetExample> &validation_set,
    const Vector<double> &log_scale_params,
    const Nnet &nnet,
    Vector<double> *gradient) {
  Vector<BaseFloat> scale_params(log_scale_params);
  scale_params.ApplyExp();
  Nnet nnet_scaled(nnet);
  nnet_scaled.ScaleComponents(scale_params);

  Nnet nnet_gradient(nnet);
  bool is_gradient = true;
  nnet_gradient.SetZero(is_gradient);

  // note: "ans" is normalized by the total weight of validation frames.
  int32 batch_size = 1024;
  BaseFloat ans = ComputeNnetGradient(nnet_scaled,
                                      validation_set,
                                      batch_size,
                                      &nnet_gradient);

  BaseFloat tot_count = validation_set.size();
  int32 i = 0;  // index into log_scale_params.
  for (int32 j = 0; j < nnet_scaled.NumComponents(); j++) {
    const UpdatableComponent *uc =
        dynamic_cast<const UpdatableComponent*>(&(nnet.GetComponent(j))),
        *uc_gradient =
        dynamic_cast<const UpdatableComponent*>(&(nnet_gradient.GetComponent(j)));
    if (uc != NULL) {
      BaseFloat dotprod = uc->DotProduct(*uc_gradient) / tot_count;
      (*gradient)(i) = dotprod * scale_params(i);  // gradient w.r.t. log of scaling factor.
      // We multiply by scale_params(i) to take into account d/dx exp(x); "gradient"
      // is the gradient w.r.t. the log of the scale_params.
      i++;
    }
  }
  KALDI_ASSERT(i == log_scale_params.Dim());
  return ans;
}

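// "Shrinks" *nnet by scaling the parameters of each updatable component; the
// per-component scale factors are optimized in the log domain with (L-)BFGS
// to maximize the objective function on the validation set.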
void ShrinkNnet(const NnetShrinkConfig &shrink_config,
                const std::vector<NnetExample> &validation_set,
                Nnet *nnet) {

  int32 dim = nnet->NumUpdatableComponents();
  KALDI_ASSERT(dim > 0);
  Vector<double> log_scale(dim), gradient(dim);  // will be zero.

  // Get initial gradient.
  double objf, initial_objf;

  LbfgsOptions lbfgs_options;
  lbfgs_options.minimize = false;  // We're maximizing.
  lbfgs_options.m = dim;  // Store the same number of vectors as the dimension
                          // itself, so this is BFGS.
  lbfgs_options.first_step_length = shrink_config.initial_step;

  OptimizeLbfgs<double> lbfgs(log_scale,
                              lbfgs_options);

  for (int32 i = 0; i < shrink_config.num_bfgs_iters; i++) {
    log_scale.CopyFromVec(lbfgs.GetProposedValue());
    objf = ComputeObjfAndGradient(validation_set, log_scale,
                                  *nnet,
                                  &gradient);

    KALDI_VLOG(2) << "log-scale = " << log_scale << ", objf = " << objf
                  << ", gradient = " << gradient;
    if (i == 0) initial_objf = objf;

    lbfgs.DoStep(objf, gradient);
  }

  log_scale.CopyFromVec(lbfgs.GetValue(&objf));

  Vector<BaseFloat> scale(log_scale);
  scale.ApplyExp();
  KALDI_LOG << "Shrinking nnet, validation objf per frame changed from "
            << initial_objf << " to " << objf << ", scale factors per layer are "
            << scale;
  nnet->ScaleComponents(scale);
}


} // namespace nnet2
} // namespace kaldi
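For orientation, here is a minimal sketch of how ShrinkNnet might be driven. The helper ShrinkFromExamples is hypothetical (not part of Kaldi), and the sketch assumes the SequentialNnetExampleReader typedef from nnet2/nnet-example.h; only NnetShrinkConfig and ShrinkNnet themselves come from shrink-nnet.h.

// Sketch only: ShrinkFromExamples is a hypothetical helper, not part of this
// file or of Kaldi; SequentialNnetExampleReader is assumed to be available
// from nnet2/nnet-example.h.
#include <string>
#include <vector>
#include "nnet2/nnet-example.h"
#include "nnet2/shrink-nnet.h"

void ShrinkFromExamples(const std::string &valid_examples_rspecifier,
                        kaldi::nnet2::Nnet *nnet) {
  using namespace kaldi;
  using namespace kaldi::nnet2;

  // ShrinkNnet re-evaluates the validation objective on every BFGS step, so
  // the held-out examples are read into memory once up front.
  std::vector<NnetExample> validation_set;
  SequentialNnetExampleReader example_reader(valid_examples_rspecifier);
  for (; !example_reader.Done(); example_reader.Next())
    validation_set.push_back(example_reader.Value());

  // Default options (number of BFGS iterations, initial step length); see
  // NnetShrinkConfig in shrink-nnet.h for the actual fields and defaults.
  NnetShrinkConfig shrink_config;
  ShrinkNnet(shrink_config, validation_set, nnet);
}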