doc/combine-nnet_8cc_source.html

 // nnet2/combine-nnet.cc

 // Copyright 2012   Johns Hopkins University (author: Daniel Povey)

 // See ../../COPYING for clarification regarding multiple authors
 //
 // Licensed under the Apache License, Version 2.0 (the "License");
 // you may not use this file except in compliance with the License.
 // You may obtain a copy of the License at
 //
 //  http://www.apache.org/licenses/LICENSE-2.0
 //
 // THIS CODE IS PROVIDED *AS IS* BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY
 // KIND, EITHER EXPRESS OR IMPLIED, INCLUDING WITHOUT LIMITATION ANY IMPLIED
 // WARRANTIES OR CONDITIONS OF TITLE, FITNESS FOR A PARTICULAR PURPOSE,
 // MERCHANTABLITY OR NON-INFRINGEMENT.
 // See the Apache 2 License for the specific language governing permissions and
 // limitations under the License.

 #include "nnet2/combine-nnet.h"

 namespace kaldi {
 namespace nnet2 {


 // Forms a weighted combination of the networks in "nnets" and writes it to
 // "dest".
 //
 // "scale_params" is in blocks of nnets[0].NumUpdatableComponents() elements,
 // one block per source network, with the first block corresponding to
 // nnets[0].  "dest" starts out as a copy of nnets[0] scaled by block 0; each
 // remaining network nnets[n] is then added in through Nnet::AddNnet() using
 // block n as its scales.
 //
 // Requires that "nnets" is non-empty, that nnets[0] has at least one
 // updatable component, and that "scale_params" has exactly
 // nnets.size() * NumUpdatableComponents() elements.
 static void CombineNnets(const Vector<BaseFloat> &scale_params,
                          const std::vector<Nnet> &nnets,
                          Nnet *dest) {
   int32 num_nnets = nnets.size();
   KALDI_ASSERT(num_nnets >= 1);
   int32 num_uc = nnets[0].NumUpdatableComponents();
   KALDI_ASSERT(num_uc >= 1);
   // Only the first num_nnets * num_uc elements are ever read below, so a
   // vector that is too long would otherwise be accepted without complaint.
   KALDI_ASSERT(scale_params.Dim() == num_nnets * num_uc);

   *dest = nnets[0];
   SubVector<BaseFloat> scale_params0(scale_params, 0, num_uc);
   dest->ScaleComponents(scale_params0);
   for (int32 n = 1; n < num_nnets; n++) {
     SubVector<BaseFloat> scale_params_n(scale_params, n * num_uc, num_uc);
     dest->AddNnet(scale_params_n, nnets[n]);
   }
 }

 // Decides which model the optimization should start from.
 //
 // Evaluates every network in "nnets" on "validation_set" (objective divided
 // by validation_set.size()) and also evaluates the network obtained by
 // giving all source networks the same weight 1/num_nnets.
 //
 // Returns the index (0 <= index < nnets.size()) of the single network with
 // the highest objective, or nnets.size() if the equally-weighted average has
 // a strictly higher objective than that network.
 static int32 GetInitialModel(
     const std::vector<NnetExample> &validation_set,
     const std::vector<Nnet> &nnets) {
   KALDI_ASSERT(!nnets.empty());
   const int32 minibatch_size = 1024;
   const int32 num_nnets = static_cast<int32>(nnets.size());
   const BaseFloat tot_frames = validation_set.size();

   // Score each source network on its own, remembering the best one.
   Vector<BaseFloat> objfs(nnets.size());
   BaseFloat best_objf = -std::numeric_limits<BaseFloat>::infinity();
   int32 best_n = -1;
   for (int32 n = 0; n < num_nnets; n++) {
     const BaseFloat this_objf =
         ComputeNnetObjf(nnets[n], validation_set, minibatch_size) / tot_frames;
     objfs(n) = this_objf;
     if (n == 0 || this_objf > best_objf) {
       best_n = n;
       best_objf = this_objf;
     }
   }
   KALDI_LOG << "Objective functions for the source neural nets are " << objfs;

   // Now score the combination in which every network has the same weight.
   const int32 num_uc = nnets[0].NumUpdatableComponents();
   Vector<BaseFloat> equal_scales(num_uc * num_nnets);
   equal_scales.Set(1.0 / num_nnets);
   Nnet average_nnet;
   CombineNnets(equal_scales, nnets, &average_nnet);
   const BaseFloat average_objf =
       ComputeNnetObjf(average_nnet, validation_set, minibatch_size) / tot_frames;
   KALDI_LOG << "Objf with all neural nets averaged is " << average_objf;

   // num_nnets is the code for "use the average".
   return (average_objf > best_objf) ? num_nnets : best_n;
 }

 // This function chooses from among the neural nets, the one
 // which has the best validation set objective function.
 static void GetInitialScaleParams(
     const NnetCombineConfig &combine_config,
     const std::vector<NnetExample> &validation_set,
     const std::vector<Nnet> &nnets,
     Vector<double> *scale_params) {

   int32 initial_model = combine_config.initial_model,
       num_nnets = static_cast<int32>(nnets.size());
   if (initial_model < 0 || initial_model > num_nnets)
     initial_model = GetInitialModel(validation_set, nnets);

   KALDI_ASSERT(initial_model >= 0 && initial_model <= num_nnets);
   int32 num_uc = nnets[0].NumUpdatableComponents();

   scale_params->Resize(num_uc * num_nnets);
   if (initial_model < num_nnets) {
     KALDI_LOG << "Initializing with neural net with index " << initial_model;
     // At this point we're using the best of the individual neural nets.
     scale_params->Set(0.0);

     // Set the block of parameters corresponding to the "best" of the
     // source neural nets to
     SubVector<double> best_block(*scale_params, num_uc * initial_model, num_uc);
     best_block.Set(1.0);
   } else { // initial_model == num_nnets
     KALDI_LOG << "Initializing with all neural nets averaged.";
     scale_params->Set(1.0 / num_nnets);
   }
 }


 // Computes the validation objective of the network obtained by combining
 // "nnets" with the scales in "scale_params", and optionally the gradient of
 // that objective with respect to the scales.
 //
 //  validation_set  examples the objective is computed on.
 //  scale_params    scales, in blocks as expected by CombineNnets(); they are
 //                  converted to BaseFloat before the networks are combined.
 //  nnets           the source networks.
 //  debug           if true, a finite-difference estimate of the gradient is
 //                  computed (one extra objective evaluation per scale) and
 //                  logged next to the analytic gradient.  This needs
 //                  "gradient" to be non-NULL; otherwise the check is skipped.
 //  gradient        if non-NULL, receives one derivative per scale, in the
 //                  same order as "scale_params".  It is indexed, not
 //                  resized, here, so the caller must size it beforehand.
 //
 // Returns the value returned by ComputeNnetGradient() for the combined
 // network.
 static double ComputeObjfAndGradient(
     const std::vector<NnetExample> &validation_set,
     const Vector<double> &scale_params,
     const std::vector<Nnet> &nnets,
     bool debug,
     Vector<double> *gradient) {

   Vector<BaseFloat> scale_params_float(scale_params);

   Nnet nnet_combined;
   CombineNnets(scale_params_float, nnets, &nnet_combined);

   // Same structure as the combined network, zeroed, to receive the gradient
   // with respect to the combined network's parameters.
   Nnet nnet_gradient(nnet_combined);
   bool is_gradient = true;
   nnet_gradient.SetZero(is_gradient);

   // note: "ans" is normalized by the total weight of validation frames.
   int32 batch_size = 1024;
   double ans = ComputeNnetGradient(nnet_combined,
                                    validation_set,
                                    batch_size,
                                    &nnet_gradient);

   double tot_frames = validation_set.size();
   if (gradient != NULL) {
     int32 i = 0; // index into scale_params.
     for (int32 n = 0; n < static_cast<int32>(nnets.size()); n++) {
       for (int32 j = 0; j < nnet_combined.NumComponents(); j++) {
         const UpdatableComponent *uc =
             dynamic_cast<const UpdatableComponent*>(&(nnets[n].GetComponent(j))),
             *uc_gradient =
             dynamic_cast<const UpdatableComponent*>(&(nnet_gradient.GetComponent(j)));
         if (uc != NULL) {
           // The gradient network was copied from the combination of "nnets",
           // so its j'th component is expected to be updatable too; check
           // before dereferencing the result of the cast.
           KALDI_ASSERT(uc_gradient != NULL);
           // Derivative w.r.t. this scale: the source component's parameters
           // dotted with the parameter gradient, per validation example.
           double dotprod = uc->DotProduct(*uc_gradient) / tot_frames;
           (*gradient)(i) = dotprod;
           i++;
         }
       }
     }
     KALDI_ASSERT(i == scale_params.Dim());
   }

   if (debug && gradient == NULL) {
     // The step size and the comparison below both use the analytic gradient,
     // so there is nothing to check against when none was requested.
     KALDI_LOG << "Not double-checking gradient computation: "
               << "no gradient was requested";
   } else if (debug) {
     KALDI_LOG << "Double-checking gradient computation";

     Vector<BaseFloat> manual_gradient(scale_params.Dim());
     for (int32 i = 0; i < scale_params.Dim(); i++) {
       // Choose the perturbation so that the expected change in the
       // objective (|gradient| * delta) is at least 1.0e-05.
       double delta = 1.0e-04, fg = fabs((*gradient)(i));
       if (fg < 1.0e-07) fg = 1.0e-07;
       if (fg * delta < 1.0e-05)
         delta = 1.0e-05 / fg;

       Vector<double> scale_params_temp(scale_params);
       scale_params_temp(i) += delta;
       // Objective only: no nested check and no gradient.
       double new_ans = ComputeObjfAndGradient(validation_set,
                                               scale_params_temp,
                                               nnets,
                                               false,
                                               NULL);
       manual_gradient(i) = (new_ans - ans) / delta;
     }
     KALDI_LOG << "Manually computed gradient is " << manual_gradient;
     KALDI_LOG << "Gradient we computed is " << *gradient;
   }

   return ans;
 }


 void CombineNnets(const NnetCombineConfig &combine_config,
                   const std::vector<NnetExample> &validation_set,
                   const std::vector<Nnet> &nnets,
                   Nnet *nnet_out) {

   Vector<double> scale_params;

   GetInitialScaleParams(combine_config,
                         validation_set,
                         nnets,
                         &scale_params);

   int32 dim = scale_params.Dim();
   KALDI_ASSERT(dim > 0);
   Vector<double> gradient(dim);

   double objf, initial_objf;

   LbfgsOptions lbfgs_options;
   lbfgs_options.minimize = false; // We're maximizing.
   lbfgs_options.m = dim; // Store the same number of vectors as the dimension
   // itself, so this is BFGS.
   lbfgs_options.first_step_impr = combine_config.initial_impr;

   OptimizeLbfgs<double> lbfgs(scale_params,
                               lbfgs_options);

   for (int32 i = 0; i < combine_config.num_bfgs_iters; i++) {
     scale_params.CopyFromVec(lbfgs.GetProposedValue());
     objf = ComputeObjfAndGradient(validation_set,
                                   scale_params,
                                   nnets,
                                   combine_config.test_gradient,
                                   &gradient);

     KALDI_VLOG(2) << "Iteration " << i << " scale-params = " << scale_params
                   << ", objf = " << objf << ", gradient = " << gradient;

     if (i == 0) initial_objf = objf;

     lbfgs.DoStep(objf, gradient);
   }

   scale_params.CopyFromVec(lbfgs.GetValue(&objf));

   Vector<BaseFloat> scale_params_float(scale_params);

   KALDI_LOG << "Combining nnets, validation objf per frame changed from "
             << initial_objf << " to " << objf;

   Matrix<BaseFloat> scale_params_mat(nnets.size(),
                                      nnets[0].NumUpdatableComponents());
   scale_params_mat.CopyRowsFromVec(scale_params_float);
   KALDI_LOG << "Final scale factors are " << scale_params_mat;

   CombineNnets(scale_params_float, nnets, nnet_out);
 }


 } // namespace nnet2
 } // namespace kaldi
kaldi
This code computes Goodness of Pronunciation (GOP) and extracts phone-level pronunciation feature for...
Definition: chain.dox:20

kaldi::nnet2::Nnet::GetComponent
const Component & GetComponent(int32 c) const
Definition: nnet-nnet.cc:141

kaldi::OptimizeLbfgs::DoStep
void DoStep(Real function_value, const VectorBase< Real > &gradient)
The user calls this function to provide the class with the function and gradient info at the point Ge...
Definition: optimization.cc:383

rnnlm::j
int j
Definition: mikolov-rnnlm-lib.cc:66

kaldi::nnet2::Nnet::AddNnet
void AddNnet(const VectorBase< BaseFloat > &scales, const Nnet &other)
For each updatable component, adds to it the corresponding element of "other" times the appropriate...
Definition: nnet-nnet.cc:576

kaldi::nnet2::ComputeNnetGradient
double ComputeNnetGradient(const Nnet &nnet, const std::vector< NnetExample > &validation_set, int32 batch_size, Nnet *gradient)
ComputeNnetGradient is mostly used to compute gradients on validation sets; it divides the example in...
Definition: nnet-update.cc:302

kaldi::nnet2::NnetCombineConfig::test_gradient
bool test_gradient
Definition: combine-nnet.h:45

kaldi::nnet2::GetInitialScaleParams
static void GetInitialScaleParams(const NnetCombineConfig &combine_config, const std::vector< NnetExample > &validation_set, const std::vector< Nnet > &nnets, Vector< double > *scale_params)
Definition: combine-nnet.cc:91

kaldi::int32
kaldi::int32 int32
Definition: online-tcp-source.cc:27

kaldi::OptimizeLbfgs::GetValue
const VectorBase< Real > & GetValue(Real *objf_value=NULL) const
This returns the value of the variable x that has the best objective function so far, and the corresponding objective function value if requested.
Definition: optimization.cc:416

kaldi::Matrix< BaseFloat >

kaldi::nnet2::GetInitialModel
static int32 GetInitialModel(const std::vector< NnetExample > &validation_set, const std::vector< Nnet > &nnets)
Returns an integer saying which model to use: either 0 ...
Definition: combine-nnet.cc:49

kaldi::Vector::Resize
void Resize(MatrixIndexT length, MatrixResizeType resize_type=kSetZero)
Set vector to a specified size (can be zero).
Definition: kaldi-vector.cc:190

kaldi::nnet2::ComputeNnetObjf
double ComputeNnetObjf(const Nnet &nnet, const std::vector< NnetExample > &examples, double *tot_accuracy)
Computes objective function over a minibatch.
Definition: nnet-update.cc:258

kaldi::nnet2::NnetCombineConfig::initial_model
int32 initial_model
Definition: combine-nnet.h:36

kaldi::nnet2::Nnet::NumComponents
int32 NumComponents() const
Returns number of components -- think of this as similar to # of layers, but e.g.
Definition: nnet-nnet.h:69

kaldi::VectorBase::CopyFromVec
void CopyFromVec(const VectorBase< Real > &v)
Copy data from another vector (must match own size).
Definition: kaldi-vector.cc:228

kaldi::nnet2::Nnet::SetZero
void SetZero(bool treat_as_gradient)
Definition: nnet-nnet.cc:151

float

kaldi::nnet2::UpdatableComponent::DotProduct
virtual BaseFloat DotProduct(const UpdatableComponent &other) const =0
Here, "other" is a component of the same specific type.

rnnlm::n
struct rnnlm::@11::@12 n

kaldi::nnet2::Nnet
Definition: nnet-nnet.h:63

kaldi::OptimizeLbfgs
Definition: optimization.h:121

kaldi::VectorBase::Dim
MatrixIndexT Dim() const
Returns the dimension of the vector.
Definition: kaldi-vector.h:64

kaldi::LbfgsOptions::minimize
bool minimize
Definition: optimization.h:85

kaldi::nnet2::NnetCombineConfig
Configuration class that controls neural net combination, where we combine a number of neural nets...
Definition: combine-nnet.h:35

kaldi::LbfgsOptions::m
int m
Definition: optimization.h:86

kaldi::nnet2::Nnet::ScaleComponents
void ScaleComponents(const VectorBase< BaseFloat > &scales)
Scales the parameters of each of the updatable components.
Definition: nnet-nnet.cc:421

rnnlm::i
int i
Definition: mikolov-rnnlm-lib.cc:66

kaldi::LbfgsOptions::first_step_impr
float first_step_impr
Definition: optimization.h:94

kaldi::Vector
A class representing a vector.
Definition: kaldi-vector.h:406

KALDI_ASSERT
#define KALDI_ASSERT(cond)
Definition: kaldi-error.h:185

kaldi::VectorBase::Set
void Set(Real f)
Set all members of a vector to a specified value.
Definition: kaldi-vector.cc:336

kaldi::nnet2::NnetCombineConfig::num_bfgs_iters
int32 num_bfgs_iters
Definition: combine-nnet.h:38

KALDI_VLOG
#define KALDI_VLOG(v)
Definition: kaldi-error.h:156

kaldi::nnet2::CombineNnets
static void CombineNnets(const Vector< BaseFloat > &scale_params, const std::vector< Nnet > &nnets, Nnet *dest)
Definition: combine-nnet.cc:28

kaldi::nnet2::NnetCombineConfig::initial_impr
BaseFloat initial_impr
Definition: combine-nnet.h:44

kaldi::LbfgsOptions
This is an implementation of L-BFGS.
Definition: optimization.h:84

kaldi::MatrixBase::CopyRowsFromVec
void CopyRowsFromVec(const VectorBase< Real > &v)
This function has two modes of operation.
Definition: kaldi-matrix.cc:997

KALDI_LOG
#define KALDI_LOG
Definition: kaldi-error.h:153

combine-nnet.h

kaldi::SubVector
Represents a non-allocating general vector which can be defined as a sub-vector of higher-level vecto...
Definition: kaldi-vector.h:501

kaldi::OptimizeLbfgs::GetProposedValue
const VectorBase< Real > & GetProposedValue() const
This returns the value at which the function wants us to compute the objective function and gradient...
Definition: optimization.h:134

kaldi::nnet3::NumUpdatableComponents
int32 NumUpdatableComponents(const Nnet &dest)
Returns the number of updatable components in the nnet.
Definition: nnet-utils.cc:422

kaldi::nnet2::UpdatableComponent
Class UpdatableComponent is a Component which has trainable parameters and contains some global param...
Definition: nnet-component.h:279

kaldi::nnet2::ComputeObjfAndGradient
static BaseFloat ComputeObjfAndGradient(const std::vector< NnetExample > &validation_set, const Vector< double > &scale_params, const Nnet &orig_nnet, const Nnet &direction, Vector< double > *gradient)
Definition: combine-nnet-a.cc:61