doc/cu-math_8h_source.html

 // cudamatrix/cu-math.h

 // Copyright 2009-2012  Karel Vesely
 //                2013  Johns Hopkins University (Author: David Snyder)

 // See ../../COPYING for clarification regarding multiple authors
 //
 // Licensed under the Apache License, Version 2.0 (the "License");
 // you may not use this file except in compliance with the License.
 // You may obtain a copy of the License at
 //
 //  http://www.apache.org/licenses/LICENSE-2.0
 //
 // THIS CODE IS PROVIDED *AS IS* BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY
 // KIND, EITHER EXPRESS OR IMPLIED, INCLUDING WITHOUT LIMITATION ANY IMPLIED
 // WARRANTIES OR CONDITIONS OF TITLE, FITNESS FOR A PARTICULAR PURPOSE,
 // MERCHANTABLITY OR NON-INFRINGEMENT.
 // See the Apache 2 License for the specific language governing permissions and
 // limitations under the License.


 #ifndef KALDI_CUDAMATRIX_CU_MATH_H_
 #define KALDI_CUDAMATRIX_CU_MATH_H_
 #include "cudamatrix/cu-common.h"
 #include "cudamatrix/cu-array.h"
 #include "cudamatrix/cu-device.h"
 #include "base/timer.h"

 namespace kaldi {

 namespace cu {

 // RegularizeL1 is a gradient step with l1 regularization added to the
 // gradient.
 // Both 'weight' and 'gradient' are taken by non-const pointer.
 // NOTE(review): presumably both matrices are updated in place -- confirm
 // against the definition in cu-math.cc.
 template<typename Real>
 void RegularizeL1(CuMatrixBase<Real> *weight, CuMatrixBase<Real> *gradient,
                   Real l1_penalty, Real learning_rate);

 // Copies a permutation of src into tgt.
 // NOTE(review): presumably copy_from_idx supplies, for each row of tgt, the
 // index of the source row to copy -- confirm against cu-math.cc.
 template<typename Real>
 void Randomize(const CuMatrixBase<Real> &src,
                const CuArray<int32> &copy_from_idx,
                CuMatrixBase<Real> *tgt);

 // Splice concatenates frames of src as specified in frame_offsets into tgt.
 // NOTE(review): the required dimensions of tgt relative to src and
 // frame_offsets are not visible in this header -- see cu-math.cc.
 template<typename Real>
 void Splice(const CuMatrixBase<Real> &src,
             const CuArray<int32> &frame_offsets,
             CuMatrixBase<Real> *tgt);

 // Copies elements from src into tgt as given by copy_from_indices.
 // NOTE(review): whether the indices address rows, columns or single elements
 // is not visible in this header -- confirm against cu-math.cc.
 template<typename Real>
 void Copy(const CuMatrixBase<Real> &src,
           const CuArray<int32> &copy_from_indices,
           CuMatrixBase<Real> *tgt);


 // Matrix version of EnsureNonzero.
 // This function requires that src and dest have the same dimension and
 // epsilon > 0.
 // NOTE(review): presumably dest receives a copy of src in which elements too
 // close to zero are pushed at least epsilon away from it -- the exact rule is
 // not visible in this header; confirm against cu-math.cc.
 template <typename Real>
 void EnsureNonzero(const CuMatrixBase<Real> &src,
                    Real epsilon,
                    CuMatrixBase<Real> *dest);

 // Vector version of EnsureNonzero: same parameter layout as the matrix
 // overload, but operating on CuVectorBase.
 // NOTE(review): presumably the same requirements apply (src and dest of equal
 // dimension, epsilon > 0) -- confirm against cu-math.cc.
 template <typename Real>
 void EnsureNonzero(const CuVectorBase<Real> &src,
                    Real epsilon,
                    CuVectorBase<Real> *dest);

 // This is a special-purpose function used by class
 // LstmNonlinearityComponent, to do its forward propagation.
 // 'input' and 'params' are read-only; the result is written to *output.
 // NOTE(review): the expected dimensions of input, params and output are not
 // visible in this header -- see the definition in cu-math.cc.
 template<typename Real>
 void ComputeLstmNonlinearity(const CuMatrixBase<Real> &input,
                              const CuMatrixBase<Real> &params,
                              CuMatrixBase<Real> *output);
 // This is a version of ComputeLstmNonlinearity that only uses the CPU
 // even if a GPU is available. It's made available for testing purposes.
 // It takes MatrixBase arguments in place of the CuMatrixBase arguments of
 // ComputeLstmNonlinearity.
 template<typename Real>
 void CpuComputeLstmNonlinearity(const MatrixBase<Real> &input,
                                 const MatrixBase<Real> &params,
                                 MatrixBase<Real> *output);


 // This function does the 'backward' pass corresponding to the function
 // ComputeLstmNonlinearity.
 // The const-reference arguments (input, params, output_deriv, deriv_sum_in,
 // self_repair_config) and count_in are read-only; the pointer arguments
 // (input_deriv, params_deriv, value_sum_out, deriv_sum_out,
 // self_repair_sum_out) are non-const.
 // Note that deriv_sum_in, value_sum_out and deriv_sum_out are always
 // double-precision, independent of Real, and count_in is a double.
 // NOTE(review): presumably the pointer arguments are the outputs and any of
 // them may have further constraints (dimensions, allowed to be NULL, ...) --
 // not visible in this header; see cu-math.cc.
 template<typename Real>
 void BackpropLstmNonlinearity(const CuMatrixBase<Real> &input,
                               const CuMatrixBase<Real> &params,
                               const CuMatrixBase<Real> &output_deriv,
                               const CuMatrixBase<double> &deriv_sum_in,
                               const CuVectorBase<Real> &self_repair_config,
                               double count_in,
                               CuMatrixBase<Real> *input_deriv,
                               CuMatrixBase<Real> *params_deriv,
                               CuMatrixBase<double> *value_sum_out,
                               CuMatrixBase<double> *deriv_sum_out,
                               CuMatrixBase<Real> *self_repair_sum_out);
 // This is a version of BackpropLstmNonlinearity that only uses the CPU
 // even if a GPU is available. It's made available for testing purposes.
 // The parameter list mirrors BackpropLstmNonlinearity, with MatrixBase /
 // VectorBase in place of CuMatrixBase / CuVectorBase; as there, deriv_sum_in,
 // value_sum_out and deriv_sum_out are always double-precision.
 template<typename Real>
 void CpuBackpropLstmNonlinearity(const MatrixBase<Real> &input,
                                  const MatrixBase<Real> &params,
                                  const MatrixBase<Real> &output_deriv,
                                  const MatrixBase<double> &deriv_sum_in,
                                  const VectorBase<Real> &self_repair_config,
                                  double count_in,
                                  MatrixBase<Real> *input_deriv,
                                  MatrixBase<Real> *params_deriv,
                                  MatrixBase<double> *value_sum_out,
                                  MatrixBase<double> *deriv_sum_out,
                                  MatrixBase<Real> *self_repair_sum_out);

 // Normalize nonlinearity: modifies the vector of activations by scaling it,
 // based on its root-mean-square value; 'in' is read-only and the result is
 // written to *out.
 // NOTE(review): presumably each row is scaled so that its root-mean-square
 // equals target_rms (subject to the kSquaredNormFloor floor mentioned in the
 // derivative note that follows this declaration), and add_log_stddev appends
 // an extra output related to the log of the standard deviation -- confirm
 // against cu-math.cc.
 template<typename Real>
 void NormalizePerRow(const CuMatrixBase<Real>& in, const Real target_rms,
                      const bool add_log_stddev, CuMatrixBase<Real>* out);

 // DiffNormalizePerRow: per the note below, computes deriv_in (the derivative
 // of the objective function w.r.t. the input of the normalization) from
 // deriv_out (the derivative w.r.t. its output).
 // NOTE(review): in the note, row_in / deriv_out / deriv_in presumably refer
 // to one row of in_value / out_deriv / in_deriv respectively -- confirm
 // against cu-math.cc.
 //
 // A note on the derivative of NormalizeComponent...
 // let both row_in and row_out be vectors of dimension D.
 // Let p = row_in^T row_in / (D * target_rms^2), and let
 // f = 1.0 / sqrt(max(kSquaredNormFloor, p)), and we compute row_out as:
 // row_out = f row_in.
 // Suppose we have a quantity deriv_out which is the derivative
 // of the objective function w.r.t. row_out.  We want to compute
 // deriv_in which is the derivative of the objective function w.r.t.
 // row_in.  Let the objective function be F.  One term is obvious: we have
 // deriv_in = f deriv_out + ....
 // next we have to take into account the derivative that gets back-propagated
 // through f.  Obviously, dF/df = deriv_out^T row_in.
 // And df/dp = (p <= kSquaredNormFloor ? 0.0 : -0.5 p^{-1.5}) = (f == 1.0 / sqrt(kSquaredNormFloor) ? 0.0 : -0.5 f^3),
 // and dp/d(row_in) = 2/(D * target_rms^2) row_in. [it's vector_valued].
 // So this term in dF/d(row_in) equals:
 // dF/df df/dp dp/d(row_in)   =    2/(D * target_rms^2) (f == 1.0 / sqrt(kSquaredNormFloor)  ? 0.0 : -0.5 f^3) (deriv_out^T row_in) row_in
 // So
 // deriv_in = f deriv_out + (f == 1.0 / sqrt(kSquaredNormFloor) ? 0.0 : -f^3  / (D * target_rms^2) ) (deriv_out^T row_in) row_in
 // If add_log_stddev is true, deriv_in has another term:
 // dF/dx_i = dF/df . df/dx_i => df/dx_i = x_i/(x^T x)
 template<typename Real>
 void DiffNormalizePerRow(const CuMatrixBase<Real> &in_value,
                          const CuMatrixBase<Real> &out_deriv,
                          const Real target_rms, const bool add_log_stddev,
                          CuMatrixBase<Real>* in_deriv);


 } // namespace cu
 } // namespace kaldi


 #endif
kaldi
This code computes Goodness of Pronunciation (GOP) and extracts phone-level pronunciation feature for...
Definition: chain.dox:20

kaldi::cu::CpuComputeLstmNonlinearity
void CpuComputeLstmNonlinearity(const MatrixBase< Real > &input_mat, const MatrixBase< Real > &params_mat, MatrixBase< Real > *output)
Definition: cu-math.cc:445

cu-device.h

kaldi::cu::Randomize
void Randomize(const CuMatrixBase< Real > &src, const CuArray< int32 > &copy_from_idx, CuMatrixBase< Real > *tgt)
Copies a permutation of src into tgt.
Definition: cu-math.cc:80

timer.h

kaldi::cu::BackpropLstmNonlinearity
void BackpropLstmNonlinearity(const CuMatrixBase< Real > &input, const CuMatrixBase< Real > &params, const CuMatrixBase< Real > &output_deriv, const CuMatrixBase< double > &deriv_sum_in, const CuVectorBase< Real > &self_repair_config, double count_in, CuMatrixBase< Real > *input_deriv, CuMatrixBase< Real > *params_deriv, CuMatrixBase< double > *value_sum_out, CuMatrixBase< double > *deriv_sum_out, CuMatrixBase< Real > *self_repair_sum_out)
This function does the 'backward' pass corresponding to the function ComputeLstmNonlinearity.
Definition: cu-math.cc:768

kaldi::cu::DiffNormalizePerRow
void DiffNormalizePerRow(const CuMatrixBase< Real > &in_value, const CuMatrixBase< Real > &out_deriv, const Real target_rms, const bool add_log_stddev, CuMatrixBase< Real > *in_deriv)
Definition: cu-math.cc:349

kaldi::cu::EnsureNonzero
void EnsureNonzero(const CuMatrixBase< Real > &src, Real epsilon, CuMatrixBase< Real > *dest)
This function requires that src and dest have the same dimension and epsilon > 0. ...
Definition: cu-math.cc:209

kaldi::cu::Splice
void Splice(const CuMatrixBase< Real > &src, const CuArray< int32 > &frame_offsets, CuMatrixBase< Real > *tgt)
Splice concatenates frames of src as specified in frame_offsets into tgt.
Definition: cu-math.cc:132

cu-common.h

kaldi::cu::NormalizePerRow
void NormalizePerRow(const CuMatrixBase< Real > &in, const Real target_rms, const bool add_log_stddev, CuMatrixBase< Real > *out)
Normalize nonlinearity modifies the vector of activations by scaling it so that the root-mean-square ...
Definition: cu-math.cc:280

cu-array.h

kaldi::cu::RegularizeL1
void RegularizeL1(CuMatrixBase< Real > *weight, CuMatrixBase< Real > *grad, Real l1, Real lr)
RegularizeL1 is a gradient step with l1 regularization added to the gradient.
Definition: cu-math.cc:37

kaldi::cu::Copy
void Copy(const CuMatrixBase< Real > &src, const CuArray< int32 > &copy_from_indices, CuMatrixBase< Real > *tgt)
Copies elements from src into tgt as given by copy_from_indices.
Definition: cu-math.cc:173

kaldi::cu::CpuBackpropLstmNonlinearity
void CpuBackpropLstmNonlinearity(const MatrixBase< Real > &input, const MatrixBase< Real > &params, const MatrixBase< Real > &output_deriv, const MatrixBase< double > &deriv_sum_in, const VectorBase< Real > &self_repair_config, double count_in, MatrixBase< Real > *input_deriv, MatrixBase< Real > *params_deriv, MatrixBase< double > *value_sum_out, MatrixBase< double > *deriv_sum_out, MatrixBase< Real > *self_repair_sum_out)
Definition: cu-math.cc:543

kaldi::cu::ComputeLstmNonlinearity
void ComputeLstmNonlinearity(const CuMatrixBase< Real > &input, const CuMatrixBase< Real > &params, CuMatrixBase< Real > *output)
this is a special-purpose function used by class LstmNonlinearityComponent, to do its forward propaga...
Definition: cu-math.cc:489