doc/cu-rand_8cc_source.html

 // cudamatrix/cu-rand.cc

 // Copyright 2016-2017  Brno University of Technology (author Karel Vesely)

 // See ../../COPYING for clarification regarding multiple authors
 //
 // Licensed under the Apache License, Version 2.0 (the "License");
 // you may not use this file except in compliance with the License.
 // You may obtain a copy of the License at
 //
 //  http://www.apache.org/licenses/LICENSE-2.0
 //
 // THIS CODE IS PROVIDED *AS IS* BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY
 // KIND, EITHER EXPRESS OR IMPLIED, INCLUDING WITHOUT LIMITATION ANY IMPLIED
 // WARRANTIES OR CONDITIONS OF TITLE, FITNESS FOR A PARTICULAR PURPOSE,
 // MERCHANTABLITY OR NON-INFRINGEMENT.
 // See the Apache 2 License for the specific language governing permissions and
 // limitations under the License.

 #include "cudamatrix/cu-rand.h"

 namespace kaldi {

 #if HAVE_CUDA == 1

 // Type-dispatching wrapper around the cuRAND uniform generators, so that
 // templated code can use a single name for both 'float' and 'double'.
 // Only the two specializations below are defined.
 template<typename Real>
 curandStatus_t curandGenerateUniformWrap(
     curandGenerator_t gen, Real *ptr, size_t num);

 // Single precision: forwards to curandGenerateUniform().
 template<>
 curandStatus_t curandGenerateUniformWrap<float>(
     curandGenerator_t gen, float *ptr, size_t num) {
   return curandGenerateUniform(gen, ptr, num);
 }

 // Double precision: forwards to curandGenerateUniformDouble().
 template<>
 curandStatus_t curandGenerateUniformWrap<double>(
     curandGenerator_t gen, double *ptr, size_t num) {
   return curandGenerateUniformDouble(gen, ptr, num);
 }

 // Type-dispatching wrapper around the cuRAND normal generators, so that
 // templated code can use a single name for both 'float' and 'double'.
 // Both specializations request a standard normal distribution
 // (mean 0, standard deviation 1).
 template<typename Real>
 curandStatus_t curandGenerateNormalWrap(
     curandGenerator_t gen, Real *ptr, size_t num);

 // Single precision: forwards to curandGenerateNormal().
 template<>
 curandStatus_t curandGenerateNormalWrap<float>(
     curandGenerator_t gen, float *ptr, size_t num) {
   const float mean = 0.0f;
   const float stddev = 1.0f;
   return curandGenerateNormal(gen, ptr, num, mean, stddev);
 }

 // Double precision: forwards to curandGenerateNormalDouble().
 template<>
 curandStatus_t curandGenerateNormalWrap<double>(
     curandGenerator_t gen, double *ptr, size_t num) {
   const double mean = 0.0;
   const double stddev = 1.0;
   return curandGenerateNormalDouble(gen, ptr, num, mean, stddev);
 }
 #endif


 // Fills 'tgt' with uniform random numbers.  When CUDA is compiled in and the
 // device is enabled, the numbers are produced by cuRAND in a temporary matrix
 // and then copied into 'tgt'; otherwise the CPU routine SetRandUniform() of
 // the underlying matrix is used.
 template<typename Real>
 void CuRand<Real>::RandUniform(CuMatrixBase<Real> *tgt) {
 #if HAVE_CUDA == 1
   if (CuDevice::Instantiate().Enabled()) {
     CuTimer timer;
     // 'tgt' may be a window into a larger matrix, so generating over its whole
     // stride would overwrite elements outside the window.  Generate into a
     // separate buffer instead.  kStrideEqualNumCols keeps the buffer layout
     // consistent (when memory is nearly exhausted, the stride of
     // CudaMallocPitch may vary).
     CuMatrix<Real> buffer(tgt->NumRows(), tgt->NumCols(), kUndefined,
                           kStrideEqualNumCols);
     // Multiply in size_t so that the element count cannot overflow.
     const size_t num_rows = static_cast<size_t>(buffer.NumRows());
     const size_t stride = static_cast<size_t>(buffer.Stride());
     CURAND_SAFE_CALL(curandGenerateUniformWrap(
           GetCurandHandle(), buffer.Data(), num_rows * stride));
     tgt->CopyFromMat(buffer);
     CuDevice::Instantiate().AccuProfile(__func__, timer);
     return;
   }
 #endif
   // CPU fallback (no CUDA support compiled in, or device not enabled).
   tgt->Mat().SetRandUniform();
 }

 // Fills 'tgt' with uniform random numbers.  'tgt' is a CuMatrix (not a
 // CuMatrixBase), so the random numbers are generated directly into its
 // storage, over NumRows() * Stride() elements, without a temporary matrix.
 // Without an enabled CUDA device, the CPU routine SetRandUniform() is used.
 template<typename Real>
 void CuRand<Real>::RandUniform(CuMatrix<Real> *tgt) {
 #if HAVE_CUDA == 1
   if (CuDevice::Instantiate().Enabled()) {
     CuTimer timer;
     // Multiply in size_t so that the element count cannot overflow.
     const size_t num_rows = static_cast<size_t>(tgt->NumRows());
     const size_t stride = static_cast<size_t>(tgt->Stride());
     CURAND_SAFE_CALL(curandGenerateUniformWrap(
           GetCurandHandle(), tgt->Data(), num_rows * stride));
     CuDevice::Instantiate().AccuProfile(__func__, timer);
     return;
   }
 #endif
   // CPU fallback (no CUDA support compiled in, or device not enabled).
   tgt->Mat().SetRandUniform();
 }

 // Fills the vector 'tgt' with uniform random numbers: cuRAND generates
 // tgt->Dim() values directly into the vector when the CUDA device is enabled,
 // otherwise the CPU routine SetRandUniform() of the underlying vector is used.
 template<typename Real>
 void CuRand<Real>::RandUniform(CuVectorBase<Real> *tgt) {
 #if HAVE_CUDA == 1
   if (CuDevice::Instantiate().Enabled()) {
     CuTimer timer;
     Real *data = tgt->Data();
     CURAND_SAFE_CALL(curandGenerateUniformWrap(
           GetCurandHandle(), data, tgt->Dim()));
     CuDevice::Instantiate().AccuProfile(__func__, timer);
     return;
   }
 #endif
   // CPU fallback (no CUDA support compiled in, or device not enabled).
   tgt->Vec().SetRandUniform();
 }

 // Fills 'tgt' with normally distributed random numbers (mean 0, stddev 1, see
 // curandGenerateNormalWrap()).  When CUDA is compiled in and the device is
 // enabled, the numbers are produced by cuRAND in a temporary matrix and then
 // copied into 'tgt'; otherwise the CPU routine SetRandn() of the underlying
 // matrix is used.
 template<typename Real>
 void CuRand<Real>::RandGaussian(CuMatrixBase<Real> *tgt) {
 #if HAVE_CUDA == 1
   if (CuDevice::Instantiate().Enabled()) {
     CuTimer tim;
     // Better use 'tmp' matrix, 'tgt' can be a window into a larger matrix,
     // so we should not use it to generate random numbers over whole stride.
     // Also, we ensure to have 'even' number of elements for calling 'curand'
     // by possibly adding one column. Even number of elements is required by
     // curandGenerateNormal(), curandGenerateNormalDouble().
     // Use the option kStrideEqualNumCols to ensure consistency
     // (because when memory is nearly exhausted, the stride of CudaMallocPitch
     // may vary).
     MatrixIndexT num_cols_even = tgt->NumCols() + (tgt->NumCols() % 2); // + 0 or 1,
     CuMatrix<Real> tmp(tgt->NumRows(), num_cols_even, kUndefined,
                        kStrideEqualNumCols);
     // Compute the element count in size_t: the product of two MatrixIndexT
     // (int32) values can overflow for large matrices.  This matches what
     // RandUniform() does.
     size_t num_elements = static_cast<size_t>(tmp.NumRows()) *
                           static_cast<size_t>(tmp.Stride());
     CURAND_SAFE_CALL(curandGenerateNormalWrap(
           GetCurandHandle(), tmp.Data(), num_elements));
     // Drop the padding column (if any) when copying back.
     tgt->CopyFromMat(tmp.ColRange(0,tgt->NumCols()));
     CuDevice::Instantiate().AccuProfile(__func__, tim);
   } else
 #endif
   {
     // CPU fallback (no CUDA support compiled in, or device not enabled).
     tgt->Mat().SetRandn();
   }
 }

 // Fills 'tgt' with normally distributed random numbers (mean 0, stddev 1, see
 // curandGenerateNormalWrap()).  'tgt' is a CuMatrix (not a CuMatrixBase), so
 // when its storage holds an even number of elements the numbers are generated
 // directly into it; otherwise a temporary matrix with an even element count is
 // used.  Without an enabled CUDA device, the CPU routine SetRandn() is used.
 template<typename Real>
 void CuRand<Real>::RandGaussian(CuMatrix<Real> *tgt) {
 #if HAVE_CUDA == 1
   if (CuDevice::Instantiate().Enabled()) {
     CuTimer tim;
     // Here we don't need to use 'tmp' matrix, if the number of elements is even.
     // The count is computed in size_t: the product of two MatrixIndexT (int32)
     // values can overflow for large matrices.
     size_t num_elements = static_cast<size_t>(tgt->NumRows()) *
                           static_cast<size_t>(tgt->Stride());
     if (0 == (num_elements % 2)) {
       CURAND_SAFE_CALL(curandGenerateNormalWrap(
             GetCurandHandle(), tgt->Data(), num_elements));
     } else {
       // We use 'tmp' matrix whose number of columns is rounded up to an even
       // value, this guarantees an even number of elements.  Use the option
       // kStrideEqualNumCols to ensure consistency (because when memory is
       // nearly exhausted, the stride of CudaMallocPitch may vary).
       MatrixIndexT num_cols_even = tgt->NumCols() + (tgt->NumCols() % 2); // + 0 or 1,
       CuMatrix<Real> tmp(tgt->NumRows(), num_cols_even, kUndefined,
                          kStrideEqualNumCols);
       size_t tmp_num_elements = static_cast<size_t>(tmp.NumRows()) *
                                 static_cast<size_t>(tmp.Stride());
       CURAND_SAFE_CALL(curandGenerateNormalWrap(
             GetCurandHandle(), tmp.Data(), tmp_num_elements));
       // Drop the padding column (if any) when copying back.
       tgt->CopyFromMat(tmp.ColRange(0,tgt->NumCols()));
     }
     CuDevice::Instantiate().AccuProfile(__func__, tim);
   } else
 #endif
   {
     // CPU fallback (no CUDA support compiled in, or device not enabled).
     tgt->Mat().SetRandn();
   }
 }

 // Fills the vector 'tgt' with normally distributed random numbers (mean 0,
 // stddev 1, see curandGenerateNormalWrap()).  Without an enabled CUDA device,
 // the CPU routine SetRandn() of the underlying vector is used.
 template<typename Real>
 void CuRand<Real>::RandGaussian(CuVectorBase<Real> *tgt) {
 #if HAVE_CUDA == 1
   if (CuDevice::Instantiate().Enabled()) {
     CuTimer timer;
     // The cuRAND normal generators (curandGenerateNormal(),
     // curandGenerateNormalDouble()) are called with an even number of
     // elements only.
     const MatrixIndexT dim = tgt->Dim();
     const bool dim_is_even = (dim % 2 == 0);
     if (dim_is_even) {
       // Even length: generate directly into 'tgt'.
       CURAND_SAFE_CALL(curandGenerateNormalWrap(
             GetCurandHandle(), tgt->Data(), tgt->Dim()));
     } else {
       // Odd length: generate into a scratch vector that is one element longer
       // and copy back only the first 'dim' values.
       const MatrixIndexT padded_dim = dim + (dim % 2);
       CuVector<Real> scratch(padded_dim, kUndefined);
       CURAND_SAFE_CALL(curandGenerateNormalWrap(
             GetCurandHandle(), scratch.Data(), scratch.Dim()));
       tgt->CopyFromVec(scratch.Range(0, tgt->Dim()));
     }
     CuDevice::Instantiate().AccuProfile(__func__, timer);
     return;
   }
 #endif
   // CPU fallback (no CUDA support compiled in, or device not enabled).
   tgt->Vec().SetRandn();
 }

 // Samples discrete states from the probabilities in 'probs': a uniform random
 // number is subtracted from each probability and the Heaviside function of
 // the difference is written to 'states'.
 // NOTE(review): 'states' is not resized here; presumably the caller must pass
 // it with the same dimensions as 'probs' -- confirm.
 template<typename Real>
 void CuRand<Real>::BinarizeProbs(const CuMatrix<Real> &probs, CuMatrix<Real> *states) {
   CuMatrix<Real> diff(probs.NumRows(), probs.NumCols());
   // diff = u, uniform random numbers in [0..1],
   this->RandUniform(&diff);
   // diff = -u, in [-1..0],
   diff.Scale(-1.0);
   // diff = probs - u, in [-1..+1] for probabilities in [0..1],
   diff.AddMat(1.0, probs);
   // states = Heaviside(probs - u),
   states->Heaviside(diff);
 }

 // Adds Gaussian noise to every element of 'tgt':
 //   tgt += gscale * noise,
 // where 'noise' is a matrix of the same dimensions as 'tgt' that is filled
 // by RandGaussian().
 template<typename Real>
 void CuRand<Real>::AddGaussNoise(CuMatrix<Real> *tgt, Real gscale) {
   // kStrideEqualNumCols ensures consistency of the noise buffer (because when
   // memory is nearly exhausted, the stride of CudaMallocPitch may vary).
   CuMatrix<Real> noise(tgt->NumRows(), tgt->NumCols(),
                        kUndefined, kStrideEqualNumCols);
   this->RandGaussian(&noise);
   tgt->AddMat(gscale, noise);
 }

 // Explicit instantiation of CuRand for 'float' and 'double', so that the
 // member functions defined in this file are compiled for both types.
 template class CuRand<float>;
 template class CuRand<double>;

 }  // namespace,
kaldi::CuMatrixBase::Mat
const MatrixBase< Real > & Mat() const
Definition: cu-matrix.h:755

kaldi::CuRand< float >

kaldi::CuMatrixBase::CopyFromMat
void CopyFromMat(const MatrixBase< OtherReal > &src, MatrixTransposeType trans=kNoTrans)
Definition: cu-matrix.cc:344

kaldi
This code computes Goodness of Pronunciation (GOP) and extracts phone-level pronunciation feature for...
Definition: chain.dox:20

kaldi::CuMatrixBase::Stride
MatrixIndexT Stride() const
Definition: cu-matrix.h:217

cu-rand.h

kaldi::kUndefined
Definition: matrix-common.h:39

kaldi::CuVector
Definition: matrix-common.h:74

kaldi::kStrideEqualNumCols
Definition: matrix-common.h:46

kaldi::RandUniform
float RandUniform(struct RandomState *state=NULL)
Returns a random number strictly between 0 and 1.
Definition: kaldi-math.h:151

kaldi::CuRand::RandUniform
void RandUniform(CuMatrixBase< Real > *tgt)
Fill with uniform [0..1] floats.
Definition: cu-rand.cc:60

kaldi::CuRand::BinarizeProbs
void BinarizeProbs(const CuMatrix< Real > &probs, CuMatrix< Real > *states)
align probabilities to discrete 0/1 states (use uniform sampling),
Definition: cu-rand.cc:201

kaldi::CuMatrixBase::AddMat
void AddMat(Real alpha, const CuMatrixBase< Real > &A, MatrixTransposeType trans=kNoTrans)
*this += alpha * A
Definition: cu-matrix.cc:954

kaldi::CuMatrix
This class represents a matrix that's stored on the GPU if we have one, and in memory if not...
Definition: matrix-common.h:71

kaldi::CuRand::AddGaussNoise
void AddGaussNoise(CuMatrix< Real > *tgt, Real gscale=1.0)
add gaussian noise to each element,
Definition: cu-rand.cc:211

kaldi::CuRand::RandGaussian
void RandGaussian(CuMatrixBase< Real > *tgt)
Fill with Normal random numbers.
Definition: cu-rand.cc:116

kaldi::MatrixIndexT
int32 MatrixIndexT
Definition: matrix-common.h:98

kaldi::CuVectorBase::CopyFromVec
void CopyFromVec(const CuVectorBase< Real > &src)
Copy functions; these will crash if the dimensions do not match.
Definition: cu-vector.cc:1078

kaldi::CuMatrixBase::Heaviside
void Heaviside(const CuMatrixBase< Real > &src)
Set each element to the Heaviside function of the corresponding element of "src", which we define as ...
Definition: cu-matrix.cc:2435

kaldi::CuMatrixBase::Data
const Real * Data() const
Return data pointer (const).
Definition: cu-matrix.h:746

kaldi::CuVectorBase::Range
CuSubVector< Real > Range(const MatrixIndexT o, const MatrixIndexT l)
Definition: cu-vector.h:160

kaldi::CuMatrixBase
Matrix for CUDA computing.
Definition: matrix-common.h:69

kaldi::CuMatrixBase::NumCols
MatrixIndexT NumCols() const
Definition: cu-matrix.h:216

kaldi::CuVectorBase::Vec
const VectorBase< Real > & Vec() const
Definition: cu-vector.h:235

kaldi::CuVectorBase::Data
Real * Data()
Returns a pointer to the start of the vector's data.
Definition: cu-vector.h:72

kaldi::CuMatrixBase::NumRows
MatrixIndexT NumRows() const
Dimensions.
Definition: cu-matrix.h:215

kaldi::CuMatrix::Mat
const Matrix< Real > & Mat() const
Definition: cu-matrix.h:879

kaldi::CuVectorBase::Dim
MatrixIndexT Dim() const
Dimensions.
Definition: cu-vector.h:69

kaldi::CuVectorBase
Vector for CUDA computing.
Definition: matrix-common.h:72