doc/cu-compressed-matrix_8cc_source.html

 // cudamatrix/cu-compressed-matrix.cc

 // Copyright      2018  Johns Hopkins University (author: Daniel Povey)

 // See ../../COPYING for clarification regarding multiple authors
 //
 // Licensed under the Apache License, Version 2.0 (the "License");
 // you may not use this file except in compliance with the License.
 // You may obtain a copy of the License at
 //
 //  http://www.apache.org/licenses/LICENSE-2.0
 //
 // THIS CODE IS PROVIDED *AS IS* BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY
 // KIND, EITHER EXPRESS OR IMPLIED, INCLUDING WITHOUT LIMITATION ANY IMPLIED
 // WARRANTIES OR CONDITIONS OF TITLE, FITNESS FOR A PARTICULAR PURPOSE,
 // MERCHANTABLITY OR NON-INFRINGEMENT.
 // See the Apache 2 License for the specific language governing permissions and
 // limitations under the License.


 #if HAVE_CUDA == 1
 #include <cuda_runtime_api.h>
 #include <cublas_v2.h>
 #endif

 #include "base/timer.h"
 #include "cudamatrix/cu-common.h"
 #include "cudamatrix/cu-vector.h"
 #include "cudamatrix/cu-device.h"
 #include "cudamatrix/cu-kernels.h"
 #include "cudamatrix/cu-array.h"
 #include "cudamatrix/cu-compressed-matrix.h"

 namespace kaldi {


 // Constructs an empty compressed matrix: no buffer is allocated and all
 // dimensions are zero.
 //   range     Divided by the largest value representable in I to give scale_.
 //   truncate  Stored in truncate_; CopyFromMat() hands it to the compression
 //             kernel.
 // When compiled with CUDA this asserts that CuDevice reports Enabled(); when
 // compiled without CUDA, constructing this class is an error.
 template <typename I>
 CuCompressedMatrix<I>::CuCompressedMatrix(BaseFloat range, bool truncate)
     : data_(NULL),
       scale_(range / std::numeric_limits<I>::max()),
       truncate_(truncate),
       num_rows_(0),
       num_cols_(0),
       stride_(0) {
 #if HAVE_CUDA != 1
   // No GPU support was compiled in, so this class is unusable.
   KALDI_ERR << "You instantiated CuCompressedMatrix while GPU use "
       "was not compiled in.";
 #else
   KALDI_ASSERT(CuDevice::Instantiate().Enabled());
 #endif
 }

 // Frees the buffer held by this object, if there is one, and resets the
 // dimensions and stride to zero.  Does nothing when no buffer is held, or
 // when compiled without CUDA.
 template <typename I>
 void CuCompressedMatrix<I>::Destroy() {
 #if HAVE_CUDA == 1
   if (data_ == NULL)
     return;  // nothing is allocated, so there is nothing to release or reset.

   // Not timed: Free() won't normally have to access the GPU at all (due to
   // caching).
   CuDevice::Instantiate().Free(data_);
   data_ = NULL;
   num_rows_ = num_cols_ = stride_ = 0;
 #endif
 }

 // Sets *this to a compressed copy of 'mat', resizing *this when its current
 // dimensions differ from those of 'mat'.
 //
 // If 'mat' has no rows, *this is made empty as well (any buffer it held is
 // released), so that it never keeps the contents of an earlier, unrelated
 // matrix.
 //
 // If scale_ is zero the sign-compression kernel is launched; otherwise the
 // general kernel is launched with the inverse of scale_ and with truncate_.
 // A launch error is reported through CU_SAFE_CALL.  Compiled without CUDA,
 // this function does nothing.
 template <typename I>
 void CuCompressedMatrix<I>::CopyFromMat(
     const CuMatrixBase<BaseFloat> &mat) {
 #if HAVE_CUDA == 1
   KALDI_ASSERT(CuDevice::Instantiate().Enabled());
   if (mat.NumRows() == 0) {
     // An empty source must leave *this empty too, rather than silently
     // retaining the dimensions and data of a previous copy.
     Destroy();
     return;
   }
   if (num_rows_ != mat.NumRows() || num_cols_ != mat.NumCols()) {
     Destroy();
     // Allocate first and record the dimensions only afterwards, so that
     // *this is never left with non-zero dimensions and a NULL buffer if the
     // allocation fails.  sizeof() makes the whole product a size_t.
     data_ = static_cast<I*>(
         CuDevice::Instantiate().Malloc(sizeof(I) * mat.NumRows() *
                                        mat.NumCols()));
     num_rows_ = mat.NumRows();
     num_cols_ = mat.NumCols();
     stride_ = num_cols_;  // rows are stored contiguously, with no padding.
   }

   {
     CuTimer tim;
     dim3 dimGrid, dimBlock;
     GetBlockSizesForSimpleMatrixOperation(NumRows(), NumCols(),
                                           &dimGrid, &dimBlock);

     if (scale_ == 0.0) { // scale == 0 calls a different kernel from the others.
       cuda_mat_compress_sign(dimGrid, dimBlock, mat.Data(), mat.Dim(),
                              data_, stride_);
     } else {
       cuda_mat_compress(dimGrid, dimBlock, mat.Data(), mat.Dim(),
                         data_, stride_, float(1.0 / scale_),
                         truncate_);
     }
     // Kernel launches do not return a status; pick up any launch error here.
     CU_SAFE_CALL(cudaGetLastError());

     CuDevice::Instantiate().AccuProfile(__func__, tim);
   }
 #endif
 }

 // Uncompresses the contents of *this into '*mat'.
 //
 // '*mat' must already have the same number of rows and columns as *this
 // (asserted).  If *this is empty there is nothing to copy and no kernel is
 // launched.  A launch error is reported through CU_SAFE_CALL, and the time
 // taken is accumulated in the CuDevice profile, as CopyFromMat() does.
 // Compiled without CUDA, this function does nothing.
 template <typename I>
 void CuCompressedMatrix<I>::CopyToMat(CuMatrixBase<BaseFloat> *mat) const {
 #if HAVE_CUDA == 1
   KALDI_ASSERT(CuDevice::Instantiate().Enabled());
   KALDI_ASSERT(mat->NumRows() == num_rows_ && mat->NumCols() == num_cols_);
   if (num_rows_ == 0)
     return;  // empty matrix: avoid a kernel launch with an empty grid.
   {
     CuTimer tim;
     dim3 dimGrid, dimBlock;
     GetBlockSizesForSimpleMatrixOperation(NumRows(), NumCols(),
                                           &dimGrid, &dimBlock);
     // scale_ == 0 is the case in which CopyFromMat() used the sign kernel;
     // the stored values are then uncompressed with a scale of 1.
     BaseFloat scale = (scale_ == 0.0 ? 1.0 : scale_);
     cuda_mat_uncompress(dimGrid, dimBlock, mat->Data(), mat->Dim(),
                         data_, stride_, float(scale));
     // Kernel launches do not return a status; pick up any launch error here.
     CU_SAFE_CALL(cudaGetLastError());

     CuDevice::Instantiate().AccuProfile(__func__, tim);
   }
 #endif
 }


 // Allocates a new CuCompressedMatrix<I> with the integer type I selected by
 // 't', passing both 'range' and 'truncat' on to its constructor.
 //   t        Selects uint8, int8, uint16 or int16 storage.
 //   range    Must be >= 0 for the 8-bit types and > 0 for the 16-bit types
 //            (asserted).
 //   truncat  Forwarded as the constructor's 'truncate' argument.
 // Returns a pointer allocated with 'new'.  An unknown 't' is reported with
 // KALDI_ERR.
 CuCompressedMatrixBase *NewCuCompressedMatrix(CuCompressedMatrixType t,
                                               BaseFloat range,
                                               bool truncat) {
   switch (t) {
     case kCompressedMatrixUint8:
       KALDI_ASSERT(range >= 0);
       return new CuCompressedMatrix<uint8>(range, truncat);
     case kCompressedMatrixInt8:
       KALDI_ASSERT(range >= 0);
       return new CuCompressedMatrix<int8>(range, truncat);
     case kCompressedMatrixUint16:
       KALDI_ASSERT(range > 0);
       return new CuCompressedMatrix<uint16>(range, truncat);
     case kCompressedMatrixInt16:
       KALDI_ASSERT(range > 0);
       return new CuCompressedMatrix<int16>(range, truncat);
     default:
       KALDI_ERR << "Unknown compressed-matrix type";
       return NULL;  // keeps every control path returning a value.
   }
 }


 } // namespace kaldi
kaldi
This code computes Goodness of Pronunciation (GOP) and extracts phone-level pronunciation feature for...
Definition: chain.dox:20

kaldi::CuCompressedMatrix::stride_
MatrixIndexT stride_
Definition: cu-compressed-matrix.h:132

cu-device.h

kaldi::CuCompressedMatrix::num_cols_
MatrixIndexT num_cols_
Definition: cu-compressed-matrix.h:129

kaldi::CuCompressedMatrix::num_rows_
MatrixIndexT num_rows_
Definition: cu-compressed-matrix.h:128

cu-compressed-matrix.h

kaldi::CuCompressedMatrix::CopyToMat
virtual void CopyToMat(CuMatrixBase< BaseFloat > *mat) const
Copies the contents of *this to 'mat', which should be correctly sized beforehand.
Definition: cu-compressed-matrix.cc:102

kaldi::CuCompressedMatrix::scale_
BaseFloat scale_
Definition: cu-compressed-matrix.h:117

cu-vector.h

data_
uint64 data_
Definition: arpa-lm-compiler.cc:108

timer.h

kaldi::CuCompressedMatrix::NumRows
virtual MatrixIndexT NumRows() const
Definition: cu-compressed-matrix.h:94

kaldi::BaseFloat
float BaseFloat
Definition: kaldi-types.h:29

kaldi::CuCompressedMatrix::truncate_
bool truncate_
Definition: cu-compressed-matrix.h:126

kaldi::CuCompressedMatrix::CuCompressedMatrix
CuCompressedMatrix(BaseFloat range, bool truncate=true)
Constructor which sets 'scale_' according to scale_ = range / std::numeric_limits<I>::max().
Definition: cu-compressed-matrix.cc:38

kaldi::CuCompressedMatrix::CopyFromMat
virtual void CopyFromMat(const CuMatrixBase< BaseFloat > &mat)
Sets *this to an appropriately compressed copy of 'mat', which includes resizing *this.
Definition: cu-compressed-matrix.cc:65

float

kaldi::kCompressedMatrixInt16
Definition: cu-compressed-matrix.h:143

kaldi::CuCompressedMatrix::Destroy
void Destroy()
Definition: cu-compressed-matrix.cc:50

kaldi::kCompressedMatrixUint16
Definition: cu-compressed-matrix.h:144

kaldi::CuCompressedMatrix::data_
I * data_
Definition: cu-compressed-matrix.h:106

cu-kernels.h

kaldi::CuCompressedMatrixType
CuCompressedMatrixType
Definition: cu-compressed-matrix.h:140

kaldi::CuCompressedMatrix
Class CuCompressedMatrix, templated on an integer type (expected to be one of: int8, uint8, int16, uint16), this provides a way to approximate a CuMatrix in a more memory-efficient format.
Definition: cu-compressed-matrix.h:72

KALDI_ERR
#define KALDI_ERR
Definition: kaldi-error.h:147

kaldi::CuCompressedMatrix::NumCols
virtual MatrixIndexT NumCols() const
Definition: cu-compressed-matrix.h:96

kaldi::kCompressedMatrixUint8
Definition: cu-compressed-matrix.h:142

kaldi::CuMatrixBase::Data
const Real * Data() const
Return data pointer (const).
Definition: cu-matrix.h:746

kaldi::CuMatrixBase
Matrix for CUDA computing.
Definition: matrix-common.h:69

kaldi::CuMatrixBase::NumCols
MatrixIndexT NumCols() const
Definition: cu-matrix.h:216

KALDI_ASSERT
#define KALDI_ASSERT(cond)
Definition: kaldi-error.h:185

cu-common.h

kaldi::CuMatrixBase::Dim
::MatrixDim Dim() const
Definition: cu-matrix.h:221

kaldi::kCompressedMatrixInt8
Definition: cu-compressed-matrix.h:141

kaldi::CuMatrixBase::NumRows
MatrixIndexT NumRows() const
Dimensions.
Definition: cu-matrix.h:215

kaldi::CuCompressedMatrixBase
Class CuCompressedMatrixBase is an abstract base class that allows you to compress a matrix of type C...
Definition: cu-compressed-matrix.h:35

cu-array.h

kaldi::NewCuCompressedMatrix
CuCompressedMatrixBase * NewCuCompressedMatrix(CuCompressedMatrixType t, BaseFloat range, bool truncat)
This function allocates a new CuCompressedMatrix with type determined by t, and with the 'range' and ...
Definition: cu-compressed-matrix.cc:119