doc/cu-sp-matrix-speed-test_8cc_source.html

 // cudamatrix/cu-sp-matrix-speed-test.cc

 // Copyright 2013  Johns Hopkins University (author: Daniel Povey)

 // See ../../COPYING for clarification regarding multiple authors
 //
 // Licensed under the Apache License, Version 2.0 (the "License");
 // you may not use this file except in compliance with the License.
 // You may obtain a copy of the License at
 //
 //  http://www.apache.org/licenses/LICENSE-2.0
 //
 // THIS CODE IS PROVIDED *AS IS* BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY
 // KIND, EITHER EXPRESS OR IMPLIED, INCLUDING WITHOUT LIMITATION ANY IMPLIED
 // WARRANTIES OR CONDITIONS OF TITLE, FITNESS FOR A PARTICULAR PURPOSE,
 // MERCHANTABLITY OR NON-INFRINGEMENT.
 // See the Apache 2 License for the specific language governing permissions and
 // limitations under the License.


 #include <iostream>
 #include <vector>
 #include <cstdlib>

 #include "base/kaldi-common.h"
 #include "util/common-utils.h"
 #include "cudamatrix/cu-matrix.h"
 #include "cudamatrix/cu-vector.h"
 #include "cudamatrix/cu-math.h"
 #include "cudamatrix/cu-sp-matrix.h"

 using namespace kaldi;


 namespace kaldi {

 // Returns the tag appended to benchmark names in the log output:
 // "<double>" when Real is 8 bytes wide, "<float>" for every other size.
 template<typename Real>
 std::string NameOf() {
   if (sizeof(Real) == 8) {
     return "<double>";
   }
   return "<float>";
 }

 // Times CuSpMatrix<Real>::Invert() on a dim x dim matrix and logs the
 // resulting rate.  The first pass through the loop is not a plain timing
 // pass: it runs a consistency check in which two copies of the same matrix
 // are put through identical updates and inversions and then compared.
 //
 //   dim  number of rows (and columns) of the matrix being inverted.
 template<typename Real>
 static void UnitTestCuSpMatrixInvert(int32 dim) {
   BaseFloat time_budget_secs = 0.01;  // keep looping until this much time has elapsed
   int32 num_iters = 0;
   Timer timer;
   CuSpMatrix<Real> mat(dim);
   mat.SetRandn();

   while (timer.Elapsed() < time_budget_secs) {
     KALDI_ASSERT(mat.Trace() != 0.0);  // holds with probability 1 for random input
     CuSpMatrix<Real> copy(mat);  // snapshot of mat taken before any update below

     if (num_iters == 0) {
       // First pass: apply the same AddMat2 / AddToDiag / Invert sequence to
       // mat and to its snapshot, then require that both results agree.
       // NOTE(review): the AddMat2 + AddToDiag step presumably makes the
       // matrices positive definite, which Invert() is documented to need --
       // confirm against cu-sp-matrix.cc.
       CuMatrix<Real> mat_full(mat);
       mat.AddMat2(1.0, mat_full, kTrans, 1.0);
       mat.AddToDiag(0.1 * dim);

       CuMatrix<Real> copy_full(copy);
       copy.AddMat2(1.0, copy_full, kTrans, 1.0);
       copy.AddToDiag(0.1 * dim);

       mat.Invert();
       copy.Invert();

       SpMatrix<Real> inverse_via_copy(dim);
       copy.CopyToSp(&inverse_via_copy);

       SpMatrix<Real> inverse_via_mat(mat);
       AssertEqual(inverse_via_mat, inverse_via_copy);
     } else {
       // Every later pass just inverts a fresh copy of mat, which by now holds
       // the inverse computed during the first pass.
       copy.Invert();
     }
     num_iters++;
   }

   // The reported figure counts dim^3 operations per pass.
   BaseFloat dim_f = dim;
   BaseFloat gflops = (dim_f * dim_f * dim_f * num_iters) / (timer.Elapsed() * 1.0e+09);
   KALDI_LOG << "For CuSpMatrix::Invert" << NameOf<Real>() << ", for dim = "
             << dim << ", speed was " << gflops << " gigaflops.";
 }


 // Times CuSpMatrix<Real>::CopyFromMat() from a dim x dim CuMatrix into a
 // CuSpMatrix of the same dimension and logs the resulting rate.
 //
 //   dim        number of rows (and columns) of both matrices.
 //   copy_type  forwarded unchanged to CopyFromMat(); it is also named in the
 //              log line.
 //
 // The source matrix is never filled explicitly, so the copy operates on
 // whatever the CuMatrix(dim, dim) constructor leaves in it (presumably
 // zeros -- TODO confirm).
 template<typename Real>
 static void UnitTestCuSpMatrixCopyFromMat(int32 dim, SpCopyType copy_type) {
   BaseFloat time_in_secs = 0.01;  // keep looping until this much time has elapsed
   int32 iter = 0;
   Timer tim;
   CuMatrix<Real> A(dim, dim);
   CuSpMatrix<Real> S(dim);

   for (;tim.Elapsed() < time_in_secs; iter++) {
     S.CopyFromMat(A, copy_type);
   }

   // The reported figure counts dim^2 elements per call.
   BaseFloat fdim = dim;
   BaseFloat gflops = (fdim * fdim * iter) / (tim.Elapsed() * 1.0e+09);

   // Name the copy type for the log.  kTakeMean needs its own case: without
   // it the kTakeMean run would be reported as "kTakeMeanAndCheck".
   const char *copy_type_name =
       (copy_type == kTakeLower ? "kTakeLower" :
        (copy_type == kTakeUpper ? "kTakeUpper" :
         (copy_type == kTakeMean ? "kTakeMean" :
          "kTakeMeanAndCheck")));

   KALDI_LOG << "For CuSpMatrix::CopyFromMat" << NameOf<Real>()
             << ", with copy-type " << copy_type_name << " and dim = "
             << dim << ", speed was " << gflops << " gigaflops.";
 }


 template<typename Real> void CuSpMatrixSpeedTest() {
   std::vector<int32> sizes;
   sizes.push_back(16);
   sizes.push_back(32);
   sizes.push_back(64);
   sizes.push_back(128);
   sizes.push_back(256);
   sizes.push_back(512);
   sizes.push_back(1024);
   int32 ns = sizes.size();

   for (int32 s = 0; s < ns; s++) {
     UnitTestCuSpMatrixInvert<Real>(sizes[s]);
     UnitTestCuSpMatrixCopyFromMat<Real>(sizes[s], kTakeLower);
     UnitTestCuSpMatrixCopyFromMat<Real>(sizes[s], kTakeUpper);
     UnitTestCuSpMatrixCopyFromMat<Real>(sizes[s], kTakeMean);
   }
 }


 } // namespace kaldi


 int main() {
   SetVerboseLevel(1);
   //Select the GPU
 #if HAVE_CUDA == 1
   CuDevice::Instantiate().SelectGpuId("yes"); //-2 .. automatic selection
 #endif

   kaldi::CuSpMatrixSpeedTest<float>();
 #if HAVE_CUDA == 1
   if (CuDevice::Instantiate().DoublePrecisionSupported()) {
     kaldi::CuSpMatrixSpeedTest<double>();
   } else {
     KALDI_WARN << "Double precision not supported";
   }
 #else
   kaldi::CuSpMatrixSpeedTest<double>();
 #endif
 #if HAVE_CUDA == 1
   CuDevice::Instantiate().PrintProfile();
 #endif
   KALDI_LOG << "Tests succeeded.";
 }
kaldi
This code computes Goodness of Pronunciation (GOP) and extracts phone-level pronunciation feature for...
Definition: chain.dox:20

kaldi::SpMatrix
Packed symmetric matrix class.
Definition: matrix-common.h:62

kaldi::CuPackedMatrix::Trace
Real Trace() const
Definition: cu-packed-matrix.cc:264

kaldi::NameOf
std::string NameOf()
Definition: matrix-lib-speed-test.cc:30

kaldi::CuPackedMatrix::AddToDiag
void AddToDiag(Real r)
< Set the diagonal value to alpha
Definition: cu-packed-matrix.cc:351

kaldi::int32
kaldi::int32 int32
Definition: online-tcp-source.cc:27

common-utils.h

cu-matrix.h

kaldi::CuMatrix
This class represents a matrix that's stored on the GPU if we have one, and in memory if not...
Definition: matrix-common.h:71

kaldi::CuSpMatrix::Invert
void Invert()
Note: the CuMatrix version of the Invert() function will only work for positive definite matrices; it...
Definition: cu-sp-matrix.cc:93

kaldi::CuSpMatrix
Definition: matrix-common.h:76

kaldi::CuPackedMatrix::SetRandn
void SetRandn()
< Set to unit matrix.
Definition: cu-packed-matrix.cc:75

cu-vector.h

kaldi::SpCopyType
SpCopyType
Definition: matrix-common.h:49

kaldi::kTrans
Definition: matrix-common.h:33

kaldi::SetVerboseLevel
void SetVerboseLevel(int32 i)
This should be rarely used, except by programs using Kaldi as library; command-line programs set the ...
Definition: kaldi-error.h:64

cu-sp-matrix.h

float

main
int main()
Definition: cu-sp-matrix-speed-test.cc:130

kaldi::kTakeMean
Definition: matrix-common.h:52

KALDI_WARN
#define KALDI_WARN
Definition: kaldi-error.h:150

kaldi::Timer
Definition: timer.h:63

kaldi::CuSpMatrix::CopyFromMat
void CopyFromMat(const CuMatrixBase< Real > &orig, SpCopyType copy_type=kTakeLower)
Definition: cu-sp-matrix.cc:39

kaldi::CuSpMatrix::CopyToSp
void CopyToSp(SpMatrix< Real > *dst) const
Definition: cu-sp-matrix.h:95

cu-math.h

KALDI_ASSERT
#define KALDI_ASSERT(cond)
Definition: kaldi-error.h:185

kaldi::AssertEqual
static void AssertEqual(float a, float b, float relative_tolerance=0.001)
assert abs(a - b) <= relative_tolerance * (abs(a)+abs(b))
Definition: kaldi-math.h:276

kaldi::UnitTestCuSpMatrixInvert
static void UnitTestCuSpMatrixInvert(int32 dim)
Definition: cu-sp-matrix-speed-test.cc:43

kaldi::UnitTestCuSpMatrixCopyFromMat
static void UnitTestCuSpMatrixCopyFromMat(int32 dim, SpCopyType copy_type)
Definition: cu-sp-matrix-speed-test.cc:84

kaldi::CuSpMatrixSpeedTest
void CuSpMatrixSpeedTest()
Definition: cu-sp-matrix-speed-test.cc:107

kaldi::kTakeLower
Definition: matrix-common.h:50

KALDI_LOG
#define KALDI_LOG
Definition: kaldi-error.h:153

kaldi::Timer::Elapsed
double Elapsed() const
Returns time in seconds.
Definition: timer.h:74

kaldi-common.h

kaldi::CuSpMatrix::AddMat2
void AddMat2(const Real alpha, const CuMatrixBase< Real > &M, MatrixTransposeType transM, const Real beta)
Definition: cu-sp-matrix.cc:130

kaldi::kTakeUpper
Definition: matrix-common.h:51