doc/cu-device-test_8cc_source.html

 // cudamatrix/cu-device-test.cc

 // Copyright 2015  Johns Hopkins University (author: Daniel Povey)

 // See ../../COPYING for clarification regarding multiple authors
 //
 // Licensed under the Apache License, Version 2.0 (the "License");
 // you may not use this file except in compliance with the License.
 // You may obtain a copy of the License at
 //
 //  http://www.apache.org/licenses/LICENSE-2.0
 //
 // THIS CODE IS PROVIDED *AS IS* BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY
 // KIND, EITHER EXPRESS OR IMPLIED, INCLUDING WITHOUT LIMITATION ANY IMPLIED
 // WARRANTIES OR CONDITIONS OF TITLE, FITNESS FOR A PARTICULAR PURPOSE,
 // MERCHANTABLITY OR NON-INFRINGEMENT.
 // See the Apache 2 License for the specific language governing permissions and
 // limitations under the License.


 #include <iostream>
 #include <vector>
 #include <cstdlib>

 #include "base/kaldi-common.h"
 #include "util/common-utils.h"
 #include "cudamatrix/cu-matrix.h"
 #include "cudamatrix/cu-vector.h"

 using namespace kaldi;


 namespace kaldi {


 template<typename Real>
 std::string NameOf() {
   return (sizeof(Real) == 8 ? "<double>" : "<float>");
 }

 template<typename Real> void TestCuMatrixResize(int32 size_multiple) {
   int32 num_matrices = 256;
   BaseFloat time_in_secs = 0.2;

   std::vector<std::pair<int32, int32> > sizes(num_matrices);

   for (int32 i = 0; i < num_matrices; i++) {
     int32 num_rows = RandInt(1, 10);
     num_rows *= num_rows;
     num_rows *= size_multiple;
     int32 num_cols = RandInt(1, 10);
     num_cols *= num_cols;
     num_cols *= size_multiple;
     sizes[i].first = num_rows;
     sizes[i].second = num_rows;
   }

   std::vector<CuMatrix<BaseFloat> > matrices(num_matrices);

   Timer tim;
   size_t num_floats_processed = 0;
   for (;tim.Elapsed() < time_in_secs; ) {
     int32 matrix = RandInt(0, num_matrices - 1);
     if (matrices[matrix].NumRows() == 0) {
       int32 num_rows = sizes[matrix].first,
           num_cols = sizes[matrix].second;
       matrices[matrix].Resize(num_rows, num_cols, kUndefined);
       num_floats_processed += num_rows * num_cols;
     } else {
       matrices[matrix].Resize(0, 0);
     }
   }

   BaseFloat gflops = num_floats_processed / (tim.Elapsed() * 1.0e+09);

   KALDI_LOG << "For CuMatrix::Resize" << NameOf<Real>() << ", for size_multiple = "
             << size_multiple << ", speed was " << gflops << " gigaflops.";
 }

 template <typename Real>
 void CudaMatrixResizeTest() {
   std::vector<int32> sizes;
   sizes.push_back(1);
   sizes.push_back(2);
   sizes.push_back(4);
   sizes.push_back(8);
   sizes.push_back(16);
   //sizes.push_back(24);
   //sizes.push_back(32);
   //sizes.push_back(40);

   int32 ns = sizes.size();
   for (int32 s = 0; s < ns; s++)
     TestCuMatrixResize<Real>(sizes[s]);
 }


 } // namespace kaldi


 int main() {
   SetVerboseLevel(1);
 #if HAVE_CUDA == 1
   for (int32 loop = 0; loop < 2; loop++) {
     CuDevice::Instantiate().SetDebugStrideMode(true);
     if (loop == 0)
       CuDevice::Instantiate().SelectGpuId("no");
     else
       CuDevice::Instantiate().SelectGpuId("yes");
 #endif

     kaldi::CudaMatrixResizeTest<float>();
 #if HAVE_CUDA == 1
     if (CuDevice::Instantiate().DoublePrecisionSupported()) {
       kaldi::CudaMatrixResizeTest<double>();
     } else {
       KALDI_WARN << "Double precision not supported";
     }
 #else
     kaldi::CudaMatrixResizeTest<double>();
 #endif

 #if HAVE_CUDA == 1
   }
   CuDevice::Instantiate().PrintProfile();
 #endif
   KALDI_LOG << "Tests succeeded.";
 }
kaldi
This code computes Goodness of Pronunciation (GOP) and extracts phone-level pronunciation feature for...
Definition: chain.dox:20

kaldi::kUndefined
Definition: matrix-common.h:39

kaldi::CudaMatrixResizeTest
void CudaMatrixResizeTest()
Definition: cu-device-test.cc:81

kaldi::TestCuMatrixResize
void TestCuMatrixResize(int32 size_multiple)
Definition: cu-device-test.cc:41

kaldi::NameOf
std::string NameOf()
Definition: matrix-lib-speed-test.cc:30

kaldi::int32
kaldi::int32 int32
Definition: online-tcp-source.cc:27

common-utils.h

cu-matrix.h

cu-vector.h

kaldi::SetVerboseLevel
void SetVerboseLevel(int32 i)
This should be rarely used, except by programs using Kaldi as library; command-line programs set the ...
Definition: kaldi-error.h:64

float

main
int main()
Definition: cu-device-test.cc:101

KALDI_WARN
#define KALDI_WARN
Definition: kaldi-error.h:150

kaldi::Timer
Definition: timer.h:63

rnnlm::i
int i
Definition: mikolov-rnnlm-lib.cc:66

KALDI_LOG
#define KALDI_LOG
Definition: kaldi-error.h:153

kaldi::Timer::Elapsed
double Elapsed() const
Returns time in seconds.
Definition: timer.h:74

kaldi-common.h

kaldi::RandInt
int32 RandInt(int32 min_val, int32 max_val, struct RandomState *state)
Definition: kaldi-math.cc:95