doc/cu-matrix_8h_source.html

 // cudamatrix/cu-matrix.h

 // Copyright 2009-2012  Karel Vesely
 //                2013  Johns Hopkins University (author: Daniel Povey)
 //                2013  Hainan Xu
 //                2013  Xiaohui Zhang
 //           2013-2015  Guoguo Chen
 //                2017  Shiyin Kang
 //                2019  Yiwen Shao

 // See ../../COPYING for clarification regarding multiple authors
 //
 // Licensed under the Apache License, Version 2.0 (the "License");
 // you may not use this file except in compliance with the License.
 // You may obtain a copy of the License at
 //
 //  http://www.apache.org/licenses/LICENSE-2.0
 //
 // THIS CODE IS PROVIDED *AS IS* BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY
 // KIND, EITHER EXPRESS OR IMPLIED, INCLUDING WITHOUT LIMITATION ANY IMPLIED
 // WARRANTIES OR CONDITIONS OF TITLE, FITNESS FOR A PARTICULAR PURPOSE,
 // MERCHANTABLITY OR NON-INFRINGEMENT.
 // See the Apache 2 License for the specific language governing permissions and
 // limitations under the License.


 #ifndef KALDI_CUDAMATRIX_CU_MATRIX_H_
 #define KALDI_CUDAMATRIX_CU_MATRIX_H_

 #include <cstddef>
 #include <sstream>
 #include <vector>

 #include "cudamatrix/cu-matrixdim.h"
 #include "cudamatrix/cu-common.h"
 #include "cudamatrix/cu-value.h"
 #include "matrix/matrix-common.h"
 #include "matrix/kaldi-matrix.h"
 #include "cudamatrix/cu-array.h"
 #include "cudamatrix/cu-math.h"
 #include "cudamatrix/cu-rand.h"
 #include "cudamatrix/cu-sparse-matrix.h"

 namespace kaldi {

 template<typename Real>
 Real TraceMatMat(const CuMatrixBase<Real> &A, const CuMatrixBase<Real> &B,
                  MatrixTransposeType trans = kNoTrans);

 template<typename Real>
 void AddMatMatBatched(const Real alpha, std::vector<CuSubMatrix<Real>* > &C,
                       const std::vector<CuSubMatrix<Real>* > &A,
                       MatrixTransposeType transA,
                       const std::vector<CuSubMatrix<Real>* > &B,
                       MatrixTransposeType transB,
                       const Real beta);

 /*
 template<typename Real>
 struct MatrixElement {
   int row;
   int column;
   Real weight;
 };
 // */

 template<typename Real>
 class CuMatrixBase {
  public:
   friend class CuMatrixBase<float>;
   friend class CuMatrixBase<double>;
   friend class CuVectorBase<float>;
   friend class CuVectorBase<double>;
   friend class VectorBase<Real>;
   friend class CuSpMatrix<Real>;
   friend class CuTpMatrix<float>;
   friend class CuTpMatrix<double>;
   friend class CuVectorBase<Real>;
   friend class CuSubMatrix<Real>;
   friend class CuRand<Real>;
   friend class CuSubVector<Real>;
   friend class CuBlockMatrix<Real>;
   friend class CuSparseMatrix<float>;
   friend class CuSparseMatrix<double>;
   friend class CuSparseMatrix<Real>;

   void CopyCols(const CuMatrixBase<Real> &src,
                 const CuArrayBase<MatrixIndexT> &indexes);


   void AddCols(const CuMatrixBase<Real> &src,
                const CuArrayBase<MatrixIndexT> &indices);

   void CopyRows(const CuMatrixBase<Real> &src,
                 const CuArrayBase<MatrixIndexT> &indexes);

   void CopyRows(const CuArrayBase<const Real*> &src);

   void CopyToRows(const CuArrayBase<Real*> &dst) const;

   // Does for each row r, this.Row(r) += alpha * src.row(indexes[r]).
   void AddRows(Real alpha,
                const CuMatrixBase<Real> &src,
                const CuArrayBase<MatrixIndexT> &indexes);


   void MulRows(const CuMatrixBase<Real> &src,
                const CuArrayBase<MatrixIndexT> &indexes);


   void AddRows(Real alpha,
                const CuArrayBase<const Real*> &src);


   void AddToRows(Real alpha,
                  const CuArrayBase<MatrixIndexT> &indexes,
                  CuMatrixBase<Real> *dst) const;


   void AddToRows(Real alpha, const CuArrayBase<Real*> &dst) const;


   void SumColumnRanges(const CuMatrixBase<Real> &src,
                        const CuArrayBase<Int32Pair> &indexes);


   // For each row r of *this and for each column c, does
   // (*this)(r, c) += src(j, c), where j runs over a range of rows of src
   // selected by indexes[r].
   // NOTE(review): presumably the pair is a half-open [first, second) range --
   // confirm against the implementation.
   void AddRowRanges(const CuMatrixBase<Real> &src,
                     const CuArrayBase<Int32Pair> &indexes);


   friend Real TraceMatMat<Real>(const CuMatrixBase<Real> &A,
                                 const CuMatrixBase<Real> &B,
                                 MatrixTransposeType trans);

   friend Real TraceMatSmat<Real>(const CuMatrixBase<Real> &A,
                                  const CuSparseMatrix<Real> &B,
                                  MatrixTransposeType trans);

   friend void AddMatMatBatched<Real>(const Real alpha,
                                      std::vector<CuSubMatrix<Real>* > &C,
                                      const std::vector<CuSubMatrix<Real>* > &A,
                                      MatrixTransposeType transA,
                                      const std::vector<CuSubMatrix<Real>* > &B,
                                      MatrixTransposeType transB,
                                      const Real beta);

   // Adds "value" to the diagonal elements of the matrix.
   void AddToDiag(Real value);

   MatrixIndexT NumRows() const { return num_rows_;  }
   MatrixIndexT NumCols() const { return num_cols_;  }
   MatrixIndexT Stride() const { return stride_; }

   // Packs the matrix geometry into a ::MatrixDim, the struct ("rows", "cols",
   // "stride") that most CUDA kernels take as an argument.
   ::MatrixDim Dim() const {
     const ::MatrixDim geometry = { num_rows_, num_cols_, stride_ };
     return geometry;
   }

   // Frobenius norm, computed as sqrt(TraceMatMat(*this, *this, kTrans)).
   Real FrobeniusNorm() const {
     const Real trace_self = TraceMatMat(*this, *this, kTrans);
     return sqrt(trace_self);
   }

   bool IsUnit(Real tol = 0.001) const;

   bool ApproxEqual(const CuMatrixBase<Real> &other, float tol = 0.01) const;

   // Returns num_rows_ * stride_ * sizeof(Real), i.e. the byte count based on
   // the stride rather than on num_cols_.
   // NOTE(review): num_rows_ * stride_ is multiplied in MatrixIndexT and the
   // result is returned as MatrixIndexT, so very large matrices may overflow or
   // be truncated -- confirm whether callers need a wider return type.
   MatrixIndexT SizeInBytes() const { return num_rows_*stride_*sizeof(Real); }

   // Copy functions.  These do not resize.
   template<typename OtherReal>
   void CopyFromMat(const MatrixBase<OtherReal> &src,
                    MatrixTransposeType trans = kNoTrans);


   void CopyFromGeneralMat(const GeneralMatrix &src,
                           MatrixTransposeType trans = kNoTrans);

   void CopyFromMat(const MatrixBase<Real> &src,
                    MatrixTransposeType trans = kNoTrans);

   void CopyFromSp(const CuSpMatrix<Real> &M);

   template<typename OtherReal>
   void CopyFromTp(const CuTpMatrix<OtherReal> &M,
                   MatrixTransposeType trans = kNoTrans);

   // This function will copy from source rows (start_range, end_range]
   // if the range is outside of the clamped region then the clamped
   // row will be replicated across the out of range areas
   void CopyRangeFromMatClamped(const CuMatrixBase<Real> & src,
       int32_t start_range, int32_t end_range,
       int32_t clamp_low, int32_t clamp_high);

   template<typename OtherReal>
   void CopyFromMat(const CuMatrixBase<OtherReal> &M,
                    MatrixTransposeType trans = kNoTrans);

   template<typename OtherReal>
   void CopyToMat(MatrixBase<OtherReal> *dst,
                  MatrixTransposeType trans = kNoTrans) const;

   void CopyRowsFromVec(const CuVectorBase<Real> &v);

   void CopyRowsFromVec(const VectorBase<Real> &v);

   void CopyColsFromVec(const CuVectorBase<Real> &v);

   void CopyColFromVec(const CuVectorBase<Real> &v, const MatrixIndexT col);

   void Sigmoid(const CuMatrixBase<Real> &src);

   void Heaviside(const CuMatrixBase<Real> &src);

   void Exp(const CuMatrixBase<Real> &src);

   void Log(const CuMatrixBase<Real> &src);

   void Pow(const CuMatrixBase<Real> &src, Real power);

   void PowAbs(const CuMatrixBase<Real> &src, Real power, bool include_sign=false);

   void Floor(const CuMatrixBase<Real> &src, Real floor_val);

   void Ceiling(const CuMatrixBase<Real> &src, Real ceiling_val);

   // This is equivalent to running:
   //   Floor(src, lower_limit); Ceiling(src, upper_limit); Exp(src)
   void ExpLimited(const CuMatrixBase<Real> &src, Real lower_limit, Real upper_limit);

   void ExpSpecial(const CuMatrixBase<Real> &src);

   void SoftMaxPerRow(const CuMatrixBase<Real> &src);

   void LogSoftMaxPerRow(const CuMatrixBase<Real> &src);


   // Apply the function y = log(1 + exp(x)), to each element.
   void SoftHinge(const CuMatrixBase<Real> &src);

   void GroupPnorm(const CuMatrixBase<Real> &src, Real pow);

   void DiffGroupPnorm(const CuMatrixBase<Real> &in_value,
                       const CuMatrixBase<Real> &out_value,
                       const CuMatrixBase<Real> &out_deriv, Real power);

   // Apply the function y(i) = max_{j = i*G}^{(i+1)*G-1} x_j, where
   // G = x.NumCols() / y.NumCols() must be an integer.
   void GroupMax(const CuMatrixBase<Real> &src);

   void GroupMaxDeriv(const CuMatrixBase<Real> &input,
                      const CuMatrixBase<Real> &output);

   void ParametricRelu(const CuMatrixBase<Real> &src,
                       const CuVectorBase<Real> &alpha,
                       const CuVectorBase<Real> &beta);

   void DiffParametricRelu(const CuMatrixBase<Real> &value,
                           const CuMatrixBase<Real> &diff,
                           const CuVectorBase<Real> &alpha,
                           const CuVectorBase<Real> &beta);

   void Tanh(const CuMatrixBase<Real> &src);

   void DiffSigmoid(const CuMatrixBase<Real> &value,
                    const CuMatrixBase<Real> &diff);

   void DiffTanh(const CuMatrixBase<Real> &value,
                 const CuMatrixBase<Real> &diff);

   void DiffSoftmaxPerRow(const CuMatrixBase<Real> &value,
                          const CuMatrixBase<Real> &diff);

   void DiffLogSoftmaxPerRow(const CuMatrixBase<Real> &out_value,
                             const CuMatrixBase<Real> &out_deriv);

   void DiffXent(const CuArrayBase<int32> &tgt,
                 CuVector<Real> *log_post_tgt);

   void Cholesky(CuMatrixBase<Real> *inv_cholesky = NULL);


   void SymInvertPosDef();

   // In-place convenience wrappers.  Each one calls the corresponding
   // source-to-destination member with *this as both source and destination.

   // In-place Pow().
   void ApplyPow(Real power) {
     this->Pow(*this, power);
   }


   // In-place PowAbs().
   void ApplyPowAbs(Real power, bool include_sign=false) {
     this->PowAbs(*this, power, include_sign);
   }

   // In-place Heaviside().
   void ApplyHeaviside() {
     this->Heaviside(*this);
   }

   // In-place Floor().
   void ApplyFloor(Real floor_val) {
     this->Floor(*this, floor_val);
   }

   // In-place Ceiling().
   void ApplyCeiling(Real ceiling_val) {
     this->Ceiling(*this, ceiling_val);
   }

   // In-place Exp().
   void ApplyExp() {
     this->Exp(*this);
   }


   // In-place ExpLimited().
   void ApplyExpLimited(Real lower_limit, Real upper_limit) {
     this->ExpLimited(*this, lower_limit, upper_limit);
   }

   // In-place ExpSpecial().
   void ApplyExpSpecial() {
     this->ExpSpecial(*this);
   }

   // In-place SoftMaxPerRow().
   void ApplySoftMaxPerRow() {
     this->SoftMaxPerRow(*this);
   }

   // In-place LogSoftMaxPerRow().
   void ApplyLogSoftMaxPerRow() {
     this->LogSoftMaxPerRow(*this);
   }

   // In-place Log().
   void ApplyLog() {
     this->Log(*this);
   }

   void FindRowMaxId(CuArray<int32> *id) const;

   void SetZero();
   void Set(Real value);
   void Add(Real value);
   void SetZeroAboveDiag();
   void Scale(Real value);

   void MulElements(const CuMatrixBase<Real> &A);
   void DivElements(const CuMatrixBase<Real> &A);
   void Max(const CuMatrixBase<Real> &A);
   void Min(const CuMatrixBase<Real> &A);
   void MulColsVec(const CuVectorBase<Real> &scale);
   void MulRowsVec(const CuVectorBase<Real> &scale);
   void MulRowsGroupMat(const CuMatrixBase<Real> &src);
   // Divides the i'th row of *this by div(i).
   void DivRowsVec(const CuVectorBase<Real> &div);
   void InvertElements();
   // *this += alpha * A
   // NOTE(review): presumably A is used transposed when trans == kTrans --
   // confirm against the implementation.
   void AddMat(Real alpha, const CuMatrixBase<Real> &A,
               MatrixTransposeType trans = kNoTrans);

   // *this += alpha * A, where A is a CuSparseMatrix.
   void AddSmat(Real alpha, const CuSparseMatrix<Real> &A,
               MatrixTransposeType trans = kNoTrans);

   // (*this) = alpha * op(A) * B + beta * (*this), where A is sparse.
   void AddSmatMat(Real alpha, const CuSparseMatrix<Real> &A,
                   MatrixTransposeType transA, const CuMatrixBase<Real> &B,
                   Real beta);

   void AddMatSmat(Real alpha, const CuMatrixBase<Real> &A,
                   const CuSparseMatrix<Real> &B, MatrixTransposeType transB,
                   Real beta);


   void AddToElements(Real alpha, const CuArrayBase<int32> &elements);


   void AddMatBlocks(Real alpha, const CuMatrixBase<Real> &A,
                     MatrixTransposeType trans = kNoTrans);

   // (for each column c of *this), c = alpha * col + beta * c
   void AddVecToCols(Real alpha, const CuVectorBase<Real> &col, Real beta = 1.0);
   void AddVecToRows(Real alpha, const CuVectorBase<Real> &row, Real beta = 1.0);
   void AddMatMat(Real alpha, const CuMatrixBase<Real> &A, MatrixTransposeType transA,
                  const CuMatrixBase<Real> &B, MatrixTransposeType transB, Real beta);
   void AddVecVec(Real alpha, const CuVectorBase<Real> &x, const CuVectorBase<Real> &y);
   void SetMatMatDivMat(const CuMatrixBase<Real> &A, const CuMatrixBase<Real> &B, const CuMatrixBase<Real> &C);

   void SymAddMat2(const Real alpha, const CuMatrixBase<Real> &M,
                   MatrixTransposeType transA, Real beta);


   // This function is like AddMatMat but for where the second argument is of
   // type CuBlockMatrix.
   void AddMatBlock(Real alpha, const CuMatrixBase<Real> &A, MatrixTransposeType transA,
                    const CuBlockMatrix<Real> &B, MatrixTransposeType transB, Real beta);

   void AddDiagVecMat(const Real alpha, const CuVectorBase<Real> &v,
                      const CuMatrixBase<Real> &M, MatrixTransposeType transM,
                      Real beta = 1.0);

   // *this = beta * *this + alpha * M  * diag(v) [or M^T].
   // The same as adding M but scaling each column M_j by v(j).
   void AddMatDiagVec(const Real alpha,
                      const CuMatrixBase<Real> &M, MatrixTransposeType transM,
                      CuVectorBase<Real> &v,
                      Real beta = 1.0);

   // *this = beta * *this + alpha * A .* B
   // (.* denotes element-by-element multiplication).
   void AddMatMatElements(const Real alpha,
                          const CuMatrixBase<Real>& A,
                          const CuMatrixBase<Real>& B,
                          const Real beta);

   void AddMatSp(const Real alpha,
                 const CuMatrixBase<Real> &A, MatrixTransposeType transA,
                 const CuSpMatrix<Real> &B,
                 const Real beta) {
     CuMatrix<Real> M(B);
     return AddMatMat(alpha, A, transA, M, kNoTrans, beta);
   }

   void AddSpMat(const Real alpha,
                 const CuSpMatrix<Real> &A,
                 const CuMatrixBase<Real> &B, MatrixTransposeType transB,
                 const Real beta) {
     CuMatrix<Real> M(A);
     return AddMatMat(alpha, M, kNoTrans, B, transB, beta);
   }

   void AddTpMat(const Real alpha,
                 const CuTpMatrix<Real> &A, MatrixTransposeType transA,
                 const CuMatrixBase<Real> &B, MatrixTransposeType transB,
                 const Real beta) {
     CuMatrix<Real> M(A);
     return AddMatMat(alpha, M, transA, B, transB, beta);
   }

   void AddMatTp(const Real alpha,
                 const CuMatrixBase<Real> &A, MatrixTransposeType transA,
                 const CuTpMatrix<Real> &B, MatrixTransposeType transB,
                 const Real beta) {
     CuMatrix<Real> M(B);
     return AddMatMat(alpha, A, transA, M, transB, beta);
   }

   void CopyFromBlock(const CuBlockMatrix<Real> &B,
                      MatrixTransposeType trans = kNoTrans);
   void CopyLowerToUpper();
   void CopyUpperToLower();
   // Builds a CuSubMatrix of *this; the row/column offsets and extents are
   // forwarded unchanged to the CuSubMatrix constructor.
   inline CuSubMatrix<Real> Range(const MatrixIndexT row_offset,
                                  const MatrixIndexT num_rows,
                                  const MatrixIndexT col_offset,
                                  const MatrixIndexT num_cols) const {
     CuSubMatrix<Real> window(*this, row_offset, num_rows,
                              col_offset, num_cols);
     return window;
   }
   // Builds a CuSubMatrix of *this restricted to the given rows; the column
   // arguments passed on are offset 0 and extent num_cols_.
   inline CuSubMatrix<Real> RowRange(const MatrixIndexT row_offset,
                                     const MatrixIndexT num_rows) const {
     CuSubMatrix<Real> rows_only(*this, row_offset, num_rows, 0, num_cols_);
     return rows_only;
   }
   // Builds a CuSubMatrix of *this restricted to the given columns; the row
   // arguments passed on are offset 0 and extent num_rows_.
   inline CuSubMatrix<Real> ColRange(const MatrixIndexT col_offset,
                                     const MatrixIndexT num_cols) const {
     CuSubMatrix<Real> cols_only(*this, 0, num_rows_, col_offset, num_cols);
     return cols_only;
   }

   // Returns a CuSubVector built from the start of row i and NumCols().
   // The row index is range-checked with KALDI_ASSERT.  The element offset is
   // computed in std::ptrdiff_t: evaluating i * stride_ in MatrixIndexT could
   // overflow for very large matrices.
   inline const CuSubVector<Real> Row(MatrixIndexT i) const {
     KALDI_ASSERT(static_cast<UnsignedMatrixIndexT>(i) <
                  static_cast<UnsignedMatrixIndexT>(num_rows_));
     const std::ptrdiff_t row_start =
         static_cast<std::ptrdiff_t>(i) * static_cast<std::ptrdiff_t>(stride_);
     return CuSubVector<Real>(data_ + row_start, NumCols());
   }

   // Non-const overload: returns a CuSubVector built from the start of row i
   // and NumCols().  The row index is range-checked with KALDI_ASSERT.  The
   // element offset is computed in std::ptrdiff_t: evaluating i * stride_ in
   // MatrixIndexT could overflow for very large matrices.
   inline CuSubVector<Real> Row(MatrixIndexT i) {
     KALDI_ASSERT(static_cast<UnsignedMatrixIndexT>(i) <
                  static_cast<UnsignedMatrixIndexT>(num_rows_));
     const std::ptrdiff_t row_start =
         static_cast<std::ptrdiff_t>(i) * static_cast<std::ptrdiff_t>(stride_);
     return CuSubVector<Real>(data_ + row_start, NumCols());
   }

   // Element access: returns a CuValue<Real> wrapping the address of element
   // (r, c).  Indices are checked only by KALDI_PARANOID_ASSERT.  The offset
   // is computed in std::ptrdiff_t: evaluating r * stride_ in MatrixIndexT
   // could overflow for very large matrices.
   inline CuValue<Real> operator() (MatrixIndexT r, MatrixIndexT c) {
     KALDI_PARANOID_ASSERT(static_cast<UnsignedMatrixIndexT>(r) <
                           static_cast<UnsignedMatrixIndexT>(num_rows_) &&
                           static_cast<UnsignedMatrixIndexT>(c) <
                           static_cast<UnsignedMatrixIndexT>(num_cols_));
     const std::ptrdiff_t offset =
         static_cast<std::ptrdiff_t>(r) * static_cast<std::ptrdiff_t>(stride_)
         + c;
     return CuValue<Real>(data_ + offset);
   }

   // Const element access: builds a CuValue<Real> for element (r, c) and
   // returns it converted to Real.  Indices are checked only by
   // KALDI_PARANOID_ASSERT.  The offset is computed in std::ptrdiff_t:
   // evaluating r * stride_ in MatrixIndexT could overflow for very large
   // matrices.
   inline Real operator() (MatrixIndexT r, MatrixIndexT c) const {
     KALDI_PARANOID_ASSERT(static_cast<UnsignedMatrixIndexT>(r) <
                           static_cast<UnsignedMatrixIndexT>(num_rows_) &&
                           static_cast<UnsignedMatrixIndexT>(c) <
                           static_cast<UnsignedMatrixIndexT>(num_cols_));
     const std::ptrdiff_t offset =
         static_cast<std::ptrdiff_t>(r) * static_cast<std::ptrdiff_t>(stride_)
         + c;
     return CuValue<Real>(data_ + offset);  // will be casted to Real.
   }

   Real Sum() const;
   Real Max() const;
   Real Min() const;

   // Return the trace. If check_square = true, will crash if matrix is not
   // square.
   Real Trace(bool check_square = true) const;

   void SetRandn();

   void SetRandUniform();

   void Write(std::ostream &os, bool binary) const;

   // This function adds a list of MatrixElements (scaled by alpha) to the
   // corresponding locations of (*this).
   void AddElements(Real alpha, const std::vector<MatrixElement<Real> >& input);

   // For each i, with indexes[i] = (j, k), does (*this)(j, k) += input[i].
   // Requires, but does not check, that the vector of indexes does not contain
   // repeated elements, 'input' is the start of an array of length equal to
   // indexes.Dim(), which is located on GPU memory if we are using the GPU.
   void AddElements(Real alpha, const CuArrayBase<Int32Pair> &indexes,
                    const Real *input);

   // This function requires that 'output' is a host array and is allocated with size
   // of indexes.size(), and for each element of 'indexes' it interprets it as
   // a (row, column) index into *this, and puts (*this)(row, column) into
   // the corresponding element of 'output'.
   void Lookup(const std::vector<Int32Pair> &indexes,
               Real *output) const;

   // CUDA version of Lookup, would be called internally by the above function.
   void Lookup(const CuArrayBase<Int32Pair> &indexes,
               Real *output) const;

   // Creates binary mask with per-element equality predicates of *this, mat.
   // Output stored to 'mask', values : 1.0 = equal, 0.0 = not-equal.
   void EqualElementMask(const CuMatrixBase<Real> &mat, CuMatrix<Real> *mask) const;


   // Pointer to the first element of row r (no range check is done here).
   // The offset is computed in std::ptrdiff_t: evaluating r * stride_ in
   // MatrixIndexT could overflow for very large matrices.
   inline const Real* RowData(MatrixIndexT r) const {
     return data_ + static_cast<std::ptrdiff_t>(r) *
                        static_cast<std::ptrdiff_t>(stride_);
   }
   inline Real* RowData(MatrixIndexT r) {
     return data_ + static_cast<std::ptrdiff_t>(r) *
                        static_cast<std::ptrdiff_t>(stride_);
   }
   // Return data pointer (const and non-const overloads).
   inline const Real *Data() const { return data_; }
   inline Real *Data() { return data_; }

   // The following two functions should only be called if we did not compile
   // with CUDA or could not get a CUDA card; in that case the contents are
   // interpreted the same as a regular matrix.  DON'T USE THESE UNLESS YOU KNOW
   // WHAT YOU ARE DOING!
   // Reinterprets this object in place as a MatrixBase<Real>; no data is
   // copied.  Const and non-const overloads.
   inline const MatrixBase<Real> &Mat() const {
     const MatrixBase<Real> *as_host_matrix =
         reinterpret_cast<const MatrixBase<Real>* >(this);
     return *as_host_matrix;
   }
   inline MatrixBase<Real> &Mat() {
     MatrixBase<Real> *as_host_matrix =
         reinterpret_cast<MatrixBase<Real>* >(this);
     return *as_host_matrix;
   }

  protected:

   // The constructors are protected to prevent the user creating an instance of
   // this class (you should create a child class CuMatrix or CuSubMatrix).

   // Default constructor: null data pointer and all dimensions zero.
   CuMatrixBase(): data_(NULL), num_cols_(0), num_rows_(0), stride_(0) { }

   // Stores the given pointer and dimensions as-is; this constructor itself
   // neither allocates nor copies anything.
   CuMatrixBase(Real *data,
                MatrixIndexT num_rows,
                MatrixIndexT num_cols,
                MatrixIndexT stride):
   data_(data), num_cols_(num_cols), num_rows_(num_rows), stride_(stride) { }

   Real *data_;
   // Note: it might seem a bit backwards that we have the number of columns
   // first here; it's necessary because we need the data to be laid out the same
   // as for MatrixBase so the Mat() function call will work.  We don't want to
   // change the layout of MatrixBase at this point, or there will be crashes if
   // people don't thoroughly recompile.
   MatrixIndexT num_cols_;
   MatrixIndexT num_rows_;
   MatrixIndexT stride_;

  private:
   KALDI_DISALLOW_COPY_AND_ASSIGN(CuMatrixBase);
 }; // class CuMatrixBase

 // Resizable matrix class built on CuMatrixBase<Real>.  It adds construction
 // from other matrix types, assignment, Resize/Swap/Read, and a destructor
 // that calls Destroy().
 template<typename Real>
 class CuMatrix: public CuMatrixBase<Real> {
  public:

   // Default constructor; the base-class default constructor does the work.
   CuMatrix() { }

   // Constructor with memory initialisation: forwards all arguments to
   // Resize().
   CuMatrix(MatrixIndexT rows, MatrixIndexT cols,
            MatrixResizeType resize_type = kSetZero,
            MatrixStrideType stride_type = kDefaultStride) {
     this->Resize(rows, cols, resize_type, stride_type);
   }

   // Copy constructor.  Deliberately not "explicit": that keyword had to be
   // removed due to problems with STL vectors of CuMatrixBase.
   CuMatrix(const CuMatrix<Real> &other,
            MatrixTransposeType trans = kNoTrans);

   // Construct from a CuBlockMatrix.
   explicit CuMatrix(const CuBlockMatrix<Real> &other,
                     MatrixTransposeType trans = kNoTrans);

   // Construct from any CuMatrixBase of the same element type.
   explicit CuMatrix(const CuMatrixBase<Real> &other,
                     MatrixTransposeType trans = kNoTrans);

   // Construct from a MatrixBase of a possibly different element type.
   template<typename OtherReal>
   explicit CuMatrix(const MatrixBase<OtherReal> &other,
                     MatrixTransposeType trans = kNoTrans);

   // Copy constructor taking SpMatrix: resizes to NumRows() x NumRows()
   // without initialising the contents, then fills them with CopyFromSp().
   explicit CuMatrix(const CuSpMatrix<Real> &M) : CuMatrixBase<Real>() {
     const MatrixIndexT dim = M.NumRows();
     this->Resize(dim, dim, kUndefined);
     this->CopyFromSp(M);
   }

   // Copy constructor taking TpMatrix: resizes to NumCols() x NumRows()
   // without initialising the contents, then fills them with CopyFromTp().
   template <typename OtherReal>
   explicit CuMatrix(const CuTpMatrix<OtherReal> & M,
                     MatrixTransposeType trans = kNoTrans) : CuMatrixBase<Real>() {
     this->Resize(M.NumCols(), M.NumRows(), kUndefined);
     this->CopyFromTp(M, trans);
   }

   // Construct from a CuMatrixBase of a possibly different element type.
   template<typename OtherReal>
   explicit CuMatrix(const CuMatrixBase<OtherReal> &M,
                     MatrixTransposeType trans = kNoTrans);

   // Assignment from any CuMatrixBase: resize to other's dimensions (contents
   // left undefined), then copy the elements.
   CuMatrix<Real> &operator = (const CuMatrixBase<Real> &other) {
     const MatrixIndexT rows = other.NumRows();
     const MatrixIndexT cols = other.NumCols();
     this->Resize(rows, cols, kUndefined);
     this->CopyFromMat(other);
     return *this;
   }

   // Copy assignment: resize to other's dimensions (contents left undefined),
   // then copy the elements.
   CuMatrix<Real> &operator = (const CuMatrix<Real> &other) {
     const MatrixIndexT rows = other.NumRows();
     const MatrixIndexT cols = other.NumCols();
     this->Resize(rows, cols, kUndefined);
     this->CopyFromMat(other);
     return *this;
   }

   // Assignment from a MatrixBase: resize to other's dimensions (contents
   // left undefined), then copy the elements.
   CuMatrix<Real> &operator = (const MatrixBase<Real> &other) {
     const MatrixIndexT rows = other.NumRows();
     const MatrixIndexT cols = other.NumCols();
     this->Resize(rows, cols, kUndefined);
     this->CopyFromMat(other);
     return *this;
   }

   void Transpose();

   void Resize(MatrixIndexT rows, MatrixIndexT cols,
               MatrixResizeType resize_type = kSetZero,
               MatrixStrideType stride_type = kDefaultStride);

   void Swap(Matrix<Real> *mat);
   void Swap(CuMatrix<Real> *mat);

   template<typename OtherReal>
   void Swap(CuMatrix<OtherReal> *mat);

   void Read(std::istream &is, bool binary);

   // The destructor hands clean-up to the private Destroy().
   ~CuMatrix() { Destroy(); }

   // Reinterprets this object in place as a Matrix<Real>; no data is copied.
   // Const and non-const overloads.
   inline const Matrix<Real> &Mat() const {
     const Matrix<Real> *as_host_matrix =
         reinterpret_cast<const Matrix<Real>* >(this);
     return *as_host_matrix;
   }
   inline Matrix<Real> &Mat() {
     Matrix<Real> *as_host_matrix = reinterpret_cast<Matrix<Real>* >(this);
     return *as_host_matrix;
   }

   void CompObjfAndDeriv(const std::vector<MatrixElement<Real> > &elements,
                         const CuMatrix<Real> &A,
                         Real *tot_objf,
                         Real *tot_weight);

  private:
   void Destroy();
 };


 // Matrix type that is constructed from an existing CuMatrixBase (plus
 // offsets and extents) or from a raw data pointer with explicit dimensions.
 // Copy construction copies the data pointer and dimensions only; copy
 // assignment is declared private.
 template<typename Real>
 class CuSubMatrix: public CuMatrixBase<Real> {
  public:
   // Sub-range of 'mat' described by row/column offsets and extents.
   inline CuSubMatrix(const CuMatrixBase<Real> &mat,
                      const MatrixIndexT row_offset,
                      const MatrixIndexT num_rows,
                      const MatrixIndexT col_offset,
                      const MatrixIndexT num_cols);

   // This constructor should be used with caution; it can be used for
   // constructing 'fake' submatrices if you want to play with
   // the stride. 'data' should point to GPU data if you're using the
   // GPU.
   inline CuSubMatrix(const Real *data,
                      const MatrixIndexT num_rows,
                      const MatrixIndexT num_cols,
                      const MatrixIndexT stride);

   // Copy constructor: copies the data pointer and dimensions of 'other'.
   // Declared with the injected class name rather than 'CuSubMatrix<Real>',
   // because a template-id is not a valid constructor name in C++20.
   inline CuSubMatrix(const CuSubMatrix &other):
   CuMatrixBase<Real> (other.data_, other.num_rows_, other.num_cols_,
                       other.stride_) {}
  private:
   // Copy assignment is declared private so that user code cannot call it.
   CuSubMatrix<Real> &operator = (const CuSubMatrix<Real> &other);
 };


 // Free-function form of CuMatrixBase::ApproxEqual: returns
 // A.ApproxEqual(B, tol).
 template<typename Real>
 bool ApproxEqual(const CuMatrixBase<Real> &A,
                  const CuMatrixBase<Real> &B, Real tol = 0.01) {
   const bool within_tolerance = A.ApproxEqual(B, tol);
   return within_tolerance;
 }

 // Asserts, via KALDI_ASSERT, that A.ApproxEqual(B, tol) holds.
 template<typename Real>
 inline void AssertEqual(const CuMatrixBase<Real> &A,
                         const CuMatrixBase<Real> &B, float tol = 0.01) {
   KALDI_ASSERT(A.ApproxEqual(B, tol));
 }

 // True when M and N have the same number of rows and the same number of
 // columns (the stride is not compared).
 template<typename Real>
 bool SameDim(const CuMatrixBase<Real> &M, const CuMatrixBase<Real> &N) {
   if (M.NumRows() != N.NumRows()) return false;
   return M.NumCols() == N.NumCols();
 }

 // True when M and N agree in number of rows, number of columns and stride.
 template<typename Real>
 bool SameDimAndStride(const CuMatrixBase<Real> &M, const CuMatrixBase<Real> &N) {
   if (M.NumRows() != N.NumRows()) return false;
   if (M.NumCols() != N.NumCols()) return false;
   return M.Stride() == N.Stride();
 }

 template<typename Real>
 std::ostream &operator << (std::ostream &out, const CuMatrixBase<Real> &mat);


 // Constructs a Matrix from a CuMatrixBase, optionally transposed.  Storage
 // is set up with Init(), using M's dimensions as they are when
 // trans == kNoTrans and swapped otherwise; the contents are then filled in
 // by M.CopyToMat().
 template<typename Real>
 template<typename OtherReal>
 Matrix<Real>::Matrix(const CuMatrixBase<OtherReal> &M,
                      MatrixTransposeType trans) {
   const bool keep_layout = (trans == kNoTrans);
   const MatrixIndexT out_rows = keep_layout ? M.NumRows() : M.NumCols();
   const MatrixIndexT out_cols = keep_layout ? M.NumCols() : M.NumRows();
   Init(out_rows, out_cols, kDefaultStride);
   M.CopyToMat(this, trans);
 }

 // Copies the contents of a CuMatrixBase into this matrix by delegating to
 // cu.CopyToMat(this, trans).  No resizing is done in this function itself.
 template<typename Real>
 template<typename OtherReal>
 void MatrixBase<Real>::CopyFromMat(const CuMatrixBase<OtherReal> &cu,
                                    MatrixTransposeType trans) {
   cu.CopyToMat(this, trans);
 }


 }  // namespace


 #include "cudamatrix/cu-matrix-inl.h"

 #endif
kaldi::CuMatrixBase::Mat
const MatrixBase< Real > & Mat() const
Definition: cu-matrix.h:755

kaldi::CuMatrixBase::Row
CuSubVector< Real > Row(MatrixIndexT i)
Definition: cu-matrix.h:676

kaldi::CuRand
Definition: cu-common.h:152

kaldi::CuMatrixBase::Mat
MatrixBase< Real > & Mat()
Definition: cu-matrix.h:758

kaldi::CuMatrixBase::CopyFromMat
void CopyFromMat(const MatrixBase< OtherReal > &src, MatrixTransposeType trans=kNoTrans)
Definition: cu-matrix.cc:344

kaldi
This code computes Goodness of Pronunciation (GOP) and extracts phone-level pronunciation feature for...
Definition: chain.dox:20

kaldi::CuMatrixBase::Stride
MatrixIndexT Stride() const
Definition: cu-matrix.h:217

kaldi::CuMatrixBase::Data
Real * Data()
Return data pointer.
Definition: cu-matrix.h:749

kaldi::Matrix::Matrix
Matrix()
Empty constructor.
Definition: kaldi-matrix-inl.h:29

kaldi::CuMatrixBase::ApplyCeiling
void ApplyCeiling(Real ceiling_val)
Definition: cu-matrix.h:455

cu-rand.h

kaldi::GeneralMatrix
This class is a wrapper that enables you to store a matrix in one of three forms: either as a Matrix<...
Definition: sparse-matrix.h:282

kaldi::CuMatrixBase::SoftHinge
void SoftHinge(const CuMatrixBase< Real > &src)
Apply the function y = log(1 + exp(x)), to each element.
Definition: cu-matrix.cc:1555

kaldi::CuMatrixBase::ApplyPow
void ApplyPow(Real power)
Definition: cu-matrix.h:438

kaldi::kUndefined
Definition: matrix-common.h:39

kaldi::CuMatrixBase::Trace
Real Trace(bool check_square=true) const
Return the trace. If check_square = true, will crash if matrix is not square.
Definition: cu-matrix.cc:3075

kaldi::MatrixResizeType
MatrixResizeType
Definition: matrix-common.h:37

kaldi::CuMatrixBase::GroupMax
void GroupMax(const CuMatrixBase< Real > &src)
Apply the function y(i) = max_{j = i*G}^{(i+1)*G-1} x_j, where G = x.NumCols() / y.NumCols() must be an integer.
Definition: cu-matrix.cc:1617

kaldi::CuMatrixBase::Write
void Write(std::ostream &os, bool binary) const
Definition: cu-matrix.cc:502

kaldi::CuVector
Definition: matrix-common.h:74

kaldi::CuMatrixBase::Row
const CuSubVector< Real > Row(MatrixIndexT i) const
Definition: cu-matrix.h:670

kaldi::CuMatrixBase::CuMatrixBase
CuMatrixBase()
Definition: cu-matrix.h:767

kaldi::CuMatrixBase::ExpLimited
void ExpLimited(const CuMatrixBase< Real > &src, Real lower_limit, Real upper_limit)
This is equivalent to running: Floor(src, lower_limit); Ceiling(src, upper_limit); Exp(src) ...
Definition: cu-matrix.cc:2541

kaldi::CuMatrixBase::CopyUpperToLower
void CopyUpperToLower()
Definition: cu-matrix.cc:2990

kaldi::CuMatrixBase::AddSmatMat
void AddSmatMat(Real alpha, const CuSparseMatrix< Real > &A, MatrixTransposeType transA, const CuMatrixBase< Real > &B, Real beta)
(*this) = alpha * op(A) * B + beta * (*this), where A is sparse.
Definition: cu-matrix.cc:1024

kaldi::CuMatrixBase::CopyToMat
void CopyToMat(MatrixBase< OtherReal > *dst, MatrixTransposeType trans=kNoTrans) const
Definition: cu-matrix.cc:447

kaldi::CuMatrixBase::AddToElements
void AddToElements(Real alpha, const CuArrayBase< int32 > &elements)
This is a rather special purpose function; we might generalize it later by adding a transpose-type op...
Definition: cu-matrix.cc:3344

kaldi::CuPackedMatrix::NumRows
MatrixIndexT NumRows() const
Definition: cu-packed-matrix.h:135

kaldi::CuMatrixBase::AddMatTp
void AddMatTp(const Real alpha, const CuMatrixBase< Real > &A, MatrixTransposeType transA, const CuTpMatrix< Real > &B, MatrixTransposeType transB, const Real beta)
this <– beta*this + alpha*A*B.
Definition: cu-matrix.h:641

kaldi::MatrixBase::NumCols
MatrixIndexT NumCols() const
Returns number of columns (or zero for empty matrix).
Definition: kaldi-matrix.h:67

kaldi::MatrixBase
Base class which provides matrix operations not involving resizing or allocation. ...
Definition: kaldi-matrix.h:49

MatrixDim_
Structure containing size of the matrix plus stride.
Definition: cu-matrixdim.h:46

MatrixElement
Definition: cu-matrixdim.h:35

kaldi::CuMatrix::CuMatrix
CuMatrix(const CuSpMatrix< Real > &M)
Copy constructor taking SpMatrix...
Definition: cu-matrix.h:824

kaldi::CuMatrixBase::AddRows
void AddRows(Real alpha, const CuMatrixBase< Real > &src, const CuArrayBase< MatrixIndexT > &indexes)
Does for each row r, this.Row(r) += alpha * src.row(indexes[r]).
Definition: cu-matrix.cc:2766

kaldi::CuMatrixBase::AddRowRanges
void AddRowRanges(const CuMatrixBase< Real > &src, const CuArrayBase< Int32Pair > &indexes)
For each row r of this and for each column c, do (*this)(r, c) +=  src(j, c), where j ranges from ind...
Definition: cu-matrix.cc:2931

kaldi::CuMatrix::CuMatrix
CuMatrix(MatrixIndexT rows, MatrixIndexT cols, MatrixResizeType resize_type=kSetZero, MatrixStrideType stride_type=kDefaultStride)
Constructor with memory initialisation.
Definition: cu-matrix.h:802

kaldi::CuMatrixBase::AddElements
void AddElements(Real alpha, const std::vector< MatrixElement< Real > > &input)
Definition: cu-matrix.cc:3277

matrix-common.h

kaldi::CuMatrixBase::AddMatDiagVec
void AddMatDiagVec(const Real alpha, const CuMatrixBase< Real > &M, MatrixTransposeType transM, CuVectorBase< Real > &v, Real beta=1.0)
Definition: cu-matrix.cc:1415

kaldi::CuMatrixBase::Sum
Real Sum() const
Definition: cu-matrix.cc:3012

kaldi::CuMatrixBase::CopyRangeFromMatClamped
void CopyRangeFromMatClamped(const CuMatrixBase< Real > &src, int32_t start_range, int32_t end_range, int32_t clamp_low, int32_t clamp_high)
Definition: cu-matrix.cc:419

kaldi::CuMatrixBase::Range
CuSubMatrix< Real > Range(const MatrixIndexT row_offset, const MatrixIndexT num_rows, const MatrixIndexT col_offset, const MatrixIndexT num_cols) const
Definition: cu-matrix.h:653

kaldi-matrix.h

kaldi::CuMatrix::CuMatrix
CuMatrix(const CuTpMatrix< OtherReal > &M, MatrixTransposeType trans=kNoTrans)
Copy constructor taking TpMatrix...
Definition: cu-matrix.h:831

kaldi::CuMatrixBase::ApplyHeaviside
void ApplyHeaviside()
Definition: cu-matrix.h:447

kaldi::CuMatrixBase::ApplyFloor
void ApplyFloor(Real floor_val)
Definition: cu-matrix.h:451

kaldi::CuMatrixBase::SetRandn
void SetRandn()
Definition: cu-matrix.cc:3132

kaldi::CuMatrixBase::Log
void Log(const CuMatrixBase< Real > &src)
Definition: cu-matrix.cc:2477

kaldi::CuMatrixBase::AddMatBlock
void AddMatBlock(Real alpha, const CuMatrixBase< Real > &A, MatrixTransposeType transA, const CuBlockMatrix< Real > &B, MatrixTransposeType transB, Real beta)
This function is like AddMatMat but for where the second argument is of type CuBlockMatrix (a block-d...
Definition: cu-matrix.cc:3205

kaldi::CuMatrix::Mat
Matrix< Real > & Mat()
Definition: cu-matrix.h:882

kaldi::CuMatrixBase::AddVecToCols
void AddVecToCols(Real alpha, const CuVectorBase< Real > &col, Real beta=1.0)
(for each column c of *this), c = alpha * col + beta * c
Definition: cu-matrix.cc:1232

kaldi::CuMatrixBase::Ceiling
void Ceiling(const CuMatrixBase< Real > &src, Real ceiling_val)
Definition: cu-matrix.cc:2601

kaldi::CuBlockMatrix
The class CuBlockMatrix holds a vector of objects of type CuMatrix, say, M_1, M_2, ...
Definition: cu-block-matrix.h:51

kaldi::CuMatrixBase::AddMatSp
void AddMatSp(const Real alpha, const CuMatrixBase< Real > &A, MatrixTransposeType transA, const CuSpMatrix< Real > &B, const Real beta)
this <– beta*this + alpha*A*B
Definition: cu-matrix.h:614

kaldi::CuMatrixBase::AddSmat
void AddSmat(Real alpha, const CuSparseMatrix< Real > &A, MatrixTransposeType trans=kNoTrans)
*this += alpha * A.
Definition: cu-matrix.cc:985

kaldi::CuMatrixBase::AddToDiag
void AddToDiag(Real value)
Adds "value" to the diagonal elements of the matrix.
Definition: cu-matrix.cc:604

kaldi::CuMatrixBase::AddMat
void AddMat(Real alpha, const CuMatrixBase< Real > &A, MatrixTransposeType trans=kNoTrans)
*this += alpha * A
Definition: cu-matrix.cc:954

kaldi::CuMatrixBase::DivRowsVec
void DivRowsVec(const CuVectorBase< Real > &div)
divide i'th row by div[i]
Definition: cu-matrix.cc:899

kaldi::Matrix
A class for storing matrices.
Definition: kaldi-matrix.h:823

kaldi::CuMatrixBase::AddMatMatElements
void AddMatMatElements(const Real alpha, const CuMatrixBase< Real > &A, const CuMatrixBase< Real > &B, const Real beta)
*this = beta * *this + alpha * A .* B (.* element by element multiplication)
Definition: cu-matrix.cc:1447

kaldi::CuMatrix
This class represents a matrix that's stored on the GPU if we have one, and in memory if not...
Definition: matrix-common.h:71

kaldi::CuMatrixBase::CopyRowsFromVec
void CopyRowsFromVec(const CuVectorBase< Real > &v)
This function has two modes of operation.
Definition: cu-matrix.cc:2301

kaldi::CuMatrixBase::data_
Real * data_
GPU data pointer (or regular matrix data pointer, ...).
Definition: cu-matrix.h:777

kaldi::CuMatrix::~CuMatrix
~CuMatrix()
Destructor.
Definition: cu-matrix.h:877

kaldi::MatrixBase::CopyFromMat
void CopyFromMat(const MatrixBase< OtherReal > &M, MatrixTransposeType trans=kNoTrans)
Copy given matrix. (no resize is done).
Definition: kaldi-matrix.cc:862

kaldi::CuMatrixBase::SizeInBytes
MatrixIndexT SizeInBytes() const
Get size of matrix in bytes.
Definition: cu-matrix.h:234

kaldi::CuSpMatrix
Definition: matrix-common.h:76

kaldi::CuMatrixBase::ApplyLog
void ApplyLog()
Definition: cu-matrix.h:480

kaldi::CuSubVector
Definition: matrix-common.h:73

kaldi::CuMatrixBase::AddCols
void AddCols(const CuMatrixBase< Real > &src, const CuArrayBase< MatrixIndexT > &indices)
Add column indices[r] of src to column r.
Definition: cu-matrix.cc:2701

kaldi::CuMatrixBase::AddTpMat
void AddTpMat(const Real alpha, const CuTpMatrix< Real > &A, MatrixTransposeType transA, const CuMatrixBase< Real > &B, MatrixTransposeType transB, const Real beta)
this <– beta*this + alpha*A*B.
Definition: cu-matrix.h:632

kaldi::CuMatrixBase::stride_
MatrixIndexT stride_
Definition: cu-matrix.h:787

kaldi::CuMatrixBase::InvertElements
void InvertElements()
invert the matrix by elements.
Definition: cu-matrix.cc:932

kaldi::CuMatrixBase::ApproxEqual
bool ApproxEqual(const CuMatrixBase< Real > &other, float tol=0.01) const
True if ((*this)-other).FrobeniusNorm() <= tol * this->FrobeniusNorm()
Definition: cu-matrix.cc:2137

kaldi::CuMatrixBase::CopyColFromVec
void CopyColFromVec(const CuVectorBase< Real > &v, const MatrixIndexT col)
Copy vector into specific column of matrix.
Definition: cu-matrix.cc:2414

kaldi::CuMatrixBase::IsUnit
bool IsUnit(Real tol=0.001) const
Definition: cu-matrix.cc:629

kaldi::CuValue
The following class is used to simulate non-const references to Real, e.g.
Definition: cu-value.h:34

kaldi::CuMatrixBase::Floor
void Floor(const CuMatrixBase< Real > &src, Real floor_val)
Definition: cu-matrix.cc:2582

kaldi::CuMatrixBase::Lookup
void Lookup(const std::vector< Int32Pair > &indexes, Real *output) const
Definition: cu-matrix.cc:3370

kaldi::kTrans
Definition: matrix-common.h:33

kaldi::SameDim
bool SameDim(const MatrixBase< Real > &M, const MatrixBase< Real > &N)
Definition: kaldi-matrix.h:1111

kaldi::CuMatrixBase::AddMatBlocks
void AddMatBlocks(Real alpha, const CuMatrixBase< Real > &A, MatrixTransposeType trans=kNoTrans)
This function is like AddMat (it does *this += alpha * src), except that it supports cases where *thi...
Definition: cu-matrix.cc:1119

kaldi::CuMatrixBase::Scale
void Scale(Real value)
Definition: cu-matrix.cc:644

kaldi::CuMatrix::CuMatrix
CuMatrix()
Definition: cu-matrix.h:799

kaldi::CuMatrixBase::SymInvertPosDef
void SymInvertPosDef()
Inversion for positive definite symmetric matrices.
Definition: cu-matrix.cc:2111

kaldi::CuMatrixBase::Pow
void Pow(const CuMatrixBase< Real > &src, Real power)
Definition: cu-matrix.cc:2500

kaldi::AddMatMatBatched
void AddMatMatBatched(const Real alpha, std::vector< CuSubMatrix< Real > * > &C, const std::vector< CuSubMatrix< Real > * > &A, MatrixTransposeType transA, const std::vector< CuSubMatrix< Real > * > &B, MatrixTransposeType transB, const Real beta)
Does multiple matrix multiplications, executing them in parallel using cuBLAS's gemmBatched if we are...
Definition: cu-matrix.cc:2207

kaldi::CuMatrixBase::ApplyLogSoftMaxPerRow
void ApplyLogSoftMaxPerRow()
Definition: cu-matrix.h:476

kaldi::MatrixIndexT
int32 MatrixIndexT
Definition: matrix-common.h:98

kaldi::CuMatrixBase::SetRandUniform
void SetRandUniform()
Definition: cu-matrix.cc:3146

kaldi::CuMatrixBase::AddVecToRows
void AddVecToRows(Real alpha, const CuVectorBase< Real > &row, Real beta=1.0)
(for each row r of *this), r = alpha * row + beta * r
Definition: cu-matrix.cc:1261

kaldi::CuMatrixBase::ApplyPowAbs
void ApplyPowAbs(Real power, bool include_sign=false)
Definition: cu-matrix.h:443

float

kaldi::CuMatrixBase::CopyFromSp
void CopyFromSp(const CuSpMatrix< Real > &M)
Definition: cu-matrix.cc:360

kaldi::CuMatrixBase::Sigmoid
void Sigmoid(const CuMatrixBase< Real > &src)
Set each element to the sigmoid of the corresponding element of "src": element by element...
Definition: cu-matrix.cc:1534

kaldi::CuMatrixBase::Add
void Add(Real value)
Definition: cu-matrix.cc:582

kaldi::CuMatrixBase::DiffXent
void DiffXent(const CuArrayBase< int32 > &tgt, CuVector< Real > *log_post_tgt)
Differentiate the block [softmax+cross-entropy] : dE/da = posterior_mat - target_mat, 'E' is the error function, 'a' is the activation on the softmax input.
Definition: cu-matrix.cc:1957

kaldi::CuMatrixBase::AddToRows
void AddToRows(Real alpha, const CuArrayBase< MatrixIndexT > &indexes, CuMatrixBase< Real > *dst) const
For each row i of *this, adds this->Row(i) to dst->Row(indexes(i)) if indexes(i) >= 0...
Definition: cu-matrix.cc:2869

kaldi::CuMatrixBase::SetZero
void SetZero()
Math operations, some calling kernels.
Definition: cu-matrix.cc:509

kaldi::CuMatrixBase::SoftMaxPerRow
void SoftMaxPerRow(const CuMatrixBase< Real > &src)
Softmax nonlinearity Y = Softmax(X) : Yij = e^Xij / sum_k(e^Xik), done to each row, with attention to avoiding overflow or underflow.
Definition: cu-matrix.cc:1717

kaldi::kDefaultStride
Definition: matrix-common.h:45

kaldi::CuMatrixBase::MulRows
void MulRows(const CuMatrixBase< Real > &src, const CuArrayBase< MatrixIndexT > &indexes)
For each row r, does this.Row(r) *= src.Row(indexes[r]), where '*=' is elementwise multiplica...
Definition: cu-matrix.cc:2790

kaldi::CuMatrixBase::MulElements
void MulElements(const CuMatrixBase< Real > &A)
Multiply two matrices elementwise: C = C .* A.
Definition: cu-matrix.cc:667

kaldi::CuMatrixBase::CopyRows
void CopyRows(const CuMatrixBase< Real > &src, const CuArrayBase< MatrixIndexT > &indexes)
Copies row r from row indexes[r] of src.
Definition: cu-matrix.cc:2678

kaldi::CuMatrixBase::CopyFromBlock
void CopyFromBlock(const CuBlockMatrix< Real > &B, MatrixTransposeType trans=kNoTrans)
Definition: cu-matrix.cc:161

kaldi::MatrixStrideType
MatrixStrideType
Definition: matrix-common.h:44

kaldi::CuMatrixBase::SymAddMat2
void SymAddMat2(const Real alpha, const CuMatrixBase< Real > &M, MatrixTransposeType transA, Real beta)
*this = beta * *this + alpha * M M^T, for symmetric matrices.
Definition: cu-matrix.cc:1353

kaldi::CuMatrixBase::CopyColsFromVec
void CopyColsFromVec(const CuVectorBase< Real > &v)
Copies vector into matrix, column-by-column.
Definition: cu-matrix.cc:2376

kaldi::kNoTrans
Definition: matrix-common.h:34

kaldi::CuMatrixBase::GroupPnorm
void GroupPnorm(const CuMatrixBase< Real > &src, Real pow)
Apply the function y(i) = (sum_{j = i*G}^{(i+1)*G-1} x_j ^ (power)) ^ (1 / power) where G = x...
Definition: cu-matrix.cc:1576

KALDI_PARANOID_ASSERT
#define KALDI_PARANOID_ASSERT(cond)
Definition: kaldi-error.h:206

kaldi::CuMatrixBase::AddMatMat
void AddMatMat(Real alpha, const CuMatrixBase< Real > &A, MatrixTransposeType transA, const CuMatrixBase< Real > &B, MatrixTransposeType transB, Real beta)
C = alpha * A(^T)*B(^T) + beta * C.
Definition: cu-matrix.cc:1291

kaldi::CuMatrixBase::Cholesky
void Cholesky(CuMatrixBase< Real > *inv_cholesky=NULL)
This function sets *this to the Cholesky factor of *this (i.e. ...).
Definition: cu-matrix.cc:1987

kaldi::TraceMatMat
Real TraceMatMat(const MatrixBase< Real > &A, const MatrixBase< Real > &B, MatrixTransposeType trans)
We need to declare this here as it will be a friend function.
Definition: kaldi-matrix.cc:2692

kaldi::CuSubMatrix
This class is used for a piece of a CuMatrix.
Definition: matrix-common.h:70

kaldi::CuMatrixBase::DivElements
void DivElements(const CuMatrixBase< Real > &A)
Divide two matrices elementwise: C = C ./ A.
Definition: cu-matrix.cc:691

kaldi::CuMatrixBase::KALDI_DISALLOW_COPY_AND_ASSIGN
KALDI_DISALLOW_COPY_AND_ASSIGN(CuMatrixBase)

kaldi::CuMatrixBase::DiffSoftmaxPerRow
void DiffSoftmaxPerRow(const CuMatrixBase< Real > &value, const CuMatrixBase< Real > &diff)
Differentiate backward through the softmax function.
Definition: cu-matrix.cc:1868

kaldi::CuMatrixBase::GroupMaxDeriv
void GroupMaxDeriv(const CuMatrixBase< Real > &input, const CuMatrixBase< Real > &output)
Calculate derivatives for the GroupMax function above, where "input" is the input to the GroupMax fun...
Definition: cu-matrix.cc:874

kaldi::CuMatrixBase::RowRange
CuSubMatrix< Real > RowRange(const MatrixIndexT row_offset, const MatrixIndexT num_rows) const
Definition: cu-matrix.h:660

kaldi::CuMatrixBase::DiffTanh
void DiffTanh(const CuMatrixBase< Real > &value, const CuMatrixBase< Real > &diff)
Differentiate backward through the tanh function.
Definition: cu-matrix.cc:1809

kaldi::CuMatrixBase::RowData
Real * RowData(MatrixIndexT r)
Get raw row pointer.
Definition: cu-matrix.h:743

kaldi::CuMatrixBase::CopyFromGeneralMat
void CopyFromGeneralMat(const GeneralMatrix &src, MatrixTransposeType trans=kNoTrans)
Definition: cu-matrix.cc:3096

kaldi::CuMatrixBase::FindRowMaxId
void FindRowMaxId(CuArray< int32 > *id) const
Find the id of the maximal element for each row (resizes the 'id' array to the appropriate size)...
Definition: cu-matrix.cc:1829

kaldi::CuMatrixBase::CopyLowerToUpper
void CopyLowerToUpper()
Definition: cu-matrix.cc:2969

kaldi::CuMatrixBase::Heaviside
void Heaviside(const CuMatrixBase< Real > &src)
Set each element to the Heaviside function of the corresponding element of "src", which we define as ...
Definition: cu-matrix.cc:2435

kaldi::CuMatrixBase::ApplyExp
void ApplyExp()
Definition: cu-matrix.h:459

kaldi::CuMatrixBase::DiffSigmoid
void DiffSigmoid(const CuMatrixBase< Real > &value, const CuMatrixBase< Real > &diff)
Differentiate backward through the sigmoid function.
Definition: cu-matrix.cc:1764

kaldi::CuMatrixBase::MulColsVec
void MulColsVec(const CuVectorBase< Real > &scale)
scale i'th column by scale[i]
Definition: cu-matrix.cc:765

kaldi::CuMatrixBase::Data
const Real * Data() const
Return data pointer (const).
Definition: cu-matrix.h:746

rnnlm::i
int i
Definition: mikolov-rnnlm-lib.cc:66

kaldi::CuMatrixBase::SumColumnRanges
void SumColumnRanges(const CuMatrixBase< Real > &src, const CuArrayBase< Int32Pair > &indexes)
For each row r of this and for each column c, sets (*this)(r, c) to the sum  src(r, j), where j ranges from indexes[c].first through indexes[c].second - 1.
Definition: cu-matrix.cc:2893

kaldi::CuMatrixBase::ColRange
CuSubMatrix< Real > ColRange(const MatrixIndexT col_offset, const MatrixIndexT num_cols) const
Definition: cu-matrix.h:665

cu-math.h

kaldi::CuMatrixBase::CuMatrixBase
CuMatrixBase(Real *data, MatrixIndexT num_rows, MatrixIndexT num_cols, MatrixIndexT stride)
This constructor takes the #rows, #cols and stride; it's called from the constructor of CuSubMatrix...
Definition: cu-matrix.h:771

kaldi::CuMatrixBase::ApplyExpSpecial
void ApplyExpSpecial()
Definition: cu-matrix.h:468

kaldi::CuMatrixBase
Matrix for CUDA computing.
Definition: matrix-common.h:69

kaldi::CuMatrixBase::ApplyExpLimited
void ApplyExpLimited(Real lower_limit, Real upper_limit)
Definition: cu-matrix.h:464

kaldi::CuMatrixBase::NumCols
MatrixIndexT NumCols() const
Definition: cu-matrix.h:216

kaldi::CuMatrixBase::ApplySoftMaxPerRow
void ApplySoftMaxPerRow()
Definition: cu-matrix.h:472

kaldi::CuMatrixBase::DiffLogSoftmaxPerRow
void DiffLogSoftmaxPerRow(const CuMatrixBase< Real > &out_value, const CuMatrixBase< Real > &out_deriv)
Differentiate backward through the log softmax function.
Definition: cu-matrix.cc:1903

kaldi::CuMatrixBase::DiffGroupPnorm
void DiffGroupPnorm(const CuMatrixBase< Real > &in_value, const CuMatrixBase< Real > &out_value, const CuMatrixBase< Real > &out_deriv, Real power)
Differentiate backward through the GroupPnorm function.
Definition: cu-matrix.cc:841

kaldi::CuMatrixBase::operator()
CuValue< Real > operator()(MatrixIndexT r, MatrixIndexT c)
Definition: cu-matrix.h:682

kaldi::CuArrayBase
Class CuArrayBase, CuSubArray and CuArray are analogues of classes CuVectorBase, CuSubVector and CuVe...
Definition: cu-array.h:44

kaldi::CuArray< int32 >

kaldi::kSetZero
Definition: matrix-common.h:38

KALDI_ASSERT
#define KALDI_ASSERT(cond)
Definition: kaldi-error.h:185

kaldi::CuSparseMatrix
Definition: matrix-common.h:78

cu-common.h

kaldi::MatrixBase::NumRows
MatrixIndexT NumRows() const
Returns number of rows (or zero for empty matrix).
Definition: kaldi-matrix.h:64

kaldi::CuMatrixBase::TraceMatMat
friend Real TraceMatMat(const CuMatrixBase< Real > &A, const CuMatrixBase< Real > &B, MatrixTransposeType trans)
Definition: cu-matrix.cc:2145

kaldi::CuMatrixBase::CopyFromTp
void CopyFromTp(const CuTpMatrix< OtherReal > &M, MatrixTransposeType trans=kNoTrans)
Definition: cu-matrix.cc:280

kaldi::MatrixTransposeType
MatrixTransposeType
Definition: matrix-common.h:32

cu-value.h

kaldi::AssertEqual
static void AssertEqual(float a, float b, float relative_tolerance=0.001)
assert abs(a - b) <= relative_tolerance * (abs(a)+abs(b))
Definition: kaldi-math.h:276

kaldi::CuMatrixBase::MulRowsGroupMat
void MulRowsGroupMat(const CuMatrixBase< Real > &src)
divide each row into src.NumCols() groups, and then scale i'th row's j'th group of elements by src[i...
Definition: cu-matrix.cc:816

kaldi::CuMatrixBase::Min
Real Min() const
Definition: cu-matrix.cc:3054

kaldi::CuMatrixBase::num_cols_
MatrixIndexT num_cols_
Definition: cu-matrix.h:785

kaldi::CuMatrixBase::Dim
::MatrixDim Dim() const
Definition: cu-matrix.h:221

kaldi::CuMatrixBase::FrobeniusNorm
Real FrobeniusNorm() const
Definition: cu-matrix.h:226

kaldi::CuMatrixBase::CopyCols
void CopyCols(const CuMatrixBase< Real > &src, const CuArrayBase< MatrixIndexT > &indexes)
Copies column r from column indexes[r] of src.
Definition: cu-matrix.cc:2656

kaldi::CuMatrixBase::PowAbs
void PowAbs(const CuMatrixBase< Real > &src, Real power, bool include_sign=false)
Apply power to the absolute value of each element.
Definition: cu-matrix.cc:2521

kaldi::CuMatrixBase::CopyToRows
void CopyToRows(const CuArrayBase< Real *> &dst) const
For each row r of this matrix, copies it to the array of floats at the location given by dst[r]...
Definition: cu-matrix.cc:2744

kaldi::CuTpMatrix
Definition: matrix-common.h:77

kaldi::SameDimAndStride
bool SameDimAndStride(const CuMatrixBase< Real > &M, const CuMatrixBase< Real > &N)
Definition: cu-matrix.h:954

kaldi::CuMatrixBase::AddSpMat
void AddSpMat(const Real alpha, const CuSpMatrix< Real > &A, const CuMatrixBase< Real > &B, MatrixTransposeType transB, const Real beta)
this <– beta*this + alpha*SpA*B
Definition: cu-matrix.h:623

kaldi::CuMatrixBase::LogSoftMaxPerRow
void LogSoftMaxPerRow(const CuMatrixBase< Real > &src)
LogSoftmax nonlinearity Y = LogSoftmax(X) : Yij = Xij - log(sum_k(e^Xik)), done to each row...
Definition: cu-matrix.cc:1740

kaldi::CuMatrixBase::NumRows
MatrixIndexT NumRows() const
Dimensions.
Definition: cu-matrix.h:215

kaldi::CuPackedMatrix::NumCols
MatrixIndexT NumCols() const
Definition: cu-packed-matrix.h:136

kaldi::VectorBase
Provides a vector abstraction class.
Definition: kaldi-vector.h:41

kaldi::CuMatrixBase::ExpSpecial
void ExpSpecial(const CuMatrixBase< Real > &src)
For each element x of the matrix, set it to (x < 0 ? exp(x) : x + 1).
Definition: cu-matrix.cc:2563

cu-matrixdim.h

kaldi::CuMatrixBase::SetMatMatDivMat
void SetMatMatDivMat(const CuMatrixBase< Real > &A, const CuMatrixBase< Real > &B, const CuMatrixBase< Real > &C)
*this = a * b / c (by element; when c = 0, *this = a) *this can be an alias of a, b or c safely and g...
Definition: cu-matrix.cc:1206

kaldi::CuMatrix::Mat
const Matrix< Real > & Mat() const
Definition: cu-matrix.h:879

kaldi::CuMatrixBase::Tanh
void Tanh(const CuMatrixBase< Real > &src)
Compute the hyperbolic tangent (tanh) function; element by element, *this = tanh(src).
Definition: cu-matrix.cc:1786

cu-sparse-matrix.h

kaldi::CuMatrixBase::Max
Real Max() const
Definition: cu-matrix.cc:3033

kaldi::CuMatrixBase::ParametricRelu
void ParametricRelu(const CuMatrixBase< Real > &src, const CuVectorBase< Real > &alpha, const CuVectorBase< Real > &beta)
Compute the parametric rectified linear unit function; element by element, *this = src * (src > 0 ...
Definition: cu-matrix.cc:1467

kaldi::CuMatrixBase::Set
void Set(Real value)
Definition: cu-matrix.cc:531

kaldi::CuMatrixBase::DiffParametricRelu
void DiffParametricRelu(const CuMatrixBase< Real > &value, const CuMatrixBase< Real > &diff, const CuVectorBase< Real > &alpha, const CuVectorBase< Real > &beta)
Differentiate backward through the parametric relu function.
Definition: cu-matrix.cc:1501

kaldi::CuMatrixBase::MulRowsVec
void MulRowsVec(const CuVectorBase< Real > &scale)
scale i'th row by scale[i]
Definition: cu-matrix.cc:792

kaldi::CuMatrixBase::EqualElementMask
void EqualElementMask(const CuMatrixBase< Real > &mat, CuMatrix< Real > *mask) const
Definition: cu-matrix.cc:3429

cu-array.h

kaldi::CuMatrixBase::AddMatSmat
void AddMatSmat(Real alpha, const CuMatrixBase< Real > &A, const CuSparseMatrix< Real > &B, MatrixTransposeType transB, Real beta)
(*this) = alpha * A * op(B) + beta * (*this), where B is sparse and op(B) is either B or trans(B) dep...
Definition: cu-matrix.cc:1080

kaldi::CuMatrixBase::Exp
void Exp(const CuMatrixBase< Real > &src)
Definition: cu-matrix.cc:2456

kaldi::CuMatrixBase::AddVecVec
void AddVecVec(Real alpha, const CuVectorBase< Real > &x, const CuVectorBase< Real > &y)
A = alpha * x * y^T + A.
Definition: cu-matrix.cc:1329

rnnlm::d
double d
Definition: mikolov-rnnlm-lib.cc:64

kaldi::CuMatrixBase::SetZeroAboveDiag
void SetZeroAboveDiag()
Zeroes all elements for which col > row.
Definition: cu-matrix.cc:554

kaldi::CuVectorBase
Vector for CUDA computing.
Definition: matrix-common.h:72

cu-matrix-inl.h

kaldi::CuMatrixBase::AddDiagVecMat
void AddDiagVecMat(const Real alpha, const CuVectorBase< Real > &v, const CuMatrixBase< Real > &M, MatrixTransposeType transM, Real beta=1.0)
*this = beta * *this + alpha * diag(v) * M [or M^T].
Definition: cu-matrix.cc:1382

kaldi::CuMatrixBase::RowData
const Real * RowData(MatrixIndexT r) const
Get raw row pointer (const).
Definition: cu-matrix.h:740

kaldi::CuMatrixBase::num_rows_
MatrixIndexT num_rows_
Definition: cu-matrix.h:786