cu-matrixdim.h 2.81 KB
// cudamatrix/cu-matrixdim.h

// Copyright 2009-2012  Karel Vesely
//                2013  Johns Hopkins University (author: Daniel Povey)

// See ../../COPYING for clarification regarding multiple authors
//
// Licensed under the Apache License, Version 2.0 (the "License");
// you may not use this file except in compliance with the License.
// You may obtain a copy of the License at
//
//  http://www.apache.org/licenses/LICENSE-2.0
//
// THIS CODE IS PROVIDED *AS IS* BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY
// KIND, EITHER EXPRESS OR IMPLIED, INCLUDING WITHOUT LIMITATION ANY IMPLIED
// WARRANTIES OR CONDITIONS OF TITLE, FITNESS FOR A PARTICULAR PURPOSE,
// MERCHANTABLITY OR NON-INFRINGEMENT.
// See the Apache 2 License for the specific language governing permissions and
// limitations under the License.



#ifndef KALDI_CUDAMATRIX_CU_MATRIXDIM_H_
#define KALDI_CUDAMATRIX_CU_MATRIXDIM_H_

/*
 * Typedefs needed for ANSI-C interface of CUDA wrappers
 */
#include <cstdint>
typedef uint32_t         uint32_cuda;
typedef int32_t          int32_cuda;
typedef int32_t          MatrixIndexT_cuda; // you'd have to change this if you changed MatrixIndexT from int32.

template<typename Real>
struct MatrixElement {
  int32_cuda row;
  int32_cuda column;
  Real weight;
};

extern "C" {
  /**
   * Structure containing size of the matrix plus stride.
   * This structure is an argument of most of the CUDA kernels.
   */
  typedef struct MatrixDim_ {
    int32_cuda rows;
    int32_cuda cols;
    int32_cuda stride;
  } MatrixDim;

// we define the following constants here because this file is included
// both by the C++ code and also CUDA code.


// The size of a CUDA 1-d block, e.g. for vector operations..
#define CU1DBLOCK 256

// The size of edge of CUDA square block, e.g. for matrix operations.
// Must be defined the same in cu-kernels-ansi.h
#define CU2DBLOCK 16


  /** This structure is used in cu-block-matrix.h to store information
      about a block-diagonal matrix.  We declare it here so that it
      will be accessible
   */
  typedef struct CuBlockMatrixData_ {
    int32_cuda row_offset; // sum of #rows of previous M_i
    int32_cuda col_offset; // sum of #cols of previous M_i
    MatrixDim matrix_dim; // dimension of this M_i
    void *matrix_data; // data for M_i.  This is a pointer to either float* or
                       // double*.  Because C doesn't support templates and to
                       // avoid extra coding to support the two cases, we
                       // decided to make this a void* pointer.
  } CuBlockMatrixData;

  typedef struct Int32Pair {
    int32_cuda first;
    int32_cuda second;
  } Int32Pair;

  inline bool operator<(const Int32Pair &a, const Int32Pair &b) {
    if (a.first < b.first)
      return true;
    if (a.first > b.first)
      return false;
    return a.second < b.second;
  }
}

#endif