Skip to content

Commit d37eab8

Browse files
authored
Revert "[src] Better kernels for CUDA row sum and tr(AB^T) (kaldi-asr#3954)"
This reverts commit 673c6fc.
1 parent 91ff64e commit d37eab8

File tree

5 files changed

+30
-365
lines changed

5 files changed

+30
-365
lines changed

src/cudamatrix/cu-kernels-ansi.h

+4 -4
Original file line number | Diff line number | Diff line change
@@ -40,10 +40,10 @@ typedef float BaseFloat;
40 40
#endif
41 41

42 42

43-
void cudaD_add_row_sum_mat(double* result, const double* mat, void* scratch,
43+
void cudaD_add_row_sum_mat(int Gr, int Bl, double* result, const double* mat,
44 44
const MatrixDim d, const double alpha,
45 45
const double beta);
46-
void cudaF_add_row_sum_mat(float* result, const float* mat, void* scratch,
46+
void cudaF_add_row_sum_mat(int Gr, int Bl, float* result, const float* mat,
47 47
const MatrixDim d, const float alpha,
48 48
const float beta);
49 49
void cudaD_add_col_sum_mat(int Gr, int Bl, double* result, const double* mat,
@@ -713,10 +713,10 @@ void cudaD_trace_mat_mat(dim3 Gr, dim3 Bl, const double* A, const double* B,
713 713
MatrixDim dA, int B_stride, double* value);
714 714
void cudaF_trace_mat_mat(dim3 Gr, dim3 Bl, const float* A, const float* B,
715 715
MatrixDim dA, int B_stride, float* value);
716-
void cudaD_trace_mat_mat_trans(const double* A,
716+
void cudaD_trace_mat_mat_trans(dim3 Gr, dim3 Bl, const double* A,
717 717
const double* B, MatrixDim dA, int B_stride,
718 718
double* value);
719-
void cudaF_trace_mat_mat_trans(const float* A, const float* B,
719+
void cudaF_trace_mat_mat_trans(dim3 Gr, dim3 Bl, const float* A, const float* B,
720 720
MatrixDim dA, int B_stride, float* value);
721 721
void cudaD_trace_mat_smat(dim3 Gr, dim3 Bl, const double* mat,
722 722
MatrixDim mat_dim, const int* smat_row_ptr,

0 commit comments

Comments
 (0)