@@ -40,10 +40,10 @@ typedef float BaseFloat;
40
40
#endif
41
41
42
42
43
- void cudaD_add_row_sum_mat (double * result , const double * mat , void * scratch ,
43
+ void cudaD_add_row_sum_mat (int Gr , int Bl , double * result , const double * mat ,
44
44
const MatrixDim d , const double alpha ,
45
45
const double beta );
46
- void cudaF_add_row_sum_mat (float * result , const float * mat , void * scratch ,
46
+ void cudaF_add_row_sum_mat (int Gr , int Bl , float * result , const float * mat ,
47
47
const MatrixDim d , const float alpha ,
48
48
const float beta );
49
49
void cudaD_add_col_sum_mat (int Gr , int Bl , double * result , const double * mat ,
@@ -713,10 +713,10 @@ void cudaD_trace_mat_mat(dim3 Gr, dim3 Bl, const double* A, const double* B,
713
713
MatrixDim dA , int B_stride , double * value );
714
714
void cudaF_trace_mat_mat (dim3 Gr , dim3 Bl , const float * A , const float * B ,
715
715
MatrixDim dA , int B_stride , float * value );
716
- void cudaD_trace_mat_mat_trans (const double * A ,
716
+ void cudaD_trace_mat_mat_trans (dim3 Gr , dim3 Bl , const double * A ,
717
717
const double * B , MatrixDim dA , int B_stride ,
718
718
double * value );
719
- void cudaF_trace_mat_mat_trans (const float * A , const float * B ,
719
+ void cudaF_trace_mat_mat_trans (dim3 Gr , dim3 Bl , const float * A , const float * B ,
720
720
MatrixDim dA , int B_stride , float * value );
721
721
void cudaD_trace_mat_smat (dim3 Gr , dim3 Bl , const double * mat ,
722
722
MatrixDim mat_dim , const int * smat_row_ptr ,
0 commit comments