Skip to content

Commit

Permalink
Merge pull request NVIDIA#30 from NVIDIA/fix_utilities_example
Browse files (browse the repository at this point in the history)
Fixed cutlass_utilities example.
  • Loading branch information
kerrmudgeon authored Sep 29, 2018
2 parents 6877595 + cfe4b93 commit 2332df4
Showing 1 changed file with 9 additions and 9 deletions.
18 changes: 9 additions & 9 deletions examples/02_cutlass_utilities/cutlass_utilities.cu
Original file line number | Diff line number | Diff line change
[Expand Up]
@@ -144,18 +144,18 @@ cudaError_t Cutlass_FP16_SgemmNN(
  typename Gemm::Params params;

  int result = params.initialize(
- M, // GEMM M dimension
- N, // GEMM N dimension
- K, // GEMM K dimension
- half(float(alpha)), // scalar alpha - This is a legal conversion from cutlass::half_t to CUDA's half.
- A, // matrix A operand
+ M, // GEMM M dimension
+ N, // GEMM N dimension
+ K, // GEMM K dimension
+ reinterpret_cast<half const &>(alpha), // scalar alpha - This is a legal conversion from cutlass::half_t to CUDA's half.
+ A, // matrix A operand
  lda,
- B, // matrix B operand
+ B, // matrix B operand
  ldb,
- half(float(beta)), // scalar beta - This is a legal conversion from cutlass::half_t to CUDA's half.
- C, // source matrix C
+ reinterpret_cast<half const &>(beta), // scalar beta - This is a legal conversion from cutlass::half_t to CUDA's half.
+ C, // source matrix C
  ldc,
- C, // destination matrix C (may be different memory than source C matrix)
+ C, // destination matrix C (may be different memory than source C matrix)
  ldc
  );

Expand Down

0 comments on commit 2332df4

Please sign in to comment.