Merge pull request #30 from NVIDIA/fix_utilities_example

Fixed cutlass_utilities example.
This commit is contained in:
Andrew Kerr 2018-09-29 15:09:18 -07:00 committed by GitHub
commit 2332df492e
No known key found for this signature in database
GPG Key ID: 4AEE18F83AFDEB23

View File

@@ -147,12 +147,12 @@ cudaError_t Cutlass_FP16_SgemmNN(
M, // GEMM M dimension M, // GEMM M dimension
N, // GEMM N dimension N, // GEMM N dimension
K, // GEMM K dimension K, // GEMM K dimension
half(float(alpha)), // scalar alpha - This is a legal conversion from cutlass::half_t to CUDA's half. reinterpret_cast<half const &>(alpha), // scalar alpha - This is a legal conversion from cutlass::half_t to CUDA's half.
A, // matrix A operand A, // matrix A operand
lda, lda,
B, // matrix B operand B, // matrix B operand
ldb, ldb,
half(float(beta)), // scalar beta - This is a legal conversion from cutlass::half_t to CUDA's half. reinterpret_cast<half const &>(beta), // scalar beta - This is a legal conversion from cutlass::half_t to CUDA's half.
C, // source matrix C C, // source matrix C
ldc, ldc,
C, // destination matrix C (may be different memory than source C matrix) C, // destination matrix C (may be different memory than source C matrix)