Merge pull request #30 from NVIDIA/fix_utilities_example
Fixed cutlass_utilities example.
This commit is contained in:
commit
2332df492e
@@ -147,12 +147,12 @@ cudaError_t Cutlass_FP16_SgemmNN(
|
|||||||
M, // GEMM M dimension
|
M, // GEMM M dimension
|
||||||
N, // GEMM N dimension
|
N, // GEMM N dimension
|
||||||
K, // GEMM K dimension
|
K, // GEMM K dimension
|
||||||
half(float(alpha)), // scalar alpha - This is a legal conversion from cutlass::half_t to CUDA's half.
|
reinterpret_cast<half const &>(alpha), // scalar alpha - This is a legal conversion from cutlass::half_t to CUDA's half.
|
||||||
A, // matrix A operand
|
A, // matrix A operand
|
||||||
lda,
|
lda,
|
||||||
B, // matrix B operand
|
B, // matrix B operand
|
||||||
ldb,
|
ldb,
|
||||||
half(float(beta)), // scalar beta - This is a legal conversion from cutlass::half_t to CUDA's half.
|
reinterpret_cast<half const &>(beta), // scalar beta - This is a legal conversion from cutlass::half_t to CUDA's half.
|
||||||
C, // source matrix C
|
C, // source matrix C
|
||||||
ldc,
|
ldc,
|
||||||
C, // destination matrix C (may be different memory than source C matrix)
|
C, // destination matrix C (may be different memory than source C matrix)
|
||||||
|
Loading…
Reference in New Issue
Block a user