Merge pull request #30 from NVIDIA/fix_utilities_example

Fixed cutlass_utilities example.
2018-09-29 15:09:18 -07:00 · 2018-09-29 15:09:18 -07:00 · 2332df492e
commit 2332df492e
parent 6877595a5e cfe4b933ef
1 changed file with 9 additions and 9 deletions
--- a/examples/02_cutlass_utilities/cutlass_utilities.cu
+++ b/examples/02_cutlass_utilities/cutlass_utilities.cu
@@ -144,18 +144,18 @@ cudaError_t Cutlass_FP16_SgemmNN(
  typename Gemm::Params params;

  int result = params.initialize(
-    M,                  // GEMM M dimension
-    N,                  // GEMM N dimension
-    K,                  // GEMM K dimension
-    half(float(alpha)), // scalar alpha - This is a legal conversion from cutlass::half_t to CUDA's half.
-    A,                  // matrix A operand
+    M,                                     // GEMM M dimension
+    N,                                     // GEMM N dimension
+    K,                                     // GEMM K dimension
+    reinterpret_cast<half const &>(alpha), // scalar alpha - This is a legal conversion from cutlass::half_t to CUDA's half.
+    A,                                     // matrix A operand
    lda,
-    B,                  // matrix B operand
+    B,                                     // matrix B operand
    ldb,
-    half(float(beta)),  // scalar beta - This is a legal conversion from cutlass::half_t to CUDA's half.
-    C,                  // source matrix C
+    reinterpret_cast<half const &>(beta),  // scalar beta - This is a legal conversion from cutlass::half_t to CUDA's half.
+    C,                                     // source matrix C
    ldc,
-    C,                  // destination matrix C (may be different memory than source C matrix)
+    C,                                     // destination matrix C (may be different memory than source C matrix)
    ldc
  );