diff --git a/include/cutlass/arch/mma.h b/include/cutlass/arch/mma.h index 7385d882..2bcabb2d 100644 --- a/include/cutlass/arch/mma.h +++ b/include/cutlass/arch/mma.h @@ -70,7 +70,7 @@ struct OpMultiplyAddFastF16 {}; /// Tag indicating the input is converted to 2 (big and small) TF32 components // Perform 3xTF32 or 4xTF32 for every F32 output element -struct OpMultiplyAddFastF32 {} +struct OpMultiplyAddFastF32 {}; /// Tag indicating the input is converted to 2 (big and small) TF32 components // Perform 3xTF32 or 4xTF32 for every complex output element