From e2953d47c5478bdf9268e4f2bf66464b864f8ef6 Mon Sep 17 00:00:00 2001
From: Haicheng Wu <57973641+hwu36@users.noreply.github.com>
Date: Fri, 12 May 2023 15:37:31 -0400
Subject: [PATCH] Update gemm_api.md

---
 media/docs/gemm_api.md | 2 +-
 1 file changed, 1 insertion(+), 1 deletion(-)

diff --git a/media/docs/gemm_api.md b/media/docs/gemm_api.md
index f19bf35d..a11a3bbc 100644
--- a/media/docs/gemm_api.md
+++ b/media/docs/gemm_api.md
@@ -28,7 +28,7 @@ for (int cta_n = 0; cta_n < GemmN; cta_n += CtaTileN) { // f
 for (int warp_n = 0; warp_n < CtaTileN; warp_n += WarpTileN) { // for each warp } warp-level concurrency
 for (int warp_m = 0; warp_m < CtaTileM; warp_m += WarpTileM) { // for each warp }
 //
- for (int warp_k = 0; warp_k < CtaTileK; warp_k += MmaK) { // fully unroll across CtaTileK - one iteration of this loop is one "k Group" == "MmaK"
+ for (int warp_k = 0; warp_k < CtaTileK; warp_k += WarpTileK) { // fully unroll across CtaTileK - one iteration of this loop is one "k Group"
 //
 for (int mma_k = 0; mma_k < WarpTileK; mma_k += MmaK) { // cutlass::gemm::warp::Mma
 for (int mma_n = 0; mma_n < WarpTileN; mma_n += MmaN) { //