From dceefe4f645e676e5f30cf63302af426607c3135 Mon Sep 17 00:00:00 2001 From: Pei Sun Date: Mon, 6 Jun 2022 09:33:36 -0700 Subject: [PATCH] Increment stride correctly in warp iterator. (#516) Co-authored-by: peisun1115 --- include/cutlass/gemm/warp/mma_tensor_op_tile_iterator.h | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/include/cutlass/gemm/warp/mma_tensor_op_tile_iterator.h b/include/cutlass/gemm/warp/mma_tensor_op_tile_iterator.h index 890504c7..24b7f3e7 100644 --- a/include/cutlass/gemm/warp/mma_tensor_op_tile_iterator.h +++ b/include/cutlass/gemm/warp/mma_tensor_op_tile_iterator.h @@ -403,7 +403,7 @@ public: AccessType const *source_ptr = pointer_[c % kPointerCount] + Layout::TileShape::kContiguous * (c / kPointerCount) + - Policy::LdsmShape::kStrided * s * stride_; + Policy::kLdsmOpInner * Policy::LdsmShape::kStrided * s * stride_; char const *source_byte_ptr = reinterpret_cast<char const *>(source_ptr) + byte_offset + byte_offset_;