diff --git a/include/cutlass/gemm/warp/mma_tensor_op_tile_iterator.h b/include/cutlass/gemm/warp/mma_tensor_op_tile_iterator.h index 890504c7..24b7f3e7 100644 --- a/include/cutlass/gemm/warp/mma_tensor_op_tile_iterator.h +++ b/include/cutlass/gemm/warp/mma_tensor_op_tile_iterator.h @@ -403,7 +403,7 @@ public: AccessType const *source_ptr = pointer_[c % kPointerCount] + Layout::TileShape::kContiguous * (c / kPointerCount) + - Policy::LdsmShape::kStrided * s * stride_; + Policy::kLdsmOpInner * Policy::LdsmShape::kStrided * s * stride_; char const *source_byte_ptr = reinterpret_cast<char const *>(source_ptr) + byte_offset + byte_offset_;