Explicitly cast blockIdx to uint3 (#1192)

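This works around a Clang issue: when CUDA code is compiled with Clang, `blockIdx` has a different type than `uint3`, so it is explicitly converted with `static_cast<uint3>` before being unpacked by the structured binding.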
This commit is contained in:
Christian Sigg 2023-11-30 06:26:23 +01:00 committed by GitHub
parent a759e85f5f
commit 99c4eebe3b
No known key found for this signature in database
GPG Key ID: 4AEE18F83AFDEB23

View File

@@ -201,7 +201,7 @@ public:
// Get the appropriate blocks for this thread block -- potential for thread block locality
int thread_idx = int(threadIdx.x);
auto blk_shape = TileShape{}; // (BLK_M,BLK_N,BLK_K)
auto [m_coord, n_coord, l_coord] = blockIdx;
auto [m_coord, n_coord, l_coord] = static_cast<uint3>(blockIdx);
auto blk_coord_mnkl = make_coord(m_coord, n_coord, _, l_coord); // (m,n,k,l)
// Represent the full tensors