[AMD][CI/Build] Disambiguate the fma function call for compatibility with ROCm 6.2 headers (#7477)
Co-authored-by: Charlie Fu <Charlie.Fu@amd.com>
This commit is contained in:
parent
7eebe8ccaa
commit
9984605412
@ -34,7 +34,7 @@ inline __device__ float qk_dot_(const Vec (&q)[N], const Vec (&k)[N]) {
|
|||||||
A_vec qk_vec = mul<A_vec, Vec, Vec>(q[0], k[0]);
|
A_vec qk_vec = mul<A_vec, Vec, Vec>(q[0], k[0]);
|
||||||
#pragma unroll
|
#pragma unroll
|
||||||
for (int ii = 1; ii < N; ++ii) {
|
for (int ii = 1; ii < N; ++ii) {
|
||||||
qk_vec = fma(q[ii], k[ii], qk_vec);
|
qk_vec = vllm::fma(q[ii], k[ii], qk_vec);
|
||||||
}
|
}
|
||||||
|
|
||||||
// Finalize the reduction across lanes.
|
// Finalize the reduction across lanes.
|
||||||
|
|||||||
Loading…
Reference in New Issue
Block a user