Skip to content

Commit

Permalink
Merge pull request #16 from cjatin/bfloat16_fix
Browse files: browse the repository at this point in the history
Fix ambiguous fma call
  • Loading branch information
mawong-amd authored May 17, 2024
2 parents e3ae076 + e805b3d commit 24584bc
Showing 1 changed file with 1 addition and 1 deletion.
2 changes: 1 addition & 1 deletion csrc/attention/attention_utils.cuh
Original file line number Diff line number Diff line change
@@ -33,7 +33,7 @@ inline __device__ float qk_dot_(const Vec (&q)[N], const Vec (&k)[N]) {
A_vec qk_vec = mul<A_vec, Vec, Vec>(q[0], k[0]);
#pragma unroll
for (int ii = 1; ii < N; ++ii) {
- qk_vec = fma(q[ii], k[ii], qk_vec);
+ qk_vec = vllm::fma(q[ii], k[ii], qk_vec);
}

// Finalize the reduction across lanes.
Expand Down

0 comments on commit 24584bc

Please sign in to comment.