Skip to content

Commit d91e765

Browse files
try fix
1 parent 90d8b8d commit d91e765

File tree

1 file changed

+1
-1
lines changed

1 file changed

+1
-1
lines changed

ggml/src/ggml-cuda/common.cuh

Lines changed: 1 addition & 1 deletion
Original file line number | Diff line number | Diff line change
@@ -551,7 +551,7 @@ static __device__ __forceinline__ void ggml_cuda_fma(float & acc, const float v,
551 551

552 552
static __device__ __forceinline__ void ggml_cuda_fma(float & acc, const half2 v, const half2 u) {
553 553
#if defined(GGML_USE_HIP) && defined(GCN)
554-
asm volatile("v_dot2_f32_f16 %0, %1, %2, %0" : "=v"(acc) : "v"(v), "v"(u));
554+
asm volatile("v_dot2_f32_f16 %0, %1, %2, %0" : "+v"(acc) : "v"(v), "v"(u));
555 555
#else
556 556
#ifdef FAST_FP16_AVAILABLE
557 557
const float2 tmp = __half22float2(v*u);

0 commit comments

Comments
 (0)