Procházet zdrojové kódy

CUDA: fix race condition in FA vector kernels (#13742)

Johannes Gäßler před 7 měsíci
rodič
revize
ffd0eae60b

+ 1 - 0
ggml/src/ggml-cuda/fattn-vec-f16.cuh

@@ -212,6 +212,7 @@ static __global__ void flash_attn_vec_ext_f16(
                 }
             }
             if (__all_sync(0xFFFFFFFF, skip)) {
+                __syncthreads();
                 continue;
             }
 #endif // GGML_USE_HIP

+ 1 - 0
ggml/src/ggml-cuda/fattn-vec-f32.cuh

@@ -217,6 +217,7 @@ static __global__ void flash_attn_vec_ext_f32(
                 }
             }
             if (__all_sync(0xFFFFFFFF, skip)) {
+                __syncthreads();
                 continue;
             }
 #endif // GGML_USE_HIP