|
@@ -10,7 +10,7 @@ static constexpr __device__ int ggml_cuda_fattn_vec_get_nthreads_device() {
|
|
|
return 128;
|
|
return 128;
|
|
|
}
|
|
}
|
|
|
|
|
|
|
|
-// Currenlty llvm with the amdgcn target dose not support unrolling loops
|
|
|
|
|
|
|
+// Currently llvm with the amdgcn target does not support unrolling loops
|
|
|
// that contain a break that can not be resolved at compile time.
|
|
// that contain a break that can not be resolved at compile time.
|
|
|
#ifdef __clang__
|
|
#ifdef __clang__
|
|
|
#pragma clang diagnostic push
|
|
#pragma clang diagnostic push
|