|
|
@@ -262,11 +262,11 @@ static bool cp_async_available(const int cc) {
|
|
|
}
|
|
|
|
|
|
static constexpr __device__ int ggml_cuda_get_physical_warp_size() {
|
|
|
-#if defined(GGML_USE_HIP) && defined(__HIP_PLATFORM_AMD__)
|
|
|
- return __AMDGCN_WAVEFRONT_SIZE;
|
|
|
+#if defined(GGML_USE_HIP) && defined(__HIP_PLATFORM_AMD__) && (defined(__GFX9__) || defined(__GFX8__))
|
|
|
+ return 64;
|
|
|
#else
|
|
|
return 32;
|
|
|
-#endif // defined(GGML_USE_HIP) && defined(__HIP_PLATFORM_AMD__)
|
|
|
+#endif // defined(GGML_USE_HIP) && defined(__HIP_PLATFORM_AMD__) && (defined(__GFX9__) || defined(__GFX8__))
|
|
|
}
|
|
|
|
|
|
[[noreturn]]
|