Skip to content

Commit eea1184

Browse files
try AMD fix
1 parent 827bc1b commit eea1184

File tree

1 file changed

+1
-2
lines changed

1 file changed

+1
-2
lines changed

ggml-cuda/common.cuh

Lines changed: 1 addition & 2 deletions
Original file line numberDiff line numberDiff line change
@@ -316,8 +316,7 @@ static __device__ __forceinline__ int __dp4a(const int a, const int b, int c) {
316316
}
317317
#endif // defined(GGML_USE_HIPBLAS)
318318

319-
#define FP16_AVAILABLE defined(GGML_USE_HIPBLAS) && defined(__HIP_PLATFORM_AMD__) ? \
320-
defined(RDNA1) || defined(RDNA2) || defined(RDNA3) : __CUDA_ARCH__ >= CC_PASCAL
319+
// FP16_AVAILABLE is 1 when building with GGML_USE_HIPBLAS for __HIP_PLATFORM_AMD__,
// or when __CUDA_ARCH__ is at least CC_PASCAL; otherwise it is 0.
//
// The condition is evaluated here, once, instead of being stored as the macro body:
// a `defined` token that appears as the result of macro expansion inside #if is
// undefined behavior in the C/C++ preprocessor, and an unparenthesized `A || B`
// body would mis-parse in uses such as `#if !FP16_AVAILABLE` or
// `#if FP16_AVAILABLE && X`. Use it as `#if FP16_AVAILABLE` (it is always defined,
// so `#ifdef` is not a meaningful check).
//
// NOTE(review): because the test now runs at this point rather than at each use,
// CC_PASCAL must already be defined above this line -- confirm.
#if (defined(GGML_USE_HIPBLAS) && defined(__HIP_PLATFORM_AMD__)) || __CUDA_ARCH__ >= CC_PASCAL
#define FP16_AVAILABLE 1
#else
#define FP16_AVAILABLE 0
#endif
321320

322321
// FP16_MMA_AVAILABLE is 1 only when NOT building with GGML_USE_HIPBLAS for
// __HIP_PLATFORM_AMD__ and __CUDA_ARCH__ is at least CC_VOLTA; otherwise it is 0.
//
// The condition is evaluated here, once, instead of being stored as the macro body:
// a `defined` token that appears as the result of macro expansion inside #if is
// undefined behavior in the C/C++ preprocessor, and an unparenthesized `!(...) && B`
// body would mis-parse in uses such as `#if !FP16_MMA_AVAILABLE` or
// `#if X || FP16_MMA_AVAILABLE`. Use it as `#if FP16_MMA_AVAILABLE` (it is always
// defined, so `#ifdef` is not a meaningful check).
//
// NOTE(review): because the test now runs at this point rather than at each use,
// CC_VOLTA must already be defined above this line -- confirm.
#if !(defined(GGML_USE_HIPBLAS) && defined(__HIP_PLATFORM_AMD__)) && __CUDA_ARCH__ >= CC_VOLTA
#define FP16_MMA_AVAILABLE 1
#else
#define FP16_MMA_AVAILABLE 0
#endif
323322

0 commit comments

Comments
 (0)