Skip to content

Commit 0770ec9

Browse files
committed
Fix RDNA4 perf
1 parent 37b9f0d commit 0770ec9

File tree

1 file changed

+2
-2
lines changed

1 file changed

+2
-2
lines changed

ggml/src/ggml-cuda/ggml-cuda.cu

Lines changed: 2 additions & 2 deletions
Original file line number | Diff line number | Diff line change
@@ -1247,7 +1247,7 @@ static void ggml_cuda_op_mul_mat_cublas(
1247 1247

1248 1248
CUBLAS_CHECK(cublasSetStream(ctx.cublas_handle(id), stream));
1249 1249

1250-
if (GGML_CUDA_CC_IS_CDNA(cc) || GGML_CUDA_CC_IS_RDNA4(cc)) {
1250+
if (GGML_CUDA_CC_IS_CDNA(cc)) {
1251 1251
const float alpha = 1.0f;
1252 1252
const float beta = 0.0f;
1253 1253
CUBLAS_CHECK(
@@ -1792,7 +1792,7 @@ static void ggml_cuda_mul_mat_batched_cublas(ggml_backend_cuda_context & ctx, co
1792 1792

1793 1793
int id = ggml_cuda_get_device();
1794 1794
const int cc = ggml_cuda_info().devices[id].cc;
1795-
if (GGML_CUDA_CC_IS_CDNA(cc) || GGML_CUDA_CC_IS_RDNA4(cc)) {
1795+
if (GGML_CUDA_CC_IS_CDNA(cc)) {
1796 1796
cu_compute_type = CUBLAS_COMPUTE_32F;
1797 1797
alpha = &alpha_f32;
1798 1798
beta = &beta_f32;

0 commit comments

Comments
 (0)