Skip to content

Commit bf41f17

Browse files
committed
MUSA: Stop explicitly setting use_mul_mat_vec_q to false
Signed-off-by: Xiaodong Ye <[email protected]>
1 parent 12329e6 commit bf41f17

File tree

2 files changed: +1 addition, -7 deletions

ggml/src/ggml-cuda.cu

-6
Original file line numberDiff line numberDiff line change
@@ -1906,17 +1906,11 @@ static void ggml_cuda_mul_mat(ggml_backend_cuda_context & ctx, const ggml_tensor
19061906
const int cc = ggml_cuda_info().devices[id].cc;
19071907
use_mul_mat_q = use_mul_mat_q && ggml_cuda_should_use_mmq(src0->type, cc, src1->ne[1]);
19081908
any_gpus_with_slow_fp16 = any_gpus_with_slow_fp16 || !fast_fp16_available(cc);
1909-
#ifdef GGML_USE_MUSA
1910-
use_mul_mat_vec_q = false;
1911-
#endif // GGML_USE_MUSA
19121909
}
19131910
} else {
19141911
const int cc = ggml_cuda_info().devices[ctx.device].cc;
19151912
use_mul_mat_q = use_mul_mat_q && ggml_cuda_should_use_mmq(src0->type, cc, src1->ne[1]);
19161913
any_gpus_with_slow_fp16 = any_gpus_with_slow_fp16 || !fast_fp16_available(cc);
1917-
#ifdef GGML_USE_MUSA
1918-
use_mul_mat_vec_q = false;
1919-
#endif // GGML_USE_MUSA
19201914
}
19211915

19221916
// debug helpers

ggml/src/ggml-cuda/common.cuh

+1 -1
Original file line numberDiff line numberDiff line change
@@ -181,7 +181,7 @@
181181
#define cudaMemcpyAsync musaMemcpyAsync
182182
#define cudaMemcpyPeerAsync musaMemcpyPeerAsync
183183
#define cudaMemcpy2DAsync musaMemcpy2DAsync
184-
#define cudaMemcpyDeviceToDevice musaMemcpyDeviceToDevice
184+
#define cudaMemcpyDeviceToDevice musaMemcpyDefault
185185
#define cudaMemcpyDeviceToHost musaMemcpyDeviceToHost
186186
#define cudaMemcpyHostToDevice musaMemcpyHostToDevice
187187
#define cudaMemcpyKind musaMemcpyKind

0 commit comments

Comments
 (0)