Skip to content

Commit 4329d1a

Browse files
authored
CUDA: use min compute capability of GPUs actually used (#2506)
1 parent 02f9d96 commit 4329d1a

File tree

1 file changed

+2
-1
lines changed

1 file changed

+2
-1
lines changed

ggml-cuda.cu

Lines changed: 2 additions & 1 deletion
Original file line number | Diff line number | Diff line change
@@ -5347,7 +5347,8 @@ void ggml_cuda_mul_mat(const ggml_tensor * src0, const ggml_tensor * src1, ggml_
53475347
} else {
53485348
int min_compute_capability = INT_MAX;
53495349
for (int id = 0; id < g_device_count; ++id) {
5350-
if (min_compute_capability > g_compute_capabilities[id]) {
5350+
if (min_compute_capability > g_compute_capabilities[id]
5351+
&& g_tensor_split[id] < (id + 1 < g_device_count ? g_tensor_split[id + 1] : 1.0f)) {
53515352
min_compute_capability = g_compute_capabilities[id];
53525353
}
53535354
}

0 commit comments

Comments
 (0)