Skip to content

Commit 1e735d2

Browse files
Added missing __syncthreads();
1 parent ae0b2a9 commit 1e735d2

File tree

1 file changed

+1
-0
lines changed

1 file changed

+1
-0
lines changed

ggml-cuda.cu

+1
Original file line number | Diff line number | Diff line change
@@ -229,6 +229,7 @@ template <int block_size, int qk, dequantize_kernel_t dequantize_kernel> static
229 | 229 |       }
230 | 230 |
231 | 231 |       // sum up partial sums and write back result
    | 232 | +     __syncthreads();
232 | 233 |       for (int s=block_size/2; s>0; s>>=1) {
233 | 234 |           if (tid < s) {
234 | 235 |               tmp[tid] += tmp[tid + s];

0 commit comments

Comments
 (0)