Skip to content

Commit 7ec5b63

Browse files
Removed hipblas compatibility code
1 parent 72bf00b commit 7ec5b63

File tree

1 file changed

+0
-12
lines changed

1 file changed

+0
-12
lines changed

ggml-cuda.cu

Lines changed: 0 additions & 12 deletions
Original file line number | Diff line number | Diff line change
@@ -220,22 +220,10 @@ static __global__ void dequantize_mul_mat_vec(const void * vx, const float * y,
220 220

221 221
// sum up partial sums and write back result
222 222
__syncthreads();
223-
#ifdef GGML_USE_HIPBLAS
224-
__shared__ float tmpa[block_size];
225-
tmpa[tid] = tmp;
226-
for (int s=block_size/2; s>0; s>>=1) {
227-
if (tid < s) {
228-
tmpa[tid] += tmpa[tid + s];
229-
}
230-
__syncthreads();
231-
}
232-
tmp = tmpa[0]; // now full sum
233-
#else
234 223
#pragma unroll
235 224
for (int mask = 16; mask > 0; mask >>= 1) {
236 225
tmp += __shfl_xor_sync(0xffffffff, tmp, mask, 32);
237 226
}
238-
#endif
239 227

240 228
if (tid == 0) {
241 229
dst[row] = tmp;

0 commit comments

Comments
 (0)