We read every piece of feedback, and take your input very seriously.
To see all available qualifiers, see our documentation.
There was an error while loading. Please reload this page.
1 parent 2abce2c, commit 11649d4. Copy full SHA for 11649d4
ggml-cuda.cu
@@ -6356,6 +6356,7 @@ static int64_t get_row_rounding(ggml_type type) {
6356
case GGML_TYPE_Q8_0:
6357
return max_compute_capability >= CC_RDNA2 ? 128 : 64;
6358
case GGML_TYPE_F16:
6359
+ case GGML_TYPE_F32:
6360
return 1;
6361
case GGML_TYPE_Q2_K:
6362
return max_compute_capability >= CC_RDNA2 ? 128 : 32;
@@ -6378,6 +6379,7 @@ static int64_t get_row_rounding(ggml_type type) {
6378
6379
6380
return 64;
6381
6382
6383
6384
6385
case GGML_TYPE_Q3_K:
0 commit comments