Skip to content

Commit 1118c04

Browse files
authored
Correct mistake in the conditional logic for attn.k
1 parent 8006b15 commit 1118c04

File tree

1 file changed

+2
-2
lines changed

1 file changed

+2
-2
lines changed

src/llama.cpp

Lines changed: 2 additions & 2 deletions
Original file line number | Diff line number | Diff line change
@@ -15414,10 +15414,10 @@ static ggml_type llama_tensor_get_type(quantize_state_internal & qs, ggml_type n
15414 15414
// TODO: explore better strategies
15415 15415
new_type = GGML_TYPE_Q8_0;
15416 15416
}
15417-
else if (ftype == LLAMA_FTYPE_MOSTLY_IQ3_XS && (qs.model.hparams.n_gqa() < 2 || qs.model.hparams.n_expert < 2)) {
15417+
else if (ftype == LLAMA_FTYPE_MOSTLY_IQ3_XS && qs.model.hparams.n_gqa() < 2 && qs.model.hparams.n_expert < 2) {
15418 15418
new_type = GGML_TYPE_IQ3_XXS;
15419 15419
}
15420-
else if (ftype == LLAMA_FTYPE_MOSTLY_IQ3_XXS && (qs.model.hparams.n_gqa() < 2 || qs.model.hparams.n_expert < 2)) {
15420+
else if (ftype == LLAMA_FTYPE_MOSTLY_IQ3_XXS && qs.model.hparams.n_gqa() < 2 && qs.model.hparams.n_expert < 2) {
15421 15421
new_type = GGML_TYPE_IQ2_S;
15422 15422
}
15423 15423
} else if (name.find("attn_q.weight") != std::string::npos) {

0 commit comments

Comments
 (0)