Skip to content

Commit 194a0fd

Browse files
authored
Merge branch 'ggerganov:master' into sycl
2 parents 3b4e035 + 3466c6e commit 194a0fd

File tree

1 file changed

+4
-2
lines changed

1 file changed

+4
-2
lines changed

llama.cpp

Lines changed: 4 additions & 2 deletions
Original file line number | Diff line number | Diff line change
@@ -1336,8 +1336,10 @@ static llama_state g_state;
1336 1336    // available llama models
1337 1337    enum e_model {
1338 1338        MODEL_UNKNOWN,
     1339 +      MODEL_0_5B,
1339 1340        MODEL_1B,
1340 1341        MODEL_3B,
     1342 +      MODEL_4B,
1341 1343        MODEL_7B,
1342 1344        MODEL_8B,
1343 1345        MODEL_13B,
@@ -3006,9 +3008,9 @@ static void llm_load_hparams(
3006 3008    {
3007 3009        ml.get_key(LLM_KV_ATTENTION_LAYERNORM_RMS_EPS, hparams.f_norm_rms_eps);
3008 3010        switch (hparams.n_layer) {
3009      -          case 24: model.type = e_model::MODEL_1B; break;
     3011 +          case 24: model.type = hparams.n_embd == 1024 ? e_model::MODEL_0_5B : e_model::MODEL_1B; break;
3010 3012            case 32: model.type = e_model::MODEL_7B; break;
3011      -          case 40: model.type = e_model::MODEL_13B; break;
     3013 +          case 40: model.type = hparams.n_head == 20 ? e_model::MODEL_4B : e_model::MODEL_13B; break;
3012 3014            case 80: model.type = e_model::MODEL_70B; break;
3013 3015            default: model.type = e_model::MODEL_UNKNOWN;
3014 3016        }

0 commit comments

Comments
 (0)