File tree 1 file changed +4
-2
lines changed 1 file changed +4
-2
lines changed Original file line number Diff line number Diff line change @@ -1336,8 +1336,10 @@ static llama_state g_state;
1336
1336
// available llama models
1337
1337
enum e_model {
1338
1338
MODEL_UNKNOWN,
1339
+ MODEL_0_5B,
1339
1340
MODEL_1B,
1340
1341
MODEL_3B,
1342
+ MODEL_4B,
1341
1343
MODEL_7B,
1342
1344
MODEL_8B,
1343
1345
MODEL_13B,
@@ -3006,9 +3008,9 @@ static void llm_load_hparams(
3006
3008
{
3007
3009
ml.get_key(LLM_KV_ATTENTION_LAYERNORM_RMS_EPS, hparams.f_norm_rms_eps);
3008
3010
switch (hparams.n_layer) {
3009
- case 24: model.type = e_model::MODEL_1B; break;
3011
+ case 24: model.type = hparams.n_embd == 1024 ? e_model::MODEL_0_5B : e_model::MODEL_1B; break;
3010
3012
case 32: model.type = e_model::MODEL_7B; break;
3011
- case 40: model.type = e_model::MODEL_13B; break;
3013
+ case 40: model.type = hparams.n_head == 20 ? e_model::MODEL_4B : e_model::MODEL_13B; break;
3012
3014
case 80: model.type = e_model::MODEL_70B; break;
3013
3015
default: model.type = e_model::MODEL_UNKNOWN;
3014
3016
}
You can’t perform that action at this time.
0 commit comments