
Commit f36a777

Author: Nikolay Borisov
convert: Fix handling of LLAMA2 vocab_size = -1
When vocab_size is detected to be -1, simply remove it from the parsed params.json and fall back to using tok_embeddings.weight. Fixes #3900
Parent: d6d905b

1 file changed (+5, -0)

convert.py

Lines changed: 5 additions & 0 deletions
@@ -253,6 +253,11 @@ def loadOriginalParamsJson(model: LazyModel, config_path: Path) -> Params:
     elif config["norm_eps"] in (1e-05, 1e-06):
         # LLaMA v2
         n_ctx = 4096
+        # For some reason FB writes -1 to vocab size for their LLAMA2 models;
+        # simply remove this bogus value and let the return statement below
+        # figure it out
+        if config["vocab_size"] == -1:
+            del config["vocab_size"]
     else:
         # LLaMA v1
         n_ctx = 2048
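
For context, the fallback mentioned in the commit message works because the token-embedding matrix has one row per vocabulary entry, so its first dimension is the vocabulary size. Below is a minimal sketch of that inference, assuming a plain dict of tensors; the helper name infer_n_vocab and the dict layout are illustrative, not the actual convert.py code:

    # Illustrative sketch, not the actual convert.py implementation.
    # After the fix above deletes a bogus vocab_size == -1 entry, absence
    # of the key means "derive the vocabulary size from the weights".
    def infer_n_vocab(config: dict, model: dict) -> int:
        if "vocab_size" in config:
            return config["vocab_size"]
        # tok_embeddings.weight has shape (n_vocab, n_embd), so the first
        # dimension is the number of tokens in the vocabulary.
        return model["tok_embeddings.weight"].shape[0]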
