
Commit 55a939d

Author: Nikolay Borisov
convert: Fix handling of LLAMA2 vocab_size = -1
When vocab_size is detected to be -1, simply remove its value from the parsed params.json and fall back to using tok_embeddings.weight. Fixes #3900
1 parent: c77d530

File tree

1 file changed: +5 −0 lines changed


convert.py

Lines changed: 5 additions & 0 deletions
@@ -254,6 +254,11 @@ def loadOriginalParamsJson(model: LazyModel, config_path: Path) -> Params:
         elif norm_eps == 1e-05 or norm_eps == 1e-06:
             # LLaMA v2
             n_ctx = 4096
+            # For some reason FB writes -1 to vocab size for their LLAMA2 models
+            # simply remove this bogus value and let the return statement below
+            # figure it out
+            if config["vocab_size"] == -1:
+                del config["vocab_size"]
         else:
             # LLaMA v1
             n_ctx = 2048

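The effect of the patch can be illustrated with a minimal, self-contained sketch. This is not the actual convert.py code: `resolve_vocab_size` and its arguments are hypothetical names, standing in for the real flow where the parsed params.json and the `tok_embeddings.weight` tensor shape are both available when `Params` is built.

```python
# Hypothetical sketch of the fallback introduced by this commit:
# if params.json carries the bogus vocab_size = -1, drop the key so the
# vocabulary size is inferred from the token-embedding tensor instead.

def resolve_vocab_size(config: dict, tok_embeddings_shape: tuple) -> int:
    # FB's LLaMA 2 params.json files may contain "vocab_size": -1
    if config.get("vocab_size", -1) == -1:
        config.pop("vocab_size", None)  # discard the bogus value
    # Fall back to the first dimension of tok_embeddings.weight,
    # whose shape is (n_vocab, n_embd)
    return config.get("vocab_size", tok_embeddings_shape[0])

# A LLaMA 2 style config with the bogus value:
cfg = {"dim": 4096, "vocab_size": -1}
print(resolve_vocab_size(cfg, (32000, 4096)))  # -> 32000
```

Deleting the key (rather than overwriting it) lets the existing return path in `loadOriginalParamsJson` handle the missing value uniformly, which is why the patch is only five lines.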