Skip to content

Commit e69ffba

Browse files
committed
convert-hf-to-gguf: add Viking-7b (using llama-bpe)
1 parent 3afb494 commit e69ffba

File tree

2 files changed

+6
-1
lines changed

2 files changed

+6
-1
lines changed

convert-hf-to-gguf-update.py

Lines changed: 3 additions & 1 deletion
Original file line number | Diff line number | Diff line change
@@ -80,6 +80,7 @@ class TOKENIZER_TYPE(IntEnum):
80 80
{"name": "jina-v2-en", "tokt": TOKENIZER_TYPE.WPM, "repo": "https://huggingface.co/jinaai/jina-embeddings-v2-base-en", }, # WPM!
81 81
{"name": "jina-v2-es", "tokt": TOKENIZER_TYPE.BPE, "repo": "https://huggingface.co/jinaai/jina-embeddings-v2-base-es", },
82 82
{"name": "jina-v2-de", "tokt": TOKENIZER_TYPE.BPE, "repo": "https://huggingface.co/jinaai/jina-embeddings-v2-base-de", },
83 +
{"name": "viking-7b", "tokt": TOKENIZER_TYPE.BPE, "repo": "https://huggingface.co/LumiOpen/Viking-7B", "type": "llama-bpe" },
83 84
]
84 85

85 86

@@ -124,6 +125,7 @@ def download_model(model):
124 125
src_ifs = ""
125 126
for model in models:
126 127
name = model["name"]
128 +
model_type = model.get("type") or name
127 129
tokt = model["tokt"]
128 130

129 131
if tokt == TOKENIZER_TYPE.SPM:
@@ -164,7 +166,7 @@ def download_model(model):
164 166

165 167
src_ifs += f" if chkhsh == \"{chkhsh}\":\n"
166 168
src_ifs += f" # ref: {model['repo']}\n"
167 -
src_ifs += f" res = \"{name}\"\n"
169 +
src_ifs += f" res = \"{model_type}\"\n"
168 170

169 171
src_func = f"""
170 172
def get_vocab_base_pre(self, tokenizer) -> str:

convert-hf-to-gguf.py

Lines changed: 3 additions & 0 deletions
Original file line number | Diff line number | Diff line change
@@ -470,6 +470,9 @@ def get_vocab_base_pre(self, tokenizer) -> str:
470 470
if chkhsh == "27949a2493fc4a9f53f5b9b029c82689cfbe5d3a1929bb25e043089e28466de6":
471 471
# ref: https://huggingface.co/jinaai/jina-embeddings-v2-base-de
472 472
res = "jina-v2-de"
473 +
if chkhsh == "7fc505bd3104ca1083b150b17d088b59534ede9bde81f0dd2090967d7fe52cee":
474 +
# ref: https://huggingface.co/LumiOpen/Viking-7B
475 +
res = "llama-bpe"
473 476

474 477
if res is None:
475 478
logger.warning("\n")

0 commit comments

Comments
 (0)