|  | 
| 4767 | 4767 |       { | 
| 4768 | 4768 |         "model_format": "pytorch", | 
| 4769 | 4769 |         "model_size_in_billions": 671, | 
|  | 4770 | +        "activated_size_in_billions": 37, | 
| 4770 | 4771 |         "model_src": { | 
| 4771 | 4772 |           "huggingface": { | 
| 4772 | 4773 |             "quantizations": [ | 
|  | 
| 4846 | 4847 |       { | 
| 4847 | 4848 |         "model_format": "pytorch", | 
| 4848 | 4849 |         "model_size_in_billions": 671, | 
|  | 4850 | +        "activated_size_in_billions": 37, | 
| 4849 | 4851 |         "model_src": { | 
| 4850 | 4852 |           "huggingface": { | 
| 4851 | 4853 |             "quantizations": [ | 
|  | 
| 4866 | 4868 |       { | 
| 4867 | 4869 |         "model_format": "awq", | 
| 4868 | 4870 |         "model_size_in_billions": 671, | 
|  | 4871 | +        "activated_size_in_billions": 37, | 
| 4869 | 4872 |         "model_src": { | 
| 4870 | 4873 |           "huggingface": { | 
| 4871 | 4874 |             "quantizations": [ | 
|  | 
| 4885 | 4888 |       { | 
| 4886 | 4889 |         "model_format": "ggufv2", | 
| 4887 | 4890 |         "model_size_in_billions": 671, | 
|  | 4891 | +        "activated_size_in_billions": 37, | 
| 4888 | 4892 |         "model_src": { | 
| 4889 | 4893 |           "huggingface": { | 
| 4890 | 4894 |             "quantizations": [ | 
|  | 
| 5215 | 5219 |       { | 
| 5216 | 5220 |         "model_format": "mlx", | 
| 5217 | 5221 |         "model_size_in_billions": 671, | 
|  | 5222 | +        "activated_size_in_billions": 37, | 
| 5218 | 5223 |         "model_src": { | 
| 5219 | 5224 |           "huggingface": { | 
| 5220 | 5225 |             "quantizations": [ | 
|  | 
| 5263 | 5268 |       { | 
| 5264 | 5269 |         "model_format": "pytorch", | 
| 5265 | 5270 |         "model_size_in_billions": 671, | 
|  | 5271 | +        "activated_size_in_billions": 37, | 
| 5266 | 5272 |         "model_src": { | 
| 5267 | 5273 |           "huggingface": { | 
| 5268 | 5274 |             "quantizations": [ | 
|  | 
| 5281 | 5287 |       { | 
| 5282 | 5288 |         "model_format": "gptq", | 
| 5283 | 5289 |         "model_size_in_billions": 671, | 
|  | 5290 | +        "activated_size_in_billions": 37, | 
| 5284 | 5291 |         "model_src": { | 
| 5285 | 5292 |           "huggingface": { | 
| 5286 | 5293 |             "quantizations": [ | 
|  | 
| 5311 | 5318 |     "reasoning_start_tag": "<think>", | 
| 5312 | 5319 |     "reasoning_end_tag": "</think>" | 
| 5313 | 5320 |   }, | 
|  | 5321 | +  { | 
|  | 5322 | +    "version": 2, | 
|  | 5323 | +    "context_length": 131072, | 
|  | 5324 | +    "model_name": "Deepseek-V3.1", | 
|  | 5325 | +    "model_lang": [ | 
|  | 5326 | +      "en", | 
|  | 5327 | +      "zh" | 
|  | 5328 | +    ], | 
|  | 5329 | +    "model_ability": [ | 
|  | 5330 | +      "chat", | 
|  | 5331 | +      "reasoning", | 
|  | 5332 | +      "hybrid", | 
|  | 5333 | +      "tools" | 
|  | 5334 | +    ], | 
|  | 5335 | +    "model_description": "DeepSeek-V3.1 is a hybrid model that supports both thinking mode and non-thinking mode.", | 
|  | 5336 | +    "model_specs": [ | 
|  | 5337 | +      { | 
|  | 5338 | +        "model_format": "pytorch", | 
|  | 5339 | +        "model_size_in_billions": 671, | 
|  | 5340 | +        "activated_size_in_billions": 37, | 
|  | 5341 | +        "model_src": { | 
|  | 5342 | +          "huggingface": { | 
|  | 5343 | +            "quantizations": [ | 
|  | 5344 | +              "none" | 
|  | 5345 | +            ], | 
|  | 5346 | +            "model_id": "deepseek-ai/DeepSeek-V3.1" | 
|  | 5347 | +          }, | 
|  | 5348 | +          "modelscope": { | 
|  | 5349 | +            "quantizations": [ | 
|  | 5350 | +              "none" | 
|  | 5351 | +            ], | 
|  | 5352 | +            "model_id": "deepseek-ai/DeepSeek-V3.1" | 
|  | 5353 | +          } | 
|  | 5354 | +        } | 
|  | 5355 | +      }, | 
|  | 5356 | +      { | 
|  | 5357 | +        "model_format": "gptq", | 
|  | 5358 | +        "model_size_in_billions": 671, | 
|  | 5359 | +        "activated_size_in_billions": 37, | 
|  | 5360 | +        "model_src": { | 
|  | 5361 | +          "huggingface": { | 
|  | 5362 | +            "quantizations": [ | 
|  | 5363 | +              "Int4" | 
|  | 5364 | +            ], | 
|  | 5365 | +            "model_id": "cpatonn/DeepSeek-V3.1-GPTQ-4bit" | 
|  | 5366 | +          }, | 
|  | 5367 | +          "modelscope": { | 
|  | 5368 | +            "quantizations": [ | 
|  | 5369 | +              "Int4" | 
|  | 5370 | +            ], | 
|  | 5371 | +            "model_id": "cpatonn/DeepSeek-V3.1-GPTQ-4bit" | 
|  | 5372 | +          } | 
|  | 5373 | +        } | 
|  | 5374 | +      }, | 
|  | 5375 | +      { | 
|  | 5376 | +        "model_format": "awq", | 
|  | 5377 | +        "model_size_in_billions": 671, | 
|  | 5378 | +        "activated_size_in_billions": 37, | 
|  | 5379 | +        "model_src": { | 
|  | 5380 | +          "huggingface": { | 
|  | 5381 | +            "quantizations": [ | 
|  | 5382 | +              "Int4" | 
|  | 5383 | +            ], | 
|  | 5384 | +            "model_id": "QuantTrio/DeepSeek-V3.1-AWQ" | 
|  | 5385 | +          }, | 
|  | 5386 | +          "modelscope": { | 
|  | 5387 | +            "quantizations": [ | 
|  | 5388 | +              "Int4" | 
|  | 5389 | +            ], | 
|  | 5390 | +            "model_id": "tclf90/DeepSeek-V3.1-AWQ" | 
|  | 5391 | +          } | 
|  | 5392 | +        } | 
|  | 5393 | +      }, | 
|  | 5394 | +      { | 
|  | 5395 | +        "model_format": "mlx", | 
|  | 5396 | +        "model_size_in_billions": 671, | 
|  | 5397 | +        "activated_size_in_billions": 37, | 
|  | 5398 | +        "model_src": { | 
|  | 5399 | +          "huggingface": { | 
|  | 5400 | +            "quantizations": [ | 
|  | 5401 | +              "8bit", | 
|  | 5402 | +              "4bit" | 
|  | 5403 | +            ], | 
|  | 5404 | +            "model_id": "mlx-community/DeepSeek-V3.1-{quantization}" | 
|  | 5405 | +          }, | 
|  | 5406 | +          "modelscope": { | 
|  | 5407 | +            "quantizations": [ | 
|  | 5408 | +              "8bit", | 
|  | 5409 | +              "4bit" | 
|  | 5410 | +            ], | 
|  | 5411 | +            "model_id": "mlx-community/DeepSeek-V3.1-{quantization}" | 
|  | 5412 | +          } | 
|  | 5413 | +        } | 
|  | 5414 | +      } | 
|  | 5415 | +    ], | 
|  | 5416 | +    "chat_template": "{% if not add_generation_prompt is defined %}{% set add_generation_prompt = false %}{% endif %}{% if not thinking is defined %}{% set thinking = false %}{% endif %}{% set ns = namespace(is_first=false, is_tool=false, system_prompt='', is_first_sp=true, is_last_user=false) %}{%- for message in messages %}{%- if message['role'] == 'system' %}{%- if ns.is_first_sp %}{% set ns.system_prompt = ns.system_prompt + message['content'] %}{% set ns.is_first_sp = false %}{%- else %}{% set ns.system_prompt = ns.system_prompt + '\n\n' + message['content'] %}{%- endif %}{%- endif %}{%- endfor %}{{ bos_token }}{{ ns.system_prompt }}{%- for message in messages %}{%- if message['role'] == 'user' %}{%- set ns.is_tool = false -%}{%- set ns.is_first = false -%}{%- set ns.is_last_user = true -%}{{'<|User|>' + message['content']}}{%- endif %}{%- if message['role'] == 'assistant' and message['tool_calls'] is defined and message['tool_calls'] is not none %}{%- if ns.is_last_user %}{{'<|Assistant|></think>'}}{%- endif %}{%- set ns.is_last_user = false -%}{%- set ns.is_first = false %}{%- set ns.is_tool = false -%}{%- for tool in message['tool_calls'] %}{%- if not ns.is_first %}{%- if message['content'] is none %}{{'<|tool▁calls▁begin|><|tool▁call▁begin|>'+ tool['function']['name'] + '<|tool▁sep|>' + tool['function']['arguments'] + '<|tool▁call▁end|>'}}{%- else %}{{message['content'] + '<|tool▁calls▁begin|><|tool▁call▁begin|>' + tool['function']['name'] + '<|tool▁sep|>' + tool['function']['arguments'] + '<|tool▁call▁end|>'}}{%- endif %}{%- set ns.is_first = true -%}{%- else %}{{'<|tool▁call▁begin|>'+ tool['function']['name'] + '<|tool▁sep|>' + tool['function']['arguments'] + '<|tool▁call▁end|>'}}{%- endif %}{%- endfor %}{{'<|tool▁calls▁end|><|end▁of▁sentence|>'}}{%- endif %}{%- if message['role'] == 'assistant' and (message['tool_calls'] is not defined or message['tool_calls'] is none) %}{%- if ns.is_last_user %}{{'<|Assistant|>'}}{%- if message['prefix'] is defined and message['prefix'] and thinking %}{{'<think>'}}  {%- else %}{{'</think>'}}{%- endif %}{%- endif %}{%- set ns.is_last_user = false -%}{%- if ns.is_tool %}{{message['content'] + '<|end▁of▁sentence|>'}}{%- set ns.is_tool = false -%}{%- else %}{%- set content = message['content'] -%}{%- if '</think>' in content %}{%- set content = content.split('</think>', 1)[1] -%}{%- endif %}{{content + '<|end▁of▁sentence|>'}}{%- endif %}{%- endif %}{%- if message['role'] == 'tool' %}{%- set ns.is_last_user = false -%}{%- set ns.is_tool = true -%}{{'<|tool▁output▁begin|>' + message['content'] + '<|tool▁output▁end|>'}}{%- endif %}{%- endfor -%}{%- if add_generation_prompt and ns.is_last_user and not ns.is_tool %}{{'<|Assistant|>'}}{%- if not thinking %}{{'</think>'}}{%- else %}{{'<think>'}}{%- endif %}{% endif %}", | 
|  | 5417 | +    "stop_token_ids": [ | 
|  | 5418 | +      1 | 
|  | 5419 | +    ], | 
|  | 5420 | +    "stop": [ | 
|  | 5421 | +      "<|end▁of▁sentence|>" | 
|  | 5422 | +    ], | 
|  | 5423 | +    "reasoning_start_tag": "<think>", | 
|  | 5424 | +    "reasoning_end_tag": "</think>", | 
|  | 5425 | +    "virtualenv": { | 
|  | 5426 | +      "packages": [ | 
|  | 5427 | +        "transformers==4.53.0" | 
|  | 5428 | +      ] | 
|  | 5429 | +    } | 
|  | 5430 | +  }, | 
| 5314 | 5431 |   { | 
| 5315 | 5432 |     "version": 2, | 
| 5316 | 5433 |     "context_length": 131072, | 
|  | 
| 6242 | 6359 |       { | 
| 6243 | 6360 |         "model_format": "pytorch", | 
| 6244 | 6361 |         "model_size_in_billions": 671, | 
|  | 6362 | +        "activated_size_in_billions": 37, | 
| 6245 | 6363 |         "model_src": { | 
| 6246 | 6364 |           "huggingface": { | 
| 6247 | 6365 |             "quantizations": [ | 
|  | 
| 6262 | 6380 |       { | 
| 6263 | 6381 |         "model_format": "awq", | 
| 6264 | 6382 |         "model_size_in_billions": 671, | 
|  | 6383 | +        "activated_size_in_billions": 37, | 
| 6265 | 6384 |         "model_src": { | 
| 6266 | 6385 |           "huggingface": { | 
| 6267 | 6386 |             "quantizations": [ | 
|  | 
| 6281 | 6400 |       { | 
| 6282 | 6401 |         "model_format": "ggufv2", | 
| 6283 | 6402 |         "model_size_in_billions": 671, | 
|  | 6403 | +        "activated_size_in_billions": 37, | 
| 6284 | 6404 |         "model_src": { | 
| 6285 | 6405 |           "huggingface": { | 
| 6286 | 6406 |             "quantizations": [ | 
|  | 
| 6475 | 6595 |       { | 
| 6476 | 6596 |         "model_format": "mlx", | 
| 6477 | 6597 |         "model_size_in_billions": 671, | 
|  | 6598 | +        "activated_size_in_billions": 37, | 
| 6478 | 6599 |         "model_src": { | 
| 6479 | 6600 |           "huggingface": { | 
| 6480 | 6601 |             "quantizations": [ | 
|  | 
| 6517 | 6638 |       { | 
| 6518 | 6639 |         "model_format": "pytorch", | 
| 6519 | 6640 |         "model_size_in_billions": 671, | 
|  | 6641 | +        "activated_size_in_billions": 37, | 
| 6520 | 6642 |         "model_src": { | 
| 6521 | 6643 |           "huggingface": { | 
| 6522 | 6644 |             "quantizations": [ | 
|  | 
| 6535 | 6657 |       { | 
| 6536 | 6658 |         "model_format": "awq", | 
| 6537 | 6659 |         "model_size_in_billions": 671, | 
|  | 6660 | +        "activated_size_in_billions": 37, | 
| 6538 | 6661 |         "model_src": { | 
| 6539 | 6662 |           "huggingface": { | 
| 6540 | 6663 |             "quantizations": [ | 
|  | 
| 6553 | 6676 |       { | 
| 6554 | 6677 |         "model_format": "mlx", | 
| 6555 | 6678 |         "model_size_in_billions": 671, | 
|  | 6679 | +        "activated_size_in_billions": 37, | 
| 6556 | 6680 |         "model_src": { | 
| 6557 | 6681 |           "huggingface": { | 
| 6558 | 6682 |             "quantizations": [ | 
|  | 
0 commit comments