@@ -55,9 +55,18 @@ class _HfExamplesInfo:
5555 trust_remote_code : bool = False
5656 """The ``trust_remote_code`` level required to load the model."""
5757
58+ v0_only : bool = False
59+ """Whether the model is only available with the vLLM V0 engine."""
60+
5861 hf_overrides : dict [str , Any ] = field (default_factory = dict )
5962 """The ``hf_overrides`` required to load the model."""
6063
64+ max_model_len : Optional [int ] = None
65+ """
66+ The maximum model length to use for this model. Some models default to a
67+ length that is too large to fit into memory in CI.
68+ """
69+
6170 def check_transformers_version (
6271 self ,
6372 * ,
@@ -215,10 +224,11 @@ def check_available_online(
215224 "OrionForCausalLM" : _HfExamplesInfo ("OrionStarAI/Orion-14B-Chat" ,
216225 trust_remote_code = True ),
217226 "PersimmonForCausalLM" : _HfExamplesInfo ("adept/persimmon-8b-chat" ),
218- "PhiForCausalLM" : _HfExamplesInfo ("microsoft/phi-2" ),
227+ "PhiForCausalLM" : _HfExamplesInfo ("microsoft/phi-2" , v0_only = True ),
219228 "Phi3ForCausalLM" : _HfExamplesInfo ("microsoft/Phi-3-mini-4k-instruct" ),
220229 "Phi3SmallForCausalLM" : _HfExamplesInfo ("microsoft/Phi-3-small-8k-instruct" ,
221- trust_remote_code = True ),
230+ trust_remote_code = True ,
231+ v0_only = True ),
222232 "PhiMoEForCausalLM" : _HfExamplesInfo ("microsoft/Phi-3.5-MoE-instruct" ,
223233 trust_remote_code = True ),
224234 "Plamo2ForCausalLM" : _HfExamplesInfo ("pfnet/plamo-2-1b" ,
@@ -234,7 +244,8 @@ def check_available_online(
234244 is_available_online = False ),
235245 "StableLMEpochForCausalLM" : _HfExamplesInfo ("stabilityai/stablelm-zephyr-3b" , # noqa: E501
236246 is_available_online = False ),
237- "StableLmForCausalLM" : _HfExamplesInfo ("stabilityai/stablelm-3b-4e1t" ),
247+ "StableLmForCausalLM" : _HfExamplesInfo ("stabilityai/stablelm-3b-4e1t" ,
248+ v0_only = True ),
238249 "Starcoder2ForCausalLM" : _HfExamplesInfo ("bigcode/starcoder2-3b" ),
239250 "SolarForCausalLM" : _HfExamplesInfo ("upstage/solar-pro-preview-instruct" ),
240251 "TeleChat2ForCausalLM" : _HfExamplesInfo ("Tele-AI/TeleChat2-3B" ,
@@ -303,7 +314,8 @@ def check_available_online(
303314 "AriaForConditionalGeneration" : _HfExamplesInfo ("rhymes-ai/Aria" ),
304315 "AyaVisionForConditionalGeneration" : _HfExamplesInfo ("CohereForAI/aya-vision-8b" ), # noqa: E501
305316 "Blip2ForConditionalGeneration" : _HfExamplesInfo ("Salesforce/blip2-opt-2.7b" , # noqa: E501
306- extras = {"6b" : "Salesforce/blip2-opt-6.7b" }), # noqa: E501
317+ extras = {"6b" : "Salesforce/blip2-opt-6.7b" }, # noqa: E501
318+ v0_only = True ),
307319 "ChameleonForConditionalGeneration" : _HfExamplesInfo ("facebook/chameleon-7b" ), # noqa: E501
308320 "DeepseekVLV2ForCausalLM" : _HfExamplesInfo ("deepseek-ai/deepseek-vl2-tiny" , # noqa: E501
309321 extras = {"fork" : "Isotr0py/deepseek-vl2-tiny" }, # noqa: E501
@@ -328,9 +340,11 @@ def check_available_online(
328340 {"tiny" : "HuggingFaceTB/SmolVLM-256M-Instruct" }), # noqa: E501
329341 "KimiVLForConditionalGeneration" : _HfExamplesInfo ("moonshotai/Kimi-VL-A3B-Instruct" , # noqa: E501
330342 extras = {"thinking" : "moonshotai/Kimi-VL-A3B-Thinking" }, # noqa: E501
331- trust_remote_code = True ),
343+ trust_remote_code = True ,
344+ v0_only = True ),
332345 "Llama4ForConditionalGeneration" : _HfExamplesInfo ("meta-llama/Llama-4-Scout-17B-16E-Instruct" , # noqa: E501
333- min_transformers_version = "4.51" ),
346+ min_transformers_version = "4.51" ,
347+ max_model_len = 10240 ),
334348 "LlavaForConditionalGeneration" : _HfExamplesInfo ("llava-hf/llava-1.5-7b-hf" ,
335349 extras = {"mistral" : "mistral-community/pixtral-12b" , # noqa: E501
336350 "mistral-fp8" : "nm-testing/pixtral-12b-FP8-dynamic" }), # noqa: E501
@@ -349,7 +363,8 @@ def check_available_online(
349363 extras = {"2.6" : "openbmb/MiniCPM-V-2_6" }, # noqa: E501
350364 trust_remote_code = True ),
351365 "MiniMaxVL01ForConditionalGeneration" : _HfExamplesInfo ("MiniMaxAI/MiniMax-VL-01" , # noqa: E501
352- trust_remote_code = True ),
366+ trust_remote_code = True ,
367+ v0_only = True ),
353368 "Mistral3ForConditionalGeneration" : _HfExamplesInfo ("mistralai/Mistral-Small-3.1-24B-Instruct-2503" , # noqa: E501
354369 extras = {"fp8" : "nm-testing/Mistral-Small-3.1-24B-Instruct-2503-FP8-dynamic" }), # noqa: E501
355370 "MolmoForCausalLM" : _HfExamplesInfo ("allenai/Molmo-7B-D-0924" ,
@@ -372,7 +387,8 @@ def check_available_online(
372387 "Phi4MMForCausalLM" : _HfExamplesInfo ("microsoft/Phi-4-multimodal-instruct" ,
373388 trust_remote_code = True ),
374389 "PixtralForConditionalGeneration" : _HfExamplesInfo ("mistralai/Pixtral-12B-2409" , # noqa: E501
375- tokenizer_mode = "mistral" ),
390+ tokenizer_mode = "mistral" ,
391+ v0_only = True ),
376392 "QwenVLForConditionalGeneration" : _HfExamplesInfo ("Qwen/Qwen-VL" ,
377393 extras = {"chat" : "Qwen/Qwen-VL-Chat" }, # noqa: E501
378394 trust_remote_code = True ,
0 commit comments