@@ -187,19 +187,19 @@ steps:
187
187
- examples/
188
188
commands:
189
189
- pip install tensorizer # for tensorizer test
190
- - python3 offline_inference.py
191
- - python3 cpu_offload.py
192
- - python3 offline_inference_chat.py
193
- - python3 offline_inference_with_prefix.py
194
- - python3 llm_engine_example.py
195
- - python3 offline_inference_vision_language.py
196
- - python3 offline_inference_vision_language_multi_image.py
197
- - python3 tensorize_vllm_model.py --model facebook/opt-125m serialize --serialized-directory /tmp/ --suffix v1 && python3 tensorize_vllm_model.py --model facebook/opt-125m deserialize --path-to-tensors /tmp/vllm/facebook/opt-125m/v1/model.tensors
198
- - python3 offline_inference_encoder_decoder.py
199
- - python3 offline_inference_classification.py
200
- - python3 offline_inference_embedding.py
201
- - python3 offline_inference_scoring.py
202
- - python3 offline_profile.py --model facebook/opt-125m run_num_steps --num-steps 2
190
+ - python3 offline_inference/offline_inference.py
191
+ - python3 offline_inference/cpu_offload.py
192
+ - python3 offline_inference/offline_inference_chat.py
193
+ - python3 offline_inference/offline_inference_with_prefix.py
194
+ - python3 offline_inference/llm_engine_example.py
195
+ - python3 offline_inference/offline_inference_vision_language.py
196
+ - python3 offline_inference/offline_inference_vision_language_multi_image.py
197
+ - python3 other/tensorize_vllm_model.py --model facebook/opt-125m serialize --serialized-directory /tmp/ --suffix v1 && python3 other/tensorize_vllm_model.py --model facebook/opt-125m deserialize --path-to-tensors /tmp/vllm/facebook/opt-125m/v1/model.tensors
198
+ - python3 offline_inference/offline_inference_encoder_decoder.py
199
+ - python3 offline_inference/offline_inference_classification.py
200
+ - python3 offline_inference/offline_inference_embedding.py
201
+ - python3 offline_inference/offline_inference_scoring.py
202
+ - python3 offline_inference/offline_profile.py --model facebook/opt-125m run_num_steps --num-steps 2
203
203
204
204
- label: Prefix Caching Test # 9min
205
205
mirror_hardwares: [amd]
0 commit comments