@@ -187,19 +187,19 @@ steps:
187
187
- examples/
188
188
commands:
189
189
- pip install tensorizer # for tensorizer test
190
- - python3 offline_inference/offline_inference.py
190
+ - python3 offline_inference/basic.py
191
191
- python3 offline_inference/cpu_offload.py
192
- - python3 offline_inference/offline_inference_chat.py
193
- - python3 offline_inference/offline_inference_with_prefix.py
192
+ - python3 offline_inference/chat.py
193
+ - python3 offline_inference/prefix_caching.py
194
194
- python3 offline_inference/llm_engine_example.py
195
- - python3 offline_inference/offline_inference_vision_language.py
196
- - python3 offline_inference/offline_inference_vision_language_multi_image.py
195
+ - python3 offline_inference/vision_language.py
196
+ - python3 offline_inference/vision_language_multi_image.py
197
197
- python3 other/tensorize_vllm_model.py --model facebook/opt-125m serialize --serialized-directory /tmp/ --suffix v1 && python3 other/tensorize_vllm_model.py --model facebook/opt-125m deserialize --path-to-tensors /tmp/vllm/facebook/opt-125m/v1/model.tensors
198
- - python3 offline_inference/offline_inference_encoder_decoder.py
199
- - python3 offline_inference/offline_inference_classification.py
200
- - python3 offline_inference/offline_inference_embedding.py
201
- - python3 offline_inference/offline_inference_scoring.py
202
- - python3 offline_inference/offline_profile.py --model facebook/opt-125m run_num_steps --num-steps 2
198
+ - python3 offline_inference/encoder_decoder.py
199
+ - python3 offline_inference/classification.py
200
+ - python3 offline_inference/embedding.py
201
+ - python3 offline_inference/scoring.py
202
+ - python3 offline_inference/profiling.py --model facebook/opt-125m run_num_steps --num-steps 2
203
203
204
204
- label: Prefix Caching Test # 9min
205
205
mirror_hardwares: [amd]
0 commit comments