This repository was archived by the owner on Jun 5, 2025. It is now read-only.
File tree Expand file tree Collapse file tree 2 files changed +5
-5
lines changed Expand file tree Collapse file tree 2 files changed +5
-5
lines changed Original file line number Diff line number Diff line change @@ -189,7 +189,7 @@ jobs:
189
189
docker build -f Dockerfile.cpu -t vllm-cpu-env --shm-size=4g .
190
190
docker run -d --name vllm \
191
191
--network="host" \
192
- vllm-cpu-env --model Qwen/Qwen2.5-Coder-0.5B
192
+ vllm-cpu-env --model Qwen/Qwen2.5-Coder-0.5B-Instruct
193
193
194
194
- name: Verify the vllm container is running
195
195
run: |
@@ -205,7 +205,7 @@ jobs:
205
205
206
206
echo -e "\nVerify the completions endpoint works\n"
207
207
curl http://localhost:8000/v1/completions -H "Content-Type: application/json" -d '{
208
- "model": "Qwen/Qwen2.5-Coder-0.5B",
208
+ "model": "Qwen/Qwen2.5-Coder-0.5B-Instruct",
209
209
"prompt": ["How to make pizza"],
210
210
"max_tokens": 100,
211
211
"temperature": 0
@@ -215,7 +215,7 @@ jobs:
215
215
curl -X POST http://localhost:8000/v1/chat/completions \
216
216
-H "Content-Type: application/json" \
217
217
-d '{
218
- "model": "Qwen/Qwen2.5-Coder-0.5B",
218
+ "model": "Qwen/Qwen2.5-Coder-0.5B-Instruct",
219
219
"messages": [
220
220
{"role": "system", "content": "You are a coding assistant."},
221
221
{"role": "user", "content": "Hello"}
Original file line number Diff line number Diff line change @@ -161,7 +161,7 @@ testcases:
161
161
"role":"user"
162
162
}
163
163
],
164
- "model":"Qwen/Qwen2.5-Coder-0.5B",
164
+ "model":"Qwen/Qwen2.5-Coder-0.5B-Instruct",
165
165
"stream":true,
166
166
"temperature":0
167
167
}
@@ -174,7 +174,7 @@ testcases:
174
174
url: http://127.0.0.1:8989/vllm/completions
175
175
data: |
176
176
{
177
- "model": "Qwen/Qwen2.5-Coder-0.5B",
177
+ "model": "Qwen/Qwen2.5-Coder-0.5B-Instruct ",
178
178
"max_tokens": 4096,
179
179
"temperature": 0,
180
180
"stream": true,
You can’t perform that action at this time.
0 commit comments