Skip to content
This repository was archived by the owner on Jun 5, 2025. It is now read-only.

Commit bb1708f

Browse files
committed
Use Qwen/Qwen2.5-Coder-1.5B-Instruct for vllm
Signed-off-by: Radoslav Dimitrov <radoslav@stacklok.com>
1 parent 27cf9e3 commit bb1708f

File tree

2 files changed

+7 -7 lines changed

2 files changed

+7 -7 lines changed

.github/workflows/integration-tests.yml

Lines changed: 4 additions & 4 deletions
Original file line number | Diff line number | Diff line change
@@ -223,15 +223,15 @@ jobs:
223223
224224
- name: Build and run the vllm container (vllm-only)
225225
if: ${{ matrix.test-provider == 'vllm' }} # This is only needed for VLLM
226-
timeout-minutes: 10
226+
timeout-minutes: 15
227227
run: |
228228
# We clone the VLLM repo and build the container because the CPU-mode container is not published
229229
git clone https://github.com/vllm-project/vllm.git
230230
cd vllm
231231
docker build -f Dockerfile.cpu -t vllm-cpu-env --shm-size=4g .
232232
docker run -d --name vllm \
233233
--network="host" \
234-
vllm-cpu-env --model Qwen/Qwen2.5-Coder-0.5B-Instruct
234+
vllm-cpu-env --model Qwen/Qwen2.5-Coder-1.5B-Instruct
235235
236236
echo -e "\nVerify the vllm container is serving\n"
237237
docker ps -f name=vllm
@@ -245,7 +245,7 @@ jobs:
245245
246246
echo -e "\nVerify the completions endpoint works\n"
247247
curl http://localhost:8000/v1/completions -H "Content-Type: application/json" -d '{
248-
"model": "Qwen/Qwen2.5-Coder-0.5B-Instruct",
248+
"model": "Qwen/Qwen2.5-Coder-1.5B-Instruct",
249249
"prompt": ["How to make pizza"],
250250
"max_tokens": 100,
251251
"temperature": 0
@@ -255,7 +255,7 @@ jobs:
255255
curl -X POST http://localhost:8000/v1/chat/completions \
256256
-H "Content-Type: application/json" \
257257
-d '{
258-
"model": "Qwen/Qwen2.5-Coder-0.5B-Instruct",
258+
"model": "Qwen/Qwen2.5-Coder-1.5B-Instruct",
259259
"messages": [
260260
{"role": "system", "content": "You are a coding assistant."},
261261
{"role": "user", "content": "Hello"}

tests/integration/vllm/testcases.yaml

Lines changed: 3 additions & 3 deletions
Original file line number | Diff line number | Diff line change
@@ -20,7 +20,7 @@ testcases:
2020
"role":"user"
2121
}
2222
],
23-
"model":"Qwen/Qwen2.5-Coder-0.5B-Instruct",
23+
"model":"Qwen/Qwen2.5-Coder-1.5B-Instruct",
2424
"stream":true,
2525
"temperature":0
2626
}
@@ -33,7 +33,7 @@ testcases:
3333
url: http://127.0.0.1:8989/vllm/completions
3434
data: |
3535
{
36-
"model": "Qwen/Qwen2.5-Coder-0.5B-Instruct",
36+
"model": "Qwen/Qwen2.5-Coder-1.5B-Instruct",
3737
"max_tokens": 4096,
3838
"temperature": 0,
3939
"stream": true,
@@ -80,7 +80,7 @@ testcases:
8080
"role":"user"
8181
}
8282
],
83-
"model":"Qwen/Qwen2.5-Coder-0.5B-Instruct",
83+
"model":"Qwen/Qwen2.5-Coder-1.5B-Instruct",
8484
"stream":true,
8585
"temperature":0
8686
}

0 commit comments

Comments
 (0)