mirror of
https://github.com/meta-llama/llama-stack.git
synced 2025-10-04 04:04:14 +00:00
ci: Switch vllm config to qwen3
It performs better in tool calling and structured tests. Signed-off-by: Derek Higgins <derekh@redhat.com>
This commit is contained in:
parent
7d9004f199
commit
666d6a6fc0
3 changed files with 6 additions and 10 deletions
9
.github/actions/setup-vllm/action.yml
vendored
9
.github/actions/setup-vllm/action.yml
vendored
|
@ -11,13 +11,14 @@ runs:
|
||||||
--name vllm \
|
--name vllm \
|
||||||
-p 8000:8000 \
|
-p 8000:8000 \
|
||||||
--privileged=true \
|
--privileged=true \
|
||||||
quay.io/higginsd/vllm-cpu:65393ee064 \
|
quay.io/higginsd/vllm-cpu:65393ee064-qwen3 \
|
||||||
--host 0.0.0.0 \
|
--host 0.0.0.0 \
|
||||||
--port 8000 \
|
--port 8000 \
|
||||||
--enable-auto-tool-choice \
|
--enable-auto-tool-choice \
|
||||||
--tool-call-parser llama3_json \
|
--tool-call-parser hermes \
|
||||||
--model /root/.cache/Llama-3.2-1B-Instruct \
|
--model /root/.cache/Qwen3-0.6B \
|
||||||
--served-model-name meta-llama/Llama-3.2-1B-Instruct
|
--served-model-name Qwen/Qwen3-0.6B \
|
||||||
|
--max-model-len 8192
|
||||||
|
|
||||||
# Wait for vllm to be ready
|
# Wait for vllm to be ready
|
||||||
echo "Waiting for vllm to be ready..."
|
echo "Waiting for vllm to be ready..."
|
||||||
|
|
|
@ -212,11 +212,6 @@ fi
|
||||||
echo "=== Running Integration Tests ==="
|
echo "=== Running Integration Tests ==="
|
||||||
EXCLUDE_TESTS="builtin_tool or safety_with_image or code_interpreter or test_rag"
|
EXCLUDE_TESTS="builtin_tool or safety_with_image or code_interpreter or test_rag"
|
||||||
|
|
||||||
# Additional exclusions for vllm setup
|
|
||||||
if [[ "$TEST_SETUP" == "vllm" ]]; then
|
|
||||||
EXCLUDE_TESTS="${EXCLUDE_TESTS} or test_inference_store_tool_calls"
|
|
||||||
fi
|
|
||||||
|
|
||||||
PYTEST_PATTERN="not( $EXCLUDE_TESTS )"
|
PYTEST_PATTERN="not( $EXCLUDE_TESTS )"
|
||||||
if [[ -n "$TEST_PATTERN" ]]; then
|
if [[ -n "$TEST_PATTERN" ]]; then
|
||||||
PYTEST_PATTERN="${PYTEST_PATTERN} and $TEST_PATTERN"
|
PYTEST_PATTERN="${PYTEST_PATTERN} and $TEST_PATTERN"
|
||||||
|
|
|
@ -78,7 +78,7 @@ SETUP_DEFINITIONS: dict[str, Setup] = {
|
||||||
"VLLM_URL": "http://localhost:8000/v1",
|
"VLLM_URL": "http://localhost:8000/v1",
|
||||||
},
|
},
|
||||||
defaults={
|
defaults={
|
||||||
"text_model": "vllm/meta-llama/Llama-3.2-1B-Instruct",
|
"text_model": "vllm/Qwen/Qwen3-0.6B",
|
||||||
"embedding_model": "sentence-transformers/all-MiniLM-L6-v2",
|
"embedding_model": "sentence-transformers/all-MiniLM-L6-v2",
|
||||||
},
|
},
|
||||||
),
|
),
|
||||||
|
|
Loading…
Add table
Add a link
Reference in a new issue