mirror of
https://github.com/meta-llama/llama-stack.git
synced 2025-10-04 12:07:34 +00:00
test: improve test reliability and model compatibility
- Update earth question to be more specific with multiple choice format to prevent Llama-3.2-1B-Instruct from rambling about other planets - Skip test_text_chat_completion_structured_output as it sometimes times out during CI execution again with Llama-3.2-1B-Instruct on vllm Signed-off-by: Derek Higgins <derekh@redhat.com>
This commit is contained in:
parent
2f58d87c22
commit
8951765584
4 changed files with 5 additions and 5 deletions
|
@ -214,7 +214,7 @@ EXCLUDE_TESTS="builtin_tool or safety_with_image or code_interpreter or test_rag
|
||||||
|
|
||||||
# Additional exclusions for vllm setup
|
# Additional exclusions for vllm setup
|
||||||
if [[ "$TEST_SETUP" == "vllm" ]]; then
|
if [[ "$TEST_SETUP" == "vllm" ]]; then
|
||||||
EXCLUDE_TESTS="${EXCLUDE_TESTS} or test_inference_store_tool_calls"
|
EXCLUDE_TESTS="${EXCLUDE_TESTS} or test_inference_store_tool_calls or test_text_chat_completion_structured_output"
|
||||||
fi
|
fi
|
||||||
|
|
||||||
PYTEST_PATTERN="not( $EXCLUDE_TESTS )"
|
PYTEST_PATTERN="not( $EXCLUDE_TESTS )"
|
||||||
|
|
|
@ -29,7 +29,7 @@ class ResponsesTestCase(BaseModel):
|
||||||
basic_test_cases = [
|
basic_test_cases = [
|
||||||
pytest.param(
|
pytest.param(
|
||||||
ResponsesTestCase(
|
ResponsesTestCase(
|
||||||
input="Which planet do humans live on?",
|
input="Humans live on which planet: Mars, Venus, or Earth?",
|
||||||
expected="earth",
|
expected="earth",
|
||||||
),
|
),
|
||||||
id="earth",
|
id="earth",
|
||||||
|
@ -76,7 +76,7 @@ multi_turn_test_cases = [
|
||||||
input="", # Not used for multi-turn
|
input="", # Not used for multi-turn
|
||||||
expected="", # Not used for multi-turn
|
expected="", # Not used for multi-turn
|
||||||
turns=[
|
turns=[
|
||||||
("Which planet do humans live on?", "earth"),
|
("Humans live on which planet: Mars, Venus, or Earth?", "earth"),
|
||||||
("What is the name of the planet from your previous response?", "earth"),
|
("What is the name of the planet from your previous response?", "earth"),
|
||||||
],
|
],
|
||||||
),
|
),
|
||||||
|
|
|
@ -1,7 +1,7 @@
|
||||||
{
|
{
|
||||||
"non_streaming_01": {
|
"non_streaming_01": {
|
||||||
"data": {
|
"data": {
|
||||||
"question": "Which planet do humans live on?",
|
"question": "Humans live on which planet: Mars, Venus, or Earth?",
|
||||||
"expected": "Earth"
|
"expected": "Earth"
|
||||||
}
|
}
|
||||||
},
|
},
|
||||||
|
|
|
@ -1,7 +1,7 @@
|
||||||
{
|
{
|
||||||
"non_streaming_01": {
|
"non_streaming_01": {
|
||||||
"data": {
|
"data": {
|
||||||
"question": "Which planet do humans live on?",
|
"question": "Humans live on which planet: Mars, Venus, or Earth?",
|
||||||
"expected": "Earth"
|
"expected": "Earth"
|
||||||
}
|
}
|
||||||
},
|
},
|
||||||
|
|
Loading…
Add table
Add a link
Reference in a new issue