From 589a6911ba4bacc4b53980dba403e7875e5f57b4 Mon Sep 17 00:00:00 2001
From: Hardik Shah <hjshah@meta.com>
Date: Fri, 31 Jan 2025 15:29:29 -0800
Subject: [PATCH] fix rag tests (#918)

make more deterministic
---
 tests/client-sdk/agents/test_agents.py | 11 +++++++----
 1 file changed, 7 insertions(+), 4 deletions(-)

diff --git a/tests/client-sdk/agents/test_agents.py b/tests/client-sdk/agents/test_agents.py
index e0f86e3d7..b7f1c5b08 100644
--- a/tests/client-sdk/agents/test_agents.py
+++ b/tests/client-sdk/agents/test_agents.py
@@ -276,7 +276,7 @@ def test_rag_agent(llama_stack_client, agent_config):
         )
         for i, url in enumerate(urls)
     ]
-    vector_db_id = "test-vector-db"
+    vector_db_id = f"test-vector-db-{uuid4()}"
     llama_stack_client.vector_dbs.register(
         vector_db_id=vector_db_id,
         embedding_model="all-MiniLM-L6-v2",
@@ -286,7 +286,7 @@ def test_rag_agent(llama_stack_client, agent_config):
         documents=documents,
         vector_db_id=vector_db_id,
         # small chunks help to get specific info out of the docs
-        chunk_size_in_tokens=128,
+        chunk_size_in_tokens=256,
     )
     agent_config = {
         **agent_config,
@@ -304,9 +304,12 @@ def test_rag_agent(llama_stack_client, agent_config):
     user_prompts = [
         (
             "Instead of the standard multi-head attention, what attention type does Llama3-8B use?",
-            "grouped-query",
+            "grouped",
+        ),
+        (
+            "What `tune` command to use for getting access to Llama3-8B-Instruct ?",
+            "download",
         ),
-        ("What command to use to get access to Llama3-8B-Instruct ?", "tune download"),
     ]
     for prompt, expected_kw in user_prompts:
         print(f"User> {prompt}")