Mirror of https://github.com/meta-llama/llama-stack.git (synced 2025-06-29 19:34:19 +00:00)
fix playground for v1 (#799)
# What does this PR do?

- update playground callsites for v1 api changes

## Test Plan

```
cd llama_stack/distribution/ui
streamlit run app.py
```

https://github.com/user-attachments/assets/eace11c6-600a-42dc-b4e7-6948a706509f

## Sources

Please link relevant resources if necessary.

## Before submitting

- [ ] This PR fixes a typo or improves the docs (you can dismiss the other checks if that's the case).
- [ ] Ran pre-commit to handle lint / formatting issues.
- [ ] Read the [contributor guideline](https://github.com/meta-llama/llama-stack/blob/main/CONTRIBUTING.md), Pull Request section?
- [ ] Updated relevant documentation.
- [ ] Wrote necessary unit or integration tests.
Parent: b2ac29b9da
Commit: 9d574f4aee

5 changed files with 35 additions and 25 deletions. The hunks below are all from the RAG playground page (`def rag_chat_page()`):
```diff
@@ -44,14 +44,21 @@ def rag_chat_page():
             ]

+            providers = llama_stack_api.client.providers.list()
+            memory_provider = None
+
+            for x in providers:
+                if x.api == "memory":
+                    memory_provider = x.provider_id
+
             llama_stack_api.client.memory_banks.register(
                 memory_bank_id=memory_bank_name,  # Use the user-provided name
                 params={
                     "memory_bank_type": "vector",
                     "embedding_model": "all-MiniLM-L6-v2",
                     "chunk_size_in_tokens": 512,
                     "overlap_size_in_tokens": 64,
                 },
-                provider_id=providers["memory"][0].provider_id,
+                provider_id=memory_provider,
             )

             # insert documents using the custom bank name
```
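The substantive v1 change in this hunk: `providers.list()` now returns a flat list of provider objects rather than a mapping keyed by API, so `providers["memory"][0]` no longer works and the code scans for the memory provider instead. A minimal sketch of an equivalent lookup, assuming (as the diff suggests) that each entry exposes `api` and `provider_id` attributes:

```python
# Equivalent lookup using next() with a default; purely illustrative.
# Assumes providers.list() yields objects with `api` and `provider_id`.
providers = llama_stack_api.client.providers.list()
memory_provider = next(
    (p.provider_id for p in providers if p.api == "memory"),
    None,  # stays None when no memory provider is configured, as in the loop above
)
```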
```diff
@@ -69,9 +76,6 @@ def rag_chat_page():
         "Select Memory Banks",
         memory_banks,
     )
-    memory_bank_configs = [
-        {"bank_id": bank_id, "type": "vector"} for bank_id in selected_memory_banks
-    ]

     available_models = llama_stack_api.client.models.list()
     available_models = [
```
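This deletion pairs with the next hunk: under v1 the selected bank ids travel as arguments to the `builtin::memory` toolgroup, so the playground no longer needs to build per-request `memory_bank_configs` dicts.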
```diff
@@ -133,14 +137,13 @@ def rag_chat_page():
         sampling_params={
             "strategy": strategy,
         },
-        tools=[
-            {
-                "type": "memory",
-                "memory_bank_configs": memory_bank_configs,
-                "query_generator_config": {"type": "default", "sep": " "},
-                "max_tokens_in_context": 4096,
-                "max_chunks": 10,
-            }
+        toolgroups=[
+            dict(
+                name="builtin::memory",
+                args={
+                    "memory_bank_ids": [bank_id for bank_id in selected_memory_banks],
+                },
+            )
         ],
         tool_choice="auto",
         tool_prompt_format="json",
```
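This is the core v1 agent-API migration: the inline `tools=[{"type": "memory", ...}]` configuration is replaced by attaching the built-in memory toolgroup by name, with bank ids passed as args. A hedged sketch of the new call shape in isolation; the placeholder values and the bare `dict(...)` config are assumptions for illustration, not the playground's exact surrounding code:

```python
# Hypothetical inputs for illustration only.
strategy = {"type": "greedy"}          # assumed v1-style sampling strategy
selected_memory_banks = ["my_docs"]    # bank ids chosen in the UI

agent_config = dict(
    sampling_params={"strategy": strategy},
    # v1: name a toolgroup and pass its arguments, instead of an inline tool dict.
    toolgroups=[
        dict(
            name="builtin::memory",
            args={"memory_bank_ids": list(selected_memory_banks)},
        )
    ],
    tool_choice="auto",
    tool_prompt_format="json",
)
```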
```diff
@@ -179,7 +182,7 @@ def rag_chat_page():
         retrieval_response = ""
         for log in EventLogger().log(response):
             log.print()
-            if log.role == "memory_retrieval":
+            if log.role == "tool_execution":
                 retrieval_response += log.content.replace("====", "").strip()
                 retrieval_message_placeholder.info(retrieval_response)
             else:
```
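The last change tracks a rename in the streamed event roles: memory retrieval output now arrives under `tool_execution` instead of a dedicated `memory_retrieval` role. A minimal sketch of consuming the stream, assuming the `EventLogger` import path from the llama-stack client library and a streaming `response` from the agent turn:

```python
# Minimal sketch; `response` is assumed to be a streaming agent-turn response.
from llama_stack_client.lib.agents.event_logger import EventLogger

retrieval_response = ""
for log in EventLogger().log(response):
    log.print()
    if log.role == "tool_execution":  # was "memory_retrieval" before v1
        # Drop the "====" separators the logger wraps around tool output.
        retrieval_response += log.content.replace("====", "").strip()
```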