feat: Enable ingestion of precomputed embeddings (#2317)

2025-07-09 23:25:58 +00:00 · 2025-05-31 04:03:37 -06:00 · 2025-05-31 04:03:37 -06:00 · 2818e444f2
commit 2818e444f2
parent dfdf854865
9 changed files with 366 additions and 15 deletions
--- a/llama_stack/providers/inline/tool_runtime/rag/memory.py
+++ b/llama_stack/providers/inline/tool_runtime/rag/memory.py
@@ -146,7 +146,7 @@ class MemoryToolRuntimeImpl(ToolGroupsProtocolPrivate, ToolRuntime, RAGToolRunti
        ]
        for i, chunk in enumerate(chunks):
            metadata = chunk.metadata
-            tokens += metadata["token_count"]
+            tokens += metadata.get("token_count", 0)
            tokens += metadata.get("metadata_token_count", 0)

            if tokens > query_config.max_tokens_in_context: