mirror of
https://github.com/meta-llama/llama-stack.git
synced 2025-10-04 12:07:34 +00:00
389 KiB
389 KiB
Uninstalled 3 packages in 114ms
Installed 3 packages in 165ms
INFO 2025-09-10 14:47:19,351 llama_stack.core.utils.config_resolution:52 core: Using distribution:
/Users/kaiwu/work/kaiwu/llama-stack/llama_stack/distributions/starter/run.yaml
INFO 2025-09-10 14:47:19,353 llama_stack.cli.stack.run:129 cli: Using run configuration:
/Users/kaiwu/work/kaiwu/llama-stack/llama_stack/distributions/starter/run.yaml
Using virtual environment: /Users/kaiwu/work/kaiwu/llama-stack/.venv
Virtual environment already activated
+ '[' -n /Users/kaiwu/work/kaiwu/llama-stack/llama_stack/distributions/starter/run.yaml ']'
+ yaml_config_arg=/Users/kaiwu/work/kaiwu/llama-stack/llama_stack/distributions/starter/run.yaml
+ python -m llama_stack.core.server.server /Users/kaiwu/work/kaiwu/llama-stack/llama_stack/distributions/starter/run.yaml --port 8321
INFO 2025-09-10 14:47:23,918 llama_stack.core.utils.config_resolution:45 core: Using file path:
/Users/kaiwu/work/kaiwu/llama-stack/llama_stack/distributions/starter/run.yaml
INFO 2025-09-10 14:47:23,929 __main__:615 core::server: Run configuration:
INFO 2025-09-10 14:47:23,933 __main__:618 core::server: apis:
- agents
- batches
- datasetio
- eval
- files
- inference
- post_training
- safety
- scoring
- telemetry
- tool_runtime
- vector_io
benchmarks: []
datasets: []
image_name: starter
inference_store:
db_path: /Users/kaiwu/.llama/distributions/starter/inference_store.db
type: sqlite
metadata_store:
db_path: /Users/kaiwu/.llama/distributions/starter/registry.db
type: sqlite
models: []
providers:
agents:
- config:
persistence_store:
db_path: /Users/kaiwu/.llama/distributions/starter/agents_store.db
type: sqlite
responses_store:
db_path: /Users/kaiwu/.llama/distributions/starter/responses_store.db
type: sqlite
provider_id: meta-reference
provider_type: inline::meta-reference
batches:
- config:
kvstore:
db_path: /Users/kaiwu/.llama/distributions/starter/batches.db
type: sqlite
provider_id: reference
provider_type: inline::reference
datasetio:
- config:
kvstore:
db_path: /Users/kaiwu/.llama/distributions/starter/huggingface_datasetio.db
type: sqlite
provider_id: huggingface
provider_type: remote::huggingface
- config:
kvstore:
db_path: /Users/kaiwu/.llama/distributions/starter/localfs_datasetio.db
type: sqlite
provider_id: localfs
provider_type: inline::localfs
eval:
- config:
kvstore:
db_path: /Users/kaiwu/.llama/distributions/starter/meta_reference_eval.db
type: sqlite
provider_id: meta-reference
provider_type: inline::meta-reference
files:
- config:
metadata_store:
db_path: /Users/kaiwu/.llama/distributions/starter/files_metadata.db
type: sqlite
storage_dir: /Users/kaiwu/.llama/distributions/starter/files
provider_id: meta-reference-files
provider_type: inline::localfs
inference:
- config:
api_key: '********'
url: https://api.fireworks.ai/inference/v1
provider_id: fireworks
provider_type: remote::fireworks
- config:
api_key: '********'
url: https://api.together.xyz/v1
provider_id: together
provider_type: remote::together
- config: {}
provider_id: bedrock
provider_type: remote::bedrock
- config:
api_key: '********'
base_url: https://api.openai.com/v1
provider_id: openai
provider_type: remote::openai
- config:
api_key: '********'
provider_id: anthropic
provider_type: remote::anthropic
- config:
api_key: '********'
provider_id: gemini
provider_type: remote::gemini
- config:
api_key: '********'
url: https://api.groq.com
provider_id: groq
provider_type: remote::groq
- config:
api_key: '********'
url: https://api.sambanova.ai/v1
provider_id: sambanova
provider_type: remote::sambanova
- config: {}
provider_id: sentence-transformers
provider_type: inline::sentence-transformers
post_training:
- config:
checkpoint_format: meta
provider_id: torchtune-cpu
provider_type: inline::torchtune-cpu
safety:
- config:
excluded_categories: []
provider_id: llama-guard
provider_type: inline::llama-guard
- config: {}
provider_id: code-scanner
provider_type: inline::code-scanner
scoring:
- config: {}
provider_id: basic
provider_type: inline::basic
- config: {}
provider_id: llm-as-judge
provider_type: inline::llm-as-judge
- config:
openai_api_key: '********'
provider_id: braintrust
provider_type: inline::braintrust
telemetry:
- config:
service_name: "\u200B"
sinks: console,sqlite
sqlite_db_path: /Users/kaiwu/.llama/distributions/starter/trace_store.db
provider_id: meta-reference
provider_type: inline::meta-reference
tool_runtime:
- config:
api_key: '********'
max_results: 3
provider_id: brave-search
provider_type: remote::brave-search
- config:
api_key: '********'
max_results: 3
provider_id: tavily-search
provider_type: remote::tavily-search
- config: {}
provider_id: rag-runtime
provider_type: inline::rag-runtime
- config: {}
provider_id: model-context-protocol
provider_type: remote::model-context-protocol
vector_io:
- config:
kvstore:
db_path: /Users/kaiwu/.llama/distributions/starter/faiss_store.db
type: sqlite
provider_id: faiss
provider_type: inline::faiss
- config:
db_path: /Users/kaiwu/.llama/distributions/starter/sqlite_vec.db
kvstore:
db_path: /Users/kaiwu/.llama/distributions/starter/sqlite_vec_registry.db
type: sqlite
provider_id: sqlite-vec
provider_type: inline::sqlite-vec
scoring_fns: []
server:
port: 8321
shields: []
tool_groups:
- provider_id: tavily-search
toolgroup_id: builtin::websearch
- provider_id: rag-runtime
toolgroup_id: builtin::rag
vector_dbs: []
version: 2
INFO 2025-09-10 14:47:34,785 llama_stack.core.stack:388 core: starting registry refresh task
INFO 2025-09-10 14:47:34,946 __main__:580 core::server: Listening on ['::', '0.0.0.0']:8321
INFO 2025-09-10 14:47:35,196 uvicorn.error:84 uncategorized: Started server process [26795]
INFO 2025-09-10 14:47:35,197 uvicorn.error:48 uncategorized: Waiting for application startup.
INFO 2025-09-10 14:47:35,198 __main__:168 core::server: Starting up
INFO 2025-09-10 14:47:35,199 uvicorn.error:62 uncategorized: Application startup complete.
INFO 2025-09-10 14:47:35,199 uvicorn.error:216 uncategorized: Uvicorn running on http://['::', '0.0.0.0']:8321 (Press CTRL+C to quit)
INFO 2025-09-10 14:47:36,852 uvicorn.access:473 uncategorized: 127.0.0.1:55733 - "GET /v1/health HTTP/1.1" 200
INFO 2025-09-10 14:47:36,854 console_span_processor:28 telemetry: 21:47:36.854 [START] /v1/health
INFO 2025-09-10 14:47:36,862 console_span_processor:39 telemetry: 21:47:36.855 [END] /v1/health [StatusCode.OK] (1.07ms)
INFO 2025-09-10 14:47:36,865 console_span_processor:48 telemetry: raw_path: /v1/health
INFO 2025-09-10 14:47:36,866 console_span_processor:62 telemetry: 21:47:36.853 [INFO] 127.0.0.1:55733 - "GET /v1/health HTTP/1.1" 200
INFO 2025-09-10 14:48:28,324 uvicorn.access:473 uncategorized: 127.0.0.1:56006 - "GET /v1/models HTTP/1.1" 200
INFO 2025-09-10 14:48:28,333 console_span_processor:28 telemetry: 21:48:28.332 [START] /v1/models
INFO 2025-09-10 14:48:28,392 console_span_processor:39 telemetry: 21:48:28.334 [END] ModelsRoutingTable.list_models [StatusCode.OK] (0.19ms)
INFO 2025-09-10 14:48:28,410 console_span_processor:48 telemetry: output: {'data': [{'identifier': 'llama_api/Llama-3.3-70B-Instruct',
'provider_resource_id': 'Llama-3.3-70B-Instruct', 'provider_id': 'llama_api', 'type': 'model', 'metadata': {}, 'model_type': 'llm'},
{'identifier': 'llama_api/Llama-4-Maverick-17B-128E-Instruct-FP8', 'provider_resource_id': 'Llama-4-Maverick-17B-128E-Instruct-FP8',
'provider_id': 'llama_api', 'type': 'model', 'metadata': {}, 'model_type': 'llm'}, {'identifier':
'llama_api/Llama-4-Scout-17B-16E-Instruct-FP8', 'provider_resource_id': 'Llama-4-Scout-17B-16E-Instruct-FP8', 'provider_id': 'llama_api',
'type': 'model', 'metadata': {}, 'model_type': 'llm'}, {'identifier': 'meta-llama/Llama-3.3-70B-Instruct', 'provider_resource_id':
'Llama-3.3-70B-Instruct', 'provider_id': 'meta-llama', 'type': 'model', 'metadata': {}, 'model_type': 'llm'}, {'identifier':
'meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8', 'provider_resource_id': 'Llama-4-Maverick-17B-128E-Instruct-FP8', 'provider_id':
'meta-llama', 'type': 'model', 'metadata': {...
INFO 2025-09-10 14:48:28,426 uvicorn.access:473 uncategorized: 127.0.0.1:56006 - "GET /v1/shields HTTP/1.1" 200
INFO 2025-09-10 14:48:28,465 console_span_processor:39 telemetry: 21:48:28.430 [END] /v1/models [StatusCode.OK] (97.81ms)
INFO 2025-09-10 14:48:28,466 console_span_processor:48 telemetry: raw_path: /v1/models
INFO 2025-09-10 14:48:28,466 console_span_processor:62 telemetry: 21:48:28.330 [INFO] 127.0.0.1:56006 - "GET /v1/models HTTP/1.1" 200
INFO 2025-09-10 14:48:28,468 console_span_processor:28 telemetry: 21:48:28.468 [START] /v1/shields
INFO 2025-09-10 14:48:28,523 console_span_processor:39 telemetry: 21:48:28.469 [END] ShieldsRoutingTable.list_shields [StatusCode.OK] (0.24ms)
INFO 2025-09-10 14:48:28,524 console_span_processor:48 telemetry: output: {'data': []}
INFO 2025-09-10 14:48:28,535 console_span_processor:39 telemetry: 21:48:28.527 [END] /v1/shields [StatusCode.OK] (59.54ms)
INFO 2025-09-10 14:48:28,536 console_span_processor:48 telemetry: raw_path: /v1/shields
INFO 2025-09-10 14:48:28,536 console_span_processor:62 telemetry: 21:48:28.427 [INFO] 127.0.0.1:56006 - "GET /v1/shields HTTP/1.1" 200
INFO 2025-09-10 14:48:32,432 console_span_processor:28 telemetry: 21:48:32.432 [START] /v1/openai/v1/files
WARNING 2025-09-10 14:48:32,437 __main__:220 core::server: Could not read or log request body for POST /v1/openai/v1/files: Stream consumed
INFO 2025-09-10 14:48:32,495 uvicorn.access:473 uncategorized: 127.0.0.1:56006 - "POST /v1/openai/v1/files HTTP/1.1" 200
WARNING 2025-09-10 14:48:32,502 __main__:220 core::server: Could not read or log request body for POST /v1/openai/v1/files: Stream consumed
INFO 2025-09-10 14:48:32,514 console_span_processor:39 telemetry: 21:48:32.496 [END] LocalfsFilesImpl.openai_upload_file [StatusCode.OK] (55.21ms)
INFO 2025-09-10 14:48:32,515 console_span_processor:48 telemetry: output: {'object': 'file', 'id': 'file-489db9aae0424745960e3408ff0f477f',
'bytes': 41, 'created_at': 1757540912, 'expires_at': 1789076912, 'filename': 'shipping_policy.txt', 'purpose': 'assistants'}
INFO 2025-09-10 14:48:32,523 uvicorn.access:473 uncategorized: 127.0.0.1:56006 - "POST /v1/openai/v1/files HTTP/1.1" 200
INFO 2025-09-10 14:48:32,526 console_span_processor:39 telemetry: 21:48:32.516 [END] /v1/openai/v1/files [StatusCode.OK] (84.71ms)
INFO 2025-09-10 14:48:32,528 console_span_processor:48 telemetry: raw_path: /v1/openai/v1/files
INFO 2025-09-10 14:48:32,529 console_span_processor:62 telemetry: 21:48:32.440 [WARN] Could not read or log request body for POST
/v1/openai/v1/files: Stream consumed
INFO 2025-09-10 14:48:32,529 console_span_processor:62 telemetry: 21:48:32.496 [INFO] 127.0.0.1:56006 - "POST /v1/openai/v1/files HTTP/1.1" 200
WARNING 2025-09-10 14:48:32,531 __main__:220 core::server: Could not read or log request body for POST /v1/openai/v1/files: Stream consumed
INFO 2025-09-10 14:48:32,532 console_span_processor:28 telemetry: 21:48:32.532 [START] /v1/openai/v1/files
INFO 2025-09-10 14:48:32,540 console_span_processor:39 telemetry: 21:48:32.533 [END] LocalfsFilesImpl.openai_upload_file [StatusCode.OK] (0.16ms)
INFO 2025-09-10 14:48:32,545 console_span_processor:48 telemetry: output: {'object': 'file', 'id': 'file-b2f38b0e164347f5a2b6bbe211e33ff3',
'bytes': 48, 'created_at': 1757540912, 'expires_at': 1789076912, 'filename': 'returns_policy.txt', 'purpose': 'assistants'}
INFO 2025-09-10 14:48:32,546 uvicorn.access:473 uncategorized: 127.0.0.1:56006 - "POST /v1/openai/v1/files HTTP/1.1" 200
INFO 2025-09-10 14:48:32,557 console_span_processor:39 telemetry: 21:48:32.547 [END] /v1/openai/v1/files [StatusCode.OK] (15.42ms)
INFO 2025-09-10 14:48:32,560 console_span_processor:48 telemetry: raw_path: /v1/openai/v1/files
INFO 2025-09-10 14:48:32,562 console_span_processor:62 telemetry: 21:48:32.502 [WARN] Could not read or log request body for POST
/v1/openai/v1/files: Stream consumed
INFO 2025-09-10 14:48:32,562 console_span_processor:62 telemetry: 21:48:32.526 [INFO] 127.0.0.1:56006 - "POST /v1/openai/v1/files HTTP/1.1" 200
INFO 2025-09-10 14:48:32,563 console_span_processor:28 telemetry: 21:48:32.563 [START] /v1/openai/v1/files
INFO 2025-09-10 14:48:32,581 console_span_processor:39 telemetry: 21:48:32.565 [END] LocalfsFilesImpl.openai_upload_file [StatusCode.OK] (0.19ms)
INFO 2025-09-10 14:48:32,582 console_span_processor:48 telemetry: output: {'object': 'file', 'id': 'file-6f6f157d165a4078b4abef66a095ccd6',
'bytes': 45, 'created_at': 1757540912, 'expires_at': 1789076912, 'filename': 'support.txt', 'purpose': 'assistants'}
INFO 2025-09-10 14:48:32,592 console_span_processor:39 telemetry: 21:48:32.584 [END] /v1/openai/v1/files [StatusCode.OK] (20.86ms)
INFO 2025-09-10 14:48:32,592 console_span_processor:48 telemetry: raw_path: /v1/openai/v1/files
INFO 2025-09-10 14:48:32,593 console_span_processor:62 telemetry: 21:48:32.531 [WARN] Could not read or log request body for POST
/v1/openai/v1/files: Stream consumed
INFO 2025-09-10 14:48:32,594 console_span_processor:62 telemetry: 21:48:32.546 [INFO] 127.0.0.1:56006 - "POST /v1/openai/v1/files HTTP/1.1" 200
INFO 2025-09-10 14:48:32,595 console_span_processor:28 telemetry: 21:48:32.595 [START] /v1/openai/v1/vector_stores
INFO 2025-09-10 14:48:32,601 console_span_processor:39 telemetry: 21:48:32.596 [END] FaissVectorIOAdapter.register_vector_db [StatusCode.OK]
(0.15ms)
INFO 2025-09-10 14:48:32,602 console_span_processor:48 telemetry: output:
INFO 2025-09-10 14:48:32,621 console_span_processor:39 telemetry: 21:48:32.604 [END] VectorDBsRoutingTable.register_vector_db [StatusCode.OK]
(8.25ms)
INFO 2025-09-10 14:48:32,622 console_span_processor:48 telemetry: output: {'identifier': 'vs_dab05212-db05-402c-91ef-57e41797406b',
'provider_resource_id': 'vs_dab05212-db05-402c-91ef-57e41797406b', 'provider_id': 'faiss', 'type': 'vector_db', 'owner': None, 'source':
'via_register_api', 'embedding_model': 'sentence-transformers/all-MiniLM-L6-v2', 'embedding_dimension': 384, 'vector_db_name': 'acme_docs'}
INFO 2025-09-10 14:48:32,631 console_span_processor:39 telemetry: 21:48:32.629 [END] FaissVectorIOAdapter.register_vector_db [StatusCode.OK]
(5.84ms)
INFO 2025-09-10 14:48:32,632 console_span_processor:48 telemetry: output:
INFO 2025-09-10 14:48:32,650 console_span_processor:39 telemetry: 21:48:32.640 [END] LocalfsFilesImpl.openai_retrieve_file [StatusCode.OK]
(2.11ms)
INFO 2025-09-10 14:48:32,655 llama_stack.providers.utils.inference.embedding_mixin:103 providers::utils: Loading sentence transformer for
all-MiniLM-L6-v2...
INFO 2025-09-10 14:48:32,660 console_span_processor:39 telemetry: 21:48:32.651 [END] LocalfsFilesImpl.openai_retrieve_file_content [StatusCode.OK]
(0.22ms)
INFO 2025-09-10 14:48:32,662 console_span_processor:39 telemetry: 21:48:32.661 [END] LocalfsFilesImpl.openai_retrieve_file_content [StatusCode.OK]
(0.23ms)
INFO 2025-09-10 14:48:32,670 console_span_processor:39 telemetry: 21:48:32.664 [END] LocalfsFilesImpl.openai_retrieve_file_content [StatusCode.OK]
(0.20ms)
INFO 2025-09-10 14:48:32,674 console_span_processor:39 telemetry: 21:48:32.672 [END] ModelsRoutingTable.get_model [StatusCode.OK] (0.77ms)
INFO 2025-09-10 14:48:32,675 console_span_processor:48 telemetry: output: {'identifier': 'sentence-transformers/all-MiniLM-L6-v2',
'provider_resource_id': 'all-MiniLM-L6-v2', 'provider_id': 'sentence-transformers', 'type': 'model', 'owner': None, 'source':
'listed_from_provider', 'metadata': {'embedding_dimension': 384}, 'model_type': 'embedding'}
INFO 2025-09-10 14:48:32,681 console_span_processor:39 telemetry: 21:48:32.677 [END] ModelsRoutingTable.get_provider_impl [StatusCode.OK] (0.36ms)
INFO 2025-09-10 14:48:32,682 console_span_processor:48 telemetry: output:
<llama_stack.providers.inline.inference.sentence_transformers.sentence_transformers.SentenceTransformersInferenceImpl object at 0x158e83350>
INFO 2025-09-10 14:48:32,690 console_span_processor:39 telemetry: 21:48:32.683 [END] ModelsRoutingTable.get_model [StatusCode.OK] (0.23ms)
INFO 2025-09-10 14:48:32,690 console_span_processor:48 telemetry: output: {'identifier': 'sentence-transformers/all-MiniLM-L6-v2',
'provider_resource_id': 'all-MiniLM-L6-v2', 'provider_id': 'sentence-transformers', 'type': 'model', 'owner': None, 'source':
'listed_from_provider', 'metadata': {'embedding_dimension': 384}, 'model_type': 'embedding'}
WARNING 2025-09-10 14:48:59,202 torchao.kernel.intmm:23 uncategorized: Warning: Detected no triton, on systems without Triton certain kernels will
not work
W0910 14:48:59.847000 26795 torch/distributed/elastic/multiprocessing/redirects.py:29] NOTE: Redirects are currently not supported in Windows or MacOs.
INFO 2025-09-10 14:49:05,098 sentence_transformers.SentenceTransformer:219 uncategorized: Use pytorch device_name: mps
INFO 2025-09-10 14:49:05,099 sentence_transformers.SentenceTransformer:227 uncategorized: Load pretrained SentenceTransformer: all-MiniLM-L6-v2
INFO 2025-09-10 14:49:09,461 console_span_processor:39 telemetry: 21:49:09.453 [END] InferenceRouter.openai_embeddings [StatusCode.OK]
(36781.46ms)
INFO 2025-09-10 14:49:09,462 console_span_processor:48 telemetry: output: {'object': 'list', 'data': [{'object': 'embedding', 'embedding':
[-0.012346820905804634, -0.04591671749949455, 0.00545357633382082, 0.0767817348241806, -0.01030217856168747, -0.07128783315420151,
-0.047789815813302994, -0.0042580426670610905, -0.08333089202642441, 0.03493816778063774, 0.03678377717733383, -0.022125769406557083,
-0.001785362372174859, 0.03860057145357132, 0.017692940309643745, -0.011320478282868862, 0.020480643957853317, -0.14444826543331146,
-0.03509785607457161, -0.08347956091165543, 0.01723267324268818, -0.020868107676506042, -0.04816542565822601, -0.04063615947961807,
-0.02612607553601265, -0.06816241890192032, -0.021907860413193703, -0.05328420177102089, 0.0035953382030129433, -0.060775868594646454,
-0.07895789295434952, 0.08725343644618988, -0.004096562508493662, 0.07713106274604797, 0.04764929413795471, 0.03390089422464371,
-0.03415430337190628, -0.10541579872369766, 0.0700988844037056, -0.03148755803704262, 0.07130879163742065, -0.0025789395440369844, 0.00581...
INFO 2025-09-10 14:49:09,463 console_span_processor:62 telemetry: 21:48:32.656 [INFO] Loading sentence transformer for all-MiniLM-L6-v2...
INFO 2025-09-10 14:49:09,464 console_span_processor:62 telemetry: 21:48:59.203 [WARN] Warning: Detected no triton, on systems without Triton
certain kernels will not work
INFO 2025-09-10 14:49:09,464 console_span_processor:62 telemetry: 21:49:05.099 [INFO] Use pytorch device_name: mps
INFO 2025-09-10 14:49:09,465 console_span_processor:62 telemetry: 21:49:05.100 [INFO] Load pretrained SentenceTransformer: all-MiniLM-L6-v2
INFO 2025-09-10 14:49:09,469 console_span_processor:39 telemetry: 21:49:09.468 [END] FaissVectorIOAdapter.insert_chunks [StatusCode.OK]
(36796.60ms)
INFO 2025-09-10 14:49:09,484 console_span_processor:39 telemetry: 21:49:09.480 [END] ModelsRoutingTable.get_model [StatusCode.OK] (0.19ms)
INFO 2025-09-10 14:49:09,484 console_span_processor:48 telemetry: output: {'identifier': 'sentence-transformers/all-MiniLM-L6-v2',
'provider_resource_id': 'all-MiniLM-L6-v2', 'provider_id': 'sentence-transformers', 'type': 'model', 'owner': None, 'source':
'listed_from_provider', 'metadata': {'embedding_dimension': 384}, 'model_type': 'embedding'}
INFO 2025-09-10 14:49:09,488 console_span_processor:39 telemetry: 21:49:09.486 [END] ModelsRoutingTable.get_provider_impl [StatusCode.OK] (0.17ms)
INFO 2025-09-10 14:49:09,488 console_span_processor:48 telemetry: output:
<llama_stack.providers.inline.inference.sentence_transformers.sentence_transformers.SentenceTransformersInferenceImpl object at 0x158e83350>
INFO 2025-09-10 14:49:09,492 console_span_processor:39 telemetry: 21:49:09.490 [END] ModelsRoutingTable.get_model [StatusCode.OK] (0.58ms)
INFO 2025-09-10 14:49:09,493 console_span_processor:48 telemetry: output: {'identifier': 'sentence-transformers/all-MiniLM-L6-v2',
'provider_resource_id': 'all-MiniLM-L6-v2', 'provider_id': 'sentence-transformers', 'type': 'model', 'owner': None, 'source':
'listed_from_provider', 'metadata': {'embedding_dimension': 384}, 'model_type': 'embedding'}
INFO 2025-09-10 14:49:09,924 console_span_processor:39 telemetry: 21:49:09.921 [END] InferenceRouter.openai_embeddings [StatusCode.OK] (441.92ms)
INFO 2025-09-10 14:49:09,926 console_span_processor:48 telemetry: output: {'object': 'list', 'data': [{'object': 'embedding', 'embedding':
[-0.050018310546875, 0.0007208543829619884, 0.048539839684963226, 0.013606906868517399, -0.006504438817501068, 0.004046895541250706,
-0.04984626919031143, -8.024782437132671e-05, -0.02159256860613823, 0.0015519573353230953, 0.10069309175014496, 0.04437215253710747,
-0.022335151210427284, -0.05230937898159027, -0.028983373194932938, -0.049531035125255585, 0.03074926696717739, -0.03056054376065731,
0.021489247679710388, 0.016868554055690765, -0.028984908014535904, -0.07053273916244507, -0.022961033508181572, -0.0717858299612999,
0.0674479678273201, 0.021412895992398262, -0.06054700165987015, 0.021910998970270157, -0.023192649707198143, -0.028992125764489174,
0.025179730728268623, -0.006338999141007662, -0.001874048844911158, 0.009305929765105247, 0.011422501876950264, 0.037604980170726776,
-0.039689771831035614, -0.08734020590782166, -2.2408454242395237e-05, -0.027818966656923294, -0.05882560834288597, 0.0047395736910402...
INFO 2025-09-10 14:49:09,935 console_span_processor:39 telemetry: 21:49:09.928 [END] FaissVectorIOAdapter.insert_chunks [StatusCode.OK] (448.38ms)
INFO 2025-09-10 14:49:09,938 console_span_processor:39 telemetry: 21:49:09.936 [END] ModelsRoutingTable.get_model [StatusCode.OK] (0.15ms)
INFO 2025-09-10 14:49:09,939 console_span_processor:48 telemetry: output: {'identifier': 'sentence-transformers/all-MiniLM-L6-v2',
'provider_resource_id': 'all-MiniLM-L6-v2', 'provider_id': 'sentence-transformers', 'type': 'model', 'owner': None, 'source':
'listed_from_provider', 'metadata': {'embedding_dimension': 384}, 'model_type': 'embedding'}
INFO 2025-09-10 14:49:09,944 console_span_processor:39 telemetry: 21:49:09.942 [END] ModelsRoutingTable.get_provider_impl [StatusCode.OK] (0.34ms)
INFO 2025-09-10 14:49:09,945 console_span_processor:48 telemetry: output:
<llama_stack.providers.inline.inference.sentence_transformers.sentence_transformers.SentenceTransformersInferenceImpl object at 0x158e83350>
INFO 2025-09-10 14:49:09,947 console_span_processor:39 telemetry: 21:49:09.946 [END] ModelsRoutingTable.get_model [StatusCode.OK] (0.19ms)
INFO 2025-09-10 14:49:09,948 console_span_processor:48 telemetry: output: {'identifier': 'sentence-transformers/all-MiniLM-L6-v2',
'provider_resource_id': 'all-MiniLM-L6-v2', 'provider_id': 'sentence-transformers', 'type': 'model', 'owner': None, 'source':
'listed_from_provider', 'metadata': {'embedding_dimension': 384}, 'model_type': 'embedding'}
INFO 2025-09-10 14:49:09,959 console_span_processor:39 telemetry: 21:49:09.949 [END] InferenceRouter.openai_embeddings [StatusCode.OK] (13.11ms)
INFO 2025-09-10 14:49:09,960 console_span_processor:48 telemetry: output: {'object': 'list', 'data': [{'object': 'embedding', 'embedding':
[-0.07958973944187164, -0.09508923441171646, 0.0747891291975975, -0.0033136801794171333, 0.03454456478357315, 0.041140977293252945,
-0.06803964823484421, 0.014224942773580551, -0.06238540634512901, 0.03782016783952713, -0.030075553804636, 0.07446419447660446,
-0.06111196056008339, 0.029801342636346817, 0.11399323493242264, 0.01820552721619606, 0.00257650064304471, -0.08268020302057266,
-0.08060702681541443, 0.004656659439206123, -0.053371429443359375, -0.03258609026670456, -0.024163667112588882, 0.0012904119212180376,
0.022314254194498062, -0.04680437222123146, -0.03445201367139816, 0.004914817865937948, -0.03131281957030296, 0.010677368380129337,
-0.011123362928628922, -0.022707175463438034, -0.0027590240351855755, 0.014538224786520004, 0.00694124773144722, -0.0027126462664455175,
0.023252086713910103, 0.07095751911401749, -0.030273273587226868, -0.04118560254573822, -0.04669591784477234, -0.028823204338550568,
-0.010...
INFO 2025-09-10 14:49:09,974 console_span_processor:39 telemetry: 21:49:09.961 [END] FaissVectorIOAdapter.insert_chunks [StatusCode.OK] (25.74ms)
INFO 2025-09-10 14:49:09,980 console_span_processor:39 telemetry: 21:49:09.975 [END] LocalfsFilesImpl.openai_retrieve_file [StatusCode.OK]
(37339.17ms)
INFO 2025-09-10 14:49:09,981 console_span_processor:48 telemetry: output: {'object': 'file', 'id': 'file-b2f38b0e164347f5a2b6bbe211e33ff3',
'bytes': 48, 'created_at': 1757540912, 'expires_at': 1789076912, 'filename': 'returns_policy.txt', 'purpose': 'assistants'}
INFO 2025-09-10 14:49:09,987 console_span_processor:39 telemetry: 21:49:09.982 [END] LocalfsFilesImpl.openai_retrieve_file [StatusCode.OK]
(37346.24ms)
INFO 2025-09-10 14:49:09,988 console_span_processor:48 telemetry: output: {'object': 'file', 'id': 'file-489db9aae0424745960e3408ff0f477f',
'bytes': 41, 'created_at': 1757540912, 'expires_at': 1789076912, 'filename': 'shipping_policy.txt', 'purpose': 'assistants'}
INFO 2025-09-10 14:49:10,038 uvicorn.access:473 uncategorized: 127.0.0.1:56006 - "POST /v1/openai/v1/vector_stores HTTP/1.1" 200
INFO 2025-09-10 14:49:10,041 console_span_processor:39 telemetry: 21:49:10.039 [END] VectorIORouter.openai_create_vector_store [StatusCode.OK]
(37443.86ms)
INFO 2025-09-10 14:49:10,042 console_span_processor:48 telemetry: output: {'id': 'vs_dab05212-db05-402c-91ef-57e41797406b', 'object':
'vector_store', 'created_at': 1757540912, 'name': 'acme_docs', 'usage_bytes': 0, 'file_counts': {'completed': 3, 'cancelled': 0, 'failed': 0,
'in_progress': 0, 'total': 3}, 'status': 'completed', 'expires_after': None, 'expires_at': None, 'last_active_at': 1757540912, 'metadata':
{'provider_id': 'faiss', 'provider_vector_db_id': 'vs_dab05212-db05-402c-91ef-57e41797406b'}}
INFO 2025-09-10 14:49:10,047 console_span_processor:39 telemetry: 21:49:10.044 [END] /v1/openai/v1/vector_stores [StatusCode.OK] (37449.64ms)
INFO 2025-09-10 14:49:10,047 console_span_processor:48 telemetry: raw_path: /v1/openai/v1/vector_stores
INFO 2025-09-10 14:49:10,048 console_span_processor:62 telemetry: 21:49:10.039 [INFO] 127.0.0.1:56006 - "POST /v1/openai/v1/vector_stores
HTTP/1.1" 200
INFO 2025-09-10 14:49:10,126 console_span_processor:28 telemetry: 21:49:10.126 [START] /v1/openai/v1/vector_stores/{vector_store_id}/search
INFO 2025-09-10 14:49:10,140 console_span_processor:39 telemetry: 21:49:10.132 [END] ModelsRoutingTable.get_model [StatusCode.OK] (0.72ms)
INFO 2025-09-10 14:49:10,142 console_span_processor:48 telemetry: output: {'identifier': 'sentence-transformers/all-MiniLM-L6-v2',
'provider_resource_id': 'all-MiniLM-L6-v2', 'provider_id': 'sentence-transformers', 'type': 'model', 'owner': None, 'source':
'listed_from_provider', 'metadata': {'embedding_dimension': 384}, 'model_type': 'embedding'}
INFO 2025-09-10 14:49:10,155 console_span_processor:39 telemetry: 21:49:10.143 [END] ModelsRoutingTable.get_provider_impl [StatusCode.OK] (0.34ms)
INFO 2025-09-10 14:49:10,155 console_span_processor:48 telemetry: output:
<llama_stack.providers.inline.inference.sentence_transformers.sentence_transformers.SentenceTransformersInferenceImpl object at 0x158e83350>
INFO 2025-09-10 14:49:10,160 console_span_processor:39 telemetry: 21:49:10.157 [END] ModelsRoutingTable.get_model [StatusCode.OK] (0.18ms)
INFO 2025-09-10 14:49:10,161 console_span_processor:48 telemetry: output: {'identifier': 'sentence-transformers/all-MiniLM-L6-v2',
'provider_resource_id': 'all-MiniLM-L6-v2', 'provider_id': 'sentence-transformers', 'type': 'model', 'owner': None, 'source':
'listed_from_provider', 'metadata': {'embedding_dimension': 384}, 'model_type': 'embedding'}
INFO 2025-09-10 14:49:10,258 console_span_processor:39 telemetry: 21:49:10.219 [END] InferenceRouter.openai_embeddings [StatusCode.OK] (88.76ms)
INFO 2025-09-10 14:49:10,266 console_span_processor:48 telemetry: output: {'object': 'list', 'data': [{'object': 'embedding', 'embedding':
[0.0018660365603864193, -0.008432421833276749, -0.009860510006546974, 0.07527908682823181, -0.008166038431227207, -0.08819602429866791,
-0.025107912719249725, -0.029266025871038437, 0.014401894062757492, 0.06447950005531311, 0.04112009331583977, -0.04028748720884323,
-0.02221696823835373, -0.009235711768269539, -0.04810388386249542, -0.02784842811524868, 0.016442419961094856, -0.07583750039339066,
-0.06627479195594788, 0.01860453188419342, 0.0008918081293813884, 0.011179491877555847, -0.048671603202819824, -0.021989954635500908,
0.04990514740347862, -0.003409573109820485, -0.06727275997400284, -0.054264623671770096, -0.022502778097987175, -0.03865018114447594,
-0.0471607930958271, 0.01671769842505455, 0.024404950439929962, 0.09877222776412964, -0.01660928875207901, 0.01298862136900425,
0.02916400320827961, -0.0722617655992508, 0.041335687041282654, -0.037857454270124435, -0.02524978667497635, -0.010434110648930073, -0....
INFO 2025-09-10 14:49:10,285 uvicorn.access:473 uncategorized: 127.0.0.1:56006 - "POST
/v1/openai/v1/vector_stores/vs_dab05212-db05-402c-91ef-57e41797406b/search HTTP/1.1" 200
INFO 2025-09-10 14:49:10,295 console_span_processor:39 telemetry: 21:49:10.292 [END] FaissVectorIOAdapter.query_chunks [StatusCode.OK] (161.80ms)
INFO 2025-09-10 14:49:10,296 console_span_processor:48 telemetry: output: {'chunks': [{'content': 'Acme ships globally in 3-5 business days.',
'metadata': {'document_id': 'file-489db9aae0424745960e3408ff0f477f', 'token_count': 12, 'metadata_token_count': 1}, 'embedding':
[-0.012346820905804634, -0.04591671749949455, 0.00545357633382082, 0.0767817348241806, -0.01030217856168747, -0.07128783315420151,
-0.047789815813302994, -0.0042580426670610905, -0.08333089202642441, 0.03493816778063774, 0.03678377717733383, -0.022125769406557083,
-0.001785362372174859, 0.03860057145357132, 0.017692940309643745, -0.011320478282868862, 0.020480643957853317, -0.14444826543331146,
-0.03509785607457161, -0.08347956091165543, 0.01723267324268818, -0.020868107676506042, -0.04816542565822601, -0.04063615947961807,
-0.02612607553601265, -0.06816241890192032, -0.021907860413193703, -0.05328420177102089, 0.0035953382030129433, -0.060775868594646454,
-0.07895789295434952, 0.08725343644618988, -0.004096562508493662, 0.07713106274604797, 0.04764929413795471, 0.03390089422464371, -0.03...
INFO 2025-09-10 14:49:10,304 console_span_processor:39 telemetry: 21:49:10.299 [END] VectorDBsRoutingTable.openai_search_vector_store
[StatusCode.OK] (169.86ms)
INFO 2025-09-10 14:49:10,313 console_span_processor:48 telemetry: output: {'object': 'vector_store.search_results.page', 'search_query': 'How
long does shipping take?', 'data': [{'file_id': '', 'filename': '', 'score': 1.0150761400159014, 'attributes': {'document_id':
'file-489db9aae0424745960e3408ff0f477f', 'token_count': 12.0, 'metadata_token_count': 1.0}, 'content': [{'type': 'text', 'text': 'Acme ships
globally in 3-5 business days.'}]}, {'file_id': '', 'filename': '', 'score': 0.7863530206684866, 'attributes': {'document_id':
'file-b2f38b0e164347f5a2b6bbe211e33ff3', 'token_count': 10.0, 'metadata_token_count': 1.0}, 'content': [{'type': 'text', 'text': 'Returns are
accepted within 30 days of purchase.'}]}], 'has_more': False, 'next_page': None}
INFO 2025-09-10 14:49:10,323 console_span_processor:39 telemetry: 21:49:10.318 [END] VectorIORouter.openai_search_vector_store [StatusCode.OK]
(188.52ms)
INFO 2025-09-10 14:49:10,324 console_span_processor:48 telemetry: output: {'object': 'vector_store.search_results.page', 'search_query': 'How
long does shipping take?', 'data': [{'file_id': '', 'filename': '', 'score': 1.0150761400159014, 'attributes': {'document_id':
'file-489db9aae0424745960e3408ff0f477f', 'token_count': 12.0, 'metadata_token_count': 1.0}, 'content': [{'type': 'text', 'text': 'Acme ships
globally in 3-5 business days.'}]}, {'file_id': '', 'filename': '', 'score': 0.7863530206684866, 'attributes': {'document_id':
'file-b2f38b0e164347f5a2b6bbe211e33ff3', 'token_count': 10.0, 'metadata_token_count': 1.0}, 'content': [{'type': 'text', 'text': 'Returns are
accepted within 30 days of purchase.'}]}], 'has_more': False, 'next_page': None}
INFO 2025-09-10 14:49:10,329 console_span_processor:39 telemetry: 21:49:10.326 [END] /v1/openai/v1/vector_stores/{vector_store_id}/search
[StatusCode.OK] (199.98ms)
INFO 2025-09-10 14:49:10,336 console_span_processor:48 telemetry: raw_path:
/v1/openai/v1/vector_stores/vs_dab05212-db05-402c-91ef-57e41797406b/search
INFO 2025-09-10 14:49:10,337 console_span_processor:62 telemetry: 21:49:10.290 [INFO] 127.0.0.1:56006 - "POST
/v1/openai/v1/vector_stores/vs_dab05212-db05-402c-91ef-57e41797406b/search HTTP/1.1" 200
INFO 2025-09-10 14:49:57,749 console_span_processor:28 telemetry: 21:49:57.749 [START] /v1/openai/v1/chat/completions
INFO 2025-09-10 14:49:57,758 console_span_processor:39 telemetry: 21:49:57.753 [END] ModelsRoutingTable.get_model [StatusCode.OK] (0.26ms)
INFO 2025-09-10 14:49:57,758 console_span_processor:48 telemetry: output: {'identifier': 'together/meta-llama/Llama-3.3-70B-Instruct-Turbo',
'provider_resource_id': 'meta-llama/Llama-3.3-70B-Instruct-Turbo', 'provider_id': 'together', 'type': 'model', 'owner': None, 'source':
'listed_from_provider', 'metadata': {}, 'model_type': 'llm'}
INFO 2025-09-10 14:49:57,761 console_span_processor:39 telemetry: 21:49:57.760 [END] ModelsRoutingTable.get_provider_impl [StatusCode.OK] (0.16ms)
INFO 2025-09-10 14:49:57,762 console_span_processor:48 telemetry: output:
<llama_stack.providers.remote.inference.together.together.TogetherInferenceAdapter object at 0x137069220>
INFO 2025-09-10 14:49:57,766 console_span_processor:39 telemetry: 21:49:57.764 [END] ModelsRoutingTable.get_model [StatusCode.OK] (0.51ms)
INFO 2025-09-10 14:49:57,767 console_span_processor:48 telemetry: output: {'identifier': 'together/meta-llama/Llama-3.3-70B-Instruct-Turbo',
'provider_resource_id': 'meta-llama/Llama-3.3-70B-Instruct-Turbo', 'provider_id': 'together', 'type': 'model', 'owner': None, 'source':
'listed_from_provider', 'metadata': {}, 'model_type': 'llm'}
huggingface/tokenizers: The current process just got forked, after parallelism has already been used. Disabling parallelism to avoid deadlocks...
To disable this warning, you can either:
- Avoid using `tokenizers` before the fork if possible
- Explicitly set the environment variable TOKENIZERS_PARALLELISM=(true | false)
huggingface/tokenizers: The current process just got forked, after parallelism has already been used. Disabling parallelism to avoid deadlocks...
To disable this warning, you can either:
- Avoid using `tokenizers` before the fork if possible
- Explicitly set the environment variable TOKENIZERS_PARALLELISM=(true | false)
INFO 2025-09-10 14:50:01,673 console_span_processor:39 telemetry: 21:50:01.672 [END] TogetherInferenceAdapter.openai_chat_completion
[StatusCode.OK] (3908.76ms)
INFO 2025-09-10 14:50:01,675 console_span_processor:48 telemetry: output: {'id': 'oAit2Fa-62bZhn-97d2236c1b482510', 'choices':
[{'finish_reason': 'stop', 'index': 0, 'logprobs': None, 'message': {'content': "In the Andes' gentle breeze, a llama's soft eyes gaze with
peaceful ease, its fur a warm and fuzzy tease. With steps both gentle and serene, the llama roams, a symbol of calm, its beauty pure and
supreme.", 'refusal': None, 'role': 'assistant', 'annotations': None, 'audio': None, 'function_call': None, 'tool_calls': []}, 'seed':
7075179338234292000}], 'created': 1757540999, 'model': 'meta-llama/Llama-3.3-70B-Instruct-Turbo', 'object': 'chat.completion',
'service_tier': None, 'system_fingerprint': None, 'usage': {'completion_tokens': 50, 'prompt_tokens': 50, 'total_tokens': 100,
'completion_tokens_details': None, 'prompt_tokens_details': None, 'cached_tokens': 0}, 'prompt': []}
INFO 2025-09-10 14:50:01,687 uvicorn.access:473 uncategorized: ::1:56392 - "POST /v1/openai/v1/chat/completions HTTP/1.1" 200
INFO 2025-09-10 14:50:01,692 console_span_processor:39 telemetry: 21:50:01.688 [END] InferenceRouter.openai_chat_completion [StatusCode.OK]
(3936.71ms)
INFO 2025-09-10 14:50:01,692 console_span_processor:48 telemetry: output: {'id': 'oAit2Fa-62bZhn-97d2236c1b482510', 'choices':
[{'finish_reason': 'stop', 'index': 0, 'logprobs': None, 'message': {'content': "In the Andes' gentle breeze, a llama's soft eyes gaze with
peaceful ease, its fur a warm and fuzzy tease. With steps both gentle and serene, the llama roams, a symbol of calm, its beauty pure and
supreme.", 'refusal': None, 'role': 'assistant', 'annotations': None, 'audio': None, 'function_call': None, 'tool_calls': None}, 'seed':
7075179338234292000}], 'created': 1757540999, 'model': 'meta-llama/Llama-3.3-70B-Instruct-Turbo', 'object': 'chat.completion',
'service_tier': None, 'system_fingerprint': None, 'usage': {'completion_tokens': 50, 'prompt_tokens': 50, 'total_tokens': 100,
'completion_tokens_details': None, 'prompt_tokens_details': None, 'cached_tokens': 0}, 'prompt': [], 'metrics': [{'trace_id':
'b7f7481d23ea1b2d4b89111888ebe8b3', 'span_id': '60cf33fa222feaf3', 'timestamp': '2025-09-10T21:50:01.687118Z', 'attributes': {'model_id':
'together/me...
INFO 2025-09-10 14:50:01,694 console_span_processor:62 telemetry: 21:50:01.687 [INFO] metric.prompt_tokens
INFO 2025-09-10 14:50:01,695 console_span_processor:67 telemetry: value: 50
INFO 2025-09-10 14:50:01,695 console_span_processor:67 telemetry: unit: tokens
INFO 2025-09-10 14:50:01,696 console_span_processor:67 telemetry: model_id: together/meta-llama/Llama-3.3-70B-Instruct-Turbo
INFO 2025-09-10 14:50:01,696 console_span_processor:67 telemetry: provider_id: together
INFO 2025-09-10 14:50:01,698 console_span_processor:62 telemetry: 21:50:01.687 [INFO] metric.completion_tokens
INFO 2025-09-10 14:50:01,699 console_span_processor:67 telemetry: value: 50
INFO 2025-09-10 14:50:01,699 console_span_processor:67 telemetry: unit: tokens
INFO 2025-09-10 14:50:01,700 console_span_processor:67 telemetry: model_id: together/meta-llama/Llama-3.3-70B-Instruct-Turbo
INFO 2025-09-10 14:50:01,701 console_span_processor:67 telemetry: provider_id: together
INFO 2025-09-10 14:50:01,719 console_span_processor:62 telemetry: 21:50:01.687 [INFO] metric.total_tokens
INFO 2025-09-10 14:50:01,723 console_span_processor:67 telemetry: value: 100
INFO 2025-09-10 14:50:01,725 console_span_processor:67 telemetry: unit: tokens
INFO 2025-09-10 14:50:01,730 console_span_processor:67 telemetry: model_id: together/meta-llama/Llama-3.3-70B-Instruct-Turbo
INFO 2025-09-10 14:50:01,733 console_span_processor:67 telemetry: provider_id: together
INFO 2025-09-10 14:50:01,746 console_span_processor:39 telemetry: 21:50:01.738 [END] /v1/openai/v1/chat/completions [StatusCode.OK] (3989.18ms)
INFO 2025-09-10 14:50:01,747 console_span_processor:48 telemetry: raw_path: /v1/openai/v1/chat/completions
INFO 2025-09-10 14:50:01,748 console_span_processor:62 telemetry: 21:50:01.688 [INFO] ::1:56392 - "POST /v1/openai/v1/chat/completions HTTP/1.1"
200
INFO 2025-09-10 14:51:45,329 console_span_processor:28 telemetry: 21:51:45.329 [START] /v1/openai/v1/chat/completions
INFO 2025-09-10 14:51:45,371 console_span_processor:39 telemetry: 21:51:45.337 [END] ModelsRoutingTable.get_model [StatusCode.OK] (0.30ms)
INFO 2025-09-10 14:51:45,375 console_span_processor:48 telemetry: output: {'identifier': 'together/meta-llama/Llama-3.3-70B-Instruct-Turbo',
'provider_resource_id': 'meta-llama/Llama-3.3-70B-Instruct-Turbo', 'provider_id': 'together', 'type': 'model', 'owner': None, 'source':
'listed_from_provider', 'metadata': {}, 'model_type': 'llm'}
INFO 2025-09-10 14:51:45,408 console_span_processor:39 telemetry: 21:51:45.377 [END] ModelsRoutingTable.get_provider_impl [StatusCode.OK] (0.18ms)
INFO 2025-09-10 14:51:45,408 console_span_processor:48 telemetry: output:
<llama_stack.providers.remote.inference.together.together.TogetherInferenceAdapter object at 0x137069220>
INFO 2025-09-10 14:51:45,415 console_span_processor:39 telemetry: 21:51:45.410 [END] ModelsRoutingTable.get_model [StatusCode.OK] (0.56ms)
INFO 2025-09-10 14:51:45,415 console_span_processor:48 telemetry: output: {'identifier': 'together/meta-llama/Llama-3.3-70B-Instruct-Turbo',
'provider_resource_id': 'meta-llama/Llama-3.3-70B-Instruct-Turbo', 'provider_id': 'together', 'type': 'model', 'owner': None, 'source':
'listed_from_provider', 'metadata': {}, 'model_type': 'llm'}
INFO 2025-09-10 14:51:46,425 console_span_processor:39 telemetry: 21:51:46.414 [END] TogetherInferenceAdapter.openai_chat_completion
[StatusCode.OK] (1005.10ms)
INFO 2025-09-10 14:51:46,426 console_span_processor:48 telemetry: output: {'id': 'oAitZwc-62bZhn-97d22606494cfa1a', 'choices':
[{'finish_reason': 'stop', 'index': 0, 'logprobs': None, 'message': {'content': 'Thought: To answer the question "How long does shipping
take?", I need to search the provided vector store for relevant information. The vector store ID is vs_dab05212-db05-402c-91ef-57e41797406b.
I will use the Llama Stack Vector Store RAG tool to find the most relevant documents.\n\nAction: Llama Stack Vector Store RAG tool\nAction
Input: {"query": "How long does shipping take?", "vector_store_id": "vs_dab05212-db05-402c-91ef-57e41797406b", "top_k": 1, "score_threshold":
0}', 'refusal': None, 'role': 'assistant', 'annotations': None, 'audio': None, 'function_call': None, 'tool_calls': []}, 'seed':
15009310705663400000}], 'created': 1757541105, 'model': 'meta-llama/Llama-3.3-70B-Instruct-Turbo', 'object': 'chat.completion',
'service_tier': None, 'system_fingerprint': None, 'usage': {'completion_tokens': 138, 'prompt_tokens': 495, 'total_tokens': 633,...
INFO 2025-09-10 14:51:46,443 uvicorn.access:473 uncategorized: ::1:56900 - "POST /v1/openai/v1/chat/completions HTTP/1.1" 200
INFO 2025-09-10 14:51:46,457 console_span_processor:39 telemetry: 21:51:46.444 [END] InferenceRouter.openai_chat_completion [StatusCode.OK]
(1106.92ms)
INFO 2025-09-10 14:51:46,458 console_span_processor:48 telemetry: output: {'id': 'oAitZwc-62bZhn-97d22606494cfa1a', 'choices':
[{'finish_reason': 'stop', 'index': 0, 'logprobs': None, 'message': {'content': 'Thought: To answer the question "How long does shipping
take?", I need to search the provided vector store for relevant information. The vector store ID is vs_dab05212-db05-402c-91ef-57e41797406b.
I will use the Llama Stack Vector Store RAG tool to find the most relevant documents.\n\nAction: Llama Stack Vector Store RAG tool\nAction
Input: {"query": "How long does shipping take?", "vector_store_id": "vs_dab05212-db05-402c-91ef-57e41797406b", "top_k": 1, "score_threshold":
0}', 'refusal': None, 'role': 'assistant', 'annotations': None, 'audio': None, 'function_call': None, 'tool_calls': None}, 'seed':
15009310705663400000}], 'created': 1757541105, 'model': 'meta-llama/Llama-3.3-70B-Instruct-Turbo', 'object': 'chat.completion',
'service_tier': None, 'system_fingerprint': None, 'usage': {'completion_tokens': 138, 'prompt_tokens': 495, 'total_tokens': 63...
INFO 2025-09-10 14:51:46,459 console_span_processor:62 telemetry: 21:51:46.442 [INFO] metric.prompt_tokens
INFO 2025-09-10 14:51:46,459 console_span_processor:67 telemetry: value: 495
INFO 2025-09-10 14:51:46,460 console_span_processor:67 telemetry: unit: tokens
INFO 2025-09-10 14:51:46,460 console_span_processor:67 telemetry: model_id: together/meta-llama/Llama-3.3-70B-Instruct-Turbo
INFO 2025-09-10 14:51:46,461 console_span_processor:67 telemetry: provider_id: together
INFO 2025-09-10 14:51:46,461 console_span_processor:62 telemetry: 21:51:46.442 [INFO] metric.completion_tokens
INFO 2025-09-10 14:51:46,462 console_span_processor:67 telemetry: value: 138
INFO 2025-09-10 14:51:46,463 console_span_processor:67 telemetry: unit: tokens
INFO 2025-09-10 14:51:46,463 console_span_processor:67 telemetry: model_id: together/meta-llama/Llama-3.3-70B-Instruct-Turbo
INFO 2025-09-10 14:51:46,463 console_span_processor:67 telemetry: provider_id: together
INFO 2025-09-10 14:51:46,464 console_span_processor:62 telemetry: 21:51:46.442 [INFO] metric.total_tokens
INFO 2025-09-10 14:51:46,466 console_span_processor:67 telemetry: value: 633
INFO 2025-09-10 14:51:46,466 console_span_processor:67 telemetry: unit: tokens
INFO 2025-09-10 14:51:46,467 console_span_processor:67 telemetry: model_id: together/meta-llama/Llama-3.3-70B-Instruct-Turbo
INFO 2025-09-10 14:51:46,467 console_span_processor:67 telemetry: provider_id: together
INFO 2025-09-10 14:51:46,522 console_span_processor:39 telemetry: 21:51:46.468 [END] /v1/openai/v1/chat/completions [StatusCode.OK] (1138.88ms)
INFO 2025-09-10 14:51:46,530 console_span_processor:48 telemetry: raw_path: /v1/openai/v1/chat/completions
INFO 2025-09-10 14:51:46,531 console_span_processor:62 telemetry: 21:51:46.443 [INFO] ::1:56900 - "POST /v1/openai/v1/chat/completions HTTP/1.1"
200
INFO 2025-09-10 14:51:46,532 console_span_processor:28 telemetry: 21:51:46.532 [START] /v1/openai/v1/vector_stores/{vector_store_id}/search
INFO 2025-09-10 14:51:46,544 console_span_processor:39 telemetry: 21:51:46.534 [END] ModelsRoutingTable.get_model [StatusCode.OK] (0.20ms)
INFO 2025-09-10 14:51:46,544 console_span_processor:48 telemetry: output: {'identifier': 'sentence-transformers/all-MiniLM-L6-v2',
'provider_resource_id': 'all-MiniLM-L6-v2', 'provider_id': 'sentence-transformers', 'type': 'model', 'owner': None, 'source':
'listed_from_provider', 'metadata': {'embedding_dimension': 384}, 'model_type': 'embedding'}
INFO 2025-09-10 14:51:46,551 console_span_processor:39 telemetry: 21:51:46.547 [END] ModelsRoutingTable.get_provider_impl [StatusCode.OK] (0.27ms)
INFO 2025-09-10 14:51:46,553 console_span_processor:48 telemetry: output:
<llama_stack.providers.inline.inference.sentence_transformers.sentence_transformers.SentenceTransformersInferenceImpl object at 0x158e83350>
INFO 2025-09-10 14:51:46,558 console_span_processor:39 telemetry: 21:51:46.556 [END] ModelsRoutingTable.get_model [StatusCode.OK] (0.51ms)
INFO 2025-09-10 14:51:46,559 console_span_processor:48 telemetry: output: {'identifier': 'sentence-transformers/all-MiniLM-L6-v2',
'provider_resource_id': 'all-MiniLM-L6-v2', 'provider_id': 'sentence-transformers', 'type': 'model', 'owner': None, 'source':
'listed_from_provider', 'metadata': {'embedding_dimension': 384}, 'model_type': 'embedding'}
INFO 2025-09-10 14:51:47,003 uvicorn.access:473 uncategorized: 127.0.0.1:56904 - "POST
/v1/openai/v1/vector_stores/vs_dab05212-db05-402c-91ef-57e41797406b/search HTTP/1.1" 200
INFO 2025-09-10 14:51:47,004 console_span_processor:39 telemetry: 21:51:46.991 [END] InferenceRouter.openai_embeddings [StatusCode.OK] (457.59ms)
INFO 2025-09-10 14:51:47,005 console_span_processor:48 telemetry: output: {'object': 'list', 'data': [{'object': 'embedding', 'embedding':
[0.0018660365603864193, -0.008432421833276749, -0.009860510006546974, 0.07527908682823181, -0.008166038431227207, -0.08819602429866791,
-0.025107912719249725, -0.029266025871038437, 0.014401894062757492, 0.06447950005531311, 0.04112009331583977, -0.04028748720884323,
-0.02221696823835373, -0.009235711768269539, -0.04810388386249542, -0.02784842811524868, 0.016442419961094856, -0.07583750039339066,
-0.06627479195594788, 0.01860453188419342, 0.0008918081293813884, 0.011179491877555847, -0.048671603202819824, -0.021989954635500908,
0.04990514740347862, -0.003409573109820485, -0.06727275997400284, -0.054264623671770096, -0.022502778097987175, -0.03865018114447594,
-0.0471607930958271, 0.01671769842505455, 0.024404950439929962, 0.09877222776412964, -0.01660928875207901, 0.01298862136900425,
0.02916400320827961, -0.0722617655992508, 0.041335687041282654, -0.037857454270124435, -0.02524978667497635, -0.010434110648930073, -0....
INFO 2025-09-10 14:51:47,025 console_span_processor:39 telemetry: 21:51:47.008 [END] FaissVectorIOAdapter.query_chunks [StatusCode.OK] (474.21ms)
INFO 2025-09-10 14:51:47,028 console_span_processor:48 telemetry: output: {'chunks': [{'content': 'Acme ships globally in 3-5 business days.',
'metadata': {'document_id': 'file-489db9aae0424745960e3408ff0f477f', 'token_count': 12, 'metadata_token_count': 1}, 'embedding':
[-0.012346820905804634, -0.04591671749949455, 0.00545357633382082, 0.0767817348241806, -0.01030217856168747, -0.07128783315420151,
-0.047789815813302994, -0.0042580426670610905, -0.08333089202642441, 0.03493816778063774, 0.03678377717733383, -0.022125769406557083,
-0.001785362372174859, 0.03860057145357132, 0.017692940309643745, -0.011320478282868862, 0.020480643957853317, -0.14444826543331146,
-0.03509785607457161, -0.08347956091165543, 0.01723267324268818, -0.020868107676506042, -0.04816542565822601, -0.04063615947961807,
-0.02612607553601265, -0.06816241890192032, -0.021907860413193703, -0.05328420177102089, 0.0035953382030129433, -0.060775868594646454,
-0.07895789295434952, 0.08725343644618988, -0.004096562508493662, 0.07713106274604797, 0.04764929413795471, 0.03390089422464371, -0.03...
INFO 2025-09-10 14:51:47,038 console_span_processor:39 telemetry: 21:51:47.034 [END] VectorDBsRoutingTable.openai_search_vector_store
[StatusCode.OK] (500.67ms)
INFO 2025-09-10 14:51:47,040 console_span_processor:48 telemetry: output: {'object': 'vector_store.search_results.page', 'search_query': 'How
long does shipping take?', 'data': [{'file_id': '', 'filename': '', 'score': 1.0150761400159014, 'attributes': {'document_id':
'file-489db9aae0424745960e3408ff0f477f', 'token_count': 12.0, 'metadata_token_count': 1.0}, 'content': [{'type': 'text', 'text': 'Acme ships
globally in 3-5 business days.'}]}], 'has_more': False, 'next_page': None}
INFO 2025-09-10 14:51:47,051 console_span_processor:39 telemetry: 21:51:47.043 [END] VectorIORouter.openai_search_vector_store [StatusCode.OK]
(510.32ms)
INFO 2025-09-10 14:51:47,052 console_span_processor:48 telemetry: output: {'object': 'vector_store.search_results.page', 'search_query': 'How
long does shipping take?', 'data': [{'file_id': '', 'filename': '', 'score': 1.0150761400159014, 'attributes': {'document_id':
'file-489db9aae0424745960e3408ff0f477f', 'token_count': 12.0, 'metadata_token_count': 1.0}, 'content': [{'type': 'text', 'text': 'Acme ships
globally in 3-5 business days.'}]}], 'has_more': False, 'next_page': None}
INFO 2025-09-10 14:51:47,059 console_span_processor:39 telemetry: 21:51:47.055 [END] /v1/openai/v1/vector_stores/{vector_store_id}/search
[StatusCode.OK] (522.95ms)
INFO 2025-09-10 14:51:47,061 console_span_processor:48 telemetry: raw_path:
/v1/openai/v1/vector_stores/vs_dab05212-db05-402c-91ef-57e41797406b/search
INFO 2025-09-10 14:51:47,063 console_span_processor:62 telemetry: 21:51:47.004 [INFO] 127.0.0.1:56904 - "POST
/v1/openai/v1/vector_stores/vs_dab05212-db05-402c-91ef-57e41797406b/search HTTP/1.1" 200
INFO 2025-09-10 14:51:47,066 console_span_processor:28 telemetry: 21:51:47.066 [START] /v1/openai/v1/vector_stores/{vector_store_id}/search
INFO 2025-09-10 14:51:47,072 uvicorn.access:473 uncategorized: 127.0.0.1:56904 - "POST
/v1/openai/v1/vector_stores/vs_dab05212-db05-402c-91ef-57e41797406b/search HTTP/1.1" 200
INFO 2025-09-10 14:51:47,106 console_span_processor:39 telemetry: 21:51:47.086 [END] ModelsRoutingTable.get_model [StatusCode.OK] (0.59ms)
INFO 2025-09-10 14:51:47,107 console_span_processor:48 telemetry: output: {'identifier': 'sentence-transformers/all-MiniLM-L6-v2',
'provider_resource_id': 'all-MiniLM-L6-v2', 'provider_id': 'sentence-transformers', 'type': 'model', 'owner': None, 'source':
'listed_from_provider', 'metadata': {'embedding_dimension': 384}, 'model_type': 'embedding'}
INFO 2025-09-10 14:51:47,121 console_span_processor:39 telemetry: 21:51:47.118 [END] ModelsRoutingTable.get_provider_impl [StatusCode.OK] (0.85ms)
INFO 2025-09-10 14:51:47,122 console_span_processor:48 telemetry: output:
<llama_stack.providers.inline.inference.sentence_transformers.sentence_transformers.SentenceTransformersInferenceImpl object at 0x158e83350>
INFO 2025-09-10 14:51:47,134 uvicorn.access:473 uncategorized: 127.0.0.1:56904 - "POST
/v1/openai/v1/vector_stores/vs_dab05212-db05-402c-91ef-57e41797406b/search HTTP/1.1" 200
INFO 2025-09-10 14:51:47,141 console_span_processor:39 telemetry: 21:51:47.124 [END] ModelsRoutingTable.get_model [StatusCode.OK] (0.22ms)
INFO 2025-09-10 14:51:47,141 console_span_processor:48 telemetry: output: {'identifier': 'sentence-transformers/all-MiniLM-L6-v2',
'provider_resource_id': 'all-MiniLM-L6-v2', 'provider_id': 'sentence-transformers', 'type': 'model', 'owner': None, 'source':
'listed_from_provider', 'metadata': {'embedding_dimension': 384}, 'model_type': 'embedding'}
INFO 2025-09-10 14:51:47,154 uvicorn.access:473 uncategorized: 127.0.0.1:56904 - "POST
/v1/openai/v1/vector_stores/vs_dab05212-db05-402c-91ef-57e41797406b/search HTTP/1.1" 200
INFO 2025-09-10 14:51:47,155 console_span_processor:39 telemetry: 21:51:47.143 [END] InferenceRouter.openai_embeddings [StatusCode.OK] (57.86ms)
INFO 2025-09-10 14:51:47,156 console_span_processor:48 telemetry: output: {'object': 'list', 'data': [{'object': 'embedding', 'embedding':
[0.0018660365603864193, -0.008432421833276749, -0.009860510006546974, 0.07527908682823181, -0.008166038431227207, -0.08819602429866791,
-0.025107912719249725, -0.029266025871038437, 0.014401894062757492, 0.06447950005531311, 0.04112009331583977, -0.04028748720884323,
-0.02221696823835373, -0.009235711768269539, -0.04810388386249542, -0.02784842811524868, 0.016442419961094856, -0.07583750039339066,
-0.06627479195594788, 0.01860453188419342, 0.0008918081293813884, 0.011179491877555847, -0.048671603202819824, -0.021989954635500908,
0.04990514740347862, -0.003409573109820485, -0.06727275997400284, -0.054264623671770096, -0.022502778097987175, -0.03865018114447594,
-0.0471607930958271, 0.01671769842505455, 0.024404950439929962, 0.09877222776412964, -0.01660928875207901, 0.01298862136900425,
0.02916400320827961, -0.0722617655992508, 0.041335687041282654, -0.037857454270124435, -0.02524978667497635, -0.010434110648930073, -0....
INFO 2025-09-10 14:51:47,169 console_span_processor:39 telemetry: 21:51:47.159 [END] FaissVectorIOAdapter.query_chunks [StatusCode.OK] (75.34ms)
INFO 2025-09-10 14:51:47,170 console_span_processor:48 telemetry: output: {'chunks': [{'content': 'Acme ships globally in 3-5 business days.',
'metadata': {'document_id': 'file-489db9aae0424745960e3408ff0f477f', 'token_count': 12, 'metadata_token_count': 1}, 'embedding':
[-0.012346820905804634, -0.04591671749949455, 0.00545357633382082, 0.0767817348241806, -0.01030217856168747, -0.07128783315420151,
-0.047789815813302994, -0.0042580426670610905, -0.08333089202642441, 0.03493816778063774, 0.03678377717733383, -0.022125769406557083,
-0.001785362372174859, 0.03860057145357132, 0.017692940309643745, -0.011320478282868862, 0.020480643957853317, -0.14444826543331146,
-0.03509785607457161, -0.08347956091165543, 0.01723267324268818, -0.020868107676506042, -0.04816542565822601, -0.04063615947961807,
-0.02612607553601265, -0.06816241890192032, -0.021907860413193703, -0.05328420177102089, 0.0035953382030129433, -0.060775868594646454,
-0.07895789295434952, 0.08725343644618988, -0.004096562508493662, 0.07713106274604797, 0.04764929413795471, 0.03390089422464371, -0.03...
INFO 2025-09-10 14:51:47,185 uvicorn.access:473 uncategorized: 127.0.0.1:56904 - "POST
/v1/openai/v1/vector_stores/vs_dab05212-db05-402c-91ef-57e41797406b/search HTTP/1.1" 200
INFO 2025-09-10 14:51:47,204 uvicorn.access:473 uncategorized: 127.0.0.1:56904 - "POST
/v1/openai/v1/vector_stores/vs_dab05212-db05-402c-91ef-57e41797406b/search HTTP/1.1" 200
INFO 2025-09-10 14:51:47,205 console_span_processor:39 telemetry: 21:51:47.173 [END] VectorDBsRoutingTable.openai_search_vector_store
[StatusCode.OK] (89.84ms)
INFO 2025-09-10 14:51:47,206 console_span_processor:48 telemetry: output: {'object': 'vector_store.search_results.page', 'search_query': 'How
long does shipping take?', 'data': [{'file_id': '', 'filename': '', 'score': 1.0150761400159014, 'attributes': {'document_id':
'file-489db9aae0424745960e3408ff0f477f', 'token_count': 12.0, 'metadata_token_count': 1.0}, 'content': [{'type': 'text', 'text': 'Acme ships
globally in 3-5 business days.'}]}], 'has_more': False, 'next_page': None}
INFO 2025-09-10 14:51:47,220 console_span_processor:39 telemetry: 21:51:47.208 [END] VectorIORouter.openai_search_vector_store [StatusCode.OK]
(128.68ms)
INFO 2025-09-10 14:51:47,221 console_span_processor:48 telemetry: output: {'object': 'vector_store.search_results.page', 'search_query': 'How
long does shipping take?', 'data': [{'file_id': '', 'filename': '', 'score': 1.0150761400159014, 'attributes': {'document_id':
'file-489db9aae0424745960e3408ff0f477f', 'token_count': 12.0, 'metadata_token_count': 1.0}, 'content': [{'type': 'text', 'text': 'Acme ships
globally in 3-5 business days.'}]}], 'has_more': False, 'next_page': None}
INFO 2025-09-10 14:51:47,236 console_span_processor:39 telemetry: 21:51:47.223 [END] /v1/openai/v1/vector_stores/{vector_store_id}/search
[StatusCode.OK] (157.17ms)
INFO 2025-09-10 14:51:47,237 console_span_processor:48 telemetry: raw_path:
/v1/openai/v1/vector_stores/vs_dab05212-db05-402c-91ef-57e41797406b/search
INFO 2025-09-10 14:51:47,238 console_span_processor:62 telemetry: 21:51:47.074 [INFO] 127.0.0.1:56904 - "POST
/v1/openai/v1/vector_stores/vs_dab05212-db05-402c-91ef-57e41797406b/search HTTP/1.1" 200
INFO 2025-09-10 14:51:47,239 console_span_processor:28 telemetry: 21:51:47.239 [START] /v1/openai/v1/vector_stores/{vector_store_id}/search
INFO 2025-09-10 14:51:47,243 console_span_processor:39 telemetry: 21:51:47.241 [END] ModelsRoutingTable.get_model [StatusCode.OK] (0.17ms)
INFO 2025-09-10 14:51:47,244 console_span_processor:48 telemetry: output: {'identifier': 'sentence-transformers/all-MiniLM-L6-v2',
'provider_resource_id': 'all-MiniLM-L6-v2', 'provider_id': 'sentence-transformers', 'type': 'model', 'owner': None, 'source':
'listed_from_provider', 'metadata': {'embedding_dimension': 384}, 'model_type': 'embedding'}
INFO 2025-09-10 14:51:47,271 console_span_processor:39 telemetry: 21:51:47.249 [END] ModelsRoutingTable.get_provider_impl [StatusCode.OK] (1.66ms)
INFO 2025-09-10 14:51:47,272 console_span_processor:48 telemetry: output:
<llama_stack.providers.inline.inference.sentence_transformers.sentence_transformers.SentenceTransformersInferenceImpl object at 0x158e83350>
INFO 2025-09-10 14:51:47,275 console_span_processor:39 telemetry: 21:51:47.273 [END] ModelsRoutingTable.get_model [StatusCode.OK] (0.23ms)
INFO 2025-09-10 14:51:47,275 console_span_processor:48 telemetry: output: {'identifier': 'sentence-transformers/all-MiniLM-L6-v2',
'provider_resource_id': 'all-MiniLM-L6-v2', 'provider_id': 'sentence-transformers', 'type': 'model', 'owner': None, 'source':
'listed_from_provider', 'metadata': {'embedding_dimension': 384}, 'model_type': 'embedding'}
INFO 2025-09-10 14:51:47,281 console_span_processor:39 telemetry: 21:51:47.276 [END] InferenceRouter.openai_embeddings [StatusCode.OK] (35.50ms)
INFO 2025-09-10 14:51:47,281 console_span_processor:48 telemetry: output: {'object': 'list', 'data': [{'object': 'embedding', 'embedding':
[0.0018660365603864193, -0.008432421833276749, -0.009860510006546974, 0.07527908682823181, -0.008166038431227207, -0.08819602429866791,
-0.025107912719249725, -0.029266025871038437, 0.014401894062757492, 0.06447950005531311, 0.04112009331583977, -0.04028748720884323,
-0.02221696823835373, -0.009235711768269539, -0.04810388386249542, -0.02784842811524868, 0.016442419961094856, -0.07583750039339066,
-0.06627479195594788, 0.01860453188419342, 0.0008918081293813884, 0.011179491877555847, -0.048671603202819824, -0.021989954635500908,
0.04990514740347862, -0.003409573109820485, -0.06727275997400284, -0.054264623671770096, -0.022502778097987175, -0.03865018114447594,
-0.0471607930958271, 0.01671769842505455, 0.024404950439929962, 0.09877222776412964, -0.01660928875207901, 0.01298862136900425,
0.02916400320827961, -0.0722617655992508, 0.041335687041282654, -0.037857454270124435, -0.02524978667497635, -0.010434110648930073, -0....
INFO 2025-09-10 14:51:47,294 console_span_processor:39 telemetry: 21:51:47.283 [END] FaissVectorIOAdapter.query_chunks [StatusCode.OK] (42.27ms)
INFO 2025-09-10 14:51:47,295 console_span_processor:48 telemetry: output: {'chunks': [{'content': 'Acme ships globally in 3-5 business days.',
'metadata': {'document_id': 'file-489db9aae0424745960e3408ff0f477f', 'token_count': 12, 'metadata_token_count': 1}, 'embedding':
[-0.012346820905804634, -0.04591671749949455, 0.00545357633382082, 0.0767817348241806, -0.01030217856168747, -0.07128783315420151,
-0.047789815813302994, -0.0042580426670610905, -0.08333089202642441, 0.03493816778063774, 0.03678377717733383, -0.022125769406557083,
-0.001785362372174859, 0.03860057145357132, 0.017692940309643745, -0.011320478282868862, 0.020480643957853317, -0.14444826543331146,
-0.03509785607457161, -0.08347956091165543, 0.01723267324268818, -0.020868107676506042, -0.04816542565822601, -0.04063615947961807,
-0.02612607553601265, -0.06816241890192032, -0.021907860413193703, -0.05328420177102089, 0.0035953382030129433, -0.060775868594646454,
-0.07895789295434952, 0.08725343644618988, -0.004096562508493662, 0.07713106274604797, 0.04764929413795471, 0.03390089422464371, -0.03...
INFO 2025-09-10 14:51:47,298 console_span_processor:39 telemetry: 21:51:47.297 [END] VectorDBsRoutingTable.openai_search_vector_store
[StatusCode.OK] (56.25ms)
INFO 2025-09-10 14:51:47,299 console_span_processor:48 telemetry: output: {'object': 'vector_store.search_results.page', 'search_query': 'How
long does shipping take?', 'data': [{'file_id': '', 'filename': '', 'score': 1.0150761400159014, 'attributes': {'document_id':
'file-489db9aae0424745960e3408ff0f477f', 'token_count': 12.0, 'metadata_token_count': 1.0}, 'content': [{'type': 'text', 'text': 'Acme ships
globally in 3-5 business days.'}]}], 'has_more': False, 'next_page': None}
INFO 2025-09-10 14:51:47,301 console_span_processor:39 telemetry: 21:51:47.300 [END] VectorIORouter.openai_search_vector_store [StatusCode.OK]
(60.15ms)
INFO 2025-09-10 14:51:47,302 console_span_processor:48 telemetry: output: {'object': 'vector_store.search_results.page', 'search_query': 'How
long does shipping take?', 'data': [{'file_id': '', 'filename': '', 'score': 1.0150761400159014, 'attributes': {'document_id':
'file-489db9aae0424745960e3408ff0f477f', 'token_count': 12.0, 'metadata_token_count': 1.0}, 'content': [{'type': 'text', 'text': 'Acme ships
globally in 3-5 business days.'}]}], 'has_more': False, 'next_page': None}
INFO 2025-09-10 14:51:47,306 console_span_processor:39 telemetry: 21:51:47.303 [END] /v1/openai/v1/vector_stores/{vector_store_id}/search
[StatusCode.OK] (64.16ms)
INFO 2025-09-10 14:51:47,307 console_span_processor:48 telemetry: raw_path:
/v1/openai/v1/vector_stores/vs_dab05212-db05-402c-91ef-57e41797406b/search
INFO 2025-09-10 14:51:47,307 console_span_processor:62 telemetry: 21:51:47.135 [INFO] 127.0.0.1:56904 - "POST
/v1/openai/v1/vector_stores/vs_dab05212-db05-402c-91ef-57e41797406b/search HTTP/1.1" 200
INFO 2025-09-10 14:51:47,308 console_span_processor:28 telemetry: 21:51:47.308 [START] /v1/openai/v1/vector_stores/{vector_store_id}/search
INFO 2025-09-10 14:51:47,316 console_span_processor:39 telemetry: 21:51:47.310 [END] ModelsRoutingTable.get_model [StatusCode.OK] (0.14ms)
INFO 2025-09-10 14:51:47,317 console_span_processor:48 telemetry: output: {'identifier': 'sentence-transformers/all-MiniLM-L6-v2',
'provider_resource_id': 'all-MiniLM-L6-v2', 'provider_id': 'sentence-transformers', 'type': 'model', 'owner': None, 'source':
'listed_from_provider', 'metadata': {'embedding_dimension': 384}, 'model_type': 'embedding'}
INFO 2025-09-10 14:51:47,320 console_span_processor:39 telemetry: 21:51:47.319 [END] ModelsRoutingTable.get_provider_impl [StatusCode.OK] (0.37ms)
INFO 2025-09-10 14:51:47,321 console_span_processor:48 telemetry: output:
<llama_stack.providers.inline.inference.sentence_transformers.sentence_transformers.SentenceTransformersInferenceImpl object at 0x158e83350>
INFO 2025-09-10 14:51:47,324 console_span_processor:39 telemetry: 21:51:47.323 [END] ModelsRoutingTable.get_model [StatusCode.OK] (0.26ms)
INFO 2025-09-10 14:51:47,325 console_span_processor:48 telemetry: output: {'identifier': 'sentence-transformers/all-MiniLM-L6-v2',
'provider_resource_id': 'all-MiniLM-L6-v2', 'provider_id': 'sentence-transformers', 'type': 'model', 'owner': None, 'source':
'listed_from_provider', 'metadata': {'embedding_dimension': 384}, 'model_type': 'embedding'}
INFO 2025-09-10 14:51:47,327 console_span_processor:39 telemetry: 21:51:47.326 [END] InferenceRouter.openai_embeddings [StatusCode.OK] (16.35ms)
INFO 2025-09-10 14:51:47,327 console_span_processor:48 telemetry: output: {'object': 'list', 'data': [{'object': 'embedding', 'embedding':
[0.0018660365603864193, -0.008432421833276749, -0.009860510006546974, 0.07527908682823181, -0.008166038431227207, -0.08819602429866791,
-0.025107912719249725, -0.029266025871038437, 0.014401894062757492, 0.06447950005531311, 0.04112009331583977, -0.04028748720884323,
-0.02221696823835373, -0.009235711768269539, -0.04810388386249542, -0.02784842811524868, 0.016442419961094856, -0.07583750039339066,
-0.06627479195594788, 0.01860453188419342, 0.0008918081293813884, 0.011179491877555847, -0.048671603202819824, -0.021989954635500908,
0.04990514740347862, -0.003409573109820485, -0.06727275997400284, -0.054264623671770096, -0.022502778097987175, -0.03865018114447594,
-0.0471607930958271, 0.01671769842505455, 0.024404950439929962, 0.09877222776412964, -0.01660928875207901, 0.01298862136900425,
0.02916400320827961, -0.0722617655992508, 0.041335687041282654, -0.037857454270124435, -0.02524978667497635, -0.010434110648930073, -0....
INFO 2025-09-10 14:51:47,330 console_span_processor:39 telemetry: 21:51:47.329 [END] FaissVectorIOAdapter.query_chunks [StatusCode.OK] (20.00ms)
INFO 2025-09-10 14:51:47,331 console_span_processor:48 telemetry: output: {'chunks': [{'content': 'Acme ships globally in 3-5 business days.',
'metadata': {'document_id': 'file-489db9aae0424745960e3408ff0f477f', 'token_count': 12, 'metadata_token_count': 1}, 'embedding':
[-0.012346820905804634, -0.04591671749949455, 0.00545357633382082, 0.0767817348241806, -0.01030217856168747, -0.07128783315420151,
-0.047789815813302994, -0.0042580426670610905, -0.08333089202642441, 0.03493816778063774, 0.03678377717733383, -0.022125769406557083,
-0.001785362372174859, 0.03860057145357132, 0.017692940309643745, -0.011320478282868862, 0.020480643957853317, -0.14444826543331146,
-0.03509785607457161, -0.08347956091165543, 0.01723267324268818, -0.020868107676506042, -0.04816542565822601, -0.04063615947961807,
-0.02612607553601265, -0.06816241890192032, -0.021907860413193703, -0.05328420177102089, 0.0035953382030129433, -0.060775868594646454,
-0.07895789295434952, 0.08725343644618988, -0.004096562508493662, 0.07713106274604797, 0.04764929413795471, 0.03390089422464371, -0.03...
INFO 2025-09-10 14:51:47,334 console_span_processor:39 telemetry: 21:51:47.333 [END] VectorDBsRoutingTable.openai_search_vector_store
[StatusCode.OK] (23.86ms)
INFO 2025-09-10 14:51:47,335 console_span_processor:48 telemetry: output: {'object': 'vector_store.search_results.page', 'search_query': 'How
long does shipping take?', 'data': [{'file_id': '', 'filename': '', 'score': 1.0150761400159014, 'attributes': {'document_id':
'file-489db9aae0424745960e3408ff0f477f', 'token_count': 12.0, 'metadata_token_count': 1.0}, 'content': [{'type': 'text', 'text': 'Acme ships
globally in 3-5 business days.'}]}], 'has_more': False, 'next_page': None}
INFO 2025-09-10 14:51:47,338 console_span_processor:39 telemetry: 21:51:47.336 [END] VectorIORouter.openai_search_vector_store [StatusCode.OK]
(27.52ms)
INFO 2025-09-10 14:51:47,339 console_span_processor:48 telemetry: output: {'object': 'vector_store.search_results.page', 'search_query': 'How
long does shipping take?', 'data': [{'file_id': '', 'filename': '', 'score': 1.0150761400159014, 'attributes': {'document_id':
'file-489db9aae0424745960e3408ff0f477f', 'token_count': 12.0, 'metadata_token_count': 1.0}, 'content': [{'type': 'text', 'text': 'Acme ships
globally in 3-5 business days.'}]}], 'has_more': False, 'next_page': None}
INFO 2025-09-10 14:51:47,341 console_span_processor:39 telemetry: 21:51:47.340 [END] /v1/openai/v1/vector_stores/{vector_store_id}/search
[StatusCode.OK] (32.36ms)
INFO 2025-09-10 14:51:47,342 console_span_processor:48 telemetry: raw_path:
/v1/openai/v1/vector_stores/vs_dab05212-db05-402c-91ef-57e41797406b/search
INFO 2025-09-10 14:51:47,343 console_span_processor:62 telemetry: 21:51:47.155 [INFO] 127.0.0.1:56904 - "POST
/v1/openai/v1/vector_stores/vs_dab05212-db05-402c-91ef-57e41797406b/search HTTP/1.1" 200
INFO 2025-09-10 14:51:47,343 console_span_processor:28 telemetry: 21:51:47.343 [START] /v1/openai/v1/vector_stores/{vector_store_id}/search
INFO 2025-09-10 14:51:47,348 console_span_processor:39 telemetry: 21:51:47.345 [END] ModelsRoutingTable.get_model [StatusCode.OK] (0.20ms)
INFO 2025-09-10 14:51:47,348 console_span_processor:48 telemetry: output: {'identifier': 'sentence-transformers/all-MiniLM-L6-v2',
'provider_resource_id': 'all-MiniLM-L6-v2', 'provider_id': 'sentence-transformers', 'type': 'model', 'owner': None, 'source':
'listed_from_provider', 'metadata': {'embedding_dimension': 384}, 'model_type': 'embedding'}
INFO 2025-09-10 14:51:47,352 console_span_processor:39 telemetry: 21:51:47.350 [END] ModelsRoutingTable.get_provider_impl [StatusCode.OK] (0.46ms)
INFO 2025-09-10 14:51:47,353 console_span_processor:48 telemetry: output:
<llama_stack.providers.inline.inference.sentence_transformers.sentence_transformers.SentenceTransformersInferenceImpl object at 0x158e83350>
INFO 2025-09-10 14:51:47,355 console_span_processor:39 telemetry: 21:51:47.354 [END] ModelsRoutingTable.get_model [StatusCode.OK] (0.17ms)
INFO 2025-09-10 14:51:47,356 console_span_processor:48 telemetry: output: {'identifier': 'sentence-transformers/all-MiniLM-L6-v2',
'provider_resource_id': 'all-MiniLM-L6-v2', 'provider_id': 'sentence-transformers', 'type': 'model', 'owner': None, 'source':
'listed_from_provider', 'metadata': {'embedding_dimension': 384}, 'model_type': 'embedding'}
INFO 2025-09-10 14:51:47,358 console_span_processor:39 telemetry: 21:51:47.356 [END] InferenceRouter.openai_embeddings [StatusCode.OK] (11.96ms)
INFO 2025-09-10 14:51:47,358 console_span_processor:48 telemetry: output: {'object': 'list', 'data': [{'object': 'embedding', 'embedding':
[0.0018660365603864193, -0.008432421833276749, -0.009860510006546974, 0.07527908682823181, -0.008166038431227207, -0.08819602429866791,
-0.025107912719249725, -0.029266025871038437, 0.014401894062757492, 0.06447950005531311, 0.04112009331583977, -0.04028748720884323,
-0.02221696823835373, -0.009235711768269539, -0.04810388386249542, -0.02784842811524868, 0.016442419961094856, -0.07583750039339066,
-0.06627479195594788, 0.01860453188419342, 0.0008918081293813884, 0.011179491877555847, -0.048671603202819824, -0.021989954635500908,
0.04990514740347862, -0.003409573109820485, -0.06727275997400284, -0.054264623671770096, -0.022502778097987175, -0.03865018114447594,
-0.0471607930958271, 0.01671769842505455, 0.024404950439929962, 0.09877222776412964, -0.01660928875207901, 0.01298862136900425,
0.02916400320827961, -0.0722617655992508, 0.041335687041282654, -0.037857454270124435, -0.02524978667497635, -0.010434110648930073, -0....
INFO 2025-09-10 14:51:47,363 console_span_processor:39 telemetry: 21:51:47.360 [END] FaissVectorIOAdapter.query_chunks [StatusCode.OK] (15.81ms)
INFO 2025-09-10 14:51:47,363 console_span_processor:48 telemetry: output: {'chunks': [{'content': 'Acme ships globally in 3-5 business days.',
'metadata': {'document_id': 'file-489db9aae0424745960e3408ff0f477f', 'token_count': 12, 'metadata_token_count': 1}, 'embedding':
[-0.012346820905804634, -0.04591671749949455, 0.00545357633382082, 0.0767817348241806, -0.01030217856168747, -0.07128783315420151,
-0.047789815813302994, -0.0042580426670610905, -0.08333089202642441, 0.03493816778063774, 0.03678377717733383, -0.022125769406557083,
-0.001785362372174859, 0.03860057145357132, 0.017692940309643745, -0.011320478282868862, 0.020480643957853317, -0.14444826543331146,
-0.03509785607457161, -0.08347956091165543, 0.01723267324268818, -0.020868107676506042, -0.04816542565822601, -0.04063615947961807,
-0.02612607553601265, -0.06816241890192032, -0.021907860413193703, -0.05328420177102089, 0.0035953382030129433, -0.060775868594646454,
-0.07895789295434952, 0.08725343644618988, -0.004096562508493662, 0.07713106274604797, 0.04764929413795471, 0.03390089422464371, -0.03...
INFO 2025-09-10 14:51:47,367 console_span_processor:39 telemetry: 21:51:47.365 [END] VectorDBsRoutingTable.openai_search_vector_store
[StatusCode.OK] (20.64ms)
INFO 2025-09-10 14:51:47,368 console_span_processor:48 telemetry: output: {'object': 'vector_store.search_results.page', 'search_query': 'How
long does shipping take?', 'data': [{'file_id': '', 'filename': '', 'score': 1.0150761400159014, 'attributes': {'document_id':
'file-489db9aae0424745960e3408ff0f477f', 'token_count': 12.0, 'metadata_token_count': 1.0}, 'content': [{'type': 'text', 'text': 'Acme ships
globally in 3-5 business days.'}]}], 'has_more': False, 'next_page': None}
INFO 2025-09-10 14:51:47,371 console_span_processor:39 telemetry: 21:51:47.369 [END] VectorIORouter.openai_search_vector_store [StatusCode.OK]
(25.18ms)
INFO 2025-09-10 14:51:47,371 console_span_processor:48 telemetry: output: {'object': 'vector_store.search_results.page', 'search_query': 'How
long does shipping take?', 'data': [{'file_id': '', 'filename': '', 'score': 1.0150761400159014, 'attributes': {'document_id':
'file-489db9aae0424745960e3408ff0f477f', 'token_count': 12.0, 'metadata_token_count': 1.0}, 'content': [{'type': 'text', 'text': 'Acme ships
globally in 3-5 business days.'}]}], 'has_more': False, 'next_page': None}
INFO 2025-09-10 14:51:47,376 console_span_processor:39 telemetry: 21:51:47.373 [END] /v1/openai/v1/vector_stores/{vector_store_id}/search
[StatusCode.OK] (29.29ms)
INFO 2025-09-10 14:51:47,376 console_span_processor:48 telemetry: raw_path:
/v1/openai/v1/vector_stores/vs_dab05212-db05-402c-91ef-57e41797406b/search
INFO 2025-09-10 14:51:47,377 console_span_processor:62 telemetry: 21:51:47.185 [INFO] 127.0.0.1:56904 - "POST
/v1/openai/v1/vector_stores/vs_dab05212-db05-402c-91ef-57e41797406b/search HTTP/1.1" 200
INFO 2025-09-10 14:51:47,378 console_span_processor:28 telemetry: 21:51:47.378 [START] /v1/openai/v1/vector_stores/{vector_store_id}/search
INFO 2025-09-10 14:51:47,389 console_span_processor:39 telemetry: 21:51:47.379 [END] ModelsRoutingTable.get_model [StatusCode.OK] (0.14ms)
INFO 2025-09-10 14:51:47,390 console_span_processor:48 telemetry: output: {'identifier': 'sentence-transformers/all-MiniLM-L6-v2',
'provider_resource_id': 'all-MiniLM-L6-v2', 'provider_id': 'sentence-transformers', 'type': 'model', 'owner': None, 'source':
'listed_from_provider', 'metadata': {'embedding_dimension': 384}, 'model_type': 'embedding'}
INFO 2025-09-10 14:51:47,393 console_span_processor:39 telemetry: 21:51:47.391 [END] ModelsRoutingTable.get_provider_impl [StatusCode.OK] (0.16ms)
INFO 2025-09-10 14:51:47,394 console_span_processor:48 telemetry: output:
<llama_stack.providers.inline.inference.sentence_transformers.sentence_transformers.SentenceTransformersInferenceImpl object at 0x158e83350>
INFO 2025-09-10 14:51:47,403 console_span_processor:39 telemetry: 21:51:47.395 [END] ModelsRoutingTable.get_model [StatusCode.OK] (0.17ms)
INFO 2025-09-10 14:51:47,404 console_span_processor:48 telemetry: output: {'identifier': 'sentence-transformers/all-MiniLM-L6-v2',
'provider_resource_id': 'all-MiniLM-L6-v2', 'provider_id': 'sentence-transformers', 'type': 'model', 'owner': None, 'source':
'listed_from_provider', 'metadata': {'embedding_dimension': 384}, 'model_type': 'embedding'}
INFO 2025-09-10 14:51:47,407 console_span_processor:39 telemetry: 21:51:47.405 [END] InferenceRouter.openai_embeddings [StatusCode.OK] (26.41ms)
INFO 2025-09-10 14:51:47,408 console_span_processor:48 telemetry: output: {'object': 'list', 'data': [{'object': 'embedding', 'embedding':
[0.0018660365603864193, -0.008432421833276749, -0.009860510006546974, 0.07527908682823181, -0.008166038431227207, -0.08819602429866791,
-0.025107912719249725, -0.029266025871038437, 0.014401894062757492, 0.06447950005531311, 0.04112009331583977, -0.04028748720884323,
-0.02221696823835373, -0.009235711768269539, -0.04810388386249542, -0.02784842811524868, 0.016442419961094856, -0.07583750039339066,
-0.06627479195594788, 0.01860453188419342, 0.0008918081293813884, 0.011179491877555847, -0.048671603202819824, -0.021989954635500908,
0.04990514740347862, -0.003409573109820485, -0.06727275997400284, -0.054264623671770096, -0.022502778097987175, -0.03865018114447594,
-0.0471607930958271, 0.01671769842505455, 0.024404950439929962, 0.09877222776412964, -0.01660928875207901, 0.01298862136900425,
0.02916400320827961, -0.0722617655992508, 0.041335687041282654, -0.037857454270124435, -0.02524978667497635, -0.010434110648930073, -0....
INFO 2025-09-10 14:51:47,411 console_span_processor:39 telemetry: 21:51:47.409 [END] FaissVectorIOAdapter.query_chunks [StatusCode.OK] (30.37ms)
INFO 2025-09-10 14:51:47,412 console_span_processor:48 telemetry: output: {'chunks': [{'content': 'Acme ships globally in 3-5 business days.',
'metadata': {'document_id': 'file-489db9aae0424745960e3408ff0f477f', 'token_count': 12, 'metadata_token_count': 1}, 'embedding':
[-0.012346820905804634, -0.04591671749949455, 0.00545357633382082, 0.0767817348241806, -0.01030217856168747, -0.07128783315420151,
-0.047789815813302994, -0.0042580426670610905, -0.08333089202642441, 0.03493816778063774, 0.03678377717733383, -0.022125769406557083,
-0.001785362372174859, 0.03860057145357132, 0.017692940309643745, -0.011320478282868862, 0.020480643957853317, -0.14444826543331146,
-0.03509785607457161, -0.08347956091165543, 0.01723267324268818, -0.020868107676506042, -0.04816542565822601, -0.04063615947961807,
-0.02612607553601265, -0.06816241890192032, -0.021907860413193703, -0.05328420177102089, 0.0035953382030129433, -0.060775868594646454,
-0.07895789295434952, 0.08725343644618988, -0.004096562508493662, 0.07713106274604797, 0.04764929413795471, 0.03390089422464371, -0.03...
INFO 2025-09-10 14:51:47,421 console_span_processor:39 telemetry: 21:51:47.413 [END] VectorDBsRoutingTable.openai_search_vector_store
[StatusCode.OK] (34.69ms)
INFO 2025-09-10 14:51:47,422 console_span_processor:48 telemetry: output: {'object': 'vector_store.search_results.page', 'search_query': 'How
long does shipping take?', 'data': [{'file_id': '', 'filename': '', 'score': 1.0150761400159014, 'attributes': {'document_id':
'file-489db9aae0424745960e3408ff0f477f', 'token_count': 12.0, 'metadata_token_count': 1.0}, 'content': [{'type': 'text', 'text': 'Acme ships
globally in 3-5 business days.'}]}], 'has_more': False, 'next_page': None}
INFO 2025-09-10 14:51:47,427 console_span_processor:39 telemetry: 21:51:47.423 [END] VectorIORouter.openai_search_vector_store [StatusCode.OK]
(44.73ms)
INFO 2025-09-10 14:51:47,427 console_span_processor:48 telemetry: output: {'object': 'vector_store.search_results.page', 'search_query': 'How
long does shipping take?', 'data': [{'file_id': '', 'filename': '', 'score': 1.0150761400159014, 'attributes': {'document_id':
'file-489db9aae0424745960e3408ff0f477f', 'token_count': 12.0, 'metadata_token_count': 1.0}, 'content': [{'type': 'text', 'text': 'Acme ships
globally in 3-5 business days.'}]}], 'has_more': False, 'next_page': None}
INFO 2025-09-10 14:51:47,431 console_span_processor:39 telemetry: 21:51:47.429 [END] /v1/openai/v1/vector_stores/{vector_store_id}/search
[StatusCode.OK] (50.76ms)
INFO 2025-09-10 14:51:47,432 console_span_processor:48 telemetry: raw_path:
/v1/openai/v1/vector_stores/vs_dab05212-db05-402c-91ef-57e41797406b/search
INFO 2025-09-10 14:51:47,432 console_span_processor:62 telemetry: 21:51:47.205 [INFO] 127.0.0.1:56904 - "POST
/v1/openai/v1/vector_stores/vs_dab05212-db05-402c-91ef-57e41797406b/search HTTP/1.1" 200
INFO 2025-09-10 14:51:47,433 console_span_processor:28 telemetry: 21:51:47.433 [START] /v1/openai/v1/chat/completions
INFO 2025-09-10 14:51:47,443 console_span_processor:39 telemetry: 21:51:47.435 [END] ModelsRoutingTable.get_model [StatusCode.OK] (0.16ms)
INFO 2025-09-10 14:51:47,444 console_span_processor:48 telemetry: output: {'identifier': 'together/meta-llama/Llama-3.3-70B-Instruct-Turbo',
'provider_resource_id': 'meta-llama/Llama-3.3-70B-Instruct-Turbo', 'provider_id': 'together', 'type': 'model', 'owner': None, 'source':
'listed_from_provider', 'metadata': {}, 'model_type': 'llm'}
INFO 2025-09-10 14:51:47,454 console_span_processor:39 telemetry: 21:51:47.445 [END] ModelsRoutingTable.get_provider_impl [StatusCode.OK] (0.16ms)
INFO 2025-09-10 14:51:47,455 console_span_processor:48 telemetry: output:
<llama_stack.providers.remote.inference.together.together.TogetherInferenceAdapter object at 0x137069220>
INFO 2025-09-10 14:51:47,458 console_span_processor:39 telemetry: 21:51:47.456 [END] ModelsRoutingTable.get_model [StatusCode.OK] (0.19ms)
INFO 2025-09-10 14:51:47,459 console_span_processor:48 telemetry: output: {'identifier': 'together/meta-llama/Llama-3.3-70B-Instruct-Turbo',
'provider_resource_id': 'meta-llama/Llama-3.3-70B-Instruct-Turbo', 'provider_id': 'together', 'type': 'model', 'owner': None, 'source':
'listed_from_provider', 'metadata': {}, 'model_type': 'llm'}
INFO 2025-09-10 14:51:48,137 console_span_processor:39 telemetry: 21:51:48.128 [END] TogetherInferenceAdapter.openai_chat_completion
[StatusCode.OK] (672.06ms)
INFO 2025-09-10 14:51:48,138 console_span_processor:48 telemetry: output: {'id': 'oAitaWe-62bZhn-97d22611ebfb168e', 'choices':
[{'finish_reason': 'stop', 'index': 0, 'logprobs': None, 'message': {'content': 'Thought: To answer the question "How long does shipping
take?", I need to search the provided vector store for relevant information. The vector store ID is vs_dab05212-db05-402c-91ef-57e41797406b.
I will use the Llama Stack Vector Store RAG tool to find the most relevant documents.\n\nAction: Llama Stack Vector Store RAG tool\nAction
Input: {"query": "How long does shipping take?", "vector_store_id": "vs_dab05212-db05-402c-91ef-57e41797406b", "top_k": 1}', 'refusal': None,
'role': 'assistant', 'annotations': None, 'audio': None, 'function_call': None, 'tool_calls': []}, 'seed': 12110905932316877000}], 'created':
1757541107, 'model': 'meta-llama/Llama-3.3-70B-Instruct-Turbo', 'object': 'chat.completion', 'service_tier': None, 'system_fingerprint':
None, 'usage': {'completion_tokens': 131, 'prompt_tokens': 998, 'total_tokens': 1129, 'completion_tokens_d...
INFO 2025-09-10 14:51:48,140 uvicorn.access:473 uncategorized: ::1:56900 - "POST /v1/openai/v1/chat/completions HTTP/1.1" 200
INFO 2025-09-10 14:51:48,152 console_span_processor:39 telemetry: 21:51:48.141 [END] InferenceRouter.openai_chat_completion [StatusCode.OK]
(706.73ms)
INFO 2025-09-10 14:51:48,153 console_span_processor:48 telemetry: output: {'id': 'oAitaWe-62bZhn-97d22611ebfb168e', 'choices':
[{'finish_reason': 'stop', 'index': 0, 'logprobs': None, 'message': {'content': 'Thought: To answer the question "How long does shipping
take?", I need to search the provided vector store for relevant information. The vector store ID is vs_dab05212-db05-402c-91ef-57e41797406b.
I will use the Llama Stack Vector Store RAG tool to find the most relevant documents.\n\nAction: Llama Stack Vector Store RAG tool\nAction
Input: {"query": "How long does shipping take?", "vector_store_id": "vs_dab05212-db05-402c-91ef-57e41797406b", "top_k": 1}', 'refusal': None,
'role': 'assistant', 'annotations': None, 'audio': None, 'function_call': None, 'tool_calls': None}, 'seed': 12110905932316877000}],
'created': 1757541107, 'model': 'meta-llama/Llama-3.3-70B-Instruct-Turbo', 'object': 'chat.completion', 'service_tier': None,
'system_fingerprint': None, 'usage': {'completion_tokens': 131, 'prompt_tokens': 998, 'total_tokens': 1129, 'completion_tokens...
INFO 2025-09-10 14:51:48,154 console_span_processor:62 telemetry: 21:51:48.140 [INFO] metric.prompt_tokens
INFO 2025-09-10 14:51:48,155 console_span_processor:67 telemetry: value: 998
INFO 2025-09-10 14:51:48,155 console_span_processor:67 telemetry: unit: tokens
INFO 2025-09-10 14:51:48,156 console_span_processor:67 telemetry: model_id: together/meta-llama/Llama-3.3-70B-Instruct-Turbo
INFO 2025-09-10 14:51:48,156 console_span_processor:67 telemetry: provider_id: together
INFO 2025-09-10 14:51:48,157 console_span_processor:62 telemetry: 21:51:48.140 [INFO] metric.completion_tokens
INFO 2025-09-10 14:51:48,157 console_span_processor:67 telemetry: value: 131
INFO 2025-09-10 14:51:48,158 console_span_processor:67 telemetry: unit: tokens
INFO 2025-09-10 14:51:48,158 console_span_processor:67 telemetry: model_id: together/meta-llama/Llama-3.3-70B-Instruct-Turbo
INFO 2025-09-10 14:51:48,159 console_span_processor:67 telemetry: provider_id: together
INFO 2025-09-10 14:51:48,159 console_span_processor:62 telemetry: 21:51:48.140 [INFO] metric.total_tokens
INFO 2025-09-10 14:51:48,160 console_span_processor:67 telemetry: value: 1129
INFO 2025-09-10 14:51:48,160 console_span_processor:67 telemetry: unit: tokens
INFO 2025-09-10 14:51:48,160 console_span_processor:67 telemetry: model_id: together/meta-llama/Llama-3.3-70B-Instruct-Turbo
INFO 2025-09-10 14:51:48,161 console_span_processor:67 telemetry: provider_id: together
INFO 2025-09-10 14:51:48,170 uvicorn.access:473 uncategorized: 127.0.0.1:56904 - "POST
/v1/openai/v1/vector_stores/vs_dab05212-db05-402c-91ef-57e41797406b/search HTTP/1.1" 200
INFO 2025-09-10 14:51:48,182 console_span_processor:39 telemetry: 21:51:48.162 [END] /v1/openai/v1/chat/completions [StatusCode.OK] (728.49ms)
INFO 2025-09-10 14:51:48,183 console_span_processor:48 telemetry: raw_path: /v1/openai/v1/chat/completions
INFO 2025-09-10 14:51:48,183 console_span_processor:62 telemetry: 21:51:48.141 [INFO] ::1:56900 - "POST /v1/openai/v1/chat/completions HTTP/1.1"
200
INFO 2025-09-10 14:51:48,184 console_span_processor:28 telemetry: 21:51:48.184 [START] /v1/openai/v1/vector_stores/{vector_store_id}/search
INFO 2025-09-10 14:51:48,189 console_span_processor:39 telemetry: 21:51:48.187 [END] ModelsRoutingTable.get_model [StatusCode.OK] (0.65ms)
INFO 2025-09-10 14:51:48,190 console_span_processor:48 telemetry: output: {'identifier': 'sentence-transformers/all-MiniLM-L6-v2',
'provider_resource_id': 'all-MiniLM-L6-v2', 'provider_id': 'sentence-transformers', 'type': 'model', 'owner': None, 'source':
'listed_from_provider', 'metadata': {'embedding_dimension': 384}, 'model_type': 'embedding'}
INFO 2025-09-10 14:51:48,198 uvicorn.access:473 uncategorized: 127.0.0.1:56904 - "POST
/v1/openai/v1/vector_stores/vs_dab05212-db05-402c-91ef-57e41797406b/search HTTP/1.1" 200
INFO 2025-09-10 14:51:48,199 console_span_processor:39 telemetry: 21:51:48.191 [END] ModelsRoutingTable.get_provider_impl [StatusCode.OK] (0.29ms)
INFO 2025-09-10 14:51:48,201 console_span_processor:48 telemetry: output:
<llama_stack.providers.inline.inference.sentence_transformers.sentence_transformers.SentenceTransformersInferenceImpl object at 0x158e83350>
INFO 2025-09-10 14:51:48,211 console_span_processor:39 telemetry: 21:51:48.204 [END] ModelsRoutingTable.get_model [StatusCode.OK] (1.00ms)
INFO 2025-09-10 14:51:48,213 console_span_processor:48 telemetry: output: {'identifier': 'sentence-transformers/all-MiniLM-L6-v2',
'provider_resource_id': 'all-MiniLM-L6-v2', 'provider_id': 'sentence-transformers', 'type': 'model', 'owner': None, 'source':
'listed_from_provider', 'metadata': {'embedding_dimension': 384}, 'model_type': 'embedding'}
INFO 2025-09-10 14:51:48,217 console_span_processor:39 telemetry: 21:51:48.215 [END] InferenceRouter.openai_embeddings [StatusCode.OK] (28.70ms)
INFO 2025-09-10 14:51:48,218 console_span_processor:48 telemetry: output: {'object': 'list', 'data': [{'object': 'embedding', 'embedding':
[0.0018660365603864193, -0.008432421833276749, -0.009860510006546974, 0.07527908682823181, -0.008166038431227207, -0.08819602429866791,
-0.025107912719249725, -0.029266025871038437, 0.014401894062757492, 0.06447950005531311, 0.04112009331583977, -0.04028748720884323,
-0.02221696823835373, -0.009235711768269539, -0.04810388386249542, -0.02784842811524868, 0.016442419961094856, -0.07583750039339066,
-0.06627479195594788, 0.01860453188419342, 0.0008918081293813884, 0.011179491877555847, -0.048671603202819824, -0.021989954635500908,
0.04990514740347862, -0.003409573109820485, -0.06727275997400284, -0.054264623671770096, -0.022502778097987175, -0.03865018114447594,
-0.0471607930958271, 0.01671769842505455, 0.024404950439929962, 0.09877222776412964, -0.01660928875207901, 0.01298862136900425,
0.02916400320827961, -0.0722617655992508, 0.041335687041282654, -0.037857454270124435, -0.02524978667497635, -0.010434110648930073, -0....
INFO 2025-09-10 14:51:48,226 console_span_processor:39 telemetry: 21:51:48.221 [END] FaissVectorIOAdapter.query_chunks [StatusCode.OK] (35.89ms)
INFO 2025-09-10 14:51:48,227 console_span_processor:48 telemetry: output: {'chunks': [{'content': 'Acme ships globally in 3-5 business days.',
'metadata': {'document_id': 'file-489db9aae0424745960e3408ff0f477f', 'token_count': 12, 'metadata_token_count': 1}, 'embedding':
[-0.012346820905804634, -0.04591671749949455, 0.00545357633382082, 0.0767817348241806, -0.01030217856168747, -0.07128783315420151,
-0.047789815813302994, -0.0042580426670610905, -0.08333089202642441, 0.03493816778063774, 0.03678377717733383, -0.022125769406557083,
-0.001785362372174859, 0.03860057145357132, 0.017692940309643745, -0.011320478282868862, 0.020480643957853317, -0.14444826543331146,
-0.03509785607457161, -0.08347956091165543, 0.01723267324268818, -0.020868107676506042, -0.04816542565822601, -0.04063615947961807,
-0.02612607553601265, -0.06816241890192032, -0.021907860413193703, -0.05328420177102089, 0.0035953382030129433, -0.060775868594646454,
-0.07895789295434952, 0.08725343644618988, -0.004096562508493662, 0.07713106274604797, 0.04764929413795471, 0.03390089422464371, -0.03...
INFO 2025-09-10 14:51:48,235 uvicorn.access:473 uncategorized: 127.0.0.1:56904 - "POST
/v1/openai/v1/vector_stores/vs_dab05212-db05-402c-91ef-57e41797406b/search HTTP/1.1" 200
INFO 2025-09-10 14:51:48,239 console_span_processor:39 telemetry: 21:51:48.229 [END] VectorDBsRoutingTable.openai_search_vector_store
[StatusCode.OK] (44.29ms)
INFO 2025-09-10 14:51:48,241 console_span_processor:48 telemetry: output: {'object': 'vector_store.search_results.page', 'search_query': 'How
long does shipping take?', 'data': [{'file_id': '', 'filename': '', 'score': 1.0150761400159014, 'attributes': {'document_id':
'file-489db9aae0424745960e3408ff0f477f', 'token_count': 12.0, 'metadata_token_count': 1.0}, 'content': [{'type': 'text', 'text': 'Acme ships
globally in 3-5 business days.'}]}], 'has_more': False, 'next_page': None}
INFO 2025-09-10 14:51:48,252 uvicorn.access:473 uncategorized: 127.0.0.1:56904 - "POST
/v1/openai/v1/vector_stores/vs_dab05212-db05-402c-91ef-57e41797406b/search HTTP/1.1" 200
INFO 2025-09-10 14:51:48,252 console_span_processor:39 telemetry: 21:51:48.242 [END] VectorIORouter.openai_search_vector_store [StatusCode.OK]
(57.30ms)
INFO 2025-09-10 14:51:48,253 console_span_processor:48 telemetry: output: {'object': 'vector_store.search_results.page', 'search_query': 'How
long does shipping take?', 'data': [{'file_id': '', 'filename': '', 'score': 1.0150761400159014, 'attributes': {'document_id':
'file-489db9aae0424745960e3408ff0f477f', 'token_count': 12.0, 'metadata_token_count': 1.0}, 'content': [{'type': 'text', 'text': 'Acme ships
globally in 3-5 business days.'}]}], 'has_more': False, 'next_page': None}
INFO 2025-09-10 14:51:48,265 console_span_processor:39 telemetry: 21:51:48.255 [END] /v1/openai/v1/vector_stores/{vector_store_id}/search
[StatusCode.OK] (70.68ms)
INFO 2025-09-10 14:51:48,266 console_span_processor:48 telemetry: raw_path:
/v1/openai/v1/vector_stores/vs_dab05212-db05-402c-91ef-57e41797406b/search
INFO 2025-09-10 14:51:48,267 console_span_processor:62 telemetry: 21:51:48.171 [INFO] 127.0.0.1:56904 - "POST
/v1/openai/v1/vector_stores/vs_dab05212-db05-402c-91ef-57e41797406b/search HTTP/1.1" 200
INFO 2025-09-10 14:51:48,268 console_span_processor:28 telemetry: 21:51:48.268 [START] /v1/openai/v1/vector_stores/{vector_store_id}/search
INFO 2025-09-10 14:51:48,271 console_span_processor:39 telemetry: 21:51:48.270 [END] ModelsRoutingTable.get_model [StatusCode.OK] (0.24ms)
INFO 2025-09-10 14:51:48,272 console_span_processor:48 telemetry: output: {'identifier': 'sentence-transformers/all-MiniLM-L6-v2',
'provider_resource_id': 'all-MiniLM-L6-v2', 'provider_id': 'sentence-transformers', 'type': 'model', 'owner': None, 'source':
'listed_from_provider', 'metadata': {'embedding_dimension': 384}, 'model_type': 'embedding'}
INFO 2025-09-10 14:51:48,275 console_span_processor:39 telemetry: 21:51:48.273 [END] ModelsRoutingTable.get_provider_impl [StatusCode.OK] (0.24ms)
INFO 2025-09-10 14:51:48,276 console_span_processor:48 telemetry: output:
<llama_stack.providers.inline.inference.sentence_transformers.sentence_transformers.SentenceTransformersInferenceImpl object at 0x158e83350>
INFO 2025-09-10 14:51:48,280 uvicorn.access:473 uncategorized: 127.0.0.1:56904 - "POST
/v1/openai/v1/vector_stores/vs_dab05212-db05-402c-91ef-57e41797406b/search HTTP/1.1" 200
INFO 2025-09-10 14:51:48,283 console_span_processor:39 telemetry: 21:51:48.277 [END] ModelsRoutingTable.get_model [StatusCode.OK] (0.16ms)
INFO 2025-09-10 14:51:48,284 console_span_processor:48 telemetry: output: {'identifier': 'sentence-transformers/all-MiniLM-L6-v2',
'provider_resource_id': 'all-MiniLM-L6-v2', 'provider_id': 'sentence-transformers', 'type': 'model', 'owner': None, 'source':
'listed_from_provider', 'metadata': {'embedding_dimension': 384}, 'model_type': 'embedding'}
INFO 2025-09-10 14:51:48,294 console_span_processor:39 telemetry: 21:51:48.287 [END] InferenceRouter.openai_embeddings [StatusCode.OK] (18.00ms)
INFO 2025-09-10 14:51:48,294 console_span_processor:48 telemetry: output: {'object': 'list', 'data': [{'object': 'embedding', 'embedding':
[0.0018660365603864193, -0.008432421833276749, -0.009860510006546974, 0.07527908682823181, -0.008166038431227207, -0.08819602429866791,
-0.025107912719249725, -0.029266025871038437, 0.014401894062757492, 0.06447950005531311, 0.04112009331583977, -0.04028748720884323,
-0.02221696823835373, -0.009235711768269539, -0.04810388386249542, -0.02784842811524868, 0.016442419961094856, -0.07583750039339066,
-0.06627479195594788, 0.01860453188419342, 0.0008918081293813884, 0.011179491877555847, -0.048671603202819824, -0.021989954635500908,
0.04990514740347862, -0.003409573109820485, -0.06727275997400284, -0.054264623671770096, -0.022502778097987175, -0.03865018114447594,
-0.0471607930958271, 0.01671769842505455, 0.024404950439929962, 0.09877222776412964, -0.01660928875207901, 0.01298862136900425,
0.02916400320827961, -0.0722617655992508, 0.041335687041282654, -0.037857454270124435, -0.02524978667497635, -0.010434110648930073, -0....
INFO 2025-09-10 14:51:48,298 uvicorn.access:473 uncategorized: 127.0.0.1:56904 - "POST
/v1/openai/v1/vector_stores/vs_dab05212-db05-402c-91ef-57e41797406b/search HTTP/1.1" 200
INFO 2025-09-10 14:51:48,307 console_span_processor:39 telemetry: 21:51:48.296 [END] FaissVectorIOAdapter.query_chunks [StatusCode.OK] (27.38ms)
INFO 2025-09-10 14:51:48,308 console_span_processor:48 telemetry: output: {'chunks': [{'content': 'Acme ships globally in 3-5 business days.',
'metadata': {'document_id': 'file-489db9aae0424745960e3408ff0f477f', 'token_count': 12, 'metadata_token_count': 1}, 'embedding':
[-0.012346820905804634, -0.04591671749949455, 0.00545357633382082, 0.0767817348241806, -0.01030217856168747, -0.07128783315420151,
-0.047789815813302994, -0.0042580426670610905, -0.08333089202642441, 0.03493816778063774, 0.03678377717733383, -0.022125769406557083,
-0.001785362372174859, 0.03860057145357132, 0.017692940309643745, -0.011320478282868862, 0.020480643957853317, -0.14444826543331146,
-0.03509785607457161, -0.08347956091165543, 0.01723267324268818, -0.020868107676506042, -0.04816542565822601, -0.04063615947961807,
-0.02612607553601265, -0.06816241890192032, -0.021907860413193703, -0.05328420177102089, 0.0035953382030129433, -0.060775868594646454,
-0.07895789295434952, 0.08725343644618988, -0.004096562508493662, 0.07713106274604797, 0.04764929413795471, 0.03390089422464371, -0.03...
INFO 2025-09-10 14:51:48,330 console_span_processor:39 telemetry: 21:51:48.309 [END] VectorDBsRoutingTable.openai_search_vector_store
[StatusCode.OK] (40.46ms)
INFO 2025-09-10 14:51:48,331 console_span_processor:48 telemetry: output: {'object': 'vector_store.search_results.page', 'search_query': 'How
long does shipping take?', 'data': [{'file_id': '', 'filename': '', 'score': 1.0150761400159014, 'attributes': {'document_id':
'file-489db9aae0424745960e3408ff0f477f', 'token_count': 12.0, 'metadata_token_count': 1.0}, 'content': [{'type': 'text', 'text': 'Acme ships
globally in 3-5 business days.'}]}], 'has_more': False, 'next_page': None}
INFO 2025-09-10 14:51:48,334 console_span_processor:39 telemetry: 21:51:48.332 [END] VectorIORouter.openai_search_vector_store [StatusCode.OK]
(63.81ms)
INFO 2025-09-10 14:51:48,334 console_span_processor:48 telemetry: output: {'object': 'vector_store.search_results.page', 'search_query': 'How
long does shipping take?', 'data': [{'file_id': '', 'filename': '', 'score': 1.0150761400159014, 'attributes': {'document_id':
'file-489db9aae0424745960e3408ff0f477f', 'token_count': 12.0, 'metadata_token_count': 1.0}, 'content': [{'type': 'text', 'text': 'Acme ships
globally in 3-5 business days.'}]}], 'has_more': False, 'next_page': None}
INFO 2025-09-10 14:51:48,359 console_span_processor:39 telemetry: 21:51:48.336 [END] /v1/openai/v1/vector_stores/{vector_store_id}/search
[StatusCode.OK] (67.91ms)
INFO 2025-09-10 14:51:48,360 console_span_processor:48 telemetry: raw_path:
/v1/openai/v1/vector_stores/vs_dab05212-db05-402c-91ef-57e41797406b/search
INFO 2025-09-10 14:51:48,360 console_span_processor:62 telemetry: 21:51:48.199 [INFO] 127.0.0.1:56904 - "POST
/v1/openai/v1/vector_stores/vs_dab05212-db05-402c-91ef-57e41797406b/search HTTP/1.1" 200
INFO 2025-09-10 14:51:48,361 console_span_processor:28 telemetry: 21:51:48.361 [START] /v1/openai/v1/vector_stores/{vector_store_id}/search
INFO 2025-09-10 14:51:48,364 console_span_processor:39 telemetry: 21:51:48.363 [END] ModelsRoutingTable.get_model [StatusCode.OK] (0.18ms)
INFO 2025-09-10 14:51:48,365 console_span_processor:48 telemetry: output: {'identifier': 'sentence-transformers/all-MiniLM-L6-v2',
'provider_resource_id': 'all-MiniLM-L6-v2', 'provider_id': 'sentence-transformers', 'type': 'model', 'owner': None, 'source':
'listed_from_provider', 'metadata': {'embedding_dimension': 384}, 'model_type': 'embedding'}
INFO 2025-09-10 14:51:48,369 console_span_processor:39 telemetry: 21:51:48.367 [END] ModelsRoutingTable.get_provider_impl [StatusCode.OK] (0.16ms)
INFO 2025-09-10 14:51:48,369 console_span_processor:48 telemetry: output:
<llama_stack.providers.inline.inference.sentence_transformers.sentence_transformers.SentenceTransformersInferenceImpl object at 0x158e83350>
INFO 2025-09-10 14:51:48,373 console_span_processor:39 telemetry: 21:51:48.371 [END] ModelsRoutingTable.get_model [StatusCode.OK] (0.32ms)
INFO 2025-09-10 14:51:48,374 console_span_processor:48 telemetry: output: {'identifier': 'sentence-transformers/all-MiniLM-L6-v2',
'provider_resource_id': 'all-MiniLM-L6-v2', 'provider_id': 'sentence-transformers', 'type': 'model', 'owner': None, 'source':
'listed_from_provider', 'metadata': {'embedding_dimension': 384}, 'model_type': 'embedding'}
INFO 2025-09-10 14:51:48,377 console_span_processor:39 telemetry: 21:51:48.375 [END] InferenceRouter.openai_embeddings [StatusCode.OK] (12.40ms)
INFO 2025-09-10 14:51:48,378 console_span_processor:48 telemetry: output: {'object': 'list', 'data': [{'object': 'embedding', 'embedding':
[0.0018660365603864193, -0.008432421833276749, -0.009860510006546974, 0.07527908682823181, -0.008166038431227207, -0.08819602429866791,
-0.025107912719249725, -0.029266025871038437, 0.014401894062757492, 0.06447950005531311, 0.04112009331583977, -0.04028748720884323,
-0.02221696823835373, -0.009235711768269539, -0.04810388386249542, -0.02784842811524868, 0.016442419961094856, -0.07583750039339066,
-0.06627479195594788, 0.01860453188419342, 0.0008918081293813884, 0.011179491877555847, -0.048671603202819824, -0.021989954635500908,
0.04990514740347862, -0.003409573109820485, -0.06727275997400284, -0.054264623671770096, -0.022502778097987175, -0.03865018114447594,
-0.0471607930958271, 0.01671769842505455, 0.024404950439929962, 0.09877222776412964, -0.01660928875207901, 0.01298862136900425,
0.02916400320827961, -0.0722617655992508, 0.041335687041282654, -0.037857454270124435, -0.02524978667497635, -0.010434110648930073, -0....
INFO 2025-09-10 14:51:48,383 console_span_processor:39 telemetry: 21:51:48.379 [END] FaissVectorIOAdapter.query_chunks [StatusCode.OK] (16.82ms)
INFO 2025-09-10 14:51:48,383 console_span_processor:48 telemetry: output: {'chunks': [{'content': 'Acme ships globally in 3-5 business days.',
'metadata': {'document_id': 'file-489db9aae0424745960e3408ff0f477f', 'token_count': 12, 'metadata_token_count': 1}, 'embedding':
[-0.012346820905804634, -0.04591671749949455, 0.00545357633382082, 0.0767817348241806, -0.01030217856168747, -0.07128783315420151,
-0.047789815813302994, -0.0042580426670610905, -0.08333089202642441, 0.03493816778063774, 0.03678377717733383, -0.022125769406557083,
-0.001785362372174859, 0.03860057145357132, 0.017692940309643745, -0.011320478282868862, 0.020480643957853317, -0.14444826543331146,
-0.03509785607457161, -0.08347956091165543, 0.01723267324268818, -0.020868107676506042, -0.04816542565822601, -0.04063615947961807,
-0.02612607553601265, -0.06816241890192032, -0.021907860413193703, -0.05328420177102089, 0.0035953382030129433, -0.060775868594646454,
-0.07895789295434952, 0.08725343644618988, -0.004096562508493662, 0.07713106274604797, 0.04764929413795471, 0.03390089422464371, -0.03...
INFO 2025-09-10 14:51:48,395 console_span_processor:39 telemetry: 21:51:48.385 [END] VectorDBsRoutingTable.openai_search_vector_store
[StatusCode.OK] (22.60ms)
INFO 2025-09-10 14:51:48,396 console_span_processor:48 telemetry: output: {'object': 'vector_store.search_results.page', 'search_query': 'How
long does shipping take?', 'data': [{'file_id': '', 'filename': '', 'score': 1.0150761400159014, 'attributes': {'document_id':
'file-489db9aae0424745960e3408ff0f477f', 'token_count': 12.0, 'metadata_token_count': 1.0}, 'content': [{'type': 'text', 'text': 'Acme ships
globally in 3-5 business days.'}]}], 'has_more': False, 'next_page': None}
INFO 2025-09-10 14:51:48,409 console_span_processor:39 telemetry: 21:51:48.397 [END] VectorIORouter.openai_search_vector_store [StatusCode.OK]
(35.03ms)
INFO 2025-09-10 14:51:48,414 console_span_processor:48 telemetry: output: {'object': 'vector_store.search_results.page', 'search_query': 'How
long does shipping take?', 'data': [{'file_id': '', 'filename': '', 'score': 1.0150761400159014, 'attributes': {'document_id':
'file-489db9aae0424745960e3408ff0f477f', 'token_count': 12.0, 'metadata_token_count': 1.0}, 'content': [{'type': 'text', 'text': 'Acme ships
globally in 3-5 business days.'}]}], 'has_more': False, 'next_page': None}
INFO 2025-09-10 14:51:48,429 console_span_processor:39 telemetry: 21:51:48.418 [END] /v1/openai/v1/vector_stores/{vector_store_id}/search
[StatusCode.OK] (57.22ms)
INFO 2025-09-10 14:51:48,432 console_span_processor:48 telemetry: raw_path:
/v1/openai/v1/vector_stores/vs_dab05212-db05-402c-91ef-57e41797406b/search
INFO 2025-09-10 14:51:48,433 console_span_processor:62 telemetry: 21:51:48.235 [INFO] 127.0.0.1:56904 - "POST
/v1/openai/v1/vector_stores/vs_dab05212-db05-402c-91ef-57e41797406b/search HTTP/1.1" 200
INFO 2025-09-10 14:51:48,435 console_span_processor:28 telemetry: 21:51:48.435 [START] /v1/openai/v1/vector_stores/{vector_store_id}/search
INFO 2025-09-10 14:51:48,449 console_span_processor:39 telemetry: 21:51:48.438 [END] ModelsRoutingTable.get_model [StatusCode.OK] (0.17ms)
INFO 2025-09-10 14:51:48,449 console_span_processor:48 telemetry: output: {'identifier': 'sentence-transformers/all-MiniLM-L6-v2',
'provider_resource_id': 'all-MiniLM-L6-v2', 'provider_id': 'sentence-transformers', 'type': 'model', 'owner': None, 'source':
'listed_from_provider', 'metadata': {'embedding_dimension': 384}, 'model_type': 'embedding'}
INFO 2025-09-10 14:51:48,464 console_span_processor:39 telemetry: 21:51:48.451 [END] ModelsRoutingTable.get_provider_impl [StatusCode.OK] (0.28ms)
INFO 2025-09-10 14:51:48,465 console_span_processor:48 telemetry: output:
<llama_stack.providers.inline.inference.sentence_transformers.sentence_transformers.SentenceTransformersInferenceImpl object at 0x158e83350>
INFO 2025-09-10 14:51:48,472 console_span_processor:39 telemetry: 21:51:48.467 [END] ModelsRoutingTable.get_model [StatusCode.OK] (0.19ms)
INFO 2025-09-10 14:51:48,473 console_span_processor:48 telemetry: output: {'identifier': 'sentence-transformers/all-MiniLM-L6-v2',
'provider_resource_id': 'all-MiniLM-L6-v2', 'provider_id': 'sentence-transformers', 'type': 'model', 'owner': None, 'source':
'listed_from_provider', 'metadata': {'embedding_dimension': 384}, 'model_type': 'embedding'}
INFO 2025-09-10 14:51:48,477 console_span_processor:39 telemetry: 21:51:48.475 [END] InferenceRouter.openai_embeddings [StatusCode.OK] (37.21ms)
INFO 2025-09-10 14:51:48,478 console_span_processor:48 telemetry: output: {'object': 'list', 'data': [{'object': 'embedding', 'embedding':
[0.0018660365603864193, -0.008432421833276749, -0.009860510006546974, 0.07527908682823181, -0.008166038431227207, -0.08819602429866791,
-0.025107912719249725, -0.029266025871038437, 0.014401894062757492, 0.06447950005531311, 0.04112009331583977, -0.04028748720884323,
-0.02221696823835373, -0.009235711768269539, -0.04810388386249542, -0.02784842811524868, 0.016442419961094856, -0.07583750039339066,
-0.06627479195594788, 0.01860453188419342, 0.0008918081293813884, 0.011179491877555847, -0.048671603202819824, -0.021989954635500908,
0.04990514740347862, -0.003409573109820485, -0.06727275997400284, -0.054264623671770096, -0.022502778097987175, -0.03865018114447594,
-0.0471607930958271, 0.01671769842505455, 0.024404950439929962, 0.09877222776412964, -0.01660928875207901, 0.01298862136900425,
0.02916400320827961, -0.0722617655992508, 0.041335687041282654, -0.037857454270124435, -0.02524978667497635, -0.010434110648930073, -0....
INFO 2025-09-10 14:51:48,482 console_span_processor:39 telemetry: 21:51:48.480 [END] FaissVectorIOAdapter.query_chunks [StatusCode.OK] (42.48ms)
INFO 2025-09-10 14:51:48,483 console_span_processor:48 telemetry: output: {'chunks': [{'content': 'Acme ships globally in 3-5 business days.',
'metadata': {'document_id': 'file-489db9aae0424745960e3408ff0f477f', 'token_count': 12, 'metadata_token_count': 1}, 'embedding':
[-0.012346820905804634, -0.04591671749949455, 0.00545357633382082, 0.0767817348241806, -0.01030217856168747, -0.07128783315420151,
-0.047789815813302994, -0.0042580426670610905, -0.08333089202642441, 0.03493816778063774, 0.03678377717733383, -0.022125769406557083,
-0.001785362372174859, 0.03860057145357132, 0.017692940309643745, -0.011320478282868862, 0.020480643957853317, -0.14444826543331146,
-0.03509785607457161, -0.08347956091165543, 0.01723267324268818, -0.020868107676506042, -0.04816542565822601, -0.04063615947961807,
-0.02612607553601265, -0.06816241890192032, -0.021907860413193703, -0.05328420177102089, 0.0035953382030129433, -0.060775868594646454,
-0.07895789295434952, 0.08725343644618988, -0.004096562508493662, 0.07713106274604797, 0.04764929413795471, 0.03390089422464371, -0.03...
INFO 2025-09-10 14:51:48,486 console_span_processor:39 telemetry: 21:51:48.485 [END] VectorDBsRoutingTable.openai_search_vector_store
[StatusCode.OK] (47.47ms)
INFO 2025-09-10 14:51:48,487 console_span_processor:48 telemetry: output: {'object': 'vector_store.search_results.page', 'search_query': 'How
long does shipping take?', 'data': [{'file_id': '', 'filename': '', 'score': 1.0150761400159014, 'attributes': {'document_id':
'file-489db9aae0424745960e3408ff0f477f', 'token_count': 12.0, 'metadata_token_count': 1.0}, 'content': [{'type': 'text', 'text': 'Acme ships
globally in 3-5 business days.'}]}], 'has_more': False, 'next_page': None}
INFO 2025-09-10 14:51:48,492 console_span_processor:39 telemetry: 21:51:48.488 [END] VectorIORouter.openai_search_vector_store [StatusCode.OK]
(51.57ms)
INFO 2025-09-10 14:51:48,492 console_span_processor:48 telemetry: output: {'object': 'vector_store.search_results.page', 'search_query': 'How
long does shipping take?', 'data': [{'file_id': '', 'filename': '', 'score': 1.0150761400159014, 'attributes': {'document_id':
'file-489db9aae0424745960e3408ff0f477f', 'token_count': 12.0, 'metadata_token_count': 1.0}, 'content': [{'type': 'text', 'text': 'Acme ships
globally in 3-5 business days.'}]}], 'has_more': False, 'next_page': None}
INFO 2025-09-10 14:51:48,501 console_span_processor:39 telemetry: 21:51:48.494 [END] /v1/openai/v1/vector_stores/{vector_store_id}/search
[StatusCode.OK] (58.89ms)
INFO 2025-09-10 14:51:48,502 console_span_processor:48 telemetry: raw_path:
/v1/openai/v1/vector_stores/vs_dab05212-db05-402c-91ef-57e41797406b/search
INFO 2025-09-10 14:51:48,503 console_span_processor:62 telemetry: 21:51:48.252 [INFO] 127.0.0.1:56904 - "POST
/v1/openai/v1/vector_stores/vs_dab05212-db05-402c-91ef-57e41797406b/search HTTP/1.1" 200
INFO 2025-09-10 14:51:48,504 console_span_processor:28 telemetry: 21:51:48.504 [START] /v1/openai/v1/vector_stores/{vector_store_id}/search
INFO 2025-09-10 14:51:48,511 console_span_processor:39 telemetry: 21:51:48.505 [END] ModelsRoutingTable.get_model [StatusCode.OK] (0.15ms)
INFO 2025-09-10 14:51:48,511 console_span_processor:48 telemetry: output: {'identifier': 'sentence-transformers/all-MiniLM-L6-v2',
'provider_resource_id': 'all-MiniLM-L6-v2', 'provider_id': 'sentence-transformers', 'type': 'model', 'owner': None, 'source':
'listed_from_provider', 'metadata': {'embedding_dimension': 384}, 'model_type': 'embedding'}
INFO 2025-09-10 14:51:48,518 console_span_processor:39 telemetry: 21:51:48.512 [END] ModelsRoutingTable.get_provider_impl [StatusCode.OK] (0.17ms)
INFO 2025-09-10 14:51:48,519 console_span_processor:48 telemetry: output:
<llama_stack.providers.inline.inference.sentence_transformers.sentence_transformers.SentenceTransformersInferenceImpl object at 0x158e83350>
INFO 2025-09-10 14:51:48,546 console_span_processor:39 telemetry: 21:51:48.521 [END] ModelsRoutingTable.get_model [StatusCode.OK] (0.38ms)
INFO 2025-09-10 14:51:48,547 console_span_processor:48 telemetry: output: {'identifier': 'sentence-transformers/all-MiniLM-L6-v2',
'provider_resource_id': 'all-MiniLM-L6-v2', 'provider_id': 'sentence-transformers', 'type': 'model', 'owner': None, 'source':
'listed_from_provider', 'metadata': {'embedding_dimension': 384}, 'model_type': 'embedding'}
INFO 2025-09-10 14:51:48,557 console_span_processor:39 telemetry: 21:51:48.550 [END] InferenceRouter.openai_embeddings [StatusCode.OK] (44.66ms)
INFO 2025-09-10 14:51:48,558 console_span_processor:48 telemetry: output: {'object': 'list', 'data': [{'object': 'embedding', 'embedding':
[0.0018660365603864193, -0.008432421833276749, -0.009860510006546974, 0.07527908682823181, -0.008166038431227207, -0.08819602429866791,
-0.025107912719249725, -0.029266025871038437, 0.014401894062757492, 0.06447950005531311, 0.04112009331583977, -0.04028748720884323,
-0.02221696823835373, -0.009235711768269539, -0.04810388386249542, -0.02784842811524868, 0.016442419961094856, -0.07583750039339066,
-0.06627479195594788, 0.01860453188419342, 0.0008918081293813884, 0.011179491877555847, -0.048671603202819824, -0.021989954635500908,
0.04990514740347862, -0.003409573109820485, -0.06727275997400284, -0.054264623671770096, -0.022502778097987175, -0.03865018114447594,
-0.0471607930958271, 0.01671769842505455, 0.024404950439929962, 0.09877222776412964, -0.01660928875207901, 0.01298862136900425,
0.02916400320827961, -0.0722617655992508, 0.041335687041282654, -0.037857454270124435, -0.02524978667497635, -0.010434110648930073, -0....
INFO 2025-09-10 14:51:48,563 console_span_processor:39 telemetry: 21:51:48.559 [END] FaissVectorIOAdapter.query_chunks [StatusCode.OK] (54.51ms)
INFO 2025-09-10 14:51:48,564 console_span_processor:48 telemetry: output: {'chunks': [{'content': 'Acme ships globally in 3-5 business days.',
'metadata': {'document_id': 'file-489db9aae0424745960e3408ff0f477f', 'token_count': 12, 'metadata_token_count': 1}, 'embedding':
[-0.012346820905804634, -0.04591671749949455, 0.00545357633382082, 0.0767817348241806, -0.01030217856168747, -0.07128783315420151,
-0.047789815813302994, -0.0042580426670610905, -0.08333089202642441, 0.03493816778063774, 0.03678377717733383, -0.022125769406557083,
-0.001785362372174859, 0.03860057145357132, 0.017692940309643745, -0.011320478282868862, 0.020480643957853317, -0.14444826543331146,
-0.03509785607457161, -0.08347956091165543, 0.01723267324268818, -0.020868107676506042, -0.04816542565822601, -0.04063615947961807,
-0.02612607553601265, -0.06816241890192032, -0.021907860413193703, -0.05328420177102089, 0.0035953382030129433, -0.060775868594646454,
-0.07895789295434952, 0.08725343644618988, -0.004096562508493662, 0.07713106274604797, 0.04764929413795471, 0.03390089422464371, -0.03...
INFO 2025-09-10 14:51:48,570 console_span_processor:39 telemetry: 21:51:48.565 [END] VectorDBsRoutingTable.openai_search_vector_store
[StatusCode.OK] (60.37ms)
INFO 2025-09-10 14:51:48,571 console_span_processor:48 telemetry: output: {'object': 'vector_store.search_results.page', 'search_query': 'How
long does shipping take?', 'data': [{'file_id': '', 'filename': '', 'score': 1.0150761400159014, 'attributes': {'document_id':
'file-489db9aae0424745960e3408ff0f477f', 'token_count': 12.0, 'metadata_token_count': 1.0}, 'content': [{'type': 'text', 'text': 'Acme ships
globally in 3-5 business days.'}]}], 'has_more': False, 'next_page': None}
INFO 2025-09-10 14:51:48,573 console_span_processor:39 telemetry: 21:51:48.572 [END] VectorIORouter.openai_search_vector_store [StatusCode.OK]
(67.76ms)
INFO 2025-09-10 14:51:48,574 console_span_processor:48 telemetry: output: {'object': 'vector_store.search_results.page', 'search_query': 'How
long does shipping take?', 'data': [{'file_id': '', 'filename': '', 'score': 1.0150761400159014, 'attributes': {'document_id':
'file-489db9aae0424745960e3408ff0f477f', 'token_count': 12.0, 'metadata_token_count': 1.0}, 'content': [{'type': 'text', 'text': 'Acme ships
globally in 3-5 business days.'}]}], 'has_more': False, 'next_page': None}
INFO 2025-09-10 14:51:48,577 console_span_processor:39 telemetry: 21:51:48.575 [END] /v1/openai/v1/vector_stores/{vector_store_id}/search
[StatusCode.OK] (71.71ms)
INFO 2025-09-10 14:51:48,577 console_span_processor:48 telemetry: raw_path:
/v1/openai/v1/vector_stores/vs_dab05212-db05-402c-91ef-57e41797406b/search
INFO 2025-09-10 14:51:48,578 console_span_processor:62 telemetry: 21:51:48.280 [INFO] 127.0.0.1:56904 - "POST
/v1/openai/v1/vector_stores/vs_dab05212-db05-402c-91ef-57e41797406b/search HTTP/1.1" 200
INFO 2025-09-10 14:51:48,579 console_span_processor:28 telemetry: 21:51:48.579 [START] /v1/openai/v1/vector_stores/{vector_store_id}/search
INFO 2025-09-10 14:51:48,587 console_span_processor:39 telemetry: 21:51:48.582 [END] ModelsRoutingTable.get_model [StatusCode.OK] (0.48ms)
INFO 2025-09-10 14:51:48,588 console_span_processor:48 telemetry: output: {'identifier': 'sentence-transformers/all-MiniLM-L6-v2',
'provider_resource_id': 'all-MiniLM-L6-v2', 'provider_id': 'sentence-transformers', 'type': 'model', 'owner': None, 'source':
'listed_from_provider', 'metadata': {'embedding_dimension': 384}, 'model_type': 'embedding'}
INFO 2025-09-10 14:51:48,592 console_span_processor:39 telemetry: 21:51:48.589 [END] ModelsRoutingTable.get_provider_impl [StatusCode.OK] (0.19ms)
INFO 2025-09-10 14:51:48,592 console_span_processor:48 telemetry: output:
<llama_stack.providers.inline.inference.sentence_transformers.sentence_transformers.SentenceTransformersInferenceImpl object at 0x158e83350>
INFO 2025-09-10 14:51:48,601 console_span_processor:39 telemetry: 21:51:48.594 [END] ModelsRoutingTable.get_model [StatusCode.OK] (0.16ms)
INFO 2025-09-10 14:51:48,602 console_span_processor:48 telemetry: output: {'identifier': 'sentence-transformers/all-MiniLM-L6-v2',
'provider_resource_id': 'all-MiniLM-L6-v2', 'provider_id': 'sentence-transformers', 'type': 'model', 'owner': None, 'source':
'listed_from_provider', 'metadata': {'embedding_dimension': 384}, 'model_type': 'embedding'}
INFO 2025-09-10 14:51:48,605 console_span_processor:39 telemetry: 21:51:48.603 [END] InferenceRouter.openai_embeddings [StatusCode.OK] (21.97ms)
INFO 2025-09-10 14:51:48,606 console_span_processor:48 telemetry: output: {'object': 'list', 'data': [{'object': 'embedding', 'embedding':
[0.0018660365603864193, -0.008432421833276749, -0.009860510006546974, 0.07527908682823181, -0.008166038431227207, -0.08819602429866791,
-0.025107912719249725, -0.029266025871038437, 0.014401894062757492, 0.06447950005531311, 0.04112009331583977, -0.04028748720884323,
-0.02221696823835373, -0.009235711768269539, -0.04810388386249542, -0.02784842811524868, 0.016442419961094856, -0.07583750039339066,
-0.06627479195594788, 0.01860453188419342, 0.0008918081293813884, 0.011179491877555847, -0.048671603202819824, -0.021989954635500908,
0.04990514740347862, -0.003409573109820485, -0.06727275997400284, -0.054264623671770096, -0.022502778097987175, -0.03865018114447594,
-0.0471607930958271, 0.01671769842505455, 0.024404950439929962, 0.09877222776412964, -0.01660928875207901, 0.01298862136900425,
0.02916400320827961, -0.0722617655992508, 0.041335687041282654, -0.037857454270124435, -0.02524978667497635, -0.010434110648930073, -0....
INFO 2025-09-10 14:51:48,609 console_span_processor:39 telemetry: 21:51:48.607 [END] FaissVectorIOAdapter.query_chunks [StatusCode.OK] (26.56ms)
INFO 2025-09-10 14:51:48,609 console_span_processor:48 telemetry: output: {'chunks': [{'content': 'Acme ships globally in 3-5 business days.',
'metadata': {'document_id': 'file-489db9aae0424745960e3408ff0f477f', 'token_count': 12, 'metadata_token_count': 1}, 'embedding':
[-0.012346820905804634, -0.04591671749949455, 0.00545357633382082, 0.0767817348241806, -0.01030217856168747, -0.07128783315420151,
-0.047789815813302994, -0.0042580426670610905, -0.08333089202642441, 0.03493816778063774, 0.03678377717733383, -0.022125769406557083,
-0.001785362372174859, 0.03860057145357132, 0.017692940309643745, -0.011320478282868862, 0.020480643957853317, -0.14444826543331146,
-0.03509785607457161, -0.08347956091165543, 0.01723267324268818, -0.020868107676506042, -0.04816542565822601, -0.04063615947961807,
-0.02612607553601265, -0.06816241890192032, -0.021907860413193703, -0.05328420177102089, 0.0035953382030129433, -0.060775868594646454,
-0.07895789295434952, 0.08725343644618988, -0.004096562508493662, 0.07713106274604797, 0.04764929413795471, 0.03390089422464371, -0.03...
INFO 2025-09-10 14:51:48,614 console_span_processor:39 telemetry: 21:51:48.612 [END] VectorDBsRoutingTable.openai_search_vector_store
[StatusCode.OK] (31.13ms)
INFO 2025-09-10 14:51:48,615 console_span_processor:48 telemetry: output: {'object': 'vector_store.search_results.page', 'search_query': 'How
long does shipping take?', 'data': [{'file_id': '', 'filename': '', 'score': 1.0150761400159014, 'attributes': {'document_id':
'file-489db9aae0424745960e3408ff0f477f', 'token_count': 12.0, 'metadata_token_count': 1.0}, 'content': [{'type': 'text', 'text': 'Acme ships
globally in 3-5 business days.'}]}], 'has_more': False, 'next_page': None}
INFO 2025-09-10 14:51:48,626 console_span_processor:39 telemetry: 21:51:48.616 [END] VectorIORouter.openai_search_vector_store [StatusCode.OK]
(35.85ms)
INFO 2025-09-10 14:51:48,627 console_span_processor:48 telemetry: output: {'object': 'vector_store.search_results.page', 'search_query': 'How
long does shipping take?', 'data': [{'file_id': '', 'filename': '', 'score': 1.0150761400159014, 'attributes': {'document_id':
'file-489db9aae0424745960e3408ff0f477f', 'token_count': 12.0, 'metadata_token_count': 1.0}, 'content': [{'type': 'text', 'text': 'Acme ships
globally in 3-5 business days.'}]}], 'has_more': False, 'next_page': None}
INFO 2025-09-10 14:51:48,635 console_span_processor:39 telemetry: 21:51:48.632 [END] /v1/openai/v1/vector_stores/{vector_store_id}/search
[StatusCode.OK] (52.29ms)
INFO 2025-09-10 14:51:48,636 console_span_processor:48 telemetry: raw_path:
/v1/openai/v1/vector_stores/vs_dab05212-db05-402c-91ef-57e41797406b/search
INFO 2025-09-10 14:51:48,636 console_span_processor:62 telemetry: 21:51:48.299 [INFO] 127.0.0.1:56904 - "POST
/v1/openai/v1/vector_stores/vs_dab05212-db05-402c-91ef-57e41797406b/search HTTP/1.1" 200
INFO 2025-09-10 14:51:48,637 console_span_processor:28 telemetry: 21:51:48.637 [START] /v1/openai/v1/chat/completions
INFO 2025-09-10 14:51:48,640 console_span_processor:39 telemetry: 21:51:48.638 [END] ModelsRoutingTable.get_model [StatusCode.OK] (0.15ms)
INFO 2025-09-10 14:51:48,641 console_span_processor:48 telemetry: output: {'identifier': 'together/meta-llama/Llama-3.3-70B-Instruct-Turbo',
'provider_resource_id': 'meta-llama/Llama-3.3-70B-Instruct-Turbo', 'provider_id': 'together', 'type': 'model', 'owner': None, 'source':
'listed_from_provider', 'metadata': {}, 'model_type': 'llm'}
INFO 2025-09-10 14:51:48,643 console_span_processor:39 telemetry: 21:51:48.642 [END] ModelsRoutingTable.get_provider_impl [StatusCode.OK] (0.16ms)
INFO 2025-09-10 14:51:48,643 console_span_processor:48 telemetry: output:
<llama_stack.providers.remote.inference.together.together.TogetherInferenceAdapter object at 0x137069220>
INFO 2025-09-10 14:51:48,653 console_span_processor:39 telemetry: 21:51:48.645 [END] ModelsRoutingTable.get_model [StatusCode.OK] (0.14ms)
INFO 2025-09-10 14:51:48,653 console_span_processor:48 telemetry: output: {'identifier': 'together/meta-llama/Llama-3.3-70B-Instruct-Turbo',
'provider_resource_id': 'meta-llama/Llama-3.3-70B-Instruct-Turbo', 'provider_id': 'together', 'type': 'model', 'owner': None, 'source':
'listed_from_provider', 'metadata': {}, 'model_type': 'llm'}
INFO 2025-09-10 14:51:53,149 console_span_processor:39 telemetry: 21:51:53.146 [END] TogetherInferenceAdapter.openai_chat_completion
[StatusCode.OK] (4501.83ms)
INFO 2025-09-10 14:51:53,150 console_span_processor:48 telemetry: output: {'id': 'oAitaoX-4YNCb4-97d22618bd651584', 'choices':
[{'finish_reason': 'stop', 'index': 0, 'logprobs': None, 'message': {'content': 'Thought: I should try to use the Llama Stack Vector Store
RAG tool again with a different input to see if I can get a relevant result.\n\nAction: Llama Stack Vector Store RAG tool\nAction Input:
{"query": "shipping time", "vector_store_id": "vs_dab05212-db05-402c-91ef-57e41797406b", "top_k": 1}', 'refusal': None, 'role': 'assistant',
'annotations': None, 'audio': None, 'function_call': None, 'tool_calls': []}, 'seed': 7090030016801882000}], 'created': 1757541108, 'model':
'meta-llama/Llama-3.3-70B-Instruct-Turbo', 'object': 'chat.completion', 'service_tier': None, 'system_fingerprint': None, 'usage':
{'completion_tokens': 89, 'prompt_tokens': 1494, 'total_tokens': 1583, 'completion_tokens_details': None, 'prompt_tokens_details': None,
'cached_tokens': 0}, 'prompt': []}
INFO 2025-09-10 14:51:53,153 uvicorn.access:473 uncategorized: ::1:56900 - "POST /v1/openai/v1/chat/completions HTTP/1.1" 200
INFO 2025-09-10 14:51:53,157 console_span_processor:39 telemetry: 21:51:53.153 [END] InferenceRouter.openai_chat_completion [StatusCode.OK]
(4515.32ms)
INFO 2025-09-10 14:51:53,158 console_span_processor:48 telemetry: output: {'id': 'oAitaoX-4YNCb4-97d22618bd651584', 'choices':
[{'finish_reason': 'stop', 'index': 0, 'logprobs': None, 'message': {'content': 'Thought: I should try to use the Llama Stack Vector Store
RAG tool again with a different input to see if I can get a relevant result.\n\nAction: Llama Stack Vector Store RAG tool\nAction Input:
{"query": "shipping time", "vector_store_id": "vs_dab05212-db05-402c-91ef-57e41797406b", "top_k": 1}', 'refusal': None, 'role': 'assistant',
'annotations': None, 'audio': None, 'function_call': None, 'tool_calls': None}, 'seed': 7090030016801882000}], 'created': 1757541108,
'model': 'meta-llama/Llama-3.3-70B-Instruct-Turbo', 'object': 'chat.completion', 'service_tier': None, 'system_fingerprint': None, 'usage':
{'completion_tokens': 89, 'prompt_tokens': 1494, 'total_tokens': 1583, 'completion_tokens_details': None, 'prompt_tokens_details': None,
'cached_tokens': 0}, 'prompt': [], 'metrics': [{'trace_id': 'dd10581530aada6b43c22d2c221fafe0', 'span_id': 'ba2f798e...
INFO 2025-09-10 14:51:53,159 console_span_processor:62 telemetry: 21:51:53.152 [INFO] metric.prompt_tokens
INFO 2025-09-10 14:51:53,160 console_span_processor:67 telemetry: value: 1494
INFO 2025-09-10 14:51:53,160 console_span_processor:67 telemetry: unit: tokens
INFO 2025-09-10 14:51:53,160 console_span_processor:67 telemetry: model_id: together/meta-llama/Llama-3.3-70B-Instruct-Turbo
INFO 2025-09-10 14:51:53,161 console_span_processor:67 telemetry: provider_id: together
INFO 2025-09-10 14:51:53,161 console_span_processor:62 telemetry: 21:51:53.152 [INFO] metric.completion_tokens
INFO 2025-09-10 14:51:53,162 console_span_processor:67 telemetry: value: 89
INFO 2025-09-10 14:51:53,162 console_span_processor:67 telemetry: unit: tokens
INFO 2025-09-10 14:51:53,163 console_span_processor:67 telemetry: model_id: together/meta-llama/Llama-3.3-70B-Instruct-Turbo
INFO 2025-09-10 14:51:53,165 console_span_processor:67 telemetry: provider_id: together
INFO 2025-09-10 14:51:53,166 console_span_processor:62 telemetry: 21:51:53.152 [INFO] metric.total_tokens
INFO 2025-09-10 14:51:53,166 console_span_processor:67 telemetry: value: 1583
INFO 2025-09-10 14:51:53,167 console_span_processor:67 telemetry: unit: tokens
INFO 2025-09-10 14:51:53,167 console_span_processor:67 telemetry: model_id: together/meta-llama/Llama-3.3-70B-Instruct-Turbo
INFO 2025-09-10 14:51:53,167 console_span_processor:67 telemetry: provider_id: together
INFO 2025-09-10 14:51:53,183 console_span_processor:39 telemetry: 21:51:53.169 [END] /v1/openai/v1/chat/completions [StatusCode.OK] (4532.11ms)
INFO 2025-09-10 14:51:53,184 console_span_processor:48 telemetry: raw_path: /v1/openai/v1/chat/completions
INFO 2025-09-10 14:51:53,184 console_span_processor:62 telemetry: 21:51:53.153 [INFO] ::1:56900 - "POST /v1/openai/v1/chat/completions HTTP/1.1"
200
INFO 2025-09-10 14:51:53,185 console_span_processor:28 telemetry: 21:51:53.185 [START] /v1/openai/v1/vector_stores/{vector_store_id}/search
INFO 2025-09-10 14:51:53,212 console_span_processor:39 telemetry: 21:51:53.187 [END] ModelsRoutingTable.get_model [StatusCode.OK] (0.15ms)
INFO 2025-09-10 14:51:53,213 console_span_processor:48 telemetry: output: {'identifier': 'sentence-transformers/all-MiniLM-L6-v2',
'provider_resource_id': 'all-MiniLM-L6-v2', 'provider_id': 'sentence-transformers', 'type': 'model', 'owner': None, 'source':
'listed_from_provider', 'metadata': {'embedding_dimension': 384}, 'model_type': 'embedding'}
INFO 2025-09-10 14:51:53,232 console_span_processor:39 telemetry: 21:51:53.214 [END] ModelsRoutingTable.get_provider_impl [StatusCode.OK] (0.34ms)
INFO 2025-09-10 14:51:53,233 console_span_processor:48 telemetry: output:
<llama_stack.providers.inline.inference.sentence_transformers.sentence_transformers.SentenceTransformersInferenceImpl object at 0x158e83350>
INFO 2025-09-10 14:51:53,245 console_span_processor:39 telemetry: 21:51:53.234 [END] ModelsRoutingTable.get_model [StatusCode.OK] (0.18ms)
INFO 2025-09-10 14:51:53,246 console_span_processor:48 telemetry: output: {'identifier': 'sentence-transformers/all-MiniLM-L6-v2',
'provider_resource_id': 'all-MiniLM-L6-v2', 'provider_id': 'sentence-transformers', 'type': 'model', 'owner': None, 'source':
'listed_from_provider', 'metadata': {'embedding_dimension': 384}, 'model_type': 'embedding'}
INFO 2025-09-10 14:51:54,285 uvicorn.access:473 uncategorized: 127.0.0.1:56904 - "POST
/v1/openai/v1/vector_stores/vs_dab05212-db05-402c-91ef-57e41797406b/search HTTP/1.1" 200
INFO 2025-09-10 14:51:54,305 console_span_processor:39 telemetry: 21:51:54.289 [END] InferenceRouter.openai_embeddings [StatusCode.OK] (1102.92ms)
INFO 2025-09-10 14:51:54,306 console_span_processor:48 telemetry: output: {'object': 'list', 'data': [{'object': 'embedding', 'embedding':
[-0.03642994910478592, -0.005766282323747873, -0.028219470754265785, 0.05074828490614891, 0.023913491517305374, -0.056256189942359924,
0.0007000428740866482, 0.02684980072081089, 0.005779022816568613, 0.0757804811000824, 0.02611902356147766, -0.04347166419029236,
-0.07426290959119797, 0.0033695625606924295, -0.03395790979266167, -0.018579166382551193, 0.031040646135807037, -0.06419522315263748,
-0.11664945632219315, 0.011454297229647636, 0.00203332188539207, 0.00506530050188303, -0.05711820721626282, -0.006884930655360222,
0.0057834964245557785, 0.005828470923006535, -0.05446002259850502, -0.032767001539468765, -0.023773472756147385, -0.046458274126052856,
-0.0579390786588192, 0.052776239812374115, -0.017773080617189407, 0.07396063208580017, -0.007082517724484205, -0.006252078805118799,
0.06502724438905716, -0.04769469425082207, 0.08519715070724487, -0.04995475336909294, -0.02040106989443302, -0.024357719346880913, -0....
INFO 2025-09-10 14:51:54,318 console_span_processor:39 telemetry: 21:51:54.308 [END] FaissVectorIOAdapter.query_chunks [StatusCode.OK] (1121.71ms)
INFO 2025-09-10 14:51:54,319 console_span_processor:48 telemetry: output: {'chunks': [{'content': 'Acme ships globally in 3-5 business days.',
'metadata': {'document_id': 'file-489db9aae0424745960e3408ff0f477f', 'token_count': 12, 'metadata_token_count': 1}, 'embedding':
[-0.012346820905804634, -0.04591671749949455, 0.00545357633382082, 0.0767817348241806, -0.01030217856168747, -0.07128783315420151,
-0.047789815813302994, -0.0042580426670610905, -0.08333089202642441, 0.03493816778063774, 0.03678377717733383, -0.022125769406557083,
-0.001785362372174859, 0.03860057145357132, 0.017692940309643745, -0.011320478282868862, 0.020480643957853317, -0.14444826543331146,
-0.03509785607457161, -0.08347956091165543, 0.01723267324268818, -0.020868107676506042, -0.04816542565822601, -0.04063615947961807,
-0.02612607553601265, -0.06816241890192032, -0.021907860413193703, -0.05328420177102089, 0.0035953382030129433, -0.060775868594646454,
-0.07895789295434952, 0.08725343644618988, -0.004096562508493662, 0.07713106274604797, 0.04764929413795471, 0.03390089422464371, -0.03...
INFO 2025-09-10 14:51:54,322 uvicorn.access:473 uncategorized: 127.0.0.1:56904 - "POST
/v1/openai/v1/vector_stores/vs_dab05212-db05-402c-91ef-57e41797406b/search HTTP/1.1" 200
INFO 2025-09-10 14:51:54,342 console_span_processor:39 telemetry: 21:51:54.324 [END] VectorDBsRoutingTable.openai_search_vector_store
[StatusCode.OK] (1137.83ms)
INFO 2025-09-10 14:51:54,342 console_span_processor:48 telemetry: output: {'object': 'vector_store.search_results.page', 'search_query':
'shipping time', 'data': [{'file_id': '', 'filename': '', 'score': 0.9984249880472625, 'attributes': {'document_id':
'file-489db9aae0424745960e3408ff0f477f', 'token_count': 12.0, 'metadata_token_count': 1.0}, 'content': [{'type': 'text', 'text': 'Acme ships
globally in 3-5 business days.'}]}], 'has_more': False, 'next_page': None}
INFO 2025-09-10 14:51:54,351 console_span_processor:39 telemetry: 21:51:54.344 [END] VectorIORouter.openai_search_vector_store [StatusCode.OK]
(1157.96ms)
INFO 2025-09-10 14:51:54,353 uvicorn.access:473 uncategorized: 127.0.0.1:56904 - "POST
/v1/openai/v1/vector_stores/vs_dab05212-db05-402c-91ef-57e41797406b/search HTTP/1.1" 200
INFO 2025-09-10 14:51:54,353 console_span_processor:48 telemetry: output: {'object': 'vector_store.search_results.page', 'search_query':
'shipping time', 'data': [{'file_id': '', 'filename': '', 'score': 0.9984249880472625, 'attributes': {'document_id':
'file-489db9aae0424745960e3408ff0f477f', 'token_count': 12.0, 'metadata_token_count': 1.0}, 'content': [{'type': 'text', 'text': 'Acme ships
globally in 3-5 business days.'}]}], 'has_more': False, 'next_page': None}
INFO 2025-09-10 14:51:54,360 console_span_processor:39 telemetry: 21:51:54.355 [END] /v1/openai/v1/vector_stores/{vector_store_id}/search
[StatusCode.OK] (1170.42ms)
INFO 2025-09-10 14:51:54,360 console_span_processor:48 telemetry: raw_path:
/v1/openai/v1/vector_stores/vs_dab05212-db05-402c-91ef-57e41797406b/search
INFO 2025-09-10 14:51:54,361 console_span_processor:62 telemetry: 21:51:54.293 [INFO] 127.0.0.1:56904 - "POST
/v1/openai/v1/vector_stores/vs_dab05212-db05-402c-91ef-57e41797406b/search HTTP/1.1" 200
INFO 2025-09-10 14:51:54,362 console_span_processor:28 telemetry: 21:51:54.362 [START] /v1/openai/v1/vector_stores/{vector_store_id}/search
INFO 2025-09-10 14:51:54,366 console_span_processor:39 telemetry: 21:51:54.364 [END] ModelsRoutingTable.get_model [StatusCode.OK] (0.19ms)
INFO 2025-09-10 14:51:54,367 console_span_processor:48 telemetry: output: {'identifier': 'sentence-transformers/all-MiniLM-L6-v2',
'provider_resource_id': 'all-MiniLM-L6-v2', 'provider_id': 'sentence-transformers', 'type': 'model', 'owner': None, 'source':
'listed_from_provider', 'metadata': {'embedding_dimension': 384}, 'model_type': 'embedding'}
INFO 2025-09-10 14:51:54,373 uvicorn.access:473 uncategorized: 127.0.0.1:56904 - "POST
/v1/openai/v1/vector_stores/vs_dab05212-db05-402c-91ef-57e41797406b/search HTTP/1.1" 200
INFO 2025-09-10 14:51:54,380 console_span_processor:39 telemetry: 21:51:54.369 [END] ModelsRoutingTable.get_provider_impl [StatusCode.OK] (0.28ms)
INFO 2025-09-10 14:51:54,381 console_span_processor:48 telemetry: output:
<llama_stack.providers.inline.inference.sentence_transformers.sentence_transformers.SentenceTransformersInferenceImpl object at 0x158e83350>
INFO 2025-09-10 14:51:54,389 console_span_processor:39 telemetry: 21:51:54.386 [END] ModelsRoutingTable.get_model [StatusCode.OK] (0.21ms)
INFO 2025-09-10 14:51:54,390 console_span_processor:48 telemetry: output: {'identifier': 'sentence-transformers/all-MiniLM-L6-v2',
'provider_resource_id': 'all-MiniLM-L6-v2', 'provider_id': 'sentence-transformers', 'type': 'model', 'owner': None, 'source':
'listed_from_provider', 'metadata': {'embedding_dimension': 384}, 'model_type': 'embedding'}
INFO 2025-09-10 14:51:54,393 console_span_processor:39 telemetry: 21:51:54.391 [END] InferenceRouter.openai_embeddings [StatusCode.OK] (26.85ms)
INFO 2025-09-10 14:51:54,394 console_span_processor:48 telemetry: output: {'object': 'list', 'data': [{'object': 'embedding', 'embedding':
[-0.03642994910478592, -0.005766282323747873, -0.028219470754265785, 0.05074828490614891, 0.023913491517305374, -0.056256189942359924,
0.0007000428740866482, 0.02684980072081089, 0.005779022816568613, 0.0757804811000824, 0.02611902356147766, -0.04347166419029236,
-0.07426290959119797, 0.0033695625606924295, -0.03395790979266167, -0.018579166382551193, 0.031040646135807037, -0.06419522315263748,
-0.11664945632219315, 0.011454297229647636, 0.00203332188539207, 0.00506530050188303, -0.05711820721626282, -0.006884930655360222,
0.0057834964245557785, 0.005828470923006535, -0.05446002259850502, -0.032767001539468765, -0.023773472756147385, -0.046458274126052856,
-0.0579390786588192, 0.052776239812374115, -0.017773080617189407, 0.07396063208580017, -0.007082517724484205, -0.006252078805118799,
0.06502724438905716, -0.04769469425082207, 0.08519715070724487, -0.04995475336909294, -0.02040106989443302, -0.024357719346880913, -0....
INFO 2025-09-10 14:51:54,425 uvicorn.access:473 uncategorized: 127.0.0.1:56904 - "POST
/v1/openai/v1/vector_stores/vs_dab05212-db05-402c-91ef-57e41797406b/search HTTP/1.1" 200
INFO 2025-09-10 14:51:54,438 console_span_processor:39 telemetry: 21:51:54.411 [END] FaissVectorIOAdapter.query_chunks [StatusCode.OK] (47.55ms)
INFO 2025-09-10 14:51:54,440 console_span_processor:48 telemetry: output: {'chunks': [{'content': 'Acme ships globally in 3-5 business days.',
'metadata': {'document_id': 'file-489db9aae0424745960e3408ff0f477f', 'token_count': 12, 'metadata_token_count': 1}, 'embedding':
[-0.012346820905804634, -0.04591671749949455, 0.00545357633382082, 0.0767817348241806, -0.01030217856168747, -0.07128783315420151,
-0.047789815813302994, -0.0042580426670610905, -0.08333089202642441, 0.03493816778063774, 0.03678377717733383, -0.022125769406557083,
-0.001785362372174859, 0.03860057145357132, 0.017692940309643745, -0.011320478282868862, 0.020480643957853317, -0.14444826543331146,
-0.03509785607457161, -0.08347956091165543, 0.01723267324268818, -0.020868107676506042, -0.04816542565822601, -0.04063615947961807,
-0.02612607553601265, -0.06816241890192032, -0.021907860413193703, -0.05328420177102089, 0.0035953382030129433, -0.060775868594646454,
-0.07895789295434952, 0.08725343644618988, -0.004096562508493662, 0.07713106274604797, 0.04764929413795471, 0.03390089422464371, -0.03...
INFO 2025-09-10 14:51:54,445 console_span_processor:39 telemetry: 21:51:54.442 [END] VectorDBsRoutingTable.openai_search_vector_store
[StatusCode.OK] (78.94ms)
INFO 2025-09-10 14:51:54,446 console_span_processor:48 telemetry: output: {'object': 'vector_store.search_results.page', 'search_query':
'shipping time', 'data': [{'file_id': '', 'filename': '', 'score': 0.9984249880472625, 'attributes': {'document_id':
'file-489db9aae0424745960e3408ff0f477f', 'token_count': 12.0, 'metadata_token_count': 1.0}, 'content': [{'type': 'text', 'text': 'Acme ships
globally in 3-5 business days.'}]}], 'has_more': False, 'next_page': None}
INFO 2025-09-10 14:51:54,457 uvicorn.access:473 uncategorized: 127.0.0.1:56904 - "POST
/v1/openai/v1/vector_stores/vs_dab05212-db05-402c-91ef-57e41797406b/search HTTP/1.1" 200
INFO 2025-09-10 14:51:54,457 console_span_processor:39 telemetry: 21:51:54.452 [END] VectorIORouter.openai_search_vector_store [StatusCode.OK]
(89.01ms)
INFO 2025-09-10 14:51:54,459 console_span_processor:48 telemetry: output: {'object': 'vector_store.search_results.page', 'search_query':
'shipping time', 'data': [{'file_id': '', 'filename': '', 'score': 0.9984249880472625, 'attributes': {'document_id':
'file-489db9aae0424745960e3408ff0f477f', 'token_count': 12.0, 'metadata_token_count': 1.0}, 'content': [{'type': 'text', 'text': 'Acme ships
globally in 3-5 business days.'}]}], 'has_more': False, 'next_page': None}
INFO 2025-09-10 14:51:54,468 console_span_processor:39 telemetry: 21:51:54.463 [END] /v1/openai/v1/vector_stores/{vector_store_id}/search
[StatusCode.OK] (100.62ms)
INFO 2025-09-10 14:51:54,469 console_span_processor:48 telemetry: raw_path:
/v1/openai/v1/vector_stores/vs_dab05212-db05-402c-91ef-57e41797406b/search
INFO 2025-09-10 14:51:54,469 console_span_processor:62 telemetry: 21:51:54.323 [INFO] 127.0.0.1:56904 - "POST
/v1/openai/v1/vector_stores/vs_dab05212-db05-402c-91ef-57e41797406b/search HTTP/1.1" 200
INFO 2025-09-10 14:51:54,471 console_span_processor:28 telemetry: 21:51:54.471 [START] /v1/openai/v1/vector_stores/{vector_store_id}/search
INFO 2025-09-10 14:51:54,489 console_span_processor:39 telemetry: 21:51:54.474 [END] ModelsRoutingTable.get_model [StatusCode.OK] (0.26ms)
INFO 2025-09-10 14:51:54,490 console_span_processor:48 telemetry: output: {'identifier': 'sentence-transformers/all-MiniLM-L6-v2',
'provider_resource_id': 'all-MiniLM-L6-v2', 'provider_id': 'sentence-transformers', 'type': 'model', 'owner': None, 'source':
'listed_from_provider', 'metadata': {'embedding_dimension': 384}, 'model_type': 'embedding'}
INFO 2025-09-10 14:51:54,502 console_span_processor:39 telemetry: 21:51:54.495 [END] ModelsRoutingTable.get_provider_impl [StatusCode.OK] (2.67ms)
INFO 2025-09-10 14:51:54,504 console_span_processor:48 telemetry: output:
<llama_stack.providers.inline.inference.sentence_transformers.sentence_transformers.SentenceTransformersInferenceImpl object at 0x158e83350>
INFO 2025-09-10 14:51:54,524 console_span_processor:39 telemetry: 21:51:54.514 [END] ModelsRoutingTable.get_model [StatusCode.OK] (0.79ms)
INFO 2025-09-10 14:51:54,526 console_span_processor:48 telemetry: output: {'identifier': 'sentence-transformers/all-MiniLM-L6-v2',
'provider_resource_id': 'all-MiniLM-L6-v2', 'provider_id': 'sentence-transformers', 'type': 'model', 'owner': None, 'source':
'listed_from_provider', 'metadata': {'embedding_dimension': 384}, 'model_type': 'embedding'}
INFO 2025-09-10 14:51:54,529 console_span_processor:39 telemetry: 21:51:54.527 [END] InferenceRouter.openai_embeddings [StatusCode.OK] (53.95ms)
INFO 2025-09-10 14:51:54,537 console_span_processor:48 telemetry: output: {'object': 'list', 'data': [{'object': 'embedding', 'embedding':
[-0.03642994910478592, -0.005766282323747873, -0.028219470754265785, 0.05074828490614891, 0.023913491517305374, -0.056256189942359924,
0.0007000428740866482, 0.02684980072081089, 0.005779022816568613, 0.0757804811000824, 0.02611902356147766, -0.04347166419029236,
-0.07426290959119797, 0.0033695625606924295, -0.03395790979266167, -0.018579166382551193, 0.031040646135807037, -0.06419522315263748,
-0.11664945632219315, 0.011454297229647636, 0.00203332188539207, 0.00506530050188303, -0.05711820721626282, -0.006884930655360222,
0.0057834964245557785, 0.005828470923006535, -0.05446002259850502, -0.032767001539468765, -0.023773472756147385, -0.046458274126052856,
-0.0579390786588192, 0.052776239812374115, -0.017773080617189407, 0.07396063208580017, -0.007082517724484205, -0.006252078805118799,
0.06502724438905716, -0.04769469425082207, 0.08519715070724487, -0.04995475336909294, -0.02040106989443302, -0.024357719346880913, -0....
INFO 2025-09-10 14:51:54,550 console_span_processor:39 telemetry: 21:51:54.542 [END] FaissVectorIOAdapter.query_chunks [StatusCode.OK] (68.87ms)
INFO 2025-09-10 14:51:54,551 console_span_processor:48 telemetry: output: {'chunks': [{'content': 'Acme ships globally in 3-5 business days.',
'metadata': {'document_id': 'file-489db9aae0424745960e3408ff0f477f', 'token_count': 12, 'metadata_token_count': 1}, 'embedding':
[-0.012346820905804634, -0.04591671749949455, 0.00545357633382082, 0.0767817348241806, -0.01030217856168747, -0.07128783315420151,
-0.047789815813302994, -0.0042580426670610905, -0.08333089202642441, 0.03493816778063774, 0.03678377717733383, -0.022125769406557083,
-0.001785362372174859, 0.03860057145357132, 0.017692940309643745, -0.011320478282868862, 0.020480643957853317, -0.14444826543331146,
-0.03509785607457161, -0.08347956091165543, 0.01723267324268818, -0.020868107676506042, -0.04816542565822601, -0.04063615947961807,
-0.02612607553601265, -0.06816241890192032, -0.021907860413193703, -0.05328420177102089, 0.0035953382030129433, -0.060775868594646454,
-0.07895789295434952, 0.08725343644618988, -0.004096562508493662, 0.07713106274604797, 0.04764929413795471, 0.03390089422464371, -0.03...
INFO 2025-09-10 14:51:54,557 console_span_processor:39 telemetry: 21:51:54.554 [END] VectorDBsRoutingTable.openai_search_vector_store
[StatusCode.OK] (81.34ms)
INFO 2025-09-10 14:51:54,559 console_span_processor:48 telemetry: output: {'object': 'vector_store.search_results.page', 'search_query':
'shipping time', 'data': [{'file_id': '', 'filename': '', 'score': 0.9984249880472625, 'attributes': {'document_id':
'file-489db9aae0424745960e3408ff0f477f', 'token_count': 12.0, 'metadata_token_count': 1.0}, 'content': [{'type': 'text', 'text': 'Acme ships
globally in 3-5 business days.'}]}], 'has_more': False, 'next_page': None}
INFO 2025-09-10 14:51:54,573 console_span_processor:39 telemetry: 21:51:54.564 [END] VectorIORouter.openai_search_vector_store [StatusCode.OK]
(91.94ms)
INFO 2025-09-10 14:51:54,574 console_span_processor:48 telemetry: output: {'object': 'vector_store.search_results.page', 'search_query':
'shipping time', 'data': [{'file_id': '', 'filename': '', 'score': 0.9984249880472625, 'attributes': {'document_id':
'file-489db9aae0424745960e3408ff0f477f', 'token_count': 12.0, 'metadata_token_count': 1.0}, 'content': [{'type': 'text', 'text': 'Acme ships
globally in 3-5 business days.'}]}], 'has_more': False, 'next_page': None}
INFO 2025-09-10 14:51:54,583 console_span_processor:39 telemetry: 21:51:54.575 [END] /v1/openai/v1/vector_stores/{vector_store_id}/search
[StatusCode.OK] (104.63ms)
INFO 2025-09-10 14:51:54,584 console_span_processor:48 telemetry: raw_path:
/v1/openai/v1/vector_stores/vs_dab05212-db05-402c-91ef-57e41797406b/search
INFO 2025-09-10 14:51:54,584 console_span_processor:62 telemetry: 21:51:54.354 [INFO] 127.0.0.1:56904 - "POST
/v1/openai/v1/vector_stores/vs_dab05212-db05-402c-91ef-57e41797406b/search HTTP/1.1" 200
INFO 2025-09-10 14:51:54,585 console_span_processor:28 telemetry: 21:51:54.585 [START] /v1/openai/v1/vector_stores/{vector_store_id}/search
INFO 2025-09-10 14:51:54,591 console_span_processor:39 telemetry: 21:51:54.589 [END] ModelsRoutingTable.get_model [StatusCode.OK] (0.17ms)
INFO 2025-09-10 14:51:54,591 console_span_processor:48 telemetry: output: {'identifier': 'sentence-transformers/all-MiniLM-L6-v2',
'provider_resource_id': 'all-MiniLM-L6-v2', 'provider_id': 'sentence-transformers', 'type': 'model', 'owner': None, 'source':
'listed_from_provider', 'metadata': {'embedding_dimension': 384}, 'model_type': 'embedding'}
INFO 2025-09-10 14:51:54,594 console_span_processor:39 telemetry: 21:51:54.592 [END] ModelsRoutingTable.get_provider_impl [StatusCode.OK] (0.16ms)
INFO 2025-09-10 14:51:54,595 console_span_processor:48 telemetry: output:
<llama_stack.providers.inline.inference.sentence_transformers.sentence_transformers.SentenceTransformersInferenceImpl object at 0x158e83350>
INFO 2025-09-10 14:51:54,599 console_span_processor:39 telemetry: 21:51:54.596 [END] ModelsRoutingTable.get_model [StatusCode.OK] (0.16ms)
INFO 2025-09-10 14:51:54,599 console_span_processor:48 telemetry: output: {'identifier': 'sentence-transformers/all-MiniLM-L6-v2',
'provider_resource_id': 'all-MiniLM-L6-v2', 'provider_id': 'sentence-transformers', 'type': 'model', 'owner': None, 'source':
'listed_from_provider', 'metadata': {'embedding_dimension': 384}, 'model_type': 'embedding'}
INFO 2025-09-10 14:51:54,604 console_span_processor:39 telemetry: 21:51:54.602 [END] InferenceRouter.openai_embeddings [StatusCode.OK] (13.16ms)
INFO 2025-09-10 14:51:54,605 console_span_processor:48 telemetry: output: {'object': 'list', 'data': [{'object': 'embedding', 'embedding':
[-0.03642994910478592, -0.005766282323747873, -0.028219470754265785, 0.05074828490614891, 0.023913491517305374, -0.056256189942359924,
0.0007000428740866482, 0.02684980072081089, 0.005779022816568613, 0.0757804811000824, 0.02611902356147766, -0.04347166419029236,
-0.07426290959119797, 0.0033695625606924295, -0.03395790979266167, -0.018579166382551193, 0.031040646135807037, -0.06419522315263748,
-0.11664945632219315, 0.011454297229647636, 0.00203332188539207, 0.00506530050188303, -0.05711820721626282, -0.006884930655360222,
0.0057834964245557785, 0.005828470923006535, -0.05446002259850502, -0.032767001539468765, -0.023773472756147385, -0.046458274126052856,
-0.0579390786588192, 0.052776239812374115, -0.017773080617189407, 0.07396063208580017, -0.007082517724484205, -0.006252078805118799,
0.06502724438905716, -0.04769469425082207, 0.08519715070724487, -0.04995475336909294, -0.02040106989443302, -0.024357719346880913, -0....
INFO 2025-09-10 14:51:54,627 console_span_processor:39 telemetry: 21:51:54.621 [END] FaissVectorIOAdapter.query_chunks [StatusCode.OK] (32.66ms)
INFO 2025-09-10 14:51:54,634 console_span_processor:48 telemetry: output: {'chunks': [{'content': 'Acme ships globally in 3-5 business days.',
'metadata': {'document_id': 'file-489db9aae0424745960e3408ff0f477f', 'token_count': 12, 'metadata_token_count': 1}, 'embedding':
[-0.012346820905804634, -0.04591671749949455, 0.00545357633382082, 0.0767817348241806, -0.01030217856168747, -0.07128783315420151,
-0.047789815813302994, -0.0042580426670610905, -0.08333089202642441, 0.03493816778063774, 0.03678377717733383, -0.022125769406557083,
-0.001785362372174859, 0.03860057145357132, 0.017692940309643745, -0.011320478282868862, 0.020480643957853317, -0.14444826543331146,
-0.03509785607457161, -0.08347956091165543, 0.01723267324268818, -0.020868107676506042, -0.04816542565822601, -0.04063615947961807,
-0.02612607553601265, -0.06816241890192032, -0.021907860413193703, -0.05328420177102089, 0.0035953382030129433, -0.060775868594646454,
-0.07895789295434952, 0.08725343644618988, -0.004096562508493662, 0.07713106274604797, 0.04764929413795471, 0.03390089422464371, -0.03...
INFO 2025-09-10 14:51:54,643 console_span_processor:39 telemetry: 21:51:54.637 [END] VectorDBsRoutingTable.openai_search_vector_store
[StatusCode.OK] (49.21ms)
INFO 2025-09-10 14:51:54,644 console_span_processor:48 telemetry: output: {'object': 'vector_store.search_results.page', 'search_query':
'shipping time', 'data': [{'file_id': '', 'filename': '', 'score': 0.9984249880472625, 'attributes': {'document_id':
'file-489db9aae0424745960e3408ff0f477f', 'token_count': 12.0, 'metadata_token_count': 1.0}, 'content': [{'type': 'text', 'text': 'Acme ships
globally in 3-5 business days.'}]}], 'has_more': False, 'next_page': None}
INFO 2025-09-10 14:51:54,654 console_span_processor:39 telemetry: 21:51:54.646 [END] VectorIORouter.openai_search_vector_store [StatusCode.OK]
(57.62ms)
INFO 2025-09-10 14:51:54,656 console_span_processor:48 telemetry: output: {'object': 'vector_store.search_results.page', 'search_query':
'shipping time', 'data': [{'file_id': '', 'filename': '', 'score': 0.9984249880472625, 'attributes': {'document_id':
'file-489db9aae0424745960e3408ff0f477f', 'token_count': 12.0, 'metadata_token_count': 1.0}, 'content': [{'type': 'text', 'text': 'Acme ships
globally in 3-5 business days.'}]}], 'has_more': False, 'next_page': None}
INFO 2025-09-10 14:51:54,664 console_span_processor:39 telemetry: 21:51:54.657 [END] /v1/openai/v1/vector_stores/{vector_store_id}/search
[StatusCode.OK] (72.19ms)
INFO 2025-09-10 14:51:54,666 console_span_processor:48 telemetry: raw_path:
/v1/openai/v1/vector_stores/vs_dab05212-db05-402c-91ef-57e41797406b/search
INFO 2025-09-10 14:51:54,670 console_span_processor:62 telemetry: 21:51:54.374 [INFO] 127.0.0.1:56904 - "POST
/v1/openai/v1/vector_stores/vs_dab05212-db05-402c-91ef-57e41797406b/search HTTP/1.1" 200
INFO 2025-09-10 14:51:54,673 console_span_processor:28 telemetry: 21:51:54.673 [START] /v1/openai/v1/vector_stores/{vector_store_id}/search
INFO 2025-09-10 14:51:54,687 console_span_processor:39 telemetry: 21:51:54.678 [END] ModelsRoutingTable.get_model [StatusCode.OK] (0.38ms)
INFO 2025-09-10 14:51:54,688 console_span_processor:48 telemetry: output: {'identifier': 'sentence-transformers/all-MiniLM-L6-v2',
'provider_resource_id': 'all-MiniLM-L6-v2', 'provider_id': 'sentence-transformers', 'type': 'model', 'owner': None, 'source':
'listed_from_provider', 'metadata': {'embedding_dimension': 384}, 'model_type': 'embedding'}
INFO 2025-09-10 14:51:54,697 console_span_processor:39 telemetry: 21:51:54.691 [END] ModelsRoutingTable.get_provider_impl [StatusCode.OK] (0.21ms)
INFO 2025-09-10 14:51:54,698 console_span_processor:48 telemetry: output:
<llama_stack.providers.inline.inference.sentence_transformers.sentence_transformers.SentenceTransformersInferenceImpl object at 0x158e83350>
INFO 2025-09-10 14:51:54,701 console_span_processor:39 telemetry: 21:51:54.699 [END] ModelsRoutingTable.get_model [StatusCode.OK] (0.24ms)
INFO 2025-09-10 14:51:54,704 console_span_processor:48 telemetry: output: {'identifier': 'sentence-transformers/all-MiniLM-L6-v2',
'provider_resource_id': 'all-MiniLM-L6-v2', 'provider_id': 'sentence-transformers', 'type': 'model', 'owner': None, 'source':
'listed_from_provider', 'metadata': {'embedding_dimension': 384}, 'model_type': 'embedding'}
INFO 2025-09-10 14:51:54,716 console_span_processor:39 telemetry: 21:51:54.706 [END] InferenceRouter.openai_embeddings [StatusCode.OK] (29.72ms)
INFO 2025-09-10 14:51:54,718 console_span_processor:48 telemetry: output: {'object': 'list', 'data': [{'object': 'embedding', 'embedding':
[-0.03642994910478592, -0.005766282323747873, -0.028219470754265785, 0.05074828490614891, 0.023913491517305374, -0.056256189942359924,
0.0007000428740866482, 0.02684980072081089, 0.005779022816568613, 0.0757804811000824, 0.02611902356147766, -0.04347166419029236,
-0.07426290959119797, 0.0033695625606924295, -0.03395790979266167, -0.018579166382551193, 0.031040646135807037, -0.06419522315263748,
-0.11664945632219315, 0.011454297229647636, 0.00203332188539207, 0.00506530050188303, -0.05711820721626282, -0.006884930655360222,
0.0057834964245557785, 0.005828470923006535, -0.05446002259850502, -0.032767001539468765, -0.023773472756147385, -0.046458274126052856,
-0.0579390786588192, 0.052776239812374115, -0.017773080617189407, 0.07396063208580017, -0.007082517724484205, -0.006252078805118799,
0.06502724438905716, -0.04769469425082207, 0.08519715070724487, -0.04995475336909294, -0.02040106989443302, -0.024357719346880913, -0....
INFO 2025-09-10 14:51:54,724 console_span_processor:39 telemetry: 21:51:54.721 [END] FaissVectorIOAdapter.query_chunks [StatusCode.OK] (45.99ms)
INFO 2025-09-10 14:51:54,724 console_span_processor:48 telemetry: output: {'chunks': [{'content': 'Acme ships globally in 3-5 business days.',
'metadata': {'document_id': 'file-489db9aae0424745960e3408ff0f477f', 'token_count': 12, 'metadata_token_count': 1}, 'embedding':
[-0.012346820905804634, -0.04591671749949455, 0.00545357633382082, 0.0767817348241806, -0.01030217856168747, -0.07128783315420151,
-0.047789815813302994, -0.0042580426670610905, -0.08333089202642441, 0.03493816778063774, 0.03678377717733383, -0.022125769406557083,
-0.001785362372174859, 0.03860057145357132, 0.017692940309643745, -0.011320478282868862, 0.020480643957853317, -0.14444826543331146,
-0.03509785607457161, -0.08347956091165543, 0.01723267324268818, -0.020868107676506042, -0.04816542565822601, -0.04063615947961807,
-0.02612607553601265, -0.06816241890192032, -0.021907860413193703, -0.05328420177102089, 0.0035953382030129433, -0.060775868594646454,
-0.07895789295434952, 0.08725343644618988, -0.004096562508493662, 0.07713106274604797, 0.04764929413795471, 0.03390089422464371, -0.03...
INFO 2025-09-10 14:51:54,727 console_span_processor:39 telemetry: 21:51:54.726 [END] VectorDBsRoutingTable.openai_search_vector_store
[StatusCode.OK] (51.80ms)
INFO 2025-09-10 14:51:54,728 console_span_processor:48 telemetry: output: {'object': 'vector_store.search_results.page', 'search_query':
'shipping time', 'data': [{'file_id': '', 'filename': '', 'score': 0.9984249880472625, 'attributes': {'document_id':
'file-489db9aae0424745960e3408ff0f477f', 'token_count': 12.0, 'metadata_token_count': 1.0}, 'content': [{'type': 'text', 'text': 'Acme ships
globally in 3-5 business days.'}]}], 'has_more': False, 'next_page': None}
INFO 2025-09-10 14:51:54,732 console_span_processor:39 telemetry: 21:51:54.730 [END] VectorIORouter.openai_search_vector_store [StatusCode.OK]
(56.53ms)
INFO 2025-09-10 14:51:54,732 console_span_processor:48 telemetry: output: {'object': 'vector_store.search_results.page', 'search_query':
'shipping time', 'data': [{'file_id': '', 'filename': '', 'score': 0.9984249880472625, 'attributes': {'document_id':
'file-489db9aae0424745960e3408ff0f477f', 'token_count': 12.0, 'metadata_token_count': 1.0}, 'content': [{'type': 'text', 'text': 'Acme ships
globally in 3-5 business days.'}]}], 'has_more': False, 'next_page': None}
INFO 2025-09-10 14:51:54,735 console_span_processor:39 telemetry: 21:51:54.734 [END] /v1/openai/v1/vector_stores/{vector_store_id}/search
[StatusCode.OK] (60.83ms)
INFO 2025-09-10 14:51:54,736 console_span_processor:48 telemetry: raw_path:
/v1/openai/v1/vector_stores/vs_dab05212-db05-402c-91ef-57e41797406b/search
INFO 2025-09-10 14:51:54,736 console_span_processor:62 telemetry: 21:51:54.426 [INFO] 127.0.0.1:56904 - "POST
/v1/openai/v1/vector_stores/vs_dab05212-db05-402c-91ef-57e41797406b/search HTTP/1.1" 200
INFO 2025-09-10 14:51:54,737 console_span_processor:28 telemetry: 21:51:54.737 [START] /v1/openai/v1/vector_stores/{vector_store_id}/search
INFO 2025-09-10 14:51:54,747 console_span_processor:39 telemetry: 21:51:54.740 [END] ModelsRoutingTable.get_model [StatusCode.OK] (0.15ms)
INFO 2025-09-10 14:51:54,748 console_span_processor:48 telemetry: output: {'identifier': 'sentence-transformers/all-MiniLM-L6-v2',
'provider_resource_id': 'all-MiniLM-L6-v2', 'provider_id': 'sentence-transformers', 'type': 'model', 'owner': None, 'source':
'listed_from_provider', 'metadata': {'embedding_dimension': 384}, 'model_type': 'embedding'}
INFO 2025-09-10 14:51:54,752 console_span_processor:39 telemetry: 21:51:54.750 [END] ModelsRoutingTable.get_provider_impl [StatusCode.OK] (0.22ms)
INFO 2025-09-10 14:51:54,752 console_span_processor:48 telemetry: output:
<llama_stack.providers.inline.inference.sentence_transformers.sentence_transformers.SentenceTransformersInferenceImpl object at 0x158e83350>
INFO 2025-09-10 14:51:54,755 console_span_processor:39 telemetry: 21:51:54.754 [END] ModelsRoutingTable.get_model [StatusCode.OK] (0.32ms)
INFO 2025-09-10 14:51:54,756 console_span_processor:48 telemetry: output: {'identifier': 'sentence-transformers/all-MiniLM-L6-v2',
'provider_resource_id': 'all-MiniLM-L6-v2', 'provider_id': 'sentence-transformers', 'type': 'model', 'owner': None, 'source':
'listed_from_provider', 'metadata': {'embedding_dimension': 384}, 'model_type': 'embedding'}
INFO 2025-09-10 14:51:54,758 console_span_processor:39 telemetry: 21:51:54.756 [END] InferenceRouter.openai_embeddings [StatusCode.OK] (17.05ms)
INFO 2025-09-10 14:51:54,761 console_span_processor:48 telemetry: output: {'object': 'list', 'data': [{'object': 'embedding', 'embedding':
[-0.03642994910478592, -0.005766282323747873, -0.028219470754265785, 0.05074828490614891, 0.023913491517305374, -0.056256189942359924,
0.0007000428740866482, 0.02684980072081089, 0.005779022816568613, 0.0757804811000824, 0.02611902356147766, -0.04347166419029236,
-0.07426290959119797, 0.0033695625606924295, -0.03395790979266167, -0.018579166382551193, 0.031040646135807037, -0.06419522315263748,
-0.11664945632219315, 0.011454297229647636, 0.00203332188539207, 0.00506530050188303, -0.05711820721626282, -0.006884930655360222,
0.0057834964245557785, 0.005828470923006535, -0.05446002259850502, -0.032767001539468765, -0.023773472756147385, -0.046458274126052856,
-0.0579390786588192, 0.052776239812374115, -0.017773080617189407, 0.07396063208580017, -0.007082517724484205, -0.006252078805118799,
0.06502724438905716, -0.04769469425082207, 0.08519715070724487, -0.04995475336909294, -0.02040106989443302, -0.024357719346880913, -0....
INFO 2025-09-10 14:51:54,767 console_span_processor:39 telemetry: 21:51:54.762 [END] FaissVectorIOAdapter.query_chunks [StatusCode.OK] (23.20ms)
INFO 2025-09-10 14:51:54,767 console_span_processor:48 telemetry: output: {'chunks': [{'content': 'Acme ships globally in 3-5 business days.',
'metadata': {'document_id': 'file-489db9aae0424745960e3408ff0f477f', 'token_count': 12, 'metadata_token_count': 1}, 'embedding':
[-0.012346820905804634, -0.04591671749949455, 0.00545357633382082, 0.0767817348241806, -0.01030217856168747, -0.07128783315420151,
-0.047789815813302994, -0.0042580426670610905, -0.08333089202642441, 0.03493816778063774, 0.03678377717733383, -0.022125769406557083,
-0.001785362372174859, 0.03860057145357132, 0.017692940309643745, -0.011320478282868862, 0.020480643957853317, -0.14444826543331146,
-0.03509785607457161, -0.08347956091165543, 0.01723267324268818, -0.020868107676506042, -0.04816542565822601, -0.04063615947961807,
-0.02612607553601265, -0.06816241890192032, -0.021907860413193703, -0.05328420177102089, 0.0035953382030129433, -0.060775868594646454,
-0.07895789295434952, 0.08725343644618988, -0.004096562508493662, 0.07713106274604797, 0.04764929413795471, 0.03390089422464371, -0.03...
INFO 2025-09-10 14:51:54,772 console_span_processor:39 telemetry: 21:51:54.769 [END] VectorDBsRoutingTable.openai_search_vector_store
[StatusCode.OK] (30.01ms)
INFO 2025-09-10 14:51:54,773 console_span_processor:48 telemetry: output: {'object': 'vector_store.search_results.page', 'search_query':
'shipping time', 'data': [{'file_id': '', 'filename': '', 'score': 0.9984249880472625, 'attributes': {'document_id':
'file-489db9aae0424745960e3408ff0f477f', 'token_count': 12.0, 'metadata_token_count': 1.0}, 'content': [{'type': 'text', 'text': 'Acme ships
globally in 3-5 business days.'}]}], 'has_more': False, 'next_page': None}
INFO 2025-09-10 14:51:54,775 console_span_processor:39 telemetry: 21:51:54.774 [END] VectorIORouter.openai_search_vector_store [StatusCode.OK]
(35.79ms)
INFO 2025-09-10 14:51:54,776 console_span_processor:48 telemetry: output: {'object': 'vector_store.search_results.page', 'search_query':
'shipping time', 'data': [{'file_id': '', 'filename': '', 'score': 0.9984249880472625, 'attributes': {'document_id':
'file-489db9aae0424745960e3408ff0f477f', 'token_count': 12.0, 'metadata_token_count': 1.0}, 'content': [{'type': 'text', 'text': 'Acme ships
globally in 3-5 business days.'}]}], 'has_more': False, 'next_page': None}
INFO 2025-09-10 14:51:54,778 console_span_processor:39 telemetry: 21:51:54.777 [END] /v1/openai/v1/vector_stores/{vector_store_id}/search
[StatusCode.OK] (40.35ms)
INFO 2025-09-10 14:51:54,779 console_span_processor:48 telemetry: raw_path:
/v1/openai/v1/vector_stores/vs_dab05212-db05-402c-91ef-57e41797406b/search
INFO 2025-09-10 14:51:54,779 console_span_processor:62 telemetry: 21:51:54.457 [INFO] 127.0.0.1:56904 - "POST
/v1/openai/v1/vector_stores/vs_dab05212-db05-402c-91ef-57e41797406b/search HTTP/1.1" 200
INFO 2025-09-10 14:51:54,781 console_span_processor:28 telemetry: 21:51:54.781 [START] /v1/openai/v1/chat/completions
INFO 2025-09-10 14:51:54,790 console_span_processor:39 telemetry: 21:51:54.786 [END] ModelsRoutingTable.get_model [StatusCode.OK] (0.82ms)
INFO 2025-09-10 14:51:54,790 console_span_processor:48 telemetry: output: {'identifier': 'together/meta-llama/Llama-3.3-70B-Instruct-Turbo',
'provider_resource_id': 'meta-llama/Llama-3.3-70B-Instruct-Turbo', 'provider_id': 'together', 'type': 'model', 'owner': None, 'source':
'listed_from_provider', 'metadata': {}, 'model_type': 'llm'}
INFO 2025-09-10 14:51:54,794 console_span_processor:39 telemetry: 21:51:54.792 [END] ModelsRoutingTable.get_provider_impl [StatusCode.OK] (0.24ms)
INFO 2025-09-10 14:51:54,794 console_span_processor:48 telemetry: output:
<llama_stack.providers.remote.inference.together.together.TogetherInferenceAdapter object at 0x137069220>
INFO 2025-09-10 14:51:54,798 console_span_processor:39 telemetry: 21:51:54.796 [END] ModelsRoutingTable.get_model [StatusCode.OK] (0.21ms)
INFO 2025-09-10 14:51:54,798 console_span_processor:48 telemetry: output: {'identifier': 'together/meta-llama/Llama-3.3-70B-Instruct-Turbo',
'provider_resource_id': 'meta-llama/Llama-3.3-70B-Instruct-Turbo', 'provider_id': 'together', 'type': 'model', 'owner': None, 'source':
'listed_from_provider', 'metadata': {}, 'model_type': 'llm'}
INFO 2025-09-10 14:51:57,872 console_span_processor:39 telemetry: 21:51:57.868 [END] TogetherInferenceAdapter.openai_chat_completion
[StatusCode.OK] (3072.99ms)
INFO 2025-09-10 14:51:57,872 console_span_processor:48 telemetry: output: {'id': 'oAitcfB-4YNCb4-97d2263f6ff7cfe9', 'choices':
[{'finish_reason': 'stop', 'index': 0, 'logprobs': None, 'message': {'content': 'Thought: Since I couldn\'t get a relevant result from the
Llama Stack Vector Store RAG tool, I will provide a general answer to the question "How long does shipping take?".\n\nThe shipping time can
vary depending on the destination, shipping method, and other factors. Typically, shipping times can range from a few days to several weeks
or even months. Here are some general guidelines:\n\n* Domestic shipping: 1-7 business days\n* International shipping: 7-21 business days or
more\n* Express shipping: 1-3 business days\n* Standard shipping: 3-7 business days\n\nPlease note that these are general estimates and the
actual shipping time may vary depending on the specific circumstances.\n\nThought: I now can give a great answer\nFinal Answer: The shipping
time can vary depending on the destination, shipping method, and other factors. Typically, shipping tim...
INFO 2025-09-10 14:51:57,875 uvicorn.access:473 uncategorized: ::1:56900 - "POST /v1/openai/v1/chat/completions HTTP/1.1" 200
INFO 2025-09-10 14:51:57,877 console_span_processor:39 telemetry: 21:51:57.876 [END] InferenceRouter.openai_chat_completion [StatusCode.OK]
(3091.29ms)
INFO 2025-09-10 14:51:57,878 console_span_processor:48 telemetry: output: {'id': 'oAitcfB-4YNCb4-97d2263f6ff7cfe9', 'choices':
[{'finish_reason': 'stop', 'index': 0, 'logprobs': None, 'message': {'content': 'Thought: Since I couldn\'t get a relevant result from the
Llama Stack Vector Store RAG tool, I will provide a general answer to the question "How long does shipping take?".\n\nThe shipping time can
vary depending on the destination, shipping method, and other factors. Typically, shipping times can range from a few days to several weeks
or even months. Here are some general guidelines:\n\n* Domestic shipping: 1-7 business days\n* International shipping: 7-21 business days or
more\n* Express shipping: 1-3 business days\n* Standard shipping: 3-7 business days\n\nPlease note that these are general estimates and the
actual shipping time may vary depending on the specific circumstances.\n\nThought: I now can give a great answer\nFinal Answer: The shipping
time can vary depending on the destination, shipping method, and other factors. Typically, shipping tim...
INFO 2025-09-10 14:51:57,880 console_span_processor:62 telemetry: 21:51:57.874 [INFO] metric.prompt_tokens
INFO 2025-09-10 14:51:57,880 console_span_processor:67 telemetry: value: 1948
INFO 2025-09-10 14:51:57,881 console_span_processor:67 telemetry: unit: tokens
INFO 2025-09-10 14:51:57,881 console_span_processor:67 telemetry: model_id: together/meta-llama/Llama-3.3-70B-Instruct-Turbo
INFO 2025-09-10 14:51:57,881 console_span_processor:67 telemetry: provider_id: together
INFO 2025-09-10 14:51:57,882 console_span_processor:62 telemetry: 21:51:57.874 [INFO] metric.completion_tokens
INFO 2025-09-10 14:51:57,882 console_span_processor:67 telemetry: value: 264
INFO 2025-09-10 14:51:57,882 console_span_processor:67 telemetry: unit: tokens
INFO 2025-09-10 14:51:57,883 console_span_processor:67 telemetry: model_id: together/meta-llama/Llama-3.3-70B-Instruct-Turbo
INFO 2025-09-10 14:51:57,883 console_span_processor:67 telemetry: provider_id: together
INFO 2025-09-10 14:51:57,884 console_span_processor:62 telemetry: 21:51:57.874 [INFO] metric.total_tokens
INFO 2025-09-10 14:51:57,884 console_span_processor:67 telemetry: value: 2212
INFO 2025-09-10 14:51:57,884 console_span_processor:67 telemetry: unit: tokens
INFO 2025-09-10 14:51:57,885 console_span_processor:67 telemetry: model_id: together/meta-llama/Llama-3.3-70B-Instruct-Turbo
INFO 2025-09-10 14:51:57,886 console_span_processor:67 telemetry: provider_id: together
INFO 2025-09-10 14:51:57,890 console_span_processor:39 telemetry: 21:51:57.887 [END] /v1/openai/v1/chat/completions [StatusCode.OK] (3106.16ms)
INFO 2025-09-10 14:51:57,891 console_span_processor:48 telemetry: raw_path: /v1/openai/v1/chat/completions
INFO 2025-09-10 14:51:57,891 console_span_processor:62 telemetry: 21:51:57.875 [INFO] ::1:56900 - "POST /v1/openai/v1/chat/completions HTTP/1.1"
200
INFO 2025-09-10 14:55:09,448 console_span_processor:28 telemetry: 21:55:09.448 [START] /v1/openai/v1/chat/completions
INFO 2025-09-10 14:55:09,463 console_span_processor:39 telemetry: 21:55:09.453 [END] ModelsRoutingTable.get_model [StatusCode.OK] (0.18ms)
INFO 2025-09-10 14:55:09,465 console_span_processor:48 telemetry: output: {'identifier': 'together/meta-llama/Llama-3.3-70B-Instruct-Turbo',
'provider_resource_id': 'meta-llama/Llama-3.3-70B-Instruct-Turbo', 'provider_id': 'together', 'type': 'model', 'owner': None, 'source':
'listed_from_provider', 'metadata': {}, 'model_type': 'llm'}
INFO 2025-09-10 14:55:09,478 console_span_processor:39 telemetry: 21:55:09.467 [END] ModelsRoutingTable.get_provider_impl [StatusCode.OK] (0.18ms)
INFO 2025-09-10 14:55:09,479 console_span_processor:48 telemetry: output:
<llama_stack.providers.remote.inference.together.together.TogetherInferenceAdapter object at 0x137069220>
INFO 2025-09-10 14:55:09,483 console_span_processor:39 telemetry: 21:55:09.480 [END] ModelsRoutingTable.get_model [StatusCode.OK] (0.20ms)
INFO 2025-09-10 14:55:09,484 console_span_processor:48 telemetry: output: {'identifier': 'together/meta-llama/Llama-3.3-70B-Instruct-Turbo',
'provider_resource_id': 'meta-llama/Llama-3.3-70B-Instruct-Turbo', 'provider_id': 'together', 'type': 'model', 'owner': None, 'source':
'listed_from_provider', 'metadata': {}, 'model_type': 'llm'}
INFO 2025-09-10 14:55:11,246 console_span_processor:39 telemetry: 21:55:11.242 [END] TogetherInferenceAdapter.openai_chat_completion
[StatusCode.OK] (1762.00ms)
INFO 2025-09-10 14:55:11,247 console_span_processor:48 telemetry: output: {'id': 'oAiuccr-62bZhn-97d22b0209009e58', 'choices':
[{'finish_reason': 'stop', 'index': 0, 'logprobs': None, 'message': {'content': 'Thought: To answer the question "How long does shipping
take?", I need to search the provided vector store for relevant information. The vector store ID is vs_dab05212-db05-402c-91ef-57e41797406b.
I will use the Llama Stack Vector Store RAG tool to find the most relevant documents.\n\nAction: Llama Stack Vector Store RAG tool\nAction
Input: {"query": "How long does shipping take?", "vector_store_id": "vs_dab05212-db05-402c-91ef-57e41797406b", "top_k": 1, "score_threshold":
0}', 'refusal': None, 'role': 'assistant', 'annotations': None, 'audio': None, 'function_call': None, 'tool_calls': []}, 'seed':
3440355828201570300}], 'created': 1757541309, 'model': 'meta-llama/Llama-3.3-70B-Instruct-Turbo', 'object': 'chat.completion',
'service_tier': None, 'system_fingerprint': None, 'usage': {'completion_tokens': 138, 'prompt_tokens': 495, 'total_tokens': 633, ...
INFO 2025-09-10 14:55:11,249 uvicorn.access:473 uncategorized: ::1:57854 - "POST /v1/openai/v1/chat/completions HTTP/1.1" 200
INFO 2025-09-10 14:55:11,259 console_span_processor:39 telemetry: 21:55:11.250 [END] InferenceRouter.openai_chat_completion [StatusCode.OK]
(1797.12ms)
INFO 2025-09-10 14:55:11,260 console_span_processor:48 telemetry: output: {'id': 'oAiuccr-62bZhn-97d22b0209009e58', 'choices':
[{'finish_reason': 'stop', 'index': 0, 'logprobs': None, 'message': {'content': 'Thought: To answer the question "How long does shipping
take?", I need to search the provided vector store for relevant information. The vector store ID is vs_dab05212-db05-402c-91ef-57e41797406b.
I will use the Llama Stack Vector Store RAG tool to find the most relevant documents.\n\nAction: Llama Stack Vector Store RAG tool\nAction
Input: {"query": "How long does shipping take?", "vector_store_id": "vs_dab05212-db05-402c-91ef-57e41797406b", "top_k": 1, "score_threshold":
0}', 'refusal': None, 'role': 'assistant', 'annotations': None, 'audio': None, 'function_call': None, 'tool_calls': None}, 'seed':
3440355828201570300}], 'created': 1757541309, 'model': 'meta-llama/Llama-3.3-70B-Instruct-Turbo', 'object': 'chat.completion',
'service_tier': None, 'system_fingerprint': None, 'usage': {'completion_tokens': 138, 'prompt_tokens': 495, 'total_tokens': 633...
INFO 2025-09-10 14:55:11,261 console_span_processor:62 telemetry: 21:55:11.248 [INFO] metric.prompt_tokens
INFO 2025-09-10 14:55:11,261 console_span_processor:67 telemetry: value: 495
INFO 2025-09-10 14:55:11,262 console_span_processor:67 telemetry: unit: tokens
INFO 2025-09-10 14:55:11,262 console_span_processor:67 telemetry: model_id: together/meta-llama/Llama-3.3-70B-Instruct-Turbo
INFO 2025-09-10 14:55:11,263 console_span_processor:67 telemetry: provider_id: together
INFO 2025-09-10 14:55:11,263 console_span_processor:62 telemetry: 21:55:11.249 [INFO] metric.completion_tokens
INFO 2025-09-10 14:55:11,264 console_span_processor:67 telemetry: value: 138
INFO 2025-09-10 14:55:11,264 console_span_processor:67 telemetry: unit: tokens
INFO 2025-09-10 14:55:11,265 console_span_processor:67 telemetry: model_id: together/meta-llama/Llama-3.3-70B-Instruct-Turbo
INFO 2025-09-10 14:55:11,265 console_span_processor:67 telemetry: provider_id: together
INFO 2025-09-10 14:55:11,265 console_span_processor:62 telemetry: 21:55:11.249 [INFO] metric.total_tokens
INFO 2025-09-10 14:55:11,266 console_span_processor:67 telemetry: value: 633
INFO 2025-09-10 14:55:11,266 console_span_processor:67 telemetry: unit: tokens
INFO 2025-09-10 14:55:11,266 console_span_processor:67 telemetry: model_id: together/meta-llama/Llama-3.3-70B-Instruct-Turbo
INFO 2025-09-10 14:55:11,267 console_span_processor:67 telemetry: provider_id: together
INFO 2025-09-10 14:55:11,284 console_span_processor:39 telemetry: 21:55:11.268 [END] /v1/openai/v1/chat/completions [StatusCode.OK] (1819.72ms)
INFO 2025-09-10 14:55:11,285 console_span_processor:48 telemetry: raw_path: /v1/openai/v1/chat/completions
INFO 2025-09-10 14:55:11,287 console_span_processor:62 telemetry: 21:55:11.250 [INFO] ::1:57854 - "POST /v1/openai/v1/chat/completions HTTP/1.1"
200
INFO 2025-09-10 14:55:11,289 console_span_processor:28 telemetry: 21:55:11.289 [START] /v1/openai/v1/vector_stores/{vector_store_id}/search
INFO 2025-09-10 14:55:11,316 console_span_processor:39 telemetry: 21:55:11.306 [END] ModelsRoutingTable.get_model [StatusCode.OK] (0.72ms)
INFO 2025-09-10 14:55:11,317 console_span_processor:48 telemetry: output: {'identifier': 'sentence-transformers/all-MiniLM-L6-v2',
'provider_resource_id': 'all-MiniLM-L6-v2', 'provider_id': 'sentence-transformers', 'type': 'model', 'owner': None, 'source':
'listed_from_provider', 'metadata': {'embedding_dimension': 384}, 'model_type': 'embedding'}
INFO 2025-09-10 14:55:11,325 console_span_processor:39 telemetry: 21:55:11.319 [END] ModelsRoutingTable.get_provider_impl [StatusCode.OK] (0.33ms)
INFO 2025-09-10 14:55:11,326 console_span_processor:48 telemetry: output:
<llama_stack.providers.inline.inference.sentence_transformers.sentence_transformers.SentenceTransformersInferenceImpl object at 0x158e83350>
INFO 2025-09-10 14:55:11,337 console_span_processor:39 telemetry: 21:55:11.328 [END] ModelsRoutingTable.get_model [StatusCode.OK] (0.26ms)
INFO 2025-09-10 14:55:11,339 console_span_processor:48 telemetry: output: {'identifier': 'sentence-transformers/all-MiniLM-L6-v2',
'provider_resource_id': 'all-MiniLM-L6-v2', 'provider_id': 'sentence-transformers', 'type': 'model', 'owner': None, 'source':
'listed_from_provider', 'metadata': {'embedding_dimension': 384}, 'model_type': 'embedding'}
INFO 2025-09-10 14:55:11,725 uvicorn.access:473 uncategorized: 127.0.0.1:57863 - "POST
/v1/openai/v1/vector_stores/vs_dab05212-db05-402c-91ef-57e41797406b/search HTTP/1.1" 200
INFO 2025-09-10 14:55:11,816 console_span_processor:39 telemetry: 21:55:11.712 [END] InferenceRouter.openai_embeddings [StatusCode.OK] (407.13ms)
INFO 2025-09-10 14:55:11,817 console_span_processor:48 telemetry: output: {'object': 'list', 'data': [{'object': 'embedding', 'embedding':
[0.0018660365603864193, -0.008432421833276749, -0.009860510006546974, 0.07527908682823181, -0.008166038431227207, -0.08819602429866791,
-0.025107912719249725, -0.029266025871038437, 0.014401894062757492, 0.06447950005531311, 0.04112009331583977, -0.04028748720884323,
-0.02221696823835373, -0.009235711768269539, -0.04810388386249542, -0.02784842811524868, 0.016442419961094856, -0.07583750039339066,
-0.06627479195594788, 0.01860453188419342, 0.0008918081293813884, 0.011179491877555847, -0.048671603202819824, -0.021989954635500908,
0.04990514740347862, -0.003409573109820485, -0.06727275997400284, -0.054264623671770096, -0.022502778097987175, -0.03865018114447594,
-0.0471607930958271, 0.01671769842505455, 0.024404950439929962, 0.09877222776412964, -0.01660928875207901, 0.01298862136900425,
0.02916400320827961, -0.0722617655992508, 0.041335687041282654, -0.037857454270124435, -0.02524978667497635, -0.010434110648930073, -0....
INFO 2025-09-10 14:55:11,821 console_span_processor:39 telemetry: 21:55:11.818 [END] FaissVectorIOAdapter.query_chunks [StatusCode.OK] (515.05ms)
INFO 2025-09-10 14:55:11,822 console_span_processor:48 telemetry: output: {'chunks': [{'content': 'Acme ships globally in 3-5 business days.',
'metadata': {'document_id': 'file-489db9aae0424745960e3408ff0f477f', 'token_count': 12, 'metadata_token_count': 1}, 'embedding':
[-0.012346820905804634, -0.04591671749949455, 0.00545357633382082, 0.0767817348241806, -0.01030217856168747, -0.07128783315420151,
-0.047789815813302994, -0.0042580426670610905, -0.08333089202642441, 0.03493816778063774, 0.03678377717733383, -0.022125769406557083,
-0.001785362372174859, 0.03860057145357132, 0.017692940309643745, -0.011320478282868862, 0.020480643957853317, -0.14444826543331146,
-0.03509785607457161, -0.08347956091165543, 0.01723267324268818, -0.020868107676506042, -0.04816542565822601, -0.04063615947961807,
-0.02612607553601265, -0.06816241890192032, -0.021907860413193703, -0.05328420177102089, 0.0035953382030129433, -0.060775868594646454,
-0.07895789295434952, 0.08725343644618988, -0.004096562508493662, 0.07713106274604797, 0.04764929413795471, 0.03390089422464371, -0.03...
INFO 2025-09-10 14:55:11,831 console_span_processor:39 telemetry: 21:55:11.824 [END] VectorDBsRoutingTable.openai_search_vector_store
[StatusCode.OK] (524.43ms)
INFO 2025-09-10 14:55:11,832 console_span_processor:48 telemetry: output: {'object': 'vector_store.search_results.page', 'search_query': 'How
long does shipping take?', 'data': [{'file_id': '', 'filename': '', 'score': 1.0150761400159014, 'attributes': {'document_id':
'file-489db9aae0424745960e3408ff0f477f', 'token_count': 12.0, 'metadata_token_count': 1.0}, 'content': [{'type': 'text', 'text': 'Acme ships
globally in 3-5 business days.'}]}], 'has_more': False, 'next_page': None}
INFO 2025-09-10 14:55:11,837 console_span_processor:39 telemetry: 21:55:11.834 [END] VectorIORouter.openai_search_vector_store [StatusCode.OK]
(535.84ms)
INFO 2025-09-10 14:55:11,838 console_span_processor:48 telemetry: output: {'object': 'vector_store.search_results.page', 'search_query': 'How
long does shipping take?', 'data': [{'file_id': '', 'filename': '', 'score': 1.0150761400159014, 'attributes': {'document_id':
'file-489db9aae0424745960e3408ff0f477f', 'token_count': 12.0, 'metadata_token_count': 1.0}, 'content': [{'type': 'text', 'text': 'Acme ships
globally in 3-5 business days.'}]}], 'has_more': False, 'next_page': None}
INFO 2025-09-10 14:55:11,843 console_span_processor:39 telemetry: 21:55:11.840 [END] /v1/openai/v1/vector_stores/{vector_store_id}/search
[StatusCode.OK] (550.67ms)
INFO 2025-09-10 14:55:11,844 console_span_processor:48 telemetry: raw_path:
/v1/openai/v1/vector_stores/vs_dab05212-db05-402c-91ef-57e41797406b/search
INFO 2025-09-10 14:55:11,844 console_span_processor:62 telemetry: 21:55:11.728 [INFO] 127.0.0.1:57863 - "POST
/v1/openai/v1/vector_stores/vs_dab05212-db05-402c-91ef-57e41797406b/search HTTP/1.1" 200
INFO 2025-09-10 14:55:11,845 console_span_processor:28 telemetry: 21:55:11.845 [START] /v1/openai/v1/chat/completions
INFO 2025-09-10 14:55:11,848 console_span_processor:39 telemetry: 21:55:11.846 [END] ModelsRoutingTable.get_model [StatusCode.OK] (0.15ms)
INFO 2025-09-10 14:55:11,849 console_span_processor:48 telemetry: output: {'identifier': 'together/meta-llama/Llama-3.3-70B-Instruct-Turbo',
'provider_resource_id': 'meta-llama/Llama-3.3-70B-Instruct-Turbo', 'provider_id': 'together', 'type': 'model', 'owner': None, 'source':
'listed_from_provider', 'metadata': {}, 'model_type': 'llm'}
INFO 2025-09-10 14:55:11,866 console_span_processor:39 telemetry: 21:55:11.850 [END] ModelsRoutingTable.get_provider_impl [StatusCode.OK] (0.33ms)
INFO 2025-09-10 14:55:11,866 console_span_processor:48 telemetry: output:
<llama_stack.providers.remote.inference.together.together.TogetherInferenceAdapter object at 0x137069220>
INFO 2025-09-10 14:55:11,893 console_span_processor:39 telemetry: 21:55:11.868 [END] ModelsRoutingTable.get_model [StatusCode.OK] (0.18ms)
INFO 2025-09-10 14:55:11,894 console_span_processor:48 telemetry: output: {'identifier': 'together/meta-llama/Llama-3.3-70B-Instruct-Turbo',
'provider_resource_id': 'meta-llama/Llama-3.3-70B-Instruct-Turbo', 'provider_id': 'together', 'type': 'model', 'owner': None, 'source':
'listed_from_provider', 'metadata': {}, 'model_type': 'llm'}
INFO 2025-09-10 14:55:12,290 console_span_processor:39 telemetry: 21:55:12.288 [END] TogetherInferenceAdapter.openai_chat_completion
[StatusCode.OK] (421.30ms)
INFO 2025-09-10 14:55:12,291 console_span_processor:48 telemetry: output: {'id': 'oAiudJu-62bZhn-97d22b1098a9ed39', 'choices':
[{'finish_reason': 'stop', 'index': 0, 'logprobs': None, 'message': {'content': 'Thought: I now know the final answer\nFinal Answer: Acme
ships globally in 3-5 business days.', 'refusal': None, 'role': 'assistant', 'annotations': None, 'audio': None, 'function_call': None,
'tool_calls': []}, 'seed': 9970525031584217000}], 'created': 1757541312, 'model': 'meta-llama/Llama-3.3-70B-Instruct-Turbo', 'object':
'chat.completion', 'service_tier': None, 'system_fingerprint': None, 'usage': {'completion_tokens': 25, 'prompt_tokens': 655, 'total_tokens':
680, 'completion_tokens_details': None, 'prompt_tokens_details': None, 'cached_tokens': 512}, 'prompt': []}
INFO 2025-09-10 14:55:12,297 uvicorn.access:473 uncategorized: ::1:57854 - "POST /v1/openai/v1/chat/completions HTTP/1.1" 200
INFO 2025-09-10 14:55:12,324 console_span_processor:39 telemetry: 21:55:12.298 [END] InferenceRouter.openai_chat_completion [StatusCode.OK]
(451.81ms)
INFO 2025-09-10 14:55:12,326 console_span_processor:48 telemetry: output: {'id': 'oAiudJu-62bZhn-97d22b1098a9ed39', 'choices':
[{'finish_reason': 'stop', 'index': 0, 'logprobs': None, 'message': {'content': 'Thought: I now know the final answer\nFinal Answer: Acme
ships globally in 3-5 business days.', 'refusal': None, 'role': 'assistant', 'annotations': None, 'audio': None, 'function_call': None,
'tool_calls': None}, 'seed': 9970525031584217000}], 'created': 1757541312, 'model': 'meta-llama/Llama-3.3-70B-Instruct-Turbo', 'object':
'chat.completion', 'service_tier': None, 'system_fingerprint': None, 'usage': {'completion_tokens': 25, 'prompt_tokens': 655, 'total_tokens':
680, 'completion_tokens_details': None, 'prompt_tokens_details': None, 'cached_tokens': 512}, 'prompt': [], 'metrics': [{'trace_id':
'b0fe401af1dce917b7278f7a651b67bc', 'span_id': '7130a92e6a6a8fba', 'timestamp': '2025-09-10T21:55:12.297305Z', 'attributes': {'model_id':
'together/meta-llama/Llama-3.3-70B-Instruct-Turbo', 'provider_id': 'together'}, 'type': 'metric', 'metric': 'prompt_toke...
INFO 2025-09-10 14:55:12,327 console_span_processor:62 telemetry: 21:55:12.297 [INFO] metric.prompt_tokens
INFO 2025-09-10 14:55:12,328 console_span_processor:67 telemetry: value: 655
INFO 2025-09-10 14:55:12,328 console_span_processor:67 telemetry: unit: tokens
INFO 2025-09-10 14:55:12,329 console_span_processor:67 telemetry: model_id: together/meta-llama/Llama-3.3-70B-Instruct-Turbo
INFO 2025-09-10 14:55:12,329 console_span_processor:67 telemetry: provider_id: together
INFO 2025-09-10 14:55:12,329 console_span_processor:62 telemetry: 21:55:12.297 [INFO] metric.completion_tokens
INFO 2025-09-10 14:55:12,330 console_span_processor:67 telemetry: value: 25
INFO 2025-09-10 14:55:12,330 console_span_processor:67 telemetry: unit: tokens
INFO 2025-09-10 14:55:12,331 console_span_processor:67 telemetry: model_id: together/meta-llama/Llama-3.3-70B-Instruct-Turbo
INFO 2025-09-10 14:55:12,331 console_span_processor:67 telemetry: provider_id: together
INFO 2025-09-10 14:55:12,332 console_span_processor:62 telemetry: 21:55:12.297 [INFO] metric.total_tokens
INFO 2025-09-10 14:55:12,332 console_span_processor:67 telemetry: value: 680
INFO 2025-09-10 14:55:12,332 console_span_processor:67 telemetry: unit: tokens
INFO 2025-09-10 14:55:12,333 console_span_processor:67 telemetry: model_id: together/meta-llama/Llama-3.3-70B-Instruct-Turbo
INFO 2025-09-10 14:55:12,333 console_span_processor:67 telemetry: provider_id: together
INFO 2025-09-10 14:55:12,353 console_span_processor:39 telemetry: 21:55:12.335 [END] /v1/openai/v1/chat/completions [StatusCode.OK] (489.36ms)
INFO 2025-09-10 14:55:12,355 console_span_processor:48 telemetry: raw_path: /v1/openai/v1/chat/completions
INFO 2025-09-10 14:55:12,358 console_span_processor:62 telemetry: 21:55:12.298 [INFO] ::1:57854 - "POST /v1/openai/v1/chat/completions HTTP/1.1"
200
INFO 2025-09-10 14:55:19,314 console_span_processor:28 telemetry: 21:55:19.314 [START] /v1/openai/v1/chat/completions
INFO 2025-09-10 14:55:19,320 console_span_processor:39 telemetry: 21:55:19.316 [END] ModelsRoutingTable.get_model [StatusCode.OK] (0.15ms)
INFO 2025-09-10 14:55:19,322 console_span_processor:48 telemetry: output: {'identifier': 'together/meta-llama/Llama-3.3-70B-Instruct-Turbo',
'provider_resource_id': 'meta-llama/Llama-3.3-70B-Instruct-Turbo', 'provider_id': 'together', 'type': 'model', 'owner': None, 'source':
'listed_from_provider', 'metadata': {}, 'model_type': 'llm'}
INFO 2025-09-10 14:55:19,325 console_span_processor:39 telemetry: 21:55:19.323 [END] ModelsRoutingTable.get_provider_impl [StatusCode.OK] (0.17ms)
INFO 2025-09-10 14:55:19,326 console_span_processor:48 telemetry: output:
<llama_stack.providers.remote.inference.together.together.TogetherInferenceAdapter object at 0x137069220>
INFO 2025-09-10 14:55:19,331 console_span_processor:39 telemetry: 21:55:19.327 [END] ModelsRoutingTable.get_model [StatusCode.OK] (0.23ms)
INFO 2025-09-10 14:55:19,332 console_span_processor:48 telemetry: output: {'identifier': 'together/meta-llama/Llama-3.3-70B-Instruct-Turbo',
'provider_resource_id': 'meta-llama/Llama-3.3-70B-Instruct-Turbo', 'provider_id': 'together', 'type': 'model', 'owner': None, 'source':
'listed_from_provider', 'metadata': {}, 'model_type': 'llm'}
INFO 2025-09-10 14:55:21,608 console_span_processor:39 telemetry: 21:55:21.606 [END] TogetherInferenceAdapter.openai_chat_completion
[StatusCode.OK] (2279.25ms)
INFO 2025-09-10 14:55:21,610 console_span_processor:48 telemetry: output: {'id': 'oAiufav-4YNCb4-97d22b3f6cb27af2', 'choices':
[{'finish_reason': 'stop', 'index': 0, 'logprobs': None, 'message': {'content': 'Thought: To answer the question "Can I return a product
after 40 days?", I need to search the vector store to find relevant information about the return policy. I will use the Llama Stack Vector
Store RAG tool to search the provided vector store ID.\n\nAction: Llama Stack Vector Store RAG tool\nAction Input: {"query": "return policy
after 40 days", "vector_store_id": "vs_dab05212-db05-402c-91ef-57e41797406b", "top_k": 1, "score_threshold": 0.5}', 'refusal': None, 'role':
'assistant', 'annotations': None, 'audio': None, 'function_call': None, 'tool_calls': []}, 'seed': 17340032880891308000}], 'created':
1757541319, 'model': 'meta-llama/Llama-3.3-70B-Instruct-Turbo', 'object': 'chat.completion', 'service_tier': None, 'system_fingerprint':
None, 'usage': {'completion_tokens': 124, 'prompt_tokens': 499, 'total_tokens': 623, 'completion_tokens_details': No...
INFO 2025-09-10 14:55:21,611 uvicorn.access:473 uncategorized: ::1:57884 - "POST /v1/openai/v1/chat/completions HTTP/1.1" 200
INFO 2025-09-10 14:55:21,631 console_span_processor:39 telemetry: 21:55:21.612 [END] InferenceRouter.openai_chat_completion [StatusCode.OK]
(2297.16ms)
INFO 2025-09-10 14:55:21,632 console_span_processor:48 telemetry: output: {'id': 'oAiufav-4YNCb4-97d22b3f6cb27af2', 'choices':
[{'finish_reason': 'stop', 'index': 0, 'logprobs': None, 'message': {'content': 'Thought: To answer the question "Can I return a product
after 40 days?", I need to search the vector store to find relevant information about the return policy. I will use the Llama Stack Vector
Store RAG tool to search the provided vector store ID.\n\nAction: Llama Stack Vector Store RAG tool\nAction Input: {"query": "return policy
after 40 days", "vector_store_id": "vs_dab05212-db05-402c-91ef-57e41797406b", "top_k": 1, "score_threshold": 0.5}', 'refusal': None, 'role':
'assistant', 'annotations': None, 'audio': None, 'function_call': None, 'tool_calls': None}, 'seed': 17340032880891308000}], 'created':
1757541319, 'model': 'meta-llama/Llama-3.3-70B-Instruct-Turbo', 'object': 'chat.completion', 'service_tier': None, 'system_fingerprint':
None, 'usage': {'completion_tokens': 124, 'prompt_tokens': 499, 'total_tokens': 623, 'completion_tokens_details': ...
INFO 2025-09-10 14:55:21,636 console_span_processor:62 telemetry: 21:55:21.611 [INFO] metric.prompt_tokens
INFO 2025-09-10 14:55:21,637 console_span_processor:67 telemetry: value: 499
INFO 2025-09-10 14:55:21,638 console_span_processor:67 telemetry: unit: tokens
INFO 2025-09-10 14:55:21,638 console_span_processor:67 telemetry: model_id: together/meta-llama/Llama-3.3-70B-Instruct-Turbo
INFO 2025-09-10 14:55:21,639 console_span_processor:67 telemetry: provider_id: together
INFO 2025-09-10 14:55:21,639 console_span_processor:62 telemetry: 21:55:21.611 [INFO] metric.completion_tokens
INFO 2025-09-10 14:55:21,639 console_span_processor:67 telemetry: value: 124
INFO 2025-09-10 14:55:21,640 console_span_processor:67 telemetry: unit: tokens
INFO 2025-09-10 14:55:21,640 console_span_processor:67 telemetry: model_id: together/meta-llama/Llama-3.3-70B-Instruct-Turbo
INFO 2025-09-10 14:55:21,641 console_span_processor:67 telemetry: provider_id: together
INFO 2025-09-10 14:55:21,641 console_span_processor:62 telemetry: 21:55:21.611 [INFO] metric.total_tokens
INFO 2025-09-10 14:55:21,641 console_span_processor:67 telemetry: value: 623
INFO 2025-09-10 14:55:21,642 console_span_processor:67 telemetry: unit: tokens
INFO 2025-09-10 14:55:21,642 console_span_processor:67 telemetry: model_id: together/meta-llama/Llama-3.3-70B-Instruct-Turbo
INFO 2025-09-10 14:55:21,642 console_span_processor:67 telemetry: provider_id: together
INFO 2025-09-10 14:55:21,648 console_span_processor:39 telemetry: 21:55:21.643 [END] /v1/openai/v1/chat/completions [StatusCode.OK] (2329.06ms)
INFO 2025-09-10 14:55:21,649 console_span_processor:48 telemetry: raw_path: /v1/openai/v1/chat/completions
INFO 2025-09-10 14:55:21,650 console_span_processor:62 telemetry: 21:55:21.612 [INFO] ::1:57884 - "POST /v1/openai/v1/chat/completions HTTP/1.1"
200
INFO 2025-09-10 14:55:21,651 console_span_processor:28 telemetry: 21:55:21.651 [START] /v1/openai/v1/vector_stores/{vector_store_id}/search
INFO 2025-09-10 14:55:21,674 console_span_processor:39 telemetry: 21:55:21.654 [END] ModelsRoutingTable.get_model [StatusCode.OK] (0.21ms)
INFO 2025-09-10 14:55:21,675 console_span_processor:48 telemetry: output: {'identifier': 'sentence-transformers/all-MiniLM-L6-v2',
'provider_resource_id': 'all-MiniLM-L6-v2', 'provider_id': 'sentence-transformers', 'type': 'model', 'owner': None, 'source':
'listed_from_provider', 'metadata': {'embedding_dimension': 384}, 'model_type': 'embedding'}
INFO 2025-09-10 14:55:21,685 console_span_processor:39 telemetry: 21:55:21.678 [END] ModelsRoutingTable.get_provider_impl [StatusCode.OK] (0.70ms)
INFO 2025-09-10 14:55:21,687 console_span_processor:48 telemetry: output:
<llama_stack.providers.inline.inference.sentence_transformers.sentence_transformers.SentenceTransformersInferenceImpl object at 0x158e83350>
INFO 2025-09-10 14:55:21,692 console_span_processor:39 telemetry: 21:55:21.689 [END] ModelsRoutingTable.get_model [StatusCode.OK] (0.53ms)
INFO 2025-09-10 14:55:21,692 console_span_processor:48 telemetry: output: {'identifier': 'sentence-transformers/all-MiniLM-L6-v2',
'provider_resource_id': 'all-MiniLM-L6-v2', 'provider_id': 'sentence-transformers', 'type': 'model', 'owner': None, 'source':
'listed_from_provider', 'metadata': {'embedding_dimension': 384}, 'model_type': 'embedding'}
INFO 2025-09-10 14:55:22,019 uvicorn.access:473 uncategorized: 127.0.0.1:57888 - "POST
/v1/openai/v1/vector_stores/vs_dab05212-db05-402c-91ef-57e41797406b/search HTTP/1.1" 200
INFO 2025-09-10 14:55:22,024 console_span_processor:39 telemetry: 21:55:22.017 [END] InferenceRouter.openai_embeddings [StatusCode.OK] (363.31ms)
INFO 2025-09-10 14:55:22,025 console_span_processor:48 telemetry: output: {'object': 'list', 'data': [{'object': 'embedding', 'embedding':
[-0.0018892501248046756, 0.030758941546082497, 0.10938595235347748, 0.04589828848838806, 0.0006913804681971669, 0.014387426897883415,
-0.015357869677245617, -0.011600838042795658, -0.08975677192211151, 0.053308334201574326, 0.0744965448975563, 0.01633235439658165,
0.010754235088825226, 0.004617820493876934, 0.009704680182039738, -0.03412426635622978, -0.04056152328848839, -0.019626466557383537,
-0.08569952845573425, -0.043116409331560135, 0.025109080597758293, -0.03337268903851509, -0.06306783854961395, 0.021730247884988785,
0.01859521120786667, 0.0934692993760109, -0.02332254685461521, 0.03396535664796829, -0.04177931323647499, -0.011372999288141727,
0.015714162960648537, -0.04297734424471855, -0.06080453842878342, -0.05970568209886551, -0.013541588559746742, 0.04719769209623337,
-0.1263798028230667, -0.09081613272428513, -0.044160086661577225, 0.010452632792294025, -0.04007401689887047, 0.029781267046928406,
-0.03511...
INFO 2025-09-10 14:55:22,031 console_span_processor:39 telemetry: 21:55:22.027 [END] FaissVectorIOAdapter.query_chunks [StatusCode.OK] (373.68ms)
INFO 2025-09-10 14:55:22,032 console_span_processor:48 telemetry: output: {'chunks': [{'content': 'Returns are accepted within 30 days of
purchase.', 'metadata': {'document_id': 'file-b2f38b0e164347f5a2b6bbe211e33ff3', 'token_count': 10, 'metadata_token_count': 1}, 'embedding':
[-0.050018310546875, 0.0007208543829619884, 0.048539839684963226, 0.013606906868517399, -0.006504438817501068, 0.004046895541250706,
-0.04984626919031143, -8.024782437132671e-05, -0.02159256860613823, 0.0015519573353230953, 0.10069309175014496, 0.04437215253710747,
-0.022335151210427284, -0.05230937898159027, -0.028983373194932938, -0.049531035125255585, 0.03074926696717739, -0.03056054376065731,
0.021489247679710388, 0.016868554055690765, -0.028984908014535904, -0.07053273916244507, -0.022961033508181572, -0.0717858299612999,
0.0674479678273201, 0.021412895992398262, -0.06054700165987015, 0.021910998970270157, -0.023192649707198143, -0.028992125764489174,
0.025179730728268623, -0.006338999141007662, -0.001874048844911158, 0.009305929765105247, 0.011422501876950264, 0.0376049801707...
INFO 2025-09-10 14:55:22,057 console_span_processor:39 telemetry: 21:55:22.037 [END] VectorDBsRoutingTable.openai_search_vector_store
[StatusCode.OK] (384.28ms)
INFO 2025-09-10 14:55:22,058 console_span_processor:48 telemetry: output: {'object': 'vector_store.search_results.page', 'search_query':
'return policy after 40 days', 'data': [{'file_id': '', 'filename': '', 'score': 1.3987585167097674, 'attributes': {'document_id':
'file-b2f38b0e164347f5a2b6bbe211e33ff3', 'token_count': 10.0, 'metadata_token_count': 1.0}, 'content': [{'type': 'text', 'text': 'Returns are
accepted within 30 days of purchase.'}]}], 'has_more': False, 'next_page': None}
INFO 2025-09-10 14:55:22,063 console_span_processor:39 telemetry: 21:55:22.060 [END] VectorIORouter.openai_search_vector_store [StatusCode.OK]
(407.47ms)
INFO 2025-09-10 14:55:22,064 console_span_processor:48 telemetry: output: {'object': 'vector_store.search_results.page', 'search_query':
'return policy after 40 days', 'data': [{'file_id': '', 'filename': '', 'score': 1.3987585167097674, 'attributes': {'document_id':
'file-b2f38b0e164347f5a2b6bbe211e33ff3', 'token_count': 10.0, 'metadata_token_count': 1.0}, 'content': [{'type': 'text', 'text': 'Returns are
accepted within 30 days of purchase.'}]}], 'has_more': False, 'next_page': None}
INFO 2025-09-10 14:55:22,175 console_span_processor:39 telemetry: 21:55:22.096 [END] /v1/openai/v1/vector_stores/{vector_store_id}/search
[StatusCode.OK] (444.58ms)
INFO 2025-09-10 14:55:22,176 console_span_processor:48 telemetry: raw_path:
/v1/openai/v1/vector_stores/vs_dab05212-db05-402c-91ef-57e41797406b/search
INFO 2025-09-10 14:55:22,178 console_span_processor:62 telemetry: 21:55:22.021 [INFO] 127.0.0.1:57888 - "POST
/v1/openai/v1/vector_stores/vs_dab05212-db05-402c-91ef-57e41797406b/search HTTP/1.1" 200
INFO 2025-09-10 14:55:22,186 console_span_processor:28 telemetry: 21:55:22.186 [START] /v1/openai/v1/chat/completions
INFO 2025-09-10 14:55:22,195 console_span_processor:39 telemetry: 21:55:22.188 [END] ModelsRoutingTable.get_model [StatusCode.OK] (0.30ms)
INFO 2025-09-10 14:55:22,196 console_span_processor:48 telemetry: output: {'identifier': 'together/meta-llama/Llama-3.3-70B-Instruct-Turbo',
'provider_resource_id': 'meta-llama/Llama-3.3-70B-Instruct-Turbo', 'provider_id': 'together', 'type': 'model', 'owner': None, 'source':
'listed_from_provider', 'metadata': {}, 'model_type': 'llm'}
INFO 2025-09-10 14:55:22,218 console_span_processor:39 telemetry: 21:55:22.197 [END] ModelsRoutingTable.get_provider_impl [StatusCode.OK] (0.20ms)
INFO 2025-09-10 14:55:22,220 console_span_processor:48 telemetry: output:
<llama_stack.providers.remote.inference.together.together.TogetherInferenceAdapter object at 0x137069220>
INFO 2025-09-10 14:55:22,227 console_span_processor:39 telemetry: 21:55:22.224 [END] ModelsRoutingTable.get_model [StatusCode.OK] (0.19ms)
INFO 2025-09-10 14:55:22,228 console_span_processor:48 telemetry: output: {'identifier': 'together/meta-llama/Llama-3.3-70B-Instruct-Turbo',
'provider_resource_id': 'meta-llama/Llama-3.3-70B-Instruct-Turbo', 'provider_id': 'together', 'type': 'model', 'owner': None, 'source':
'listed_from_provider', 'metadata': {}, 'model_type': 'llm'}
INFO 2025-09-10 14:55:22,805 console_span_processor:39 telemetry: 21:55:22.801 [END] TogetherInferenceAdapter.openai_chat_completion
[StatusCode.OK] (577.41ms)
INFO 2025-09-10 14:55:22,806 console_span_processor:48 telemetry: output: {'id': 'oAiugR1-62bZhn-97d22b51096017f0', 'choices':
[{'finish_reason': 'stop', 'index': 0, 'logprobs': None, 'message': {'content': 'Thought: I now know the final answer\nFinal Answer: Returns
are accepted within 30 days of purchase.', 'refusal': None, 'role': 'assistant', 'annotations': None, 'audio': None, 'function_call': None,
'tool_calls': []}, 'seed': 2982499907717596700}], 'created': 1757541322, 'model': 'meta-llama/Llama-3.3-70B-Instruct-Turbo', 'object':
'chat.completion', 'service_tier': None, 'system_fingerprint': None, 'usage': {'completion_tokens': 23, 'prompt_tokens': 643, 'total_tokens':
666, 'completion_tokens_details': None, 'prompt_tokens_details': None, 'cached_tokens': 256}, 'prompt': []}
INFO 2025-09-10 14:55:22,834 uvicorn.access:473 uncategorized: ::1:57884 - "POST /v1/openai/v1/chat/completions HTTP/1.1" 200
INFO 2025-09-10 14:55:22,873 console_span_processor:39 telemetry: 21:55:22.836 [END] InferenceRouter.openai_chat_completion [StatusCode.OK]
(648.69ms)
INFO 2025-09-10 14:55:22,874 console_span_processor:48 telemetry: output: {'id': 'oAiugR1-62bZhn-97d22b51096017f0', 'choices':
[{'finish_reason': 'stop', 'index': 0, 'logprobs': None, 'message': {'content': 'Thought: I now know the final answer\nFinal Answer: Returns
are accepted within 30 days of purchase.', 'refusal': None, 'role': 'assistant', 'annotations': None, 'audio': None, 'function_call': None,
'tool_calls': None}, 'seed': 2982499907717596700}], 'created': 1757541322, 'model': 'meta-llama/Llama-3.3-70B-Instruct-Turbo', 'object':
'chat.completion', 'service_tier': None, 'system_fingerprint': None, 'usage': {'completion_tokens': 23, 'prompt_tokens': 643, 'total_tokens':
666, 'completion_tokens_details': None, 'prompt_tokens_details': None, 'cached_tokens': 256}, 'prompt': [], 'metrics': [{'trace_id':
'd588c782bd804c0cb49e43ac8c028e7a', 'span_id': '396bc114a416fc6c', 'timestamp': '2025-09-10T21:55:22.832220Z', 'attributes': {'model_id':
'together/meta-llama/Llama-3.3-70B-Instruct-Turbo', 'provider_id': 'together'}, 'type': 'metric', 'metric': 'prom...
INFO 2025-09-10 14:55:22,876 console_span_processor:62 telemetry: 21:55:22.832 [INFO] metric.prompt_tokens
INFO 2025-09-10 14:55:22,877 console_span_processor:67 telemetry: value: 643
INFO 2025-09-10 14:55:22,878 console_span_processor:67 telemetry: unit: tokens
INFO 2025-09-10 14:55:22,878 console_span_processor:67 telemetry: model_id: together/meta-llama/Llama-3.3-70B-Instruct-Turbo
INFO 2025-09-10 14:55:22,879 console_span_processor:67 telemetry: provider_id: together
INFO 2025-09-10 14:55:22,879 console_span_processor:62 telemetry: 21:55:22.832 [INFO] metric.completion_tokens
INFO 2025-09-10 14:55:22,880 console_span_processor:67 telemetry: value: 23
INFO 2025-09-10 14:55:22,881 console_span_processor:67 telemetry: unit: tokens
INFO 2025-09-10 14:55:22,881 console_span_processor:67 telemetry: model_id: together/meta-llama/Llama-3.3-70B-Instruct-Turbo
INFO 2025-09-10 14:55:22,882 console_span_processor:67 telemetry: provider_id: together
INFO 2025-09-10 14:55:22,882 console_span_processor:62 telemetry: 21:55:22.832 [INFO] metric.total_tokens
INFO 2025-09-10 14:55:22,883 console_span_processor:67 telemetry: value: 666
INFO 2025-09-10 14:55:22,886 console_span_processor:67 telemetry: unit: tokens
INFO 2025-09-10 14:55:22,887 console_span_processor:67 telemetry: model_id: together/meta-llama/Llama-3.3-70B-Instruct-Turbo
INFO 2025-09-10 14:55:22,888 console_span_processor:67 telemetry: provider_id: together
INFO 2025-09-10 14:55:22,913 console_span_processor:39 telemetry: 21:55:22.891 [END] /v1/openai/v1/chat/completions [StatusCode.OK] (704.86ms)
INFO 2025-09-10 14:55:22,915 console_span_processor:48 telemetry: raw_path: /v1/openai/v1/chat/completions
INFO 2025-09-10 14:55:22,915 console_span_processor:62 telemetry: 21:55:22.835 [INFO] ::1:57884 - "POST /v1/openai/v1/chat/completions HTTP/1.1"
200
INFO 2025-09-10 14:57:34,753 uvicorn.error:264 uncategorized: Shutting down
INFO 2025-09-10 14:57:34,867 uvicorn.error:67 uncategorized: Waiting for application shutdown.
INFO 2025-09-10 14:57:34,868 __main__:170 core::server: Shutting down
INFO 2025-09-10 14:57:34,868 llama_stack.core.stack:357 core: Shutting down ModelsRoutingTable
INFO 2025-09-10 14:57:34,869 llama_stack.core.stack:357 core: Shutting down DatasetsRoutingTable
INFO 2025-09-10 14:57:34,870 llama_stack.core.stack:357 core: Shutting down DatasetIORouter
INFO 2025-09-10 14:57:34,870 llama_stack.core.stack:357 core: Shutting down TelemetryAdapter
INFO 2025-09-10 14:57:34,871 llama_stack.core.stack:357 core: Shutting down InferenceRouter
INFO 2025-09-10 14:57:34,874 llama_stack.core.stack:357 core: Shutting down LocalfsFilesImpl
INFO 2025-09-10 14:57:34,875 llama_stack.core.stack:357 core: Shutting down ShieldsRoutingTable
INFO 2025-09-10 14:57:34,876 llama_stack.core.stack:357 core: Shutting down SafetyRouter
INFO 2025-09-10 14:57:34,877 llama_stack.core.stack:357 core: Shutting down VectorDBsRoutingTable
INFO 2025-09-10 14:57:34,877 llama_stack.core.stack:357 core: Shutting down VectorIORouter
INFO 2025-09-10 14:57:34,878 llama_stack.core.stack:357 core: Shutting down ToolGroupsRoutingTable
INFO 2025-09-10 14:57:34,878 llama_stack.core.stack:357 core: Shutting down ToolRuntimeRouter
INFO 2025-09-10 14:57:34,879 llama_stack.core.stack:357 core: Shutting down MetaReferenceAgentsImpl
INFO 2025-09-10 14:57:34,879 llama_stack.core.stack:357 core: Shutting down TorchtunePostTrainingImpl
INFO 2025-09-10 14:57:34,881 llama_stack.core.stack:357 core: Shutting down ScoringFunctionsRoutingTable
INFO 2025-09-10 14:57:34,882 llama_stack.core.stack:357 core: Shutting down ScoringRouter
INFO 2025-09-10 14:57:34,882 llama_stack.core.stack:357 core: Shutting down ReferenceBatchesImpl
INFO 2025-09-10 14:57:34,883 llama_stack.core.stack:357 core: Shutting down BenchmarksRoutingTable
INFO 2025-09-10 14:57:34,884 llama_stack.core.stack:357 core: Shutting down EvalRouter
INFO 2025-09-10 14:57:34,884 llama_stack.core.stack:357 core: Shutting down DistributionInspectImpl
INFO 2025-09-10 14:57:34,885 llama_stack.core.stack:357 core: Shutting down ProviderImpl
INFO 2025-09-10 14:57:34,886 uvicorn.error:76 uncategorized: Application shutdown complete.
INFO 2025-09-10 14:57:34,887 uvicorn.error:94 uncategorized: Finished server process [26795]
/Users/kaiwu/miniconda3/lib/python3.12/multiprocessing/resource_tracker.py:255: UserWarning: resource_tracker: There appear to be 1 leaked semaphore objects to clean up at shutdown
warnings.warn('resource_tracker: There appear to be %d '
Installed 3 packages in 165ms
INFO 2025-09-10 14:47:19,351 llama_stack.core.utils.config_resolution:52 core: Using distribution:
/Users/kaiwu/work/kaiwu/llama-stack/llama_stack/distributions/starter/run.yaml
INFO 2025-09-10 14:47:19,353 llama_stack.cli.stack.run:129 cli: Using run configuration:
/Users/kaiwu/work/kaiwu/llama-stack/llama_stack/distributions/starter/run.yaml
Using virtual environment: /Users/kaiwu/work/kaiwu/llama-stack/.venv
Virtual environment already activated
+ '[' -n /Users/kaiwu/work/kaiwu/llama-stack/llama_stack/distributions/starter/run.yaml ']'
+ yaml_config_arg=/Users/kaiwu/work/kaiwu/llama-stack/llama_stack/distributions/starter/run.yaml
+ python -m llama_stack.core.server.server /Users/kaiwu/work/kaiwu/llama-stack/llama_stack/distributions/starter/run.yaml --port 8321
INFO 2025-09-10 14:47:23,918 llama_stack.core.utils.config_resolution:45 core: Using file path:
/Users/kaiwu/work/kaiwu/llama-stack/llama_stack/distributions/starter/run.yaml
INFO 2025-09-10 14:47:23,929 __main__:615 core::server: Run configuration:
INFO 2025-09-10 14:47:23,933 __main__:618 core::server: apis:
- agents
- batches
- datasetio
- eval
- files
- inference
- post_training
- safety
- scoring
- telemetry
- tool_runtime
- vector_io
benchmarks: []
datasets: []
image_name: starter
inference_store:
db_path: /Users/kaiwu/.llama/distributions/starter/inference_store.db
type: sqlite
metadata_store:
db_path: /Users/kaiwu/.llama/distributions/starter/registry.db
type: sqlite
models: []
providers:
agents:
- config:
persistence_store:
db_path: /Users/kaiwu/.llama/distributions/starter/agents_store.db
type: sqlite
responses_store:
db_path: /Users/kaiwu/.llama/distributions/starter/responses_store.db
type: sqlite
provider_id: meta-reference
provider_type: inline::meta-reference
batches:
- config:
kvstore:
db_path: /Users/kaiwu/.llama/distributions/starter/batches.db
type: sqlite
provider_id: reference
provider_type: inline::reference
datasetio:
- config:
kvstore:
db_path: /Users/kaiwu/.llama/distributions/starter/huggingface_datasetio.db
type: sqlite
provider_id: huggingface
provider_type: remote::huggingface
- config:
kvstore:
db_path: /Users/kaiwu/.llama/distributions/starter/localfs_datasetio.db
type: sqlite
provider_id: localfs
provider_type: inline::localfs
eval:
- config:
kvstore:
db_path: /Users/kaiwu/.llama/distributions/starter/meta_reference_eval.db
type: sqlite
provider_id: meta-reference
provider_type: inline::meta-reference
files:
- config:
metadata_store:
db_path: /Users/kaiwu/.llama/distributions/starter/files_metadata.db
type: sqlite
storage_dir: /Users/kaiwu/.llama/distributions/starter/files
provider_id: meta-reference-files
provider_type: inline::localfs
inference:
- config:
api_key: '********'
url: https://api.fireworks.ai/inference/v1
provider_id: fireworks
provider_type: remote::fireworks
- config:
api_key: '********'
url: https://api.together.xyz/v1
provider_id: together
provider_type: remote::together
- config: {}
provider_id: bedrock
provider_type: remote::bedrock
- config:
api_key: '********'
base_url: https://api.openai.com/v1
provider_id: openai
provider_type: remote::openai
- config:
api_key: '********'
provider_id: anthropic
provider_type: remote::anthropic
- config:
api_key: '********'
provider_id: gemini
provider_type: remote::gemini
- config:
api_key: '********'
url: https://api.groq.com
provider_id: groq
provider_type: remote::groq
- config:
api_key: '********'
url: https://api.sambanova.ai/v1
provider_id: sambanova
provider_type: remote::sambanova
- config: {}
provider_id: sentence-transformers
provider_type: inline::sentence-transformers
post_training:
- config:
checkpoint_format: meta
provider_id: torchtune-cpu
provider_type: inline::torchtune-cpu
safety:
- config:
excluded_categories: []
provider_id: llama-guard
provider_type: inline::llama-guard
- config: {}
provider_id: code-scanner
provider_type: inline::code-scanner
scoring:
- config: {}
provider_id: basic
provider_type: inline::basic
- config: {}
provider_id: llm-as-judge
provider_type: inline::llm-as-judge
- config:
openai_api_key: '********'
provider_id: braintrust
provider_type: inline::braintrust
telemetry:
- config:
service_name: "\u200B"
sinks: console,sqlite
sqlite_db_path: /Users/kaiwu/.llama/distributions/starter/trace_store.db
provider_id: meta-reference
provider_type: inline::meta-reference
tool_runtime:
- config:
api_key: '********'
max_results: 3
provider_id: brave-search
provider_type: remote::brave-search
- config:
api_key: '********'
max_results: 3
provider_id: tavily-search
provider_type: remote::tavily-search
- config: {}
provider_id: rag-runtime
provider_type: inline::rag-runtime
- config: {}
provider_id: model-context-protocol
provider_type: remote::model-context-protocol
vector_io:
- config:
kvstore:
db_path: /Users/kaiwu/.llama/distributions/starter/faiss_store.db
type: sqlite
provider_id: faiss
provider_type: inline::faiss
- config:
db_path: /Users/kaiwu/.llama/distributions/starter/sqlite_vec.db
kvstore:
db_path: /Users/kaiwu/.llama/distributions/starter/sqlite_vec_registry.db
type: sqlite
provider_id: sqlite-vec
provider_type: inline::sqlite-vec
scoring_fns: []
server:
port: 8321
shields: []
tool_groups:
- provider_id: tavily-search
toolgroup_id: builtin::websearch
- provider_id: rag-runtime
toolgroup_id: builtin::rag
vector_dbs: []
version: 2
INFO 2025-09-10 14:47:34,785 llama_stack.core.stack:388 core: starting registry refresh task
INFO 2025-09-10 14:47:34,946 __main__:580 core::server: Listening on ['::', '0.0.0.0']:8321
INFO 2025-09-10 14:47:35,196 uvicorn.error:84 uncategorized: Started server process [26795]
INFO 2025-09-10 14:47:35,197 uvicorn.error:48 uncategorized: Waiting for application startup.
INFO 2025-09-10 14:47:35,198 __main__:168 core::server: Starting up
INFO 2025-09-10 14:47:35,199 uvicorn.error:62 uncategorized: Application startup complete.
INFO 2025-09-10 14:47:35,199 uvicorn.error:216 uncategorized: Uvicorn running on http://['::', '0.0.0.0']:8321 (Press CTRL+C to quit)
INFO 2025-09-10 14:47:36,852 uvicorn.access:473 uncategorized: 127.0.0.1:55733 - "GET /v1/health HTTP/1.1" 200
INFO 2025-09-10 14:47:36,854 console_span_processor:28 telemetry: 21:47:36.854 [START] /v1/health
INFO 2025-09-10 14:47:36,862 console_span_processor:39 telemetry: 21:47:36.855 [END] /v1/health [StatusCode.OK] (1.07ms)
INFO 2025-09-10 14:47:36,865 console_span_processor:48 telemetry: raw_path: /v1/health
INFO 2025-09-10 14:47:36,866 console_span_processor:62 telemetry: 21:47:36.853 [INFO] 127.0.0.1:55733 - "GET /v1/health HTTP/1.1" 200
INFO 2025-09-10 14:48:28,324 uvicorn.access:473 uncategorized: 127.0.0.1:56006 - "GET /v1/models HTTP/1.1" 200
INFO 2025-09-10 14:48:28,333 console_span_processor:28 telemetry: 21:48:28.332 [START] /v1/models
INFO 2025-09-10 14:48:28,392 console_span_processor:39 telemetry: 21:48:28.334 [END] ModelsRoutingTable.list_models [StatusCode.OK] (0.19ms)
INFO 2025-09-10 14:48:28,410 console_span_processor:48 telemetry: output: {'data': [{'identifier': 'llama_api/Llama-3.3-70B-Instruct',
'provider_resource_id': 'Llama-3.3-70B-Instruct', 'provider_id': 'llama_api', 'type': 'model', 'metadata': {}, 'model_type': 'llm'},
{'identifier': 'llama_api/Llama-4-Maverick-17B-128E-Instruct-FP8', 'provider_resource_id': 'Llama-4-Maverick-17B-128E-Instruct-FP8',
'provider_id': 'llama_api', 'type': 'model', 'metadata': {}, 'model_type': 'llm'}, {'identifier':
'llama_api/Llama-4-Scout-17B-16E-Instruct-FP8', 'provider_resource_id': 'Llama-4-Scout-17B-16E-Instruct-FP8', 'provider_id': 'llama_api',
'type': 'model', 'metadata': {}, 'model_type': 'llm'}, {'identifier': 'meta-llama/Llama-3.3-70B-Instruct', 'provider_resource_id':
'Llama-3.3-70B-Instruct', 'provider_id': 'meta-llama', 'type': 'model', 'metadata': {}, 'model_type': 'llm'}, {'identifier':
'meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8', 'provider_resource_id': 'Llama-4-Maverick-17B-128E-Instruct-FP8', 'provider_id':
'meta-llama', 'type': 'model', 'metadata': {...
INFO 2025-09-10 14:48:28,426 uvicorn.access:473 uncategorized: 127.0.0.1:56006 - "GET /v1/shields HTTP/1.1" 200
INFO 2025-09-10 14:48:28,465 console_span_processor:39 telemetry: 21:48:28.430 [END] /v1/models [StatusCode.OK] (97.81ms)
INFO 2025-09-10 14:48:28,466 console_span_processor:48 telemetry: raw_path: /v1/models
INFO 2025-09-10 14:48:28,466 console_span_processor:62 telemetry: 21:48:28.330 [INFO] 127.0.0.1:56006 - "GET /v1/models HTTP/1.1" 200
INFO 2025-09-10 14:48:28,468 console_span_processor:28 telemetry: 21:48:28.468 [START] /v1/shields
INFO 2025-09-10 14:48:28,523 console_span_processor:39 telemetry: 21:48:28.469 [END] ShieldsRoutingTable.list_shields [StatusCode.OK] (0.24ms)
INFO 2025-09-10 14:48:28,524 console_span_processor:48 telemetry: output: {'data': []}
INFO 2025-09-10 14:48:28,535 console_span_processor:39 telemetry: 21:48:28.527 [END] /v1/shields [StatusCode.OK] (59.54ms)
INFO 2025-09-10 14:48:28,536 console_span_processor:48 telemetry: raw_path: /v1/shields
INFO 2025-09-10 14:48:28,536 console_span_processor:62 telemetry: 21:48:28.427 [INFO] 127.0.0.1:56006 - "GET /v1/shields HTTP/1.1" 200
INFO 2025-09-10 14:48:32,432 console_span_processor:28 telemetry: 21:48:32.432 [START] /v1/openai/v1/files
WARNING 2025-09-10 14:48:32,437 __main__:220 core::server: Could not read or log request body for POST /v1/openai/v1/files: Stream consumed
INFO 2025-09-10 14:48:32,495 uvicorn.access:473 uncategorized: 127.0.0.1:56006 - "POST /v1/openai/v1/files HTTP/1.1" 200
WARNING 2025-09-10 14:48:32,502 __main__:220 core::server: Could not read or log request body for POST /v1/openai/v1/files: Stream consumed
INFO 2025-09-10 14:48:32,514 console_span_processor:39 telemetry: 21:48:32.496 [END] LocalfsFilesImpl.openai_upload_file [StatusCode.OK] (55.21ms)
INFO 2025-09-10 14:48:32,515 console_span_processor:48 telemetry: output: {'object': 'file', 'id': 'file-489db9aae0424745960e3408ff0f477f',
'bytes': 41, 'created_at': 1757540912, 'expires_at': 1789076912, 'filename': 'shipping_policy.txt', 'purpose': 'assistants'}
INFO 2025-09-10 14:48:32,523 uvicorn.access:473 uncategorized: 127.0.0.1:56006 - "POST /v1/openai/v1/files HTTP/1.1" 200
INFO 2025-09-10 14:48:32,526 console_span_processor:39 telemetry: 21:48:32.516 [END] /v1/openai/v1/files [StatusCode.OK] (84.71ms)
INFO 2025-09-10 14:48:32,528 console_span_processor:48 telemetry: raw_path: /v1/openai/v1/files
INFO 2025-09-10 14:48:32,529 console_span_processor:62 telemetry: 21:48:32.440 [WARN] Could not read or log request body for POST
/v1/openai/v1/files: Stream consumed
INFO 2025-09-10 14:48:32,529 console_span_processor:62 telemetry: 21:48:32.496 [INFO] 127.0.0.1:56006 - "POST /v1/openai/v1/files HTTP/1.1" 200
WARNING 2025-09-10 14:48:32,531 __main__:220 core::server: Could not read or log request body for POST /v1/openai/v1/files: Stream consumed
INFO 2025-09-10 14:48:32,532 console_span_processor:28 telemetry: 21:48:32.532 [START] /v1/openai/v1/files
INFO 2025-09-10 14:48:32,540 console_span_processor:39 telemetry: 21:48:32.533 [END] LocalfsFilesImpl.openai_upload_file [StatusCode.OK] (0.16ms)
INFO 2025-09-10 14:48:32,545 console_span_processor:48 telemetry: output: {'object': 'file', 'id': 'file-b2f38b0e164347f5a2b6bbe211e33ff3',
'bytes': 48, 'created_at': 1757540912, 'expires_at': 1789076912, 'filename': 'returns_policy.txt', 'purpose': 'assistants'}
INFO 2025-09-10 14:48:32,546 uvicorn.access:473 uncategorized: 127.0.0.1:56006 - "POST /v1/openai/v1/files HTTP/1.1" 200
INFO 2025-09-10 14:48:32,557 console_span_processor:39 telemetry: 21:48:32.547 [END] /v1/openai/v1/files [StatusCode.OK] (15.42ms)
INFO 2025-09-10 14:48:32,560 console_span_processor:48 telemetry: raw_path: /v1/openai/v1/files
INFO 2025-09-10 14:48:32,562 console_span_processor:62 telemetry: 21:48:32.502 [WARN] Could not read or log request body for POST
/v1/openai/v1/files: Stream consumed
INFO 2025-09-10 14:48:32,562 console_span_processor:62 telemetry: 21:48:32.526 [INFO] 127.0.0.1:56006 - "POST /v1/openai/v1/files HTTP/1.1" 200
INFO 2025-09-10 14:48:32,563 console_span_processor:28 telemetry: 21:48:32.563 [START] /v1/openai/v1/files
INFO 2025-09-10 14:48:32,581 console_span_processor:39 telemetry: 21:48:32.565 [END] LocalfsFilesImpl.openai_upload_file [StatusCode.OK] (0.19ms)
INFO 2025-09-10 14:48:32,582 console_span_processor:48 telemetry: output: {'object': 'file', 'id': 'file-6f6f157d165a4078b4abef66a095ccd6',
'bytes': 45, 'created_at': 1757540912, 'expires_at': 1789076912, 'filename': 'support.txt', 'purpose': 'assistants'}
INFO 2025-09-10 14:48:32,592 console_span_processor:39 telemetry: 21:48:32.584 [END] /v1/openai/v1/files [StatusCode.OK] (20.86ms)
INFO 2025-09-10 14:48:32,592 console_span_processor:48 telemetry: raw_path: /v1/openai/v1/files
INFO 2025-09-10 14:48:32,593 console_span_processor:62 telemetry: 21:48:32.531 [WARN] Could not read or log request body for POST
/v1/openai/v1/files: Stream consumed
INFO 2025-09-10 14:48:32,594 console_span_processor:62 telemetry: 21:48:32.546 [INFO] 127.0.0.1:56006 - "POST /v1/openai/v1/files HTTP/1.1" 200
INFO 2025-09-10 14:48:32,595 console_span_processor:28 telemetry: 21:48:32.595 [START] /v1/openai/v1/vector_stores
INFO 2025-09-10 14:48:32,601 console_span_processor:39 telemetry: 21:48:32.596 [END] FaissVectorIOAdapter.register_vector_db [StatusCode.OK]
(0.15ms)
INFO 2025-09-10 14:48:32,602 console_span_processor:48 telemetry: output:
INFO 2025-09-10 14:48:32,621 console_span_processor:39 telemetry: 21:48:32.604 [END] VectorDBsRoutingTable.register_vector_db [StatusCode.OK]
(8.25ms)
INFO 2025-09-10 14:48:32,622 console_span_processor:48 telemetry: output: {'identifier': 'vs_dab05212-db05-402c-91ef-57e41797406b',
'provider_resource_id': 'vs_dab05212-db05-402c-91ef-57e41797406b', 'provider_id': 'faiss', 'type': 'vector_db', 'owner': None, 'source':
'via_register_api', 'embedding_model': 'sentence-transformers/all-MiniLM-L6-v2', 'embedding_dimension': 384, 'vector_db_name': 'acme_docs'}
INFO 2025-09-10 14:48:32,631 console_span_processor:39 telemetry: 21:48:32.629 [END] FaissVectorIOAdapter.register_vector_db [StatusCode.OK]
(5.84ms)
INFO 2025-09-10 14:48:32,632 console_span_processor:48 telemetry: output:
INFO 2025-09-10 14:48:32,650 console_span_processor:39 telemetry: 21:48:32.640 [END] LocalfsFilesImpl.openai_retrieve_file [StatusCode.OK]
(2.11ms)
INFO 2025-09-10 14:48:32,655 llama_stack.providers.utils.inference.embedding_mixin:103 providers::utils: Loading sentence transformer for
all-MiniLM-L6-v2...
INFO 2025-09-10 14:48:32,660 console_span_processor:39 telemetry: 21:48:32.651 [END] LocalfsFilesImpl.openai_retrieve_file_content [StatusCode.OK]
(0.22ms)
INFO 2025-09-10 14:48:32,662 console_span_processor:39 telemetry: 21:48:32.661 [END] LocalfsFilesImpl.openai_retrieve_file_content [StatusCode.OK]
(0.23ms)
INFO 2025-09-10 14:48:32,670 console_span_processor:39 telemetry: 21:48:32.664 [END] LocalfsFilesImpl.openai_retrieve_file_content [StatusCode.OK]
(0.20ms)
INFO 2025-09-10 14:48:32,674 console_span_processor:39 telemetry: 21:48:32.672 [END] ModelsRoutingTable.get_model [StatusCode.OK] (0.77ms)
INFO 2025-09-10 14:48:32,675 console_span_processor:48 telemetry: output: {'identifier': 'sentence-transformers/all-MiniLM-L6-v2',
'provider_resource_id': 'all-MiniLM-L6-v2', 'provider_id': 'sentence-transformers', 'type': 'model', 'owner': None, 'source':
'listed_from_provider', 'metadata': {'embedding_dimension': 384}, 'model_type': 'embedding'}
INFO 2025-09-10 14:48:32,681 console_span_processor:39 telemetry: 21:48:32.677 [END] ModelsRoutingTable.get_provider_impl [StatusCode.OK] (0.36ms)
INFO 2025-09-10 14:48:32,682 console_span_processor:48 telemetry: output:
<llama_stack.providers.inline.inference.sentence_transformers.sentence_transformers.SentenceTransformersInferenceImpl object at 0x158e83350>
INFO 2025-09-10 14:48:32,690 console_span_processor:39 telemetry: 21:48:32.683 [END] ModelsRoutingTable.get_model [StatusCode.OK] (0.23ms)
INFO 2025-09-10 14:48:32,690 console_span_processor:48 telemetry: output: {'identifier': 'sentence-transformers/all-MiniLM-L6-v2',
'provider_resource_id': 'all-MiniLM-L6-v2', 'provider_id': 'sentence-transformers', 'type': 'model', 'owner': None, 'source':
'listed_from_provider', 'metadata': {'embedding_dimension': 384}, 'model_type': 'embedding'}
WARNING 2025-09-10 14:48:59,202 torchao.kernel.intmm:23 uncategorized: Warning: Detected no triton, on systems without Triton certain kernels will
not work
W0910 14:48:59.847000 26795 torch/distributed/elastic/multiprocessing/redirects.py:29] NOTE: Redirects are currently not supported in Windows or MacOs.
INFO 2025-09-10 14:49:05,098 sentence_transformers.SentenceTransformer:219 uncategorized: Use pytorch device_name: mps
INFO 2025-09-10 14:49:05,099 sentence_transformers.SentenceTransformer:227 uncategorized: Load pretrained SentenceTransformer: all-MiniLM-L6-v2
INFO 2025-09-10 14:49:09,461 console_span_processor:39 telemetry: 21:49:09.453 [END] InferenceRouter.openai_embeddings [StatusCode.OK]
(36781.46ms)
INFO 2025-09-10 14:49:09,462 console_span_processor:48 telemetry: output: {'object': 'list', 'data': [{'object': 'embedding', 'embedding':
[-0.012346820905804634, -0.04591671749949455, 0.00545357633382082, 0.0767817348241806, -0.01030217856168747, -0.07128783315420151,
-0.047789815813302994, -0.0042580426670610905, -0.08333089202642441, 0.03493816778063774, 0.03678377717733383, -0.022125769406557083,
-0.001785362372174859, 0.03860057145357132, 0.017692940309643745, -0.011320478282868862, 0.020480643957853317, -0.14444826543331146,
-0.03509785607457161, -0.08347956091165543, 0.01723267324268818, -0.020868107676506042, -0.04816542565822601, -0.04063615947961807,
-0.02612607553601265, -0.06816241890192032, -0.021907860413193703, -0.05328420177102089, 0.0035953382030129433, -0.060775868594646454,
-0.07895789295434952, 0.08725343644618988, -0.004096562508493662, 0.07713106274604797, 0.04764929413795471, 0.03390089422464371,
-0.03415430337190628, -0.10541579872369766, 0.0700988844037056, -0.03148755803704262, 0.07130879163742065, -0.0025789395440369844, 0.00581...
INFO 2025-09-10 14:49:09,463 console_span_processor:62 telemetry: 21:48:32.656 [INFO] Loading sentence transformer for all-MiniLM-L6-v2...
INFO 2025-09-10 14:49:09,464 console_span_processor:62 telemetry: 21:48:59.203 [WARN] Warning: Detected no triton, on systems without Triton
certain kernels will not work
INFO 2025-09-10 14:49:09,464 console_span_processor:62 telemetry: 21:49:05.099 [INFO] Use pytorch device_name: mps
INFO 2025-09-10 14:49:09,465 console_span_processor:62 telemetry: 21:49:05.100 [INFO] Load pretrained SentenceTransformer: all-MiniLM-L6-v2
INFO 2025-09-10 14:49:09,469 console_span_processor:39 telemetry: 21:49:09.468 [END] FaissVectorIOAdapter.insert_chunks [StatusCode.OK]
(36796.60ms)
INFO 2025-09-10 14:49:09,484 console_span_processor:39 telemetry: 21:49:09.480 [END] ModelsRoutingTable.get_model [StatusCode.OK] (0.19ms)
INFO 2025-09-10 14:49:09,484 console_span_processor:48 telemetry: output: {'identifier': 'sentence-transformers/all-MiniLM-L6-v2',
'provider_resource_id': 'all-MiniLM-L6-v2', 'provider_id': 'sentence-transformers', 'type': 'model', 'owner': None, 'source':
'listed_from_provider', 'metadata': {'embedding_dimension': 384}, 'model_type': 'embedding'}
INFO 2025-09-10 14:49:09,488 console_span_processor:39 telemetry: 21:49:09.486 [END] ModelsRoutingTable.get_provider_impl [StatusCode.OK] (0.17ms)
INFO 2025-09-10 14:49:09,488 console_span_processor:48 telemetry: output:
<llama_stack.providers.inline.inference.sentence_transformers.sentence_transformers.SentenceTransformersInferenceImpl object at 0x158e83350>
INFO 2025-09-10 14:49:09,492 console_span_processor:39 telemetry: 21:49:09.490 [END] ModelsRoutingTable.get_model [StatusCode.OK] (0.58ms)
INFO 2025-09-10 14:49:09,493 console_span_processor:48 telemetry: output: {'identifier': 'sentence-transformers/all-MiniLM-L6-v2',
'provider_resource_id': 'all-MiniLM-L6-v2', 'provider_id': 'sentence-transformers', 'type': 'model', 'owner': None, 'source':
'listed_from_provider', 'metadata': {'embedding_dimension': 384}, 'model_type': 'embedding'}
INFO 2025-09-10 14:49:09,924 console_span_processor:39 telemetry: 21:49:09.921 [END] InferenceRouter.openai_embeddings [StatusCode.OK] (441.92ms)
INFO 2025-09-10 14:49:09,926 console_span_processor:48 telemetry: output: {'object': 'list', 'data': [{'object': 'embedding', 'embedding':
[-0.050018310546875, 0.0007208543829619884, 0.048539839684963226, 0.013606906868517399, -0.006504438817501068, 0.004046895541250706,
-0.04984626919031143, -8.024782437132671e-05, -0.02159256860613823, 0.0015519573353230953, 0.10069309175014496, 0.04437215253710747,
-0.022335151210427284, -0.05230937898159027, -0.028983373194932938, -0.049531035125255585, 0.03074926696717739, -0.03056054376065731,
0.021489247679710388, 0.016868554055690765, -0.028984908014535904, -0.07053273916244507, -0.022961033508181572, -0.0717858299612999,
0.0674479678273201, 0.021412895992398262, -0.06054700165987015, 0.021910998970270157, -0.023192649707198143, -0.028992125764489174,
0.025179730728268623, -0.006338999141007662, -0.001874048844911158, 0.009305929765105247, 0.011422501876950264, 0.037604980170726776,
-0.039689771831035614, -0.08734020590782166, -2.2408454242395237e-05, -0.027818966656923294, -0.05882560834288597, 0.0047395736910402...
INFO 2025-09-10 14:49:09,935 console_span_processor:39 telemetry: 21:49:09.928 [END] FaissVectorIOAdapter.insert_chunks [StatusCode.OK] (448.38ms)
INFO 2025-09-10 14:49:09,938 console_span_processor:39 telemetry: 21:49:09.936 [END] ModelsRoutingTable.get_model [StatusCode.OK] (0.15ms)
INFO 2025-09-10 14:49:09,939 console_span_processor:48 telemetry: output: {'identifier': 'sentence-transformers/all-MiniLM-L6-v2',
'provider_resource_id': 'all-MiniLM-L6-v2', 'provider_id': 'sentence-transformers', 'type': 'model', 'owner': None, 'source':
'listed_from_provider', 'metadata': {'embedding_dimension': 384}, 'model_type': 'embedding'}
INFO 2025-09-10 14:49:09,944 console_span_processor:39 telemetry: 21:49:09.942 [END] ModelsRoutingTable.get_provider_impl [StatusCode.OK] (0.34ms)
INFO 2025-09-10 14:49:09,945 console_span_processor:48 telemetry: output:
<llama_stack.providers.inline.inference.sentence_transformers.sentence_transformers.SentenceTransformersInferenceImpl object at 0x158e83350>
INFO 2025-09-10 14:49:09,947 console_span_processor:39 telemetry: 21:49:09.946 [END] ModelsRoutingTable.get_model [StatusCode.OK] (0.19ms)
INFO 2025-09-10 14:49:09,948 console_span_processor:48 telemetry: output: {'identifier': 'sentence-transformers/all-MiniLM-L6-v2',
'provider_resource_id': 'all-MiniLM-L6-v2', 'provider_id': 'sentence-transformers', 'type': 'model', 'owner': None, 'source':
'listed_from_provider', 'metadata': {'embedding_dimension': 384}, 'model_type': 'embedding'}
INFO 2025-09-10 14:49:09,959 console_span_processor:39 telemetry: 21:49:09.949 [END] InferenceRouter.openai_embeddings [StatusCode.OK] (13.11ms)
INFO 2025-09-10 14:49:09,960 console_span_processor:48 telemetry: output: {'object': 'list', 'data': [{'object': 'embedding', 'embedding':
[-0.07958973944187164, -0.09508923441171646, 0.0747891291975975, -0.0033136801794171333, 0.03454456478357315, 0.041140977293252945,
-0.06803964823484421, 0.014224942773580551, -0.06238540634512901, 0.03782016783952713, -0.030075553804636, 0.07446419447660446,
-0.06111196056008339, 0.029801342636346817, 0.11399323493242264, 0.01820552721619606, 0.00257650064304471, -0.08268020302057266,
-0.08060702681541443, 0.004656659439206123, -0.053371429443359375, -0.03258609026670456, -0.024163667112588882, 0.0012904119212180376,
0.022314254194498062, -0.04680437222123146, -0.03445201367139816, 0.004914817865937948, -0.03131281957030296, 0.010677368380129337,
-0.011123362928628922, -0.022707175463438034, -0.0027590240351855755, 0.014538224786520004, 0.00694124773144722, -0.0027126462664455175,
0.023252086713910103, 0.07095751911401749, -0.030273273587226868, -0.04118560254573822, -0.04669591784477234, -0.028823204338550568,
-0.010...
INFO 2025-09-10 14:49:09,974 console_span_processor:39 telemetry: 21:49:09.961 [END] FaissVectorIOAdapter.insert_chunks [StatusCode.OK] (25.74ms)
INFO 2025-09-10 14:49:09,980 console_span_processor:39 telemetry: 21:49:09.975 [END] LocalfsFilesImpl.openai_retrieve_file [StatusCode.OK]
(37339.17ms)
INFO 2025-09-10 14:49:09,981 console_span_processor:48 telemetry: output: {'object': 'file', 'id': 'file-b2f38b0e164347f5a2b6bbe211e33ff3',
'bytes': 48, 'created_at': 1757540912, 'expires_at': 1789076912, 'filename': 'returns_policy.txt', 'purpose': 'assistants'}
INFO 2025-09-10 14:49:09,987 console_span_processor:39 telemetry: 21:49:09.982 [END] LocalfsFilesImpl.openai_retrieve_file [StatusCode.OK]
(37346.24ms)
INFO 2025-09-10 14:49:09,988 console_span_processor:48 telemetry: output: {'object': 'file', 'id': 'file-489db9aae0424745960e3408ff0f477f',
'bytes': 41, 'created_at': 1757540912, 'expires_at': 1789076912, 'filename': 'shipping_policy.txt', 'purpose': 'assistants'}
INFO 2025-09-10 14:49:10,038 uvicorn.access:473 uncategorized: 127.0.0.1:56006 - "POST /v1/openai/v1/vector_stores HTTP/1.1" 200
INFO 2025-09-10 14:49:10,041 console_span_processor:39 telemetry: 21:49:10.039 [END] VectorIORouter.openai_create_vector_store [StatusCode.OK]
(37443.86ms)
INFO 2025-09-10 14:49:10,042 console_span_processor:48 telemetry: output: {'id': 'vs_dab05212-db05-402c-91ef-57e41797406b', 'object':
'vector_store', 'created_at': 1757540912, 'name': 'acme_docs', 'usage_bytes': 0, 'file_counts': {'completed': 3, 'cancelled': 0, 'failed': 0,
'in_progress': 0, 'total': 3}, 'status': 'completed', 'expires_after': None, 'expires_at': None, 'last_active_at': 1757540912, 'metadata':
{'provider_id': 'faiss', 'provider_vector_db_id': 'vs_dab05212-db05-402c-91ef-57e41797406b'}}
INFO 2025-09-10 14:49:10,047 console_span_processor:39 telemetry: 21:49:10.044 [END] /v1/openai/v1/vector_stores [StatusCode.OK] (37449.64ms)
INFO 2025-09-10 14:49:10,047 console_span_processor:48 telemetry: raw_path: /v1/openai/v1/vector_stores
INFO 2025-09-10 14:49:10,048 console_span_processor:62 telemetry: 21:49:10.039 [INFO] 127.0.0.1:56006 - "POST /v1/openai/v1/vector_stores
HTTP/1.1" 200
INFO 2025-09-10 14:49:10,126 console_span_processor:28 telemetry: 21:49:10.126 [START] /v1/openai/v1/vector_stores/{vector_store_id}/search
INFO 2025-09-10 14:49:10,140 console_span_processor:39 telemetry: 21:49:10.132 [END] ModelsRoutingTable.get_model [StatusCode.OK] (0.72ms)
INFO 2025-09-10 14:49:10,142 console_span_processor:48 telemetry: output: {'identifier': 'sentence-transformers/all-MiniLM-L6-v2',
'provider_resource_id': 'all-MiniLM-L6-v2', 'provider_id': 'sentence-transformers', 'type': 'model', 'owner': None, 'source':
'listed_from_provider', 'metadata': {'embedding_dimension': 384}, 'model_type': 'embedding'}
INFO 2025-09-10 14:49:10,155 console_span_processor:39 telemetry: 21:49:10.143 [END] ModelsRoutingTable.get_provider_impl [StatusCode.OK] (0.34ms)
INFO 2025-09-10 14:49:10,155 console_span_processor:48 telemetry: output:
<llama_stack.providers.inline.inference.sentence_transformers.sentence_transformers.SentenceTransformersInferenceImpl object at 0x158e83350>
INFO 2025-09-10 14:49:10,160 console_span_processor:39 telemetry: 21:49:10.157 [END] ModelsRoutingTable.get_model [StatusCode.OK] (0.18ms)
INFO 2025-09-10 14:49:10,161 console_span_processor:48 telemetry: output: {'identifier': 'sentence-transformers/all-MiniLM-L6-v2',
'provider_resource_id': 'all-MiniLM-L6-v2', 'provider_id': 'sentence-transformers', 'type': 'model', 'owner': None, 'source':
'listed_from_provider', 'metadata': {'embedding_dimension': 384}, 'model_type': 'embedding'}
INFO 2025-09-10 14:49:10,258 console_span_processor:39 telemetry: 21:49:10.219 [END] InferenceRouter.openai_embeddings [StatusCode.OK] (88.76ms)
INFO 2025-09-10 14:49:10,266 console_span_processor:48 telemetry: output: {'object': 'list', 'data': [{'object': 'embedding', 'embedding':
[0.0018660365603864193, -0.008432421833276749, -0.009860510006546974, 0.07527908682823181, -0.008166038431227207, -0.08819602429866791,
-0.025107912719249725, -0.029266025871038437, 0.014401894062757492, 0.06447950005531311, 0.04112009331583977, -0.04028748720884323,
-0.02221696823835373, -0.009235711768269539, -0.04810388386249542, -0.02784842811524868, 0.016442419961094856, -0.07583750039339066,
-0.06627479195594788, 0.01860453188419342, 0.0008918081293813884, 0.011179491877555847, -0.048671603202819824, -0.021989954635500908,
0.04990514740347862, -0.003409573109820485, -0.06727275997400284, -0.054264623671770096, -0.022502778097987175, -0.03865018114447594,
-0.0471607930958271, 0.01671769842505455, 0.024404950439929962, 0.09877222776412964, -0.01660928875207901, 0.01298862136900425,
0.02916400320827961, -0.0722617655992508, 0.041335687041282654, -0.037857454270124435, -0.02524978667497635, -0.010434110648930073, -0....
INFO 2025-09-10 14:49:10,285 uvicorn.access:473 uncategorized: 127.0.0.1:56006 - "POST
/v1/openai/v1/vector_stores/vs_dab05212-db05-402c-91ef-57e41797406b/search HTTP/1.1" 200
INFO 2025-09-10 14:49:10,295 console_span_processor:39 telemetry: 21:49:10.292 [END] FaissVectorIOAdapter.query_chunks [StatusCode.OK] (161.80ms)
INFO 2025-09-10 14:49:10,296 console_span_processor:48 telemetry: output: {'chunks': [{'content': 'Acme ships globally in 3-5 business days.',
'metadata': {'document_id': 'file-489db9aae0424745960e3408ff0f477f', 'token_count': 12, 'metadata_token_count': 1}, 'embedding':
[-0.012346820905804634, -0.04591671749949455, 0.00545357633382082, 0.0767817348241806, -0.01030217856168747, -0.07128783315420151,
-0.047789815813302994, -0.0042580426670610905, -0.08333089202642441, 0.03493816778063774, 0.03678377717733383, -0.022125769406557083,
-0.001785362372174859, 0.03860057145357132, 0.017692940309643745, -0.011320478282868862, 0.020480643957853317, -0.14444826543331146,
-0.03509785607457161, -0.08347956091165543, 0.01723267324268818, -0.020868107676506042, -0.04816542565822601, -0.04063615947961807,
-0.02612607553601265, -0.06816241890192032, -0.021907860413193703, -0.05328420177102089, 0.0035953382030129433, -0.060775868594646454,
-0.07895789295434952, 0.08725343644618988, -0.004096562508493662, 0.07713106274604797, 0.04764929413795471, 0.03390089422464371, -0.03...
INFO 2025-09-10 14:49:10,304 console_span_processor:39 telemetry: 21:49:10.299 [END] VectorDBsRoutingTable.openai_search_vector_store
[StatusCode.OK] (169.86ms)
INFO 2025-09-10 14:49:10,313 console_span_processor:48 telemetry: output: {'object': 'vector_store.search_results.page', 'search_query': 'How
long does shipping take?', 'data': [{'file_id': '', 'filename': '', 'score': 1.0150761400159014, 'attributes': {'document_id':
'file-489db9aae0424745960e3408ff0f477f', 'token_count': 12.0, 'metadata_token_count': 1.0}, 'content': [{'type': 'text', 'text': 'Acme ships
globally in 3-5 business days.'}]}, {'file_id': '', 'filename': '', 'score': 0.7863530206684866, 'attributes': {'document_id':
'file-b2f38b0e164347f5a2b6bbe211e33ff3', 'token_count': 10.0, 'metadata_token_count': 1.0}, 'content': [{'type': 'text', 'text': 'Returns are
accepted within 30 days of purchase.'}]}], 'has_more': False, 'next_page': None}
INFO 2025-09-10 14:49:10,323 console_span_processor:39 telemetry: 21:49:10.318 [END] VectorIORouter.openai_search_vector_store [StatusCode.OK]
(188.52ms)
INFO 2025-09-10 14:49:10,324 console_span_processor:48 telemetry: output: {'object': 'vector_store.search_results.page', 'search_query': 'How
long does shipping take?', 'data': [{'file_id': '', 'filename': '', 'score': 1.0150761400159014, 'attributes': {'document_id':
'file-489db9aae0424745960e3408ff0f477f', 'token_count': 12.0, 'metadata_token_count': 1.0}, 'content': [{'type': 'text', 'text': 'Acme ships
globally in 3-5 business days.'}]}, {'file_id': '', 'filename': '', 'score': 0.7863530206684866, 'attributes': {'document_id':
'file-b2f38b0e164347f5a2b6bbe211e33ff3', 'token_count': 10.0, 'metadata_token_count': 1.0}, 'content': [{'type': 'text', 'text': 'Returns are
accepted within 30 days of purchase.'}]}], 'has_more': False, 'next_page': None}
INFO 2025-09-10 14:49:10,329 console_span_processor:39 telemetry: 21:49:10.326 [END] /v1/openai/v1/vector_stores/{vector_store_id}/search
[StatusCode.OK] (199.98ms)
INFO 2025-09-10 14:49:10,336 console_span_processor:48 telemetry: raw_path:
/v1/openai/v1/vector_stores/vs_dab05212-db05-402c-91ef-57e41797406b/search
INFO 2025-09-10 14:49:10,337 console_span_processor:62 telemetry: 21:49:10.290 [INFO] 127.0.0.1:56006 - "POST
/v1/openai/v1/vector_stores/vs_dab05212-db05-402c-91ef-57e41797406b/search HTTP/1.1" 200
INFO 2025-09-10 14:49:57,749 console_span_processor:28 telemetry: 21:49:57.749 [START] /v1/openai/v1/chat/completions
INFO 2025-09-10 14:49:57,758 console_span_processor:39 telemetry: 21:49:57.753 [END] ModelsRoutingTable.get_model [StatusCode.OK] (0.26ms)
INFO 2025-09-10 14:49:57,758 console_span_processor:48 telemetry: output: {'identifier': 'together/meta-llama/Llama-3.3-70B-Instruct-Turbo',
'provider_resource_id': 'meta-llama/Llama-3.3-70B-Instruct-Turbo', 'provider_id': 'together', 'type': 'model', 'owner': None, 'source':
'listed_from_provider', 'metadata': {}, 'model_type': 'llm'}
INFO 2025-09-10 14:49:57,761 console_span_processor:39 telemetry: 21:49:57.760 [END] ModelsRoutingTable.get_provider_impl [StatusCode.OK] (0.16ms)
INFO 2025-09-10 14:49:57,762 console_span_processor:48 telemetry: output:
<llama_stack.providers.remote.inference.together.together.TogetherInferenceAdapter object at 0x137069220>
INFO 2025-09-10 14:49:57,766 console_span_processor:39 telemetry: 21:49:57.764 [END] ModelsRoutingTable.get_model [StatusCode.OK] (0.51ms)
INFO 2025-09-10 14:49:57,767 console_span_processor:48 telemetry: output: {'identifier': 'together/meta-llama/Llama-3.3-70B-Instruct-Turbo',
'provider_resource_id': 'meta-llama/Llama-3.3-70B-Instruct-Turbo', 'provider_id': 'together', 'type': 'model', 'owner': None, 'source':
'listed_from_provider', 'metadata': {}, 'model_type': 'llm'}
huggingface/tokenizers: The current process just got forked, after parallelism has already been used. Disabling parallelism to avoid deadlocks...
To disable this warning, you can either:
- Avoid using `tokenizers` before the fork if possible
- Explicitly set the environment variable TOKENIZERS_PARALLELISM=(true | false)
huggingface/tokenizers: The current process just got forked, after parallelism has already been used. Disabling parallelism to avoid deadlocks...
To disable this warning, you can either:
- Avoid using `tokenizers` before the fork if possible
- Explicitly set the environment variable TOKENIZERS_PARALLELISM=(true | false)
INFO 2025-09-10 14:50:01,673 console_span_processor:39 telemetry: 21:50:01.672 [END] TogetherInferenceAdapter.openai_chat_completion
[StatusCode.OK] (3908.76ms)
INFO 2025-09-10 14:50:01,675 console_span_processor:48 telemetry: output: {'id': 'oAit2Fa-62bZhn-97d2236c1b482510', 'choices':
[{'finish_reason': 'stop', 'index': 0, 'logprobs': None, 'message': {'content': "In the Andes' gentle breeze, a llama's soft eyes gaze with
peaceful ease, its fur a warm and fuzzy tease. With steps both gentle and serene, the llama roams, a symbol of calm, its beauty pure and
supreme.", 'refusal': None, 'role': 'assistant', 'annotations': None, 'audio': None, 'function_call': None, 'tool_calls': []}, 'seed':
7075179338234292000}], 'created': 1757540999, 'model': 'meta-llama/Llama-3.3-70B-Instruct-Turbo', 'object': 'chat.completion',
'service_tier': None, 'system_fingerprint': None, 'usage': {'completion_tokens': 50, 'prompt_tokens': 50, 'total_tokens': 100,
'completion_tokens_details': None, 'prompt_tokens_details': None, 'cached_tokens': 0}, 'prompt': []}
INFO 2025-09-10 14:50:01,687 uvicorn.access:473 uncategorized: ::1:56392 - "POST /v1/openai/v1/chat/completions HTTP/1.1" 200
INFO 2025-09-10 14:50:01,692 console_span_processor:39 telemetry: 21:50:01.688 [END] InferenceRouter.openai_chat_completion [StatusCode.OK]
(3936.71ms)
INFO 2025-09-10 14:50:01,692 console_span_processor:48 telemetry: output: {'id': 'oAit2Fa-62bZhn-97d2236c1b482510', 'choices':
[{'finish_reason': 'stop', 'index': 0, 'logprobs': None, 'message': {'content': "In the Andes' gentle breeze, a llama's soft eyes gaze with
peaceful ease, its fur a warm and fuzzy tease. With steps both gentle and serene, the llama roams, a symbol of calm, its beauty pure and
supreme.", 'refusal': None, 'role': 'assistant', 'annotations': None, 'audio': None, 'function_call': None, 'tool_calls': None}, 'seed':
7075179338234292000}], 'created': 1757540999, 'model': 'meta-llama/Llama-3.3-70B-Instruct-Turbo', 'object': 'chat.completion',
'service_tier': None, 'system_fingerprint': None, 'usage': {'completion_tokens': 50, 'prompt_tokens': 50, 'total_tokens': 100,
'completion_tokens_details': None, 'prompt_tokens_details': None, 'cached_tokens': 0}, 'prompt': [], 'metrics': [{'trace_id':
'b7f7481d23ea1b2d4b89111888ebe8b3', 'span_id': '60cf33fa222feaf3', 'timestamp': '2025-09-10T21:50:01.687118Z', 'attributes': {'model_id':
'together/me...
INFO 2025-09-10 14:50:01,694 console_span_processor:62 telemetry: 21:50:01.687 [INFO] metric.prompt_tokens
INFO 2025-09-10 14:50:01,695 console_span_processor:67 telemetry: value: 50
INFO 2025-09-10 14:50:01,695 console_span_processor:67 telemetry: unit: tokens
INFO 2025-09-10 14:50:01,696 console_span_processor:67 telemetry: model_id: together/meta-llama/Llama-3.3-70B-Instruct-Turbo
INFO 2025-09-10 14:50:01,696 console_span_processor:67 telemetry: provider_id: together
INFO 2025-09-10 14:50:01,698 console_span_processor:62 telemetry: 21:50:01.687 [INFO] metric.completion_tokens
INFO 2025-09-10 14:50:01,699 console_span_processor:67 telemetry: value: 50
INFO 2025-09-10 14:50:01,699 console_span_processor:67 telemetry: unit: tokens
INFO 2025-09-10 14:50:01,700 console_span_processor:67 telemetry: model_id: together/meta-llama/Llama-3.3-70B-Instruct-Turbo
INFO 2025-09-10 14:50:01,701 console_span_processor:67 telemetry: provider_id: together
INFO 2025-09-10 14:50:01,719 console_span_processor:62 telemetry: 21:50:01.687 [INFO] metric.total_tokens
INFO 2025-09-10 14:50:01,723 console_span_processor:67 telemetry: value: 100
INFO 2025-09-10 14:50:01,725 console_span_processor:67 telemetry: unit: tokens
INFO 2025-09-10 14:50:01,730 console_span_processor:67 telemetry: model_id: together/meta-llama/Llama-3.3-70B-Instruct-Turbo
INFO 2025-09-10 14:50:01,733 console_span_processor:67 telemetry: provider_id: together
INFO 2025-09-10 14:50:01,746 console_span_processor:39 telemetry: 21:50:01.738 [END] /v1/openai/v1/chat/completions [StatusCode.OK] (3989.18ms)
INFO 2025-09-10 14:50:01,747 console_span_processor:48 telemetry: raw_path: /v1/openai/v1/chat/completions
INFO 2025-09-10 14:50:01,748 console_span_processor:62 telemetry: 21:50:01.688 [INFO] ::1:56392 - "POST /v1/openai/v1/chat/completions HTTP/1.1"
200
INFO 2025-09-10 14:51:45,329 console_span_processor:28 telemetry: 21:51:45.329 [START] /v1/openai/v1/chat/completions
INFO 2025-09-10 14:51:45,371 console_span_processor:39 telemetry: 21:51:45.337 [END] ModelsRoutingTable.get_model [StatusCode.OK] (0.30ms)
INFO 2025-09-10 14:51:45,375 console_span_processor:48 telemetry: output: {'identifier': 'together/meta-llama/Llama-3.3-70B-Instruct-Turbo',
'provider_resource_id': 'meta-llama/Llama-3.3-70B-Instruct-Turbo', 'provider_id': 'together', 'type': 'model', 'owner': None, 'source':
'listed_from_provider', 'metadata': {}, 'model_type': 'llm'}
INFO 2025-09-10 14:51:45,408 console_span_processor:39 telemetry: 21:51:45.377 [END] ModelsRoutingTable.get_provider_impl [StatusCode.OK] (0.18ms)
INFO 2025-09-10 14:51:45,408 console_span_processor:48 telemetry: output:
<llama_stack.providers.remote.inference.together.together.TogetherInferenceAdapter object at 0x137069220>
INFO 2025-09-10 14:51:45,415 console_span_processor:39 telemetry: 21:51:45.410 [END] ModelsRoutingTable.get_model [StatusCode.OK] (0.56ms)
INFO 2025-09-10 14:51:45,415 console_span_processor:48 telemetry: output: {'identifier': 'together/meta-llama/Llama-3.3-70B-Instruct-Turbo',
'provider_resource_id': 'meta-llama/Llama-3.3-70B-Instruct-Turbo', 'provider_id': 'together', 'type': 'model', 'owner': None, 'source':
'listed_from_provider', 'metadata': {}, 'model_type': 'llm'}
INFO 2025-09-10 14:51:46,425 console_span_processor:39 telemetry: 21:51:46.414 [END] TogetherInferenceAdapter.openai_chat_completion
[StatusCode.OK] (1005.10ms)
INFO 2025-09-10 14:51:46,426 console_span_processor:48 telemetry: output: {'id': 'oAitZwc-62bZhn-97d22606494cfa1a', 'choices':
[{'finish_reason': 'stop', 'index': 0, 'logprobs': None, 'message': {'content': 'Thought: To answer the question "How long does shipping
take?", I need to search the provided vector store for relevant information. The vector store ID is vs_dab05212-db05-402c-91ef-57e41797406b.
I will use the Llama Stack Vector Store RAG tool to find the most relevant documents.\n\nAction: Llama Stack Vector Store RAG tool\nAction
Input: {"query": "How long does shipping take?", "vector_store_id": "vs_dab05212-db05-402c-91ef-57e41797406b", "top_k": 1, "score_threshold":
0}', 'refusal': None, 'role': 'assistant', 'annotations': None, 'audio': None, 'function_call': None, 'tool_calls': []}, 'seed':
15009310705663400000}], 'created': 1757541105, 'model': 'meta-llama/Llama-3.3-70B-Instruct-Turbo', 'object': 'chat.completion',
'service_tier': None, 'system_fingerprint': None, 'usage': {'completion_tokens': 138, 'prompt_tokens': 495, 'total_tokens': 633,...
INFO 2025-09-10 14:51:46,443 uvicorn.access:473 uncategorized: ::1:56900 - "POST /v1/openai/v1/chat/completions HTTP/1.1" 200
INFO 2025-09-10 14:51:46,457 console_span_processor:39 telemetry: 21:51:46.444 [END] InferenceRouter.openai_chat_completion [StatusCode.OK]
(1106.92ms)
INFO 2025-09-10 14:51:46,458 console_span_processor:48 telemetry: output: {'id': 'oAitZwc-62bZhn-97d22606494cfa1a', 'choices':
[{'finish_reason': 'stop', 'index': 0, 'logprobs': None, 'message': {'content': 'Thought: To answer the question "How long does shipping
take?", I need to search the provided vector store for relevant information. The vector store ID is vs_dab05212-db05-402c-91ef-57e41797406b.
I will use the Llama Stack Vector Store RAG tool to find the most relevant documents.\n\nAction: Llama Stack Vector Store RAG tool\nAction
Input: {"query": "How long does shipping take?", "vector_store_id": "vs_dab05212-db05-402c-91ef-57e41797406b", "top_k": 1, "score_threshold":
0}', 'refusal': None, 'role': 'assistant', 'annotations': None, 'audio': None, 'function_call': None, 'tool_calls': None}, 'seed':
15009310705663400000}], 'created': 1757541105, 'model': 'meta-llama/Llama-3.3-70B-Instruct-Turbo', 'object': 'chat.completion',
'service_tier': None, 'system_fingerprint': None, 'usage': {'completion_tokens': 138, 'prompt_tokens': 495, 'total_tokens': 63...
INFO 2025-09-10 14:51:46,459 console_span_processor:62 telemetry: 21:51:46.442 [INFO] metric.prompt_tokens
INFO 2025-09-10 14:51:46,459 console_span_processor:67 telemetry: value: 495
INFO 2025-09-10 14:51:46,460 console_span_processor:67 telemetry: unit: tokens
INFO 2025-09-10 14:51:46,460 console_span_processor:67 telemetry: model_id: together/meta-llama/Llama-3.3-70B-Instruct-Turbo
INFO 2025-09-10 14:51:46,461 console_span_processor:67 telemetry: provider_id: together
INFO 2025-09-10 14:51:46,461 console_span_processor:62 telemetry: 21:51:46.442 [INFO] metric.completion_tokens
INFO 2025-09-10 14:51:46,462 console_span_processor:67 telemetry: value: 138
INFO 2025-09-10 14:51:46,463 console_span_processor:67 telemetry: unit: tokens
INFO 2025-09-10 14:51:46,463 console_span_processor:67 telemetry: model_id: together/meta-llama/Llama-3.3-70B-Instruct-Turbo
INFO 2025-09-10 14:51:46,463 console_span_processor:67 telemetry: provider_id: together
INFO 2025-09-10 14:51:46,464 console_span_processor:62 telemetry: 21:51:46.442 [INFO] metric.total_tokens
INFO 2025-09-10 14:51:46,466 console_span_processor:67 telemetry: value: 633
INFO 2025-09-10 14:51:46,466 console_span_processor:67 telemetry: unit: tokens
INFO 2025-09-10 14:51:46,467 console_span_processor:67 telemetry: model_id: together/meta-llama/Llama-3.3-70B-Instruct-Turbo
INFO 2025-09-10 14:51:46,467 console_span_processor:67 telemetry: provider_id: together
INFO 2025-09-10 14:51:46,522 console_span_processor:39 telemetry: 21:51:46.468 [END] /v1/openai/v1/chat/completions [StatusCode.OK] (1138.88ms)
INFO 2025-09-10 14:51:46,530 console_span_processor:48 telemetry: raw_path: /v1/openai/v1/chat/completions
INFO 2025-09-10 14:51:46,531 console_span_processor:62 telemetry: 21:51:46.443 [INFO] ::1:56900 - "POST /v1/openai/v1/chat/completions HTTP/1.1"
200
INFO 2025-09-10 14:51:46,532 console_span_processor:28 telemetry: 21:51:46.532 [START] /v1/openai/v1/vector_stores/{vector_store_id}/search
INFO 2025-09-10 14:51:46,544 console_span_processor:39 telemetry: 21:51:46.534 [END] ModelsRoutingTable.get_model [StatusCode.OK] (0.20ms)
INFO 2025-09-10 14:51:46,544 console_span_processor:48 telemetry: output: {'identifier': 'sentence-transformers/all-MiniLM-L6-v2',
'provider_resource_id': 'all-MiniLM-L6-v2', 'provider_id': 'sentence-transformers', 'type': 'model', 'owner': None, 'source':
'listed_from_provider', 'metadata': {'embedding_dimension': 384}, 'model_type': 'embedding'}
INFO 2025-09-10 14:51:46,551 console_span_processor:39 telemetry: 21:51:46.547 [END] ModelsRoutingTable.get_provider_impl [StatusCode.OK] (0.27ms)
INFO 2025-09-10 14:51:46,553 console_span_processor:48 telemetry: output:
<llama_stack.providers.inline.inference.sentence_transformers.sentence_transformers.SentenceTransformersInferenceImpl object at 0x158e83350>
INFO 2025-09-10 14:51:46,558 console_span_processor:39 telemetry: 21:51:46.556 [END] ModelsRoutingTable.get_model [StatusCode.OK] (0.51ms)
INFO 2025-09-10 14:51:46,559 console_span_processor:48 telemetry: output: {'identifier': 'sentence-transformers/all-MiniLM-L6-v2',
'provider_resource_id': 'all-MiniLM-L6-v2', 'provider_id': 'sentence-transformers', 'type': 'model', 'owner': None, 'source':
'listed_from_provider', 'metadata': {'embedding_dimension': 384}, 'model_type': 'embedding'}
INFO 2025-09-10 14:51:47,003 uvicorn.access:473 uncategorized: 127.0.0.1:56904 - "POST
/v1/openai/v1/vector_stores/vs_dab05212-db05-402c-91ef-57e41797406b/search HTTP/1.1" 200
INFO 2025-09-10 14:51:47,004 console_span_processor:39 telemetry: 21:51:46.991 [END] InferenceRouter.openai_embeddings [StatusCode.OK] (457.59ms)
INFO 2025-09-10 14:51:47,005 console_span_processor:48 telemetry: output: {'object': 'list', 'data': [{'object': 'embedding', 'embedding':
[0.0018660365603864193, -0.008432421833276749, -0.009860510006546974, 0.07527908682823181, -0.008166038431227207, -0.08819602429866791,
-0.025107912719249725, -0.029266025871038437, 0.014401894062757492, 0.06447950005531311, 0.04112009331583977, -0.04028748720884323,
-0.02221696823835373, -0.009235711768269539, -0.04810388386249542, -0.02784842811524868, 0.016442419961094856, -0.07583750039339066,
-0.06627479195594788, 0.01860453188419342, 0.0008918081293813884, 0.011179491877555847, -0.048671603202819824, -0.021989954635500908,
0.04990514740347862, -0.003409573109820485, -0.06727275997400284, -0.054264623671770096, -0.022502778097987175, -0.03865018114447594,
-0.0471607930958271, 0.01671769842505455, 0.024404950439929962, 0.09877222776412964, -0.01660928875207901, 0.01298862136900425,
0.02916400320827961, -0.0722617655992508, 0.041335687041282654, -0.037857454270124435, -0.02524978667497635, -0.010434110648930073, -0....
INFO 2025-09-10 14:51:47,025 console_span_processor:39 telemetry: 21:51:47.008 [END] FaissVectorIOAdapter.query_chunks [StatusCode.OK] (474.21ms)
INFO 2025-09-10 14:51:47,028 console_span_processor:48 telemetry: output: {'chunks': [{'content': 'Acme ships globally in 3-5 business days.',
'metadata': {'document_id': 'file-489db9aae0424745960e3408ff0f477f', 'token_count': 12, 'metadata_token_count': 1}, 'embedding':
[-0.012346820905804634, -0.04591671749949455, 0.00545357633382082, 0.0767817348241806, -0.01030217856168747, -0.07128783315420151,
-0.047789815813302994, -0.0042580426670610905, -0.08333089202642441, 0.03493816778063774, 0.03678377717733383, -0.022125769406557083,
-0.001785362372174859, 0.03860057145357132, 0.017692940309643745, -0.011320478282868862, 0.020480643957853317, -0.14444826543331146,
-0.03509785607457161, -0.08347956091165543, 0.01723267324268818, -0.020868107676506042, -0.04816542565822601, -0.04063615947961807,
-0.02612607553601265, -0.06816241890192032, -0.021907860413193703, -0.05328420177102089, 0.0035953382030129433, -0.060775868594646454,
-0.07895789295434952, 0.08725343644618988, -0.004096562508493662, 0.07713106274604797, 0.04764929413795471, 0.03390089422464371, -0.03...
INFO 2025-09-10 14:51:47,038 console_span_processor:39 telemetry: 21:51:47.034 [END] VectorDBsRoutingTable.openai_search_vector_store
[StatusCode.OK] (500.67ms)
INFO 2025-09-10 14:51:47,040 console_span_processor:48 telemetry: output: {'object': 'vector_store.search_results.page', 'search_query': 'How
long does shipping take?', 'data': [{'file_id': '', 'filename': '', 'score': 1.0150761400159014, 'attributes': {'document_id':
'file-489db9aae0424745960e3408ff0f477f', 'token_count': 12.0, 'metadata_token_count': 1.0}, 'content': [{'type': 'text', 'text': 'Acme ships
globally in 3-5 business days.'}]}], 'has_more': False, 'next_page': None}
INFO 2025-09-10 14:51:47,051 console_span_processor:39 telemetry: 21:51:47.043 [END] VectorIORouter.openai_search_vector_store [StatusCode.OK]
(510.32ms)
INFO 2025-09-10 14:51:47,052 console_span_processor:48 telemetry: output: {'object': 'vector_store.search_results.page', 'search_query': 'How
long does shipping take?', 'data': [{'file_id': '', 'filename': '', 'score': 1.0150761400159014, 'attributes': {'document_id':
'file-489db9aae0424745960e3408ff0f477f', 'token_count': 12.0, 'metadata_token_count': 1.0}, 'content': [{'type': 'text', 'text': 'Acme ships
globally in 3-5 business days.'}]}], 'has_more': False, 'next_page': None}
INFO 2025-09-10 14:51:47,059 console_span_processor:39 telemetry: 21:51:47.055 [END] /v1/openai/v1/vector_stores/{vector_store_id}/search
[StatusCode.OK] (522.95ms)
INFO 2025-09-10 14:51:47,061 console_span_processor:48 telemetry: raw_path:
/v1/openai/v1/vector_stores/vs_dab05212-db05-402c-91ef-57e41797406b/search
INFO 2025-09-10 14:51:47,063 console_span_processor:62 telemetry: 21:51:47.004 [INFO] 127.0.0.1:56904 - "POST
/v1/openai/v1/vector_stores/vs_dab05212-db05-402c-91ef-57e41797406b/search HTTP/1.1" 200
INFO 2025-09-10 14:51:47,066 console_span_processor:28 telemetry: 21:51:47.066 [START] /v1/openai/v1/vector_stores/{vector_store_id}/search
INFO 2025-09-10 14:51:47,072 uvicorn.access:473 uncategorized: 127.0.0.1:56904 - "POST
/v1/openai/v1/vector_stores/vs_dab05212-db05-402c-91ef-57e41797406b/search HTTP/1.1" 200
INFO 2025-09-10 14:51:47,106 console_span_processor:39 telemetry: 21:51:47.086 [END] ModelsRoutingTable.get_model [StatusCode.OK] (0.59ms)
INFO 2025-09-10 14:51:47,107 console_span_processor:48 telemetry: output: {'identifier': 'sentence-transformers/all-MiniLM-L6-v2',
'provider_resource_id': 'all-MiniLM-L6-v2', 'provider_id': 'sentence-transformers', 'type': 'model', 'owner': None, 'source':
'listed_from_provider', 'metadata': {'embedding_dimension': 384}, 'model_type': 'embedding'}
INFO 2025-09-10 14:51:47,121 console_span_processor:39 telemetry: 21:51:47.118 [END] ModelsRoutingTable.get_provider_impl [StatusCode.OK] (0.85ms)
INFO 2025-09-10 14:51:47,122 console_span_processor:48 telemetry: output:
<llama_stack.providers.inline.inference.sentence_transformers.sentence_transformers.SentenceTransformersInferenceImpl object at 0x158e83350>
INFO 2025-09-10 14:51:47,134 uvicorn.access:473 uncategorized: 127.0.0.1:56904 - "POST
/v1/openai/v1/vector_stores/vs_dab05212-db05-402c-91ef-57e41797406b/search HTTP/1.1" 200
INFO 2025-09-10 14:51:47,141 console_span_processor:39 telemetry: 21:51:47.124 [END] ModelsRoutingTable.get_model [StatusCode.OK] (0.22ms)
INFO 2025-09-10 14:51:47,141 console_span_processor:48 telemetry: output: {'identifier': 'sentence-transformers/all-MiniLM-L6-v2',
'provider_resource_id': 'all-MiniLM-L6-v2', 'provider_id': 'sentence-transformers', 'type': 'model', 'owner': None, 'source':
'listed_from_provider', 'metadata': {'embedding_dimension': 384}, 'model_type': 'embedding'}
INFO 2025-09-10 14:51:47,154 uvicorn.access:473 uncategorized: 127.0.0.1:56904 - "POST
/v1/openai/v1/vector_stores/vs_dab05212-db05-402c-91ef-57e41797406b/search HTTP/1.1" 200
INFO 2025-09-10 14:51:47,155 console_span_processor:39 telemetry: 21:51:47.143 [END] InferenceRouter.openai_embeddings [StatusCode.OK] (57.86ms)
INFO 2025-09-10 14:51:47,156 console_span_processor:48 telemetry: output: {'object': 'list', 'data': [{'object': 'embedding', 'embedding':
[0.0018660365603864193, -0.008432421833276749, -0.009860510006546974, 0.07527908682823181, -0.008166038431227207, -0.08819602429866791,
-0.025107912719249725, -0.029266025871038437, 0.014401894062757492, 0.06447950005531311, 0.04112009331583977, -0.04028748720884323,
-0.02221696823835373, -0.009235711768269539, -0.04810388386249542, -0.02784842811524868, 0.016442419961094856, -0.07583750039339066,
-0.06627479195594788, 0.01860453188419342, 0.0008918081293813884, 0.011179491877555847, -0.048671603202819824, -0.021989954635500908,
0.04990514740347862, -0.003409573109820485, -0.06727275997400284, -0.054264623671770096, -0.022502778097987175, -0.03865018114447594,
-0.0471607930958271, 0.01671769842505455, 0.024404950439929962, 0.09877222776412964, -0.01660928875207901, 0.01298862136900425,
0.02916400320827961, -0.0722617655992508, 0.041335687041282654, -0.037857454270124435, -0.02524978667497635, -0.010434110648930073, -0....
INFO 2025-09-10 14:51:47,169 console_span_processor:39 telemetry: 21:51:47.159 [END] FaissVectorIOAdapter.query_chunks [StatusCode.OK] (75.34ms)
INFO 2025-09-10 14:51:47,170 console_span_processor:48 telemetry: output: {'chunks': [{'content': 'Acme ships globally in 3-5 business days.',
'metadata': {'document_id': 'file-489db9aae0424745960e3408ff0f477f', 'token_count': 12, 'metadata_token_count': 1}, 'embedding':
[-0.012346820905804634, -0.04591671749949455, 0.00545357633382082, 0.0767817348241806, -0.01030217856168747, -0.07128783315420151,
-0.047789815813302994, -0.0042580426670610905, -0.08333089202642441, 0.03493816778063774, 0.03678377717733383, -0.022125769406557083,
-0.001785362372174859, 0.03860057145357132, 0.017692940309643745, -0.011320478282868862, 0.020480643957853317, -0.14444826543331146,
-0.03509785607457161, -0.08347956091165543, 0.01723267324268818, -0.020868107676506042, -0.04816542565822601, -0.04063615947961807,
-0.02612607553601265, -0.06816241890192032, -0.021907860413193703, -0.05328420177102089, 0.0035953382030129433, -0.060775868594646454,
-0.07895789295434952, 0.08725343644618988, -0.004096562508493662, 0.07713106274604797, 0.04764929413795471, 0.03390089422464371, -0.03...
INFO 2025-09-10 14:51:47,185 uvicorn.access:473 uncategorized: 127.0.0.1:56904 - "POST
/v1/openai/v1/vector_stores/vs_dab05212-db05-402c-91ef-57e41797406b/search HTTP/1.1" 200
INFO 2025-09-10 14:51:47,204 uvicorn.access:473 uncategorized: 127.0.0.1:56904 - "POST
/v1/openai/v1/vector_stores/vs_dab05212-db05-402c-91ef-57e41797406b/search HTTP/1.1" 200
INFO 2025-09-10 14:51:47,205 console_span_processor:39 telemetry: 21:51:47.173 [END] VectorDBsRoutingTable.openai_search_vector_store
[StatusCode.OK] (89.84ms)
INFO 2025-09-10 14:51:47,206 console_span_processor:48 telemetry: output: {'object': 'vector_store.search_results.page', 'search_query': 'How
long does shipping take?', 'data': [{'file_id': '', 'filename': '', 'score': 1.0150761400159014, 'attributes': {'document_id':
'file-489db9aae0424745960e3408ff0f477f', 'token_count': 12.0, 'metadata_token_count': 1.0}, 'content': [{'type': 'text', 'text': 'Acme ships
globally in 3-5 business days.'}]}], 'has_more': False, 'next_page': None}
INFO 2025-09-10 14:51:47,220 console_span_processor:39 telemetry: 21:51:47.208 [END] VectorIORouter.openai_search_vector_store [StatusCode.OK]
(128.68ms)
INFO 2025-09-10 14:51:47,221 console_span_processor:48 telemetry: output: {'object': 'vector_store.search_results.page', 'search_query': 'How
long does shipping take?', 'data': [{'file_id': '', 'filename': '', 'score': 1.0150761400159014, 'attributes': {'document_id':
'file-489db9aae0424745960e3408ff0f477f', 'token_count': 12.0, 'metadata_token_count': 1.0}, 'content': [{'type': 'text', 'text': 'Acme ships
globally in 3-5 business days.'}]}], 'has_more': False, 'next_page': None}
INFO 2025-09-10 14:51:47,236 console_span_processor:39 telemetry: 21:51:47.223 [END] /v1/openai/v1/vector_stores/{vector_store_id}/search
[StatusCode.OK] (157.17ms)
INFO 2025-09-10 14:51:47,237 console_span_processor:48 telemetry: raw_path:
/v1/openai/v1/vector_stores/vs_dab05212-db05-402c-91ef-57e41797406b/search
INFO 2025-09-10 14:51:47,238 console_span_processor:62 telemetry: 21:51:47.074 [INFO] 127.0.0.1:56904 - "POST
/v1/openai/v1/vector_stores/vs_dab05212-db05-402c-91ef-57e41797406b/search HTTP/1.1" 200
INFO 2025-09-10 14:51:47,239 console_span_processor:28 telemetry: 21:51:47.239 [START] /v1/openai/v1/vector_stores/{vector_store_id}/search
INFO 2025-09-10 14:51:47,243 console_span_processor:39 telemetry: 21:51:47.241 [END] ModelsRoutingTable.get_model [StatusCode.OK] (0.17ms)
INFO 2025-09-10 14:51:47,244 console_span_processor:48 telemetry: output: {'identifier': 'sentence-transformers/all-MiniLM-L6-v2',
'provider_resource_id': 'all-MiniLM-L6-v2', 'provider_id': 'sentence-transformers', 'type': 'model', 'owner': None, 'source':
'listed_from_provider', 'metadata': {'embedding_dimension': 384}, 'model_type': 'embedding'}
INFO 2025-09-10 14:51:47,271 console_span_processor:39 telemetry: 21:51:47.249 [END] ModelsRoutingTable.get_provider_impl [StatusCode.OK] (1.66ms)
INFO 2025-09-10 14:51:47,272 console_span_processor:48 telemetry: output:
<llama_stack.providers.inline.inference.sentence_transformers.sentence_transformers.SentenceTransformersInferenceImpl object at 0x158e83350>
INFO 2025-09-10 14:51:47,275 console_span_processor:39 telemetry: 21:51:47.273 [END] ModelsRoutingTable.get_model [StatusCode.OK] (0.23ms)
INFO 2025-09-10 14:51:47,275 console_span_processor:48 telemetry: output: {'identifier': 'sentence-transformers/all-MiniLM-L6-v2',
'provider_resource_id': 'all-MiniLM-L6-v2', 'provider_id': 'sentence-transformers', 'type': 'model', 'owner': None, 'source':
'listed_from_provider', 'metadata': {'embedding_dimension': 384}, 'model_type': 'embedding'}
INFO 2025-09-10 14:51:47,281 console_span_processor:39 telemetry: 21:51:47.276 [END] InferenceRouter.openai_embeddings [StatusCode.OK] (35.50ms)
INFO 2025-09-10 14:51:47,281 console_span_processor:48 telemetry: output: {'object': 'list', 'data': [{'object': 'embedding', 'embedding':
[0.0018660365603864193, -0.008432421833276749, -0.009860510006546974, 0.07527908682823181, -0.008166038431227207, -0.08819602429866791,
-0.025107912719249725, -0.029266025871038437, 0.014401894062757492, 0.06447950005531311, 0.04112009331583977, -0.04028748720884323,
-0.02221696823835373, -0.009235711768269539, -0.04810388386249542, -0.02784842811524868, 0.016442419961094856, -0.07583750039339066,
-0.06627479195594788, 0.01860453188419342, 0.0008918081293813884, 0.011179491877555847, -0.048671603202819824, -0.021989954635500908,
0.04990514740347862, -0.003409573109820485, -0.06727275997400284, -0.054264623671770096, -0.022502778097987175, -0.03865018114447594,
-0.0471607930958271, 0.01671769842505455, 0.024404950439929962, 0.09877222776412964, -0.01660928875207901, 0.01298862136900425,
0.02916400320827961, -0.0722617655992508, 0.041335687041282654, -0.037857454270124435, -0.02524978667497635, -0.010434110648930073, -0....
INFO 2025-09-10 14:51:47,294 console_span_processor:39 telemetry: 21:51:47.283 [END] FaissVectorIOAdapter.query_chunks [StatusCode.OK] (42.27ms)
INFO 2025-09-10 14:51:47,295 console_span_processor:48 telemetry: output: {'chunks': [{'content': 'Acme ships globally in 3-5 business days.',
'metadata': {'document_id': 'file-489db9aae0424745960e3408ff0f477f', 'token_count': 12, 'metadata_token_count': 1}, 'embedding':
[-0.012346820905804634, -0.04591671749949455, 0.00545357633382082, 0.0767817348241806, -0.01030217856168747, -0.07128783315420151,
-0.047789815813302994, -0.0042580426670610905, -0.08333089202642441, 0.03493816778063774, 0.03678377717733383, -0.022125769406557083,
-0.001785362372174859, 0.03860057145357132, 0.017692940309643745, -0.011320478282868862, 0.020480643957853317, -0.14444826543331146,
-0.03509785607457161, -0.08347956091165543, 0.01723267324268818, -0.020868107676506042, -0.04816542565822601, -0.04063615947961807,
-0.02612607553601265, -0.06816241890192032, -0.021907860413193703, -0.05328420177102089, 0.0035953382030129433, -0.060775868594646454,
-0.07895789295434952, 0.08725343644618988, -0.004096562508493662, 0.07713106274604797, 0.04764929413795471, 0.03390089422464371, -0.03...
INFO 2025-09-10 14:51:47,298 console_span_processor:39 telemetry: 21:51:47.297 [END] VectorDBsRoutingTable.openai_search_vector_store
[StatusCode.OK] (56.25ms)
INFO 2025-09-10 14:51:47,299 console_span_processor:48 telemetry: output: {'object': 'vector_store.search_results.page', 'search_query': 'How
long does shipping take?', 'data': [{'file_id': '', 'filename': '', 'score': 1.0150761400159014, 'attributes': {'document_id':
'file-489db9aae0424745960e3408ff0f477f', 'token_count': 12.0, 'metadata_token_count': 1.0}, 'content': [{'type': 'text', 'text': 'Acme ships
globally in 3-5 business days.'}]}], 'has_more': False, 'next_page': None}
INFO 2025-09-10 14:51:47,301 console_span_processor:39 telemetry: 21:51:47.300 [END] VectorIORouter.openai_search_vector_store [StatusCode.OK]
(60.15ms)
INFO 2025-09-10 14:51:47,302 console_span_processor:48 telemetry: output: {'object': 'vector_store.search_results.page', 'search_query': 'How
long does shipping take?', 'data': [{'file_id': '', 'filename': '', 'score': 1.0150761400159014, 'attributes': {'document_id':
'file-489db9aae0424745960e3408ff0f477f', 'token_count': 12.0, 'metadata_token_count': 1.0}, 'content': [{'type': 'text', 'text': 'Acme ships
globally in 3-5 business days.'}]}], 'has_more': False, 'next_page': None}
INFO 2025-09-10 14:51:47,306 console_span_processor:39 telemetry: 21:51:47.303 [END] /v1/openai/v1/vector_stores/{vector_store_id}/search
[StatusCode.OK] (64.16ms)
INFO 2025-09-10 14:51:47,307 console_span_processor:48 telemetry: raw_path:
/v1/openai/v1/vector_stores/vs_dab05212-db05-402c-91ef-57e41797406b/search
INFO 2025-09-10 14:51:47,307 console_span_processor:62 telemetry: 21:51:47.135 [INFO] 127.0.0.1:56904 - "POST
/v1/openai/v1/vector_stores/vs_dab05212-db05-402c-91ef-57e41797406b/search HTTP/1.1" 200
INFO 2025-09-10 14:51:47,308 console_span_processor:28 telemetry: 21:51:47.308 [START] /v1/openai/v1/vector_stores/{vector_store_id}/search
INFO 2025-09-10 14:51:47,316 console_span_processor:39 telemetry: 21:51:47.310 [END] ModelsRoutingTable.get_model [StatusCode.OK] (0.14ms)
INFO 2025-09-10 14:51:47,317 console_span_processor:48 telemetry: output: {'identifier': 'sentence-transformers/all-MiniLM-L6-v2',
'provider_resource_id': 'all-MiniLM-L6-v2', 'provider_id': 'sentence-transformers', 'type': 'model', 'owner': None, 'source':
'listed_from_provider', 'metadata': {'embedding_dimension': 384}, 'model_type': 'embedding'}
INFO 2025-09-10 14:51:47,320 console_span_processor:39 telemetry: 21:51:47.319 [END] ModelsRoutingTable.get_provider_impl [StatusCode.OK] (0.37ms)
INFO 2025-09-10 14:51:47,321 console_span_processor:48 telemetry: output:
<llama_stack.providers.inline.inference.sentence_transformers.sentence_transformers.SentenceTransformersInferenceImpl object at 0x158e83350>
INFO 2025-09-10 14:51:47,324 console_span_processor:39 telemetry: 21:51:47.323 [END] ModelsRoutingTable.get_model [StatusCode.OK] (0.26ms)
INFO 2025-09-10 14:51:47,325 console_span_processor:48 telemetry: output: {'identifier': 'sentence-transformers/all-MiniLM-L6-v2',
'provider_resource_id': 'all-MiniLM-L6-v2', 'provider_id': 'sentence-transformers', 'type': 'model', 'owner': None, 'source':
'listed_from_provider', 'metadata': {'embedding_dimension': 384}, 'model_type': 'embedding'}
INFO 2025-09-10 14:51:47,327 console_span_processor:39 telemetry: 21:51:47.326 [END] InferenceRouter.openai_embeddings [StatusCode.OK] (16.35ms)
INFO 2025-09-10 14:51:47,327 console_span_processor:48 telemetry: output: {'object': 'list', 'data': [{'object': 'embedding', 'embedding':
[0.0018660365603864193, -0.008432421833276749, -0.009860510006546974, 0.07527908682823181, -0.008166038431227207, -0.08819602429866791,
-0.025107912719249725, -0.029266025871038437, 0.014401894062757492, 0.06447950005531311, 0.04112009331583977, -0.04028748720884323,
-0.02221696823835373, -0.009235711768269539, -0.04810388386249542, -0.02784842811524868, 0.016442419961094856, -0.07583750039339066,
-0.06627479195594788, 0.01860453188419342, 0.0008918081293813884, 0.011179491877555847, -0.048671603202819824, -0.021989954635500908,
0.04990514740347862, -0.003409573109820485, -0.06727275997400284, -0.054264623671770096, -0.022502778097987175, -0.03865018114447594,
-0.0471607930958271, 0.01671769842505455, 0.024404950439929962, 0.09877222776412964, -0.01660928875207901, 0.01298862136900425,
0.02916400320827961, -0.0722617655992508, 0.041335687041282654, -0.037857454270124435, -0.02524978667497635, -0.010434110648930073, -0....
INFO 2025-09-10 14:51:47,330 console_span_processor:39 telemetry: 21:51:47.329 [END] FaissVectorIOAdapter.query_chunks [StatusCode.OK] (20.00ms)
INFO 2025-09-10 14:51:47,331 console_span_processor:48 telemetry: output: {'chunks': [{'content': 'Acme ships globally in 3-5 business days.',
'metadata': {'document_id': 'file-489db9aae0424745960e3408ff0f477f', 'token_count': 12, 'metadata_token_count': 1}, 'embedding':
[-0.012346820905804634, -0.04591671749949455, 0.00545357633382082, 0.0767817348241806, -0.01030217856168747, -0.07128783315420151,
-0.047789815813302994, -0.0042580426670610905, -0.08333089202642441, 0.03493816778063774, 0.03678377717733383, -0.022125769406557083,
-0.001785362372174859, 0.03860057145357132, 0.017692940309643745, -0.011320478282868862, 0.020480643957853317, -0.14444826543331146,
-0.03509785607457161, -0.08347956091165543, 0.01723267324268818, -0.020868107676506042, -0.04816542565822601, -0.04063615947961807,
-0.02612607553601265, -0.06816241890192032, -0.021907860413193703, -0.05328420177102089, 0.0035953382030129433, -0.060775868594646454,
-0.07895789295434952, 0.08725343644618988, -0.004096562508493662, 0.07713106274604797, 0.04764929413795471, 0.03390089422464371, -0.03...
INFO 2025-09-10 14:51:47,334 console_span_processor:39 telemetry: 21:51:47.333 [END] VectorDBsRoutingTable.openai_search_vector_store
[StatusCode.OK] (23.86ms)
INFO 2025-09-10 14:51:47,335 console_span_processor:48 telemetry: output: {'object': 'vector_store.search_results.page', 'search_query': 'How
long does shipping take?', 'data': [{'file_id': '', 'filename': '', 'score': 1.0150761400159014, 'attributes': {'document_id':
'file-489db9aae0424745960e3408ff0f477f', 'token_count': 12.0, 'metadata_token_count': 1.0}, 'content': [{'type': 'text', 'text': 'Acme ships
globally in 3-5 business days.'}]}], 'has_more': False, 'next_page': None}
INFO 2025-09-10 14:51:47,338 console_span_processor:39 telemetry: 21:51:47.336 [END] VectorIORouter.openai_search_vector_store [StatusCode.OK]
(27.52ms)
INFO 2025-09-10 14:51:47,339 console_span_processor:48 telemetry: output: {'object': 'vector_store.search_results.page', 'search_query': 'How
long does shipping take?', 'data': [{'file_id': '', 'filename': '', 'score': 1.0150761400159014, 'attributes': {'document_id':
'file-489db9aae0424745960e3408ff0f477f', 'token_count': 12.0, 'metadata_token_count': 1.0}, 'content': [{'type': 'text', 'text': 'Acme ships
globally in 3-5 business days.'}]}], 'has_more': False, 'next_page': None}
INFO 2025-09-10 14:51:47,341 console_span_processor:39 telemetry: 21:51:47.340 [END] /v1/openai/v1/vector_stores/{vector_store_id}/search
[StatusCode.OK] (32.36ms)
INFO 2025-09-10 14:51:47,342 console_span_processor:48 telemetry: raw_path:
/v1/openai/v1/vector_stores/vs_dab05212-db05-402c-91ef-57e41797406b/search
INFO 2025-09-10 14:51:47,343 console_span_processor:62 telemetry: 21:51:47.155 [INFO] 127.0.0.1:56904 - "POST
/v1/openai/v1/vector_stores/vs_dab05212-db05-402c-91ef-57e41797406b/search HTTP/1.1" 200
INFO 2025-09-10 14:51:47,343 console_span_processor:28 telemetry: 21:51:47.343 [START] /v1/openai/v1/vector_stores/{vector_store_id}/search
INFO 2025-09-10 14:51:47,348 console_span_processor:39 telemetry: 21:51:47.345 [END] ModelsRoutingTable.get_model [StatusCode.OK] (0.20ms)
INFO 2025-09-10 14:51:47,348 console_span_processor:48 telemetry: output: {'identifier': 'sentence-transformers/all-MiniLM-L6-v2',
'provider_resource_id': 'all-MiniLM-L6-v2', 'provider_id': 'sentence-transformers', 'type': 'model', 'owner': None, 'source':
'listed_from_provider', 'metadata': {'embedding_dimension': 384}, 'model_type': 'embedding'}
INFO 2025-09-10 14:51:47,352 console_span_processor:39 telemetry: 21:51:47.350 [END] ModelsRoutingTable.get_provider_impl [StatusCode.OK] (0.46ms)
INFO 2025-09-10 14:51:47,353 console_span_processor:48 telemetry: output:
<llama_stack.providers.inline.inference.sentence_transformers.sentence_transformers.SentenceTransformersInferenceImpl object at 0x158e83350>
INFO 2025-09-10 14:51:47,355 console_span_processor:39 telemetry: 21:51:47.354 [END] ModelsRoutingTable.get_model [StatusCode.OK] (0.17ms)
INFO 2025-09-10 14:51:47,356 console_span_processor:48 telemetry: output: {'identifier': 'sentence-transformers/all-MiniLM-L6-v2',
'provider_resource_id': 'all-MiniLM-L6-v2', 'provider_id': 'sentence-transformers', 'type': 'model', 'owner': None, 'source':
'listed_from_provider', 'metadata': {'embedding_dimension': 384}, 'model_type': 'embedding'}
INFO 2025-09-10 14:51:47,358 console_span_processor:39 telemetry: 21:51:47.356 [END] InferenceRouter.openai_embeddings [StatusCode.OK] (11.96ms)
INFO 2025-09-10 14:51:47,358 console_span_processor:48 telemetry: output: {'object': 'list', 'data': [{'object': 'embedding', 'embedding':
[0.0018660365603864193, -0.008432421833276749, -0.009860510006546974, 0.07527908682823181, -0.008166038431227207, -0.08819602429866791,
-0.025107912719249725, -0.029266025871038437, 0.014401894062757492, 0.06447950005531311, 0.04112009331583977, -0.04028748720884323,
-0.02221696823835373, -0.009235711768269539, -0.04810388386249542, -0.02784842811524868, 0.016442419961094856, -0.07583750039339066,
-0.06627479195594788, 0.01860453188419342, 0.0008918081293813884, 0.011179491877555847, -0.048671603202819824, -0.021989954635500908,
0.04990514740347862, -0.003409573109820485, -0.06727275997400284, -0.054264623671770096, -0.022502778097987175, -0.03865018114447594,
-0.0471607930958271, 0.01671769842505455, 0.024404950439929962, 0.09877222776412964, -0.01660928875207901, 0.01298862136900425,
0.02916400320827961, -0.0722617655992508, 0.041335687041282654, -0.037857454270124435, -0.02524978667497635, -0.010434110648930073, -0....
INFO 2025-09-10 14:51:47,363 console_span_processor:39 telemetry: 21:51:47.360 [END] FaissVectorIOAdapter.query_chunks [StatusCode.OK] (15.81ms)
INFO 2025-09-10 14:51:47,363 console_span_processor:48 telemetry: output: {'chunks': [{'content': 'Acme ships globally in 3-5 business days.',
'metadata': {'document_id': 'file-489db9aae0424745960e3408ff0f477f', 'token_count': 12, 'metadata_token_count': 1}, 'embedding':
[-0.012346820905804634, -0.04591671749949455, 0.00545357633382082, 0.0767817348241806, -0.01030217856168747, -0.07128783315420151,
-0.047789815813302994, -0.0042580426670610905, -0.08333089202642441, 0.03493816778063774, 0.03678377717733383, -0.022125769406557083,
-0.001785362372174859, 0.03860057145357132, 0.017692940309643745, -0.011320478282868862, 0.020480643957853317, -0.14444826543331146,
-0.03509785607457161, -0.08347956091165543, 0.01723267324268818, -0.020868107676506042, -0.04816542565822601, -0.04063615947961807,
-0.02612607553601265, -0.06816241890192032, -0.021907860413193703, -0.05328420177102089, 0.0035953382030129433, -0.060775868594646454,
-0.07895789295434952, 0.08725343644618988, -0.004096562508493662, 0.07713106274604797, 0.04764929413795471, 0.03390089422464371, -0.03...
INFO 2025-09-10 14:51:47,367 console_span_processor:39 telemetry: 21:51:47.365 [END] VectorDBsRoutingTable.openai_search_vector_store
[StatusCode.OK] (20.64ms)
INFO 2025-09-10 14:51:47,368 console_span_processor:48 telemetry: output: {'object': 'vector_store.search_results.page', 'search_query': 'How
long does shipping take?', 'data': [{'file_id': '', 'filename': '', 'score': 1.0150761400159014, 'attributes': {'document_id':
'file-489db9aae0424745960e3408ff0f477f', 'token_count': 12.0, 'metadata_token_count': 1.0}, 'content': [{'type': 'text', 'text': 'Acme ships
globally in 3-5 business days.'}]}], 'has_more': False, 'next_page': None}
INFO 2025-09-10 14:51:47,371 console_span_processor:39 telemetry: 21:51:47.369 [END] VectorIORouter.openai_search_vector_store [StatusCode.OK]
(25.18ms)
INFO 2025-09-10 14:51:47,371 console_span_processor:48 telemetry: output: {'object': 'vector_store.search_results.page', 'search_query': 'How
long does shipping take?', 'data': [{'file_id': '', 'filename': '', 'score': 1.0150761400159014, 'attributes': {'document_id':
'file-489db9aae0424745960e3408ff0f477f', 'token_count': 12.0, 'metadata_token_count': 1.0}, 'content': [{'type': 'text', 'text': 'Acme ships
globally in 3-5 business days.'}]}], 'has_more': False, 'next_page': None}
INFO 2025-09-10 14:51:47,376 console_span_processor:39 telemetry: 21:51:47.373 [END] /v1/openai/v1/vector_stores/{vector_store_id}/search
[StatusCode.OK] (29.29ms)
INFO 2025-09-10 14:51:47,376 console_span_processor:48 telemetry: raw_path:
/v1/openai/v1/vector_stores/vs_dab05212-db05-402c-91ef-57e41797406b/search
INFO 2025-09-10 14:51:47,377 console_span_processor:62 telemetry: 21:51:47.185 [INFO] 127.0.0.1:56904 - "POST
/v1/openai/v1/vector_stores/vs_dab05212-db05-402c-91ef-57e41797406b/search HTTP/1.1" 200
INFO 2025-09-10 14:51:47,378 console_span_processor:28 telemetry: 21:51:47.378 [START] /v1/openai/v1/vector_stores/{vector_store_id}/search
INFO 2025-09-10 14:51:47,389 console_span_processor:39 telemetry: 21:51:47.379 [END] ModelsRoutingTable.get_model [StatusCode.OK] (0.14ms)
INFO 2025-09-10 14:51:47,390 console_span_processor:48 telemetry: output: {'identifier': 'sentence-transformers/all-MiniLM-L6-v2',
'provider_resource_id': 'all-MiniLM-L6-v2', 'provider_id': 'sentence-transformers', 'type': 'model', 'owner': None, 'source':
'listed_from_provider', 'metadata': {'embedding_dimension': 384}, 'model_type': 'embedding'}
INFO 2025-09-10 14:51:47,393 console_span_processor:39 telemetry: 21:51:47.391 [END] ModelsRoutingTable.get_provider_impl [StatusCode.OK] (0.16ms)
INFO 2025-09-10 14:51:47,394 console_span_processor:48 telemetry: output:
<llama_stack.providers.inline.inference.sentence_transformers.sentence_transformers.SentenceTransformersInferenceImpl object at 0x158e83350>
INFO 2025-09-10 14:51:47,403 console_span_processor:39 telemetry: 21:51:47.395 [END] ModelsRoutingTable.get_model [StatusCode.OK] (0.17ms)
INFO 2025-09-10 14:51:47,404 console_span_processor:48 telemetry: output: {'identifier': 'sentence-transformers/all-MiniLM-L6-v2',
'provider_resource_id': 'all-MiniLM-L6-v2', 'provider_id': 'sentence-transformers', 'type': 'model', 'owner': None, 'source':
'listed_from_provider', 'metadata': {'embedding_dimension': 384}, 'model_type': 'embedding'}
INFO 2025-09-10 14:51:47,407 console_span_processor:39 telemetry: 21:51:47.405 [END] InferenceRouter.openai_embeddings [StatusCode.OK] (26.41ms)
INFO 2025-09-10 14:51:47,408 console_span_processor:48 telemetry: output: {'object': 'list', 'data': [{'object': 'embedding', 'embedding':
[0.0018660365603864193, -0.008432421833276749, -0.009860510006546974, 0.07527908682823181, -0.008166038431227207, -0.08819602429866791,
-0.025107912719249725, -0.029266025871038437, 0.014401894062757492, 0.06447950005531311, 0.04112009331583977, -0.04028748720884323,
-0.02221696823835373, -0.009235711768269539, -0.04810388386249542, -0.02784842811524868, 0.016442419961094856, -0.07583750039339066,
-0.06627479195594788, 0.01860453188419342, 0.0008918081293813884, 0.011179491877555847, -0.048671603202819824, -0.021989954635500908,
0.04990514740347862, -0.003409573109820485, -0.06727275997400284, -0.054264623671770096, -0.022502778097987175, -0.03865018114447594,
-0.0471607930958271, 0.01671769842505455, 0.024404950439929962, 0.09877222776412964, -0.01660928875207901, 0.01298862136900425,
0.02916400320827961, -0.0722617655992508, 0.041335687041282654, -0.037857454270124435, -0.02524978667497635, -0.010434110648930073, -0....
INFO 2025-09-10 14:51:47,411 console_span_processor:39 telemetry: 21:51:47.409 [END] FaissVectorIOAdapter.query_chunks [StatusCode.OK] (30.37ms)
INFO 2025-09-10 14:51:47,412 console_span_processor:48 telemetry: output: {'chunks': [{'content': 'Acme ships globally in 3-5 business days.',
'metadata': {'document_id': 'file-489db9aae0424745960e3408ff0f477f', 'token_count': 12, 'metadata_token_count': 1}, 'embedding':
[-0.012346820905804634, -0.04591671749949455, 0.00545357633382082, 0.0767817348241806, -0.01030217856168747, -0.07128783315420151,
-0.047789815813302994, -0.0042580426670610905, -0.08333089202642441, 0.03493816778063774, 0.03678377717733383, -0.022125769406557083,
-0.001785362372174859, 0.03860057145357132, 0.017692940309643745, -0.011320478282868862, 0.020480643957853317, -0.14444826543331146,
-0.03509785607457161, -0.08347956091165543, 0.01723267324268818, -0.020868107676506042, -0.04816542565822601, -0.04063615947961807,
-0.02612607553601265, -0.06816241890192032, -0.021907860413193703, -0.05328420177102089, 0.0035953382030129433, -0.060775868594646454,
-0.07895789295434952, 0.08725343644618988, -0.004096562508493662, 0.07713106274604797, 0.04764929413795471, 0.03390089422464371, -0.03...
INFO 2025-09-10 14:51:47,421 console_span_processor:39 telemetry: 21:51:47.413 [END] VectorDBsRoutingTable.openai_search_vector_store
[StatusCode.OK] (34.69ms)
INFO 2025-09-10 14:51:47,422 console_span_processor:48 telemetry: output: {'object': 'vector_store.search_results.page', 'search_query': 'How
long does shipping take?', 'data': [{'file_id': '', 'filename': '', 'score': 1.0150761400159014, 'attributes': {'document_id':
'file-489db9aae0424745960e3408ff0f477f', 'token_count': 12.0, 'metadata_token_count': 1.0}, 'content': [{'type': 'text', 'text': 'Acme ships
globally in 3-5 business days.'}]}], 'has_more': False, 'next_page': None}
INFO 2025-09-10 14:51:47,427 console_span_processor:39 telemetry: 21:51:47.423 [END] VectorIORouter.openai_search_vector_store [StatusCode.OK]
(44.73ms)
INFO 2025-09-10 14:51:47,427 console_span_processor:48 telemetry: output: {'object': 'vector_store.search_results.page', 'search_query': 'How
long does shipping take?', 'data': [{'file_id': '', 'filename': '', 'score': 1.0150761400159014, 'attributes': {'document_id':
'file-489db9aae0424745960e3408ff0f477f', 'token_count': 12.0, 'metadata_token_count': 1.0}, 'content': [{'type': 'text', 'text': 'Acme ships
globally in 3-5 business days.'}]}], 'has_more': False, 'next_page': None}
INFO 2025-09-10 14:51:47,431 console_span_processor:39 telemetry: 21:51:47.429 [END] /v1/openai/v1/vector_stores/{vector_store_id}/search
[StatusCode.OK] (50.76ms)
INFO 2025-09-10 14:51:47,432 console_span_processor:48 telemetry: raw_path:
/v1/openai/v1/vector_stores/vs_dab05212-db05-402c-91ef-57e41797406b/search
INFO 2025-09-10 14:51:47,432 console_span_processor:62 telemetry: 21:51:47.205 [INFO] 127.0.0.1:56904 - "POST
/v1/openai/v1/vector_stores/vs_dab05212-db05-402c-91ef-57e41797406b/search HTTP/1.1" 200
INFO 2025-09-10 14:51:47,433 console_span_processor:28 telemetry: 21:51:47.433 [START] /v1/openai/v1/chat/completions
INFO 2025-09-10 14:51:47,443 console_span_processor:39 telemetry: 21:51:47.435 [END] ModelsRoutingTable.get_model [StatusCode.OK] (0.16ms)
INFO 2025-09-10 14:51:47,444 console_span_processor:48 telemetry: output: {'identifier': 'together/meta-llama/Llama-3.3-70B-Instruct-Turbo',
'provider_resource_id': 'meta-llama/Llama-3.3-70B-Instruct-Turbo', 'provider_id': 'together', 'type': 'model', 'owner': None, 'source':
'listed_from_provider', 'metadata': {}, 'model_type': 'llm'}
INFO 2025-09-10 14:51:47,454 console_span_processor:39 telemetry: 21:51:47.445 [END] ModelsRoutingTable.get_provider_impl [StatusCode.OK] (0.16ms)
INFO 2025-09-10 14:51:47,455 console_span_processor:48 telemetry: output:
<llama_stack.providers.remote.inference.together.together.TogetherInferenceAdapter object at 0x137069220>
INFO 2025-09-10 14:51:47,458 console_span_processor:39 telemetry: 21:51:47.456 [END] ModelsRoutingTable.get_model [StatusCode.OK] (0.19ms)
INFO 2025-09-10 14:51:47,459 console_span_processor:48 telemetry: output: {'identifier': 'together/meta-llama/Llama-3.3-70B-Instruct-Turbo',
'provider_resource_id': 'meta-llama/Llama-3.3-70B-Instruct-Turbo', 'provider_id': 'together', 'type': 'model', 'owner': None, 'source':
'listed_from_provider', 'metadata': {}, 'model_type': 'llm'}
INFO 2025-09-10 14:51:48,137 console_span_processor:39 telemetry: 21:51:48.128 [END] TogetherInferenceAdapter.openai_chat_completion
[StatusCode.OK] (672.06ms)
INFO 2025-09-10 14:51:48,138 console_span_processor:48 telemetry: output: {'id': 'oAitaWe-62bZhn-97d22611ebfb168e', 'choices':
[{'finish_reason': 'stop', 'index': 0, 'logprobs': None, 'message': {'content': 'Thought: To answer the question "How long does shipping
take?", I need to search the provided vector store for relevant information. The vector store ID is vs_dab05212-db05-402c-91ef-57e41797406b.
I will use the Llama Stack Vector Store RAG tool to find the most relevant documents.\n\nAction: Llama Stack Vector Store RAG tool\nAction
Input: {"query": "How long does shipping take?", "vector_store_id": "vs_dab05212-db05-402c-91ef-57e41797406b", "top_k": 1}', 'refusal': None,
'role': 'assistant', 'annotations': None, 'audio': None, 'function_call': None, 'tool_calls': []}, 'seed': 12110905932316877000}], 'created':
1757541107, 'model': 'meta-llama/Llama-3.3-70B-Instruct-Turbo', 'object': 'chat.completion', 'service_tier': None, 'system_fingerprint':
None, 'usage': {'completion_tokens': 131, 'prompt_tokens': 998, 'total_tokens': 1129, 'completion_tokens_d...
INFO 2025-09-10 14:51:48,140 uvicorn.access:473 uncategorized: ::1:56900 - "POST /v1/openai/v1/chat/completions HTTP/1.1" 200
INFO 2025-09-10 14:51:48,152 console_span_processor:39 telemetry: 21:51:48.141 [END] InferenceRouter.openai_chat_completion [StatusCode.OK]
(706.73ms)
INFO 2025-09-10 14:51:48,153 console_span_processor:48 telemetry: output: {'id': 'oAitaWe-62bZhn-97d22611ebfb168e', 'choices':
[{'finish_reason': 'stop', 'index': 0, 'logprobs': None, 'message': {'content': 'Thought: To answer the question "How long does shipping
take?", I need to search the provided vector store for relevant information. The vector store ID is vs_dab05212-db05-402c-91ef-57e41797406b.
I will use the Llama Stack Vector Store RAG tool to find the most relevant documents.\n\nAction: Llama Stack Vector Store RAG tool\nAction
Input: {"query": "How long does shipping take?", "vector_store_id": "vs_dab05212-db05-402c-91ef-57e41797406b", "top_k": 1}', 'refusal': None,
'role': 'assistant', 'annotations': None, 'audio': None, 'function_call': None, 'tool_calls': None}, 'seed': 12110905932316877000}],
'created': 1757541107, 'model': 'meta-llama/Llama-3.3-70B-Instruct-Turbo', 'object': 'chat.completion', 'service_tier': None,
'system_fingerprint': None, 'usage': {'completion_tokens': 131, 'prompt_tokens': 998, 'total_tokens': 1129, 'completion_tokens...
INFO 2025-09-10 14:51:48,154 console_span_processor:62 telemetry: 21:51:48.140 [INFO] metric.prompt_tokens
INFO 2025-09-10 14:51:48,155 console_span_processor:67 telemetry: value: 998
INFO 2025-09-10 14:51:48,155 console_span_processor:67 telemetry: unit: tokens
INFO 2025-09-10 14:51:48,156 console_span_processor:67 telemetry: model_id: together/meta-llama/Llama-3.3-70B-Instruct-Turbo
INFO 2025-09-10 14:51:48,156 console_span_processor:67 telemetry: provider_id: together
INFO 2025-09-10 14:51:48,157 console_span_processor:62 telemetry: 21:51:48.140 [INFO] metric.completion_tokens
INFO 2025-09-10 14:51:48,157 console_span_processor:67 telemetry: value: 131
INFO 2025-09-10 14:51:48,158 console_span_processor:67 telemetry: unit: tokens
INFO 2025-09-10 14:51:48,158 console_span_processor:67 telemetry: model_id: together/meta-llama/Llama-3.3-70B-Instruct-Turbo
INFO 2025-09-10 14:51:48,159 console_span_processor:67 telemetry: provider_id: together
INFO 2025-09-10 14:51:48,159 console_span_processor:62 telemetry: 21:51:48.140 [INFO] metric.total_tokens
INFO 2025-09-10 14:51:48,160 console_span_processor:67 telemetry: value: 1129
INFO 2025-09-10 14:51:48,160 console_span_processor:67 telemetry: unit: tokens
INFO 2025-09-10 14:51:48,160 console_span_processor:67 telemetry: model_id: together/meta-llama/Llama-3.3-70B-Instruct-Turbo
INFO 2025-09-10 14:51:48,161 console_span_processor:67 telemetry: provider_id: together
INFO 2025-09-10 14:51:48,170 uvicorn.access:473 uncategorized: 127.0.0.1:56904 - "POST
/v1/openai/v1/vector_stores/vs_dab05212-db05-402c-91ef-57e41797406b/search HTTP/1.1" 200
INFO 2025-09-10 14:51:48,182 console_span_processor:39 telemetry: 21:51:48.162 [END] /v1/openai/v1/chat/completions [StatusCode.OK] (728.49ms)
INFO 2025-09-10 14:51:48,183 console_span_processor:48 telemetry: raw_path: /v1/openai/v1/chat/completions
INFO 2025-09-10 14:51:48,183 console_span_processor:62 telemetry: 21:51:48.141 [INFO] ::1:56900 - "POST /v1/openai/v1/chat/completions HTTP/1.1"
200
INFO 2025-09-10 14:51:48,184 console_span_processor:28 telemetry: 21:51:48.184 [START] /v1/openai/v1/vector_stores/{vector_store_id}/search
INFO 2025-09-10 14:51:48,189 console_span_processor:39 telemetry: 21:51:48.187 [END] ModelsRoutingTable.get_model [StatusCode.OK] (0.65ms)
INFO 2025-09-10 14:51:48,190 console_span_processor:48 telemetry: output: {'identifier': 'sentence-transformers/all-MiniLM-L6-v2',
'provider_resource_id': 'all-MiniLM-L6-v2', 'provider_id': 'sentence-transformers', 'type': 'model', 'owner': None, 'source':
'listed_from_provider', 'metadata': {'embedding_dimension': 384}, 'model_type': 'embedding'}
INFO 2025-09-10 14:51:48,198 uvicorn.access:473 uncategorized: 127.0.0.1:56904 - "POST
/v1/openai/v1/vector_stores/vs_dab05212-db05-402c-91ef-57e41797406b/search HTTP/1.1" 200
INFO 2025-09-10 14:51:48,199 console_span_processor:39 telemetry: 21:51:48.191 [END] ModelsRoutingTable.get_provider_impl [StatusCode.OK] (0.29ms)
INFO 2025-09-10 14:51:48,201 console_span_processor:48 telemetry: output:
<llama_stack.providers.inline.inference.sentence_transformers.sentence_transformers.SentenceTransformersInferenceImpl object at 0x158e83350>
INFO 2025-09-10 14:51:48,211 console_span_processor:39 telemetry: 21:51:48.204 [END] ModelsRoutingTable.get_model [StatusCode.OK] (1.00ms)
INFO 2025-09-10 14:51:48,213 console_span_processor:48 telemetry: output: {'identifier': 'sentence-transformers/all-MiniLM-L6-v2',
'provider_resource_id': 'all-MiniLM-L6-v2', 'provider_id': 'sentence-transformers', 'type': 'model', 'owner': None, 'source':
'listed_from_provider', 'metadata': {'embedding_dimension': 384}, 'model_type': 'embedding'}
INFO 2025-09-10 14:51:48,217 console_span_processor:39 telemetry: 21:51:48.215 [END] InferenceRouter.openai_embeddings [StatusCode.OK] (28.70ms)
INFO 2025-09-10 14:51:48,218 console_span_processor:48 telemetry: output: {'object': 'list', 'data': [{'object': 'embedding', 'embedding':
[0.0018660365603864193, -0.008432421833276749, -0.009860510006546974, 0.07527908682823181, -0.008166038431227207, -0.08819602429866791,
-0.025107912719249725, -0.029266025871038437, 0.014401894062757492, 0.06447950005531311, 0.04112009331583977, -0.04028748720884323,
-0.02221696823835373, -0.009235711768269539, -0.04810388386249542, -0.02784842811524868, 0.016442419961094856, -0.07583750039339066,
-0.06627479195594788, 0.01860453188419342, 0.0008918081293813884, 0.011179491877555847, -0.048671603202819824, -0.021989954635500908,
0.04990514740347862, -0.003409573109820485, -0.06727275997400284, -0.054264623671770096, -0.022502778097987175, -0.03865018114447594,
-0.0471607930958271, 0.01671769842505455, 0.024404950439929962, 0.09877222776412964, -0.01660928875207901, 0.01298862136900425,
0.02916400320827961, -0.0722617655992508, 0.041335687041282654, -0.037857454270124435, -0.02524978667497635, -0.010434110648930073, -0....
INFO 2025-09-10 14:51:48,226 console_span_processor:39 telemetry: 21:51:48.221 [END] FaissVectorIOAdapter.query_chunks [StatusCode.OK] (35.89ms)
INFO 2025-09-10 14:51:48,227 console_span_processor:48 telemetry: output: {'chunks': [{'content': 'Acme ships globally in 3-5 business days.',
'metadata': {'document_id': 'file-489db9aae0424745960e3408ff0f477f', 'token_count': 12, 'metadata_token_count': 1}, 'embedding':
[-0.012346820905804634, -0.04591671749949455, 0.00545357633382082, 0.0767817348241806, -0.01030217856168747, -0.07128783315420151,
-0.047789815813302994, -0.0042580426670610905, -0.08333089202642441, 0.03493816778063774, 0.03678377717733383, -0.022125769406557083,
-0.001785362372174859, 0.03860057145357132, 0.017692940309643745, -0.011320478282868862, 0.020480643957853317, -0.14444826543331146,
-0.03509785607457161, -0.08347956091165543, 0.01723267324268818, -0.020868107676506042, -0.04816542565822601, -0.04063615947961807,
-0.02612607553601265, -0.06816241890192032, -0.021907860413193703, -0.05328420177102089, 0.0035953382030129433, -0.060775868594646454,
-0.07895789295434952, 0.08725343644618988, -0.004096562508493662, 0.07713106274604797, 0.04764929413795471, 0.03390089422464371, -0.03...
INFO 2025-09-10 14:51:48,235 uvicorn.access:473 uncategorized: 127.0.0.1:56904 - "POST
/v1/openai/v1/vector_stores/vs_dab05212-db05-402c-91ef-57e41797406b/search HTTP/1.1" 200
INFO 2025-09-10 14:51:48,239 console_span_processor:39 telemetry: 21:51:48.229 [END] VectorDBsRoutingTable.openai_search_vector_store
[StatusCode.OK] (44.29ms)
INFO 2025-09-10 14:51:48,241 console_span_processor:48 telemetry: output: {'object': 'vector_store.search_results.page', 'search_query': 'How
long does shipping take?', 'data': [{'file_id': '', 'filename': '', 'score': 1.0150761400159014, 'attributes': {'document_id':
'file-489db9aae0424745960e3408ff0f477f', 'token_count': 12.0, 'metadata_token_count': 1.0}, 'content': [{'type': 'text', 'text': 'Acme ships
globally in 3-5 business days.'}]}], 'has_more': False, 'next_page': None}
INFO 2025-09-10 14:51:48,252 uvicorn.access:473 uncategorized: 127.0.0.1:56904 - "POST
/v1/openai/v1/vector_stores/vs_dab05212-db05-402c-91ef-57e41797406b/search HTTP/1.1" 200
INFO 2025-09-10 14:51:48,252 console_span_processor:39 telemetry: 21:51:48.242 [END] VectorIORouter.openai_search_vector_store [StatusCode.OK]
(57.30ms)
INFO 2025-09-10 14:51:48,253 console_span_processor:48 telemetry: output: {'object': 'vector_store.search_results.page', 'search_query': 'How
long does shipping take?', 'data': [{'file_id': '', 'filename': '', 'score': 1.0150761400159014, 'attributes': {'document_id':
'file-489db9aae0424745960e3408ff0f477f', 'token_count': 12.0, 'metadata_token_count': 1.0}, 'content': [{'type': 'text', 'text': 'Acme ships
globally in 3-5 business days.'}]}], 'has_more': False, 'next_page': None}
INFO 2025-09-10 14:51:48,265 console_span_processor:39 telemetry: 21:51:48.255 [END] /v1/openai/v1/vector_stores/{vector_store_id}/search
[StatusCode.OK] (70.68ms)
INFO 2025-09-10 14:51:48,266 console_span_processor:48 telemetry: raw_path:
/v1/openai/v1/vector_stores/vs_dab05212-db05-402c-91ef-57e41797406b/search
INFO 2025-09-10 14:51:48,267 console_span_processor:62 telemetry: 21:51:48.171 [INFO] 127.0.0.1:56904 - "POST
/v1/openai/v1/vector_stores/vs_dab05212-db05-402c-91ef-57e41797406b/search HTTP/1.1" 200
INFO 2025-09-10 14:51:48,268 console_span_processor:28 telemetry: 21:51:48.268 [START] /v1/openai/v1/vector_stores/{vector_store_id}/search
INFO 2025-09-10 14:51:48,271 console_span_processor:39 telemetry: 21:51:48.270 [END] ModelsRoutingTable.get_model [StatusCode.OK] (0.24ms)
INFO 2025-09-10 14:51:48,272 console_span_processor:48 telemetry: output: {'identifier': 'sentence-transformers/all-MiniLM-L6-v2',
'provider_resource_id': 'all-MiniLM-L6-v2', 'provider_id': 'sentence-transformers', 'type': 'model', 'owner': None, 'source':
'listed_from_provider', 'metadata': {'embedding_dimension': 384}, 'model_type': 'embedding'}
INFO 2025-09-10 14:51:48,275 console_span_processor:39 telemetry: 21:51:48.273 [END] ModelsRoutingTable.get_provider_impl [StatusCode.OK] (0.24ms)
INFO 2025-09-10 14:51:48,276 console_span_processor:48 telemetry: output:
<llama_stack.providers.inline.inference.sentence_transformers.sentence_transformers.SentenceTransformersInferenceImpl object at 0x158e83350>
INFO 2025-09-10 14:51:48,280 uvicorn.access:473 uncategorized: 127.0.0.1:56904 - "POST
/v1/openai/v1/vector_stores/vs_dab05212-db05-402c-91ef-57e41797406b/search HTTP/1.1" 200
INFO 2025-09-10 14:51:48,283 console_span_processor:39 telemetry: 21:51:48.277 [END] ModelsRoutingTable.get_model [StatusCode.OK] (0.16ms)
INFO 2025-09-10 14:51:48,284 console_span_processor:48 telemetry: output: {'identifier': 'sentence-transformers/all-MiniLM-L6-v2',
'provider_resource_id': 'all-MiniLM-L6-v2', 'provider_id': 'sentence-transformers', 'type': 'model', 'owner': None, 'source':
'listed_from_provider', 'metadata': {'embedding_dimension': 384}, 'model_type': 'embedding'}
INFO 2025-09-10 14:51:48,294 console_span_processor:39 telemetry: 21:51:48.287 [END] InferenceRouter.openai_embeddings [StatusCode.OK] (18.00ms)
INFO 2025-09-10 14:51:48,294 console_span_processor:48 telemetry: output: {'object': 'list', 'data': [{'object': 'embedding', 'embedding':
[0.0018660365603864193, -0.008432421833276749, -0.009860510006546974, 0.07527908682823181, -0.008166038431227207, -0.08819602429866791,
-0.025107912719249725, -0.029266025871038437, 0.014401894062757492, 0.06447950005531311, 0.04112009331583977, -0.04028748720884323,
-0.02221696823835373, -0.009235711768269539, -0.04810388386249542, -0.02784842811524868, 0.016442419961094856, -0.07583750039339066,
-0.06627479195594788, 0.01860453188419342, 0.0008918081293813884, 0.011179491877555847, -0.048671603202819824, -0.021989954635500908,
0.04990514740347862, -0.003409573109820485, -0.06727275997400284, -0.054264623671770096, -0.022502778097987175, -0.03865018114447594,
-0.0471607930958271, 0.01671769842505455, 0.024404950439929962, 0.09877222776412964, -0.01660928875207901, 0.01298862136900425,
0.02916400320827961, -0.0722617655992508, 0.041335687041282654, -0.037857454270124435, -0.02524978667497635, -0.010434110648930073, -0....
INFO 2025-09-10 14:51:48,298 uvicorn.access:473 uncategorized: 127.0.0.1:56904 - "POST
/v1/openai/v1/vector_stores/vs_dab05212-db05-402c-91ef-57e41797406b/search HTTP/1.1" 200
INFO 2025-09-10 14:51:48,307 console_span_processor:39 telemetry: 21:51:48.296 [END] FaissVectorIOAdapter.query_chunks [StatusCode.OK] (27.38ms)
INFO 2025-09-10 14:51:48,308 console_span_processor:48 telemetry: output: {'chunks': [{'content': 'Acme ships globally in 3-5 business days.',
'metadata': {'document_id': 'file-489db9aae0424745960e3408ff0f477f', 'token_count': 12, 'metadata_token_count': 1}, 'embedding':
[-0.012346820905804634, -0.04591671749949455, 0.00545357633382082, 0.0767817348241806, -0.01030217856168747, -0.07128783315420151,
-0.047789815813302994, -0.0042580426670610905, -0.08333089202642441, 0.03493816778063774, 0.03678377717733383, -0.022125769406557083,
-0.001785362372174859, 0.03860057145357132, 0.017692940309643745, -0.011320478282868862, 0.020480643957853317, -0.14444826543331146,
-0.03509785607457161, -0.08347956091165543, 0.01723267324268818, -0.020868107676506042, -0.04816542565822601, -0.04063615947961807,
-0.02612607553601265, -0.06816241890192032, -0.021907860413193703, -0.05328420177102089, 0.0035953382030129433, -0.060775868594646454,
-0.07895789295434952, 0.08725343644618988, -0.004096562508493662, 0.07713106274604797, 0.04764929413795471, 0.03390089422464371, -0.03...
INFO 2025-09-10 14:51:48,330 console_span_processor:39 telemetry: 21:51:48.309 [END] VectorDBsRoutingTable.openai_search_vector_store
[StatusCode.OK] (40.46ms)
INFO 2025-09-10 14:51:48,331 console_span_processor:48 telemetry: output: {'object': 'vector_store.search_results.page', 'search_query': 'How
long does shipping take?', 'data': [{'file_id': '', 'filename': '', 'score': 1.0150761400159014, 'attributes': {'document_id':
'file-489db9aae0424745960e3408ff0f477f', 'token_count': 12.0, 'metadata_token_count': 1.0}, 'content': [{'type': 'text', 'text': 'Acme ships
globally in 3-5 business days.'}]}], 'has_more': False, 'next_page': None}
INFO 2025-09-10 14:51:48,334 console_span_processor:39 telemetry: 21:51:48.332 [END] VectorIORouter.openai_search_vector_store [StatusCode.OK]
(63.81ms)
INFO 2025-09-10 14:51:48,334 console_span_processor:48 telemetry: output: {'object': 'vector_store.search_results.page', 'search_query': 'How
long does shipping take?', 'data': [{'file_id': '', 'filename': '', 'score': 1.0150761400159014, 'attributes': {'document_id':
'file-489db9aae0424745960e3408ff0f477f', 'token_count': 12.0, 'metadata_token_count': 1.0}, 'content': [{'type': 'text', 'text': 'Acme ships
globally in 3-5 business days.'}]}], 'has_more': False, 'next_page': None}
INFO 2025-09-10 14:51:48,359 console_span_processor:39 telemetry: 21:51:48.336 [END] /v1/openai/v1/vector_stores/{vector_store_id}/search
[StatusCode.OK] (67.91ms)
INFO 2025-09-10 14:51:48,360 console_span_processor:48 telemetry: raw_path:
/v1/openai/v1/vector_stores/vs_dab05212-db05-402c-91ef-57e41797406b/search
INFO 2025-09-10 14:51:48,360 console_span_processor:62 telemetry: 21:51:48.199 [INFO] 127.0.0.1:56904 - "POST
/v1/openai/v1/vector_stores/vs_dab05212-db05-402c-91ef-57e41797406b/search HTTP/1.1" 200
INFO 2025-09-10 14:51:48,361 console_span_processor:28 telemetry: 21:51:48.361 [START] /v1/openai/v1/vector_stores/{vector_store_id}/search
INFO 2025-09-10 14:51:48,364 console_span_processor:39 telemetry: 21:51:48.363 [END] ModelsRoutingTable.get_model [StatusCode.OK] (0.18ms)
INFO 2025-09-10 14:51:48,365 console_span_processor:48 telemetry: output: {'identifier': 'sentence-transformers/all-MiniLM-L6-v2',
'provider_resource_id': 'all-MiniLM-L6-v2', 'provider_id': 'sentence-transformers', 'type': 'model', 'owner': None, 'source':
'listed_from_provider', 'metadata': {'embedding_dimension': 384}, 'model_type': 'embedding'}
INFO 2025-09-10 14:51:48,369 console_span_processor:39 telemetry: 21:51:48.367 [END] ModelsRoutingTable.get_provider_impl [StatusCode.OK] (0.16ms)
INFO 2025-09-10 14:51:48,369 console_span_processor:48 telemetry: output:
<llama_stack.providers.inline.inference.sentence_transformers.sentence_transformers.SentenceTransformersInferenceImpl object at 0x158e83350>
INFO 2025-09-10 14:51:48,373 console_span_processor:39 telemetry: 21:51:48.371 [END] ModelsRoutingTable.get_model [StatusCode.OK] (0.32ms)
INFO 2025-09-10 14:51:48,374 console_span_processor:48 telemetry: output: {'identifier': 'sentence-transformers/all-MiniLM-L6-v2',
'provider_resource_id': 'all-MiniLM-L6-v2', 'provider_id': 'sentence-transformers', 'type': 'model', 'owner': None, 'source':
'listed_from_provider', 'metadata': {'embedding_dimension': 384}, 'model_type': 'embedding'}
INFO 2025-09-10 14:51:48,377 console_span_processor:39 telemetry: 21:51:48.375 [END] InferenceRouter.openai_embeddings [StatusCode.OK] (12.40ms)
INFO 2025-09-10 14:51:48,378 console_span_processor:48 telemetry: output: {'object': 'list', 'data': [{'object': 'embedding', 'embedding':
[0.0018660365603864193, -0.008432421833276749, -0.009860510006546974, 0.07527908682823181, -0.008166038431227207, -0.08819602429866791,
-0.025107912719249725, -0.029266025871038437, 0.014401894062757492, 0.06447950005531311, 0.04112009331583977, -0.04028748720884323,
-0.02221696823835373, -0.009235711768269539, -0.04810388386249542, -0.02784842811524868, 0.016442419961094856, -0.07583750039339066,
-0.06627479195594788, 0.01860453188419342, 0.0008918081293813884, 0.011179491877555847, -0.048671603202819824, -0.021989954635500908,
0.04990514740347862, -0.003409573109820485, -0.06727275997400284, -0.054264623671770096, -0.022502778097987175, -0.03865018114447594,
-0.0471607930958271, 0.01671769842505455, 0.024404950439929962, 0.09877222776412964, -0.01660928875207901, 0.01298862136900425,
0.02916400320827961, -0.0722617655992508, 0.041335687041282654, -0.037857454270124435, -0.02524978667497635, -0.010434110648930073, -0....
INFO 2025-09-10 14:51:48,383 console_span_processor:39 telemetry: 21:51:48.379 [END] FaissVectorIOAdapter.query_chunks [StatusCode.OK] (16.82ms)
INFO 2025-09-10 14:51:48,383 console_span_processor:48 telemetry: output: {'chunks': [{'content': 'Acme ships globally in 3-5 business days.',
'metadata': {'document_id': 'file-489db9aae0424745960e3408ff0f477f', 'token_count': 12, 'metadata_token_count': 1}, 'embedding':
[-0.012346820905804634, -0.04591671749949455, 0.00545357633382082, 0.0767817348241806, -0.01030217856168747, -0.07128783315420151,
-0.047789815813302994, -0.0042580426670610905, -0.08333089202642441, 0.03493816778063774, 0.03678377717733383, -0.022125769406557083,
-0.001785362372174859, 0.03860057145357132, 0.017692940309643745, -0.011320478282868862, 0.020480643957853317, -0.14444826543331146,
-0.03509785607457161, -0.08347956091165543, 0.01723267324268818, -0.020868107676506042, -0.04816542565822601, -0.04063615947961807,
-0.02612607553601265, -0.06816241890192032, -0.021907860413193703, -0.05328420177102089, 0.0035953382030129433, -0.060775868594646454,
-0.07895789295434952, 0.08725343644618988, -0.004096562508493662, 0.07713106274604797, 0.04764929413795471, 0.03390089422464371, -0.03...
INFO 2025-09-10 14:51:48,395 console_span_processor:39 telemetry: 21:51:48.385 [END] VectorDBsRoutingTable.openai_search_vector_store
[StatusCode.OK] (22.60ms)
INFO 2025-09-10 14:51:48,396 console_span_processor:48 telemetry: output: {'object': 'vector_store.search_results.page', 'search_query': 'How
long does shipping take?', 'data': [{'file_id': '', 'filename': '', 'score': 1.0150761400159014, 'attributes': {'document_id':
'file-489db9aae0424745960e3408ff0f477f', 'token_count': 12.0, 'metadata_token_count': 1.0}, 'content': [{'type': 'text', 'text': 'Acme ships
globally in 3-5 business days.'}]}], 'has_more': False, 'next_page': None}
INFO 2025-09-10 14:51:48,409 console_span_processor:39 telemetry: 21:51:48.397 [END] VectorIORouter.openai_search_vector_store [StatusCode.OK]
(35.03ms)
INFO 2025-09-10 14:51:48,414 console_span_processor:48 telemetry: output: {'object': 'vector_store.search_results.page', 'search_query': 'How
long does shipping take?', 'data': [{'file_id': '', 'filename': '', 'score': 1.0150761400159014, 'attributes': {'document_id':
'file-489db9aae0424745960e3408ff0f477f', 'token_count': 12.0, 'metadata_token_count': 1.0}, 'content': [{'type': 'text', 'text': 'Acme ships
globally in 3-5 business days.'}]}], 'has_more': False, 'next_page': None}
INFO 2025-09-10 14:51:48,429 console_span_processor:39 telemetry: 21:51:48.418 [END] /v1/openai/v1/vector_stores/{vector_store_id}/search
[StatusCode.OK] (57.22ms)
INFO 2025-09-10 14:51:48,432 console_span_processor:48 telemetry: raw_path:
/v1/openai/v1/vector_stores/vs_dab05212-db05-402c-91ef-57e41797406b/search
INFO 2025-09-10 14:51:48,433 console_span_processor:62 telemetry: 21:51:48.235 [INFO] 127.0.0.1:56904 - "POST
/v1/openai/v1/vector_stores/vs_dab05212-db05-402c-91ef-57e41797406b/search HTTP/1.1" 200
INFO 2025-09-10 14:51:48,435 console_span_processor:28 telemetry: 21:51:48.435 [START] /v1/openai/v1/vector_stores/{vector_store_id}/search
INFO 2025-09-10 14:51:48,449 console_span_processor:39 telemetry: 21:51:48.438 [END] ModelsRoutingTable.get_model [StatusCode.OK] (0.17ms)
INFO 2025-09-10 14:51:48,449 console_span_processor:48 telemetry: output: {'identifier': 'sentence-transformers/all-MiniLM-L6-v2',
'provider_resource_id': 'all-MiniLM-L6-v2', 'provider_id': 'sentence-transformers', 'type': 'model', 'owner': None, 'source':
'listed_from_provider', 'metadata': {'embedding_dimension': 384}, 'model_type': 'embedding'}
INFO 2025-09-10 14:51:48,464 console_span_processor:39 telemetry: 21:51:48.451 [END] ModelsRoutingTable.get_provider_impl [StatusCode.OK] (0.28ms)
INFO 2025-09-10 14:51:48,465 console_span_processor:48 telemetry: output:
<llama_stack.providers.inline.inference.sentence_transformers.sentence_transformers.SentenceTransformersInferenceImpl object at 0x158e83350>
INFO 2025-09-10 14:51:48,472 console_span_processor:39 telemetry: 21:51:48.467 [END] ModelsRoutingTable.get_model [StatusCode.OK] (0.19ms)
INFO 2025-09-10 14:51:48,473 console_span_processor:48 telemetry: output: {'identifier': 'sentence-transformers/all-MiniLM-L6-v2',
'provider_resource_id': 'all-MiniLM-L6-v2', 'provider_id': 'sentence-transformers', 'type': 'model', 'owner': None, 'source':
'listed_from_provider', 'metadata': {'embedding_dimension': 384}, 'model_type': 'embedding'}
INFO 2025-09-10 14:51:48,477 console_span_processor:39 telemetry: 21:51:48.475 [END] InferenceRouter.openai_embeddings [StatusCode.OK] (37.21ms)
INFO 2025-09-10 14:51:48,478 console_span_processor:48 telemetry: output: {'object': 'list', 'data': [{'object': 'embedding', 'embedding':
[0.0018660365603864193, -0.008432421833276749, -0.009860510006546974, 0.07527908682823181, -0.008166038431227207, -0.08819602429866791,
-0.025107912719249725, -0.029266025871038437, 0.014401894062757492, 0.06447950005531311, 0.04112009331583977, -0.04028748720884323,
-0.02221696823835373, -0.009235711768269539, -0.04810388386249542, -0.02784842811524868, 0.016442419961094856, -0.07583750039339066,
-0.06627479195594788, 0.01860453188419342, 0.0008918081293813884, 0.011179491877555847, -0.048671603202819824, -0.021989954635500908,
0.04990514740347862, -0.003409573109820485, -0.06727275997400284, -0.054264623671770096, -0.022502778097987175, -0.03865018114447594,
-0.0471607930958271, 0.01671769842505455, 0.024404950439929962, 0.09877222776412964, -0.01660928875207901, 0.01298862136900425,
0.02916400320827961, -0.0722617655992508, 0.041335687041282654, -0.037857454270124435, -0.02524978667497635, -0.010434110648930073, -0....
INFO 2025-09-10 14:51:48,482 console_span_processor:39 telemetry: 21:51:48.480 [END] FaissVectorIOAdapter.query_chunks [StatusCode.OK] (42.48ms)
INFO 2025-09-10 14:51:48,483 console_span_processor:48 telemetry: output: {'chunks': [{'content': 'Acme ships globally in 3-5 business days.',
'metadata': {'document_id': 'file-489db9aae0424745960e3408ff0f477f', 'token_count': 12, 'metadata_token_count': 1}, 'embedding':
[-0.012346820905804634, -0.04591671749949455, 0.00545357633382082, 0.0767817348241806, -0.01030217856168747, -0.07128783315420151,
-0.047789815813302994, -0.0042580426670610905, -0.08333089202642441, 0.03493816778063774, 0.03678377717733383, -0.022125769406557083,
-0.001785362372174859, 0.03860057145357132, 0.017692940309643745, -0.011320478282868862, 0.020480643957853317, -0.14444826543331146,
-0.03509785607457161, -0.08347956091165543, 0.01723267324268818, -0.020868107676506042, -0.04816542565822601, -0.04063615947961807,
-0.02612607553601265, -0.06816241890192032, -0.021907860413193703, -0.05328420177102089, 0.0035953382030129433, -0.060775868594646454,
-0.07895789295434952, 0.08725343644618988, -0.004096562508493662, 0.07713106274604797, 0.04764929413795471, 0.03390089422464371, -0.03...
INFO 2025-09-10 14:51:48,486 console_span_processor:39 telemetry: 21:51:48.485 [END] VectorDBsRoutingTable.openai_search_vector_store
[StatusCode.OK] (47.47ms)
INFO 2025-09-10 14:51:48,487 console_span_processor:48 telemetry: output: {'object': 'vector_store.search_results.page', 'search_query': 'How
long does shipping take?', 'data': [{'file_id': '', 'filename': '', 'score': 1.0150761400159014, 'attributes': {'document_id':
'file-489db9aae0424745960e3408ff0f477f', 'token_count': 12.0, 'metadata_token_count': 1.0}, 'content': [{'type': 'text', 'text': 'Acme ships
globally in 3-5 business days.'}]}], 'has_more': False, 'next_page': None}
INFO 2025-09-10 14:51:48,492 console_span_processor:39 telemetry: 21:51:48.488 [END] VectorIORouter.openai_search_vector_store [StatusCode.OK]
(51.57ms)
INFO 2025-09-10 14:51:48,492 console_span_processor:48 telemetry: output: {'object': 'vector_store.search_results.page', 'search_query': 'How
long does shipping take?', 'data': [{'file_id': '', 'filename': '', 'score': 1.0150761400159014, 'attributes': {'document_id':
'file-489db9aae0424745960e3408ff0f477f', 'token_count': 12.0, 'metadata_token_count': 1.0}, 'content': [{'type': 'text', 'text': 'Acme ships
globally in 3-5 business days.'}]}], 'has_more': False, 'next_page': None}
INFO 2025-09-10 14:51:48,501 console_span_processor:39 telemetry: 21:51:48.494 [END] /v1/openai/v1/vector_stores/{vector_store_id}/search
[StatusCode.OK] (58.89ms)
INFO 2025-09-10 14:51:48,502 console_span_processor:48 telemetry: raw_path:
/v1/openai/v1/vector_stores/vs_dab05212-db05-402c-91ef-57e41797406b/search
INFO 2025-09-10 14:51:48,503 console_span_processor:62 telemetry: 21:51:48.252 [INFO] 127.0.0.1:56904 - "POST
/v1/openai/v1/vector_stores/vs_dab05212-db05-402c-91ef-57e41797406b/search HTTP/1.1" 200
INFO 2025-09-10 14:51:48,504 console_span_processor:28 telemetry: 21:51:48.504 [START] /v1/openai/v1/vector_stores/{vector_store_id}/search
INFO 2025-09-10 14:51:48,511 console_span_processor:39 telemetry: 21:51:48.505 [END] ModelsRoutingTable.get_model [StatusCode.OK] (0.15ms)
INFO 2025-09-10 14:51:48,511 console_span_processor:48 telemetry: output: {'identifier': 'sentence-transformers/all-MiniLM-L6-v2',
'provider_resource_id': 'all-MiniLM-L6-v2', 'provider_id': 'sentence-transformers', 'type': 'model', 'owner': None, 'source':
'listed_from_provider', 'metadata': {'embedding_dimension': 384}, 'model_type': 'embedding'}
INFO 2025-09-10 14:51:48,518 console_span_processor:39 telemetry: 21:51:48.512 [END] ModelsRoutingTable.get_provider_impl [StatusCode.OK] (0.17ms)
INFO 2025-09-10 14:51:48,519 console_span_processor:48 telemetry: output:
<llama_stack.providers.inline.inference.sentence_transformers.sentence_transformers.SentenceTransformersInferenceImpl object at 0x158e83350>
INFO 2025-09-10 14:51:48,546 console_span_processor:39 telemetry: 21:51:48.521 [END] ModelsRoutingTable.get_model [StatusCode.OK] (0.38ms)
INFO 2025-09-10 14:51:48,547 console_span_processor:48 telemetry: output: {'identifier': 'sentence-transformers/all-MiniLM-L6-v2',
'provider_resource_id': 'all-MiniLM-L6-v2', 'provider_id': 'sentence-transformers', 'type': 'model', 'owner': None, 'source':
'listed_from_provider', 'metadata': {'embedding_dimension': 384}, 'model_type': 'embedding'}
INFO 2025-09-10 14:51:48,557 console_span_processor:39 telemetry: 21:51:48.550 [END] InferenceRouter.openai_embeddings [StatusCode.OK] (44.66ms)
INFO 2025-09-10 14:51:48,558 console_span_processor:48 telemetry: output: {'object': 'list', 'data': [{'object': 'embedding', 'embedding':
[0.0018660365603864193, -0.008432421833276749, -0.009860510006546974, 0.07527908682823181, -0.008166038431227207, -0.08819602429866791,
-0.025107912719249725, -0.029266025871038437, 0.014401894062757492, 0.06447950005531311, 0.04112009331583977, -0.04028748720884323,
-0.02221696823835373, -0.009235711768269539, -0.04810388386249542, -0.02784842811524868, 0.016442419961094856, -0.07583750039339066,
-0.06627479195594788, 0.01860453188419342, 0.0008918081293813884, 0.011179491877555847, -0.048671603202819824, -0.021989954635500908,
0.04990514740347862, -0.003409573109820485, -0.06727275997400284, -0.054264623671770096, -0.022502778097987175, -0.03865018114447594,
-0.0471607930958271, 0.01671769842505455, 0.024404950439929962, 0.09877222776412964, -0.01660928875207901, 0.01298862136900425,
0.02916400320827961, -0.0722617655992508, 0.041335687041282654, -0.037857454270124435, -0.02524978667497635, -0.010434110648930073, -0....
INFO 2025-09-10 14:51:48,563 console_span_processor:39 telemetry: 21:51:48.559 [END] FaissVectorIOAdapter.query_chunks [StatusCode.OK] (54.51ms)
INFO 2025-09-10 14:51:48,564 console_span_processor:48 telemetry: output: {'chunks': [{'content': 'Acme ships globally in 3-5 business days.',
'metadata': {'document_id': 'file-489db9aae0424745960e3408ff0f477f', 'token_count': 12, 'metadata_token_count': 1}, 'embedding':
[-0.012346820905804634, -0.04591671749949455, 0.00545357633382082, 0.0767817348241806, -0.01030217856168747, -0.07128783315420151,
-0.047789815813302994, -0.0042580426670610905, -0.08333089202642441, 0.03493816778063774, 0.03678377717733383, -0.022125769406557083,
-0.001785362372174859, 0.03860057145357132, 0.017692940309643745, -0.011320478282868862, 0.020480643957853317, -0.14444826543331146,
-0.03509785607457161, -0.08347956091165543, 0.01723267324268818, -0.020868107676506042, -0.04816542565822601, -0.04063615947961807,
-0.02612607553601265, -0.06816241890192032, -0.021907860413193703, -0.05328420177102089, 0.0035953382030129433, -0.060775868594646454,
-0.07895789295434952, 0.08725343644618988, -0.004096562508493662, 0.07713106274604797, 0.04764929413795471, 0.03390089422464371, -0.03...
INFO 2025-09-10 14:51:48,570 console_span_processor:39 telemetry: 21:51:48.565 [END] VectorDBsRoutingTable.openai_search_vector_store
[StatusCode.OK] (60.37ms)
INFO 2025-09-10 14:51:48,571 console_span_processor:48 telemetry: output: {'object': 'vector_store.search_results.page', 'search_query': 'How
long does shipping take?', 'data': [{'file_id': '', 'filename': '', 'score': 1.0150761400159014, 'attributes': {'document_id':
'file-489db9aae0424745960e3408ff0f477f', 'token_count': 12.0, 'metadata_token_count': 1.0}, 'content': [{'type': 'text', 'text': 'Acme ships
globally in 3-5 business days.'}]}], 'has_more': False, 'next_page': None}
INFO 2025-09-10 14:51:48,573 console_span_processor:39 telemetry: 21:51:48.572 [END] VectorIORouter.openai_search_vector_store [StatusCode.OK]
(67.76ms)
INFO 2025-09-10 14:51:48,574 console_span_processor:48 telemetry: output: {'object': 'vector_store.search_results.page', 'search_query': 'How
long does shipping take?', 'data': [{'file_id': '', 'filename': '', 'score': 1.0150761400159014, 'attributes': {'document_id':
'file-489db9aae0424745960e3408ff0f477f', 'token_count': 12.0, 'metadata_token_count': 1.0}, 'content': [{'type': 'text', 'text': 'Acme ships
globally in 3-5 business days.'}]}], 'has_more': False, 'next_page': None}
INFO 2025-09-10 14:51:48,577 console_span_processor:39 telemetry: 21:51:48.575 [END] /v1/openai/v1/vector_stores/{vector_store_id}/search
[StatusCode.OK] (71.71ms)
INFO 2025-09-10 14:51:48,577 console_span_processor:48 telemetry: raw_path:
/v1/openai/v1/vector_stores/vs_dab05212-db05-402c-91ef-57e41797406b/search
INFO 2025-09-10 14:51:48,578 console_span_processor:62 telemetry: 21:51:48.280 [INFO] 127.0.0.1:56904 - "POST
/v1/openai/v1/vector_stores/vs_dab05212-db05-402c-91ef-57e41797406b/search HTTP/1.1" 200
INFO 2025-09-10 14:51:48,579 console_span_processor:28 telemetry: 21:51:48.579 [START] /v1/openai/v1/vector_stores/{vector_store_id}/search
INFO 2025-09-10 14:51:48,587 console_span_processor:39 telemetry: 21:51:48.582 [END] ModelsRoutingTable.get_model [StatusCode.OK] (0.48ms)
INFO 2025-09-10 14:51:48,588 console_span_processor:48 telemetry: output: {'identifier': 'sentence-transformers/all-MiniLM-L6-v2',
'provider_resource_id': 'all-MiniLM-L6-v2', 'provider_id': 'sentence-transformers', 'type': 'model', 'owner': None, 'source':
'listed_from_provider', 'metadata': {'embedding_dimension': 384}, 'model_type': 'embedding'}
INFO 2025-09-10 14:51:48,592 console_span_processor:39 telemetry: 21:51:48.589 [END] ModelsRoutingTable.get_provider_impl [StatusCode.OK] (0.19ms)
INFO 2025-09-10 14:51:48,592 console_span_processor:48 telemetry: output:
<llama_stack.providers.inline.inference.sentence_transformers.sentence_transformers.SentenceTransformersInferenceImpl object at 0x158e83350>
INFO 2025-09-10 14:51:48,601 console_span_processor:39 telemetry: 21:51:48.594 [END] ModelsRoutingTable.get_model [StatusCode.OK] (0.16ms)
INFO 2025-09-10 14:51:48,602 console_span_processor:48 telemetry: output: {'identifier': 'sentence-transformers/all-MiniLM-L6-v2',
'provider_resource_id': 'all-MiniLM-L6-v2', 'provider_id': 'sentence-transformers', 'type': 'model', 'owner': None, 'source':
'listed_from_provider', 'metadata': {'embedding_dimension': 384}, 'model_type': 'embedding'}
INFO 2025-09-10 14:51:48,605 console_span_processor:39 telemetry: 21:51:48.603 [END] InferenceRouter.openai_embeddings [StatusCode.OK] (21.97ms)
INFO 2025-09-10 14:51:48,606 console_span_processor:48 telemetry: output: {'object': 'list', 'data': [{'object': 'embedding', 'embedding':
[0.0018660365603864193, -0.008432421833276749, -0.009860510006546974, 0.07527908682823181, -0.008166038431227207, -0.08819602429866791,
-0.025107912719249725, -0.029266025871038437, 0.014401894062757492, 0.06447950005531311, 0.04112009331583977, -0.04028748720884323,
-0.02221696823835373, -0.009235711768269539, -0.04810388386249542, -0.02784842811524868, 0.016442419961094856, -0.07583750039339066,
-0.06627479195594788, 0.01860453188419342, 0.0008918081293813884, 0.011179491877555847, -0.048671603202819824, -0.021989954635500908,
0.04990514740347862, -0.003409573109820485, -0.06727275997400284, -0.054264623671770096, -0.022502778097987175, -0.03865018114447594,
-0.0471607930958271, 0.01671769842505455, 0.024404950439929962, 0.09877222776412964, -0.01660928875207901, 0.01298862136900425,
0.02916400320827961, -0.0722617655992508, 0.041335687041282654, -0.037857454270124435, -0.02524978667497635, -0.010434110648930073, -0....
INFO 2025-09-10 14:51:48,609 console_span_processor:39 telemetry: 21:51:48.607 [END] FaissVectorIOAdapter.query_chunks [StatusCode.OK] (26.56ms)
INFO 2025-09-10 14:51:48,609 console_span_processor:48 telemetry: output: {'chunks': [{'content': 'Acme ships globally in 3-5 business days.',
'metadata': {'document_id': 'file-489db9aae0424745960e3408ff0f477f', 'token_count': 12, 'metadata_token_count': 1}, 'embedding':
[-0.012346820905804634, -0.04591671749949455, 0.00545357633382082, 0.0767817348241806, -0.01030217856168747, -0.07128783315420151,
-0.047789815813302994, -0.0042580426670610905, -0.08333089202642441, 0.03493816778063774, 0.03678377717733383, -0.022125769406557083,
-0.001785362372174859, 0.03860057145357132, 0.017692940309643745, -0.011320478282868862, 0.020480643957853317, -0.14444826543331146,
-0.03509785607457161, -0.08347956091165543, 0.01723267324268818, -0.020868107676506042, -0.04816542565822601, -0.04063615947961807,
-0.02612607553601265, -0.06816241890192032, -0.021907860413193703, -0.05328420177102089, 0.0035953382030129433, -0.060775868594646454,
-0.07895789295434952, 0.08725343644618988, -0.004096562508493662, 0.07713106274604797, 0.04764929413795471, 0.03390089422464371, -0.03...
INFO 2025-09-10 14:51:48,614 console_span_processor:39 telemetry: 21:51:48.612 [END] VectorDBsRoutingTable.openai_search_vector_store
[StatusCode.OK] (31.13ms)
INFO 2025-09-10 14:51:48,615 console_span_processor:48 telemetry: output: {'object': 'vector_store.search_results.page', 'search_query': 'How
long does shipping take?', 'data': [{'file_id': '', 'filename': '', 'score': 1.0150761400159014, 'attributes': {'document_id':
'file-489db9aae0424745960e3408ff0f477f', 'token_count': 12.0, 'metadata_token_count': 1.0}, 'content': [{'type': 'text', 'text': 'Acme ships
globally in 3-5 business days.'}]}], 'has_more': False, 'next_page': None}
INFO 2025-09-10 14:51:48,626 console_span_processor:39 telemetry: 21:51:48.616 [END] VectorIORouter.openai_search_vector_store [StatusCode.OK]
(35.85ms)
INFO 2025-09-10 14:51:48,627 console_span_processor:48 telemetry: output: {'object': 'vector_store.search_results.page', 'search_query': 'How
long does shipping take?', 'data': [{'file_id': '', 'filename': '', 'score': 1.0150761400159014, 'attributes': {'document_id':
'file-489db9aae0424745960e3408ff0f477f', 'token_count': 12.0, 'metadata_token_count': 1.0}, 'content': [{'type': 'text', 'text': 'Acme ships
globally in 3-5 business days.'}]}], 'has_more': False, 'next_page': None}
INFO 2025-09-10 14:51:48,635 console_span_processor:39 telemetry: 21:51:48.632 [END] /v1/openai/v1/vector_stores/{vector_store_id}/search
[StatusCode.OK] (52.29ms)
INFO 2025-09-10 14:51:48,636 console_span_processor:48 telemetry: raw_path:
/v1/openai/v1/vector_stores/vs_dab05212-db05-402c-91ef-57e41797406b/search
INFO 2025-09-10 14:51:48,636 console_span_processor:62 telemetry: 21:51:48.299 [INFO] 127.0.0.1:56904 - "POST
/v1/openai/v1/vector_stores/vs_dab05212-db05-402c-91ef-57e41797406b/search HTTP/1.1" 200
INFO 2025-09-10 14:51:48,637 console_span_processor:28 telemetry: 21:51:48.637 [START] /v1/openai/v1/chat/completions
INFO 2025-09-10 14:51:48,640 console_span_processor:39 telemetry: 21:51:48.638 [END] ModelsRoutingTable.get_model [StatusCode.OK] (0.15ms)
INFO 2025-09-10 14:51:48,641 console_span_processor:48 telemetry: output: {'identifier': 'together/meta-llama/Llama-3.3-70B-Instruct-Turbo',
'provider_resource_id': 'meta-llama/Llama-3.3-70B-Instruct-Turbo', 'provider_id': 'together', 'type': 'model', 'owner': None, 'source':
'listed_from_provider', 'metadata': {}, 'model_type': 'llm'}
INFO 2025-09-10 14:51:48,643 console_span_processor:39 telemetry: 21:51:48.642 [END] ModelsRoutingTable.get_provider_impl [StatusCode.OK] (0.16ms)
INFO 2025-09-10 14:51:48,643 console_span_processor:48 telemetry: output:
<llama_stack.providers.remote.inference.together.together.TogetherInferenceAdapter object at 0x137069220>
INFO 2025-09-10 14:51:48,653 console_span_processor:39 telemetry: 21:51:48.645 [END] ModelsRoutingTable.get_model [StatusCode.OK] (0.14ms)
INFO 2025-09-10 14:51:48,653 console_span_processor:48 telemetry: output: {'identifier': 'together/meta-llama/Llama-3.3-70B-Instruct-Turbo',
'provider_resource_id': 'meta-llama/Llama-3.3-70B-Instruct-Turbo', 'provider_id': 'together', 'type': 'model', 'owner': None, 'source':
'listed_from_provider', 'metadata': {}, 'model_type': 'llm'}
INFO 2025-09-10 14:51:53,149 console_span_processor:39 telemetry: 21:51:53.146 [END] TogetherInferenceAdapter.openai_chat_completion
[StatusCode.OK] (4501.83ms)
INFO 2025-09-10 14:51:53,150 console_span_processor:48 telemetry: output: {'id': 'oAitaoX-4YNCb4-97d22618bd651584', 'choices':
[{'finish_reason': 'stop', 'index': 0, 'logprobs': None, 'message': {'content': 'Thought: I should try to use the Llama Stack Vector Store
RAG tool again with a different input to see if I can get a relevant result.\n\nAction: Llama Stack Vector Store RAG tool\nAction Input:
{"query": "shipping time", "vector_store_id": "vs_dab05212-db05-402c-91ef-57e41797406b", "top_k": 1}', 'refusal': None, 'role': 'assistant',
'annotations': None, 'audio': None, 'function_call': None, 'tool_calls': []}, 'seed': 7090030016801882000}], 'created': 1757541108, 'model':
'meta-llama/Llama-3.3-70B-Instruct-Turbo', 'object': 'chat.completion', 'service_tier': None, 'system_fingerprint': None, 'usage':
{'completion_tokens': 89, 'prompt_tokens': 1494, 'total_tokens': 1583, 'completion_tokens_details': None, 'prompt_tokens_details': None,
'cached_tokens': 0}, 'prompt': []}
INFO 2025-09-10 14:51:53,153 uvicorn.access:473 uncategorized: ::1:56900 - "POST /v1/openai/v1/chat/completions HTTP/1.1" 200
INFO 2025-09-10 14:51:53,157 console_span_processor:39 telemetry: 21:51:53.153 [END] InferenceRouter.openai_chat_completion [StatusCode.OK]
(4515.32ms)
INFO 2025-09-10 14:51:53,158 console_span_processor:48 telemetry: output: {'id': 'oAitaoX-4YNCb4-97d22618bd651584', 'choices':
[{'finish_reason': 'stop', 'index': 0, 'logprobs': None, 'message': {'content': 'Thought: I should try to use the Llama Stack Vector Store
RAG tool again with a different input to see if I can get a relevant result.\n\nAction: Llama Stack Vector Store RAG tool\nAction Input:
{"query": "shipping time", "vector_store_id": "vs_dab05212-db05-402c-91ef-57e41797406b", "top_k": 1}', 'refusal': None, 'role': 'assistant',
'annotations': None, 'audio': None, 'function_call': None, 'tool_calls': None}, 'seed': 7090030016801882000}], 'created': 1757541108,
'model': 'meta-llama/Llama-3.3-70B-Instruct-Turbo', 'object': 'chat.completion', 'service_tier': None, 'system_fingerprint': None, 'usage':
{'completion_tokens': 89, 'prompt_tokens': 1494, 'total_tokens': 1583, 'completion_tokens_details': None, 'prompt_tokens_details': None,
'cached_tokens': 0}, 'prompt': [], 'metrics': [{'trace_id': 'dd10581530aada6b43c22d2c221fafe0', 'span_id': 'ba2f798e...
INFO 2025-09-10 14:51:53,159 console_span_processor:62 telemetry: 21:51:53.152 [INFO] metric.prompt_tokens
INFO 2025-09-10 14:51:53,160 console_span_processor:67 telemetry: value: 1494
INFO 2025-09-10 14:51:53,160 console_span_processor:67 telemetry: unit: tokens
INFO 2025-09-10 14:51:53,160 console_span_processor:67 telemetry: model_id: together/meta-llama/Llama-3.3-70B-Instruct-Turbo
INFO 2025-09-10 14:51:53,161 console_span_processor:67 telemetry: provider_id: together
INFO 2025-09-10 14:51:53,161 console_span_processor:62 telemetry: 21:51:53.152 [INFO] metric.completion_tokens
INFO 2025-09-10 14:51:53,162 console_span_processor:67 telemetry: value: 89
INFO 2025-09-10 14:51:53,162 console_span_processor:67 telemetry: unit: tokens
INFO 2025-09-10 14:51:53,163 console_span_processor:67 telemetry: model_id: together/meta-llama/Llama-3.3-70B-Instruct-Turbo
INFO 2025-09-10 14:51:53,165 console_span_processor:67 telemetry: provider_id: together
INFO 2025-09-10 14:51:53,166 console_span_processor:62 telemetry: 21:51:53.152 [INFO] metric.total_tokens
INFO 2025-09-10 14:51:53,166 console_span_processor:67 telemetry: value: 1583
INFO 2025-09-10 14:51:53,167 console_span_processor:67 telemetry: unit: tokens
INFO 2025-09-10 14:51:53,167 console_span_processor:67 telemetry: model_id: together/meta-llama/Llama-3.3-70B-Instruct-Turbo
INFO 2025-09-10 14:51:53,167 console_span_processor:67 telemetry: provider_id: together
INFO 2025-09-10 14:51:53,183 console_span_processor:39 telemetry: 21:51:53.169 [END] /v1/openai/v1/chat/completions [StatusCode.OK] (4532.11ms)
INFO 2025-09-10 14:51:53,184 console_span_processor:48 telemetry: raw_path: /v1/openai/v1/chat/completions
INFO 2025-09-10 14:51:53,184 console_span_processor:62 telemetry: 21:51:53.153 [INFO] ::1:56900 - "POST /v1/openai/v1/chat/completions HTTP/1.1"
200
INFO 2025-09-10 14:51:53,185 console_span_processor:28 telemetry: 21:51:53.185 [START] /v1/openai/v1/vector_stores/{vector_store_id}/search
INFO 2025-09-10 14:51:53,212 console_span_processor:39 telemetry: 21:51:53.187 [END] ModelsRoutingTable.get_model [StatusCode.OK] (0.15ms)
INFO 2025-09-10 14:51:53,213 console_span_processor:48 telemetry: output: {'identifier': 'sentence-transformers/all-MiniLM-L6-v2',
'provider_resource_id': 'all-MiniLM-L6-v2', 'provider_id': 'sentence-transformers', 'type': 'model', 'owner': None, 'source':
'listed_from_provider', 'metadata': {'embedding_dimension': 384}, 'model_type': 'embedding'}
INFO 2025-09-10 14:51:53,232 console_span_processor:39 telemetry: 21:51:53.214 [END] ModelsRoutingTable.get_provider_impl [StatusCode.OK] (0.34ms)
INFO 2025-09-10 14:51:53,233 console_span_processor:48 telemetry: output:
<llama_stack.providers.inline.inference.sentence_transformers.sentence_transformers.SentenceTransformersInferenceImpl object at 0x158e83350>
INFO 2025-09-10 14:51:53,245 console_span_processor:39 telemetry: 21:51:53.234 [END] ModelsRoutingTable.get_model [StatusCode.OK] (0.18ms)
INFO 2025-09-10 14:51:53,246 console_span_processor:48 telemetry: output: {'identifier': 'sentence-transformers/all-MiniLM-L6-v2',
'provider_resource_id': 'all-MiniLM-L6-v2', 'provider_id': 'sentence-transformers', 'type': 'model', 'owner': None, 'source':
'listed_from_provider', 'metadata': {'embedding_dimension': 384}, 'model_type': 'embedding'}
INFO 2025-09-10 14:51:54,285 uvicorn.access:473 uncategorized: 127.0.0.1:56904 - "POST
/v1/openai/v1/vector_stores/vs_dab05212-db05-402c-91ef-57e41797406b/search HTTP/1.1" 200
INFO 2025-09-10 14:51:54,305 console_span_processor:39 telemetry: 21:51:54.289 [END] InferenceRouter.openai_embeddings [StatusCode.OK] (1102.92ms)
INFO 2025-09-10 14:51:54,306 console_span_processor:48 telemetry: output: {'object': 'list', 'data': [{'object': 'embedding', 'embedding':
[-0.03642994910478592, -0.005766282323747873, -0.028219470754265785, 0.05074828490614891, 0.023913491517305374, -0.056256189942359924,
0.0007000428740866482, 0.02684980072081089, 0.005779022816568613, 0.0757804811000824, 0.02611902356147766, -0.04347166419029236,
-0.07426290959119797, 0.0033695625606924295, -0.03395790979266167, -0.018579166382551193, 0.031040646135807037, -0.06419522315263748,
-0.11664945632219315, 0.011454297229647636, 0.00203332188539207, 0.00506530050188303, -0.05711820721626282, -0.006884930655360222,
0.0057834964245557785, 0.005828470923006535, -0.05446002259850502, -0.032767001539468765, -0.023773472756147385, -0.046458274126052856,
-0.0579390786588192, 0.052776239812374115, -0.017773080617189407, 0.07396063208580017, -0.007082517724484205, -0.006252078805118799,
0.06502724438905716, -0.04769469425082207, 0.08519715070724487, -0.04995475336909294, -0.02040106989443302, -0.024357719346880913, -0....
INFO 2025-09-10 14:51:54,318 console_span_processor:39 telemetry: 21:51:54.308 [END] FaissVectorIOAdapter.query_chunks [StatusCode.OK] (1121.71ms)
INFO 2025-09-10 14:51:54,319 console_span_processor:48 telemetry: output: {'chunks': [{'content': 'Acme ships globally in 3-5 business days.',
'metadata': {'document_id': 'file-489db9aae0424745960e3408ff0f477f', 'token_count': 12, 'metadata_token_count': 1}, 'embedding':
[-0.012346820905804634, -0.04591671749949455, 0.00545357633382082, 0.0767817348241806, -0.01030217856168747, -0.07128783315420151,
-0.047789815813302994, -0.0042580426670610905, -0.08333089202642441, 0.03493816778063774, 0.03678377717733383, -0.022125769406557083,
-0.001785362372174859, 0.03860057145357132, 0.017692940309643745, -0.011320478282868862, 0.020480643957853317, -0.14444826543331146,
-0.03509785607457161, -0.08347956091165543, 0.01723267324268818, -0.020868107676506042, -0.04816542565822601, -0.04063615947961807,
-0.02612607553601265, -0.06816241890192032, -0.021907860413193703, -0.05328420177102089, 0.0035953382030129433, -0.060775868594646454,
-0.07895789295434952, 0.08725343644618988, -0.004096562508493662, 0.07713106274604797, 0.04764929413795471, 0.03390089422464371, -0.03...
INFO 2025-09-10 14:51:54,322 uvicorn.access:473 uncategorized: 127.0.0.1:56904 - "POST
/v1/openai/v1/vector_stores/vs_dab05212-db05-402c-91ef-57e41797406b/search HTTP/1.1" 200
INFO 2025-09-10 14:51:54,342 console_span_processor:39 telemetry: 21:51:54.324 [END] VectorDBsRoutingTable.openai_search_vector_store
[StatusCode.OK] (1137.83ms)
INFO 2025-09-10 14:51:54,342 console_span_processor:48 telemetry: output: {'object': 'vector_store.search_results.page', 'search_query':
'shipping time', 'data': [{'file_id': '', 'filename': '', 'score': 0.9984249880472625, 'attributes': {'document_id':
'file-489db9aae0424745960e3408ff0f477f', 'token_count': 12.0, 'metadata_token_count': 1.0}, 'content': [{'type': 'text', 'text': 'Acme ships
globally in 3-5 business days.'}]}], 'has_more': False, 'next_page': None}
INFO 2025-09-10 14:51:54,351 console_span_processor:39 telemetry: 21:51:54.344 [END] VectorIORouter.openai_search_vector_store [StatusCode.OK]
(1157.96ms)
INFO 2025-09-10 14:51:54,353 uvicorn.access:473 uncategorized: 127.0.0.1:56904 - "POST
/v1/openai/v1/vector_stores/vs_dab05212-db05-402c-91ef-57e41797406b/search HTTP/1.1" 200
INFO 2025-09-10 14:51:54,353 console_span_processor:48 telemetry: output: {'object': 'vector_store.search_results.page', 'search_query':
'shipping time', 'data': [{'file_id': '', 'filename': '', 'score': 0.9984249880472625, 'attributes': {'document_id':
'file-489db9aae0424745960e3408ff0f477f', 'token_count': 12.0, 'metadata_token_count': 1.0}, 'content': [{'type': 'text', 'text': 'Acme ships
globally in 3-5 business days.'}]}], 'has_more': False, 'next_page': None}
INFO 2025-09-10 14:51:54,360 console_span_processor:39 telemetry: 21:51:54.355 [END] /v1/openai/v1/vector_stores/{vector_store_id}/search
[StatusCode.OK] (1170.42ms)
INFO 2025-09-10 14:51:54,360 console_span_processor:48 telemetry: raw_path:
/v1/openai/v1/vector_stores/vs_dab05212-db05-402c-91ef-57e41797406b/search
INFO 2025-09-10 14:51:54,361 console_span_processor:62 telemetry: 21:51:54.293 [INFO] 127.0.0.1:56904 - "POST
/v1/openai/v1/vector_stores/vs_dab05212-db05-402c-91ef-57e41797406b/search HTTP/1.1" 200
INFO 2025-09-10 14:51:54,362 console_span_processor:28 telemetry: 21:51:54.362 [START] /v1/openai/v1/vector_stores/{vector_store_id}/search
INFO 2025-09-10 14:51:54,366 console_span_processor:39 telemetry: 21:51:54.364 [END] ModelsRoutingTable.get_model [StatusCode.OK] (0.19ms)
INFO 2025-09-10 14:51:54,367 console_span_processor:48 telemetry: output: {'identifier': 'sentence-transformers/all-MiniLM-L6-v2',
'provider_resource_id': 'all-MiniLM-L6-v2', 'provider_id': 'sentence-transformers', 'type': 'model', 'owner': None, 'source':
'listed_from_provider', 'metadata': {'embedding_dimension': 384}, 'model_type': 'embedding'}
INFO 2025-09-10 14:51:54,373 uvicorn.access:473 uncategorized: 127.0.0.1:56904 - "POST
/v1/openai/v1/vector_stores/vs_dab05212-db05-402c-91ef-57e41797406b/search HTTP/1.1" 200
INFO 2025-09-10 14:51:54,380 console_span_processor:39 telemetry: 21:51:54.369 [END] ModelsRoutingTable.get_provider_impl [StatusCode.OK] (0.28ms)
INFO 2025-09-10 14:51:54,381 console_span_processor:48 telemetry: output:
<llama_stack.providers.inline.inference.sentence_transformers.sentence_transformers.SentenceTransformersInferenceImpl object at 0x158e83350>
INFO 2025-09-10 14:51:54,389 console_span_processor:39 telemetry: 21:51:54.386 [END] ModelsRoutingTable.get_model [StatusCode.OK] (0.21ms)
INFO 2025-09-10 14:51:54,390 console_span_processor:48 telemetry: output: {'identifier': 'sentence-transformers/all-MiniLM-L6-v2',
'provider_resource_id': 'all-MiniLM-L6-v2', 'provider_id': 'sentence-transformers', 'type': 'model', 'owner': None, 'source':
'listed_from_provider', 'metadata': {'embedding_dimension': 384}, 'model_type': 'embedding'}
INFO 2025-09-10 14:51:54,393 console_span_processor:39 telemetry: 21:51:54.391 [END] InferenceRouter.openai_embeddings [StatusCode.OK] (26.85ms)
INFO 2025-09-10 14:51:54,394 console_span_processor:48 telemetry: output: {'object': 'list', 'data': [{'object': 'embedding', 'embedding':
[-0.03642994910478592, -0.005766282323747873, -0.028219470754265785, 0.05074828490614891, 0.023913491517305374, -0.056256189942359924,
0.0007000428740866482, 0.02684980072081089, 0.005779022816568613, 0.0757804811000824, 0.02611902356147766, -0.04347166419029236,
-0.07426290959119797, 0.0033695625606924295, -0.03395790979266167, -0.018579166382551193, 0.031040646135807037, -0.06419522315263748,
-0.11664945632219315, 0.011454297229647636, 0.00203332188539207, 0.00506530050188303, -0.05711820721626282, -0.006884930655360222,
0.0057834964245557785, 0.005828470923006535, -0.05446002259850502, -0.032767001539468765, -0.023773472756147385, -0.046458274126052856,
-0.0579390786588192, 0.052776239812374115, -0.017773080617189407, 0.07396063208580017, -0.007082517724484205, -0.006252078805118799,
0.06502724438905716, -0.04769469425082207, 0.08519715070724487, -0.04995475336909294, -0.02040106989443302, -0.024357719346880913, -0....
INFO 2025-09-10 14:51:54,425 uvicorn.access:473 uncategorized: 127.0.0.1:56904 - "POST
/v1/openai/v1/vector_stores/vs_dab05212-db05-402c-91ef-57e41797406b/search HTTP/1.1" 200
INFO 2025-09-10 14:51:54,438 console_span_processor:39 telemetry: 21:51:54.411 [END] FaissVectorIOAdapter.query_chunks [StatusCode.OK] (47.55ms)
INFO 2025-09-10 14:51:54,440 console_span_processor:48 telemetry: output: {'chunks': [{'content': 'Acme ships globally in 3-5 business days.',
'metadata': {'document_id': 'file-489db9aae0424745960e3408ff0f477f', 'token_count': 12, 'metadata_token_count': 1}, 'embedding':
[-0.012346820905804634, -0.04591671749949455, 0.00545357633382082, 0.0767817348241806, -0.01030217856168747, -0.07128783315420151,
-0.047789815813302994, -0.0042580426670610905, -0.08333089202642441, 0.03493816778063774, 0.03678377717733383, -0.022125769406557083,
-0.001785362372174859, 0.03860057145357132, 0.017692940309643745, -0.011320478282868862, 0.020480643957853317, -0.14444826543331146,
-0.03509785607457161, -0.08347956091165543, 0.01723267324268818, -0.020868107676506042, -0.04816542565822601, -0.04063615947961807,
-0.02612607553601265, -0.06816241890192032, -0.021907860413193703, -0.05328420177102089, 0.0035953382030129433, -0.060775868594646454,
-0.07895789295434952, 0.08725343644618988, -0.004096562508493662, 0.07713106274604797, 0.04764929413795471, 0.03390089422464371, -0.03...
INFO 2025-09-10 14:51:54,445 console_span_processor:39 telemetry: 21:51:54.442 [END] VectorDBsRoutingTable.openai_search_vector_store
[StatusCode.OK] (78.94ms)
INFO 2025-09-10 14:51:54,446 console_span_processor:48 telemetry: output: {'object': 'vector_store.search_results.page', 'search_query':
'shipping time', 'data': [{'file_id': '', 'filename': '', 'score': 0.9984249880472625, 'attributes': {'document_id':
'file-489db9aae0424745960e3408ff0f477f', 'token_count': 12.0, 'metadata_token_count': 1.0}, 'content': [{'type': 'text', 'text': 'Acme ships
globally in 3-5 business days.'}]}], 'has_more': False, 'next_page': None}
INFO 2025-09-10 14:51:54,457 uvicorn.access:473 uncategorized: 127.0.0.1:56904 - "POST
/v1/openai/v1/vector_stores/vs_dab05212-db05-402c-91ef-57e41797406b/search HTTP/1.1" 200
INFO 2025-09-10 14:51:54,457 console_span_processor:39 telemetry: 21:51:54.452 [END] VectorIORouter.openai_search_vector_store [StatusCode.OK]
(89.01ms)
INFO 2025-09-10 14:51:54,459 console_span_processor:48 telemetry: output: {'object': 'vector_store.search_results.page', 'search_query':
'shipping time', 'data': [{'file_id': '', 'filename': '', 'score': 0.9984249880472625, 'attributes': {'document_id':
'file-489db9aae0424745960e3408ff0f477f', 'token_count': 12.0, 'metadata_token_count': 1.0}, 'content': [{'type': 'text', 'text': 'Acme ships
globally in 3-5 business days.'}]}], 'has_more': False, 'next_page': None}
INFO 2025-09-10 14:51:54,468 console_span_processor:39 telemetry: 21:51:54.463 [END] /v1/openai/v1/vector_stores/{vector_store_id}/search
[StatusCode.OK] (100.62ms)
INFO 2025-09-10 14:51:54,469 console_span_processor:48 telemetry: raw_path:
/v1/openai/v1/vector_stores/vs_dab05212-db05-402c-91ef-57e41797406b/search
INFO 2025-09-10 14:51:54,469 console_span_processor:62 telemetry: 21:51:54.323 [INFO] 127.0.0.1:56904 - "POST
/v1/openai/v1/vector_stores/vs_dab05212-db05-402c-91ef-57e41797406b/search HTTP/1.1" 200
INFO 2025-09-10 14:51:54,471 console_span_processor:28 telemetry: 21:51:54.471 [START] /v1/openai/v1/vector_stores/{vector_store_id}/search
INFO 2025-09-10 14:51:54,489 console_span_processor:39 telemetry: 21:51:54.474 [END] ModelsRoutingTable.get_model [StatusCode.OK] (0.26ms)
INFO 2025-09-10 14:51:54,490 console_span_processor:48 telemetry: output: {'identifier': 'sentence-transformers/all-MiniLM-L6-v2',
'provider_resource_id': 'all-MiniLM-L6-v2', 'provider_id': 'sentence-transformers', 'type': 'model', 'owner': None, 'source':
'listed_from_provider', 'metadata': {'embedding_dimension': 384}, 'model_type': 'embedding'}
INFO 2025-09-10 14:51:54,502 console_span_processor:39 telemetry: 21:51:54.495 [END] ModelsRoutingTable.get_provider_impl [StatusCode.OK] (2.67ms)
INFO 2025-09-10 14:51:54,504 console_span_processor:48 telemetry: output:
<llama_stack.providers.inline.inference.sentence_transformers.sentence_transformers.SentenceTransformersInferenceImpl object at 0x158e83350>
INFO 2025-09-10 14:51:54,524 console_span_processor:39 telemetry: 21:51:54.514 [END] ModelsRoutingTable.get_model [StatusCode.OK] (0.79ms)
INFO 2025-09-10 14:51:54,526 console_span_processor:48 telemetry: output: {'identifier': 'sentence-transformers/all-MiniLM-L6-v2',
'provider_resource_id': 'all-MiniLM-L6-v2', 'provider_id': 'sentence-transformers', 'type': 'model', 'owner': None, 'source':
'listed_from_provider', 'metadata': {'embedding_dimension': 384}, 'model_type': 'embedding'}
INFO 2025-09-10 14:51:54,529 console_span_processor:39 telemetry: 21:51:54.527 [END] InferenceRouter.openai_embeddings [StatusCode.OK] (53.95ms)
INFO 2025-09-10 14:51:54,537 console_span_processor:48 telemetry: output: {'object': 'list', 'data': [{'object': 'embedding', 'embedding':
[-0.03642994910478592, -0.005766282323747873, -0.028219470754265785, 0.05074828490614891, 0.023913491517305374, -0.056256189942359924,
0.0007000428740866482, 0.02684980072081089, 0.005779022816568613, 0.0757804811000824, 0.02611902356147766, -0.04347166419029236,
-0.07426290959119797, 0.0033695625606924295, -0.03395790979266167, -0.018579166382551193, 0.031040646135807037, -0.06419522315263748,
-0.11664945632219315, 0.011454297229647636, 0.00203332188539207, 0.00506530050188303, -0.05711820721626282, -0.006884930655360222,
0.0057834964245557785, 0.005828470923006535, -0.05446002259850502, -0.032767001539468765, -0.023773472756147385, -0.046458274126052856,
-0.0579390786588192, 0.052776239812374115, -0.017773080617189407, 0.07396063208580017, -0.007082517724484205, -0.006252078805118799,
0.06502724438905716, -0.04769469425082207, 0.08519715070724487, -0.04995475336909294, -0.02040106989443302, -0.024357719346880913, -0....
INFO 2025-09-10 14:51:54,550 console_span_processor:39 telemetry: 21:51:54.542 [END] FaissVectorIOAdapter.query_chunks [StatusCode.OK] (68.87ms)
INFO 2025-09-10 14:51:54,551 console_span_processor:48 telemetry: output: {'chunks': [{'content': 'Acme ships globally in 3-5 business days.',
'metadata': {'document_id': 'file-489db9aae0424745960e3408ff0f477f', 'token_count': 12, 'metadata_token_count': 1}, 'embedding':
[-0.012346820905804634, -0.04591671749949455, 0.00545357633382082, 0.0767817348241806, -0.01030217856168747, -0.07128783315420151,
-0.047789815813302994, -0.0042580426670610905, -0.08333089202642441, 0.03493816778063774, 0.03678377717733383, -0.022125769406557083,
-0.001785362372174859, 0.03860057145357132, 0.017692940309643745, -0.011320478282868862, 0.020480643957853317, -0.14444826543331146,
-0.03509785607457161, -0.08347956091165543, 0.01723267324268818, -0.020868107676506042, -0.04816542565822601, -0.04063615947961807,
-0.02612607553601265, -0.06816241890192032, -0.021907860413193703, -0.05328420177102089, 0.0035953382030129433, -0.060775868594646454,
-0.07895789295434952, 0.08725343644618988, -0.004096562508493662, 0.07713106274604797, 0.04764929413795471, 0.03390089422464371, -0.03...
INFO 2025-09-10 14:51:54,557 console_span_processor:39 telemetry: 21:51:54.554 [END] VectorDBsRoutingTable.openai_search_vector_store
[StatusCode.OK] (81.34ms)
INFO 2025-09-10 14:51:54,559 console_span_processor:48 telemetry: output: {'object': 'vector_store.search_results.page', 'search_query':
'shipping time', 'data': [{'file_id': '', 'filename': '', 'score': 0.9984249880472625, 'attributes': {'document_id':
'file-489db9aae0424745960e3408ff0f477f', 'token_count': 12.0, 'metadata_token_count': 1.0}, 'content': [{'type': 'text', 'text': 'Acme ships
globally in 3-5 business days.'}]}], 'has_more': False, 'next_page': None}
INFO 2025-09-10 14:51:54,573 console_span_processor:39 telemetry: 21:51:54.564 [END] VectorIORouter.openai_search_vector_store [StatusCode.OK]
(91.94ms)
INFO 2025-09-10 14:51:54,574 console_span_processor:48 telemetry: output: {'object': 'vector_store.search_results.page', 'search_query':
'shipping time', 'data': [{'file_id': '', 'filename': '', 'score': 0.9984249880472625, 'attributes': {'document_id':
'file-489db9aae0424745960e3408ff0f477f', 'token_count': 12.0, 'metadata_token_count': 1.0}, 'content': [{'type': 'text', 'text': 'Acme ships
globally in 3-5 business days.'}]}], 'has_more': False, 'next_page': None}
INFO 2025-09-10 14:51:54,583 console_span_processor:39 telemetry: 21:51:54.575 [END] /v1/openai/v1/vector_stores/{vector_store_id}/search
[StatusCode.OK] (104.63ms)
INFO 2025-09-10 14:51:54,584 console_span_processor:48 telemetry: raw_path:
/v1/openai/v1/vector_stores/vs_dab05212-db05-402c-91ef-57e41797406b/search
INFO 2025-09-10 14:51:54,584 console_span_processor:62 telemetry: 21:51:54.354 [INFO] 127.0.0.1:56904 - "POST
/v1/openai/v1/vector_stores/vs_dab05212-db05-402c-91ef-57e41797406b/search HTTP/1.1" 200
INFO 2025-09-10 14:51:54,585 console_span_processor:28 telemetry: 21:51:54.585 [START] /v1/openai/v1/vector_stores/{vector_store_id}/search
INFO 2025-09-10 14:51:54,591 console_span_processor:39 telemetry: 21:51:54.589 [END] ModelsRoutingTable.get_model [StatusCode.OK] (0.17ms)
INFO 2025-09-10 14:51:54,591 console_span_processor:48 telemetry: output: {'identifier': 'sentence-transformers/all-MiniLM-L6-v2',
'provider_resource_id': 'all-MiniLM-L6-v2', 'provider_id': 'sentence-transformers', 'type': 'model', 'owner': None, 'source':
'listed_from_provider', 'metadata': {'embedding_dimension': 384}, 'model_type': 'embedding'}
INFO 2025-09-10 14:51:54,594 console_span_processor:39 telemetry: 21:51:54.592 [END] ModelsRoutingTable.get_provider_impl [StatusCode.OK] (0.16ms)
INFO 2025-09-10 14:51:54,595 console_span_processor:48 telemetry: output:
<llama_stack.providers.inline.inference.sentence_transformers.sentence_transformers.SentenceTransformersInferenceImpl object at 0x158e83350>
INFO 2025-09-10 14:51:54,599 console_span_processor:39 telemetry: 21:51:54.596 [END] ModelsRoutingTable.get_model [StatusCode.OK] (0.16ms)
INFO 2025-09-10 14:51:54,599 console_span_processor:48 telemetry: output: {'identifier': 'sentence-transformers/all-MiniLM-L6-v2',
'provider_resource_id': 'all-MiniLM-L6-v2', 'provider_id': 'sentence-transformers', 'type': 'model', 'owner': None, 'source':
'listed_from_provider', 'metadata': {'embedding_dimension': 384}, 'model_type': 'embedding'}
INFO 2025-09-10 14:51:54,604 console_span_processor:39 telemetry: 21:51:54.602 [END] InferenceRouter.openai_embeddings [StatusCode.OK] (13.16ms)
INFO 2025-09-10 14:51:54,605 console_span_processor:48 telemetry: output: {'object': 'list', 'data': [{'object': 'embedding', 'embedding':
[-0.03642994910478592, -0.005766282323747873, -0.028219470754265785, 0.05074828490614891, 0.023913491517305374, -0.056256189942359924,
0.0007000428740866482, 0.02684980072081089, 0.005779022816568613, 0.0757804811000824, 0.02611902356147766, -0.04347166419029236,
-0.07426290959119797, 0.0033695625606924295, -0.03395790979266167, -0.018579166382551193, 0.031040646135807037, -0.06419522315263748,
-0.11664945632219315, 0.011454297229647636, 0.00203332188539207, 0.00506530050188303, -0.05711820721626282, -0.006884930655360222,
0.0057834964245557785, 0.005828470923006535, -0.05446002259850502, -0.032767001539468765, -0.023773472756147385, -0.046458274126052856,
-0.0579390786588192, 0.052776239812374115, -0.017773080617189407, 0.07396063208580017, -0.007082517724484205, -0.006252078805118799,
0.06502724438905716, -0.04769469425082207, 0.08519715070724487, -0.04995475336909294, -0.02040106989443302, -0.024357719346880913, -0....
INFO 2025-09-10 14:51:54,627 console_span_processor:39 telemetry: 21:51:54.621 [END] FaissVectorIOAdapter.query_chunks [StatusCode.OK] (32.66ms)
INFO 2025-09-10 14:51:54,634 console_span_processor:48 telemetry: output: {'chunks': [{'content': 'Acme ships globally in 3-5 business days.',
'metadata': {'document_id': 'file-489db9aae0424745960e3408ff0f477f', 'token_count': 12, 'metadata_token_count': 1}, 'embedding':
[-0.012346820905804634, -0.04591671749949455, 0.00545357633382082, 0.0767817348241806, -0.01030217856168747, -0.07128783315420151,
-0.047789815813302994, -0.0042580426670610905, -0.08333089202642441, 0.03493816778063774, 0.03678377717733383, -0.022125769406557083,
-0.001785362372174859, 0.03860057145357132, 0.017692940309643745, -0.011320478282868862, 0.020480643957853317, -0.14444826543331146,
-0.03509785607457161, -0.08347956091165543, 0.01723267324268818, -0.020868107676506042, -0.04816542565822601, -0.04063615947961807,
-0.02612607553601265, -0.06816241890192032, -0.021907860413193703, -0.05328420177102089, 0.0035953382030129433, -0.060775868594646454,
-0.07895789295434952, 0.08725343644618988, -0.004096562508493662, 0.07713106274604797, 0.04764929413795471, 0.03390089422464371, -0.03...
INFO 2025-09-10 14:51:54,643 console_span_processor:39 telemetry: 21:51:54.637 [END] VectorDBsRoutingTable.openai_search_vector_store
[StatusCode.OK] (49.21ms)
INFO 2025-09-10 14:51:54,644 console_span_processor:48 telemetry: output: {'object': 'vector_store.search_results.page', 'search_query':
'shipping time', 'data': [{'file_id': '', 'filename': '', 'score': 0.9984249880472625, 'attributes': {'document_id':
'file-489db9aae0424745960e3408ff0f477f', 'token_count': 12.0, 'metadata_token_count': 1.0}, 'content': [{'type': 'text', 'text': 'Acme ships
globally in 3-5 business days.'}]}], 'has_more': False, 'next_page': None}
INFO 2025-09-10 14:51:54,654 console_span_processor:39 telemetry: 21:51:54.646 [END] VectorIORouter.openai_search_vector_store [StatusCode.OK]
(57.62ms)
INFO 2025-09-10 14:51:54,656 console_span_processor:48 telemetry: output: {'object': 'vector_store.search_results.page', 'search_query':
'shipping time', 'data': [{'file_id': '', 'filename': '', 'score': 0.9984249880472625, 'attributes': {'document_id':
'file-489db9aae0424745960e3408ff0f477f', 'token_count': 12.0, 'metadata_token_count': 1.0}, 'content': [{'type': 'text', 'text': 'Acme ships
globally in 3-5 business days.'}]}], 'has_more': False, 'next_page': None}
INFO 2025-09-10 14:51:54,664 console_span_processor:39 telemetry: 21:51:54.657 [END] /v1/openai/v1/vector_stores/{vector_store_id}/search
[StatusCode.OK] (72.19ms)
INFO 2025-09-10 14:51:54,666 console_span_processor:48 telemetry: raw_path:
/v1/openai/v1/vector_stores/vs_dab05212-db05-402c-91ef-57e41797406b/search
INFO 2025-09-10 14:51:54,670 console_span_processor:62 telemetry: 21:51:54.374 [INFO] 127.0.0.1:56904 - "POST
/v1/openai/v1/vector_stores/vs_dab05212-db05-402c-91ef-57e41797406b/search HTTP/1.1" 200
INFO 2025-09-10 14:51:54,673 console_span_processor:28 telemetry: 21:51:54.673 [START] /v1/openai/v1/vector_stores/{vector_store_id}/search
INFO 2025-09-10 14:51:54,687 console_span_processor:39 telemetry: 21:51:54.678 [END] ModelsRoutingTable.get_model [StatusCode.OK] (0.38ms)
INFO 2025-09-10 14:51:54,688 console_span_processor:48 telemetry: output: {'identifier': 'sentence-transformers/all-MiniLM-L6-v2',
'provider_resource_id': 'all-MiniLM-L6-v2', 'provider_id': 'sentence-transformers', 'type': 'model', 'owner': None, 'source':
'listed_from_provider', 'metadata': {'embedding_dimension': 384}, 'model_type': 'embedding'}
INFO 2025-09-10 14:51:54,697 console_span_processor:39 telemetry: 21:51:54.691 [END] ModelsRoutingTable.get_provider_impl [StatusCode.OK] (0.21ms)
INFO 2025-09-10 14:51:54,698 console_span_processor:48 telemetry: output:
<llama_stack.providers.inline.inference.sentence_transformers.sentence_transformers.SentenceTransformersInferenceImpl object at 0x158e83350>
INFO 2025-09-10 14:51:54,701 console_span_processor:39 telemetry: 21:51:54.699 [END] ModelsRoutingTable.get_model [StatusCode.OK] (0.24ms)
INFO 2025-09-10 14:51:54,704 console_span_processor:48 telemetry: output: {'identifier': 'sentence-transformers/all-MiniLM-L6-v2',
'provider_resource_id': 'all-MiniLM-L6-v2', 'provider_id': 'sentence-transformers', 'type': 'model', 'owner': None, 'source':
'listed_from_provider', 'metadata': {'embedding_dimension': 384}, 'model_type': 'embedding'}
INFO 2025-09-10 14:51:54,716 console_span_processor:39 telemetry: 21:51:54.706 [END] InferenceRouter.openai_embeddings [StatusCode.OK] (29.72ms)
INFO 2025-09-10 14:51:54,718 console_span_processor:48 telemetry: output: {'object': 'list', 'data': [{'object': 'embedding', 'embedding':
[-0.03642994910478592, -0.005766282323747873, -0.028219470754265785, 0.05074828490614891, 0.023913491517305374, -0.056256189942359924,
0.0007000428740866482, 0.02684980072081089, 0.005779022816568613, 0.0757804811000824, 0.02611902356147766, -0.04347166419029236,
-0.07426290959119797, 0.0033695625606924295, -0.03395790979266167, -0.018579166382551193, 0.031040646135807037, -0.06419522315263748,
-0.11664945632219315, 0.011454297229647636, 0.00203332188539207, 0.00506530050188303, -0.05711820721626282, -0.006884930655360222,
0.0057834964245557785, 0.005828470923006535, -0.05446002259850502, -0.032767001539468765, -0.023773472756147385, -0.046458274126052856,
-0.0579390786588192, 0.052776239812374115, -0.017773080617189407, 0.07396063208580017, -0.007082517724484205, -0.006252078805118799,
0.06502724438905716, -0.04769469425082207, 0.08519715070724487, -0.04995475336909294, -0.02040106989443302, -0.024357719346880913, -0....
INFO 2025-09-10 14:51:54,724 console_span_processor:39 telemetry: 21:51:54.721 [END] FaissVectorIOAdapter.query_chunks [StatusCode.OK] (45.99ms)
INFO 2025-09-10 14:51:54,724 console_span_processor:48 telemetry: output: {'chunks': [{'content': 'Acme ships globally in 3-5 business days.',
'metadata': {'document_id': 'file-489db9aae0424745960e3408ff0f477f', 'token_count': 12, 'metadata_token_count': 1}, 'embedding':
[-0.012346820905804634, -0.04591671749949455, 0.00545357633382082, 0.0767817348241806, -0.01030217856168747, -0.07128783315420151,
-0.047789815813302994, -0.0042580426670610905, -0.08333089202642441, 0.03493816778063774, 0.03678377717733383, -0.022125769406557083,
-0.001785362372174859, 0.03860057145357132, 0.017692940309643745, -0.011320478282868862, 0.020480643957853317, -0.14444826543331146,
-0.03509785607457161, -0.08347956091165543, 0.01723267324268818, -0.020868107676506042, -0.04816542565822601, -0.04063615947961807,
-0.02612607553601265, -0.06816241890192032, -0.021907860413193703, -0.05328420177102089, 0.0035953382030129433, -0.060775868594646454,
-0.07895789295434952, 0.08725343644618988, -0.004096562508493662, 0.07713106274604797, 0.04764929413795471, 0.03390089422464371, -0.03...
INFO 2025-09-10 14:51:54,727 console_span_processor:39 telemetry: 21:51:54.726 [END] VectorDBsRoutingTable.openai_search_vector_store
[StatusCode.OK] (51.80ms)
INFO 2025-09-10 14:51:54,728 console_span_processor:48 telemetry: output: {'object': 'vector_store.search_results.page', 'search_query':
'shipping time', 'data': [{'file_id': '', 'filename': '', 'score': 0.9984249880472625, 'attributes': {'document_id':
'file-489db9aae0424745960e3408ff0f477f', 'token_count': 12.0, 'metadata_token_count': 1.0}, 'content': [{'type': 'text', 'text': 'Acme ships
globally in 3-5 business days.'}]}], 'has_more': False, 'next_page': None}
INFO 2025-09-10 14:51:54,732 console_span_processor:39 telemetry: 21:51:54.730 [END] VectorIORouter.openai_search_vector_store [StatusCode.OK]
(56.53ms)
INFO 2025-09-10 14:51:54,732 console_span_processor:48 telemetry: output: {'object': 'vector_store.search_results.page', 'search_query':
'shipping time', 'data': [{'file_id': '', 'filename': '', 'score': 0.9984249880472625, 'attributes': {'document_id':
'file-489db9aae0424745960e3408ff0f477f', 'token_count': 12.0, 'metadata_token_count': 1.0}, 'content': [{'type': 'text', 'text': 'Acme ships
globally in 3-5 business days.'}]}], 'has_more': False, 'next_page': None}
INFO 2025-09-10 14:51:54,735 console_span_processor:39 telemetry: 21:51:54.734 [END] /v1/openai/v1/vector_stores/{vector_store_id}/search
[StatusCode.OK] (60.83ms)
INFO 2025-09-10 14:51:54,736 console_span_processor:48 telemetry: raw_path:
/v1/openai/v1/vector_stores/vs_dab05212-db05-402c-91ef-57e41797406b/search
INFO 2025-09-10 14:51:54,736 console_span_processor:62 telemetry: 21:51:54.426 [INFO] 127.0.0.1:56904 - "POST
/v1/openai/v1/vector_stores/vs_dab05212-db05-402c-91ef-57e41797406b/search HTTP/1.1" 200
INFO 2025-09-10 14:51:54,737 console_span_processor:28 telemetry: 21:51:54.737 [START] /v1/openai/v1/vector_stores/{vector_store_id}/search
INFO 2025-09-10 14:51:54,747 console_span_processor:39 telemetry: 21:51:54.740 [END] ModelsRoutingTable.get_model [StatusCode.OK] (0.15ms)
INFO 2025-09-10 14:51:54,748 console_span_processor:48 telemetry: output: {'identifier': 'sentence-transformers/all-MiniLM-L6-v2',
'provider_resource_id': 'all-MiniLM-L6-v2', 'provider_id': 'sentence-transformers', 'type': 'model', 'owner': None, 'source':
'listed_from_provider', 'metadata': {'embedding_dimension': 384}, 'model_type': 'embedding'}
INFO 2025-09-10 14:51:54,752 console_span_processor:39 telemetry: 21:51:54.750 [END] ModelsRoutingTable.get_provider_impl [StatusCode.OK] (0.22ms)
INFO 2025-09-10 14:51:54,752 console_span_processor:48 telemetry: output:
<llama_stack.providers.inline.inference.sentence_transformers.sentence_transformers.SentenceTransformersInferenceImpl object at 0x158e83350>
INFO 2025-09-10 14:51:54,755 console_span_processor:39 telemetry: 21:51:54.754 [END] ModelsRoutingTable.get_model [StatusCode.OK] (0.32ms)
INFO 2025-09-10 14:51:54,756 console_span_processor:48 telemetry: output: {'identifier': 'sentence-transformers/all-MiniLM-L6-v2',
'provider_resource_id': 'all-MiniLM-L6-v2', 'provider_id': 'sentence-transformers', 'type': 'model', 'owner': None, 'source':
'listed_from_provider', 'metadata': {'embedding_dimension': 384}, 'model_type': 'embedding'}
INFO 2025-09-10 14:51:54,758 console_span_processor:39 telemetry: 21:51:54.756 [END] InferenceRouter.openai_embeddings [StatusCode.OK] (17.05ms)
INFO 2025-09-10 14:51:54,761 console_span_processor:48 telemetry: output: {'object': 'list', 'data': [{'object': 'embedding', 'embedding':
[-0.03642994910478592, -0.005766282323747873, -0.028219470754265785, 0.05074828490614891, 0.023913491517305374, -0.056256189942359924,
0.0007000428740866482, 0.02684980072081089, 0.005779022816568613, 0.0757804811000824, 0.02611902356147766, -0.04347166419029236,
-0.07426290959119797, 0.0033695625606924295, -0.03395790979266167, -0.018579166382551193, 0.031040646135807037, -0.06419522315263748,
-0.11664945632219315, 0.011454297229647636, 0.00203332188539207, 0.00506530050188303, -0.05711820721626282, -0.006884930655360222,
0.0057834964245557785, 0.005828470923006535, -0.05446002259850502, -0.032767001539468765, -0.023773472756147385, -0.046458274126052856,
-0.0579390786588192, 0.052776239812374115, -0.017773080617189407, 0.07396063208580017, -0.007082517724484205, -0.006252078805118799,
0.06502724438905716, -0.04769469425082207, 0.08519715070724487, -0.04995475336909294, -0.02040106989443302, -0.024357719346880913, -0....
INFO 2025-09-10 14:51:54,767 console_span_processor:39 telemetry: 21:51:54.762 [END] FaissVectorIOAdapter.query_chunks [StatusCode.OK] (23.20ms)
INFO 2025-09-10 14:51:54,767 console_span_processor:48 telemetry: output: {'chunks': [{'content': 'Acme ships globally in 3-5 business days.',
'metadata': {'document_id': 'file-489db9aae0424745960e3408ff0f477f', 'token_count': 12, 'metadata_token_count': 1}, 'embedding':
[-0.012346820905804634, -0.04591671749949455, 0.00545357633382082, 0.0767817348241806, -0.01030217856168747, -0.07128783315420151,
-0.047789815813302994, -0.0042580426670610905, -0.08333089202642441, 0.03493816778063774, 0.03678377717733383, -0.022125769406557083,
-0.001785362372174859, 0.03860057145357132, 0.017692940309643745, -0.011320478282868862, 0.020480643957853317, -0.14444826543331146,
-0.03509785607457161, -0.08347956091165543, 0.01723267324268818, -0.020868107676506042, -0.04816542565822601, -0.04063615947961807,
-0.02612607553601265, -0.06816241890192032, -0.021907860413193703, -0.05328420177102089, 0.0035953382030129433, -0.060775868594646454,
-0.07895789295434952, 0.08725343644618988, -0.004096562508493662, 0.07713106274604797, 0.04764929413795471, 0.03390089422464371, -0.03...
INFO 2025-09-10 14:51:54,772 console_span_processor:39 telemetry: 21:51:54.769 [END] VectorDBsRoutingTable.openai_search_vector_store
[StatusCode.OK] (30.01ms)
INFO 2025-09-10 14:51:54,773 console_span_processor:48 telemetry: output: {'object': 'vector_store.search_results.page', 'search_query':
'shipping time', 'data': [{'file_id': '', 'filename': '', 'score': 0.9984249880472625, 'attributes': {'document_id':
'file-489db9aae0424745960e3408ff0f477f', 'token_count': 12.0, 'metadata_token_count': 1.0}, 'content': [{'type': 'text', 'text': 'Acme ships
globally in 3-5 business days.'}]}], 'has_more': False, 'next_page': None}
INFO 2025-09-10 14:51:54,775 console_span_processor:39 telemetry: 21:51:54.774 [END] VectorIORouter.openai_search_vector_store [StatusCode.OK]
(35.79ms)
INFO 2025-09-10 14:51:54,776 console_span_processor:48 telemetry: output: {'object': 'vector_store.search_results.page', 'search_query':
'shipping time', 'data': [{'file_id': '', 'filename': '', 'score': 0.9984249880472625, 'attributes': {'document_id':
'file-489db9aae0424745960e3408ff0f477f', 'token_count': 12.0, 'metadata_token_count': 1.0}, 'content': [{'type': 'text', 'text': 'Acme ships
globally in 3-5 business days.'}]}], 'has_more': False, 'next_page': None}
INFO 2025-09-10 14:51:54,778 console_span_processor:39 telemetry: 21:51:54.777 [END] /v1/openai/v1/vector_stores/{vector_store_id}/search
[StatusCode.OK] (40.35ms)
INFO 2025-09-10 14:51:54,779 console_span_processor:48 telemetry: raw_path:
/v1/openai/v1/vector_stores/vs_dab05212-db05-402c-91ef-57e41797406b/search
INFO 2025-09-10 14:51:54,779 console_span_processor:62 telemetry: 21:51:54.457 [INFO] 127.0.0.1:56904 - "POST
/v1/openai/v1/vector_stores/vs_dab05212-db05-402c-91ef-57e41797406b/search HTTP/1.1" 200
INFO 2025-09-10 14:51:54,781 console_span_processor:28 telemetry: 21:51:54.781 [START] /v1/openai/v1/chat/completions
INFO 2025-09-10 14:51:54,790 console_span_processor:39 telemetry: 21:51:54.786 [END] ModelsRoutingTable.get_model [StatusCode.OK] (0.82ms)
INFO 2025-09-10 14:51:54,790 console_span_processor:48 telemetry: output: {'identifier': 'together/meta-llama/Llama-3.3-70B-Instruct-Turbo',
'provider_resource_id': 'meta-llama/Llama-3.3-70B-Instruct-Turbo', 'provider_id': 'together', 'type': 'model', 'owner': None, 'source':
'listed_from_provider', 'metadata': {}, 'model_type': 'llm'}
INFO 2025-09-10 14:51:54,794 console_span_processor:39 telemetry: 21:51:54.792 [END] ModelsRoutingTable.get_provider_impl [StatusCode.OK] (0.24ms)
INFO 2025-09-10 14:51:54,794 console_span_processor:48 telemetry: output:
<llama_stack.providers.remote.inference.together.together.TogetherInferenceAdapter object at 0x137069220>
INFO 2025-09-10 14:51:54,798 console_span_processor:39 telemetry: 21:51:54.796 [END] ModelsRoutingTable.get_model [StatusCode.OK] (0.21ms)
INFO 2025-09-10 14:51:54,798 console_span_processor:48 telemetry: output: {'identifier': 'together/meta-llama/Llama-3.3-70B-Instruct-Turbo',
'provider_resource_id': 'meta-llama/Llama-3.3-70B-Instruct-Turbo', 'provider_id': 'together', 'type': 'model', 'owner': None, 'source':
'listed_from_provider', 'metadata': {}, 'model_type': 'llm'}
INFO 2025-09-10 14:51:57,872 console_span_processor:39 telemetry: 21:51:57.868 [END] TogetherInferenceAdapter.openai_chat_completion
[StatusCode.OK] (3072.99ms)
INFO 2025-09-10 14:51:57,872 console_span_processor:48 telemetry: output: {'id': 'oAitcfB-4YNCb4-97d2263f6ff7cfe9', 'choices':
[{'finish_reason': 'stop', 'index': 0, 'logprobs': None, 'message': {'content': 'Thought: Since I couldn\'t get a relevant result from the
Llama Stack Vector Store RAG tool, I will provide a general answer to the question "How long does shipping take?".\n\nThe shipping time can
vary depending on the destination, shipping method, and other factors. Typically, shipping times can range from a few days to several weeks
or even months. Here are some general guidelines:\n\n* Domestic shipping: 1-7 business days\n* International shipping: 7-21 business days or
more\n* Express shipping: 1-3 business days\n* Standard shipping: 3-7 business days\n\nPlease note that these are general estimates and the
actual shipping time may vary depending on the specific circumstances.\n\nThought: I now can give a great answer\nFinal Answer: The shipping
time can vary depending on the destination, shipping method, and other factors. Typically, shipping tim...
INFO 2025-09-10 14:51:57,875 uvicorn.access:473 uncategorized: ::1:56900 - "POST /v1/openai/v1/chat/completions HTTP/1.1" 200
INFO 2025-09-10 14:51:57,877 console_span_processor:39 telemetry: 21:51:57.876 [END] InferenceRouter.openai_chat_completion [StatusCode.OK]
(3091.29ms)
INFO 2025-09-10 14:51:57,878 console_span_processor:48 telemetry: output: {'id': 'oAitcfB-4YNCb4-97d2263f6ff7cfe9', 'choices':
[{'finish_reason': 'stop', 'index': 0, 'logprobs': None, 'message': {'content': 'Thought: Since I couldn\'t get a relevant result from the
Llama Stack Vector Store RAG tool, I will provide a general answer to the question "How long does shipping take?".\n\nThe shipping time can
vary depending on the destination, shipping method, and other factors. Typically, shipping times can range from a few days to several weeks
or even months. Here are some general guidelines:\n\n* Domestic shipping: 1-7 business days\n* International shipping: 7-21 business days or
more\n* Express shipping: 1-3 business days\n* Standard shipping: 3-7 business days\n\nPlease note that these are general estimates and the
actual shipping time may vary depending on the specific circumstances.\n\nThought: I now can give a great answer\nFinal Answer: The shipping
time can vary depending on the destination, shipping method, and other factors. Typically, shipping tim...
INFO 2025-09-10 14:51:57,880 console_span_processor:62 telemetry: 21:51:57.874 [INFO] metric.prompt_tokens
INFO 2025-09-10 14:51:57,880 console_span_processor:67 telemetry: value: 1948
INFO 2025-09-10 14:51:57,881 console_span_processor:67 telemetry: unit: tokens
INFO 2025-09-10 14:51:57,881 console_span_processor:67 telemetry: model_id: together/meta-llama/Llama-3.3-70B-Instruct-Turbo
INFO 2025-09-10 14:51:57,881 console_span_processor:67 telemetry: provider_id: together
INFO 2025-09-10 14:51:57,882 console_span_processor:62 telemetry: 21:51:57.874 [INFO] metric.completion_tokens
INFO 2025-09-10 14:51:57,882 console_span_processor:67 telemetry: value: 264
INFO 2025-09-10 14:51:57,882 console_span_processor:67 telemetry: unit: tokens
INFO 2025-09-10 14:51:57,883 console_span_processor:67 telemetry: model_id: together/meta-llama/Llama-3.3-70B-Instruct-Turbo
INFO 2025-09-10 14:51:57,883 console_span_processor:67 telemetry: provider_id: together
INFO 2025-09-10 14:51:57,884 console_span_processor:62 telemetry: 21:51:57.874 [INFO] metric.total_tokens
INFO 2025-09-10 14:51:57,884 console_span_processor:67 telemetry: value: 2212
INFO 2025-09-10 14:51:57,884 console_span_processor:67 telemetry: unit: tokens
INFO 2025-09-10 14:51:57,885 console_span_processor:67 telemetry: model_id: together/meta-llama/Llama-3.3-70B-Instruct-Turbo
INFO 2025-09-10 14:51:57,886 console_span_processor:67 telemetry: provider_id: together
INFO 2025-09-10 14:51:57,890 console_span_processor:39 telemetry: 21:51:57.887 [END] /v1/openai/v1/chat/completions [StatusCode.OK] (3106.16ms)
INFO 2025-09-10 14:51:57,891 console_span_processor:48 telemetry: raw_path: /v1/openai/v1/chat/completions
INFO 2025-09-10 14:51:57,891 console_span_processor:62 telemetry: 21:51:57.875 [INFO] ::1:56900 - "POST /v1/openai/v1/chat/completions HTTP/1.1"
200
INFO 2025-09-10 14:55:09,448 console_span_processor:28 telemetry: 21:55:09.448 [START] /v1/openai/v1/chat/completions
INFO 2025-09-10 14:55:09,463 console_span_processor:39 telemetry: 21:55:09.453 [END] ModelsRoutingTable.get_model [StatusCode.OK] (0.18ms)
INFO 2025-09-10 14:55:09,465 console_span_processor:48 telemetry: output: {'identifier': 'together/meta-llama/Llama-3.3-70B-Instruct-Turbo',
'provider_resource_id': 'meta-llama/Llama-3.3-70B-Instruct-Turbo', 'provider_id': 'together', 'type': 'model', 'owner': None, 'source':
'listed_from_provider', 'metadata': {}, 'model_type': 'llm'}
INFO 2025-09-10 14:55:09,478 console_span_processor:39 telemetry: 21:55:09.467 [END] ModelsRoutingTable.get_provider_impl [StatusCode.OK] (0.18ms)
INFO 2025-09-10 14:55:09,479 console_span_processor:48 telemetry: output:
<llama_stack.providers.remote.inference.together.together.TogetherInferenceAdapter object at 0x137069220>
INFO 2025-09-10 14:55:09,483 console_span_processor:39 telemetry: 21:55:09.480 [END] ModelsRoutingTable.get_model [StatusCode.OK] (0.20ms)
INFO 2025-09-10 14:55:09,484 console_span_processor:48 telemetry: output: {'identifier': 'together/meta-llama/Llama-3.3-70B-Instruct-Turbo',
'provider_resource_id': 'meta-llama/Llama-3.3-70B-Instruct-Turbo', 'provider_id': 'together', 'type': 'model', 'owner': None, 'source':
'listed_from_provider', 'metadata': {}, 'model_type': 'llm'}
INFO 2025-09-10 14:55:11,246 console_span_processor:39 telemetry: 21:55:11.242 [END] TogetherInferenceAdapter.openai_chat_completion
[StatusCode.OK] (1762.00ms)
INFO 2025-09-10 14:55:11,247 console_span_processor:48 telemetry: output: {'id': 'oAiuccr-62bZhn-97d22b0209009e58', 'choices':
[{'finish_reason': 'stop', 'index': 0, 'logprobs': None, 'message': {'content': 'Thought: To answer the question "How long does shipping
take?", I need to search the provided vector store for relevant information. The vector store ID is vs_dab05212-db05-402c-91ef-57e41797406b.
I will use the Llama Stack Vector Store RAG tool to find the most relevant documents.\n\nAction: Llama Stack Vector Store RAG tool\nAction
Input: {"query": "How long does shipping take?", "vector_store_id": "vs_dab05212-db05-402c-91ef-57e41797406b", "top_k": 1, "score_threshold":
0}', 'refusal': None, 'role': 'assistant', 'annotations': None, 'audio': None, 'function_call': None, 'tool_calls': []}, 'seed':
3440355828201570300}], 'created': 1757541309, 'model': 'meta-llama/Llama-3.3-70B-Instruct-Turbo', 'object': 'chat.completion',
'service_tier': None, 'system_fingerprint': None, 'usage': {'completion_tokens': 138, 'prompt_tokens': 495, 'total_tokens': 633, ...
INFO 2025-09-10 14:55:11,249 uvicorn.access:473 uncategorized: ::1:57854 - "POST /v1/openai/v1/chat/completions HTTP/1.1" 200
INFO 2025-09-10 14:55:11,259 console_span_processor:39 telemetry: 21:55:11.250 [END] InferenceRouter.openai_chat_completion [StatusCode.OK]
(1797.12ms)
INFO 2025-09-10 14:55:11,260 console_span_processor:48 telemetry: output: {'id': 'oAiuccr-62bZhn-97d22b0209009e58', 'choices':
[{'finish_reason': 'stop', 'index': 0, 'logprobs': None, 'message': {'content': 'Thought: To answer the question "How long does shipping
take?", I need to search the provided vector store for relevant information. The vector store ID is vs_dab05212-db05-402c-91ef-57e41797406b.
I will use the Llama Stack Vector Store RAG tool to find the most relevant documents.\n\nAction: Llama Stack Vector Store RAG tool\nAction
Input: {"query": "How long does shipping take?", "vector_store_id": "vs_dab05212-db05-402c-91ef-57e41797406b", "top_k": 1, "score_threshold":
0}', 'refusal': None, 'role': 'assistant', 'annotations': None, 'audio': None, 'function_call': None, 'tool_calls': None}, 'seed':
3440355828201570300}], 'created': 1757541309, 'model': 'meta-llama/Llama-3.3-70B-Instruct-Turbo', 'object': 'chat.completion',
'service_tier': None, 'system_fingerprint': None, 'usage': {'completion_tokens': 138, 'prompt_tokens': 495, 'total_tokens': 633...
INFO 2025-09-10 14:55:11,261 console_span_processor:62 telemetry: 21:55:11.248 [INFO] metric.prompt_tokens
INFO 2025-09-10 14:55:11,261 console_span_processor:67 telemetry: value: 495
INFO 2025-09-10 14:55:11,262 console_span_processor:67 telemetry: unit: tokens
INFO 2025-09-10 14:55:11,262 console_span_processor:67 telemetry: model_id: together/meta-llama/Llama-3.3-70B-Instruct-Turbo
INFO 2025-09-10 14:55:11,263 console_span_processor:67 telemetry: provider_id: together
INFO 2025-09-10 14:55:11,263 console_span_processor:62 telemetry: 21:55:11.249 [INFO] metric.completion_tokens
INFO 2025-09-10 14:55:11,264 console_span_processor:67 telemetry: value: 138
INFO 2025-09-10 14:55:11,264 console_span_processor:67 telemetry: unit: tokens
INFO 2025-09-10 14:55:11,265 console_span_processor:67 telemetry: model_id: together/meta-llama/Llama-3.3-70B-Instruct-Turbo
INFO 2025-09-10 14:55:11,265 console_span_processor:67 telemetry: provider_id: together
INFO 2025-09-10 14:55:11,265 console_span_processor:62 telemetry: 21:55:11.249 [INFO] metric.total_tokens
INFO 2025-09-10 14:55:11,266 console_span_processor:67 telemetry: value: 633
INFO 2025-09-10 14:55:11,266 console_span_processor:67 telemetry: unit: tokens
INFO 2025-09-10 14:55:11,266 console_span_processor:67 telemetry: model_id: together/meta-llama/Llama-3.3-70B-Instruct-Turbo
INFO 2025-09-10 14:55:11,267 console_span_processor:67 telemetry: provider_id: together
INFO 2025-09-10 14:55:11,284 console_span_processor:39 telemetry: 21:55:11.268 [END] /v1/openai/v1/chat/completions [StatusCode.OK] (1819.72ms)
INFO 2025-09-10 14:55:11,285 console_span_processor:48 telemetry: raw_path: /v1/openai/v1/chat/completions
INFO 2025-09-10 14:55:11,287 console_span_processor:62 telemetry: 21:55:11.250 [INFO] ::1:57854 - "POST /v1/openai/v1/chat/completions HTTP/1.1"
200
INFO 2025-09-10 14:55:11,289 console_span_processor:28 telemetry: 21:55:11.289 [START] /v1/openai/v1/vector_stores/{vector_store_id}/search
INFO 2025-09-10 14:55:11,316 console_span_processor:39 telemetry: 21:55:11.306 [END] ModelsRoutingTable.get_model [StatusCode.OK] (0.72ms)
INFO 2025-09-10 14:55:11,317 console_span_processor:48 telemetry: output: {'identifier': 'sentence-transformers/all-MiniLM-L6-v2',
'provider_resource_id': 'all-MiniLM-L6-v2', 'provider_id': 'sentence-transformers', 'type': 'model', 'owner': None, 'source':
'listed_from_provider', 'metadata': {'embedding_dimension': 384}, 'model_type': 'embedding'}
INFO 2025-09-10 14:55:11,325 console_span_processor:39 telemetry: 21:55:11.319 [END] ModelsRoutingTable.get_provider_impl [StatusCode.OK] (0.33ms)
INFO 2025-09-10 14:55:11,326 console_span_processor:48 telemetry: output:
<llama_stack.providers.inline.inference.sentence_transformers.sentence_transformers.SentenceTransformersInferenceImpl object at 0x158e83350>
INFO 2025-09-10 14:55:11,337 console_span_processor:39 telemetry: 21:55:11.328 [END] ModelsRoutingTable.get_model [StatusCode.OK] (0.26ms)
INFO 2025-09-10 14:55:11,339 console_span_processor:48 telemetry: output: {'identifier': 'sentence-transformers/all-MiniLM-L6-v2',
'provider_resource_id': 'all-MiniLM-L6-v2', 'provider_id': 'sentence-transformers', 'type': 'model', 'owner': None, 'source':
'listed_from_provider', 'metadata': {'embedding_dimension': 384}, 'model_type': 'embedding'}
INFO 2025-09-10 14:55:11,725 uvicorn.access:473 uncategorized: 127.0.0.1:57863 - "POST
/v1/openai/v1/vector_stores/vs_dab05212-db05-402c-91ef-57e41797406b/search HTTP/1.1" 200
INFO 2025-09-10 14:55:11,816 console_span_processor:39 telemetry: 21:55:11.712 [END] InferenceRouter.openai_embeddings [StatusCode.OK] (407.13ms)
INFO 2025-09-10 14:55:11,817 console_span_processor:48 telemetry: output: {'object': 'list', 'data': [{'object': 'embedding', 'embedding':
[0.0018660365603864193, -0.008432421833276749, -0.009860510006546974, 0.07527908682823181, -0.008166038431227207, -0.08819602429866791,
-0.025107912719249725, -0.029266025871038437, 0.014401894062757492, 0.06447950005531311, 0.04112009331583977, -0.04028748720884323,
-0.02221696823835373, -0.009235711768269539, -0.04810388386249542, -0.02784842811524868, 0.016442419961094856, -0.07583750039339066,
-0.06627479195594788, 0.01860453188419342, 0.0008918081293813884, 0.011179491877555847, -0.048671603202819824, -0.021989954635500908,
0.04990514740347862, -0.003409573109820485, -0.06727275997400284, -0.054264623671770096, -0.022502778097987175, -0.03865018114447594,
-0.0471607930958271, 0.01671769842505455, 0.024404950439929962, 0.09877222776412964, -0.01660928875207901, 0.01298862136900425,
0.02916400320827961, -0.0722617655992508, 0.041335687041282654, -0.037857454270124435, -0.02524978667497635, -0.010434110648930073, -0....
INFO 2025-09-10 14:55:11,821 console_span_processor:39 telemetry: 21:55:11.818 [END] FaissVectorIOAdapter.query_chunks [StatusCode.OK] (515.05ms)
INFO 2025-09-10 14:55:11,822 console_span_processor:48 telemetry: output: {'chunks': [{'content': 'Acme ships globally in 3-5 business days.',
'metadata': {'document_id': 'file-489db9aae0424745960e3408ff0f477f', 'token_count': 12, 'metadata_token_count': 1}, 'embedding':
[-0.012346820905804634, -0.04591671749949455, 0.00545357633382082, 0.0767817348241806, -0.01030217856168747, -0.07128783315420151,
-0.047789815813302994, -0.0042580426670610905, -0.08333089202642441, 0.03493816778063774, 0.03678377717733383, -0.022125769406557083,
-0.001785362372174859, 0.03860057145357132, 0.017692940309643745, -0.011320478282868862, 0.020480643957853317, -0.14444826543331146,
-0.03509785607457161, -0.08347956091165543, 0.01723267324268818, -0.020868107676506042, -0.04816542565822601, -0.04063615947961807,
-0.02612607553601265, -0.06816241890192032, -0.021907860413193703, -0.05328420177102089, 0.0035953382030129433, -0.060775868594646454,
-0.07895789295434952, 0.08725343644618988, -0.004096562508493662, 0.07713106274604797, 0.04764929413795471, 0.03390089422464371, -0.03...
INFO 2025-09-10 14:55:11,831 console_span_processor:39 telemetry: 21:55:11.824 [END] VectorDBsRoutingTable.openai_search_vector_store
[StatusCode.OK] (524.43ms)
INFO 2025-09-10 14:55:11,832 console_span_processor:48 telemetry: output: {'object': 'vector_store.search_results.page', 'search_query': 'How
long does shipping take?', 'data': [{'file_id': '', 'filename': '', 'score': 1.0150761400159014, 'attributes': {'document_id':
'file-489db9aae0424745960e3408ff0f477f', 'token_count': 12.0, 'metadata_token_count': 1.0}, 'content': [{'type': 'text', 'text': 'Acme ships
globally in 3-5 business days.'}]}], 'has_more': False, 'next_page': None}
INFO 2025-09-10 14:55:11,837 console_span_processor:39 telemetry: 21:55:11.834 [END] VectorIORouter.openai_search_vector_store [StatusCode.OK]
(535.84ms)
INFO 2025-09-10 14:55:11,838 console_span_processor:48 telemetry: output: {'object': 'vector_store.search_results.page', 'search_query': 'How
long does shipping take?', 'data': [{'file_id': '', 'filename': '', 'score': 1.0150761400159014, 'attributes': {'document_id':
'file-489db9aae0424745960e3408ff0f477f', 'token_count': 12.0, 'metadata_token_count': 1.0}, 'content': [{'type': 'text', 'text': 'Acme ships
globally in 3-5 business days.'}]}], 'has_more': False, 'next_page': None}
INFO 2025-09-10 14:55:11,843 console_span_processor:39 telemetry: 21:55:11.840 [END] /v1/openai/v1/vector_stores/{vector_store_id}/search
[StatusCode.OK] (550.67ms)
INFO 2025-09-10 14:55:11,844 console_span_processor:48 telemetry: raw_path:
/v1/openai/v1/vector_stores/vs_dab05212-db05-402c-91ef-57e41797406b/search
INFO 2025-09-10 14:55:11,844 console_span_processor:62 telemetry: 21:55:11.728 [INFO] 127.0.0.1:57863 - "POST
/v1/openai/v1/vector_stores/vs_dab05212-db05-402c-91ef-57e41797406b/search HTTP/1.1" 200
INFO 2025-09-10 14:55:11,845 console_span_processor:28 telemetry: 21:55:11.845 [START] /v1/openai/v1/chat/completions
INFO 2025-09-10 14:55:11,848 console_span_processor:39 telemetry: 21:55:11.846 [END] ModelsRoutingTable.get_model [StatusCode.OK] (0.15ms)
INFO 2025-09-10 14:55:11,849 console_span_processor:48 telemetry: output: {'identifier': 'together/meta-llama/Llama-3.3-70B-Instruct-Turbo',
'provider_resource_id': 'meta-llama/Llama-3.3-70B-Instruct-Turbo', 'provider_id': 'together', 'type': 'model', 'owner': None, 'source':
'listed_from_provider', 'metadata': {}, 'model_type': 'llm'}
INFO 2025-09-10 14:55:11,866 console_span_processor:39 telemetry: 21:55:11.850 [END] ModelsRoutingTable.get_provider_impl [StatusCode.OK] (0.33ms)
INFO 2025-09-10 14:55:11,866 console_span_processor:48 telemetry: output:
<llama_stack.providers.remote.inference.together.together.TogetherInferenceAdapter object at 0x137069220>
INFO 2025-09-10 14:55:11,893 console_span_processor:39 telemetry: 21:55:11.868 [END] ModelsRoutingTable.get_model [StatusCode.OK] (0.18ms)
INFO 2025-09-10 14:55:11,894 console_span_processor:48 telemetry: output: {'identifier': 'together/meta-llama/Llama-3.3-70B-Instruct-Turbo',
'provider_resource_id': 'meta-llama/Llama-3.3-70B-Instruct-Turbo', 'provider_id': 'together', 'type': 'model', 'owner': None, 'source':
'listed_from_provider', 'metadata': {}, 'model_type': 'llm'}
INFO 2025-09-10 14:55:12,290 console_span_processor:39 telemetry: 21:55:12.288 [END] TogetherInferenceAdapter.openai_chat_completion
[StatusCode.OK] (421.30ms)
INFO 2025-09-10 14:55:12,291 console_span_processor:48 telemetry: output: {'id': 'oAiudJu-62bZhn-97d22b1098a9ed39', 'choices':
[{'finish_reason': 'stop', 'index': 0, 'logprobs': None, 'message': {'content': 'Thought: I now know the final answer\nFinal Answer: Acme
ships globally in 3-5 business days.', 'refusal': None, 'role': 'assistant', 'annotations': None, 'audio': None, 'function_call': None,
'tool_calls': []}, 'seed': 9970525031584217000}], 'created': 1757541312, 'model': 'meta-llama/Llama-3.3-70B-Instruct-Turbo', 'object':
'chat.completion', 'service_tier': None, 'system_fingerprint': None, 'usage': {'completion_tokens': 25, 'prompt_tokens': 655, 'total_tokens':
680, 'completion_tokens_details': None, 'prompt_tokens_details': None, 'cached_tokens': 512}, 'prompt': []}
INFO 2025-09-10 14:55:12,297 uvicorn.access:473 uncategorized: ::1:57854 - "POST /v1/openai/v1/chat/completions HTTP/1.1" 200
INFO 2025-09-10 14:55:12,324 console_span_processor:39 telemetry: 21:55:12.298 [END] InferenceRouter.openai_chat_completion [StatusCode.OK]
(451.81ms)
INFO 2025-09-10 14:55:12,326 console_span_processor:48 telemetry: output: {'id': 'oAiudJu-62bZhn-97d22b1098a9ed39', 'choices':
[{'finish_reason': 'stop', 'index': 0, 'logprobs': None, 'message': {'content': 'Thought: I now know the final answer\nFinal Answer: Acme
ships globally in 3-5 business days.', 'refusal': None, 'role': 'assistant', 'annotations': None, 'audio': None, 'function_call': None,
'tool_calls': None}, 'seed': 9970525031584217000}], 'created': 1757541312, 'model': 'meta-llama/Llama-3.3-70B-Instruct-Turbo', 'object':
'chat.completion', 'service_tier': None, 'system_fingerprint': None, 'usage': {'completion_tokens': 25, 'prompt_tokens': 655, 'total_tokens':
680, 'completion_tokens_details': None, 'prompt_tokens_details': None, 'cached_tokens': 512}, 'prompt': [], 'metrics': [{'trace_id':
'b0fe401af1dce917b7278f7a651b67bc', 'span_id': '7130a92e6a6a8fba', 'timestamp': '2025-09-10T21:55:12.297305Z', 'attributes': {'model_id':
'together/meta-llama/Llama-3.3-70B-Instruct-Turbo', 'provider_id': 'together'}, 'type': 'metric', 'metric': 'prompt_toke...
INFO 2025-09-10 14:55:12,327 console_span_processor:62 telemetry: 21:55:12.297 [INFO] metric.prompt_tokens
INFO 2025-09-10 14:55:12,328 console_span_processor:67 telemetry: value: 655
INFO 2025-09-10 14:55:12,328 console_span_processor:67 telemetry: unit: tokens
INFO 2025-09-10 14:55:12,329 console_span_processor:67 telemetry: model_id: together/meta-llama/Llama-3.3-70B-Instruct-Turbo
INFO 2025-09-10 14:55:12,329 console_span_processor:67 telemetry: provider_id: together
INFO 2025-09-10 14:55:12,329 console_span_processor:62 telemetry: 21:55:12.297 [INFO] metric.completion_tokens
INFO 2025-09-10 14:55:12,330 console_span_processor:67 telemetry: value: 25
INFO 2025-09-10 14:55:12,330 console_span_processor:67 telemetry: unit: tokens
INFO 2025-09-10 14:55:12,331 console_span_processor:67 telemetry: model_id: together/meta-llama/Llama-3.3-70B-Instruct-Turbo
INFO 2025-09-10 14:55:12,331 console_span_processor:67 telemetry: provider_id: together
INFO 2025-09-10 14:55:12,332 console_span_processor:62 telemetry: 21:55:12.297 [INFO] metric.total_tokens
INFO 2025-09-10 14:55:12,332 console_span_processor:67 telemetry: value: 680
INFO 2025-09-10 14:55:12,332 console_span_processor:67 telemetry: unit: tokens
INFO 2025-09-10 14:55:12,333 console_span_processor:67 telemetry: model_id: together/meta-llama/Llama-3.3-70B-Instruct-Turbo
INFO 2025-09-10 14:55:12,333 console_span_processor:67 telemetry: provider_id: together
INFO 2025-09-10 14:55:12,353 console_span_processor:39 telemetry: 21:55:12.335 [END] /v1/openai/v1/chat/completions [StatusCode.OK] (489.36ms)
INFO 2025-09-10 14:55:12,355 console_span_processor:48 telemetry: raw_path: /v1/openai/v1/chat/completions
INFO 2025-09-10 14:55:12,358 console_span_processor:62 telemetry: 21:55:12.298 [INFO] ::1:57854 - "POST /v1/openai/v1/chat/completions HTTP/1.1"
200
INFO 2025-09-10 14:55:19,314 console_span_processor:28 telemetry: 21:55:19.314 [START] /v1/openai/v1/chat/completions
INFO 2025-09-10 14:55:19,320 console_span_processor:39 telemetry: 21:55:19.316 [END] ModelsRoutingTable.get_model [StatusCode.OK] (0.15ms)
INFO 2025-09-10 14:55:19,322 console_span_processor:48 telemetry: output: {'identifier': 'together/meta-llama/Llama-3.3-70B-Instruct-Turbo',
'provider_resource_id': 'meta-llama/Llama-3.3-70B-Instruct-Turbo', 'provider_id': 'together', 'type': 'model', 'owner': None, 'source':
'listed_from_provider', 'metadata': {}, 'model_type': 'llm'}
INFO 2025-09-10 14:55:19,325 console_span_processor:39 telemetry: 21:55:19.323 [END] ModelsRoutingTable.get_provider_impl [StatusCode.OK] (0.17ms)
INFO 2025-09-10 14:55:19,326 console_span_processor:48 telemetry: output:
<llama_stack.providers.remote.inference.together.together.TogetherInferenceAdapter object at 0x137069220>
INFO 2025-09-10 14:55:19,331 console_span_processor:39 telemetry: 21:55:19.327 [END] ModelsRoutingTable.get_model [StatusCode.OK] (0.23ms)
INFO 2025-09-10 14:55:19,332 console_span_processor:48 telemetry: output: {'identifier': 'together/meta-llama/Llama-3.3-70B-Instruct-Turbo',
'provider_resource_id': 'meta-llama/Llama-3.3-70B-Instruct-Turbo', 'provider_id': 'together', 'type': 'model', 'owner': None, 'source':
'listed_from_provider', 'metadata': {}, 'model_type': 'llm'}
INFO 2025-09-10 14:55:21,608 console_span_processor:39 telemetry: 21:55:21.606 [END] TogetherInferenceAdapter.openai_chat_completion
[StatusCode.OK] (2279.25ms)
INFO 2025-09-10 14:55:21,610 console_span_processor:48 telemetry: output: {'id': 'oAiufav-4YNCb4-97d22b3f6cb27af2', 'choices':
[{'finish_reason': 'stop', 'index': 0, 'logprobs': None, 'message': {'content': 'Thought: To answer the question "Can I return a product
after 40 days?", I need to search the vector store to find relevant information about the return policy. I will use the Llama Stack Vector
Store RAG tool to search the provided vector store ID.\n\nAction: Llama Stack Vector Store RAG tool\nAction Input: {"query": "return policy
after 40 days", "vector_store_id": "vs_dab05212-db05-402c-91ef-57e41797406b", "top_k": 1, "score_threshold": 0.5}', 'refusal': None, 'role':
'assistant', 'annotations': None, 'audio': None, 'function_call': None, 'tool_calls': []}, 'seed': 17340032880891308000}], 'created':
1757541319, 'model': 'meta-llama/Llama-3.3-70B-Instruct-Turbo', 'object': 'chat.completion', 'service_tier': None, 'system_fingerprint':
None, 'usage': {'completion_tokens': 124, 'prompt_tokens': 499, 'total_tokens': 623, 'completion_tokens_details': No...
INFO 2025-09-10 14:55:21,611 uvicorn.access:473 uncategorized: ::1:57884 - "POST /v1/openai/v1/chat/completions HTTP/1.1" 200
INFO 2025-09-10 14:55:21,631 console_span_processor:39 telemetry: 21:55:21.612 [END] InferenceRouter.openai_chat_completion [StatusCode.OK]
(2297.16ms)
INFO 2025-09-10 14:55:21,632 console_span_processor:48 telemetry: output: {'id': 'oAiufav-4YNCb4-97d22b3f6cb27af2', 'choices':
[{'finish_reason': 'stop', 'index': 0, 'logprobs': None, 'message': {'content': 'Thought: To answer the question "Can I return a product
after 40 days?", I need to search the vector store to find relevant information about the return policy. I will use the Llama Stack Vector
Store RAG tool to search the provided vector store ID.\n\nAction: Llama Stack Vector Store RAG tool\nAction Input: {"query": "return policy
after 40 days", "vector_store_id": "vs_dab05212-db05-402c-91ef-57e41797406b", "top_k": 1, "score_threshold": 0.5}', 'refusal': None, 'role':
'assistant', 'annotations': None, 'audio': None, 'function_call': None, 'tool_calls': None}, 'seed': 17340032880891308000}], 'created':
1757541319, 'model': 'meta-llama/Llama-3.3-70B-Instruct-Turbo', 'object': 'chat.completion', 'service_tier': None, 'system_fingerprint':
None, 'usage': {'completion_tokens': 124, 'prompt_tokens': 499, 'total_tokens': 623, 'completion_tokens_details': ...
INFO 2025-09-10 14:55:21,636 console_span_processor:62 telemetry: 21:55:21.611 [INFO] metric.prompt_tokens
INFO 2025-09-10 14:55:21,637 console_span_processor:67 telemetry: value: 499
INFO 2025-09-10 14:55:21,638 console_span_processor:67 telemetry: unit: tokens
INFO 2025-09-10 14:55:21,638 console_span_processor:67 telemetry: model_id: together/meta-llama/Llama-3.3-70B-Instruct-Turbo
INFO 2025-09-10 14:55:21,639 console_span_processor:67 telemetry: provider_id: together
INFO 2025-09-10 14:55:21,639 console_span_processor:62 telemetry: 21:55:21.611 [INFO] metric.completion_tokens
INFO 2025-09-10 14:55:21,639 console_span_processor:67 telemetry: value: 124
INFO 2025-09-10 14:55:21,640 console_span_processor:67 telemetry: unit: tokens
INFO 2025-09-10 14:55:21,640 console_span_processor:67 telemetry: model_id: together/meta-llama/Llama-3.3-70B-Instruct-Turbo
INFO 2025-09-10 14:55:21,641 console_span_processor:67 telemetry: provider_id: together
INFO 2025-09-10 14:55:21,641 console_span_processor:62 telemetry: 21:55:21.611 [INFO] metric.total_tokens
INFO 2025-09-10 14:55:21,641 console_span_processor:67 telemetry: value: 623
INFO 2025-09-10 14:55:21,642 console_span_processor:67 telemetry: unit: tokens
INFO 2025-09-10 14:55:21,642 console_span_processor:67 telemetry: model_id: together/meta-llama/Llama-3.3-70B-Instruct-Turbo
INFO 2025-09-10 14:55:21,642 console_span_processor:67 telemetry: provider_id: together
INFO 2025-09-10 14:55:21,648 console_span_processor:39 telemetry: 21:55:21.643 [END] /v1/openai/v1/chat/completions [StatusCode.OK] (2329.06ms)
INFO 2025-09-10 14:55:21,649 console_span_processor:48 telemetry: raw_path: /v1/openai/v1/chat/completions
INFO 2025-09-10 14:55:21,650 console_span_processor:62 telemetry: 21:55:21.612 [INFO] ::1:57884 - "POST /v1/openai/v1/chat/completions HTTP/1.1"
200
INFO 2025-09-10 14:55:21,651 console_span_processor:28 telemetry: 21:55:21.651 [START] /v1/openai/v1/vector_stores/{vector_store_id}/search
INFO 2025-09-10 14:55:21,674 console_span_processor:39 telemetry: 21:55:21.654 [END] ModelsRoutingTable.get_model [StatusCode.OK] (0.21ms)
INFO 2025-09-10 14:55:21,675 console_span_processor:48 telemetry: output: {'identifier': 'sentence-transformers/all-MiniLM-L6-v2',
'provider_resource_id': 'all-MiniLM-L6-v2', 'provider_id': 'sentence-transformers', 'type': 'model', 'owner': None, 'source':
'listed_from_provider', 'metadata': {'embedding_dimension': 384}, 'model_type': 'embedding'}
INFO 2025-09-10 14:55:21,685 console_span_processor:39 telemetry: 21:55:21.678 [END] ModelsRoutingTable.get_provider_impl [StatusCode.OK] (0.70ms)
INFO 2025-09-10 14:55:21,687 console_span_processor:48 telemetry: output:
<llama_stack.providers.inline.inference.sentence_transformers.sentence_transformers.SentenceTransformersInferenceImpl object at 0x158e83350>
INFO 2025-09-10 14:55:21,692 console_span_processor:39 telemetry: 21:55:21.689 [END] ModelsRoutingTable.get_model [StatusCode.OK] (0.53ms)
INFO 2025-09-10 14:55:21,692 console_span_processor:48 telemetry: output: {'identifier': 'sentence-transformers/all-MiniLM-L6-v2',
'provider_resource_id': 'all-MiniLM-L6-v2', 'provider_id': 'sentence-transformers', 'type': 'model', 'owner': None, 'source':
'listed_from_provider', 'metadata': {'embedding_dimension': 384}, 'model_type': 'embedding'}
INFO 2025-09-10 14:55:22,019 uvicorn.access:473 uncategorized: 127.0.0.1:57888 - "POST
/v1/openai/v1/vector_stores/vs_dab05212-db05-402c-91ef-57e41797406b/search HTTP/1.1" 200
INFO 2025-09-10 14:55:22,024 console_span_processor:39 telemetry: 21:55:22.017 [END] InferenceRouter.openai_embeddings [StatusCode.OK] (363.31ms)
INFO 2025-09-10 14:55:22,025 console_span_processor:48 telemetry: output: {'object': 'list', 'data': [{'object': 'embedding', 'embedding':
[-0.0018892501248046756, 0.030758941546082497, 0.10938595235347748, 0.04589828848838806, 0.0006913804681971669, 0.014387426897883415,
-0.015357869677245617, -0.011600838042795658, -0.08975677192211151, 0.053308334201574326, 0.0744965448975563, 0.01633235439658165,
0.010754235088825226, 0.004617820493876934, 0.009704680182039738, -0.03412426635622978, -0.04056152328848839, -0.019626466557383537,
-0.08569952845573425, -0.043116409331560135, 0.025109080597758293, -0.03337268903851509, -0.06306783854961395, 0.021730247884988785,
0.01859521120786667, 0.0934692993760109, -0.02332254685461521, 0.03396535664796829, -0.04177931323647499, -0.011372999288141727,
0.015714162960648537, -0.04297734424471855, -0.06080453842878342, -0.05970568209886551, -0.013541588559746742, 0.04719769209623337,
-0.1263798028230667, -0.09081613272428513, -0.044160086661577225, 0.010452632792294025, -0.04007401689887047, 0.029781267046928406,
-0.03511...
INFO 2025-09-10 14:55:22,031 console_span_processor:39 telemetry: 21:55:22.027 [END] FaissVectorIOAdapter.query_chunks [StatusCode.OK] (373.68ms)
INFO 2025-09-10 14:55:22,032 console_span_processor:48 telemetry: output: {'chunks': [{'content': 'Returns are accepted within 30 days of
purchase.', 'metadata': {'document_id': 'file-b2f38b0e164347f5a2b6bbe211e33ff3', 'token_count': 10, 'metadata_token_count': 1}, 'embedding':
[-0.050018310546875, 0.0007208543829619884, 0.048539839684963226, 0.013606906868517399, -0.006504438817501068, 0.004046895541250706,
-0.04984626919031143, -8.024782437132671e-05, -0.02159256860613823, 0.0015519573353230953, 0.10069309175014496, 0.04437215253710747,
-0.022335151210427284, -0.05230937898159027, -0.028983373194932938, -0.049531035125255585, 0.03074926696717739, -0.03056054376065731,
0.021489247679710388, 0.016868554055690765, -0.028984908014535904, -0.07053273916244507, -0.022961033508181572, -0.0717858299612999,
0.0674479678273201, 0.021412895992398262, -0.06054700165987015, 0.021910998970270157, -0.023192649707198143, -0.028992125764489174,
0.025179730728268623, -0.006338999141007662, -0.001874048844911158, 0.009305929765105247, 0.011422501876950264, 0.0376049801707...
INFO 2025-09-10 14:55:22,057 console_span_processor:39 telemetry: 21:55:22.037 [END] VectorDBsRoutingTable.openai_search_vector_store
[StatusCode.OK] (384.28ms)
INFO 2025-09-10 14:55:22,058 console_span_processor:48 telemetry: output: {'object': 'vector_store.search_results.page', 'search_query':
'return policy after 40 days', 'data': [{'file_id': '', 'filename': '', 'score': 1.3987585167097674, 'attributes': {'document_id':
'file-b2f38b0e164347f5a2b6bbe211e33ff3', 'token_count': 10.0, 'metadata_token_count': 1.0}, 'content': [{'type': 'text', 'text': 'Returns are
accepted within 30 days of purchase.'}]}], 'has_more': False, 'next_page': None}
INFO 2025-09-10 14:55:22,063 console_span_processor:39 telemetry: 21:55:22.060 [END] VectorIORouter.openai_search_vector_store [StatusCode.OK]
(407.47ms)
INFO 2025-09-10 14:55:22,064 console_span_processor:48 telemetry: output: {'object': 'vector_store.search_results.page', 'search_query':
'return policy after 40 days', 'data': [{'file_id': '', 'filename': '', 'score': 1.3987585167097674, 'attributes': {'document_id':
'file-b2f38b0e164347f5a2b6bbe211e33ff3', 'token_count': 10.0, 'metadata_token_count': 1.0}, 'content': [{'type': 'text', 'text': 'Returns are
accepted within 30 days of purchase.'}]}], 'has_more': False, 'next_page': None}
INFO 2025-09-10 14:55:22,175 console_span_processor:39 telemetry: 21:55:22.096 [END] /v1/openai/v1/vector_stores/{vector_store_id}/search
[StatusCode.OK] (444.58ms)
INFO 2025-09-10 14:55:22,176 console_span_processor:48 telemetry: raw_path:
/v1/openai/v1/vector_stores/vs_dab05212-db05-402c-91ef-57e41797406b/search
INFO 2025-09-10 14:55:22,178 console_span_processor:62 telemetry: 21:55:22.021 [INFO] 127.0.0.1:57888 - "POST
/v1/openai/v1/vector_stores/vs_dab05212-db05-402c-91ef-57e41797406b/search HTTP/1.1" 200
INFO 2025-09-10 14:55:22,186 console_span_processor:28 telemetry: 21:55:22.186 [START] /v1/openai/v1/chat/completions
INFO 2025-09-10 14:55:22,195 console_span_processor:39 telemetry: 21:55:22.188 [END] ModelsRoutingTable.get_model [StatusCode.OK] (0.30ms)
INFO 2025-09-10 14:55:22,196 console_span_processor:48 telemetry: output: {'identifier': 'together/meta-llama/Llama-3.3-70B-Instruct-Turbo',
'provider_resource_id': 'meta-llama/Llama-3.3-70B-Instruct-Turbo', 'provider_id': 'together', 'type': 'model', 'owner': None, 'source':
'listed_from_provider', 'metadata': {}, 'model_type': 'llm'}
INFO 2025-09-10 14:55:22,218 console_span_processor:39 telemetry: 21:55:22.197 [END] ModelsRoutingTable.get_provider_impl [StatusCode.OK] (0.20ms)
INFO 2025-09-10 14:55:22,220 console_span_processor:48 telemetry: output:
<llama_stack.providers.remote.inference.together.together.TogetherInferenceAdapter object at 0x137069220>
INFO 2025-09-10 14:55:22,227 console_span_processor:39 telemetry: 21:55:22.224 [END] ModelsRoutingTable.get_model [StatusCode.OK] (0.19ms)
INFO 2025-09-10 14:55:22,228 console_span_processor:48 telemetry: output: {'identifier': 'together/meta-llama/Llama-3.3-70B-Instruct-Turbo',
'provider_resource_id': 'meta-llama/Llama-3.3-70B-Instruct-Turbo', 'provider_id': 'together', 'type': 'model', 'owner': None, 'source':
'listed_from_provider', 'metadata': {}, 'model_type': 'llm'}
INFO 2025-09-10 14:55:22,805 console_span_processor:39 telemetry: 21:55:22.801 [END] TogetherInferenceAdapter.openai_chat_completion
[StatusCode.OK] (577.41ms)
INFO 2025-09-10 14:55:22,806 console_span_processor:48 telemetry: output: {'id': 'oAiugR1-62bZhn-97d22b51096017f0', 'choices':
[{'finish_reason': 'stop', 'index': 0, 'logprobs': None, 'message': {'content': 'Thought: I now know the final answer\nFinal Answer: Returns
are accepted within 30 days of purchase.', 'refusal': None, 'role': 'assistant', 'annotations': None, 'audio': None, 'function_call': None,
'tool_calls': []}, 'seed': 2982499907717596700}], 'created': 1757541322, 'model': 'meta-llama/Llama-3.3-70B-Instruct-Turbo', 'object':
'chat.completion', 'service_tier': None, 'system_fingerprint': None, 'usage': {'completion_tokens': 23, 'prompt_tokens': 643, 'total_tokens':
666, 'completion_tokens_details': None, 'prompt_tokens_details': None, 'cached_tokens': 256}, 'prompt': []}
INFO 2025-09-10 14:55:22,834 uvicorn.access:473 uncategorized: ::1:57884 - "POST /v1/openai/v1/chat/completions HTTP/1.1" 200
INFO 2025-09-10 14:55:22,873 console_span_processor:39 telemetry: 21:55:22.836 [END] InferenceRouter.openai_chat_completion [StatusCode.OK]
(648.69ms)
INFO 2025-09-10 14:55:22,874 console_span_processor:48 telemetry: output: {'id': 'oAiugR1-62bZhn-97d22b51096017f0', 'choices':
[{'finish_reason': 'stop', 'index': 0, 'logprobs': None, 'message': {'content': 'Thought: I now know the final answer\nFinal Answer: Returns
are accepted within 30 days of purchase.', 'refusal': None, 'role': 'assistant', 'annotations': None, 'audio': None, 'function_call': None,
'tool_calls': None}, 'seed': 2982499907717596700}], 'created': 1757541322, 'model': 'meta-llama/Llama-3.3-70B-Instruct-Turbo', 'object':
'chat.completion', 'service_tier': None, 'system_fingerprint': None, 'usage': {'completion_tokens': 23, 'prompt_tokens': 643, 'total_tokens':
666, 'completion_tokens_details': None, 'prompt_tokens_details': None, 'cached_tokens': 256}, 'prompt': [], 'metrics': [{'trace_id':
'd588c782bd804c0cb49e43ac8c028e7a', 'span_id': '396bc114a416fc6c', 'timestamp': '2025-09-10T21:55:22.832220Z', 'attributes': {'model_id':
'together/meta-llama/Llama-3.3-70B-Instruct-Turbo', 'provider_id': 'together'}, 'type': 'metric', 'metric': 'prom...
INFO 2025-09-10 14:55:22,876 console_span_processor:62 telemetry: 21:55:22.832 [INFO] metric.prompt_tokens
INFO 2025-09-10 14:55:22,877 console_span_processor:67 telemetry: value: 643
INFO 2025-09-10 14:55:22,878 console_span_processor:67 telemetry: unit: tokens
INFO 2025-09-10 14:55:22,878 console_span_processor:67 telemetry: model_id: together/meta-llama/Llama-3.3-70B-Instruct-Turbo
INFO 2025-09-10 14:55:22,879 console_span_processor:67 telemetry: provider_id: together
INFO 2025-09-10 14:55:22,879 console_span_processor:62 telemetry: 21:55:22.832 [INFO] metric.completion_tokens
INFO 2025-09-10 14:55:22,880 console_span_processor:67 telemetry: value: 23
INFO 2025-09-10 14:55:22,881 console_span_processor:67 telemetry: unit: tokens
INFO 2025-09-10 14:55:22,881 console_span_processor:67 telemetry: model_id: together/meta-llama/Llama-3.3-70B-Instruct-Turbo
INFO 2025-09-10 14:55:22,882 console_span_processor:67 telemetry: provider_id: together
INFO 2025-09-10 14:55:22,882 console_span_processor:62 telemetry: 21:55:22.832 [INFO] metric.total_tokens
INFO 2025-09-10 14:55:22,883 console_span_processor:67 telemetry: value: 666
INFO 2025-09-10 14:55:22,886 console_span_processor:67 telemetry: unit: tokens
INFO 2025-09-10 14:55:22,887 console_span_processor:67 telemetry: model_id: together/meta-llama/Llama-3.3-70B-Instruct-Turbo
INFO 2025-09-10 14:55:22,888 console_span_processor:67 telemetry: provider_id: together
INFO 2025-09-10 14:55:22,913 console_span_processor:39 telemetry: 21:55:22.891 [END] /v1/openai/v1/chat/completions [StatusCode.OK] (704.86ms)
INFO 2025-09-10 14:55:22,915 console_span_processor:48 telemetry: raw_path: /v1/openai/v1/chat/completions
INFO 2025-09-10 14:55:22,915 console_span_processor:62 telemetry: 21:55:22.835 [INFO] ::1:57884 - "POST /v1/openai/v1/chat/completions HTTP/1.1"
200
INFO 2025-09-10 14:57:34,753 uvicorn.error:264 uncategorized: Shutting down
INFO 2025-09-10 14:57:34,867 uvicorn.error:67 uncategorized: Waiting for application shutdown.
INFO 2025-09-10 14:57:34,868 __main__:170 core::server: Shutting down
INFO 2025-09-10 14:57:34,868 llama_stack.core.stack:357 core: Shutting down ModelsRoutingTable
INFO 2025-09-10 14:57:34,869 llama_stack.core.stack:357 core: Shutting down DatasetsRoutingTable
INFO 2025-09-10 14:57:34,870 llama_stack.core.stack:357 core: Shutting down DatasetIORouter
INFO 2025-09-10 14:57:34,870 llama_stack.core.stack:357 core: Shutting down TelemetryAdapter
INFO 2025-09-10 14:57:34,871 llama_stack.core.stack:357 core: Shutting down InferenceRouter
INFO 2025-09-10 14:57:34,874 llama_stack.core.stack:357 core: Shutting down LocalfsFilesImpl
INFO 2025-09-10 14:57:34,875 llama_stack.core.stack:357 core: Shutting down ShieldsRoutingTable
INFO 2025-09-10 14:57:34,876 llama_stack.core.stack:357 core: Shutting down SafetyRouter
INFO 2025-09-10 14:57:34,877 llama_stack.core.stack:357 core: Shutting down VectorDBsRoutingTable
INFO 2025-09-10 14:57:34,877 llama_stack.core.stack:357 core: Shutting down VectorIORouter
INFO 2025-09-10 14:57:34,878 llama_stack.core.stack:357 core: Shutting down ToolGroupsRoutingTable
INFO 2025-09-10 14:57:34,878 llama_stack.core.stack:357 core: Shutting down ToolRuntimeRouter
INFO 2025-09-10 14:57:34,879 llama_stack.core.stack:357 core: Shutting down MetaReferenceAgentsImpl
INFO 2025-09-10 14:57:34,879 llama_stack.core.stack:357 core: Shutting down TorchtunePostTrainingImpl
INFO 2025-09-10 14:57:34,881 llama_stack.core.stack:357 core: Shutting down ScoringFunctionsRoutingTable
INFO 2025-09-10 14:57:34,882 llama_stack.core.stack:357 core: Shutting down ScoringRouter
INFO 2025-09-10 14:57:34,882 llama_stack.core.stack:357 core: Shutting down ReferenceBatchesImpl
INFO 2025-09-10 14:57:34,883 llama_stack.core.stack:357 core: Shutting down BenchmarksRoutingTable
INFO 2025-09-10 14:57:34,884 llama_stack.core.stack:357 core: Shutting down EvalRouter
INFO 2025-09-10 14:57:34,884 llama_stack.core.stack:357 core: Shutting down DistributionInspectImpl
INFO 2025-09-10 14:57:34,885 llama_stack.core.stack:357 core: Shutting down ProviderImpl
INFO 2025-09-10 14:57:34,886 uvicorn.error:76 uncategorized: Application shutdown complete.
INFO 2025-09-10 14:57:34,887 uvicorn.error:94 uncategorized: Finished server process [26795]
/Users/kaiwu/miniconda3/lib/python3.12/multiprocessing/resource_tracker.py:255: UserWarning: resource_tracker: There appear to be 1 leaked semaphore objects to clean up at shutdown
warnings.warn('resource_tracker: There appear to be %d '