From faf891b40c6236821ba9730e11d985582aad4b9a Mon Sep 17 00:00:00 2001
From: IAN MILLER <75687988+r3v5@users.noreply.github.com>
Date: Tue, 2 Sep 2025 18:38:35 +0100
Subject: [PATCH 01/76] refactor: use generic WeightedInMemoryAggregator for
 hybrid search in SQLiteVecIndex (#3303)

# What does this PR do?
<!-- Provide a short summary of what this PR does and why. Link to
relevant issues if applicable. -->
The purpose of this PR is to refactor `SQLiteVecIndex` to eliminate
redundant code and simplify the code using generic
`WeightedInMemoryAggregator` that can be used for any vector db
provider. This pattern is already implemented for `PGVectorIndex` in
#3064

CC: @franciscojavierarceo

<!-- If resolving an issue, uncomment and update the line below -->
<!-- Closes #[issue-number] -->

## Test Plan
<!-- Describe the tests you ran to verify your changes with result
summaries. *Provide clear instructions so the plan can be easily
re-executed.* -->
1. `./scripts/unit-tests.sh`
2. Integration tests in CI Workflow
---
 .../inline/vector_io/sqlite_vec/sqlite_vec.py | 67 ++-----------------
 1 file changed, 5 insertions(+), 62 deletions(-)

diff --git a/llama_stack/providers/inline/vector_io/sqlite_vec/sqlite_vec.py b/llama_stack/providers/inline/vector_io/sqlite_vec/sqlite_vec.py
index 7cf163960..f34f8f6fb 100644
--- a/llama_stack/providers/inline/vector_io/sqlite_vec/sqlite_vec.py
+++ b/llama_stack/providers/inline/vector_io/sqlite_vec/sqlite_vec.py
@@ -30,11 +30,11 @@ from llama_stack.providers.utils.kvstore.api import KVStore
 from llama_stack.providers.utils.memory.openai_vector_store_mixin import OpenAIVectorStoreMixin
 from llama_stack.providers.utils.memory.vector_store import (
     RERANKER_TYPE_RRF,
-    RERANKER_TYPE_WEIGHTED,
     ChunkForDeletion,
     EmbeddingIndex,
     VectorDBWithIndex,
 )
+from llama_stack.providers.utils.vector_io.vector_utils import WeightedInMemoryAggregator
 
 logger = get_logger(name=__name__, category="vector_io")
 
@@ -66,59 +66,6 @@ def _create_sqlite_connection(db_path):
     return connection
 
 
-def _normalize_scores(scores: dict[str, float]) -> dict[str, float]:
-    """Normalize scores to [0,1] range using min-max normalization."""
-    if not scores:
-        return {}
-    min_score = min(scores.values())
-    max_score = max(scores.values())
-    score_range = max_score - min_score
-    if score_range > 0:
-        return {doc_id: (score - min_score) / score_range for doc_id, score in scores.items()}
-    return dict.fromkeys(scores, 1.0)
-
-
-def _weighted_rerank(
-    vector_scores: dict[str, float],
-    keyword_scores: dict[str, float],
-    alpha: float = 0.5,
-) -> dict[str, float]:
-    """ReRanker that uses weighted average of scores."""
-    all_ids = set(vector_scores.keys()) | set(keyword_scores.keys())
-    normalized_vector_scores = _normalize_scores(vector_scores)
-    normalized_keyword_scores = _normalize_scores(keyword_scores)
-
-    return {
-        doc_id: (alpha * normalized_keyword_scores.get(doc_id, 0.0))
-        + ((1 - alpha) * normalized_vector_scores.get(doc_id, 0.0))
-        for doc_id in all_ids
-    }
-
-
-def _rrf_rerank(
-    vector_scores: dict[str, float],
-    keyword_scores: dict[str, float],
-    impact_factor: float = 60.0,
-) -> dict[str, float]:
-    """ReRanker that uses Reciprocal Rank Fusion."""
-    # Convert scores to ranks
-    vector_ranks = {
-        doc_id: i + 1 for i, (doc_id, _) in enumerate(sorted(vector_scores.items(), key=lambda x: x[1], reverse=True))
-    }
-    keyword_ranks = {
-        doc_id: i + 1 for i, (doc_id, _) in enumerate(sorted(keyword_scores.items(), key=lambda x: x[1], reverse=True))
-    }
-
-    all_ids = set(vector_scores.keys()) | set(keyword_scores.keys())
-    rrf_scores = {}
-    for doc_id in all_ids:
-        vector_rank = vector_ranks.get(doc_id, float("inf"))
-        keyword_rank = keyword_ranks.get(doc_id, float("inf"))
-        # RRF formula: score = 1/(k + r) where k is impact_factor and r is the rank
-        rrf_scores[doc_id] = (1.0 / (impact_factor + vector_rank)) + (1.0 / (impact_factor + keyword_rank))
-    return rrf_scores
-
-
 def _make_sql_identifier(name: str) -> str:
     return re.sub(r"[^a-zA-Z0-9_]", "_", name)
 
@@ -398,14 +345,10 @@ class SQLiteVecIndex(EmbeddingIndex):
             for chunk, score in zip(keyword_response.chunks, keyword_response.scores, strict=False)
         }
 
-        # Combine scores using the specified reranker
-        if reranker_type == RERANKER_TYPE_WEIGHTED:
-            alpha = reranker_params.get("alpha", 0.5)
-            combined_scores = _weighted_rerank(vector_scores, keyword_scores, alpha)
-        else:
-            # Default to RRF for None, RRF, or any unknown types
-            impact_factor = reranker_params.get("impact_factor", 60.0)
-            combined_scores = _rrf_rerank(vector_scores, keyword_scores, impact_factor)
+        # Combine scores using the reranking utility
+        combined_scores = WeightedInMemoryAggregator.combine_search_results(
+            vector_scores, keyword_scores, reranker_type, reranker_params
+        )
 
         # Sort by combined score and get top k results
         sorted_items = sorted(combined_scores.items(), key=lambda x: x[1], reverse=True)

From c59d8c504742d0457b215ae4b6cfc60a67b67595 Mon Sep 17 00:00:00 2001
From: Varsha <varshaprasad96@gmail.com>
Date: Wed, 3 Sep 2025 00:59:16 -0700
Subject: [PATCH 02/76] fix: Fix mock vector DB schema in Qdrant tests (#3295)

# What does this PR do?
Fix: https://github.com/llamastack/llama-stack/issues/3293
<!-- If resolving an issue, uncomment and update the line below -->
<!-- Closes #[issue-number] -->

## Test Plan
<!-- Describe the tests you ran to verify your changes with result
summaries. *Provide clear instructions so the plan can be easily
re-executed.* -->
```
===================================================== test session starts =====================================================
platform darwin -- Python 3.12.11, pytest-7.4.4, pluggy-1.5.0 -- /Users/vnarsing/miniconda3/envs/stack-client/bin/python
cachedir: .pytest_cache
metadata: {'Python': '3.12.11', 'Platform': 'macOS-14.7.7-arm64-arm-64bit', 'Packages': {'pytest': '7.4.4', 'pluggy': '1.5.0'}, 'Plugins': {'asyncio': '0.23.8', 'cov': '6.0.0', 'timeout': '2.2.0', 'socket': '0.7.0', 'xdist': '3.8.0', 'html': '3.1.1', 'langsmith': '0.3.39', 'anyio': '4.8.0', 'metadata': '3.0.0'}}
rootdir: /Users/vnarsing/go/src/github/meta-llama/llama-stack
configfile: pyproject.toml
plugins: asyncio-0.23.8, cov-6.0.0, timeout-2.2.0, socket-0.7.0, xdist-3.8.0, html-3.1.1, langsmith-0.3.39, anyio-4.8.0, metadata-3.0.0
asyncio: mode=Mode.AUTO
collected 3 items

tests/unit/providers/vector_io/test_qdrant.py::test_qdrant_adapter_returns_expected_chunks[2-2] PASSED                  [ 33%]
tests/unit/providers/vector_io/test_qdrant.py::test_qdrant_adapter_returns_expected_chunks[100-60] PASSED               [ 66%]
tests/unit/providers/vector_io/test_qdrant.py::test_qdrant_register_and_unregister_vector_db PASSED                     [100%]
```

Co-authored-by: Francisco Arceo <arceofrancisco@gmail.com>
---
 tests/unit/providers/vector_io/test_qdrant.py | 4 +++-
 1 file changed, 3 insertions(+), 1 deletion(-)

diff --git a/tests/unit/providers/vector_io/test_qdrant.py b/tests/unit/providers/vector_io/test_qdrant.py
index d7900dbfd..aab5b6f45 100644
--- a/tests/unit/providers/vector_io/test_qdrant.py
+++ b/tests/unit/providers/vector_io/test_qdrant.py
@@ -54,7 +54,9 @@ def mock_vector_db(vector_db_id) -> MagicMock:
     mock_vector_db.identifier = vector_db_id
     mock_vector_db.embedding_dimension = 384
     mock_vector_db.model_dump_json.return_value = (
-        '{"identifier": "' + vector_db_id + '", "embedding_model": "embedding_model", "embedding_dimension": 384}'
+        '{"identifier": "'
+        + vector_db_id
+        + '", "provider_id": "qdrant", "embedding_model": "embedding_model", "embedding_dimension": 384}'
     )
     return mock_vector_db
 

From ccaf6aaa511a544948a6cf8a99e13ca200852c40 Mon Sep 17 00:00:00 2001
From: Cesare Pompeiano <cesare.pompeiano@gmail.com>
Date: Wed, 3 Sep 2025 11:33:35 +0200
Subject: [PATCH 03/76] chore(python-deps): replace ibm_watson_machine_learning
 with ibm_watsonx_ai (#3302)

# What does this PR do?

This PR updates the Watsonx provider dependencies from
`ibm_watson_machine_learning` to `ibm_watsonx_ai`.

The old package `ibm_watson_machine_learning` is in **deprecation mode**
([[PyPI
link](https://pypi.org/project/ibm-watson-machine-learning/)](https://pypi.org/project/ibm-watson-machine-learning/))
and relies on older versions of dependencies such as `pandas`. Updating
to `ibm_watsonx_ai` ensures compatibility with current dependency
versions and ongoing support.

## Test Plan

I verified the update by running an inference using a model provided by
Watsonx. The model ran successfully, confirming that the new dependency
works as expected.

Co-authored-by: are-ces <cpompeia@redhat.com>
---
 llama_stack/providers/registry/inference.py               | 2 +-
 llama_stack/providers/remote/inference/watsonx/watsonx.py | 4 ++--
 2 files changed, 3 insertions(+), 3 deletions(-)

diff --git a/llama_stack/providers/registry/inference.py b/llama_stack/providers/registry/inference.py
index 6264de7c7..fb841afdf 100644
--- a/llama_stack/providers/registry/inference.py
+++ b/llama_stack/providers/registry/inference.py
@@ -292,7 +292,7 @@ Available Models:
             api=Api.inference,
             adapter=AdapterSpec(
                 adapter_type="watsonx",
-                pip_packages=["ibm_watson_machine_learning"],
+                pip_packages=["ibm_watsonx_ai"],
                 module="llama_stack.providers.remote.inference.watsonx",
                 config_class="llama_stack.providers.remote.inference.watsonx.WatsonXConfig",
                 provider_data_validator="llama_stack.providers.remote.inference.watsonx.WatsonXProviderDataValidator",
diff --git a/llama_stack/providers/remote/inference/watsonx/watsonx.py b/llama_stack/providers/remote/inference/watsonx/watsonx.py
index 78161d1cb..cb7fc175f 100644
--- a/llama_stack/providers/remote/inference/watsonx/watsonx.py
+++ b/llama_stack/providers/remote/inference/watsonx/watsonx.py
@@ -7,8 +7,8 @@
 from collections.abc import AsyncGenerator, AsyncIterator
 from typing import Any
 
-from ibm_watson_machine_learning.foundation_models import Model
-from ibm_watson_machine_learning.metanames import GenTextParamsMetaNames as GenParams
+from ibm_watsonx_ai.foundation_models import Model
+from ibm_watsonx_ai.metanames import GenTextParamsMetaNames as GenParams
 from openai import AsyncOpenAI
 
 from llama_stack.apis.common.content_types import InterleavedContent, InterleavedContentItem

From d948e63340b37d1dd5f13fa2bb2e380db0f337ec Mon Sep 17 00:00:00 2001
From: ehhuang <ehhuang@users.noreply.github.com>
Date: Wed, 3 Sep 2025 07:11:59 -0700
Subject: [PATCH 04/76] chore: Improve error message for missing provider
 dependencies (#3315)

Generated with CC:

Replace cryptic KeyError with clear, actionable error message that
shows:
- Which API the failing provider belongs to
- The provider ID and type that's failing
- Which dependency is missing
- Clear instructions on how to fix the issue


## Test plan
Use a run config with Agents API and no safety provider

Before: KeyError: <Api.safety: 'safety'>
After: Failed to resolve 'agents' provider 'meta-reference' of type
'inline::meta-reference': required dependency 'safety' is not available.
Please add a 'safety' provider to your configuration or check if the
provider is properly configured.
---
 llama_stack/core/resolver.py | 10 +++++++++-
 1 file changed, 9 insertions(+), 1 deletion(-)

diff --git a/llama_stack/core/resolver.py b/llama_stack/core/resolver.py
index 7ac98dac8..a8ad03e1a 100644
--- a/llama_stack/core/resolver.py
+++ b/llama_stack/core/resolver.py
@@ -284,7 +284,15 @@ async def instantiate_providers(
         if provider.provider_id is None:
             continue
 
-        deps = {a: impls[a] for a in provider.spec.api_dependencies}
+        try:
+            deps = {a: impls[a] for a in provider.spec.api_dependencies}
+        except KeyError as e:
+            missing_api = e.args[0]
+            raise RuntimeError(
+                f"Failed to resolve '{provider.spec.api.value}' provider '{provider.provider_id}' of type '{provider.spec.provider_type}': "
+                f"required dependency '{missing_api.value}' is not available. "
+                f"Please add a '{missing_api.value}' provider to your configuration or check if the provider is properly configured."
+            ) from e
         for a in provider.spec.optional_api_dependencies:
             if a in impls:
                 deps[a] = impls[a]

From c3d3a0b83333a720886c4a846e41ed3ad2766e00 Mon Sep 17 00:00:00 2001
From: Ashwin Bharambe <ashwin.bharambe@gmail.com>
Date: Wed, 3 Sep 2025 11:33:03 -0700
Subject: [PATCH 05/76] feat(tests): auto-merge all model list responses and
 unify recordings (#3320)

One needed to specify record-replay related environment variables for
running integration tests. We could not use defaults because integration
tests could be run against Ollama instances which could be running
different models. For example, text vs vision tests needed separate
instances of Ollama because a single instance typically cannot serve
both of these models if you assume the standard CI worker configuration
on Github. As a result, `client.list()` as returned by the Ollama client
would be different between these runs and we'd end up overwriting
responses.

This PR "solves" it by adding a small amount of complexity -- we store
model list responses specially, keyed by the hashes of the models they
return. At replay time, we merge all of them and pretend that we have
the union of all models available.

## Test Plan

Re-recorded all the tests using `scripts/integration-tests.sh
--inference-mode record`, including the vision tests.
---
 .gitignore                                    |    2 +
 .../contributing/testing/record-replay.md     |    9 +-
 .../remote/inference/ollama/ollama.py         |    8 +-
 llama_stack/testing/inference_recorder.py     |  154 +-
 scripts/integration-tests.sh                  |   14 +-
 tests/README.md                               |   12 -
 tests/integration/README.md                   |   19 +-
 .../recordings/responses/00ba04f74a96.json    |   10 +-
 .../recordings/responses/04172112ffbb.json    |   44 +-
 .../recordings/responses/0b27fd737699.json    |   10 +-
 .../recordings/responses/0b3f2e4754ff.json    |   32 +-
 .../recordings/responses/0e8f2b001dd9.json    |   12 +-
 .../recordings/responses/10eea8c15ddc.json    |   10 +-
 .../recordings/responses/140187e305dc.json    |   12 +-
 .../recordings/responses/17253d7cc667.json    |   10 +-
 .../recordings/responses/173ecb3aab28.json    |   32 +-
 .../recordings/responses/174458ad71b2.json    |   10 +-
 .../recordings/responses/178016edef0e.json    |   10 +-
 .../recordings/responses/197228e26971.json    |   10 +-
 .../recordings/responses/198ef7208389.json    |   10 +-
 .../recordings/responses/1adfaa0e062e.json    |   10 +-
 .../recordings/responses/1b8394f90636.json    |   10 +-
 .../recordings/responses/1b92be674e2a.json    |   10 +-
 .../recordings/responses/1e11c2b20ff8.json    |  768 +-
 .../recordings/responses/211b1562d4e6.json    |   10 +-
 .../recordings/responses/23506e73bb9e.json    |  768 +-
 .../recordings/responses/2afe3b38ca01.json    |   34 +-
 .../recordings/responses/2d187a11704c.json    |  208 +-
 .../recordings/responses/325a72db5755.json    |  758 +-
 .../recordings/responses/382c2f22274c.json    |    8 +-
 .../recordings/responses/3c0bf9ba81b2.json    |    6 +-
 .../recordings/responses/3c3f13cb7794.json    |   30 +-
 .../recordings/responses/3ca695048bee.json    |   14 +-
 .../recordings/responses/3dff18060ebc.json    |  768 +-
 .../recordings/responses/417020320684.json    |  768 +-
 .../recordings/responses/4420515208a8.json    |  768 +-
 .../recordings/responses/44a1d9de0602.json    |    4 +-
 .../recordings/responses/44fb9cf5875f.json    |   10 +-
 .../recordings/responses/48d2fb183a2a.json    |   10 +-
 .../recordings/responses/50340cd4d253.json    |   10 +-
 .../recordings/responses/5370751803dc.json    |  768 +-
 .../recordings/responses/545d86510a80.json    |   34 +-
 .../recordings/responses/554de3cd986f.json    |   46 +-
 .../recordings/responses/561746e1c8de.json    |   30 +-
 .../recordings/responses/563b994bb7d1.json    |   10 +-
 .../recordings/responses/5f5d16afadb4.json    |   30 +-
 .../recordings/responses/62aa454ea5f9.json    |  768 +-
 .../recordings/responses/6906a6e71988.json    |   10 +-
 .../recordings/responses/6cc063bbd7d3.json    |   48 +-
 .../recordings/responses/6d35c91287e2.json    |   34 +-
 .../recordings/responses/6f96090aa955.json    |  178 +-
 .../recordings/responses/6fbea1abca7c.json    |   46 +-
 .../recordings/responses/6fe1d4fedf12.json    | 9570 +++++++++--------
 .../recordings/responses/70adef2c30c4.json    |   10 +-
 .../recordings/responses/72c1126ff2f9.json    |  768 +-
 .../recordings/responses/7354ec181984.json    |   10 +-
 .../recordings/responses/75d0dd9d0fa3.json    |   10 +-
 .../recordings/responses/7b25b702ea18.json    |  768 +-
 .../recordings/responses/7b4815aba6c5.json    |   46 +-
 .../recordings/responses/7e6806cba34a.json    |   34 +-
 .../recordings/responses/802f60021837.json    |  768 +-
 .../recordings/responses/80e4404d8987.json    |   28 +-
 .../recordings/responses/8295382a8e7c.json    |   12 +-
 .../recordings/responses/836f51dfb3c5.json    |   10 +-
 .../recordings/responses/840fbb380b73.json    |   10 +-
 .../recordings/responses/84cab42e1f5c.json    | 1340 +--
 .../recordings/responses/85594a69d74a.json    |   10 +-
 .../recordings/responses/97d3812bfccb.json    |   10 +-
 .../recordings/responses/97e259c0d3e5.json    |   46 +-
 .../recordings/responses/9c140a29ae09.json    |   34 +-
 .../recordings/responses/9c28ec9ac338.json    |   44 +-
 .../recordings/responses/9e651e5fcfe2.json    | 3072 +++---
 .../recordings/responses/9e7a83d3d596.json    |   10 +-
 .../recordings/responses/9fadf5a3d68f.json    |   10 +-
 .../recordings/responses/a0c4df33879f.json    | 2368 ++--
 .../recordings/responses/a4c8d19bb1eb.json    |   12 +-
 .../recordings/responses/a5187d9d5057.json    |   12 +-
 .../recordings/responses/a59d0d7c1485.json    |   10 +-
 .../recordings/responses/a6810c23eda8.json    |   94 +-
 .../recordings/responses/ae1c22f18ecc.json    |   10 +-
 .../recordings/responses/ae6835cfe70e.json    |   10 +-
 .../recordings/responses/b14ff438ca99.json    |   10 +-
 .../recordings/responses/b5e3ed420986.json    |  768 +-
 .../recordings/responses/b612debbd3bf.json    |  768 +-
 .../recordings/responses/bd356b27a085.json    |   24 +-
 .../recordings/responses/c2199d6064db.json    |  768 +-
 .../recordings/responses/c9cba6f3ee38.json    |   10 +-
 .../recordings/responses/cb3df2a1dc22.json    |   12 +-
 .../recordings/responses/cd094caaf1c0.json    |  796 +-
 .../recordings/responses/d0ac68cbde69.json    |   20 +-
 .../recordings/responses/d4c86ac355fb.json    |   10 +-
 .../recordings/responses/d86d4fc1eaca.json    |  768 +-
 .../recordings/responses/dac7a32e5db9.json    |   10 +-
 .../recordings/responses/dd226d71f844.json    |   34 +-
 .../recordings/responses/dd9e7d5913e9.json    |   12 +-
 .../recordings/responses/decfd950646c.json    |   26 +-
 .../recordings/responses/e0a6dce1d94b.json    |  768 +-
 .../recordings/responses/e2c9b07709fe.json    |    8 +-
 .../recordings/responses/e96152610712.json    |   10 +-
 .../recordings/responses/e9c8a0e4f0e0.json    |   12 +-
 .../recordings/responses/ed9e9b34008d.json    |   10 +-
 .../recordings/responses/eee47930e3ae.json    |   46 +-
 .../recordings/responses/ef59cbff54d0.json    |   10 +-
 .../recordings/responses/ef757a75ed08.json    |   26 +-
 .../{vision => }/responses/f1592dee71e5.json  |   14 +-
 .../recordings/responses/f477c2fe1332.json    |   50 +-
 .../recordings/responses/f6d655e91ac3.json    |  768 +-
 .../recordings/responses/f70f30f54211.json    |    8 +-
 .../recordings/responses/fcdef245da95.json    |   10 +-
 .../{vision => }/responses/ff7db0102b28.json  |  658 +-
 .../models-4a3a4447b16b-3057338f.json         |  164 +
 .../recordings/vision/index.sqlite            |  Bin 12288 -> 0 bytes
 .../vision/responses/3877ecf1bc62.json        |   22 -
 .../vision/responses/4096743baf8e.json        |   56 -
 .../vision/responses/4a3a4447b16b.json        |   68 -
 .../vision/responses/67198cbad48f.json        |   56 -
 .../vision/responses/830a1fe14938.json        |   56 -
 .../vision/responses/9c007f300365.json        |   58 -
 .../vision/responses/c9667519ad7c.json        |   58 -
 .../vision/responses/d0ac68cbde69.json        |   19 -
 .../vision/responses/d4f56d7d1996.json        |   56 -
 .../distribution/test_inference_recordings.py |    2 +-
 122 files changed, 17460 insertions(+), 16129 deletions(-)
 rename tests/integration/recordings/{vision => }/responses/f1592dee71e5.json (99%)
 rename tests/integration/recordings/{vision => }/responses/ff7db0102b28.json (98%)
 create mode 100644 tests/integration/recordings/responses/models-4a3a4447b16b-3057338f.json
 delete mode 100644 tests/integration/recordings/vision/index.sqlite
 delete mode 100644 tests/integration/recordings/vision/responses/3877ecf1bc62.json
 delete mode 100644 tests/integration/recordings/vision/responses/4096743baf8e.json
 delete mode 100644 tests/integration/recordings/vision/responses/4a3a4447b16b.json
 delete mode 100644 tests/integration/recordings/vision/responses/67198cbad48f.json
 delete mode 100644 tests/integration/recordings/vision/responses/830a1fe14938.json
 delete mode 100644 tests/integration/recordings/vision/responses/9c007f300365.json
 delete mode 100644 tests/integration/recordings/vision/responses/c9667519ad7c.json
 delete mode 100644 tests/integration/recordings/vision/responses/d0ac68cbde69.json
 delete mode 100644 tests/integration/recordings/vision/responses/d4f56d7d1996.json

diff --git a/.gitignore b/.gitignore
index f3831f29c..11cc59847 100644
--- a/.gitignore
+++ b/.gitignore
@@ -26,5 +26,7 @@ venv/
 pytest-report.xml
 .coverage
 .python-version
+AGENTS.md
+server.log
 CLAUDE.md
 .claude/
diff --git a/docs/source/contributing/testing/record-replay.md b/docs/source/contributing/testing/record-replay.md
index 3049d333c..7b0f345b0 100644
--- a/docs/source/contributing/testing/record-replay.md
+++ b/docs/source/contributing/testing/record-replay.md
@@ -40,18 +40,15 @@ The system patches OpenAI and Ollama client methods to intercept calls before th
 
 ### Storage Architecture
 
-Recordings use a two-tier storage system optimized for both speed and debuggability:
+Recordings are stored as JSON files in the recording directory. They are looked up by their request hash.
 
 ```
 recordings/
-├── index.sqlite          # Fast lookup by request hash
 └── responses/
     ├── abc123def456.json  # Individual response files
     └── def789ghi012.json
 ```
 
-**SQLite index** enables O(log n) hash lookups and metadata queries without loading response bodies.
-
 **JSON files** store complete request/response pairs in human-readable format for debugging.
 
 ## Recording Modes
@@ -166,8 +163,8 @@ This preserves type safety - when replayed, you get the same Pydantic objects wi
 Control recording behavior globally:
 
 ```bash
-export LLAMA_STACK_TEST_INFERENCE_MODE=replay
-export LLAMA_STACK_TEST_RECORDING_DIR=/path/to/recordings
+export LLAMA_STACK_TEST_INFERENCE_MODE=replay   # this is the default
+export LLAMA_STACK_TEST_RECORDING_DIR=/path/to/recordings   # default is tests/integration/recordings
 pytest tests/integration/
 ```
 
diff --git a/llama_stack/providers/remote/inference/ollama/ollama.py b/llama_stack/providers/remote/inference/ollama/ollama.py
index fcaf5ee92..d3d107e1d 100644
--- a/llama_stack/providers/remote/inference/ollama/ollama.py
+++ b/llama_stack/providers/remote/inference/ollama/ollama.py
@@ -118,10 +118,10 @@ class OllamaInferenceAdapter(
 
     async def initialize(self) -> None:
         logger.info(f"checking connectivity to Ollama at `{self.config.url}`...")
-        health_response = await self.health()
-        if health_response["status"] == HealthStatus.ERROR:
+        r = await self.health()
+        if r["status"] == HealthStatus.ERROR:
             logger.warning(
-                "Ollama Server is not running, make sure to start it using `ollama serve` in a separate terminal"
+                f"Ollama Server is not running (message: {r['message']}). Make sure to start it using `ollama serve` in a separate terminal"
             )
 
     async def should_refresh_models(self) -> bool:
@@ -156,7 +156,7 @@ class OllamaInferenceAdapter(
             ),
             Model(
                 identifier="nomic-embed-text",
-                provider_resource_id="nomic-embed-text",
+                provider_resource_id="nomic-embed-text:latest",
                 provider_id=provider_id,
                 metadata={
                     "embedding_dimension": 768,
diff --git a/llama_stack/testing/inference_recorder.py b/llama_stack/testing/inference_recorder.py
index 8fa5f5f2e..5b64e26d3 100644
--- a/llama_stack/testing/inference_recorder.py
+++ b/llama_stack/testing/inference_recorder.py
@@ -30,6 +30,9 @@ from openai.types.completion_choice import CompletionChoice
 CompletionChoice.model_fields["finish_reason"].annotation = Literal["stop", "length", "content_filter"] | None
 CompletionChoice.model_rebuild()
 
+REPO_ROOT = Path(__file__).parent.parent.parent
+DEFAULT_STORAGE_DIR = REPO_ROOT / "tests/integration/recordings"
+
 
 class InferenceMode(StrEnum):
     LIVE = "live"
@@ -51,7 +54,7 @@ def normalize_request(method: str, url: str, headers: dict[str, Any], body: dict
 
 
 def get_inference_mode() -> InferenceMode:
-    return InferenceMode(os.environ.get("LLAMA_STACK_TEST_INFERENCE_MODE", "live").lower())
+    return InferenceMode(os.environ.get("LLAMA_STACK_TEST_INFERENCE_MODE", "replay").lower())
 
 
 def setup_inference_recording():
@@ -60,28 +63,18 @@ def setup_inference_recording():
     to increase their reliability and reduce reliance on expensive, external services.
 
     Currently, this is only supported for OpenAI and Ollama clients. These should cover the vast majority of use cases.
-    Calls to the /models endpoint are not currently trapped. We probably need to add support for this.
 
-    Two environment variables are required:
-    - LLAMA_STACK_TEST_INFERENCE_MODE: The mode to run in. Must be 'live', 'record', or 'replay'.
-    - LLAMA_STACK_TEST_RECORDING_DIR: The directory to store the recordings in.
+    Two environment variables are supported:
+    - LLAMA_STACK_TEST_INFERENCE_MODE: The mode to run in. Must be 'live', 'record', or 'replay'. Default is 'replay'.
+    - LLAMA_STACK_TEST_RECORDING_DIR: The directory to store the recordings in. Default is 'tests/integration/recordings'.
 
-    The recordings are stored in a SQLite database and a JSON file for each request. The SQLite database is used to
-    quickly find the correct recording for a given request. The JSON files are used to store the request and response
-    bodies.
+    The recordings are stored as JSON files.
     """
     mode = get_inference_mode()
-
-    if mode not in InferenceMode:
-        raise ValueError(f"Invalid LLAMA_STACK_TEST_INFERENCE_MODE: {mode}. Must be 'live', 'record', or 'replay'")
-
     if mode == InferenceMode.LIVE:
         return None
 
-    if "LLAMA_STACK_TEST_RECORDING_DIR" not in os.environ:
-        raise ValueError("LLAMA_STACK_TEST_RECORDING_DIR must be set for recording or replaying")
-    storage_dir = os.environ["LLAMA_STACK_TEST_RECORDING_DIR"]
-
+    storage_dir = os.environ.get("LLAMA_STACK_TEST_RECORDING_DIR", DEFAULT_STORAGE_DIR)
     return inference_recording(mode=mode, storage_dir=storage_dir)
 
 
@@ -134,8 +127,8 @@ class ResponseStorage:
     def store_recording(self, request_hash: str, request: dict[str, Any], response: dict[str, Any]):
         """Store a request/response pair."""
         # Generate unique response filename
-        response_file = f"{request_hash[:12]}.json"
-        response_path = self.responses_dir / response_file
+        short_hash = request_hash[:12]
+        response_file = f"{short_hash}.json"
 
         # Serialize response body if needed
         serialized_response = dict(response)
@@ -147,6 +140,14 @@ class ResponseStorage:
                 # Handle single response
                 serialized_response["body"] = _serialize_response(serialized_response["body"])
 
+        # If this is an Ollama /api/tags recording, include models digest in filename to distinguish variants
+        endpoint = request.get("endpoint")
+        if endpoint in ("/api/tags", "/v1/models"):
+            digest = _model_identifiers_digest(endpoint, response)
+            response_file = f"models-{short_hash}-{digest}.json"
+
+        response_path = self.responses_dir / response_file
+
         # Save response to JSON file
         with open(response_path, "w") as f:
             json.dump({"request": request, "response": serialized_response}, f, indent=2)
@@ -161,19 +162,85 @@ class ResponseStorage:
         if not response_path.exists():
             return None
 
-        with open(response_path) as f:
-            data = json.load(f)
+        return _recording_from_file(response_path)
 
-        # Deserialize response body if needed
-        if "response" in data and "body" in data["response"]:
-            if isinstance(data["response"]["body"], list):
-                # Handle streaming responses
-                data["response"]["body"] = [_deserialize_response(chunk) for chunk in data["response"]["body"]]
+    def _model_list_responses(self, short_hash: str) -> list[dict[str, Any]]:
+        results: list[dict[str, Any]] = []
+        for path in self.responses_dir.glob(f"models-{short_hash}-*.json"):
+            data = _recording_from_file(path)
+            results.append(data)
+        return results
+
+
+def _recording_from_file(response_path) -> dict[str, Any]:
+    with open(response_path) as f:
+        data = json.load(f)
+
+    # Deserialize response body if needed
+    if "response" in data and "body" in data["response"]:
+        if isinstance(data["response"]["body"], list):
+            # Handle streaming responses
+            data["response"]["body"] = [_deserialize_response(chunk) for chunk in data["response"]["body"]]
+        else:
+            # Handle single response
+            data["response"]["body"] = _deserialize_response(data["response"]["body"])
+
+    return cast(dict[str, Any], data)
+
+
+def _model_identifiers_digest(endpoint: str, response: dict[str, Any]) -> str:
+    def _extract_model_identifiers():
+        """Extract a stable set of identifiers for model-list endpoints.
+
+        Supported endpoints:
+        - '/api/tags' (Ollama): response body has 'models': [ { name/model/digest/id/... }, ... ]
+        - '/v1/models' (OpenAI): response body has 'data': [ { id: ... }, ... ]
+        Returns a list of unique identifiers or None if structure doesn't match.
+        """
+        body = response["body"]
+        if endpoint == "/api/tags":
+            items = body.get("models")
+            idents = [m.model for m in items]
+        else:
+            items = body.get("data")
+            idents = [m.id for m in items]
+        return sorted(set(idents))
+
+    identifiers = _extract_model_identifiers()
+    return hashlib.sha1(("|".join(identifiers)).encode("utf-8")).hexdigest()[:8]
+
+
+def _combine_model_list_responses(endpoint: str, records: list[dict[str, Any]]) -> dict[str, Any] | None:
+    """Return a single, unioned recording for supported model-list endpoints."""
+    seen: dict[str, dict[str, Any]] = {}
+    for rec in records:
+        body = rec["response"]["body"]
+        if endpoint == "/api/tags":
+            items = body.models
+        elif endpoint == "/v1/models":
+            items = body.data
+        else:
+            items = []
+
+        for m in items:
+            if endpoint == "/v1/models":
+                key = m.id
             else:
-                # Handle single response
-                data["response"]["body"] = _deserialize_response(data["response"]["body"])
+                key = m.model
+            seen[key] = m
 
-        return cast(dict[str, Any], data)
+    ordered = [seen[k] for k in sorted(seen.keys())]
+    canonical = records[0]
+    canonical_req = canonical.get("request", {})
+    if isinstance(canonical_req, dict):
+        canonical_req["endpoint"] = endpoint
+    if endpoint == "/v1/models":
+        body = {"data": ordered, "object": "list"}
+    else:
+        from ollama import ListResponse
+
+        body = ListResponse(models=ordered)
+    return {"request": canonical_req, "response": {"body": body, "is_streaming": False}}
 
 
 async def _patched_inference_method(original_method, self, client_type, endpoint, *args, **kwargs):
@@ -195,8 +262,6 @@ async def _patched_inference_method(original_method, self, client_type, endpoint
         raise ValueError(f"Unknown client type: {client_type}")
 
     url = base_url.rstrip("/") + endpoint
-
-    # Normalize request for matching
     method = "POST"
     headers = {}
     body = kwargs
@@ -204,7 +269,12 @@ async def _patched_inference_method(original_method, self, client_type, endpoint
     request_hash = normalize_request(method, url, headers, body)
 
     if _current_mode == InferenceMode.REPLAY:
-        recording = _current_storage.find_recording(request_hash)
+        # Special handling for model-list endpoints: return union of all responses
+        if endpoint in ("/api/tags", "/v1/models"):
+            records = _current_storage._model_list_responses(request_hash[:12])
+            recording = _combine_model_list_responses(endpoint, records)
+        else:
+            recording = _current_storage.find_recording(request_hash)
         if recording:
             response_body = recording["response"]["body"]
 
@@ -274,12 +344,14 @@ def patch_inference_clients():
     from openai.resources.chat.completions import AsyncCompletions as AsyncChatCompletions
     from openai.resources.completions import AsyncCompletions
     from openai.resources.embeddings import AsyncEmbeddings
+    from openai.resources.models import AsyncModels
 
     # Store original methods for both OpenAI and Ollama clients
     _original_methods = {
         "chat_completions_create": AsyncChatCompletions.create,
         "completions_create": AsyncCompletions.create,
         "embeddings_create": AsyncEmbeddings.create,
+        "models_list": AsyncModels.list,
         "ollama_generate": OllamaAsyncClient.generate,
         "ollama_chat": OllamaAsyncClient.chat,
         "ollama_embed": OllamaAsyncClient.embed,
@@ -304,10 +376,16 @@ def patch_inference_clients():
             _original_methods["embeddings_create"], self, "openai", "/v1/embeddings", *args, **kwargs
         )
 
+    async def patched_models_list(self, *args, **kwargs):
+        return await _patched_inference_method(
+            _original_methods["models_list"], self, "openai", "/v1/models", *args, **kwargs
+        )
+
     # Apply OpenAI patches
     AsyncChatCompletions.create = patched_chat_completions_create
     AsyncCompletions.create = patched_completions_create
     AsyncEmbeddings.create = patched_embeddings_create
+    AsyncModels.list = patched_models_list
 
     # Create patched methods for Ollama client
     async def patched_ollama_generate(self, *args, **kwargs):
@@ -361,11 +439,13 @@ def unpatch_inference_clients():
     from openai.resources.chat.completions import AsyncCompletions as AsyncChatCompletions
     from openai.resources.completions import AsyncCompletions
     from openai.resources.embeddings import AsyncEmbeddings
+    from openai.resources.models import AsyncModels
 
     # Restore OpenAI client methods
     AsyncChatCompletions.create = _original_methods["chat_completions_create"]
     AsyncCompletions.create = _original_methods["completions_create"]
     AsyncEmbeddings.create = _original_methods["embeddings_create"]
+    AsyncModels.list = _original_methods["models_list"]
 
     # Restore Ollama client methods if they were patched
     OllamaAsyncClient.generate = _original_methods["ollama_generate"]
@@ -379,16 +459,10 @@ def unpatch_inference_clients():
 
 
 @contextmanager
-def inference_recording(mode: str = "live", storage_dir: str | Path | None = None) -> Generator[None, None, None]:
+def inference_recording(mode: str, storage_dir: str | Path | None = None) -> Generator[None, None, None]:
     """Context manager for inference recording/replaying."""
     global _current_mode, _current_storage
 
-    # Set defaults
-    if storage_dir is None:
-        storage_dir_path = Path.home() / ".llama" / "recordings"
-    else:
-        storage_dir_path = Path(storage_dir)
-
     # Store previous state
     prev_mode = _current_mode
     prev_storage = _current_storage
@@ -397,7 +471,9 @@ def inference_recording(mode: str = "live", storage_dir: str | Path | None = Non
         _current_mode = mode
 
         if mode in ["record", "replay"]:
-            _current_storage = ResponseStorage(storage_dir_path)
+            if storage_dir is None:
+                raise ValueError("storage_dir is required for record and replay modes")
+            _current_storage = ResponseStorage(Path(storage_dir))
             patch_inference_clients()
 
         yield
diff --git a/scripts/integration-tests.sh b/scripts/integration-tests.sh
index e152444e1..104ba5cf3 100755
--- a/scripts/integration-tests.sh
+++ b/scripts/integration-tests.sh
@@ -140,13 +140,6 @@ THIS_DIR=$(dirname "$0")
 ROOT_DIR="$THIS_DIR/.."
 cd $ROOT_DIR
 
-# Set recording directory
-if [[ "$RUN_VISION_TESTS" == "true" ]]; then
-    export LLAMA_STACK_TEST_RECORDING_DIR="tests/integration/recordings/vision"
-else
-    export LLAMA_STACK_TEST_RECORDING_DIR="tests/integration/recordings"
-fi
-
 # check if "llama" and "pytest" are available. this script does not use `uv run` given
 # it can be used in a pre-release environment where we have not been able to tell
 # uv about pre-release dependencies properly (yet).
@@ -298,5 +291,12 @@ echo "=== System Resources After Tests ==="
 free -h 2>/dev/null || echo "free command not available"
 df -h
 
+# stop server
+if [[ "$STACK_CONFIG" == *"server:"* ]]; then
+    echo "Stopping Llama Stack Server..."
+    kill $(lsof -i :8321 | awk 'NR>1 {print $2}')
+    echo "Llama Stack Server stopped"
+fi
+
 echo ""
 echo "=== Integration Tests Complete ==="
diff --git a/tests/README.md b/tests/README.md
index 3b129fbd9..81f025f86 100644
--- a/tests/README.md
+++ b/tests/README.md
@@ -38,26 +38,15 @@ For running integration tests, you must provide a few things:
   - a distribution name (e.g., `starter`) or a path to a `run.yaml` file
   - a comma-separated list of api=provider pairs, e.g. `inference=fireworks,safety=llama-guard,agents=meta-reference`. This is most useful for testing a single API surface.
 
-- Whether you are using replay or live mode for inference. This is specified with the LLAMA_STACK_TEST_INFERENCE_MODE environment variable. The default mode currently is "live" -- that is certainly surprising, but we will fix this soon.
-
 - Any API keys you need to use should be set in the environment, or can be passed in with the --env option.
 
 You can run the integration tests in replay mode with:
 ```bash
 # Run all tests with existing recordings
-LLAMA_STACK_TEST_INFERENCE_MODE=replay \
-  LLAMA_STACK_TEST_RECORDING_DIR=tests/integration/recordings \
   uv run --group test \
   pytest -sv tests/integration/ --stack-config=starter
 ```
 
-If you don't specify LLAMA_STACK_TEST_INFERENCE_MODE, by default it will be in "live" mode -- that is, it will make real API calls.
-
-```bash
-# Test against live APIs
-FIREWORKS_API_KEY=your_key pytest -sv tests/integration/inference --stack-config=starter
-```
-
 ### Re-recording tests
 
 #### Local Re-recording (Manual Setup Required)
@@ -66,7 +55,6 @@ If you want to re-record tests locally, you can do so with:
 
 ```bash
 LLAMA_STACK_TEST_INFERENCE_MODE=record \
-  LLAMA_STACK_TEST_RECORDING_DIR=tests/integration/recordings \
   uv run --group test \
   pytest -sv tests/integration/ --stack-config=starter -k "<appropriate test name>"
 ```
diff --git a/tests/integration/README.md b/tests/integration/README.md
index 46d66fd79..d177cbebf 100644
--- a/tests/integration/README.md
+++ b/tests/integration/README.md
@@ -98,29 +98,25 @@ pytest -s -v tests/integration/vector_io/ \
 
 The testing system supports three modes controlled by environment variables:
 
-### LIVE Mode (Default)
-Tests make real API calls:
+### REPLAY Mode (Default)
+Uses cached responses instead of making API calls:
 ```bash
-LLAMA_STACK_TEST_INFERENCE_MODE=live pytest tests/integration/
+pytest tests/integration/
 ```
-
 ### RECORD Mode
 Captures API interactions for later replay:
 ```bash
 LLAMA_STACK_TEST_INFERENCE_MODE=record \
-LLAMA_STACK_TEST_RECORDING_DIR=tests/integration/recordings \
 pytest tests/integration/inference/test_new_feature.py
 ```
 
-### REPLAY Mode
-Uses cached responses instead of making API calls:
+### LIVE Mode
+Tests make real API calls (but not recorded):
 ```bash
-LLAMA_STACK_TEST_INFERENCE_MODE=replay \
-LLAMA_STACK_TEST_RECORDING_DIR=tests/integration/recordings \
-pytest tests/integration/
+LLAMA_STACK_TEST_INFERENCE_MODE=live pytest tests/integration/
 ```
 
-Note that right now you must specify the recording directory. This is because different tests use different recording directories and we don't (yet) have a fool-proof way to map a test to a recording directory. We are working on this.
+By default, the recording directory is `tests/integration/recordings`. You can override this by setting the `LLAMA_STACK_TEST_RECORDING_DIR` environment variable.
 
 ## Managing Recordings
 
@@ -146,7 +142,6 @@ See the [main testing guide](../README.md#remote-re-recording-recommended) for f
 ```bash
 # Re-record specific tests
 LLAMA_STACK_TEST_INFERENCE_MODE=record \
-LLAMA_STACK_TEST_RECORDING_DIR=tests/integration/recordings \
 pytest -s -v --stack-config=server:starter tests/integration/inference/test_modified.py
 ```
 
diff --git a/tests/integration/recordings/responses/00ba04f74a96.json b/tests/integration/recordings/responses/00ba04f74a96.json
index d2e482d76..642c58414 100644
--- a/tests/integration/recordings/responses/00ba04f74a96.json
+++ b/tests/integration/recordings/responses/00ba04f74a96.json
@@ -20,15 +20,15 @@
       "__type__": "ollama._types.GenerateResponse",
       "__data__": {
         "model": "llama-guard3:1b",
-        "created_at": "2025-08-01T23:12:53.860911Z",
+        "created_at": "2025-09-03T17:37:35.23084Z",
         "done": true,
         "done_reason": "stop",
-        "total_duration": 249137667,
-        "load_duration": 152509542,
+        "total_duration": 195981375,
+        "load_duration": 110522917,
         "prompt_eval_count": 216,
-        "prompt_eval_duration": 71000000,
+        "prompt_eval_duration": 72393958,
         "eval_count": 2,
-        "eval_duration": 24000000,
+        "eval_duration": 11843000,
         "response": "safe",
         "thinking": null,
         "context": null
diff --git a/tests/integration/recordings/responses/04172112ffbb.json b/tests/integration/recordings/responses/04172112ffbb.json
index bf94b0697..da5f58a50 100644
--- a/tests/integration/recordings/responses/04172112ffbb.json
+++ b/tests/integration/recordings/responses/04172112ffbb.json
@@ -21,7 +21,7 @@
         "__type__": "ollama._types.GenerateResponse",
         "__data__": {
           "model": "llama3.2:3b-instruct-fp16",
-          "created_at": "2025-07-31T17:59:18.033900164Z",
+          "created_at": "2025-09-03T17:41:43.950283Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -39,7 +39,7 @@
         "__type__": "ollama._types.GenerateResponse",
         "__data__": {
           "model": "llama3.2:3b-instruct-fp16",
-          "created_at": "2025-07-31T17:59:18.213371151Z",
+          "created_at": "2025-09-03T17:41:43.991122Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -57,7 +57,7 @@
         "__type__": "ollama._types.GenerateResponse",
         "__data__": {
           "model": "llama3.2:3b-instruct-fp16",
-          "created_at": "2025-07-31T17:59:18.387513976Z",
+          "created_at": "2025-09-03T17:41:44.031378Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -75,7 +75,7 @@
         "__type__": "ollama._types.GenerateResponse",
         "__data__": {
           "model": "llama3.2:3b-instruct-fp16",
-          "created_at": "2025-07-31T17:59:18.564344287Z",
+          "created_at": "2025-09-03T17:41:44.073098Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -93,7 +93,7 @@
         "__type__": "ollama._types.GenerateResponse",
         "__data__": {
           "model": "llama3.2:3b-instruct-fp16",
-          "created_at": "2025-07-31T17:59:18.746579415Z",
+          "created_at": "2025-09-03T17:41:44.115961Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -111,7 +111,7 @@
         "__type__": "ollama._types.GenerateResponse",
         "__data__": {
           "model": "llama3.2:3b-instruct-fp16",
-          "created_at": "2025-07-31T17:59:18.923276047Z",
+          "created_at": "2025-09-03T17:41:44.156517Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -129,7 +129,7 @@
         "__type__": "ollama._types.GenerateResponse",
         "__data__": {
           "model": "llama3.2:3b-instruct-fp16",
-          "created_at": "2025-07-31T17:59:19.099961963Z",
+          "created_at": "2025-09-03T17:41:44.197079Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -147,7 +147,7 @@
         "__type__": "ollama._types.GenerateResponse",
         "__data__": {
           "model": "llama3.2:3b-instruct-fp16",
-          "created_at": "2025-07-31T17:59:19.275621884Z",
+          "created_at": "2025-09-03T17:41:44.237565Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -165,7 +165,7 @@
         "__type__": "ollama._types.GenerateResponse",
         "__data__": {
           "model": "llama3.2:3b-instruct-fp16",
-          "created_at": "2025-07-31T17:59:19.452204196Z",
+          "created_at": "2025-09-03T17:41:44.277755Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -183,7 +183,7 @@
         "__type__": "ollama._types.GenerateResponse",
         "__data__": {
           "model": "llama3.2:3b-instruct-fp16",
-          "created_at": "2025-07-31T17:59:19.626937514Z",
+          "created_at": "2025-09-03T17:41:44.318476Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -201,7 +201,7 @@
         "__type__": "ollama._types.GenerateResponse",
         "__data__": {
           "model": "llama3.2:3b-instruct-fp16",
-          "created_at": "2025-07-31T17:59:19.805566767Z",
+          "created_at": "2025-09-03T17:41:44.358628Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -219,7 +219,7 @@
         "__type__": "ollama._types.GenerateResponse",
         "__data__": {
           "model": "llama3.2:3b-instruct-fp16",
-          "created_at": "2025-07-31T17:59:19.985987477Z",
+          "created_at": "2025-09-03T17:41:44.398984Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -237,7 +237,7 @@
         "__type__": "ollama._types.GenerateResponse",
         "__data__": {
           "model": "llama3.2:3b-instruct-fp16",
-          "created_at": "2025-07-31T17:59:20.166458601Z",
+          "created_at": "2025-09-03T17:41:44.439232Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -255,7 +255,7 @@
         "__type__": "ollama._types.GenerateResponse",
         "__data__": {
           "model": "llama3.2:3b-instruct-fp16",
-          "created_at": "2025-07-31T17:59:20.343346795Z",
+          "created_at": "2025-09-03T17:41:44.479478Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -273,7 +273,7 @@
         "__type__": "ollama._types.GenerateResponse",
         "__data__": {
           "model": "llama3.2:3b-instruct-fp16",
-          "created_at": "2025-07-31T17:59:20.525008091Z",
+          "created_at": "2025-09-03T17:41:44.520202Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -291,7 +291,7 @@
         "__type__": "ollama._types.GenerateResponse",
         "__data__": {
           "model": "llama3.2:3b-instruct-fp16",
-          "created_at": "2025-07-31T17:59:20.709087695Z",
+          "created_at": "2025-09-03T17:41:44.560517Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -309,7 +309,7 @@
         "__type__": "ollama._types.GenerateResponse",
         "__data__": {
           "model": "llama3.2:3b-instruct-fp16",
-          "created_at": "2025-07-31T17:59:20.887074305Z",
+          "created_at": "2025-09-03T17:41:44.601592Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -327,15 +327,15 @@
         "__type__": "ollama._types.GenerateResponse",
         "__data__": {
           "model": "llama3.2:3b-instruct-fp16",
-          "created_at": "2025-07-31T17:59:21.065244925Z",
+          "created_at": "2025-09-03T17:41:44.642064Z",
           "done": true,
           "done_reason": "stop",
-          "total_duration": 4373531496,
-          "load_duration": 44438132,
+          "total_duration": 887142667,
+          "load_duration": 119331417,
           "prompt_eval_count": 56,
-          "prompt_eval_duration": 1296273199,
+          "prompt_eval_duration": 74294709,
           "eval_count": 18,
-          "eval_duration": 3032321735,
+          "eval_duration": 692842791,
           "response": "",
           "thinking": null,
           "context": null
diff --git a/tests/integration/recordings/responses/0b27fd737699.json b/tests/integration/recordings/responses/0b27fd737699.json
index e20c65c75..e25cde820 100644
--- a/tests/integration/recordings/responses/0b27fd737699.json
+++ b/tests/integration/recordings/responses/0b27fd737699.json
@@ -20,15 +20,15 @@
       "__type__": "ollama._types.GenerateResponse",
       "__data__": {
         "model": "llama-guard3:1b",
-        "created_at": "2025-08-01T23:13:57.556416Z",
+        "created_at": "2025-09-03T17:37:47.461886Z",
         "done": true,
         "done_reason": "stop",
-        "total_duration": 432363250,
-        "load_duration": 159296417,
+        "total_duration": 338927833,
+        "load_duration": 100895125,
         "prompt_eval_count": 223,
-        "prompt_eval_duration": 257000000,
+        "prompt_eval_duration": 221583042,
         "eval_count": 2,
-        "eval_duration": 14000000,
+        "eval_duration": 12341416,
         "response": "safe",
         "thinking": null,
         "context": null
diff --git a/tests/integration/recordings/responses/0b3f2e4754ff.json b/tests/integration/recordings/responses/0b3f2e4754ff.json
index 28e923e9c..8496deeb0 100644
--- a/tests/integration/recordings/responses/0b3f2e4754ff.json
+++ b/tests/integration/recordings/responses/0b3f2e4754ff.json
@@ -24,7 +24,7 @@
       {
         "__type__": "openai.types.chat.chat_completion_chunk.ChatCompletionChunk",
         "__data__": {
-          "id": "chatcmpl-29",
+          "id": "chatcmpl-414",
           "choices": [
             {
               "delta": {
@@ -39,7 +39,7 @@
               "logprobs": null
             }
           ],
-          "created": 1754090031,
+          "created": 1756921333,
           "model": "llama3.2:3b-instruct-fp16",
           "object": "chat.completion.chunk",
           "service_tier": null,
@@ -50,7 +50,7 @@
       {
         "__type__": "openai.types.chat.chat_completion_chunk.ChatCompletionChunk",
         "__data__": {
-          "id": "chatcmpl-29",
+          "id": "chatcmpl-414",
           "choices": [
             {
               "delta": {
@@ -65,7 +65,7 @@
               "logprobs": null
             }
           ],
-          "created": 1754090031,
+          "created": 1756921333,
           "model": "llama3.2:3b-instruct-fp16",
           "object": "chat.completion.chunk",
           "service_tier": null,
@@ -76,7 +76,7 @@
       {
         "__type__": "openai.types.chat.chat_completion_chunk.ChatCompletionChunk",
         "__data__": {
-          "id": "chatcmpl-29",
+          "id": "chatcmpl-414",
           "choices": [
             {
               "delta": {
@@ -91,7 +91,7 @@
               "logprobs": null
             }
           ],
-          "created": 1754090031,
+          "created": 1756921333,
           "model": "llama3.2:3b-instruct-fp16",
           "object": "chat.completion.chunk",
           "service_tier": null,
@@ -102,7 +102,7 @@
       {
         "__type__": "openai.types.chat.chat_completion_chunk.ChatCompletionChunk",
         "__data__": {
-          "id": "chatcmpl-29",
+          "id": "chatcmpl-414",
           "choices": [
             {
               "delta": {
@@ -117,7 +117,7 @@
               "logprobs": null
             }
           ],
-          "created": 1754090031,
+          "created": 1756921333,
           "model": "llama3.2:3b-instruct-fp16",
           "object": "chat.completion.chunk",
           "service_tier": null,
@@ -128,7 +128,7 @@
       {
         "__type__": "openai.types.chat.chat_completion_chunk.ChatCompletionChunk",
         "__data__": {
-          "id": "chatcmpl-29",
+          "id": "chatcmpl-414",
           "choices": [
             {
               "delta": {
@@ -143,7 +143,7 @@
               "logprobs": null
             }
           ],
-          "created": 1754090031,
+          "created": 1756921334,
           "model": "llama3.2:3b-instruct-fp16",
           "object": "chat.completion.chunk",
           "service_tier": null,
@@ -154,7 +154,7 @@
       {
         "__type__": "openai.types.chat.chat_completion_chunk.ChatCompletionChunk",
         "__data__": {
-          "id": "chatcmpl-29",
+          "id": "chatcmpl-414",
           "choices": [
             {
               "delta": {
@@ -169,7 +169,7 @@
               "logprobs": null
             }
           ],
-          "created": 1754090031,
+          "created": 1756921334,
           "model": "llama3.2:3b-instruct-fp16",
           "object": "chat.completion.chunk",
           "service_tier": null,
@@ -180,7 +180,7 @@
       {
         "__type__": "openai.types.chat.chat_completion_chunk.ChatCompletionChunk",
         "__data__": {
-          "id": "chatcmpl-29",
+          "id": "chatcmpl-414",
           "choices": [
             {
               "delta": {
@@ -195,7 +195,7 @@
               "logprobs": null
             }
           ],
-          "created": 1754090031,
+          "created": 1756921334,
           "model": "llama3.2:3b-instruct-fp16",
           "object": "chat.completion.chunk",
           "service_tier": null,
@@ -206,7 +206,7 @@
       {
         "__type__": "openai.types.chat.chat_completion_chunk.ChatCompletionChunk",
         "__data__": {
-          "id": "chatcmpl-29",
+          "id": "chatcmpl-414",
           "choices": [
             {
               "delta": {
@@ -221,7 +221,7 @@
               "logprobs": null
             }
           ],
-          "created": 1754090031,
+          "created": 1756921334,
           "model": "llama3.2:3b-instruct-fp16",
           "object": "chat.completion.chunk",
           "service_tier": null,
diff --git a/tests/integration/recordings/responses/0e8f2b001dd9.json b/tests/integration/recordings/responses/0e8f2b001dd9.json
index 7c5973fae..6bcdfdfed 100644
--- a/tests/integration/recordings/responses/0e8f2b001dd9.json
+++ b/tests/integration/recordings/responses/0e8f2b001dd9.json
@@ -1,7 +1,7 @@
 {
   "request": {
     "method": "POST",
-    "url": "http://localhost:11434/v1/v1/chat/completions",
+    "url": "http://0.0.0.0:11434/v1/v1/chat/completions",
     "headers": {},
     "body": {
       "model": "llama3.2:3b-instruct-fp16",
@@ -20,14 +20,14 @@
     "body": {
       "__type__": "openai.types.chat.chat_completion.ChatCompletion",
       "__data__": {
-        "id": "chatcmpl-368",
+        "id": "chatcmpl-161",
         "choices": [
           {
             "finish_reason": "stop",
             "index": 0,
             "logprobs": null,
             "message": {
-              "content": "Saturn is known for its extensive ring system.",
+              "content": "The answer is Saturn.",
               "refusal": null,
               "role": "assistant",
               "annotations": null,
@@ -37,15 +37,15 @@
             }
           }
         ],
-        "created": 1754081853,
+        "created": 1756921364,
         "model": "llama3.2:3b-instruct-fp16",
         "object": "chat.completion",
         "service_tier": null,
         "system_fingerprint": "fp_ollama",
         "usage": {
-          "completion_tokens": 11,
+          "completion_tokens": 6,
           "prompt_tokens": 39,
-          "total_tokens": 50,
+          "total_tokens": 45,
           "completion_tokens_details": null,
           "prompt_tokens_details": null
         }
diff --git a/tests/integration/recordings/responses/10eea8c15ddc.json b/tests/integration/recordings/responses/10eea8c15ddc.json
index 71496da9a..bc608ef09 100644
--- a/tests/integration/recordings/responses/10eea8c15ddc.json
+++ b/tests/integration/recordings/responses/10eea8c15ddc.json
@@ -20,15 +20,15 @@
       "__type__": "ollama._types.GenerateResponse",
       "__data__": {
         "model": "llama-guard3:1b",
-        "created_at": "2025-08-01T23:12:51.682357Z",
+        "created_at": "2025-09-03T17:37:33.473237Z",
         "done": true,
         "done_reason": "stop",
-        "total_duration": 238161000,
-        "load_duration": 72494750,
+        "total_duration": 279025042,
+        "load_duration": 162673250,
         "prompt_eval_count": 212,
-        "prompt_eval_duration": 87000000,
+        "prompt_eval_duration": 73595834,
         "eval_count": 5,
-        "eval_duration": 74000000,
+        "eval_duration": 41950291,
         "response": "unsafe\nS8",
         "thinking": null,
         "context": null
diff --git a/tests/integration/recordings/responses/140187e305dc.json b/tests/integration/recordings/responses/140187e305dc.json
index 44d00c96f..69b9712eb 100644
--- a/tests/integration/recordings/responses/140187e305dc.json
+++ b/tests/integration/recordings/responses/140187e305dc.json
@@ -1,7 +1,7 @@
 {
   "request": {
     "method": "POST",
-    "url": "http://localhost:11434/v1/v1/chat/completions",
+    "url": "http://0.0.0.0:11434/v1/v1/chat/completions",
     "headers": {},
     "body": {
       "model": "llama3.2:3b-instruct-fp16",
@@ -20,14 +20,14 @@
     "body": {
       "__type__": "openai.types.chat.chat_completion.ChatCompletion",
       "__data__": {
-        "id": "chatcmpl-876",
+        "id": "chatcmpl-974",
         "choices": [
           {
             "finish_reason": "stop",
             "index": 0,
             "logprobs": null,
             "message": {
-              "content": "I'm afraid I don't have a built-in ability to directly interface with or \"test\" OpenAI models, including the original GPT-1 model. However, I can explain how you might approach this task:\n\nThe OpenAI GPT-1 is a large transformer-based language model that was trained on a massive dataset of text and achieved state-of-the-art results in various natural language processing tasks.\n\nTo test or evaluate the performance of a model like GPT-1, you would typically follow these steps:\n\n1. **Get access to the OpenAI API**: The OpenAI API provides a way for developers to interact with the GPT-1 model programmatically. You can sign up for an API key on the OpenAI website.\n2. **Choose a testing platform or environment**: You'll need a compute platform that supports the necessary algorithms and data structures to run inference on the GPT-1 model. Some popular options include AWS, Google Cloud, or Azure Compute Virtual Machines.\n3. **Prepare your test input data**: This will involve creating text inputs in the format expected by the OpenAI API (i.e., a JSON object containing the text to be processed).\n4. **Use the OpenAI Python library or SDK**: The OpenAI Python library provides an easy-to-use interface for interacting with the GPT-1 model through the API.\n\nHere's some example code that demonstrates how you might use the OpenAI Flask API to test a single input:\n\n```python\nfrom flask import Flask, request, jsonify\nimport json\n\napp = Flask(__name__)\n\n@ app . route ( '/ /gpt-en ', ' Text ', methods = ['POST'])\ndef gpt_en () -> Json :\n    data = request . get_json ()\n    if not data or \"message\" in ( data ):\n        return None , 400 , { ' error' : \"Input must be a text string.\" }\n    response = []\n    while True:\n        message = \"\"\n        for token in data [\"input\"]:\n            response_text = f\"{data['prompt']} {token}\"\n            data[\"input\"] = [response_text]\n            new_response = gpt_en()(data)\n            if all([not item or not isinstance(item, dict) for item in new_response]):\n             break\n\n        message = json . dumps ({}\"text\": response_text})\n        response.append(message)\n\n    return jsonify ({\"output\": response}), 200 , {}\n\nif __name__ == \"__main__\":\n   app.run(debug=True)\n```\n\n5. **Evaluate the output**: Once you have processed your test input data using the GPT-1 model, you can evaluate the accuracy of the generated responses.\n\nKeep in mind that this is just a basic example to illustrate how you might approach testing the OpenAI GPT-1 model.",
+              "content": "I'm happy to help you test the OpenAI API, however I can not access the API.\n\nInstead why don't we follow these steps:\n\n*   Check documentation\n*   Contact support\n*   Reach out to their community forum. \n\nLet me know if I can be of any additional assistance",
               "refusal": null,
               "role": "assistant",
               "annotations": null,
@@ -37,15 +37,15 @@
             }
           }
         ],
-        "created": 1754510050,
+        "created": 1756921202,
         "model": "llama3.2:3b-instruct-fp16",
         "object": "chat.completion",
         "service_tier": null,
         "system_fingerprint": "fp_ollama",
         "usage": {
-          "completion_tokens": 567,
+          "completion_tokens": 61,
           "prompt_tokens": 31,
-          "total_tokens": 598,
+          "total_tokens": 92,
           "completion_tokens_details": null,
           "prompt_tokens_details": null
         }
diff --git a/tests/integration/recordings/responses/17253d7cc667.json b/tests/integration/recordings/responses/17253d7cc667.json
index 1013a8b08..290c0395b 100644
--- a/tests/integration/recordings/responses/17253d7cc667.json
+++ b/tests/integration/recordings/responses/17253d7cc667.json
@@ -20,15 +20,15 @@
       "__type__": "ollama._types.GenerateResponse",
       "__data__": {
         "model": "llama-guard3:1b",
-        "created_at": "2025-08-01T23:12:52.919624Z",
+        "created_at": "2025-09-03T17:37:34.308033Z",
         "done": true,
         "done_reason": "stop",
-        "total_duration": 201956834,
-        "load_duration": 105132584,
+        "total_duration": 200296000,
+        "load_duration": 115974708,
         "prompt_eval_count": 212,
-        "prompt_eval_duration": 75000000,
+        "prompt_eval_duration": 72173459,
         "eval_count": 2,
-        "eval_duration": 20000000,
+        "eval_duration": 11536750,
         "response": "safe",
         "thinking": null,
         "context": null
diff --git a/tests/integration/recordings/responses/173ecb3aab28.json b/tests/integration/recordings/responses/173ecb3aab28.json
index bc550edd5..0c29b278b 100644
--- a/tests/integration/recordings/responses/173ecb3aab28.json
+++ b/tests/integration/recordings/responses/173ecb3aab28.json
@@ -40,7 +40,7 @@
       {
         "__type__": "openai.types.chat.chat_completion_chunk.ChatCompletionChunk",
         "__data__": {
-          "id": "chatcmpl-457",
+          "id": "chatcmpl-921",
           "choices": [
             {
               "delta": {
@@ -55,7 +55,7 @@
               "logprobs": null
             }
           ],
-          "created": 1754090032,
+          "created": 1756920971,
           "model": "llama3.2:3b-instruct-fp16",
           "object": "chat.completion.chunk",
           "service_tier": null,
@@ -66,7 +66,7 @@
       {
         "__type__": "openai.types.chat.chat_completion_chunk.ChatCompletionChunk",
         "__data__": {
-          "id": "chatcmpl-457",
+          "id": "chatcmpl-921",
           "choices": [
             {
               "delta": {
@@ -81,7 +81,7 @@
               "logprobs": null
             }
           ],
-          "created": 1754090032,
+          "created": 1756920971,
           "model": "llama3.2:3b-instruct-fp16",
           "object": "chat.completion.chunk",
           "service_tier": null,
@@ -92,7 +92,7 @@
       {
         "__type__": "openai.types.chat.chat_completion_chunk.ChatCompletionChunk",
         "__data__": {
-          "id": "chatcmpl-457",
+          "id": "chatcmpl-921",
           "choices": [
             {
               "delta": {
@@ -107,7 +107,7 @@
               "logprobs": null
             }
           ],
-          "created": 1754090032,
+          "created": 1756920971,
           "model": "llama3.2:3b-instruct-fp16",
           "object": "chat.completion.chunk",
           "service_tier": null,
@@ -118,7 +118,7 @@
       {
         "__type__": "openai.types.chat.chat_completion_chunk.ChatCompletionChunk",
         "__data__": {
-          "id": "chatcmpl-457",
+          "id": "chatcmpl-921",
           "choices": [
             {
               "delta": {
@@ -133,7 +133,7 @@
               "logprobs": null
             }
           ],
-          "created": 1754090032,
+          "created": 1756920971,
           "model": "llama3.2:3b-instruct-fp16",
           "object": "chat.completion.chunk",
           "service_tier": null,
@@ -144,7 +144,7 @@
       {
         "__type__": "openai.types.chat.chat_completion_chunk.ChatCompletionChunk",
         "__data__": {
-          "id": "chatcmpl-457",
+          "id": "chatcmpl-921",
           "choices": [
             {
               "delta": {
@@ -159,7 +159,7 @@
               "logprobs": null
             }
           ],
-          "created": 1754090032,
+          "created": 1756920971,
           "model": "llama3.2:3b-instruct-fp16",
           "object": "chat.completion.chunk",
           "service_tier": null,
@@ -170,7 +170,7 @@
       {
         "__type__": "openai.types.chat.chat_completion_chunk.ChatCompletionChunk",
         "__data__": {
-          "id": "chatcmpl-457",
+          "id": "chatcmpl-921",
           "choices": [
             {
               "delta": {
@@ -185,7 +185,7 @@
               "logprobs": null
             }
           ],
-          "created": 1754090032,
+          "created": 1756920971,
           "model": "llama3.2:3b-instruct-fp16",
           "object": "chat.completion.chunk",
           "service_tier": null,
@@ -196,7 +196,7 @@
       {
         "__type__": "openai.types.chat.chat_completion_chunk.ChatCompletionChunk",
         "__data__": {
-          "id": "chatcmpl-457",
+          "id": "chatcmpl-921",
           "choices": [
             {
               "delta": {
@@ -211,7 +211,7 @@
               "logprobs": null
             }
           ],
-          "created": 1754090032,
+          "created": 1756920971,
           "model": "llama3.2:3b-instruct-fp16",
           "object": "chat.completion.chunk",
           "service_tier": null,
@@ -222,7 +222,7 @@
       {
         "__type__": "openai.types.chat.chat_completion_chunk.ChatCompletionChunk",
         "__data__": {
-          "id": "chatcmpl-457",
+          "id": "chatcmpl-921",
           "choices": [
             {
               "delta": {
@@ -237,7 +237,7 @@
               "logprobs": null
             }
           ],
-          "created": 1754090032,
+          "created": 1756920971,
           "model": "llama3.2:3b-instruct-fp16",
           "object": "chat.completion.chunk",
           "service_tier": null,
diff --git a/tests/integration/recordings/responses/174458ad71b2.json b/tests/integration/recordings/responses/174458ad71b2.json
index 2dcb85262..ba99d54e6 100644
--- a/tests/integration/recordings/responses/174458ad71b2.json
+++ b/tests/integration/recordings/responses/174458ad71b2.json
@@ -20,15 +20,15 @@
       "__type__": "ollama._types.GenerateResponse",
       "__data__": {
         "model": "llama-guard3:1b",
-        "created_at": "2025-08-01T23:12:53.580806Z",
+        "created_at": "2025-09-03T17:37:34.994704Z",
         "done": true,
         "done_reason": "stop",
-        "total_duration": 205732750,
-        "load_duration": 98967000,
+        "total_duration": 339570875,
+        "load_duration": 262794125,
         "prompt_eval_count": 213,
-        "prompt_eval_duration": 86000000,
+        "prompt_eval_duration": 64061000,
         "eval_count": 2,
-        "eval_duration": 18000000,
+        "eval_duration": 11839042,
         "response": "safe",
         "thinking": null,
         "context": null
diff --git a/tests/integration/recordings/responses/178016edef0e.json b/tests/integration/recordings/responses/178016edef0e.json
index be545c221..83746aa33 100644
--- a/tests/integration/recordings/responses/178016edef0e.json
+++ b/tests/integration/recordings/responses/178016edef0e.json
@@ -20,15 +20,15 @@
       "__type__": "ollama._types.GenerateResponse",
       "__data__": {
         "model": "llama-guard3:1b",
-        "created_at": "2025-08-01T23:12:52.354566Z",
+        "created_at": "2025-09-03T17:37:33.769233Z",
         "done": true,
         "done_reason": "stop",
-        "total_duration": 605192500,
-        "load_duration": 457087166,
+        "total_duration": 253836584,
+        "load_duration": 138624959,
         "prompt_eval_count": 210,
-        "prompt_eval_duration": 63000000,
+        "prompt_eval_duration": 69496125,
         "eval_count": 5,
-        "eval_duration": 84000000,
+        "eval_duration": 45062833,
         "response": "unsafe\nS12",
         "thinking": null,
         "context": null
diff --git a/tests/integration/recordings/responses/197228e26971.json b/tests/integration/recordings/responses/197228e26971.json
index 6c1730df2..4fa9e2126 100644
--- a/tests/integration/recordings/responses/197228e26971.json
+++ b/tests/integration/recordings/responses/197228e26971.json
@@ -20,15 +20,15 @@
       "__type__": "ollama._types.GenerateResponse",
       "__data__": {
         "model": "llama-guard3:1b",
-        "created_at": "2025-08-01T23:12:52.686478Z",
+        "created_at": "2025-09-03T17:37:34.074233Z",
         "done": true,
         "done_reason": "stop",
-        "total_duration": 304136208,
-        "load_duration": 155977000,
+        "total_duration": 270746375,
+        "load_duration": 156423042,
         "prompt_eval_count": 213,
-        "prompt_eval_duration": 71000000,
+        "prompt_eval_duration": 70338083,
         "eval_count": 5,
-        "eval_duration": 76000000,
+        "eval_duration": 43379167,
         "response": "unsafe\nS2",
         "thinking": null,
         "context": null
diff --git a/tests/integration/recordings/responses/198ef7208389.json b/tests/integration/recordings/responses/198ef7208389.json
index b196d3be2..f0f9d6a7d 100644
--- a/tests/integration/recordings/responses/198ef7208389.json
+++ b/tests/integration/recordings/responses/198ef7208389.json
@@ -20,15 +20,15 @@
       "__type__": "ollama._types.GenerateResponse",
       "__data__": {
         "model": "llama-guard3:1b",
-        "created_at": "2025-08-01T23:12:51.186501Z",
+        "created_at": "2025-09-03T17:37:32.84197Z",
         "done": true,
         "done_reason": "stop",
-        "total_duration": 3146184459,
-        "load_duration": 2533467917,
+        "total_duration": 21572898667,
+        "load_duration": 21155275042,
         "prompt_eval_count": 212,
-        "prompt_eval_duration": 526000000,
+        "prompt_eval_duration": 371898125,
         "eval_count": 5,
-        "eval_duration": 83000000,
+        "eval_duration": 43290458,
         "response": "unsafe\nS1",
         "thinking": null,
         "context": null
diff --git a/tests/integration/recordings/responses/1adfaa0e062e.json b/tests/integration/recordings/responses/1adfaa0e062e.json
index 5a3d44394..253c230d9 100644
--- a/tests/integration/recordings/responses/1adfaa0e062e.json
+++ b/tests/integration/recordings/responses/1adfaa0e062e.json
@@ -20,15 +20,15 @@
       "__type__": "ollama._types.GenerateResponse",
       "__data__": {
         "model": "llama-guard3:1b",
-        "created_at": "2025-08-01T23:12:53.332041Z",
+        "created_at": "2025-09-03T17:37:34.607413Z",
         "done": true,
         "done_reason": "stop",
-        "total_duration": 365895333,
-        "load_duration": 257825208,
+        "total_duration": 267812042,
+        "load_duration": 181570000,
         "prompt_eval_count": 213,
-        "prompt_eval_duration": 78000000,
+        "prompt_eval_duration": 73947375,
         "eval_count": 2,
-        "eval_duration": 28000000,
+        "eval_duration": 11708000,
         "response": "safe",
         "thinking": null,
         "context": null
diff --git a/tests/integration/recordings/responses/1b8394f90636.json b/tests/integration/recordings/responses/1b8394f90636.json
index f5885805b..6857c6840 100644
--- a/tests/integration/recordings/responses/1b8394f90636.json
+++ b/tests/integration/recordings/responses/1b8394f90636.json
@@ -22,15 +22,15 @@
       "__type__": "ollama._types.GenerateResponse",
       "__data__": {
         "model": "llama3.2:3b-instruct-fp16",
-        "created_at": "2025-08-04T22:55:05.685988Z",
+        "created_at": "2025-09-03T17:36:13.821929Z",
         "done": true,
         "done_reason": "stop",
-        "total_duration": 14128980625,
-        "load_duration": 7220159208,
+        "total_duration": 1907912167,
+        "load_duration": 90979292,
         "prompt_eval_count": 18,
-        "prompt_eval_duration": 4658000000,
+        "prompt_eval_duration": 77350291,
         "eval_count": 43,
-        "eval_duration": 2224000000,
+        "eval_duration": 1738568334,
         "response": " _______.\n\nThe best answer is blue. The traditional nursery rhyme goes like this:\n\nRoses are red,\nViolets are blue,\nSugar is sweet,\nAnd so are you! (Or something similar.)",
         "thinking": null,
         "context": null
diff --git a/tests/integration/recordings/responses/1b92be674e2a.json b/tests/integration/recordings/responses/1b92be674e2a.json
index 2ed061949..e5f05bf54 100644
--- a/tests/integration/recordings/responses/1b92be674e2a.json
+++ b/tests/integration/recordings/responses/1b92be674e2a.json
@@ -20,15 +20,15 @@
       "__type__": "ollama._types.GenerateResponse",
       "__data__": {
         "model": "llama3.2:3b-instruct-fp16",
-        "created_at": "2025-07-31T17:50:06.140190726Z",
+        "created_at": "2025-09-03T17:39:38.236797Z",
         "done": true,
         "done_reason": "stop",
-        "total_duration": 5213341378,
-        "load_duration": 43943569,
+        "total_duration": 1296281500,
+        "load_duration": 283393917,
         "prompt_eval_count": 23,
-        "prompt_eval_duration": 1049424427,
+        "prompt_eval_duration": 75453042,
         "eval_count": 24,
-        "eval_duration": 4119422888,
+        "eval_duration": 936860125,
         "response": "Mark Zuckerberg is the founder, chairman and CEO of Meta, which he originally founded as Facebook in 2004.",
         "thinking": null,
         "context": null
diff --git a/tests/integration/recordings/responses/1e11c2b20ff8.json b/tests/integration/recordings/responses/1e11c2b20ff8.json
index 98e855fdf..6131b1d5e 100644
--- a/tests/integration/recordings/responses/1e11c2b20ff8.json
+++ b/tests/integration/recordings/responses/1e11c2b20ff8.json
@@ -20,390 +20,390 @@
         "data": [
           {
             "embedding": [
-              0.042499725,
-              -0.061890375,
-              -0.07846951,
-              0.006408736,
-              0.031287834,
-              0.008066364,
-              0.058032244,
-              0.025457833,
-              0.016401615,
-              0.04601607,
-              -0.028947692,
-              0.04452766,
-              0.056886304,
-              -0.0153307365,
-              -0.070184045,
-              -0.057157565,
-              -0.0768682,
-              0.0067744707,
-              0.0043326365,
-              -0.1236485,
-              0.0031424984,
-              -0.032562014,
-              -0.029376298,
-              0.024144078,
-              -0.028531333,
-              0.102257624,
-              0.0021518522,
-              -0.0069792354,
-              0.02530627,
-              -0.055496883,
-              0.031227645,
-              -0.0070384145,
-              0.08432449,
-              -0.028390806,
-              -0.083012834,
-              0.009549195,
-              -0.020060178,
-              -0.00240923,
-              -0.007700305,
-              -0.023067193,
-              -0.092922784,
-              -0.04261493,
-              -0.019990565,
-              0.008238936,
-              0.060982026,
-              0.05032288,
-              -0.051029027,
-              -0.008544468,
-              -0.030194579,
-              -0.035787255,
-              -0.17837463,
-              -0.047271743,
-              0.033892605,
-              0.031609993,
-              -0.0088130655,
-              0.10480617,
-              0.03355418,
-              0.09033605,
-              -0.01574583,
-              -0.012574861,
-              -0.08468548,
-              -0.114774585,
-              -0.13755703,
-              0.021649128,
-              0.047812033,
-              0.043242246,
-              0.008644588,
-              0.03873661,
-              0.046728984,
-              -0.07743038,
-              -0.0488837,
-              0.031276364,
-              0.022359744,
-              0.00040771137,
-              0.05229871,
-              -0.012229048,
-              -0.035172377,
-              -0.008257451,
-              -0.0088830395,
-              -0.034264818,
-              -0.045780584,
-              0.0024807125,
-              -0.040849846,
-              0.080489986,
-              0.09471281,
-              0.041345056,
-              0.005824089,
-              0.04501066,
-              0.025380718,
-              0.006616412,
-              0.010480027,
-              -0.07959875,
-              -0.03109039,
-              -0.035281006,
-              0.018305738,
-              0.053488795,
-              0.06565703,
-              -0.07258639,
-              0.025227,
-              0.10518925,
-              0.035734728,
-              0.02812301,
-              0.0116889635,
-              0.04420422,
-              0.012585445,
-              0.0018629873,
-              0.03925016,
-              0.043145437,
-              0.097845145,
-              -0.08803666,
-              -0.060626414,
-              0.026821595,
-              0.0041026343,
-              0.033468857,
-              0.011819169,
-              0.009573708,
-              -0.009524407,
-              -0.021213718,
-              -0.008906247,
-              0.029348776,
-              -0.012694493,
-              -0.019262077,
-              0.009897482,
-              -0.008127538,
-              0.018616533,
-              -0.00074092194,
-              -0.056122895,
-              -3.8021082e-33,
-              0.020863937,
-              0.0047333767,
-              0.019744372,
-              0.060233314,
-              -0.06857584,
-              -0.07498767,
-              0.007997102,
-              -0.04733539,
-              0.05782872,
-              0.049535874,
-              0.018785646,
-              0.032732572,
-              0.017672436,
-              0.074836925,
-              0.024971113,
-              -0.011844539,
-              -0.11211646,
-              0.007026034,
-              0.028080462,
-              -0.017474122,
-              0.0817653,
-              -0.007904061,
-              0.03210623,
-              -0.122978985,
-              0.03375521,
-              0.02587286,
-              -0.004479943,
-              0.07948923,
-              0.004065995,
-              0.033063736,
-              0.008058094,
-              0.013444748,
-              -0.032908894,
-              0.031558145,
-              0.040147394,
-              0.001501024,
-              0.030767068,
-              0.029500617,
-              0.041341957,
-              -0.047430623,
-              0.039448265,
-              -0.075250365,
-              0.037944954,
-              -0.026018769,
-              0.016939783,
-              0.013666865,
-              0.007116529,
-              -0.053848118,
-              -0.074419044,
-              -0.006100011,
-              0.024430456,
-              -0.03985037,
-              -0.02065548,
-              -0.033364378,
-              0.008992889,
-              0.12111313,
-              -0.028268464,
-              -0.03619572,
-              -0.021325285,
-              0.05334936,
-              0.051584847,
-              -0.01202104,
-              0.03557552,
-              0.054104213,
-              0.06071252,
-              0.071583234,
-              0.042997945,
-              0.008561662,
-              0.07422672,
-              0.008418425,
-              -0.036365964,
-              -0.008559546,
-              -0.08816671,
-              -0.04907638,
-              0.00028750877,
-              -0.051279917,
-              0.035895903,
-              -0.030404305,
-              -0.012635731,
-              0.018795075,
-              0.017144373,
-              -0.06645754,
-              0.023793342,
-              0.000993731,
-              -0.01938052,
-              -0.05343233,
-              -0.017068349,
-              -0.06219081,
-              -0.059607625,
-              -0.012196407,
-              -0.0131753115,
-              -0.03705957,
-              0.0008210978,
-              0.09808552,
-              0.024671523,
-              2.1774687e-33,
-              -0.010076338,
-              -0.016777446,
-              -0.042147383,
-              0.08836867,
-              -0.028899672,
-              -0.0048874663,
-              -0.08209485,
-              0.029246984,
-              -0.04308444,
-              -0.014178017,
-              -0.028403133,
-              0.025991142,
-              -0.017637307,
-              0.04654231,
-              -0.0057748524,
-              0.029987331,
-              0.011357778,
-              0.017457604,
-              0.055051018,
-              0.03222884,
-              -0.07999247,
-              0.032465667,
-              -0.060007077,
-              -0.011553406,
-              0.010223051,
-              0.04651086,
-              0.0011846055,
-              0.07870393,
-              -0.044612467,
-              0.032810863,
-              0.0023138348,
-              -0.03884047,
-              -0.017668914,
-              0.079135194,
-              -0.004594527,
-              0.043508377,
-              -0.031625524,
-              0.008872064,
-              -0.050121736,
-              0.06896808,
-              0.043688085,
-              0.019938715,
-              -0.08469436,
-              -0.046897292,
-              -0.006832939,
-              -0.026140738,
-              -0.05106749,
-              0.054356705,
-              0.030691773,
-              -0.010932293,
-              0.047189884,
-              -0.01740432,
-              -0.020789616,
-              -0.08175918,
-              -0.027700473,
-              0.035974283,
-              0.05395729,
-              0.04489479,
-              0.059698317,
-              0.041220855,
-              -0.066653565,
-              -0.09200203,
-              0.008937433,
-              0.02581428,
-              -0.03863856,
-              -0.0043950165,
-              -0.05208163,
-              0.02743701,
-              0.012093444,
-              0.048299577,
-              0.059836566,
-              0.09734695,
-              -0.053629622,
-              -0.07637932,
-              0.015765766,
-              -0.044513486,
-              -0.13213192,
-              -0.07024786,
-              -0.10133136,
-              -0.11906537,
-              -0.027716314,
-              0.0068639666,
-              -0.0053682425,
-              0.054165307,
-              -0.11115557,
-              0.07837099,
-              0.03506696,
-              0.016077982,
-              0.021501223,
-              -0.061516896,
-              0.007429458,
-              0.048352152,
-              -0.013604487,
-              0.012456823,
-              -0.12730241,
-              -1.40081795e-08,
-              -0.040906876,
-              -0.015950777,
-              0.060046297,
-              0.038068157,
-              0.066364,
-              0.04727011,
-              -0.01611309,
-              0.09689113,
-              -0.044232138,
-              -0.028793652,
-              -0.012945379,
-              0.01303288,
-              0.022385143,
-              0.047113802,
-              0.06399741,
-              0.12131601,
-              0.060635034,
-              0.102205545,
-              -0.07575499,
-              -0.02380431,
-              0.12489149,
-              -0.045490686,
-              0.09547224,
-              0.021274548,
-              0.0373141,
-              -0.07523771,
-              -0.0026329542,
-              0.047245234,
-              0.048495702,
-              0.12357625,
-              0.018002188,
-              0.013794,
-              -0.03588812,
-              -0.05179344,
-              0.061835315,
-              0.051598098,
-              0.008910207,
-              -0.12502904,
-              0.016457288,
-              -0.08591687,
-              -0.07110172,
-              0.06984138,
-              -0.036050156,
-              -0.005367899,
-              -0.048767615,
-              0.0008031624,
-              -0.021520091,
-              -0.061076768,
-              0.002495028,
-              -0.032736864,
-              0.045757275,
-              0.0389445,
-              -0.024670867,
-              0.025894105,
-              0.10298855,
-              -0.01300183,
-              0.04781103,
-              -0.071152866,
-              0.04602928,
-              0.08051811,
-              -0.10304887,
-              0.0844638,
-              0.028001137,
-              -0.036985613
+              0.042460807,
+              -0.06189971,
+              -0.0784711,
+              0.0064329687,
+              0.03129365,
+              0.00807445,
+              0.05801836,
+              0.025447326,
+              0.016402787,
+              0.045995634,
+              -0.028924342,
+              0.04451832,
+              0.05686613,
+              -0.015340794,
+              -0.07020505,
+              -0.057178136,
+              -0.07683263,
+              0.006748679,
+              0.0043323045,
+              -0.123651944,
+              0.0031534543,
+              -0.03258051,
+              -0.02936216,
+              0.024140852,
+              -0.028559243,
+              0.10224467,
+              0.0021632623,
+              -0.006975691,
+              0.025292527,
+              -0.055500276,
+              0.031231727,
+              -0.0070274337,
+              0.08430815,
+              -0.028431177,
+              -0.083029,
+              0.009555893,
+              -0.020029299,
+              -0.00243229,
+              -0.00768719,
+              -0.023077851,
+              -0.09293533,
+              -0.042625993,
+              -0.020000124,
+              0.008240663,
+              0.060970567,
+              0.050315727,
+              -0.0510085,
+              -0.008543903,
+              -0.030227834,
+              -0.03582846,
+              -0.17836656,
+              -0.047279052,
+              0.033892106,
+              0.031623542,
+              -0.008832113,
+              0.10480918,
+              0.033559043,
+              0.090348184,
+              -0.015757555,
+              -0.0125672715,
+              -0.084686965,
+              -0.114781834,
+              -0.13755985,
+              0.021652374,
+              0.047834594,
+              0.043243896,
+              0.008659893,
+              0.038724966,
+              0.046716973,
+              -0.077413626,
+              -0.04887495,
+              0.031287406,
+              0.022356613,
+              0.00043283988,
+              0.052321073,
+              -0.012254071,
+              -0.035172574,
+              -0.00825216,
+              -0.008866574,
+              -0.034267236,
+              -0.04576201,
+              0.002467568,
+              -0.040877618,
+              0.08047682,
+              0.09472728,
+              0.0413438,
+              0.0057974122,
+              0.044982508,
+              0.025369909,
+              0.006618073,
+              0.010467276,
+              -0.07960384,
+              -0.03108485,
+              -0.03528749,
+              0.01831391,
+              0.053473305,
+              0.06568304,
+              -0.07259002,
+              0.02523736,
+              0.10520362,
+              0.035732146,
+              0.028157586,
+              0.011687256,
+              0.044207197,
+              0.012604437,
+              0.0018819098,
+              0.03926183,
+              0.043135095,
+              0.09784739,
+              -0.08801336,
+              -0.06060836,
+              0.02681984,
+              0.0041358666,
+              0.033492945,
+              0.011799116,
+              0.009551661,
+              -0.0095491735,
+              -0.021212189,
+              -0.008917248,
+              0.029352615,
+              -0.012693442,
+              -0.019269384,
+              0.009901157,
+              -0.00812101,
+              0.018603146,
+              -0.0007501193,
+              -0.056115113,
+              -3.8018077e-33,
+              0.020848714,
+              0.0047160466,
+              0.019726405,
+              0.06024251,
+              -0.0685974,
+              -0.07497267,
+              0.007997452,
+              -0.047339544,
+              0.057801835,
+              0.049544968,
+              0.01878086,
+              0.03274472,
+              0.017663997,
+              0.07483022,
+              0.02496901,
+              -0.011843339,
+              -0.11212756,
+              0.0070379525,
+              0.028099466,
+              -0.01746246,
+              0.08173482,
+              -0.007920462,
+              0.032095373,
+              -0.12300146,
+              0.033773854,
+              0.025873141,
+              -0.0045020077,
+              0.079493225,
+              0.0040725255,
+              0.03305898,
+              0.008061117,
+              0.0134422695,
+              -0.03292251,
+              0.031554114,
+              0.04013794,
+              0.0014983519,
+              0.030762345,
+              0.029481992,
+              0.041350223,
+              -0.047438618,
+              0.03944708,
+              -0.07526981,
+              0.037927423,
+              -0.026016014,
+              0.016933467,
+              0.0136799775,
+              0.0071263947,
+              -0.05386736,
+              -0.07443268,
+              -0.006070775,
+              0.024427462,
+              -0.039844982,
+              -0.020661902,
+              -0.033354662,
+              0.009005565,
+              0.12111172,
+              -0.028260944,
+              -0.036192853,
+              -0.021332363,
+              0.05333571,
+              0.05161245,
+              -0.01204843,
+              0.035563566,
+              0.05408247,
+              0.060722187,
+              0.07159865,
+              0.04299143,
+              0.008544481,
+              0.07421879,
+              0.00841512,
+              -0.036342908,
+              -0.008549791,
+              -0.08816386,
+              -0.049075164,
+              0.00029373015,
+              -0.05127952,
+              0.03586739,
+              -0.030380003,
+              -0.012642127,
+              0.018771531,
+              0.01711824,
+              -0.06644723,
+              0.023793438,
+              0.0010271219,
+              -0.01939443,
+              -0.053452212,
+              -0.017060323,
+              -0.062207118,
+              -0.05962535,
+              -0.012172617,
+              -0.013190802,
+              -0.037036054,
+              0.00082622556,
+              0.098088354,
+              0.024690514,
+              2.1767905e-33,
+              -0.010088812,
+              -0.016811697,
+              -0.042140447,
+              0.08837209,
+              -0.028899776,
+              -0.0048947735,
+              -0.082139015,
+              0.029238816,
+              -0.043079354,
+              -0.014153092,
+              -0.028387645,
+              0.025998218,
+              -0.017625,
+              0.046511114,
+              -0.005768211,
+              0.030010609,
+              0.011375536,
+              0.017426634,
+              0.055062976,
+              0.032230247,
+              -0.07995765,
+              0.032486655,
+              -0.060016844,
+              -0.011561194,
+              0.010211269,
+              0.046528235,
+              0.001191399,
+              0.0786961,
+              -0.0446158,
+              0.032789085,
+              0.0023115936,
+              -0.03886269,
+              -0.017663589,
+              0.07913024,
+              -0.004583343,
+              0.043521065,
+              -0.031589273,
+              0.008867868,
+              -0.05013296,
+              0.068929516,
+              0.043675046,
+              0.019968731,
+              -0.08471742,
+              -0.046864275,
+              -0.0068198936,
+              -0.026138468,
+              -0.05107216,
+              0.054374695,
+              0.03069186,
+              -0.010925094,
+              0.04721093,
+              -0.017387696,
+              -0.020754937,
+              -0.081763394,
+              -0.027709637,
+              0.035980806,
+              0.05396534,
+              0.044874854,
+              0.059699643,
+              0.041227758,
+              -0.06664364,
+              -0.09201654,
+              0.008915574,
+              0.025849758,
+              -0.038651932,
+              -0.0044070315,
+              -0.052066546,
+              0.027435115,
+              0.012089562,
+              0.048306923,
+              0.059854515,
+              0.097325735,
+              -0.053612895,
+              -0.07639326,
+              0.015773866,
+              -0.0444848,
+              -0.13214406,
+              -0.0702488,
+              -0.10134438,
+              -0.11905995,
+              -0.027714504,
+              0.006891868,
+              -0.0053650527,
+              0.054135524,
+              -0.111159205,
+              0.07835098,
+              0.03506018,
+              0.016036613,
+              0.021490784,
+              -0.061526407,
+              0.007425222,
+              0.04833579,
+              -0.01361202,
+              0.012450488,
+              -0.12729599,
+              -1.4009424e-08,
+              -0.040908325,
+              -0.01596458,
+              0.060048707,
+              0.03804525,
+              0.0663794,
+              0.04727275,
+              -0.016112225,
+              0.09687414,
+              -0.04424251,
+              -0.028799534,
+              -0.01294642,
+              0.013026413,
+              0.022404836,
+              0.04713173,
+              0.06402557,
+              0.12130648,
+              0.06062839,
+              0.10218965,
+              -0.0757528,
+              -0.023806982,
+              0.12489501,
+              -0.045460615,
+              0.09545599,
+              0.021262301,
+              0.03731495,
+              -0.075220875,
+              -0.0026194793,
+              0.0472452,
+              0.048499025,
+              0.12358729,
+              0.017998053,
+              0.013811017,
+              -0.035893846,
+              -0.051789004,
+              0.06182457,
+              0.05160056,
+              0.008895317,
+              -0.12500942,
+              0.016453298,
+              -0.08590811,
+              -0.071096726,
+              0.06987216,
+              -0.036072273,
+              -0.0053715096,
+              -0.048762616,
+              0.00081640907,
+              -0.021502526,
+              -0.061078615,
+              0.002485032,
+              -0.032720752,
+              0.045743283,
+              0.038934175,
+              -0.024666062,
+              0.025897244,
+              0.10301431,
+              -0.013001504,
+              0.04783332,
+              -0.07114252,
+              0.046031926,
+              0.080549754,
+              -0.10302451,
+              0.08449227,
+              0.028010191,
+              -0.03697792
             ],
             "index": 0,
             "object": "embedding"
diff --git a/tests/integration/recordings/responses/211b1562d4e6.json b/tests/integration/recordings/responses/211b1562d4e6.json
index ba254a166..2d0044e27 100644
--- a/tests/integration/recordings/responses/211b1562d4e6.json
+++ b/tests/integration/recordings/responses/211b1562d4e6.json
@@ -20,15 +20,15 @@
       "__type__": "ollama._types.GenerateResponse",
       "__data__": {
         "model": "llama3.2:3b-instruct-fp16",
-        "created_at": "2025-08-04T22:55:11.15982Z",
+        "created_at": "2025-09-03T17:36:17.894986Z",
         "done": true,
         "done_reason": "stop",
-        "total_duration": 498612042,
-        "load_duration": 71411834,
+        "total_duration": 363397458,
+        "load_duration": 86692791,
         "prompt_eval_count": 23,
-        "prompt_eval_duration": 102000000,
+        "prompt_eval_duration": 68658541,
         "eval_count": 6,
-        "eval_duration": 323000000,
+        "eval_duration": 207389084,
         "response": "Humans live on Earth.",
         "thinking": null,
         "context": null
diff --git a/tests/integration/recordings/responses/23506e73bb9e.json b/tests/integration/recordings/responses/23506e73bb9e.json
index d6e34c3f9..20ec9f1d1 100644
--- a/tests/integration/recordings/responses/23506e73bb9e.json
+++ b/tests/integration/recordings/responses/23506e73bb9e.json
@@ -20,390 +20,390 @@
         "data": [
           {
             "embedding": [
-              -0.055977955,
-              0.075997174,
-              -0.09249559,
-              0.014318654,
-              0.05876127,
-              -0.032458965,
-              0.020946832,
-              0.028819378,
-              -0.06590933,
-              0.013517223,
-              0.13000485,
-              0.0045786807,
-              -0.0069082035,
-              -0.055431433,
-              -0.04756826,
-              -0.02912152,
-              -0.12239366,
-              -0.05359766,
-              -0.014712379,
-              0.059826344,
-              0.034466766,
-              0.02072927,
-              -0.048724595,
-              0.013531463,
-              0.05862551,
-              -0.0030636105,
-              -0.031532496,
-              0.08256397,
-              -0.031230088,
-              -0.12059464,
-              0.03833127,
-              0.06573049,
-              0.064165965,
-              0.03838281,
-              0.12570563,
-              0.031128457,
-              0.10817016,
-              -0.001977333,
-              -0.024726717,
-              0.028785817,
-              0.012688804,
-              -0.039854225,
-              0.043296516,
-              -0.015909227,
-              -0.013514834,
-              -0.005097704,
-              -0.007898244,
-              0.0397803,
-              0.0037018042,
-              -0.03366439,
-              -0.058511946,
-              0.0048645996,
-              -0.08961216,
-              -0.010436317,
-              0.05919557,
-              -0.020386472,
-              0.014281465,
-              0.013961121,
-              -0.0045877,
-              0.03835435,
-              0.004833604,
-              0.029750798,
-              -0.02082645,
-              0.018628312,
-              0.124215424,
-              -0.023262355,
-              -0.0403046,
-              -0.023597443,
-              -0.0074503124,
-              -0.09082856,
-              -0.16860788,
-              0.010149646,
-              -0.03580583,
-              0.0105862,
-              -0.02046927,
-              0.0021231866,
-              -0.109239034,
-              0.007925489,
-              0.048885852,
-              -0.11390797,
-              -0.060719617,
-              -0.13435687,
-              0.006331373,
-              -0.008848544,
-              -0.031521764,
-              0.09917924,
-              0.055304468,
-              0.0068802955,
-              -0.023466706,
-              -0.0031231036,
-              0.036759574,
-              0.014334804,
-              0.022158744,
-              0.04709372,
-              0.007092632,
-              0.06810656,
-              0.018511463,
-              0.040857043,
-              0.05504883,
-              0.09488118,
-              -0.01585433,
-              -0.000100159355,
-              0.01078331,
-              0.09177411,
-              -0.07465409,
-              -0.064712845,
-              0.070150875,
-              -0.044969488,
-              0.057672877,
-              -0.026067073,
-              0.0063218353,
-              -0.094980195,
-              -0.010527798,
-              -0.07887331,
-              0.039760627,
-              -0.041514914,
-              -0.055244483,
-              0.07536157,
-              -0.046700213,
-              0.03613181,
-              0.08028084,
-              -0.03635332,
-              -0.034757905,
-              0.0169972,
-              -0.04701302,
-              -0.06517364,
-              0.06215512,
-              -4.2211668e-33,
-              -0.001730556,
-              -0.09387539,
-              -0.029811831,
-              0.12576838,
-              0.03797533,
-              -0.036525473,
-              0.0060974187,
-              0.059078563,
-              -0.110772625,
-              0.005687099,
-              -0.025972685,
-              -0.074838035,
-              0.0083624,
-              0.0274395,
-              -0.052505072,
-              0.023982009,
-              -0.004383019,
-              0.03933067,
-              -0.0421536,
-              -0.0273022,
-              0.05469264,
-              0.027077684,
-              -0.033308104,
-              -0.060588703,
-              -0.050718505,
-              0.017972048,
-              -0.003501518,
-              -0.046666663,
-              0.073935315,
-              0.01332508,
-              -0.003336597,
-              -0.04653879,
-              -0.060137972,
-              0.034129404,
-              0.0015396234,
-              0.03913038,
-              0.039914686,
-              -0.012313295,
-              -0.03049878,
-              -0.001898293,
-              -0.014593095,
-              -0.013025945,
-              0.019526742,
-              -0.022328524,
-              0.07434842,
-              -0.05336983,
-              -0.02397039,
-              0.029210743,
-              0.027515827,
-              0.015095782,
-              -0.020450259,
-              0.043337505,
-              0.019659057,
-              0.01736381,
-              -0.0035567854,
-              0.019467248,
-              -0.0003600355,
-              0.0004236338,
-              -0.0051459596,
-              0.06621258,
-              0.027880289,
-              0.04102983,
-              -0.06717971,
-              0.028754033,
-              -0.03474935,
-              -0.055536743,
-              -0.032726888,
-              -0.08101375,
-              0.092146546,
-              0.06396539,
-              -0.04917468,
-              -0.039915428,
-              0.036926597,
-              -0.0015941713,
-              0.00030078198,
-              -0.026029347,
-              -0.006002226,
-              0.0547852,
-              -0.0956802,
-              -0.05187664,
-              -0.048835263,
-              -0.08641023,
-              -0.033999704,
-              -0.033261146,
-              -0.05655725,
-              -0.051167108,
-              0.008072844,
-              -0.08582387,
-              0.06508922,
-              -0.08545701,
-              0.027998457,
-              0.029824113,
-              -0.031671796,
-              -0.08560477,
-              0.101766,
-              2.1853336e-33,
-              0.011631667,
-              0.07766936,
-              -0.017357787,
-              0.00522221,
-              0.0009766584,
-              0.06540673,
-              0.07256414,
-              -0.044297714,
-              -0.04751489,
-              0.14031266,
-              -0.02573919,
-              0.005799934,
-              0.040961996,
-              -0.054869186,
-              0.074385494,
-              -0.023611594,
-              0.018366067,
-              -0.06055796,
-              -0.04411962,
-              0.0027609242,
-              -0.0457808,
-              0.11723751,
-              0.10269976,
-              0.079064004,
-              -0.046609085,
-              0.018625101,
-              0.02980095,
-              0.037249736,
-              0.022749124,
-              -0.002641677,
-              0.04173634,
-              0.06440922,
-              -0.08910874,
-              0.018179348,
-              0.024035122,
-              -0.09641835,
-              0.086450025,
-              -0.053884093,
-              0.01923183,
-              0.045059275,
-              0.045154754,
-              0.096540354,
-              0.014918263,
-              0.05959024,
-              0.03068157,
-              0.05884942,
-              0.11149687,
-              0.01664536,
-              0.011553633,
-              -0.023707153,
-              -0.008613074,
-              -0.055065807,
-              0.047565654,
-              -0.014617207,
-              -0.01412784,
-              0.06996046,
-              0.032047763,
-              0.04266437,
-              -0.053910665,
-              0.031057829,
-              0.009195878,
-              0.032976385,
-              -0.018986467,
-              0.00552569,
-              -0.014989692,
-              -0.09192638,
-              -0.032122552,
-              0.015356909,
-              0.02916829,
-              0.012490537,
-              -0.00481679,
-              0.02338388,
-              -0.028228622,
-              -0.0845363,
-              0.051079277,
-              -0.013396008,
-              -0.029029451,
-              -0.022589581,
-              0.010921808,
-              -0.009802942,
-              0.049751375,
-              -0.0032863966,
-              -0.038782034,
-              0.027910566,
-              0.017915333,
-              0.005342976,
-              0.058715835,
-              0.0958275,
-              -0.014351606,
-              0.006968306,
-              -0.027336437,
-              0.06917409,
-              0.057280898,
-              0.032035258,
-              0.004253816,
-              -1.6765805e-08,
-              -0.03635166,
-              -0.091484524,
-              -0.026345165,
-              -0.007943707,
-              -0.024149738,
-              0.09897989,
-              -0.04723456,
-              -0.037648056,
-              -0.029387534,
-              -0.022535043,
-              0.041274313,
-              -0.001120282,
-              -0.05565933,
-              0.020671127,
-              -0.03811821,
-              -0.052506164,
-              -0.026291005,
-              -0.053353462,
-              -0.040578876,
-              -0.0073704817,
-              -0.0014502247,
-              0.027114222,
-              0.02715861,
-              0.009327082,
-              -0.0002262999,
-              0.038208842,
-              0.037102137,
-              0.08402326,
-              -0.063428074,
-              -0.014857683,
-              0.0503535,
-              0.06702617,
-              0.027663387,
-              -0.04361141,
-              -0.012074137,
-              0.08499847,
-              0.11162084,
-              0.10458964,
-              0.019746903,
-              -0.0002763885,
-              -0.041129645,
-              0.009574697,
-              -0.05287082,
-              -0.0026483443,
-              -0.031138659,
-              -0.08863464,
-              -0.06762413,
-              -0.074503295,
-              -0.053003356,
-              -0.09557731,
-              -0.052699838,
-              0.013066509,
-              0.0029109598,
-              0.041860294,
-              -0.045234714,
-              0.01671661,
-              0.017218111,
-              0.021572877,
-              -0.037175495,
-              0.023540929,
-              0.051999625,
-              0.064441204,
-              0.023920247,
-              -0.025235547
+              -0.055990793,
+              0.076004684,
+              -0.09247725,
+              0.014340361,
+              0.058780864,
+              -0.032434482,
+              0.020954052,
+              0.028818125,
+              -0.06591213,
+              0.013541593,
+              0.12999941,
+              0.004603084,
+              -0.0069239275,
+              -0.055457443,
+              -0.047553156,
+              -0.029139794,
+              -0.12236376,
+              -0.05360872,
+              -0.014706594,
+              0.05984688,
+              0.034442738,
+              0.02076038,
+              -0.048697792,
+              0.0135388365,
+              0.058592733,
+              -0.003076384,
+              -0.031565297,
+              0.082541116,
+              -0.031259205,
+              -0.12057633,
+              0.038319625,
+              0.06574785,
+              0.06415721,
+              0.038382582,
+              0.12570712,
+              0.03108174,
+              0.10821103,
+              -0.0019794356,
+              -0.024704305,
+              0.028765837,
+              0.01268161,
+              -0.039844505,
+              0.043253522,
+              -0.015898596,
+              -0.0135526005,
+              -0.0050831717,
+              -0.007911988,
+              0.039783813,
+              0.0036548872,
+              -0.033632487,
+              -0.058547974,
+              0.0048877494,
+              -0.089586094,
+              -0.010457663,
+              0.059202507,
+              -0.020414542,
+              0.014278556,
+              0.013986488,
+              -0.0046022516,
+              0.0383391,
+              0.0048145773,
+              0.029772853,
+              -0.020863408,
+              0.018640704,
+              0.12422993,
+              -0.023236223,
+              -0.040323637,
+              -0.023598222,
+              -0.007448043,
+              -0.09083128,
+              -0.16859712,
+              0.01012451,
+              -0.035808884,
+              0.010595173,
+              -0.02050494,
+              0.0020821376,
+              -0.10925222,
+              0.00793264,
+              0.048889533,
+              -0.11391199,
+              -0.06072707,
+              -0.13435508,
+              0.0063265716,
+              -0.008838073,
+              -0.03153269,
+              0.099169336,
+              0.055310693,
+              0.0068571265,
+              -0.023463152,
+              -0.0031599961,
+              0.036782328,
+              0.014336826,
+              0.022220163,
+              0.047114056,
+              0.007079763,
+              0.06806425,
+              0.01851431,
+              0.040882625,
+              0.055058856,
+              0.09488346,
+              -0.015833577,
+              -7.924328e-05,
+              0.010821554,
+              0.09177704,
+              -0.07464829,
+              -0.06471165,
+              0.07013805,
+              -0.04499751,
+              0.057702336,
+              -0.0260911,
+              0.006323043,
+              -0.09500501,
+              -0.010549514,
+              -0.07887475,
+              0.039744847,
+              -0.04154404,
+              -0.055268157,
+              0.07540271,
+              -0.04667509,
+              0.036143072,
+              0.080297194,
+              -0.036381353,
+              -0.03477274,
+              0.01701203,
+              -0.047007203,
+              -0.06519774,
+              0.062141683,
+              -4.222482e-33,
+              -0.0017580023,
+              -0.09383388,
+              -0.02982657,
+              0.1257841,
+              0.03802007,
+              -0.03654342,
+              0.0060920226,
+              0.05906885,
+              -0.11074452,
+              0.005664566,
+              -0.0259852,
+              -0.074819505,
+              0.008342821,
+              0.027451068,
+              -0.05248069,
+              0.02401768,
+              -0.004380289,
+              0.039321493,
+              -0.04213744,
+              -0.027290314,
+              0.054677974,
+              0.02707243,
+              -0.03329442,
+              -0.060589895,
+              -0.050737355,
+              0.017969057,
+              -0.0035060972,
+              -0.04666249,
+              0.073946096,
+              0.01333894,
+              -0.0033873583,
+              -0.046544433,
+              -0.060105033,
+              0.03406923,
+              0.001542676,
+              0.039177947,
+              0.03989323,
+              -0.012346489,
+              -0.030511485,
+              -0.0019157606,
+              -0.014608986,
+              -0.012997742,
+              0.019522104,
+              -0.022349002,
+              0.074362256,
+              -0.053366993,
+              -0.023993475,
+              0.029225096,
+              0.027534606,
+              0.015111057,
+              -0.020442221,
+              0.043327376,
+              0.019660354,
+              0.017330697,
+              -0.0035011724,
+              0.019482937,
+              -0.0003428041,
+              0.0004143988,
+              -0.005117252,
+              0.06624799,
+              0.027922852,
+              0.041020587,
+              -0.067166425,
+              0.028737254,
+              -0.03478325,
+              -0.055551115,
+              -0.032713737,
+              -0.08099247,
+              0.09216284,
+              0.06395264,
+              -0.049168136,
+              -0.039908994,
+              0.036915958,
+              -0.001602359,
+              0.00033041168,
+              -0.026015632,
+              -0.005999889,
+              0.05474541,
+              -0.09568287,
+              -0.05186289,
+              -0.048838183,
+              -0.08639551,
+              -0.034023147,
+              -0.033257127,
+              -0.05651867,
+              -0.051131375,
+              0.00809173,
+              -0.08581851,
+              0.06507323,
+              -0.085427366,
+              0.027997404,
+              0.029847065,
+              -0.031673994,
+              -0.08560956,
+              0.1017672,
+              2.1855676e-33,
+              0.01160785,
+              0.077607885,
+              -0.017380483,
+              0.005239329,
+              0.0009684126,
+              0.06543702,
+              0.07256893,
+              -0.044318836,
+              -0.04749324,
+              0.14031002,
+              -0.025741624,
+              0.0057860985,
+              0.040946104,
+              -0.054880083,
+              0.074413285,
+              -0.023610368,
+              0.018364722,
+              -0.060585637,
+              -0.044149306,
+              0.0027854694,
+              -0.04580664,
+              0.1172219,
+              0.10268574,
+              0.07907412,
+              -0.0466143,
+              0.018618405,
+              0.029834948,
+              0.037265483,
+              0.02273822,
+              -0.0026589038,
+              0.041726097,
+              0.06439532,
+              -0.089163445,
+              0.018188318,
+              0.024064727,
+              -0.096389584,
+              0.08642254,
+              -0.05389359,
+              0.01923105,
+              0.045092683,
+              0.045125954,
+              0.09655961,
+              0.014908797,
+              0.059611585,
+              0.03066662,
+              0.05882299,
+              0.111484826,
+              0.016632542,
+              0.011590394,
+              -0.023702666,
+              -0.008617484,
+              -0.055030316,
+              0.047606383,
+              -0.014632687,
+              -0.014156344,
+              0.069926,
+              0.032047603,
+              0.042642817,
+              -0.053942375,
+              0.031047028,
+              0.009216673,
+              0.033024028,
+              -0.019033706,
+              0.005568194,
+              -0.014985451,
+              -0.09193244,
+              -0.03210824,
+              0.015367608,
+              0.029150328,
+              0.01250386,
+              -0.004827391,
+              0.023345906,
+              -0.028271332,
+              -0.08454125,
+              0.051068563,
+              -0.0133641455,
+              -0.029022738,
+              -0.02258452,
+              0.010884119,
+              -0.009810021,
+              0.049751773,
+              -0.0032637494,
+              -0.038813565,
+              0.027924104,
+              0.017925078,
+              0.005337612,
+              0.058691237,
+              0.09577674,
+              -0.014308608,
+              0.006972794,
+              -0.02733344,
+              0.06912433,
+              0.05727631,
+              0.03206042,
+              0.0042422824,
+              -1.6766318e-08,
+              -0.036354303,
+              -0.09146416,
+              -0.026319364,
+              -0.007941995,
+              -0.024127059,
+              0.09896698,
+              -0.04723083,
+              -0.03767135,
+              -0.029419973,
+              -0.022513283,
+              0.04125822,
+              -0.0011487947,
+              -0.05570366,
+              0.020679709,
+              -0.038118906,
+              -0.0524994,
+              -0.02624128,
+              -0.05336954,
+              -0.040593866,
+              -0.0073642326,
+              -0.0014442836,
+              0.02714257,
+              0.027141048,
+              0.00932513,
+              -0.00026505854,
+              0.038233075,
+              0.037096914,
+              0.08405413,
+              -0.06340637,
+              -0.014856458,
+              0.05038612,
+              0.06703033,
+              0.027668556,
+              -0.04360097,
+              -0.012041474,
+              0.08500689,
+              0.111594744,
+              0.1046117,
+              0.019726463,
+              -0.0003025109,
+              -0.04110389,
+              0.009575226,
+              -0.05285304,
+              -0.0026365265,
+              -0.031144748,
+              -0.08860188,
+              -0.06762232,
+              -0.07451522,
+              -0.053012833,
+              -0.09560941,
+              -0.05273455,
+              0.013032144,
+              0.0029190276,
+              0.041905046,
+              -0.04522114,
+              0.016730292,
+              0.017214278,
+              0.021578068,
+              -0.03718778,
+              0.02353425,
+              0.052041385,
+              0.06444499,
+              0.02387539,
+              -0.025236009
             ],
             "index": 0,
             "object": "embedding"
diff --git a/tests/integration/recordings/responses/2afe3b38ca01.json b/tests/integration/recordings/responses/2afe3b38ca01.json
index 4b5c82ad4..270d2744c 100644
--- a/tests/integration/recordings/responses/2afe3b38ca01.json
+++ b/tests/integration/recordings/responses/2afe3b38ca01.json
@@ -22,7 +22,7 @@
         "__type__": "ollama._types.GenerateResponse",
         "__data__": {
           "model": "llama3.2:3b-instruct-fp16",
-          "created_at": "2025-08-01T23:14:01.887809Z",
+          "created_at": "2025-09-03T17:37:50.436472Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -40,7 +40,7 @@
         "__type__": "ollama._types.GenerateResponse",
         "__data__": {
           "model": "llama3.2:3b-instruct-fp16",
-          "created_at": "2025-08-01T23:14:01.942369Z",
+          "created_at": "2025-09-03T17:37:50.478138Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -58,7 +58,7 @@
         "__type__": "ollama._types.GenerateResponse",
         "__data__": {
           "model": "llama3.2:3b-instruct-fp16",
-          "created_at": "2025-08-01T23:14:01.99605Z",
+          "created_at": "2025-09-03T17:37:50.519952Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -76,7 +76,7 @@
         "__type__": "ollama._types.GenerateResponse",
         "__data__": {
           "model": "llama3.2:3b-instruct-fp16",
-          "created_at": "2025-08-01T23:14:02.049974Z",
+          "created_at": "2025-09-03T17:37:50.561433Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -94,7 +94,7 @@
         "__type__": "ollama._types.GenerateResponse",
         "__data__": {
           "model": "llama3.2:3b-instruct-fp16",
-          "created_at": "2025-08-01T23:14:02.102027Z",
+          "created_at": "2025-09-03T17:37:50.603624Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -112,7 +112,7 @@
         "__type__": "ollama._types.GenerateResponse",
         "__data__": {
           "model": "llama3.2:3b-instruct-fp16",
-          "created_at": "2025-08-01T23:14:02.158416Z",
+          "created_at": "2025-09-03T17:37:50.645851Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -130,7 +130,7 @@
         "__type__": "ollama._types.GenerateResponse",
         "__data__": {
           "model": "llama3.2:3b-instruct-fp16",
-          "created_at": "2025-08-01T23:14:02.211753Z",
+          "created_at": "2025-09-03T17:37:50.688403Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -148,7 +148,7 @@
         "__type__": "ollama._types.GenerateResponse",
         "__data__": {
           "model": "llama3.2:3b-instruct-fp16",
-          "created_at": "2025-08-01T23:14:02.265564Z",
+          "created_at": "2025-09-03T17:37:50.72991Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -166,7 +166,7 @@
         "__type__": "ollama._types.GenerateResponse",
         "__data__": {
           "model": "llama3.2:3b-instruct-fp16",
-          "created_at": "2025-08-01T23:14:02.31618Z",
+          "created_at": "2025-09-03T17:37:50.771635Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -184,7 +184,7 @@
         "__type__": "ollama._types.GenerateResponse",
         "__data__": {
           "model": "llama3.2:3b-instruct-fp16",
-          "created_at": "2025-08-01T23:14:02.370325Z",
+          "created_at": "2025-09-03T17:37:50.813711Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -202,7 +202,7 @@
         "__type__": "ollama._types.GenerateResponse",
         "__data__": {
           "model": "llama3.2:3b-instruct-fp16",
-          "created_at": "2025-08-01T23:14:02.424667Z",
+          "created_at": "2025-09-03T17:37:50.856201Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -220,7 +220,7 @@
         "__type__": "ollama._types.GenerateResponse",
         "__data__": {
           "model": "llama3.2:3b-instruct-fp16",
-          "created_at": "2025-08-01T23:14:02.47913Z",
+          "created_at": "2025-09-03T17:37:50.899048Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -238,15 +238,15 @@
         "__type__": "ollama._types.GenerateResponse",
         "__data__": {
           "model": "llama3.2:3b-instruct-fp16",
-          "created_at": "2025-08-01T23:14:02.536984Z",
+          "created_at": "2025-09-03T17:37:50.94069Z",
           "done": true,
           "done_reason": "stop",
-          "total_duration": 1042724125,
-          "load_duration": 86161375,
+          "total_duration": 688370708,
+          "load_duration": 107469833,
           "prompt_eval_count": 399,
-          "prompt_eval_duration": 305000000,
+          "prompt_eval_duration": 74988334,
           "eval_count": 13,
-          "eval_duration": 650000000,
+          "eval_duration": 505216458,
           "response": "",
           "thinking": null,
           "context": null
diff --git a/tests/integration/recordings/responses/2d187a11704c.json b/tests/integration/recordings/responses/2d187a11704c.json
index fbfcb91f8..c0f746ffe 100644
--- a/tests/integration/recordings/responses/2d187a11704c.json
+++ b/tests/integration/recordings/responses/2d187a11704c.json
@@ -22,7 +22,7 @@
         "__type__": "ollama._types.GenerateResponse",
         "__data__": {
           "model": "llama3.2:3b-instruct-fp16",
-          "created_at": "2025-08-01T23:14:11.938867Z",
+          "created_at": "2025-09-03T17:37:56.566151Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -40,7 +40,7 @@
         "__type__": "ollama._types.GenerateResponse",
         "__data__": {
           "model": "llama3.2:3b-instruct-fp16",
-          "created_at": "2025-08-01T23:14:11.991247Z",
+          "created_at": "2025-09-03T17:37:56.609308Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -58,7 +58,7 @@
         "__type__": "ollama._types.GenerateResponse",
         "__data__": {
           "model": "llama3.2:3b-instruct-fp16",
-          "created_at": "2025-08-01T23:14:12.043953Z",
+          "created_at": "2025-09-03T17:37:56.651314Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -76,7 +76,7 @@
         "__type__": "ollama._types.GenerateResponse",
         "__data__": {
           "model": "llama3.2:3b-instruct-fp16",
-          "created_at": "2025-08-01T23:14:12.096001Z",
+          "created_at": "2025-09-03T17:37:56.693185Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -94,7 +94,7 @@
         "__type__": "ollama._types.GenerateResponse",
         "__data__": {
           "model": "llama3.2:3b-instruct-fp16",
-          "created_at": "2025-08-01T23:14:12.150454Z",
+          "created_at": "2025-09-03T17:37:56.734643Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -112,7 +112,7 @@
         "__type__": "ollama._types.GenerateResponse",
         "__data__": {
           "model": "llama3.2:3b-instruct-fp16",
-          "created_at": "2025-08-01T23:14:12.201249Z",
+          "created_at": "2025-09-03T17:37:56.776343Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -130,7 +130,7 @@
         "__type__": "ollama._types.GenerateResponse",
         "__data__": {
           "model": "llama3.2:3b-instruct-fp16",
-          "created_at": "2025-08-01T23:14:12.252534Z",
+          "created_at": "2025-09-03T17:37:56.81705Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -148,7 +148,7 @@
         "__type__": "ollama._types.GenerateResponse",
         "__data__": {
           "model": "llama3.2:3b-instruct-fp16",
-          "created_at": "2025-08-01T23:14:12.30063Z",
+          "created_at": "2025-09-03T17:37:56.857959Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -166,7 +166,7 @@
         "__type__": "ollama._types.GenerateResponse",
         "__data__": {
           "model": "llama3.2:3b-instruct-fp16",
-          "created_at": "2025-08-01T23:14:12.351034Z",
+          "created_at": "2025-09-03T17:37:56.899424Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -184,7 +184,7 @@
         "__type__": "ollama._types.GenerateResponse",
         "__data__": {
           "model": "llama3.2:3b-instruct-fp16",
-          "created_at": "2025-08-01T23:14:12.405032Z",
+          "created_at": "2025-09-03T17:37:56.939218Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -202,7 +202,7 @@
         "__type__": "ollama._types.GenerateResponse",
         "__data__": {
           "model": "llama3.2:3b-instruct-fp16",
-          "created_at": "2025-08-01T23:14:12.462645Z",
+          "created_at": "2025-09-03T17:37:56.980065Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -220,7 +220,7 @@
         "__type__": "ollama._types.GenerateResponse",
         "__data__": {
           "model": "llama3.2:3b-instruct-fp16",
-          "created_at": "2025-08-01T23:14:12.520337Z",
+          "created_at": "2025-09-03T17:37:57.02214Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -238,7 +238,7 @@
         "__type__": "ollama._types.GenerateResponse",
         "__data__": {
           "model": "llama3.2:3b-instruct-fp16",
-          "created_at": "2025-08-01T23:14:12.575809Z",
+          "created_at": "2025-09-03T17:37:57.0628Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -256,7 +256,7 @@
         "__type__": "ollama._types.GenerateResponse",
         "__data__": {
           "model": "llama3.2:3b-instruct-fp16",
-          "created_at": "2025-08-01T23:14:12.633724Z",
+          "created_at": "2025-09-03T17:37:57.106061Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -274,7 +274,7 @@
         "__type__": "ollama._types.GenerateResponse",
         "__data__": {
           "model": "llama3.2:3b-instruct-fp16",
-          "created_at": "2025-08-01T23:14:12.683133Z",
+          "created_at": "2025-09-03T17:37:57.1492Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -292,7 +292,7 @@
         "__type__": "ollama._types.GenerateResponse",
         "__data__": {
           "model": "llama3.2:3b-instruct-fp16",
-          "created_at": "2025-08-01T23:14:12.734309Z",
+          "created_at": "2025-09-03T17:37:57.190075Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -310,7 +310,7 @@
         "__type__": "ollama._types.GenerateResponse",
         "__data__": {
           "model": "llama3.2:3b-instruct-fp16",
-          "created_at": "2025-08-01T23:14:12.785917Z",
+          "created_at": "2025-09-03T17:37:57.23178Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -328,7 +328,7 @@
         "__type__": "ollama._types.GenerateResponse",
         "__data__": {
           "model": "llama3.2:3b-instruct-fp16",
-          "created_at": "2025-08-01T23:14:12.835705Z",
+          "created_at": "2025-09-03T17:37:57.272738Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -346,7 +346,7 @@
         "__type__": "ollama._types.GenerateResponse",
         "__data__": {
           "model": "llama3.2:3b-instruct-fp16",
-          "created_at": "2025-08-01T23:14:12.886509Z",
+          "created_at": "2025-09-03T17:37:57.313855Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -364,7 +364,7 @@
         "__type__": "ollama._types.GenerateResponse",
         "__data__": {
           "model": "llama3.2:3b-instruct-fp16",
-          "created_at": "2025-08-01T23:14:12.937134Z",
+          "created_at": "2025-09-03T17:37:57.354964Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -382,7 +382,7 @@
         "__type__": "ollama._types.GenerateResponse",
         "__data__": {
           "model": "llama3.2:3b-instruct-fp16",
-          "created_at": "2025-08-01T23:14:12.988532Z",
+          "created_at": "2025-09-03T17:37:57.395971Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -400,7 +400,7 @@
         "__type__": "ollama._types.GenerateResponse",
         "__data__": {
           "model": "llama3.2:3b-instruct-fp16",
-          "created_at": "2025-08-01T23:14:13.041798Z",
+          "created_at": "2025-09-03T17:37:57.438471Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -418,7 +418,7 @@
         "__type__": "ollama._types.GenerateResponse",
         "__data__": {
           "model": "llama3.2:3b-instruct-fp16",
-          "created_at": "2025-08-01T23:14:13.095443Z",
+          "created_at": "2025-09-03T17:37:57.479796Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -436,7 +436,7 @@
         "__type__": "ollama._types.GenerateResponse",
         "__data__": {
           "model": "llama3.2:3b-instruct-fp16",
-          "created_at": "2025-08-01T23:14:13.151402Z",
+          "created_at": "2025-09-03T17:37:57.520641Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -454,7 +454,7 @@
         "__type__": "ollama._types.GenerateResponse",
         "__data__": {
           "model": "llama3.2:3b-instruct-fp16",
-          "created_at": "2025-08-01T23:14:13.203462Z",
+          "created_at": "2025-09-03T17:37:57.561511Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -472,7 +472,7 @@
         "__type__": "ollama._types.GenerateResponse",
         "__data__": {
           "model": "llama3.2:3b-instruct-fp16",
-          "created_at": "2025-08-01T23:14:13.254567Z",
+          "created_at": "2025-09-03T17:37:57.602875Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -490,7 +490,7 @@
         "__type__": "ollama._types.GenerateResponse",
         "__data__": {
           "model": "llama3.2:3b-instruct-fp16",
-          "created_at": "2025-08-01T23:14:13.305865Z",
+          "created_at": "2025-09-03T17:37:57.643406Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -508,7 +508,7 @@
         "__type__": "ollama._types.GenerateResponse",
         "__data__": {
           "model": "llama3.2:3b-instruct-fp16",
-          "created_at": "2025-08-01T23:14:13.357658Z",
+          "created_at": "2025-09-03T17:37:57.684279Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -526,7 +526,7 @@
         "__type__": "ollama._types.GenerateResponse",
         "__data__": {
           "model": "llama3.2:3b-instruct-fp16",
-          "created_at": "2025-08-01T23:14:13.407773Z",
+          "created_at": "2025-09-03T17:37:57.725699Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -544,7 +544,7 @@
         "__type__": "ollama._types.GenerateResponse",
         "__data__": {
           "model": "llama3.2:3b-instruct-fp16",
-          "created_at": "2025-08-01T23:14:13.458919Z",
+          "created_at": "2025-09-03T17:37:57.766658Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -562,7 +562,7 @@
         "__type__": "ollama._types.GenerateResponse",
         "__data__": {
           "model": "llama3.2:3b-instruct-fp16",
-          "created_at": "2025-08-01T23:14:13.510456Z",
+          "created_at": "2025-09-03T17:37:57.80738Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -580,7 +580,7 @@
         "__type__": "ollama._types.GenerateResponse",
         "__data__": {
           "model": "llama3.2:3b-instruct-fp16",
-          "created_at": "2025-08-01T23:14:13.565948Z",
+          "created_at": "2025-09-03T17:37:57.848466Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -598,7 +598,7 @@
         "__type__": "ollama._types.GenerateResponse",
         "__data__": {
           "model": "llama3.2:3b-instruct-fp16",
-          "created_at": "2025-08-01T23:14:13.619155Z",
+          "created_at": "2025-09-03T17:37:57.889056Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -616,7 +616,7 @@
         "__type__": "ollama._types.GenerateResponse",
         "__data__": {
           "model": "llama3.2:3b-instruct-fp16",
-          "created_at": "2025-08-01T23:14:13.672754Z",
+          "created_at": "2025-09-03T17:37:57.931554Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -634,7 +634,7 @@
         "__type__": "ollama._types.GenerateResponse",
         "__data__": {
           "model": "llama3.2:3b-instruct-fp16",
-          "created_at": "2025-08-01T23:14:13.729473Z",
+          "created_at": "2025-09-03T17:37:57.974754Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -652,7 +652,7 @@
         "__type__": "ollama._types.GenerateResponse",
         "__data__": {
           "model": "llama3.2:3b-instruct-fp16",
-          "created_at": "2025-08-01T23:14:13.788666Z",
+          "created_at": "2025-09-03T17:37:58.016978Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -670,7 +670,7 @@
         "__type__": "ollama._types.GenerateResponse",
         "__data__": {
           "model": "llama3.2:3b-instruct-fp16",
-          "created_at": "2025-08-01T23:14:13.850575Z",
+          "created_at": "2025-09-03T17:37:58.057942Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -688,7 +688,7 @@
         "__type__": "ollama._types.GenerateResponse",
         "__data__": {
           "model": "llama3.2:3b-instruct-fp16",
-          "created_at": "2025-08-01T23:14:13.904807Z",
+          "created_at": "2025-09-03T17:37:58.099015Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -706,7 +706,7 @@
         "__type__": "ollama._types.GenerateResponse",
         "__data__": {
           "model": "llama3.2:3b-instruct-fp16",
-          "created_at": "2025-08-01T23:14:13.958524Z",
+          "created_at": "2025-09-03T17:37:58.140531Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -724,7 +724,7 @@
         "__type__": "ollama._types.GenerateResponse",
         "__data__": {
           "model": "llama3.2:3b-instruct-fp16",
-          "created_at": "2025-08-01T23:14:14.011742Z",
+          "created_at": "2025-09-03T17:37:58.181382Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -742,7 +742,7 @@
         "__type__": "ollama._types.GenerateResponse",
         "__data__": {
           "model": "llama3.2:3b-instruct-fp16",
-          "created_at": "2025-08-01T23:14:14.064933Z",
+          "created_at": "2025-09-03T17:37:58.223318Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -760,7 +760,7 @@
         "__type__": "ollama._types.GenerateResponse",
         "__data__": {
           "model": "llama3.2:3b-instruct-fp16",
-          "created_at": "2025-08-01T23:14:14.116454Z",
+          "created_at": "2025-09-03T17:37:58.26358Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -778,7 +778,7 @@
         "__type__": "ollama._types.GenerateResponse",
         "__data__": {
           "model": "llama3.2:3b-instruct-fp16",
-          "created_at": "2025-08-01T23:14:14.172682Z",
+          "created_at": "2025-09-03T17:37:58.305496Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -796,7 +796,7 @@
         "__type__": "ollama._types.GenerateResponse",
         "__data__": {
           "model": "llama3.2:3b-instruct-fp16",
-          "created_at": "2025-08-01T23:14:14.227654Z",
+          "created_at": "2025-09-03T17:37:58.347254Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -814,7 +814,7 @@
         "__type__": "ollama._types.GenerateResponse",
         "__data__": {
           "model": "llama3.2:3b-instruct-fp16",
-          "created_at": "2025-08-01T23:14:14.282068Z",
+          "created_at": "2025-09-03T17:37:58.390044Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -832,7 +832,7 @@
         "__type__": "ollama._types.GenerateResponse",
         "__data__": {
           "model": "llama3.2:3b-instruct-fp16",
-          "created_at": "2025-08-01T23:14:14.334565Z",
+          "created_at": "2025-09-03T17:37:58.430867Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -850,7 +850,7 @@
         "__type__": "ollama._types.GenerateResponse",
         "__data__": {
           "model": "llama3.2:3b-instruct-fp16",
-          "created_at": "2025-08-01T23:14:14.383532Z",
+          "created_at": "2025-09-03T17:37:58.471376Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -868,7 +868,7 @@
         "__type__": "ollama._types.GenerateResponse",
         "__data__": {
           "model": "llama3.2:3b-instruct-fp16",
-          "created_at": "2025-08-01T23:14:14.432138Z",
+          "created_at": "2025-09-03T17:37:58.51208Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -886,7 +886,7 @@
         "__type__": "ollama._types.GenerateResponse",
         "__data__": {
           "model": "llama3.2:3b-instruct-fp16",
-          "created_at": "2025-08-01T23:14:14.480995Z",
+          "created_at": "2025-09-03T17:37:58.553226Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -904,7 +904,7 @@
         "__type__": "ollama._types.GenerateResponse",
         "__data__": {
           "model": "llama3.2:3b-instruct-fp16",
-          "created_at": "2025-08-01T23:14:14.531968Z",
+          "created_at": "2025-09-03T17:37:58.594787Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -922,7 +922,7 @@
         "__type__": "ollama._types.GenerateResponse",
         "__data__": {
           "model": "llama3.2:3b-instruct-fp16",
-          "created_at": "2025-08-01T23:14:14.584044Z",
+          "created_at": "2025-09-03T17:37:58.63466Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -940,7 +940,7 @@
         "__type__": "ollama._types.GenerateResponse",
         "__data__": {
           "model": "llama3.2:3b-instruct-fp16",
-          "created_at": "2025-08-01T23:14:14.635691Z",
+          "created_at": "2025-09-03T17:37:58.674628Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -958,7 +958,7 @@
         "__type__": "ollama._types.GenerateResponse",
         "__data__": {
           "model": "llama3.2:3b-instruct-fp16",
-          "created_at": "2025-08-01T23:14:14.68837Z",
+          "created_at": "2025-09-03T17:37:58.714616Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -976,7 +976,7 @@
         "__type__": "ollama._types.GenerateResponse",
         "__data__": {
           "model": "llama3.2:3b-instruct-fp16",
-          "created_at": "2025-08-01T23:14:14.73985Z",
+          "created_at": "2025-09-03T17:37:58.754906Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -994,7 +994,7 @@
         "__type__": "ollama._types.GenerateResponse",
         "__data__": {
           "model": "llama3.2:3b-instruct-fp16",
-          "created_at": "2025-08-01T23:14:14.792412Z",
+          "created_at": "2025-09-03T17:37:58.795048Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -1012,7 +1012,7 @@
         "__type__": "ollama._types.GenerateResponse",
         "__data__": {
           "model": "llama3.2:3b-instruct-fp16",
-          "created_at": "2025-08-01T23:14:14.845872Z",
+          "created_at": "2025-09-03T17:37:58.835297Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -1030,7 +1030,7 @@
         "__type__": "ollama._types.GenerateResponse",
         "__data__": {
           "model": "llama3.2:3b-instruct-fp16",
-          "created_at": "2025-08-01T23:14:14.900102Z",
+          "created_at": "2025-09-03T17:37:58.875738Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -1048,7 +1048,7 @@
         "__type__": "ollama._types.GenerateResponse",
         "__data__": {
           "model": "llama3.2:3b-instruct-fp16",
-          "created_at": "2025-08-01T23:14:14.954589Z",
+          "created_at": "2025-09-03T17:37:58.91604Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -1066,7 +1066,7 @@
         "__type__": "ollama._types.GenerateResponse",
         "__data__": {
           "model": "llama3.2:3b-instruct-fp16",
-          "created_at": "2025-08-01T23:14:15.006629Z",
+          "created_at": "2025-09-03T17:37:58.956596Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -1084,7 +1084,7 @@
         "__type__": "ollama._types.GenerateResponse",
         "__data__": {
           "model": "llama3.2:3b-instruct-fp16",
-          "created_at": "2025-08-01T23:14:15.058561Z",
+          "created_at": "2025-09-03T17:37:58.996664Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -1102,7 +1102,7 @@
         "__type__": "ollama._types.GenerateResponse",
         "__data__": {
           "model": "llama3.2:3b-instruct-fp16",
-          "created_at": "2025-08-01T23:14:15.111954Z",
+          "created_at": "2025-09-03T17:37:59.037796Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -1120,7 +1120,7 @@
         "__type__": "ollama._types.GenerateResponse",
         "__data__": {
           "model": "llama3.2:3b-instruct-fp16",
-          "created_at": "2025-08-01T23:14:15.169173Z",
+          "created_at": "2025-09-03T17:37:59.078586Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -1138,7 +1138,7 @@
         "__type__": "ollama._types.GenerateResponse",
         "__data__": {
           "model": "llama3.2:3b-instruct-fp16",
-          "created_at": "2025-08-01T23:14:15.222569Z",
+          "created_at": "2025-09-03T17:37:59.119448Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -1156,7 +1156,7 @@
         "__type__": "ollama._types.GenerateResponse",
         "__data__": {
           "model": "llama3.2:3b-instruct-fp16",
-          "created_at": "2025-08-01T23:14:15.275795Z",
+          "created_at": "2025-09-03T17:37:59.160318Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -1174,7 +1174,7 @@
         "__type__": "ollama._types.GenerateResponse",
         "__data__": {
           "model": "llama3.2:3b-instruct-fp16",
-          "created_at": "2025-08-01T23:14:15.3327Z",
+          "created_at": "2025-09-03T17:37:59.201852Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -1192,7 +1192,7 @@
         "__type__": "ollama._types.GenerateResponse",
         "__data__": {
           "model": "llama3.2:3b-instruct-fp16",
-          "created_at": "2025-08-01T23:14:15.389931Z",
+          "created_at": "2025-09-03T17:37:59.243763Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -1210,7 +1210,7 @@
         "__type__": "ollama._types.GenerateResponse",
         "__data__": {
           "model": "llama3.2:3b-instruct-fp16",
-          "created_at": "2025-08-01T23:14:15.442349Z",
+          "created_at": "2025-09-03T17:37:59.284948Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -1228,7 +1228,7 @@
         "__type__": "ollama._types.GenerateResponse",
         "__data__": {
           "model": "llama3.2:3b-instruct-fp16",
-          "created_at": "2025-08-01T23:14:15.494175Z",
+          "created_at": "2025-09-03T17:37:59.325598Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -1246,7 +1246,7 @@
         "__type__": "ollama._types.GenerateResponse",
         "__data__": {
           "model": "llama3.2:3b-instruct-fp16",
-          "created_at": "2025-08-01T23:14:15.545764Z",
+          "created_at": "2025-09-03T17:37:59.366289Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -1264,7 +1264,7 @@
         "__type__": "ollama._types.GenerateResponse",
         "__data__": {
           "model": "llama3.2:3b-instruct-fp16",
-          "created_at": "2025-08-01T23:14:15.599099Z",
+          "created_at": "2025-09-03T17:37:59.406764Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -1282,7 +1282,7 @@
         "__type__": "ollama._types.GenerateResponse",
         "__data__": {
           "model": "llama3.2:3b-instruct-fp16",
-          "created_at": "2025-08-01T23:14:15.649852Z",
+          "created_at": "2025-09-03T17:37:59.447922Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -1300,7 +1300,7 @@
         "__type__": "ollama._types.GenerateResponse",
         "__data__": {
           "model": "llama3.2:3b-instruct-fp16",
-          "created_at": "2025-08-01T23:14:15.698222Z",
+          "created_at": "2025-09-03T17:37:59.488486Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -1318,7 +1318,7 @@
         "__type__": "ollama._types.GenerateResponse",
         "__data__": {
           "model": "llama3.2:3b-instruct-fp16",
-          "created_at": "2025-08-01T23:14:15.747168Z",
+          "created_at": "2025-09-03T17:37:59.529Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -1336,7 +1336,7 @@
         "__type__": "ollama._types.GenerateResponse",
         "__data__": {
           "model": "llama3.2:3b-instruct-fp16",
-          "created_at": "2025-08-01T23:14:15.797196Z",
+          "created_at": "2025-09-03T17:37:59.569417Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -1354,7 +1354,7 @@
         "__type__": "ollama._types.GenerateResponse",
         "__data__": {
           "model": "llama3.2:3b-instruct-fp16",
-          "created_at": "2025-08-01T23:14:15.845587Z",
+          "created_at": "2025-09-03T17:37:59.610542Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -1372,7 +1372,7 @@
         "__type__": "ollama._types.GenerateResponse",
         "__data__": {
           "model": "llama3.2:3b-instruct-fp16",
-          "created_at": "2025-08-01T23:14:15.897171Z",
+          "created_at": "2025-09-03T17:37:59.651411Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -1390,7 +1390,7 @@
         "__type__": "ollama._types.GenerateResponse",
         "__data__": {
           "model": "llama3.2:3b-instruct-fp16",
-          "created_at": "2025-08-01T23:14:15.944524Z",
+          "created_at": "2025-09-03T17:37:59.69241Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -1408,7 +1408,7 @@
         "__type__": "ollama._types.GenerateResponse",
         "__data__": {
           "model": "llama3.2:3b-instruct-fp16",
-          "created_at": "2025-08-01T23:14:15.994467Z",
+          "created_at": "2025-09-03T17:37:59.732339Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -1426,7 +1426,7 @@
         "__type__": "ollama._types.GenerateResponse",
         "__data__": {
           "model": "llama3.2:3b-instruct-fp16",
-          "created_at": "2025-08-01T23:14:16.045224Z",
+          "created_at": "2025-09-03T17:37:59.772462Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -1444,7 +1444,7 @@
         "__type__": "ollama._types.GenerateResponse",
         "__data__": {
           "model": "llama3.2:3b-instruct-fp16",
-          "created_at": "2025-08-01T23:14:16.093853Z",
+          "created_at": "2025-09-03T17:37:59.812507Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -1462,7 +1462,7 @@
         "__type__": "ollama._types.GenerateResponse",
         "__data__": {
           "model": "llama3.2:3b-instruct-fp16",
-          "created_at": "2025-08-01T23:14:16.144847Z",
+          "created_at": "2025-09-03T17:37:59.852762Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -1480,7 +1480,7 @@
         "__type__": "ollama._types.GenerateResponse",
         "__data__": {
           "model": "llama3.2:3b-instruct-fp16",
-          "created_at": "2025-08-01T23:14:16.197888Z",
+          "created_at": "2025-09-03T17:37:59.892984Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -1498,7 +1498,7 @@
         "__type__": "ollama._types.GenerateResponse",
         "__data__": {
           "model": "llama3.2:3b-instruct-fp16",
-          "created_at": "2025-08-01T23:14:16.250854Z",
+          "created_at": "2025-09-03T17:37:59.933555Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -1516,7 +1516,7 @@
         "__type__": "ollama._types.GenerateResponse",
         "__data__": {
           "model": "llama3.2:3b-instruct-fp16",
-          "created_at": "2025-08-01T23:14:16.301995Z",
+          "created_at": "2025-09-03T17:37:59.973778Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -1534,7 +1534,7 @@
         "__type__": "ollama._types.GenerateResponse",
         "__data__": {
           "model": "llama3.2:3b-instruct-fp16",
-          "created_at": "2025-08-01T23:14:16.352508Z",
+          "created_at": "2025-09-03T17:38:00.014923Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -1552,7 +1552,7 @@
         "__type__": "ollama._types.GenerateResponse",
         "__data__": {
           "model": "llama3.2:3b-instruct-fp16",
-          "created_at": "2025-08-01T23:14:16.40259Z",
+          "created_at": "2025-09-03T17:38:00.057464Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -1570,7 +1570,7 @@
         "__type__": "ollama._types.GenerateResponse",
         "__data__": {
           "model": "llama3.2:3b-instruct-fp16",
-          "created_at": "2025-08-01T23:14:16.453514Z",
+          "created_at": "2025-09-03T17:38:00.09902Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -1588,7 +1588,7 @@
         "__type__": "ollama._types.GenerateResponse",
         "__data__": {
           "model": "llama3.2:3b-instruct-fp16",
-          "created_at": "2025-08-01T23:14:16.50378Z",
+          "created_at": "2025-09-03T17:38:00.140492Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -1606,7 +1606,7 @@
         "__type__": "ollama._types.GenerateResponse",
         "__data__": {
           "model": "llama3.2:3b-instruct-fp16",
-          "created_at": "2025-08-01T23:14:16.554395Z",
+          "created_at": "2025-09-03T17:38:00.180239Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -1624,7 +1624,7 @@
         "__type__": "ollama._types.GenerateResponse",
         "__data__": {
           "model": "llama3.2:3b-instruct-fp16",
-          "created_at": "2025-08-01T23:14:16.605795Z",
+          "created_at": "2025-09-03T17:38:00.220364Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -1642,7 +1642,7 @@
         "__type__": "ollama._types.GenerateResponse",
         "__data__": {
           "model": "llama3.2:3b-instruct-fp16",
-          "created_at": "2025-08-01T23:14:16.656313Z",
+          "created_at": "2025-09-03T17:38:00.26097Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -1660,7 +1660,7 @@
         "__type__": "ollama._types.GenerateResponse",
         "__data__": {
           "model": "llama3.2:3b-instruct-fp16",
-          "created_at": "2025-08-01T23:14:16.706438Z",
+          "created_at": "2025-09-03T17:38:00.301228Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -1678,7 +1678,7 @@
         "__type__": "ollama._types.GenerateResponse",
         "__data__": {
           "model": "llama3.2:3b-instruct-fp16",
-          "created_at": "2025-08-01T23:14:16.756444Z",
+          "created_at": "2025-09-03T17:38:00.341631Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -1696,7 +1696,7 @@
         "__type__": "ollama._types.GenerateResponse",
         "__data__": {
           "model": "llama3.2:3b-instruct-fp16",
-          "created_at": "2025-08-01T23:14:16.807687Z",
+          "created_at": "2025-09-03T17:38:00.383006Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -1714,7 +1714,7 @@
         "__type__": "ollama._types.GenerateResponse",
         "__data__": {
           "model": "llama3.2:3b-instruct-fp16",
-          "created_at": "2025-08-01T23:14:16.85835Z",
+          "created_at": "2025-09-03T17:38:00.423509Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -1732,7 +1732,7 @@
         "__type__": "ollama._types.GenerateResponse",
         "__data__": {
           "model": "llama3.2:3b-instruct-fp16",
-          "created_at": "2025-08-01T23:14:16.909311Z",
+          "created_at": "2025-09-03T17:38:00.464702Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -1750,7 +1750,7 @@
         "__type__": "ollama._types.GenerateResponse",
         "__data__": {
           "model": "llama3.2:3b-instruct-fp16",
-          "created_at": "2025-08-01T23:14:16.959327Z",
+          "created_at": "2025-09-03T17:38:00.505914Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -1768,7 +1768,7 @@
         "__type__": "ollama._types.GenerateResponse",
         "__data__": {
           "model": "llama3.2:3b-instruct-fp16",
-          "created_at": "2025-08-01T23:14:17.010211Z",
+          "created_at": "2025-09-03T17:38:00.546505Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -1786,7 +1786,7 @@
         "__type__": "ollama._types.GenerateResponse",
         "__data__": {
           "model": "llama3.2:3b-instruct-fp16",
-          "created_at": "2025-08-01T23:14:17.061365Z",
+          "created_at": "2025-09-03T17:38:00.587839Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -1804,15 +1804,15 @@
         "__type__": "ollama._types.GenerateResponse",
         "__data__": {
           "model": "llama3.2:3b-instruct-fp16",
-          "created_at": "2025-08-01T23:14:17.111956Z",
+          "created_at": "2025-09-03T17:38:00.629018Z",
           "done": true,
           "done_reason": "stop",
-          "total_duration": 5499672375,
-          "load_duration": 58161750,
+          "total_duration": 4303339291,
+          "load_duration": 156231250,
           "prompt_eval_count": 36,
-          "prompt_eval_duration": 266000000,
+          "prompt_eval_duration": 81909875,
           "eval_count": 100,
-          "eval_duration": 5174000000,
+          "eval_duration": 4064559292,
           "response": "",
           "thinking": null,
           "context": null
diff --git a/tests/integration/recordings/responses/325a72db5755.json b/tests/integration/recordings/responses/325a72db5755.json
index a41db435b..ca3eea2f3 100644
--- a/tests/integration/recordings/responses/325a72db5755.json
+++ b/tests/integration/recordings/responses/325a72db5755.json
@@ -1,7 +1,7 @@
 {
   "request": {
     "method": "POST",
-    "url": "http://localhost:11434/v1/v1/chat/completions",
+    "url": "http://0.0.0.0:11434/v1/v1/chat/completions",
     "headers": {},
     "body": {
       "model": "llama3.2:3b-instruct-fp16",
@@ -21,7 +21,7 @@
       {
         "__type__": "openai.types.chat.chat_completion_chunk.ChatCompletionChunk",
         "__data__": {
-          "id": "chatcmpl-312",
+          "id": "chatcmpl-923",
           "choices": [
             {
               "delta": {
@@ -36,7 +36,7 @@
               "logprobs": null
             }
           ],
-          "created": 1754081853,
+          "created": 1756921364,
           "model": "llama3.2:3b-instruct-fp16",
           "object": "chat.completion.chunk",
           "service_tier": null,
@@ -47,7 +47,7 @@
       {
         "__type__": "openai.types.chat.chat_completion_chunk.ChatCompletionChunk",
         "__data__": {
-          "id": "chatcmpl-312",
+          "id": "chatcmpl-923",
           "choices": [
             {
               "delta": {
@@ -62,7 +62,7 @@
               "logprobs": null
             }
           ],
-          "created": 1754081853,
+          "created": 1756921364,
           "model": "llama3.2:3b-instruct-fp16",
           "object": "chat.completion.chunk",
           "service_tier": null,
@@ -73,7 +73,7 @@
       {
         "__type__": "openai.types.chat.chat_completion_chunk.ChatCompletionChunk",
         "__data__": {
-          "id": "chatcmpl-312",
+          "id": "chatcmpl-923",
           "choices": [
             {
               "delta": {
@@ -88,7 +88,7 @@
               "logprobs": null
             }
           ],
-          "created": 1754081853,
+          "created": 1756921364,
           "model": "llama3.2:3b-instruct-fp16",
           "object": "chat.completion.chunk",
           "service_tier": null,
@@ -99,7 +99,7 @@
       {
         "__type__": "openai.types.chat.chat_completion_chunk.ChatCompletionChunk",
         "__data__": {
-          "id": "chatcmpl-312",
+          "id": "chatcmpl-923",
           "choices": [
             {
               "delta": {
@@ -114,7 +114,7 @@
               "logprobs": null
             }
           ],
-          "created": 1754081853,
+          "created": 1756921364,
           "model": "llama3.2:3b-instruct-fp16",
           "object": "chat.completion.chunk",
           "service_tier": null,
@@ -125,7 +125,7 @@
       {
         "__type__": "openai.types.chat.chat_completion_chunk.ChatCompletionChunk",
         "__data__": {
-          "id": "chatcmpl-312",
+          "id": "chatcmpl-923",
           "choices": [
             {
               "delta": {
@@ -140,7 +140,7 @@
               "logprobs": null
             }
           ],
-          "created": 1754081853,
+          "created": 1756921364,
           "model": "llama3.2:3b-instruct-fp16",
           "object": "chat.completion.chunk",
           "service_tier": null,
@@ -151,7 +151,7 @@
       {
         "__type__": "openai.types.chat.chat_completion_chunk.ChatCompletionChunk",
         "__data__": {
-          "id": "chatcmpl-312",
+          "id": "chatcmpl-923",
           "choices": [
             {
               "delta": {
@@ -166,7 +166,7 @@
               "logprobs": null
             }
           ],
-          "created": 1754081853,
+          "created": 1756921364,
           "model": "llama3.2:3b-instruct-fp16",
           "object": "chat.completion.chunk",
           "service_tier": null,
@@ -177,7 +177,7 @@
       {
         "__type__": "openai.types.chat.chat_completion_chunk.ChatCompletionChunk",
         "__data__": {
-          "id": "chatcmpl-312",
+          "id": "chatcmpl-923",
           "choices": [
             {
               "delta": {
@@ -192,7 +192,7 @@
               "logprobs": null
             }
           ],
-          "created": 1754081853,
+          "created": 1756921364,
           "model": "llama3.2:3b-instruct-fp16",
           "object": "chat.completion.chunk",
           "service_tier": null,
@@ -203,7 +203,7 @@
       {
         "__type__": "openai.types.chat.chat_completion_chunk.ChatCompletionChunk",
         "__data__": {
-          "id": "chatcmpl-312",
+          "id": "chatcmpl-923",
           "choices": [
             {
               "delta": {
@@ -218,7 +218,7 @@
               "logprobs": null
             }
           ],
-          "created": 1754081853,
+          "created": 1756921364,
           "model": "llama3.2:3b-instruct-fp16",
           "object": "chat.completion.chunk",
           "service_tier": null,
@@ -229,7 +229,7 @@
       {
         "__type__": "openai.types.chat.chat_completion_chunk.ChatCompletionChunk",
         "__data__": {
-          "id": "chatcmpl-312",
+          "id": "chatcmpl-923",
           "choices": [
             {
               "delta": {
@@ -244,7 +244,7 @@
               "logprobs": null
             }
           ],
-          "created": 1754081853,
+          "created": 1756921364,
           "model": "llama3.2:3b-instruct-fp16",
           "object": "chat.completion.chunk",
           "service_tier": null,
@@ -255,7 +255,7 @@
       {
         "__type__": "openai.types.chat.chat_completion_chunk.ChatCompletionChunk",
         "__data__": {
-          "id": "chatcmpl-312",
+          "id": "chatcmpl-923",
           "choices": [
             {
               "delta": {
@@ -270,7 +270,7 @@
               "logprobs": null
             }
           ],
-          "created": 1754081853,
+          "created": 1756921364,
           "model": "llama3.2:3b-instruct-fp16",
           "object": "chat.completion.chunk",
           "service_tier": null,
@@ -281,7 +281,7 @@
       {
         "__type__": "openai.types.chat.chat_completion_chunk.ChatCompletionChunk",
         "__data__": {
-          "id": "chatcmpl-312",
+          "id": "chatcmpl-923",
           "choices": [
             {
               "delta": {
@@ -296,7 +296,7 @@
               "logprobs": null
             }
           ],
-          "created": 1754081854,
+          "created": 1756921364,
           "model": "llama3.2:3b-instruct-fp16",
           "object": "chat.completion.chunk",
           "service_tier": null,
@@ -307,7 +307,7 @@
       {
         "__type__": "openai.types.chat.chat_completion_chunk.ChatCompletionChunk",
         "__data__": {
-          "id": "chatcmpl-312",
+          "id": "chatcmpl-923",
           "choices": [
             {
               "delta": {
@@ -322,7 +322,7 @@
               "logprobs": null
             }
           ],
-          "created": 1754081854,
+          "created": 1756921364,
           "model": "llama3.2:3b-instruct-fp16",
           "object": "chat.completion.chunk",
           "service_tier": null,
@@ -333,7 +333,7 @@
       {
         "__type__": "openai.types.chat.chat_completion_chunk.ChatCompletionChunk",
         "__data__": {
-          "id": "chatcmpl-312",
+          "id": "chatcmpl-923",
           "choices": [
             {
               "delta": {
@@ -348,7 +348,7 @@
               "logprobs": null
             }
           ],
-          "created": 1754081854,
+          "created": 1756921364,
           "model": "llama3.2:3b-instruct-fp16",
           "object": "chat.completion.chunk",
           "service_tier": null,
@@ -359,7 +359,7 @@
       {
         "__type__": "openai.types.chat.chat_completion_chunk.ChatCompletionChunk",
         "__data__": {
-          "id": "chatcmpl-312",
+          "id": "chatcmpl-923",
           "choices": [
             {
               "delta": {
@@ -374,7 +374,7 @@
               "logprobs": null
             }
           ],
-          "created": 1754081854,
+          "created": 1756921364,
           "model": "llama3.2:3b-instruct-fp16",
           "object": "chat.completion.chunk",
           "service_tier": null,
@@ -385,7 +385,7 @@
       {
         "__type__": "openai.types.chat.chat_completion_chunk.ChatCompletionChunk",
         "__data__": {
-          "id": "chatcmpl-312",
+          "id": "chatcmpl-923",
           "choices": [
             {
               "delta": {
@@ -400,7 +400,7 @@
               "logprobs": null
             }
           ],
-          "created": 1754081854,
+          "created": 1756921364,
           "model": "llama3.2:3b-instruct-fp16",
           "object": "chat.completion.chunk",
           "service_tier": null,
@@ -411,7 +411,7 @@
       {
         "__type__": "openai.types.chat.chat_completion_chunk.ChatCompletionChunk",
         "__data__": {
-          "id": "chatcmpl-312",
+          "id": "chatcmpl-923",
           "choices": [
             {
               "delta": {
@@ -426,7 +426,7 @@
               "logprobs": null
             }
           ],
-          "created": 1754081854,
+          "created": 1756921365,
           "model": "llama3.2:3b-instruct-fp16",
           "object": "chat.completion.chunk",
           "service_tier": null,
@@ -437,7 +437,7 @@
       {
         "__type__": "openai.types.chat.chat_completion_chunk.ChatCompletionChunk",
         "__data__": {
-          "id": "chatcmpl-312",
+          "id": "chatcmpl-923",
           "choices": [
             {
               "delta": {
@@ -452,7 +452,7 @@
               "logprobs": null
             }
           ],
-          "created": 1754081854,
+          "created": 1756921365,
           "model": "llama3.2:3b-instruct-fp16",
           "object": "chat.completion.chunk",
           "service_tier": null,
@@ -463,7 +463,7 @@
       {
         "__type__": "openai.types.chat.chat_completion_chunk.ChatCompletionChunk",
         "__data__": {
-          "id": "chatcmpl-312",
+          "id": "chatcmpl-923",
           "choices": [
             {
               "delta": {
@@ -478,7 +478,7 @@
               "logprobs": null
             }
           ],
-          "created": 1754081854,
+          "created": 1756921365,
           "model": "llama3.2:3b-instruct-fp16",
           "object": "chat.completion.chunk",
           "service_tier": null,
@@ -489,7 +489,7 @@
       {
         "__type__": "openai.types.chat.chat_completion_chunk.ChatCompletionChunk",
         "__data__": {
-          "id": "chatcmpl-312",
+          "id": "chatcmpl-923",
           "choices": [
             {
               "delta": {
@@ -504,7 +504,7 @@
               "logprobs": null
             }
           ],
-          "created": 1754081854,
+          "created": 1756921365,
           "model": "llama3.2:3b-instruct-fp16",
           "object": "chat.completion.chunk",
           "service_tier": null,
@@ -515,7 +515,683 @@
       {
         "__type__": "openai.types.chat.chat_completion_chunk.ChatCompletionChunk",
         "__data__": {
-          "id": "chatcmpl-312",
+          "id": "chatcmpl-923",
+          "choices": [
+            {
+              "delta": {
+                "content": " It",
+                "function_call": null,
+                "refusal": null,
+                "role": "assistant",
+                "tool_calls": null
+              },
+              "finish_reason": null,
+              "index": 0,
+              "logprobs": null
+            }
+          ],
+          "created": 1756921365,
+          "model": "llama3.2:3b-instruct-fp16",
+          "object": "chat.completion.chunk",
+          "service_tier": null,
+          "system_fingerprint": "fp_ollama",
+          "usage": null
+        }
+      },
+      {
+        "__type__": "openai.types.chat.chat_completion_chunk.ChatCompletionChunk",
+        "__data__": {
+          "id": "chatcmpl-923",
+          "choices": [
+            {
+              "delta": {
+                "content": "'s",
+                "function_call": null,
+                "refusal": null,
+                "role": "assistant",
+                "tool_calls": null
+              },
+              "finish_reason": null,
+              "index": 0,
+              "logprobs": null
+            }
+          ],
+          "created": 1756921365,
+          "model": "llama3.2:3b-instruct-fp16",
+          "object": "chat.completion.chunk",
+          "service_tier": null,
+          "system_fingerprint": "fp_ollama",
+          "usage": null
+        }
+      },
+      {
+        "__type__": "openai.types.chat.chat_completion_chunk.ChatCompletionChunk",
+        "__data__": {
+          "id": "chatcmpl-923",
+          "choices": [
+            {
+              "delta": {
+                "content": " a",
+                "function_call": null,
+                "refusal": null,
+                "role": "assistant",
+                "tool_calls": null
+              },
+              "finish_reason": null,
+              "index": 0,
+              "logprobs": null
+            }
+          ],
+          "created": 1756921365,
+          "model": "llama3.2:3b-instruct-fp16",
+          "object": "chat.completion.chunk",
+          "service_tier": null,
+          "system_fingerprint": "fp_ollama",
+          "usage": null
+        }
+      },
+      {
+        "__type__": "openai.types.chat.chat_completion_chunk.ChatCompletionChunk",
+        "__data__": {
+          "id": "chatcmpl-923",
+          "choices": [
+            {
+              "delta": {
+                "content": " federally",
+                "function_call": null,
+                "refusal": null,
+                "role": "assistant",
+                "tool_calls": null
+              },
+              "finish_reason": null,
+              "index": 0,
+              "logprobs": null
+            }
+          ],
+          "created": 1756921365,
+          "model": "llama3.2:3b-instruct-fp16",
+          "object": "chat.completion.chunk",
+          "service_tier": null,
+          "system_fingerprint": "fp_ollama",
+          "usage": null
+        }
+      },
+      {
+        "__type__": "openai.types.chat.chat_completion_chunk.ChatCompletionChunk",
+        "__data__": {
+          "id": "chatcmpl-923",
+          "choices": [
+            {
+              "delta": {
+                "content": " owned",
+                "function_call": null,
+                "refusal": null,
+                "role": "assistant",
+                "tool_calls": null
+              },
+              "finish_reason": null,
+              "index": 0,
+              "logprobs": null
+            }
+          ],
+          "created": 1756921365,
+          "model": "llama3.2:3b-instruct-fp16",
+          "object": "chat.completion.chunk",
+          "service_tier": null,
+          "system_fingerprint": "fp_ollama",
+          "usage": null
+        }
+      },
+      {
+        "__type__": "openai.types.chat.chat_completion_chunk.ChatCompletionChunk",
+        "__data__": {
+          "id": "chatcmpl-923",
+          "choices": [
+            {
+              "delta": {
+                "content": " district",
+                "function_call": null,
+                "refusal": null,
+                "role": "assistant",
+                "tool_calls": null
+              },
+              "finish_reason": null,
+              "index": 0,
+              "logprobs": null
+            }
+          ],
+          "created": 1756921365,
+          "model": "llama3.2:3b-instruct-fp16",
+          "object": "chat.completion.chunk",
+          "service_tier": null,
+          "system_fingerprint": "fp_ollama",
+          "usage": null
+        }
+      },
+      {
+        "__type__": "openai.types.chat.chat_completion_chunk.ChatCompletionChunk",
+        "__data__": {
+          "id": "chatcmpl-923",
+          "choices": [
+            {
+              "delta": {
+                "content": " that",
+                "function_call": null,
+                "refusal": null,
+                "role": "assistant",
+                "tool_calls": null
+              },
+              "finish_reason": null,
+              "index": 0,
+              "logprobs": null
+            }
+          ],
+          "created": 1756921365,
+          "model": "llama3.2:3b-instruct-fp16",
+          "object": "chat.completion.chunk",
+          "service_tier": null,
+          "system_fingerprint": "fp_ollama",
+          "usage": null
+        }
+      },
+      {
+        "__type__": "openai.types.chat.chat_completion_chunk.ChatCompletionChunk",
+        "__data__": {
+          "id": "chatcmpl-923",
+          "choices": [
+            {
+              "delta": {
+                "content": " serves",
+                "function_call": null,
+                "refusal": null,
+                "role": "assistant",
+                "tool_calls": null
+              },
+              "finish_reason": null,
+              "index": 0,
+              "logprobs": null
+            }
+          ],
+          "created": 1756921365,
+          "model": "llama3.2:3b-instruct-fp16",
+          "object": "chat.completion.chunk",
+          "service_tier": null,
+          "system_fingerprint": "fp_ollama",
+          "usage": null
+        }
+      },
+      {
+        "__type__": "openai.types.chat.chat_completion_chunk.ChatCompletionChunk",
+        "__data__": {
+          "id": "chatcmpl-923",
+          "choices": [
+            {
+              "delta": {
+                "content": " as",
+                "function_call": null,
+                "refusal": null,
+                "role": "assistant",
+                "tool_calls": null
+              },
+              "finish_reason": null,
+              "index": 0,
+              "logprobs": null
+            }
+          ],
+          "created": 1756921365,
+          "model": "llama3.2:3b-instruct-fp16",
+          "object": "chat.completion.chunk",
+          "service_tier": null,
+          "system_fingerprint": "fp_ollama",
+          "usage": null
+        }
+      },
+      {
+        "__type__": "openai.types.chat.chat_completion_chunk.ChatCompletionChunk",
+        "__data__": {
+          "id": "chatcmpl-923",
+          "choices": [
+            {
+              "delta": {
+                "content": " the",
+                "function_call": null,
+                "refusal": null,
+                "role": "assistant",
+                "tool_calls": null
+              },
+              "finish_reason": null,
+              "index": 0,
+              "logprobs": null
+            }
+          ],
+          "created": 1756921365,
+          "model": "llama3.2:3b-instruct-fp16",
+          "object": "chat.completion.chunk",
+          "service_tier": null,
+          "system_fingerprint": "fp_ollama",
+          "usage": null
+        }
+      },
+      {
+        "__type__": "openai.types.chat.chat_completion_chunk.ChatCompletionChunk",
+        "__data__": {
+          "id": "chatcmpl-923",
+          "choices": [
+            {
+              "delta": {
+                "content": " seat",
+                "function_call": null,
+                "refusal": null,
+                "role": "assistant",
+                "tool_calls": null
+              },
+              "finish_reason": null,
+              "index": 0,
+              "logprobs": null
+            }
+          ],
+          "created": 1756921365,
+          "model": "llama3.2:3b-instruct-fp16",
+          "object": "chat.completion.chunk",
+          "service_tier": null,
+          "system_fingerprint": "fp_ollama",
+          "usage": null
+        }
+      },
+      {
+        "__type__": "openai.types.chat.chat_completion_chunk.ChatCompletionChunk",
+        "__data__": {
+          "id": "chatcmpl-923",
+          "choices": [
+            {
+              "delta": {
+                "content": " of",
+                "function_call": null,
+                "refusal": null,
+                "role": "assistant",
+                "tool_calls": null
+              },
+              "finish_reason": null,
+              "index": 0,
+              "logprobs": null
+            }
+          ],
+          "created": 1756921365,
+          "model": "llama3.2:3b-instruct-fp16",
+          "object": "chat.completion.chunk",
+          "service_tier": null,
+          "system_fingerprint": "fp_ollama",
+          "usage": null
+        }
+      },
+      {
+        "__type__": "openai.types.chat.chat_completion_chunk.ChatCompletionChunk",
+        "__data__": {
+          "id": "chatcmpl-923",
+          "choices": [
+            {
+              "delta": {
+                "content": " the",
+                "function_call": null,
+                "refusal": null,
+                "role": "assistant",
+                "tool_calls": null
+              },
+              "finish_reason": null,
+              "index": 0,
+              "logprobs": null
+            }
+          ],
+          "created": 1756921365,
+          "model": "llama3.2:3b-instruct-fp16",
+          "object": "chat.completion.chunk",
+          "service_tier": null,
+          "system_fingerprint": "fp_ollama",
+          "usage": null
+        }
+      },
+      {
+        "__type__": "openai.types.chat.chat_completion_chunk.ChatCompletionChunk",
+        "__data__": {
+          "id": "chatcmpl-923",
+          "choices": [
+            {
+              "delta": {
+                "content": " federal",
+                "function_call": null,
+                "refusal": null,
+                "role": "assistant",
+                "tool_calls": null
+              },
+              "finish_reason": null,
+              "index": 0,
+              "logprobs": null
+            }
+          ],
+          "created": 1756921365,
+          "model": "llama3.2:3b-instruct-fp16",
+          "object": "chat.completion.chunk",
+          "service_tier": null,
+          "system_fingerprint": "fp_ollama",
+          "usage": null
+        }
+      },
+      {
+        "__type__": "openai.types.chat.chat_completion_chunk.ChatCompletionChunk",
+        "__data__": {
+          "id": "chatcmpl-923",
+          "choices": [
+            {
+              "delta": {
+                "content": " government",
+                "function_call": null,
+                "refusal": null,
+                "role": "assistant",
+                "tool_calls": null
+              },
+              "finish_reason": null,
+              "index": 0,
+              "logprobs": null
+            }
+          ],
+          "created": 1756921365,
+          "model": "llama3.2:3b-instruct-fp16",
+          "object": "chat.completion.chunk",
+          "service_tier": null,
+          "system_fingerprint": "fp_ollama",
+          "usage": null
+        }
+      },
+      {
+        "__type__": "openai.types.chat.chat_completion_chunk.ChatCompletionChunk",
+        "__data__": {
+          "id": "chatcmpl-923",
+          "choices": [
+            {
+              "delta": {
+                "content": ",",
+                "function_call": null,
+                "refusal": null,
+                "role": "assistant",
+                "tool_calls": null
+              },
+              "finish_reason": null,
+              "index": 0,
+              "logprobs": null
+            }
+          ],
+          "created": 1756921365,
+          "model": "llama3.2:3b-instruct-fp16",
+          "object": "chat.completion.chunk",
+          "service_tier": null,
+          "system_fingerprint": "fp_ollama",
+          "usage": null
+        }
+      },
+      {
+        "__type__": "openai.types.chat.chat_completion_chunk.ChatCompletionChunk",
+        "__data__": {
+          "id": "chatcmpl-923",
+          "choices": [
+            {
+              "delta": {
+                "content": " housing",
+                "function_call": null,
+                "refusal": null,
+                "role": "assistant",
+                "tool_calls": null
+              },
+              "finish_reason": null,
+              "index": 0,
+              "logprobs": null
+            }
+          ],
+          "created": 1756921365,
+          "model": "llama3.2:3b-instruct-fp16",
+          "object": "chat.completion.chunk",
+          "service_tier": null,
+          "system_fingerprint": "fp_ollama",
+          "usage": null
+        }
+      },
+      {
+        "__type__": "openai.types.chat.chat_completion_chunk.ChatCompletionChunk",
+        "__data__": {
+          "id": "chatcmpl-923",
+          "choices": [
+            {
+              "delta": {
+                "content": " many",
+                "function_call": null,
+                "refusal": null,
+                "role": "assistant",
+                "tool_calls": null
+              },
+              "finish_reason": null,
+              "index": 0,
+              "logprobs": null
+            }
+          ],
+          "created": 1756921365,
+          "model": "llama3.2:3b-instruct-fp16",
+          "object": "chat.completion.chunk",
+          "service_tier": null,
+          "system_fingerprint": "fp_ollama",
+          "usage": null
+        }
+      },
+      {
+        "__type__": "openai.types.chat.chat_completion_chunk.ChatCompletionChunk",
+        "__data__": {
+          "id": "chatcmpl-923",
+          "choices": [
+            {
+              "delta": {
+                "content": " national",
+                "function_call": null,
+                "refusal": null,
+                "role": "assistant",
+                "tool_calls": null
+              },
+              "finish_reason": null,
+              "index": 0,
+              "logprobs": null
+            }
+          ],
+          "created": 1756921365,
+          "model": "llama3.2:3b-instruct-fp16",
+          "object": "chat.completion.chunk",
+          "service_tier": null,
+          "system_fingerprint": "fp_ollama",
+          "usage": null
+        }
+      },
+      {
+        "__type__": "openai.types.chat.chat_completion_chunk.ChatCompletionChunk",
+        "__data__": {
+          "id": "chatcmpl-923",
+          "choices": [
+            {
+              "delta": {
+                "content": " landmarks",
+                "function_call": null,
+                "refusal": null,
+                "role": "assistant",
+                "tool_calls": null
+              },
+              "finish_reason": null,
+              "index": 0,
+              "logprobs": null
+            }
+          ],
+          "created": 1756921365,
+          "model": "llama3.2:3b-instruct-fp16",
+          "object": "chat.completion.chunk",
+          "service_tier": null,
+          "system_fingerprint": "fp_ollama",
+          "usage": null
+        }
+      },
+      {
+        "__type__": "openai.types.chat.chat_completion_chunk.ChatCompletionChunk",
+        "__data__": {
+          "id": "chatcmpl-923",
+          "choices": [
+            {
+              "delta": {
+                "content": ",",
+                "function_call": null,
+                "refusal": null,
+                "role": "assistant",
+                "tool_calls": null
+              },
+              "finish_reason": null,
+              "index": 0,
+              "logprobs": null
+            }
+          ],
+          "created": 1756921365,
+          "model": "llama3.2:3b-instruct-fp16",
+          "object": "chat.completion.chunk",
+          "service_tier": null,
+          "system_fingerprint": "fp_ollama",
+          "usage": null
+        }
+      },
+      {
+        "__type__": "openai.types.chat.chat_completion_chunk.ChatCompletionChunk",
+        "__data__": {
+          "id": "chatcmpl-923",
+          "choices": [
+            {
+              "delta": {
+                "content": " institutions",
+                "function_call": null,
+                "refusal": null,
+                "role": "assistant",
+                "tool_calls": null
+              },
+              "finish_reason": null,
+              "index": 0,
+              "logprobs": null
+            }
+          ],
+          "created": 1756921366,
+          "model": "llama3.2:3b-instruct-fp16",
+          "object": "chat.completion.chunk",
+          "service_tier": null,
+          "system_fingerprint": "fp_ollama",
+          "usage": null
+        }
+      },
+      {
+        "__type__": "openai.types.chat.chat_completion_chunk.ChatCompletionChunk",
+        "__data__": {
+          "id": "chatcmpl-923",
+          "choices": [
+            {
+              "delta": {
+                "content": ",",
+                "function_call": null,
+                "refusal": null,
+                "role": "assistant",
+                "tool_calls": null
+              },
+              "finish_reason": null,
+              "index": 0,
+              "logprobs": null
+            }
+          ],
+          "created": 1756921366,
+          "model": "llama3.2:3b-instruct-fp16",
+          "object": "chat.completion.chunk",
+          "service_tier": null,
+          "system_fingerprint": "fp_ollama",
+          "usage": null
+        }
+      },
+      {
+        "__type__": "openai.types.chat.chat_completion_chunk.ChatCompletionChunk",
+        "__data__": {
+          "id": "chatcmpl-923",
+          "choices": [
+            {
+              "delta": {
+                "content": " and",
+                "function_call": null,
+                "refusal": null,
+                "role": "assistant",
+                "tool_calls": null
+              },
+              "finish_reason": null,
+              "index": 0,
+              "logprobs": null
+            }
+          ],
+          "created": 1756921366,
+          "model": "llama3.2:3b-instruct-fp16",
+          "object": "chat.completion.chunk",
+          "service_tier": null,
+          "system_fingerprint": "fp_ollama",
+          "usage": null
+        }
+      },
+      {
+        "__type__": "openai.types.chat.chat_completion_chunk.ChatCompletionChunk",
+        "__data__": {
+          "id": "chatcmpl-923",
+          "choices": [
+            {
+              "delta": {
+                "content": " offices",
+                "function_call": null,
+                "refusal": null,
+                "role": "assistant",
+                "tool_calls": null
+              },
+              "finish_reason": null,
+              "index": 0,
+              "logprobs": null
+            }
+          ],
+          "created": 1756921366,
+          "model": "llama3.2:3b-instruct-fp16",
+          "object": "chat.completion.chunk",
+          "service_tier": null,
+          "system_fingerprint": "fp_ollama",
+          "usage": null
+        }
+      },
+      {
+        "__type__": "openai.types.chat.chat_completion_chunk.ChatCompletionChunk",
+        "__data__": {
+          "id": "chatcmpl-923",
+          "choices": [
+            {
+              "delta": {
+                "content": ".",
+                "function_call": null,
+                "refusal": null,
+                "role": "assistant",
+                "tool_calls": null
+              },
+              "finish_reason": null,
+              "index": 0,
+              "logprobs": null
+            }
+          ],
+          "created": 1756921366,
+          "model": "llama3.2:3b-instruct-fp16",
+          "object": "chat.completion.chunk",
+          "service_tier": null,
+          "system_fingerprint": "fp_ollama",
+          "usage": null
+        }
+      },
+      {
+        "__type__": "openai.types.chat.chat_completion_chunk.ChatCompletionChunk",
+        "__data__": {
+          "id": "chatcmpl-923",
           "choices": [
             {
               "delta": {
@@ -530,7 +1206,7 @@
               "logprobs": null
             }
           ],
-          "created": 1754081854,
+          "created": 1756921366,
           "model": "llama3.2:3b-instruct-fp16",
           "object": "chat.completion.chunk",
           "service_tier": null,
diff --git a/tests/integration/recordings/responses/382c2f22274c.json b/tests/integration/recordings/responses/382c2f22274c.json
index 6d05649a5..eb4a24f47 100644
--- a/tests/integration/recordings/responses/382c2f22274c.json
+++ b/tests/integration/recordings/responses/382c2f22274c.json
@@ -1,7 +1,7 @@
 {
   "request": {
     "method": "POST",
-    "url": "http://localhost:11434/v1/v1/chat/completions",
+    "url": "http://0.0.0.0:11434/v1/v1/chat/completions",
     "headers": {},
     "body": {
       "model": "llama3.2:3b-instruct-fp16",
@@ -22,14 +22,14 @@
     "body": {
       "__type__": "openai.types.chat.chat_completion.ChatCompletion",
       "__data__": {
-        "id": "chatcmpl-339",
+        "id": "chatcmpl-442",
         "choices": [
           {
             "finish_reason": "length",
             "index": 0,
             "logprobs": null,
             "message": {
-              "content": "I can guide you through the process, but please note that this is not an official OpenAI API call. OpenAI's API terms and conditions prohibit using their models for malicious purposes.\n\nTo test a model like \"text-temperature\" with a temperature of 0 (i.e., no noise or randomness), we'll need to use a third-party library that connects to the OpenAI API. One such library is `transformers`.\n\nFirst, you need to install the `transformers` and `",
+              "content": "I can guide you on how to use the `test-temperature` parameter with OpenAI's API, but please note that using a temperature of 0 may not produce meaningful results. Temperature is a hyperparameter that controls the level of randomness in the model's output.\n\nOpenAI's API uses a variant of the GPT-3 model, which is trained on a large corpus of text data. The `test-temperature` parameter allows you to adjust the level of randomness in the model's output",
               "refusal": null,
               "role": "assistant",
               "annotations": null,
@@ -39,7 +39,7 @@
             }
           }
         ],
-        "created": 1754510065,
+        "created": 1756921254,
         "model": "llama3.2:3b-instruct-fp16",
         "object": "chat.completion",
         "service_tier": null,
diff --git a/tests/integration/recordings/responses/3c0bf9ba81b2.json b/tests/integration/recordings/responses/3c0bf9ba81b2.json
index 1b5f16c22..3d2b85e8d 100644
--- a/tests/integration/recordings/responses/3c0bf9ba81b2.json
+++ b/tests/integration/recordings/responses/3c0bf9ba81b2.json
@@ -20,14 +20,14 @@
     "body": {
       "__type__": "openai.types.chat.chat_completion.ChatCompletion",
       "__data__": {
-        "id": "chatcmpl-651",
+        "id": "chatcmpl-334",
         "choices": [
           {
             "finish_reason": "length",
             "index": 0,
             "logprobs": null,
             "message": {
-              "content": "I'm ready to help",
+              "content": "It looks like we've",
               "refusal": null,
               "role": "assistant",
               "annotations": null,
@@ -37,7 +37,7 @@
             }
           }
         ],
-        "created": 1755294941,
+        "created": 1756921086,
         "model": "llama3.2:3b-instruct-fp16",
         "object": "chat.completion",
         "service_tier": null,
diff --git a/tests/integration/recordings/responses/3c3f13cb7794.json b/tests/integration/recordings/responses/3c3f13cb7794.json
index a1f240a9c..117fbcceb 100644
--- a/tests/integration/recordings/responses/3c3f13cb7794.json
+++ b/tests/integration/recordings/responses/3c3f13cb7794.json
@@ -21,7 +21,7 @@
         "__type__": "ollama._types.GenerateResponse",
         "__data__": {
           "model": "llama3.2:3b-instruct-fp16",
-          "created_at": "2025-08-04T22:55:11.338232Z",
+          "created_at": "2025-09-03T17:36:18.136699Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -39,7 +39,7 @@
         "__type__": "ollama._types.GenerateResponse",
         "__data__": {
           "model": "llama3.2:3b-instruct-fp16",
-          "created_at": "2025-08-04T22:55:11.39419Z",
+          "created_at": "2025-09-03T17:36:18.177622Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -57,7 +57,7 @@
         "__type__": "ollama._types.GenerateResponse",
         "__data__": {
           "model": "llama3.2:3b-instruct-fp16",
-          "created_at": "2025-08-04T22:55:11.445346Z",
+          "created_at": "2025-09-03T17:36:18.218104Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -75,7 +75,7 @@
         "__type__": "ollama._types.GenerateResponse",
         "__data__": {
           "model": "llama3.2:3b-instruct-fp16",
-          "created_at": "2025-08-04T22:55:11.496701Z",
+          "created_at": "2025-09-03T17:36:18.258837Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -93,7 +93,7 @@
         "__type__": "ollama._types.GenerateResponse",
         "__data__": {
           "model": "llama3.2:3b-instruct-fp16",
-          "created_at": "2025-08-04T22:55:11.546804Z",
+          "created_at": "2025-09-03T17:36:18.299715Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -111,7 +111,7 @@
         "__type__": "ollama._types.GenerateResponse",
         "__data__": {
           "model": "llama3.2:3b-instruct-fp16",
-          "created_at": "2025-08-04T22:55:11.601009Z",
+          "created_at": "2025-09-03T17:36:18.341602Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -129,7 +129,7 @@
         "__type__": "ollama._types.GenerateResponse",
         "__data__": {
           "model": "llama3.2:3b-instruct-fp16",
-          "created_at": "2025-08-04T22:55:11.652788Z",
+          "created_at": "2025-09-03T17:36:18.385504Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -147,7 +147,7 @@
         "__type__": "ollama._types.GenerateResponse",
         "__data__": {
           "model": "llama3.2:3b-instruct-fp16",
-          "created_at": "2025-08-04T22:55:11.703325Z",
+          "created_at": "2025-09-03T17:36:18.429427Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -165,7 +165,7 @@
         "__type__": "ollama._types.GenerateResponse",
         "__data__": {
           "model": "llama3.2:3b-instruct-fp16",
-          "created_at": "2025-08-04T22:55:11.754033Z",
+          "created_at": "2025-09-03T17:36:18.473547Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -183,7 +183,7 @@
         "__type__": "ollama._types.GenerateResponse",
         "__data__": {
           "model": "llama3.2:3b-instruct-fp16",
-          "created_at": "2025-08-04T22:55:11.804654Z",
+          "created_at": "2025-09-03T17:36:18.516327Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -201,15 +201,15 @@
         "__type__": "ollama._types.GenerateResponse",
         "__data__": {
           "model": "llama3.2:3b-instruct-fp16",
-          "created_at": "2025-08-04T22:55:11.854841Z",
+          "created_at": "2025-09-03T17:36:18.559332Z",
           "done": true,
           "done_reason": "stop",
-          "total_duration": 652371000,
-          "load_duration": 42086042,
+          "total_duration": 628034000,
+          "load_duration": 116384417,
           "prompt_eval_count": 26,
-          "prompt_eval_duration": 78000000,
+          "prompt_eval_duration": 87798792,
           "eval_count": 11,
-          "eval_duration": 531000000,
+          "eval_duration": 423189583,
           "response": "",
           "thinking": null,
           "context": null
diff --git a/tests/integration/recordings/responses/3ca695048bee.json b/tests/integration/recordings/responses/3ca695048bee.json
index bed6762e7..b307b2f98 100644
--- a/tests/integration/recordings/responses/3ca695048bee.json
+++ b/tests/integration/recordings/responses/3ca695048bee.json
@@ -1,7 +1,7 @@
 {
   "request": {
     "method": "POST",
-    "url": "http://localhost:11434/v1/v1/chat/completions",
+    "url": "http://0.0.0.0:11434/v1/v1/chat/completions",
     "headers": {},
     "body": {
       "model": "llama3.2:3b-instruct-fp16",
@@ -39,7 +39,7 @@
       {
         "__type__": "openai.types.chat.chat_completion_chunk.ChatCompletionChunk",
         "__data__": {
-          "id": "chatcmpl-490",
+          "id": "chatcmpl-3",
           "choices": [
             {
               "delta": {
@@ -50,7 +50,7 @@
                 "tool_calls": [
                   {
                     "index": 0,
-                    "id": "call_rolv1ozt",
+                    "id": "call_3kigugt3",
                     "function": {
                       "arguments": "{\"city\":\"Tokyo\"}",
                       "name": "get_weather"
@@ -64,7 +64,7 @@
               "logprobs": null
             }
           ],
-          "created": 1754081852,
+          "created": 1756921361,
           "model": "llama3.2:3b-instruct-fp16",
           "object": "chat.completion.chunk",
           "service_tier": null,
@@ -75,7 +75,7 @@
       {
         "__type__": "openai.types.chat.chat_completion_chunk.ChatCompletionChunk",
         "__data__": {
-          "id": "chatcmpl-490",
+          "id": "chatcmpl-3",
           "choices": [
             {
               "delta": {
@@ -85,12 +85,12 @@
                 "role": "assistant",
                 "tool_calls": null
               },
-              "finish_reason": "stop",
+              "finish_reason": "tool_calls",
               "index": 0,
               "logprobs": null
             }
           ],
-          "created": 1754081852,
+          "created": 1756921361,
           "model": "llama3.2:3b-instruct-fp16",
           "object": "chat.completion.chunk",
           "service_tier": null,
diff --git a/tests/integration/recordings/responses/3dff18060ebc.json b/tests/integration/recordings/responses/3dff18060ebc.json
index e04bb8be7..c3da2998e 100644
--- a/tests/integration/recordings/responses/3dff18060ebc.json
+++ b/tests/integration/recordings/responses/3dff18060ebc.json
@@ -20,390 +20,390 @@
         "data": [
           {
             "embedding": [
-              -0.060643002,
-              0.063731536,
-              -0.059394535,
-              -0.010293381,
-              -0.119798504,
-              0.033409704,
-              0.056838214,
-              -0.006487789,
-              0.029893834,
-              -0.05035498,
-              0.015207984,
-              -0.0634482,
-              0.015118864,
-              -0.08356639,
-              0.009297568,
-              0.04425259,
-              -0.02442732,
-              -0.050995167,
-              -0.028106945,
-              -0.07392448,
-              0.070876844,
-              0.08103935,
-              0.006026678,
-              -0.043081142,
-              0.010737864,
-              -0.01581646,
-              0.035146058,
-              0.06534572,
-              0.036411658,
-              -0.056240093,
-              0.073675275,
-              0.047330413,
-              0.06715632,
-              -0.012079616,
-              -0.018175518,
-              0.0042696777,
-              0.029169064,
-              0.006755428,
-              0.037944797,
-              0.002459526,
-              0.014023556,
-              0.022665394,
-              -0.09053435,
-              0.041958958,
-              -0.0793576,
-              0.032003723,
-              -0.03836551,
-              0.037002493,
-              -0.0036971096,
-              -0.017005432,
-              0.036977224,
-              -0.077020966,
-              -0.020112924,
-              0.07730264,
-              0.04523538,
-              -0.007810078,
-              -0.005882345,
-              0.009965143,
-              0.033477366,
-              0.08996437,
-              0.016154636,
-              0.03699466,
-              -0.03920663,
-              -0.010970169,
-              0.023925098,
-              -0.036968958,
-              -0.008223206,
-              0.018760787,
-              -0.000688964,
-              -0.061974872,
-              -0.030354673,
-              -0.03764463,
-              -0.046544887,
-              0.03845807,
-              -0.010353121,
-              -0.032976467,
-              0.013553099,
-              -0.059050683,
-              0.06307999,
-              0.015977552,
-              -0.048430033,
-              -0.06991109,
-              -0.022508044,
-              0.04406567,
-              0.036172677,
-              0.060487013,
-              -0.04315455,
-              0.028775847,
-              0.006216682,
-              0.01028539,
-              -0.07873024,
-              -0.091566674,
-              0.043936655,
-              0.013187522,
-              -0.0037702306,
-              0.010252617,
-              0.020211454,
-              0.056324948,
-              -0.09704479,
-              0.06579238,
-              0.047095913,
-              0.018813917,
-              0.124447405,
-              -0.064461194,
-              -0.012602576,
-              0.016044088,
-              0.0860477,
-              0.02487444,
-              0.106261514,
-              -0.043173406,
-              -0.04631391,
-              -0.031489294,
-              -0.0018045203,
-              -0.0234808,
-              -0.050789703,
-              0.0046832566,
-              0.04323459,
-              0.057140227,
-              -0.065862894,
-              0.032980002,
-              -0.028766194,
-              0.03784897,
-              0.0002090952,
-              0.04331736,
-              -0.13265643,
-              0.026365368,
-              -0.042440306,
-              -3.335036e-33,
-              -0.0022078454,
-              0.050638728,
-              0.028040074,
-              -0.0339003,
-              -0.004550283,
-              -0.034626767,
-              -0.086259365,
-              0.04313123,
-              0.010241412,
-              0.04403283,
-              -0.030186933,
-              -0.0935834,
-              -0.06522679,
-              -0.059730206,
-              0.037564293,
-              -0.025941465,
-              -0.06653215,
-              0.004382199,
-              0.018841932,
-              -0.03557901,
-              0.022377534,
-              0.0894181,
-              0.033572253,
-              -0.11379638,
-              0.038214155,
-              -0.0444022,
-              0.10258949,
-              -0.07330576,
-              0.089417316,
-              0.05668133,
-              -0.009440494,
-              -0.06464684,
-              0.016628003,
-              0.0073475256,
-              0.00518807,
-              0.0051437207,
-              -0.013597164,
-              -0.04918519,
-              -0.06671375,
-              0.010821772,
-              0.04635121,
-              -0.11489337,
-              -0.055055846,
-              0.040418062,
-              -0.0327241,
-              0.034979116,
-              -0.02358068,
-              -0.012229059,
-              0.048057053,
-              0.011607797,
-              0.00786425,
-              0.038057882,
-              -0.027768329,
-              0.0033014645,
-              -0.0033301115,
-              0.006048222,
-              0.031986434,
-              0.04835162,
-              0.013795478,
-              0.03616475,
-              -0.022675272,
-              0.09197521,
-              0.029851481,
-              0.08111755,
-              -0.086777106,
-              -0.028026069,
-              0.055648096,
-              -0.030405777,
-              -0.016515536,
-              0.031827636,
-              -0.07586154,
-              -0.009904298,
-              0.028109884,
-              0.0022400685,
-              -0.104984276,
-              -0.023682386,
-              -0.02420211,
-              -0.00031999213,
-              0.0016354885,
-              -0.037583202,
-              0.02554201,
-              -0.052216183,
-              0.021622796,
-              0.099114954,
-              -0.06895898,
-              -0.018579148,
-              0.072459795,
-              -0.10584089,
-              -0.08503219,
-              -0.030006522,
-              -0.01574946,
-              -0.056850888,
-              -0.02701468,
-              -0.06409775,
-              0.0057065156,
-              1.2905196e-33,
-              0.054916188,
-              -0.036421828,
-              -0.0023367621,
-              -0.03591332,
-              0.10682448,
-              -0.049314465,
-              0.037890658,
-              0.05061744,
-              -0.08387186,
-              -0.018746993,
-              0.0036053627,
-              0.029014338,
-              -0.0028278087,
-              -0.036458995,
-              0.11148448,
-              0.050991904,
-              0.040261153,
-              0.092449345,
-              -0.013685468,
-              -0.07097927,
-              -0.043229934,
-              -0.060135942,
-              -0.030182164,
-              0.009103864,
-              -0.04419895,
-              0.04841717,
-              0.1172092,
-              -0.009820357,
-              0.0024167346,
-              0.0933731,
-              -0.059857536,
-              0.010170529,
-              -0.03779587,
-              -0.043445412,
-              -0.14679031,
-              -0.022706114,
-              -0.008936355,
-              -0.021539144,
-              -0.021903422,
-              -0.06614074,
-              0.016270082,
-              0.062619805,
-              0.010576195,
-              0.04721768,
-              -0.08721729,
-              0.009404518,
-              -0.017676886,
-              -0.03845903,
-              0.01042728,
-              0.022961272,
-              0.099522196,
-              -0.021459235,
-              0.0017192952,
-              -0.039389413,
-              0.01643467,
-              0.03967745,
-              -0.11970654,
-              0.009909872,
-              0.0038936618,
-              0.018281214,
-              -0.045416683,
-              0.002060889,
-              0.024235422,
-              0.016998425,
-              0.06879841,
-              -0.027463643,
-              -0.018185377,
-              0.053853985,
-              -0.02881535,
-              -0.04521435,
-              0.114714146,
-              0.01980149,
-              -0.057876598,
-              0.01657406,
-              -0.073635235,
-              0.040253133,
-              -0.015108487,
-              0.0066914097,
-              -0.049663424,
-              0.04593752,
-              0.077961996,
-              -0.042919736,
-              0.021851214,
-              0.06381258,
-              0.08111257,
-              -0.07067202,
-              -0.032432877,
-              0.09261935,
-              -0.020485587,
-              0.070126526,
-              -0.020741673,
-              0.09339737,
-              -0.05117133,
-              0.039423097,
-              0.025603252,
-              -1.676899e-08,
-              0.0015320816,
-              0.008086889,
-              -0.017632706,
-              -0.0340569,
-              0.068081565,
-              0.07389828,
-              -0.07586309,
-              -0.1137352,
-              -0.02203125,
-              0.00911275,
-              0.031093195,
-              -0.005707322,
-              -0.046190932,
-              0.0037106895,
-              0.013285116,
-              -0.03215832,
-              -0.05558973,
-              -0.010595662,
-              0.0067340815,
-              -0.025494263,
-              -0.08369286,
-              0.08884646,
-              0.0051370384,
-              -0.051632546,
-              -0.051877208,
-              0.039703675,
-              -0.042113848,
-              0.05714819,
-              0.088881046,
-              0.049764536,
-              0.04144229,
-              0.09467376,
-              -0.037112173,
-              -0.06844063,
-              -0.061656013,
-              0.09893085,
-              -0.059514027,
-              -0.033182237,
-              -0.026037138,
-              0.07761722,
-              0.05612508,
-              0.010711438,
-              0.018973859,
-              0.056075387,
-              -0.04172223,
-              -0.02732456,
-              0.101854175,
-              -0.036197703,
-              -0.029915968,
-              -0.043326378,
-              0.043677974,
-              0.018775862,
-              -0.0042756326,
-              0.055917986,
-              -0.0034246107,
-              0.0602753,
-              -0.13372745,
-              0.008189692,
-              -0.031539913,
-              0.022382092,
-              0.037938736,
-              0.024559673,
-              0.068045974,
-              0.07020884
+              -0.060630284,
+              0.06372823,
+              -0.059383437,
+              -0.010313639,
+              -0.11985778,
+              0.033409074,
+              0.056847293,
+              -0.0064553,
+              0.029896382,
+              -0.05037607,
+              0.015193001,
+              -0.0634204,
+              0.015119892,
+              -0.08354324,
+              0.0092577925,
+              0.044272587,
+              -0.024397198,
+              -0.05100177,
+              -0.028086444,
+              -0.07390362,
+              0.07088186,
+              0.08101153,
+              0.006050408,
+              -0.043090094,
+              0.010714593,
+              -0.01581376,
+              0.0351736,
+              0.06538307,
+              0.03639655,
+              -0.05625738,
+              0.073681176,
+              0.04730274,
+              0.067169026,
+              -0.01207242,
+              -0.018193275,
+              0.0042488067,
+              0.029168725,
+              0.0067459582,
+              0.037927665,
+              0.0024767139,
+              0.014044963,
+              0.022671249,
+              -0.090508185,
+              0.041952047,
+              -0.07933115,
+              0.031992197,
+              -0.038355146,
+              0.037013844,
+              -0.0036946274,
+              -0.016986867,
+              0.03696087,
+              -0.07697335,
+              -0.020080294,
+              0.07733012,
+              0.04521822,
+              -0.007816803,
+              -0.0058926586,
+              0.009962128,
+              0.033492323,
+              0.09000152,
+              0.016161384,
+              0.036999356,
+              -0.039193578,
+              -0.010969346,
+              0.023929566,
+              -0.03698458,
+              -0.008227196,
+              0.018780757,
+              -0.0006967325,
+              -0.062018193,
+              -0.030388007,
+              -0.037649162,
+              -0.04654288,
+              0.038450293,
+              -0.010377299,
+              -0.032971557,
+              0.013547814,
+              -0.059036925,
+              0.0630603,
+              0.0159564,
+              -0.04845087,
+              -0.069917254,
+              -0.022502322,
+              0.04408022,
+              0.03618941,
+              0.060470726,
+              -0.04313285,
+              0.028797466,
+              0.0062393937,
+              0.01027349,
+              -0.078714885,
+              -0.091531575,
+              0.04391341,
+              0.013202597,
+              -0.0037814155,
+              0.0102497,
+              0.020225797,
+              0.05634384,
+              -0.09700619,
+              0.06577961,
+              0.047118917,
+              0.01876648,
+              0.12445029,
+              -0.06447121,
+              -0.012632697,
+              0.016056264,
+              0.08604982,
+              0.024878234,
+              0.10627678,
+              -0.043176394,
+              -0.046339765,
+              -0.03149599,
+              -0.001784808,
+              -0.023469802,
+              -0.05079461,
+              0.0046657966,
+              0.043237828,
+              0.057146583,
+              -0.065833576,
+              0.032975562,
+              -0.028763266,
+              0.037831448,
+              0.00017829033,
+              0.043322463,
+              -0.13265091,
+              0.0263673,
+              -0.04247752,
+              -3.3340873e-33,
+              -0.0022191573,
+              0.050657377,
+              0.028066125,
+              -0.033898965,
+              -0.0045730886,
+              -0.034653578,
+              -0.08628417,
+              0.043108672,
+              0.01022734,
+              0.044009056,
+              -0.03020062,
+              -0.0936044,
+              -0.06522928,
+              -0.059762992,
+              0.037560984,
+              -0.025942331,
+              -0.06655938,
+              0.0043691625,
+              0.018846871,
+              -0.035582166,
+              0.02240012,
+              0.08943218,
+              0.033568345,
+              -0.11379316,
+              0.03822112,
+              -0.044403847,
+              0.10261262,
+              -0.07330182,
+              0.089390896,
+              0.056668896,
+              -0.009407597,
+              -0.0646505,
+              0.016652016,
+              0.007326742,
+              0.005187682,
+              0.0051324354,
+              -0.013595071,
+              -0.04918112,
+              -0.06672084,
+              0.010838405,
+              0.04638185,
+              -0.11490209,
+              -0.055054087,
+              0.040443793,
+              -0.032746885,
+              0.03498173,
+              -0.023567867,
+              -0.012213799,
+              0.048050664,
+              0.01159698,
+              0.007860181,
+              0.03801084,
+              -0.027765153,
+              0.003296162,
+              -0.0033349432,
+              0.006083357,
+              0.03200884,
+              0.048306234,
+              0.013800832,
+              0.036165927,
+              -0.022672432,
+              0.09197581,
+              0.029846204,
+              0.08112345,
+              -0.08677228,
+              -0.028041098,
+              0.0556574,
+              -0.030357547,
+              -0.016538681,
+              0.031826265,
+              -0.07586954,
+              -0.009915978,
+              0.028101236,
+              0.002207158,
+              -0.10496646,
+              -0.023673821,
+              -0.024204832,
+              -0.0003132271,
+              0.0016462951,
+              -0.037603874,
+              0.025533162,
+              -0.05221861,
+              0.021656586,
+              0.099111386,
+              -0.06896361,
+              -0.018568028,
+              0.07245527,
+              -0.10582686,
+              -0.08505038,
+              -0.029969748,
+              -0.015717981,
+              -0.056855034,
+              -0.02698479,
+              -0.06410572,
+              0.0057078917,
+              1.2902391e-33,
+              0.05490771,
+              -0.036417797,
+              -0.0023541928,
+              -0.03591478,
+              0.106852315,
+              -0.04931468,
+              0.037884213,
+              0.050633065,
+              -0.083874516,
+              -0.018756155,
+              0.0036251817,
+              0.028974183,
+              -0.0027879397,
+              -0.036439158,
+              0.11148004,
+              0.051007163,
+              0.040258586,
+              0.09245398,
+              -0.01367112,
+              -0.070999645,
+              -0.043213032,
+              -0.060117763,
+              -0.03019449,
+              0.009107182,
+              -0.044254936,
+              0.04843456,
+              0.117205575,
+              -0.009833911,
+              0.0023962231,
+              0.09339494,
+              -0.059902366,
+              0.0101377955,
+              -0.03777244,
+              -0.04344207,
+              -0.14677393,
+              -0.022666233,
+              -0.008934328,
+              -0.02157697,
+              -0.021902358,
+              -0.06611372,
+              0.016243221,
+              0.062620856,
+              0.01056146,
+              0.04721975,
+              -0.087221384,
+              0.009420561,
+              -0.017691165,
+              -0.03847053,
+              0.010398396,
+              0.022942957,
+              0.099518456,
+              -0.021421565,
+              0.0016765085,
+              -0.039359514,
+              0.01641369,
+              0.039669517,
+              -0.119695365,
+              0.009885617,
+              0.003855461,
+              0.018273395,
+              -0.0454586,
+              0.0020496584,
+              0.024263415,
+              0.016978405,
+              0.06884217,
+              -0.027432522,
+              -0.01813802,
+              0.053840507,
+              -0.028815664,
+              -0.045221787,
+              0.11472852,
+              0.019796453,
+              -0.05785514,
+              0.016556906,
+              -0.07362942,
+              0.04025756,
+              -0.01510899,
+              0.0067040483,
+              -0.049666926,
+              0.045941774,
+              0.077951804,
+              -0.042951427,
+              0.021852365,
+              0.063826546,
+              0.08110754,
+              -0.070652775,
+              -0.03245094,
+              0.09259784,
+              -0.020451743,
+              0.0701599,
+              -0.020740295,
+              0.09339449,
+              -0.051164806,
+              0.039440546,
+              0.02560772,
+              -1.6767814e-08,
+              0.001529873,
+              0.0080792755,
+              -0.017666567,
+              -0.034070052,
+              0.06805411,
+              0.07387949,
+              -0.07592055,
+              -0.11369049,
+              -0.022008128,
+              0.009088418,
+              0.03108134,
+              -0.0056734695,
+              -0.0462051,
+              0.0037219985,
+              0.013269294,
+              -0.03213892,
+              -0.05557376,
+              -0.010602884,
+              0.006751397,
+              -0.025462827,
+              -0.0836812,
+              0.08886153,
+              0.005159859,
+              -0.051621262,
+              -0.051873572,
+              0.039706588,
+              -0.042155124,
+              0.057125967,
+              0.088910565,
+              0.049736783,
+              0.04144574,
+              0.094677895,
+              -0.037107926,
+              -0.06845684,
+              -0.061673928,
+              0.09891817,
+              -0.05952751,
+              -0.0331722,
+              -0.026014913,
+              0.077612035,
+              0.056150436,
+              0.010709955,
+              0.018974187,
+              0.056079865,
+              -0.041700333,
+              -0.02731697,
+              0.10184176,
+              -0.036189064,
+              -0.029914921,
+              -0.043333948,
+              0.043660097,
+              0.018800316,
+              -0.0042763646,
+              0.055898346,
+              -0.0034344571,
+              0.060258396,
+              -0.1337251,
+              0.008184424,
+              -0.031549457,
+              0.022398692,
+              0.037932154,
+              0.024529235,
+              0.068037644,
+              0.07021777
             ],
             "index": 0,
             "object": "embedding"
diff --git a/tests/integration/recordings/responses/417020320684.json b/tests/integration/recordings/responses/417020320684.json
index 56ddea6aa..73f1e4238 100644
--- a/tests/integration/recordings/responses/417020320684.json
+++ b/tests/integration/recordings/responses/417020320684.json
@@ -20,390 +20,390 @@
         "data": [
           {
             "embedding": [
-              -0.06384743,
-              0.013436034,
-              -0.054533605,
-              0.011913119,
-              -0.074255615,
-              -0.13346045,
-              0.04293264,
-              0.045415178,
-              -0.069499195,
-              -0.03594047,
-              0.012013141,
-              0.0068701585,
-              0.088894635,
-              0.0025958198,
-              0.03248322,
-              -0.00781389,
-              -0.05045716,
-              0.0066499636,
-              0.02780642,
-              -0.1278895,
-              0.00061722804,
-              0.04524771,
-              -0.036062278,
-              0.044238217,
-              0.012931149,
-              -0.009267752,
-              0.011908537,
-              0.026050908,
-              0.020050693,
-              -0.033657826,
-              -0.028060015,
-              0.08754526,
-              0.059001748,
-              0.053905424,
-              0.020296838,
-              0.06843132,
-              -0.031828973,
-              -0.08757766,
-              -0.11278083,
-              0.022646705,
-              -0.09042749,
-              -0.0033280335,
-              -0.04013833,
-              -0.03408772,
-              -0.032974605,
-              0.029246835,
-              -0.03902113,
-              0.045517426,
-              -0.0331051,
-              -0.006541718,
-              -0.09631428,
-              -0.011705091,
-              -0.052590065,
-              -0.064790964,
-              0.03107029,
-              -0.012614695,
-              0.0973954,
-              0.0052277497,
-              -0.035061166,
-              -0.14041117,
-              -0.06678556,
-              0.03656035,
-              -0.039271023,
-              0.070130296,
-              -0.001007227,
-              -0.026842492,
-              -0.017554138,
-              0.030476976,
-              0.0640168,
-              -0.03162716,
-              -0.1459817,
-              -0.04540497,
-              -0.018482737,
-              0.06690258,
-              0.030561155,
-              -0.12253459,
-              0.06106281,
-              -0.05676725,
-              -0.005102081,
-              -0.008781471,
-              0.0065009934,
-              -0.016409436,
-              -0.033660814,
-              0.084904715,
-              -0.000299427,
-              -0.073421866,
-              0.038623117,
-              0.15695204,
-              0.010100481,
-              0.025317656,
-              -0.0021393092,
-              -0.046127863,
-              0.062426485,
-              -0.019896954,
-              -0.054696236,
-              0.097949564,
-              0.038487267,
-              -0.072427474,
-              -0.038710196,
-              0.07158003,
-              0.0073204385,
-              -0.051196836,
-              0.031370413,
-              -0.032227658,
-              0.03930787,
-              -0.009667071,
-              0.06993779,
-              -0.052014988,
-              0.049430363,
-              -0.04273174,
-              -0.003752437,
-              -0.041564792,
-              -0.056199003,
-              -0.033390746,
-              0.05104195,
-              0.038621522,
-              -0.002969481,
-              0.08187672,
-              -0.0035807535,
-              0.045314044,
-              0.0068791825,
-              0.016496154,
-              0.016330697,
-              0.007280202,
-              -0.021685049,
-              -0.004648767,
-              -0.007916633,
-              -4.153803e-33,
-              -0.045814347,
-              -0.050876923,
-              -0.038647644,
-              0.010091659,
-              0.0700144,
-              -0.025181346,
-              0.10506424,
-              -0.0049788426,
-              -0.0641887,
-              -0.047635607,
-              0.012736192,
-              0.051960304,
-              -0.0160108,
-              0.08172301,
-              0.023975011,
-              -0.02088898,
-              0.04570414,
-              0.09154945,
-              0.025109906,
-              0.019044904,
-              0.048153024,
-              0.097932264,
-              0.034160685,
-              0.035437047,
-              0.0114016645,
-              -0.043437798,
-              -0.0041986653,
-              -0.055648174,
-              0.011477498,
-              0.0071031414,
-              -0.06427046,
-              -0.02060021,
-              -0.004527582,
-              -0.012953201,
-              0.026594209,
-              -0.012370914,
-              0.008425176,
-              -0.06823755,
-              0.046840925,
-              -0.041645527,
-              -0.025629306,
-              -0.0038959885,
-              0.050076205,
-              -0.008090696,
-              -0.023280276,
-              0.023890443,
-              0.0015592615,
-              0.04615769,
-              -0.06899702,
-              0.041591667,
-              0.0045278594,
-              -0.047615696,
-              0.054234404,
-              0.06972373,
-              -0.016879166,
-              0.04805917,
-              0.012710964,
-              0.0022028312,
-              -0.00632154,
-              -0.03153454,
-              0.02372792,
-              0.06859583,
-              0.07721348,
-              -0.012276763,
-              0.039006572,
-              0.03434665,
-              0.030310014,
-              0.058712285,
-              0.08029841,
-              0.06976497,
-              -0.09046315,
-              0.02376487,
-              -0.008737595,
-              0.038339745,
-              -0.027534455,
-              0.02316122,
-              0.027078442,
-              -0.081344925,
-              -0.010344974,
-              0.04727033,
-              -0.020315375,
-              -0.025998361,
-              -0.017408848,
-              -0.0035885328,
-              -0.018698875,
-              -0.0374002,
-              0.041077297,
-              0.05317115,
-              -0.00557377,
-              -0.058558866,
-              -0.07202089,
-              -0.0750218,
-              0.04825297,
-              0.011333554,
-              -0.022591913,
-              1.3509705e-33,
-              0.006217277,
-              0.03161211,
-              -0.036121942,
-              -0.0016698099,
-              -0.08257381,
-              -0.060688194,
-              0.059951965,
-              0.014476651,
-              0.05951137,
-              0.027058002,
-              -0.0116078025,
-              -0.05761336,
-              0.103633516,
-              -0.0028178988,
-              0.07695233,
-              0.019430202,
-              -0.052228313,
-              0.015157555,
-              -0.001314194,
-              0.027793957,
-              -0.11528974,
-              0.047293015,
-              -0.075984485,
-              -0.07435121,
-              -0.029174728,
-              -0.020066952,
-              -0.03471861,
-              -0.057671476,
-              -0.030140208,
-              0.047475602,
-              0.0122009255,
-              0.011492795,
-              -0.051974766,
-              0.059714273,
-              0.03282909,
-              0.0013831124,
-              0.0577218,
-              -0.04120374,
-              -0.021517176,
-              -0.0067665633,
-              0.14197157,
-              0.057943344,
-              0.010075872,
-              0.096026145,
-              0.014512136,
-              0.021362338,
-              -0.07552857,
-              0.07883896,
-              -0.042723794,
-              -0.06604244,
-              -0.03871113,
-              -0.008144072,
-              0.014999539,
-              -0.049409784,
-              -0.037078433,
-              -0.023772687,
-              0.03742616,
-              0.008203275,
-              -0.08696922,
-              -0.05963844,
-              -0.07733288,
-              -0.056535304,
-              0.029040048,
-              0.007370859,
-              -0.07786975,
-              0.0025485628,
-              -0.10403352,
-              -0.04738507,
-              -0.015877869,
-              -0.11589796,
-              0.09726567,
-              0.0049555353,
-              -0.010271941,
-              0.0066397907,
-              -0.060328998,
-              0.025491165,
-              -0.052938554,
-              -0.0038485127,
-              -0.050254337,
-              0.07681007,
-              0.046079025,
-              0.0074015437,
-              0.0047005047,
-              0.07386609,
-              -0.077935226,
-              0.001350664,
-              0.01371514,
-              0.056624677,
-              0.021921877,
-              0.0072018835,
-              0.0076770596,
-              0.1022247,
-              0.06007294,
-              0.036791492,
-              -0.03775615,
-              -1.1873974e-08,
-              -0.008835198,
-              0.017599683,
-              0.0622159,
-              0.03203167,
-              -0.011572803,
-              0.051924217,
-              -0.011727461,
-              -0.06392444,
-              -0.029854134,
-              0.03257704,
-              0.005516639,
-              -0.012049206,
-              -0.054406274,
-              -0.056717165,
-              -0.030638915,
-              0.14277336,
-              0.028553458,
-              -0.028731374,
-              0.019938445,
-              0.025647435,
-              0.07379124,
-              -0.006680472,
-              0.0061455644,
-              0.09610866,
-              -0.0880125,
-              -0.00892061,
-              0.038242683,
-              0.04831363,
-              0.018802335,
-              -0.10537713,
-              0.048258167,
-              -0.022250284,
-              0.020506755,
-              0.014618206,
-              0.03079222,
-              -0.029113656,
-              0.008291428,
-              -0.045047753,
-              0.002552782,
-              0.02174108,
-              -0.0081180185,
-              0.009036818,
-              -0.013369313,
-              -0.014042713,
-              0.06843612,
-              0.045168996,
-              -0.034600396,
-              -0.07275618,
-              -0.0041681295,
-              -0.05823282,
-              -0.03303698,
-              0.0040505864,
-              -0.020017866,
-              -0.020105122,
-              0.05537091,
-              0.102509096,
-              -0.10799596,
-              -0.013787153,
-              -0.009659191,
-              0.015613784,
-              -0.031229256,
-              0.13294649,
-              0.15243623,
-              -0.022428894
+              -0.063880146,
+              0.013411989,
+              -0.054502595,
+              0.01193493,
+              -0.074262686,
+              -0.13344447,
+              0.04294062,
+              0.045387108,
+              -0.06949706,
+              -0.035939943,
+              0.01200873,
+              0.0068830596,
+              0.08886977,
+              0.0026030506,
+              0.032482542,
+              -0.007821568,
+              -0.05044649,
+              0.006662123,
+              0.027794942,
+              -0.12791364,
+              0.00062353734,
+              0.045270294,
+              -0.03605076,
+              0.044243146,
+              0.0129354475,
+              -0.0092799105,
+              0.011904844,
+              0.026060482,
+              0.020055141,
+              -0.03368774,
+              -0.028043076,
+              0.087557025,
+              0.059002083,
+              0.053893365,
+              0.02027196,
+              0.06840361,
+              -0.03180594,
+              -0.087597735,
+              -0.11277839,
+              0.022651086,
+              -0.09037903,
+              -0.0033202847,
+              -0.040132593,
+              -0.034084503,
+              -0.032953303,
+              0.02925268,
+              -0.03903928,
+              0.04551951,
+              -0.0331016,
+              -0.006518362,
+              -0.09629851,
+              -0.011739161,
+              -0.052575007,
+              -0.064773224,
+              0.031043475,
+              -0.012586444,
+              0.09737276,
+              0.005224713,
+              -0.035071153,
+              -0.1404299,
+              -0.06678175,
+              0.03654573,
+              -0.039277818,
+              0.07014256,
+              -0.0010227569,
+              -0.026846789,
+              -0.0175696,
+              0.03044068,
+              0.06403526,
+              -0.031643596,
+              -0.14598879,
+              -0.045400888,
+              -0.018469285,
+              0.06689445,
+              0.030553635,
+              -0.12255281,
+              0.061046645,
+              -0.05678168,
+              -0.005118667,
+              -0.0087622,
+              0.006514719,
+              -0.016424034,
+              -0.033650044,
+              0.08491301,
+              -0.00029260007,
+              -0.07339515,
+              0.038627055,
+              0.15695965,
+              0.010035773,
+              0.025318887,
+              -0.0021428047,
+              -0.04613549,
+              0.06244243,
+              -0.019905778,
+              -0.05471386,
+              0.09796629,
+              0.0384793,
+              -0.072424814,
+              -0.038704097,
+              0.07158691,
+              0.007360897,
+              -0.05120446,
+              0.0313513,
+              -0.032230332,
+              0.039326303,
+              -0.009643992,
+              0.069905065,
+              -0.052026685,
+              0.049440835,
+              -0.04272916,
+              -0.0037707465,
+              -0.04155246,
+              -0.0561972,
+              -0.03340213,
+              0.05105359,
+              0.038616214,
+              -0.0029470131,
+              0.08188407,
+              -0.0035886324,
+              0.04530431,
+              0.0068888925,
+              0.016499842,
+              0.016347302,
+              0.007283021,
+              -0.021663606,
+              -0.0046215886,
+              -0.007931065,
+              -4.1536508e-33,
+              -0.045777988,
+              -0.050903402,
+              -0.038634304,
+              0.0100991195,
+              0.070007294,
+              -0.025182785,
+              0.1050647,
+              -0.0049731904,
+              -0.064141616,
+              -0.047639705,
+              0.012718577,
+              0.05198462,
+              -0.016051587,
+              0.08170543,
+              0.024008816,
+              -0.020879291,
+              0.045706064,
+              0.091577366,
+              0.02512945,
+              0.019055998,
+              0.048144504,
+              0.097951256,
+              0.034154113,
+              0.03543114,
+              0.011410896,
+              -0.043446988,
+              -0.0041784984,
+              -0.05564714,
+              0.01147717,
+              0.0071039577,
+              -0.06426582,
+              -0.020623188,
+              -0.0045247558,
+              -0.012943628,
+              0.02658834,
+              -0.012385487,
+              0.008399212,
+              -0.06824828,
+              0.04683057,
+              -0.04165085,
+              -0.025662417,
+              -0.0038799767,
+              0.05007075,
+              -0.008117481,
+              -0.023308154,
+              0.023914568,
+              0.0015741173,
+              0.046142872,
+              -0.06898886,
+              0.041611847,
+              0.0045286645,
+              -0.047628563,
+              0.054236773,
+              0.06972688,
+              -0.016889753,
+              0.04806098,
+              0.012714234,
+              0.0022186628,
+              -0.006355918,
+              -0.031550523,
+              0.023726372,
+              0.06859327,
+              0.077228814,
+              -0.01227583,
+              0.03901903,
+              0.034360897,
+              0.03032876,
+              0.058690928,
+              0.08030179,
+              0.06976231,
+              -0.09047136,
+              0.02376998,
+              -0.008751518,
+              0.038334776,
+              -0.02751323,
+              0.023137644,
+              0.027101006,
+              -0.08135271,
+              -0.010334998,
+              0.04730408,
+              -0.02033998,
+              -0.026008504,
+              -0.017415512,
+              -0.0035714875,
+              -0.018727385,
+              -0.037389226,
+              0.041064497,
+              0.05317889,
+              -0.0055602547,
+              -0.058561854,
+              -0.072036326,
+              -0.075019896,
+              0.04825644,
+              0.011348427,
+              -0.02259257,
+              1.3515749e-33,
+              0.006240622,
+              0.031606406,
+              -0.036119435,
+              -0.0016494404,
+              -0.08255665,
+              -0.06069396,
+              0.059934463,
+              0.014492232,
+              0.059514895,
+              0.027053975,
+              -0.011601325,
+              -0.057609312,
+              0.10365583,
+              -0.002784741,
+              0.07693759,
+              0.019432511,
+              -0.052210074,
+              0.015158053,
+              -0.0012768542,
+              0.027789148,
+              -0.115292676,
+              0.047323048,
+              -0.07599195,
+              -0.074344486,
+              -0.029194841,
+              -0.020079462,
+              -0.034749795,
+              -0.05769437,
+              -0.0301632,
+              0.04749987,
+              0.012206333,
+              0.011497502,
+              -0.051970575,
+              0.05972769,
+              0.03281016,
+              0.0013676677,
+              0.057720944,
+              -0.041179247,
+              -0.02150875,
+              -0.0067487382,
+              0.1419711,
+              0.05795878,
+              0.010094941,
+              0.09603845,
+              0.014521089,
+              0.02133803,
+              -0.07551916,
+              0.07887724,
+              -0.04273237,
+              -0.06601746,
+              -0.038729392,
+              -0.008161129,
+              0.015012324,
+              -0.049418066,
+              -0.037083283,
+              -0.02378242,
+              0.03743137,
+              0.008194503,
+              -0.086978436,
+              -0.05960285,
+              -0.07732487,
+              -0.056507926,
+              0.029065313,
+              0.0073954053,
+              -0.077878684,
+              0.0026059505,
+              -0.10405392,
+              -0.04738624,
+              -0.015872862,
+              -0.11591199,
+              0.09724705,
+              0.0049243565,
+              -0.010273523,
+              0.0066429917,
+              -0.060295314,
+              0.02550513,
+              -0.052950058,
+              -0.0038489713,
+              -0.050250847,
+              0.07679287,
+              0.046089787,
+              0.007386997,
+              0.0046740095,
+              0.07385862,
+              -0.07792065,
+              0.0013675193,
+              0.013730894,
+              0.05658653,
+              0.021934126,
+              0.007195913,
+              0.0076705213,
+              0.10221154,
+              0.060060997,
+              0.036779005,
+              -0.037765697,
+              -1.187368e-08,
+              -0.00885571,
+              0.01760442,
+              0.062224448,
+              0.032051455,
+              -0.011581793,
+              0.051908698,
+              -0.011685676,
+              -0.06391574,
+              -0.029866237,
+              0.03258576,
+              0.0055078953,
+              -0.012040446,
+              -0.054406017,
+              -0.056690563,
+              -0.030638037,
+              0.14276367,
+              0.028526368,
+              -0.028743364,
+              0.019917691,
+              0.025652615,
+              0.073813364,
+              -0.0066998666,
+              0.0061508445,
+              0.09610696,
+              -0.08799916,
+              -0.0089272335,
+              0.03823298,
+              0.04832936,
+              0.018829934,
+              -0.10534708,
+              0.048226915,
+              -0.02225069,
+              0.020491786,
+              0.014641141,
+              0.030794447,
+              -0.029119467,
+              0.008283775,
+              -0.04506887,
+              0.0025344177,
+              0.021756247,
+              -0.008108281,
+              0.00904927,
+              -0.013340866,
+              -0.014037631,
+              0.06845187,
+              0.045173325,
+              -0.034587316,
+              -0.07275669,
+              -0.004159724,
+              -0.058231864,
+              -0.033032075,
+              0.0040235794,
+              -0.019985583,
+              -0.020122562,
+              0.055365406,
+              0.10250875,
+              -0.10799118,
+              -0.013780294,
+              -0.009652406,
+              0.015592658,
+              -0.031221472,
+              0.1329332,
+              0.15243866,
+              -0.022426173
             ],
             "index": 0,
             "object": "embedding"
diff --git a/tests/integration/recordings/responses/4420515208a8.json b/tests/integration/recordings/responses/4420515208a8.json
index 4d43b3fb8..779593849 100644
--- a/tests/integration/recordings/responses/4420515208a8.json
+++ b/tests/integration/recordings/responses/4420515208a8.json
@@ -20,390 +20,390 @@
         "data": [
           {
             "embedding": [
-              -0.07471535,
-              0.08136051,
-              -0.0646403,
-              0.011820692,
-              -0.074530184,
-              0.02182932,
-              0.077565186,
-              0.012791591,
-              0.05854512,
-              -0.014144753,
-              0.054007743,
-              -0.026551379,
-              -0.018058892,
-              -0.060439672,
-              -0.019246193,
-              -0.0065063615,
-              -0.047261372,
-              -0.048988443,
-              -0.0904866,
-              -0.066554815,
-              0.09284568,
-              0.021294983,
-              -0.013393054,
-              -0.0066470345,
-              0.008009612,
-              0.016829057,
-              0.039714802,
-              0.021865955,
-              0.014889775,
-              -0.039430078,
-              0.025233349,
-              -0.036833033,
-              0.016638417,
-              0.008795953,
-              -0.05348616,
-              0.0361554,
-              -0.034618407,
-              -0.009877053,
-              0.064839765,
-              -0.015148702,
-              0.020900138,
-              -0.07136567,
-              -0.008516019,
-              0.051174764,
-              -0.06211658,
-              0.059481908,
-              -0.047928233,
-              0.07046077,
-              -0.024866259,
-              -0.010772497,
-              0.06539378,
-              -0.03691645,
-              -0.08241172,
-              0.081707805,
-              0.017110538,
-              0.0129555175,
-              -0.047113538,
-              0.0025686903,
-              0.008714549,
-              0.09987858,
-              0.0496949,
-              -0.025898866,
-              -0.017353507,
-              0.03393223,
-              0.038376898,
-              -0.054239143,
-              0.00860024,
-              -0.040809266,
-              0.02656175,
-              -0.071856335,
-              -0.019946808,
-              -0.041174017,
-              -0.07246157,
-              0.00040759498,
-              0.018743936,
-              0.023058625,
-              0.0166551,
-              -0.063356385,
-              0.034956083,
-              0.05005474,
-              0.00041865162,
-              -0.06177827,
-              0.006278017,
-              0.11141626,
-              0.0040813377,
-              0.08571246,
-              0.023260446,
-              0.057005797,
-              -0.03149278,
-              -0.013331491,
-              -0.04513824,
-              -0.11731193,
-              0.0160608,
-              -0.016902346,
-              -0.028950376,
-              0.03577902,
-              -0.051558092,
-              0.03297068,
-              -0.11266136,
-              0.06640369,
-              0.037849367,
-              0.022930682,
-              0.05809001,
-              -0.03963197,
-              -0.03245654,
-              0.01767903,
-              -0.005010206,
-              0.019044327,
-              0.07743703,
-              -0.020407042,
-              -0.020311069,
-              -0.00953332,
-              0.003143125,
-              -0.00456264,
-              -0.02911311,
-              0.03384037,
-              0.00048523775,
-              0.06419016,
-              0.01071009,
-              0.124172516,
-              -0.0053817774,
-              0.004929672,
-              -0.059669737,
-              0.029508028,
-              -0.13410243,
-              0.016187606,
-              -0.048119176,
-              -6.608228e-33,
-              0.012317927,
-              0.060396116,
-              0.036468223,
-              -0.035990786,
-              -0.041977834,
-              0.01232469,
-              -0.08480998,
-              0.012524896,
-              0.027948672,
-              0.086107045,
-              -0.030785998,
-              -0.06136775,
-              -0.0009515558,
-              -0.025208496,
-              0.045449734,
-              -0.027582139,
-              -0.0095786555,
-              0.0067018326,
-              0.043680843,
-              -0.021498295,
-              0.003277214,
-              0.11862199,
-              0.047027264,
-              -0.13488089,
-              0.025457613,
-              -0.010294456,
-              0.0022531834,
-              -0.061856117,
-              0.10388324,
-              0.01866347,
-              -0.0017658875,
-              -0.051914714,
-              0.04644036,
-              0.037606996,
-              0.03376949,
-              0.006641087,
-              0.022004316,
-              -0.07835444,
-              -0.008207682,
-              0.027414316,
-              0.0173955,
-              -0.075223684,
-              0.006482484,
-              0.02727821,
-              0.00059299107,
-              -0.010945533,
-              -0.020044776,
-              -0.000120837554,
-              0.013701114,
-              0.004716937,
-              0.02277811,
-              0.015490094,
-              -0.0142633,
-              -0.013935009,
-              0.015847908,
-              -0.02308094,
-              0.033789054,
-              -0.039197993,
-              -0.043216396,
-              0.029982513,
-              -0.016503252,
-              0.0698185,
-              0.046076864,
-              0.053330805,
-              -0.055297256,
-              0.025112566,
-              0.014026739,
-              -0.09400958,
-              0.035901215,
-              0.029467817,
-              -0.1319919,
-              -0.0050726864,
-              -0.037837584,
-              -0.0318086,
-              -0.09549526,
-              -0.027866103,
-              0.002436243,
-              -0.007881375,
-              0.058288272,
-              -0.031986125,
-              -0.0607737,
-              -0.023380116,
-              -0.00047972053,
-              0.13766052,
-              -0.060590804,
-              -0.008125084,
-              -0.03488867,
-              -0.102469996,
-              -0.009079019,
-              -0.018955158,
-              -0.0016528872,
-              -0.07709843,
-              -0.043352164,
-              -0.03619871,
-              0.039568264,
-              3.0214064e-33,
-              0.0050480226,
-              0.00017108663,
-              -0.063063554,
-              0.012236582,
-              0.10636841,
-              0.015972469,
-              0.0066562137,
-              0.018790383,
-              -0.047090903,
-              0.04585031,
-              0.007611995,
-              0.032441676,
-              0.03210589,
-              -0.02090312,
-              0.106981054,
-              0.0075532557,
-              0.036063127,
-              0.14623925,
-              0.037788242,
-              -0.043172225,
-              -0.02176524,
-              -0.009350843,
-              -0.06982138,
-              0.015577218,
-              0.02114412,
-              0.030659605,
-              0.084352896,
-              -0.09288308,
-              0.00815284,
-              0.07806744,
-              -0.0816394,
-              0.011901701,
-              0.017101644,
-              0.0040163086,
-              -0.14144793,
-              0.0040214215,
-              0.04631442,
-              0.008958798,
-              -0.0056624487,
-              -0.055584785,
-              0.028006915,
-              0.055925272,
-              0.062281866,
-              0.0860523,
-              -0.12157215,
-              0.021931145,
-              -0.0050777225,
-              0.029814675,
-              -0.012117963,
-              0.048798613,
-              0.06408485,
-              -0.041422654,
-              0.018091682,
-              -0.028209666,
-              -0.021357967,
-              0.055625696,
-              -0.15479031,
-              0.027474454,
-              0.018845506,
-              0.04327976,
-              0.011504344,
-              0.017370872,
-              -0.023188887,
-              0.050985955,
-              0.029468553,
-              0.012529372,
-              -0.045431048,
-              -0.00222149,
-              -0.05612193,
-              -0.07891998,
-              0.0796125,
-              -0.02043551,
-              -0.076230876,
-              0.011581566,
-              -0.035624538,
-              -0.0480372,
-              -0.066065714,
-              -0.057384264,
-              -0.040163297,
-              0.071754575,
-              0.031339016,
-              0.023032097,
-              -0.023996511,
-              0.023609873,
-              0.09607155,
-              -0.06843605,
-              0.014263025,
-              0.088031664,
-              -0.037747264,
-              0.029464351,
-              -0.028663024,
-              0.10216597,
-              -0.06609628,
-              0.0228385,
-              0.04214049,
-              -1.4813483e-08,
-              0.030838875,
-              0.043892786,
-              -0.024579313,
-              -0.09817689,
-              0.0566737,
-              0.09298153,
-              -0.010350536,
-              -0.09840461,
-              0.018022444,
-              -0.0131554445,
-              0.026413994,
-              0.00880124,
-              -0.052855253,
-              -0.04217533,
-              0.030118503,
-              0.017092122,
-              -0.06243192,
-              -0.018758481,
-              -0.015982535,
-              -0.018381983,
-              -0.026471734,
-              0.010303105,
-              -0.03048123,
-              -0.08456848,
-              -0.054054197,
-              0.0100427205,
-              0.029534454,
-              0.1355571,
-              0.033424437,
-              0.12097715,
-              0.04077808,
-              0.0081999,
-              -0.018245617,
-              -0.056846414,
-              -0.12899645,
-              0.12415884,
-              -0.053460255,
-              -0.038143307,
-              0.030224878,
-              0.019799955,
-              0.047839224,
-              0.029400205,
-              0.0015434423,
-              0.06115486,
-              -0.055583358,
-              -0.030215869,
-              0.10799345,
-              -0.07073566,
-              -0.08214588,
-              0.0045075943,
-              -0.0155852465,
-              -0.013693905,
-              -0.00234985,
-              0.026380839,
-              -0.015793327,
-              0.016262477,
-              -0.040624544,
-              -0.013973127,
-              -0.08311349,
-              0.03198475,
-              0.05000169,
-              -0.0038599824,
-              0.07030323,
-              0.0049196184
+              -0.07473014,
+              0.08137506,
+              -0.06463602,
+              0.011821943,
+              -0.07454815,
+              0.021821007,
+              0.077573344,
+              0.012804661,
+              0.05853777,
+              -0.014141324,
+              0.053993534,
+              -0.026554074,
+              -0.018055506,
+              -0.060447972,
+              -0.019253474,
+              -0.006501444,
+              -0.047272332,
+              -0.048944764,
+              -0.090516366,
+              -0.06656194,
+              0.09287066,
+              0.02129739,
+              -0.013401809,
+              -0.006629013,
+              0.0079892,
+              0.016818035,
+              0.03971694,
+              0.021875564,
+              0.014873574,
+              -0.039426163,
+              0.025255844,
+              -0.036836684,
+              0.016627828,
+              0.008789532,
+              -0.053503897,
+              0.03616121,
+              -0.034633957,
+              -0.009877797,
+              0.064843215,
+              -0.01517806,
+              0.020897496,
+              -0.07135096,
+              -0.008519908,
+              0.05118655,
+              -0.062102985,
+              0.059486073,
+              -0.047937352,
+              0.07045817,
+              -0.024867272,
+              -0.010756205,
+              0.06538509,
+              -0.03693754,
+              -0.08240387,
+              0.08169191,
+              0.017090658,
+              0.012944557,
+              -0.047139525,
+              0.0025796075,
+              0.008701712,
+              0.099866174,
+              0.04969699,
+              -0.025922626,
+              -0.017354922,
+              0.03395182,
+              0.038391408,
+              -0.054247838,
+              0.008610521,
+              -0.04077977,
+              0.0265637,
+              -0.07186012,
+              -0.019953186,
+              -0.041191205,
+              -0.07246228,
+              0.00041248833,
+              0.018758524,
+              0.023036895,
+              0.01662864,
+              -0.06335885,
+              0.03495032,
+              0.050063577,
+              0.00043262896,
+              -0.06176693,
+              0.0062733325,
+              0.11142063,
+              0.0040838965,
+              0.085737824,
+              0.023284689,
+              0.05699812,
+              -0.03149832,
+              -0.013344509,
+              -0.045138564,
+              -0.117300816,
+              0.016063986,
+              -0.016894838,
+              -0.028934335,
+              0.03575864,
+              -0.05156192,
+              0.032958068,
+              -0.11266628,
+              0.06640015,
+              0.037839692,
+              0.022948038,
+              0.058071073,
+              -0.039643735,
+              -0.03247236,
+              0.017690921,
+              -0.005001274,
+              0.019046135,
+              0.07745316,
+              -0.020402163,
+              -0.020310633,
+              -0.009519755,
+              0.0031459313,
+              -0.0045639877,
+              -0.029116316,
+              0.033835515,
+              0.00050839526,
+              0.06419946,
+              0.010721198,
+              0.124151744,
+              -0.0053820186,
+              0.00491648,
+              -0.059696514,
+              0.029483523,
+              -0.13409872,
+              0.016187217,
+              -0.048092023,
+              -6.6084764e-33,
+              0.012305612,
+              0.060384244,
+              0.036461998,
+              -0.035974216,
+              -0.04197416,
+              0.012333701,
+              -0.084805995,
+              0.012502633,
+              0.02794982,
+              0.0861082,
+              -0.030791838,
+              -0.061355945,
+              -0.0009604986,
+              -0.0252044,
+              0.045444816,
+              -0.027590565,
+              -0.009594973,
+              0.006712001,
+              0.043692384,
+              -0.021483036,
+              0.003300438,
+              0.11860881,
+              0.047044385,
+              -0.1348901,
+              0.025469579,
+              -0.01029819,
+              0.0022393467,
+              -0.061863262,
+              0.10386513,
+              0.018658707,
+              -0.0017492755,
+              -0.051914047,
+              0.046442248,
+              0.03761067,
+              0.033752125,
+              0.006650237,
+              0.022015076,
+              -0.07834835,
+              -0.008209136,
+              0.027432231,
+              0.017393896,
+              -0.07524756,
+              0.006497012,
+              0.027272953,
+              0.0005804994,
+              -0.010941825,
+              -0.020050043,
+              -0.00012092298,
+              0.013705002,
+              0.004699541,
+              0.022770848,
+              0.015477994,
+              -0.0142482165,
+              -0.013953546,
+              0.015865315,
+              -0.023075614,
+              0.03379947,
+              -0.039221376,
+              -0.043229815,
+              0.02998769,
+              -0.01652291,
+              0.06981088,
+              0.04606923,
+              0.05332633,
+              -0.055300076,
+              0.02511626,
+              0.014049543,
+              -0.09398743,
+              0.03590562,
+              0.029452223,
+              -0.13200304,
+              -0.005059034,
+              -0.03784268,
+              -0.03180819,
+              -0.095502876,
+              -0.027853556,
+              0.0024331037,
+              -0.007881495,
+              0.058296,
+              -0.031999517,
+              -0.06077097,
+              -0.023381822,
+              -0.00048603877,
+              0.13765746,
+              -0.060579,
+              -0.008109843,
+              -0.034873307,
+              -0.1024547,
+              -0.009072849,
+              -0.018931676,
+              -0.0016711762,
+              -0.07710289,
+              -0.043332253,
+              -0.03619527,
+              0.03958017,
+              3.0217083e-33,
+              0.0050329794,
+              0.00016030145,
+              -0.063078895,
+              0.012225751,
+              0.10637338,
+              0.015972024,
+              0.006653195,
+              0.01880781,
+              -0.04708357,
+              0.045863643,
+              0.0076015075,
+              0.03243478,
+              0.032097474,
+              -0.020893326,
+              0.10697852,
+              0.0075498912,
+              0.036074348,
+              0.1462344,
+              0.03779065,
+              -0.043190572,
+              -0.02176097,
+              -0.009340132,
+              -0.06983617,
+              0.015578788,
+              0.021121953,
+              0.030661412,
+              0.08434581,
+              -0.09288574,
+              0.008169474,
+              0.078080945,
+              -0.081626564,
+              0.011895231,
+              0.017099649,
+              0.0040119104,
+              -0.14145434,
+              0.0040375097,
+              0.046316408,
+              0.008959473,
+              -0.0056506568,
+              -0.055587813,
+              0.028007837,
+              0.055937108,
+              0.062269785,
+              0.08602392,
+              -0.12157818,
+              0.021943888,
+              -0.0050934856,
+              0.029819332,
+              -0.012127162,
+              0.048801802,
+              0.06409215,
+              -0.041438665,
+              0.01809265,
+              -0.028214281,
+              -0.0213588,
+              0.05564267,
+              -0.1547868,
+              0.027465124,
+              0.018855799,
+              0.04327939,
+              0.011500479,
+              0.017364705,
+              -0.023216385,
+              0.051007293,
+              0.02946264,
+              0.012533944,
+              -0.04542834,
+              -0.002238765,
+              -0.05611544,
+              -0.0789272,
+              0.07960444,
+              -0.020431034,
+              -0.0762138,
+              0.011588508,
+              -0.035614885,
+              -0.04803985,
+              -0.06607436,
+              -0.057365946,
+              -0.040188126,
+              0.07176218,
+              0.03135825,
+              0.02303279,
+              -0.023997622,
+              0.023614945,
+              0.09607302,
+              -0.06843066,
+              0.014260722,
+              0.08802569,
+              -0.037736766,
+              0.029445928,
+              -0.028643936,
+              0.10217973,
+              -0.0660917,
+              0.022864237,
+              0.042151757,
+              -1.4814046e-08,
+              0.030838449,
+              0.043877687,
+              -0.0245681,
+              -0.09818859,
+              0.056659035,
+              0.0929652,
+              -0.010337853,
+              -0.0983916,
+              0.018008571,
+              -0.0131424805,
+              0.026400762,
+              0.008793538,
+              -0.05285605,
+              -0.042175982,
+              0.030133193,
+              0.01710666,
+              -0.06242493,
+              -0.018753909,
+              -0.015986755,
+              -0.018400662,
+              -0.026477808,
+              0.010281372,
+              -0.030476814,
+              -0.084556945,
+              -0.05402664,
+              0.010030052,
+              0.029531356,
+              0.13555466,
+              0.033426728,
+              0.12098221,
+              0.040777553,
+              0.008206964,
+              -0.018235989,
+              -0.0568263,
+              -0.1289943,
+              0.12416113,
+              -0.053454727,
+              -0.038151894,
+              0.030221034,
+              0.019807614,
+              0.047819767,
+              0.029434063,
+              0.0015704447,
+              0.0611775,
+              -0.05557245,
+              -0.030236417,
+              0.10799873,
+              -0.07073352,
+              -0.08215229,
+              0.004518122,
+              -0.015573616,
+              -0.013696145,
+              -0.0023438279,
+              0.026377691,
+              -0.015769389,
+              0.016251203,
+              -0.04062322,
+              -0.013962793,
+              -0.08309221,
+              0.031991288,
+              0.049991824,
+              -0.0038595141,
+              0.07031122,
+              0.0049263495
             ],
             "index": 0,
             "object": "embedding"
diff --git a/tests/integration/recordings/responses/44a1d9de0602.json b/tests/integration/recordings/responses/44a1d9de0602.json
index 2d158a06c..d714d1334 100644
--- a/tests/integration/recordings/responses/44a1d9de0602.json
+++ b/tests/integration/recordings/responses/44a1d9de0602.json
@@ -20,7 +20,7 @@
     "body": {
       "__type__": "openai.types.chat.chat_completion.ChatCompletion",
       "__data__": {
-        "id": "chatcmpl-987",
+        "id": "chatcmpl-507",
         "choices": [
           {
             "finish_reason": "length",
@@ -37,7 +37,7 @@
             }
           }
         ],
-        "created": 1755294921,
+        "created": 1756921150,
         "model": "llama3.2:3b-instruct-fp16",
         "object": "chat.completion",
         "service_tier": null,
diff --git a/tests/integration/recordings/responses/44fb9cf5875f.json b/tests/integration/recordings/responses/44fb9cf5875f.json
index c7b0333f2..17c538862 100644
--- a/tests/integration/recordings/responses/44fb9cf5875f.json
+++ b/tests/integration/recordings/responses/44fb9cf5875f.json
@@ -20,15 +20,15 @@
       "__type__": "ollama._types.GenerateResponse",
       "__data__": {
         "model": "llama3.2:3b-instruct-fp16",
-        "created_at": "2025-07-31T17:59:42.166585642Z",
+        "created_at": "2025-09-03T17:41:49.581065Z",
         "done": true,
         "done_reason": "stop",
-        "total_duration": 9490295253,
-        "load_duration": 42349084,
+        "total_duration": 2391571708,
+        "load_duration": 182022958,
         "prompt_eval_count": 20,
-        "prompt_eval_duration": 545470166,
+        "prompt_eval_duration": 74456583,
         "eval_count": 51,
-        "eval_duration": 8901928284,
+        "eval_duration": 2134471458,
         "response": "It seems like you're trying to test the system, but I'm not sure what specific functionality or feature you'd like to test. Could you please provide more context or clarify what you're looking for? I'll do my best to assist you!",
         "thinking": null,
         "context": null
diff --git a/tests/integration/recordings/responses/48d2fb183a2a.json b/tests/integration/recordings/responses/48d2fb183a2a.json
index c8fbcb07d..1b5ee286c 100644
--- a/tests/integration/recordings/responses/48d2fb183a2a.json
+++ b/tests/integration/recordings/responses/48d2fb183a2a.json
@@ -67,15 +67,15 @@
       "__type__": "ollama._types.GenerateResponse",
       "__data__": {
         "model": "llama3.2:3b-instruct-fp16",
-        "created_at": "2025-08-04T22:55:40.583477Z",
+        "created_at": "2025-09-03T17:36:40.283084Z",
         "done": true,
         "done_reason": "stop",
-        "total_duration": 3928481500,
-        "load_duration": 151903250,
+        "total_duration": 2900042958,
+        "load_duration": 83372125,
         "prompt_eval_count": 259,
-        "prompt_eval_duration": 468000000,
+        "prompt_eval_duration": 352890750,
         "eval_count": 60,
-        "eval_duration": 3306000000,
+        "eval_duration": 2462885208,
         "response": "{\n  \"first_name\": \"Michael\",\n  \"last_name\": \"Jordan\",\n  \"year_of_birth\": 1963,\n  \"nba_stats\": {\n    \"year_for_draft\": 1984,\n    \"num_seasons_in_nba\": 15\n  }\n}",
         "thinking": null,
         "context": null
diff --git a/tests/integration/recordings/responses/50340cd4d253.json b/tests/integration/recordings/responses/50340cd4d253.json
index f35923c06..3101fa9d8 100644
--- a/tests/integration/recordings/responses/50340cd4d253.json
+++ b/tests/integration/recordings/responses/50340cd4d253.json
@@ -20,15 +20,15 @@
       "__type__": "ollama._types.GenerateResponse",
       "__data__": {
         "model": "llama-guard3:1b",
-        "created_at": "2025-08-01T23:14:19.298378Z",
+        "created_at": "2025-09-03T17:38:01.239743Z",
         "done": true,
         "done_reason": "stop",
-        "total_duration": 266786083,
-        "load_duration": 53820458,
+        "total_duration": 207264667,
+        "load_duration": 73437959,
         "prompt_eval_count": 216,
-        "prompt_eval_duration": 192000000,
+        "prompt_eval_duration": 121657333,
         "eval_count": 2,
-        "eval_duration": 17000000,
+        "eval_duration": 11348417,
         "response": "safe",
         "thinking": null,
         "context": null
diff --git a/tests/integration/recordings/responses/5370751803dc.json b/tests/integration/recordings/responses/5370751803dc.json
index 1edae9956..af1d8efab 100644
--- a/tests/integration/recordings/responses/5370751803dc.json
+++ b/tests/integration/recordings/responses/5370751803dc.json
@@ -20,390 +20,390 @@
         "data": [
           {
             "embedding": [
-              -0.07649938,
-              0.021244217,
-              -0.036287725,
-              -0.0011695292,
-              -0.048568938,
-              -0.13184524,
-              -0.08424354,
-              0.059378363,
-              -0.06171173,
-              -0.009400254,
-              -0.08092405,
-              0.05547966,
-              0.05243954,
-              0.026002606,
-              0.06304219,
-              -0.062263194,
-              -0.06520713,
-              -0.022376515,
-              0.017407224,
-              -0.11619268,
-              -0.03641897,
-              0.04050772,
-              -0.032505907,
-              -0.017739171,
-              0.057254575,
-              0.012360873,
-              -0.018550506,
-              -0.029990712,
-              0.00235547,
-              0.0067841834,
-              -0.088615544,
-              0.07800687,
-              0.037015557,
-              0.029492933,
-              -0.019656634,
-              0.054334868,
-              -0.0006793985,
-              -0.08961444,
-              -0.05305694,
-              -0.012659472,
-              -0.0860912,
-              0.07697376,
-              -0.038515005,
-              -0.011632789,
-              -0.032334387,
-              -0.0075316867,
-              -0.024749892,
-              -0.068094365,
-              -0.030428912,
-              -0.02603917,
-              -0.09692951,
-              0.009892155,
-              -0.05358676,
-              -0.09094546,
-              -0.009154104,
-              -0.008819028,
-              0.048186116,
-              -0.0033502842,
-              -0.005917261,
-              -0.13302499,
-              -0.09727019,
-              0.013533918,
-              0.047219984,
-              0.062738694,
-              -0.01572617,
-              -0.037660386,
-              -0.016604222,
-              0.029844316,
-              0.093244925,
-              -0.06728843,
-              -0.13382566,
-              -0.020838322,
-              -0.025856238,
-              0.11628718,
-              0.0306645,
-              -0.10493003,
-              0.038982447,
-              -0.010721579,
-              -0.0013596424,
-              0.020682583,
-              0.0018240656,
-              0.027716527,
-              -0.078466296,
-              0.10784201,
-              0.029109064,
-              -0.05404029,
-              0.030583676,
-              0.07008342,
-              -0.03429503,
-              0.009839805,
-              0.03469849,
-              -0.042428855,
-              0.06508966,
-              0.026623009,
-              -0.032148074,
-              0.07619082,
-              0.020044614,
-              -0.030803965,
-              -0.071872465,
-              0.027219178,
-              -0.018790914,
-              -0.0541197,
-              0.07494771,
-              0.01770988,
-              0.03380063,
-              0.024214497,
-              0.09087066,
-              -0.052000217,
-              0.04061227,
-              -0.018418813,
-              -0.012485012,
-              -0.06401856,
-              -0.023183277,
-              -0.06190061,
-              0.053444423,
-              0.047886662,
-              -0.010557972,
-              0.078470305,
-              0.03581419,
-              0.02720849,
-              0.022449464,
-              -0.004947443,
-              -0.024473231,
-              0.003690138,
-              0.00033914045,
-              -0.00892056,
-              0.00927688,
-              2.0050864e-34,
-              -0.03232352,
-              -0.0242469,
-              0.02715213,
-              0.021707827,
-              0.06515407,
-              -0.019538436,
-              0.0531206,
-              0.007928102,
-              -0.039223887,
-              -0.020031622,
-              0.007848442,
-              0.02391591,
-              0.014990736,
-              0.11268782,
-              0.06107525,
-              -0.011977935,
-              0.016781967,
-              0.045509085,
-              0.0013573953,
-              0.009146736,
-              0.013215661,
-              -0.01195797,
-              0.02703829,
-              0.007053157,
-              0.022530165,
-              -0.013689941,
-              -0.004301088,
-              -0.0007768117,
-              0.033448935,
-              0.011239952,
-              -0.05143586,
-              -0.07399211,
-              -0.031036023,
-              0.019600574,
-              -0.0103345895,
-              -0.0029444918,
-              -0.0047988347,
-              -0.10445514,
-              0.034700666,
-              -0.024362778,
-              -0.0471351,
-              0.03554556,
-              0.037065983,
-              -0.016996143,
-              0.005622871,
-              0.050610665,
-              -0.008597168,
-              0.0059816362,
-              -0.12275667,
-              0.03674253,
-              -0.022365745,
-              -0.00964108,
-              0.07596107,
-              0.08905326,
-              0.016492268,
-              0.044219263,
-              0.06803503,
-              0.06454952,
-              -0.050047003,
-              -0.0017108961,
-              -0.00074994087,
-              0.09930796,
-              0.09251372,
-              -0.011378917,
-              0.050366722,
-              0.07712465,
-              0.009745006,
-              0.1009996,
-              0.03286012,
-              0.064262226,
-              -0.044561703,
-              0.038564857,
-              -0.019407123,
-              0.03742708,
-              -0.0017875227,
-              0.011954917,
-              0.01135132,
-              -0.10406638,
-              0.06980167,
-              0.019202363,
-              -0.028420014,
-              -0.0136866,
-              0.048647687,
-              -0.015362756,
-              -0.034191117,
-              -0.055556074,
-              0.0050155777,
-              0.025966194,
-              -0.0009168385,
-              -0.0042535486,
-              -0.06399157,
-              -0.059880342,
-              0.081461415,
-              0.014113321,
-              -0.038159303,
-              -2.1536519e-33,
-              -0.027272146,
-              -0.034751415,
-              -0.024606032,
-              0.026892362,
-              -0.09076156,
-              -0.045825478,
-              0.01362092,
-              0.0023044816,
-              0.054052215,
-              0.032981824,
-              -0.029818065,
-              -0.058822677,
-              0.09836217,
-              0.032525893,
-              0.110115595,
-              0.020737587,
-              -0.09583008,
-              0.0005333771,
-              0.0019376605,
-              0.017484892,
-              -0.06849545,
-              0.064435944,
-              -0.050152197,
-              -0.048923954,
-              -0.027651085,
-              -0.014845199,
-              -0.12104595,
-              -0.04417338,
-              -0.011146107,
-              0.058580566,
-              -0.007487375,
-              0.038694676,
-              -0.07034722,
-              0.030289542,
-              0.055677116,
-              -0.0011476888,
-              0.017125413,
-              -0.042026866,
-              -0.016522061,
-              -0.025752945,
-              0.11801853,
-              0.042021915,
-              0.06467938,
-              0.046182197,
-              0.015046265,
-              0.029888034,
-              -0.039066464,
-              0.087210484,
-              -0.012382869,
-              -0.035691217,
-              -0.0481768,
-              0.041446336,
-              0.03895,
-              -0.025257591,
-              -0.028859945,
-              -0.029144095,
-              0.029815607,
-              0.051508367,
-              -0.08636757,
-              -0.06916314,
-              -0.07273463,
-              -0.059568703,
-              0.00502403,
-              0.025671752,
-              -0.022013027,
-              0.024832714,
-              -0.09721394,
-              0.0063272356,
-              -0.04942868,
-              -0.13045275,
-              0.1247814,
-              -0.013577642,
-              -0.022800498,
-              0.03898444,
-              -0.07545284,
-              0.04942631,
-              0.00082998566,
-              0.004718136,
-              -0.04070612,
-              0.063641116,
-              0.11005218,
-              0.020110086,
-              -0.048857097,
-              0.05847898,
-              -0.066304415,
-              0.026930936,
-              -0.06279101,
-              -0.014113123,
-              0.023336235,
-              0.023582496,
-              -0.0020861977,
-              0.07764345,
-              0.03095139,
-              0.020153554,
-              -0.020101866,
-              -2.4304368e-08,
-              0.020170629,
-              -0.008566916,
-              0.06203045,
-              -0.0083030015,
-              0.02522894,
-              0.08902528,
-              -0.008051052,
-              -0.01893583,
-              -0.0355399,
-              0.06187224,
-              -0.017073143,
-              -0.030130422,
-              -0.10230193,
-              -0.06516148,
-              -0.004159112,
-              0.10910979,
-              -0.021820752,
-              -0.05356566,
-              0.011770625,
-              0.052257556,
-              0.058287114,
-              0.0053074392,
-              -0.05998588,
-              0.0871507,
-              -0.082790464,
-              -0.040782016,
-              0.06573996,
-              0.028298022,
-              -0.012104256,
-              -0.07195988,
-              0.014542897,
-              -0.032275774,
-              0.0027686171,
-              0.038691588,
-              0.05546941,
-              -0.015204906,
-              0.054877073,
-              -0.025119307,
-              -0.0337842,
-              0.0030478975,
-              -0.037556846,
-              0.015074203,
-              0.022833891,
-              0.012173256,
-              0.035718966,
-              0.0068811844,
-              -0.040539283,
-              -0.04956289,
-              -0.054521065,
-              -0.07317816,
-              -0.024969948,
-              -0.0021052386,
-              -0.013215133,
-              -0.06650142,
-              0.02316441,
-              0.046906833,
-              -0.13285862,
-              -0.010965043,
-              -0.024110796,
-              0.043096602,
-              0.024323147,
-              0.069191284,
-              0.15650614,
-              0.0177121
+              -0.07642644,
+              0.0213101,
+              -0.03612849,
+              -0.0012144424,
+              -0.048599217,
+              -0.13194773,
+              -0.084226094,
+              0.059389386,
+              -0.0617182,
+              -0.009323243,
+              -0.08099486,
+              0.055514984,
+              0.052610602,
+              0.026061919,
+              0.063071534,
+              -0.062316332,
+              -0.065115415,
+              -0.022351492,
+              0.017378356,
+              -0.11605584,
+              -0.036349725,
+              0.0404155,
+              -0.0325302,
+              -0.01770141,
+              0.05722761,
+              0.012393438,
+              -0.018529164,
+              -0.030017126,
+              0.002365914,
+              0.0066701965,
+              -0.08862459,
+              0.0779319,
+              0.03702611,
+              0.029523117,
+              -0.01977821,
+              0.05424799,
+              -0.00074063655,
+              -0.08949148,
+              -0.05312112,
+              -0.012703181,
+              -0.08622611,
+              0.07689996,
+              -0.038602136,
+              -0.011616902,
+              -0.03234132,
+              -0.0073969415,
+              -0.024779495,
+              -0.067999884,
+              -0.03039565,
+              -0.025974417,
+              -0.09690519,
+              0.009931951,
+              -0.05362519,
+              -0.09107193,
+              -0.009222061,
+              -0.008804084,
+              0.048185978,
+              -0.003329437,
+              -0.0058579347,
+              -0.13306528,
+              -0.09721703,
+              0.013474277,
+              0.047286008,
+              0.06279936,
+              -0.01582815,
+              -0.03771013,
+              -0.01651892,
+              0.029905442,
+              0.09326656,
+              -0.06746783,
+              -0.13385954,
+              -0.020873511,
+              -0.02586237,
+              0.11623731,
+              0.030632136,
+              -0.10494776,
+              0.03905967,
+              -0.010701787,
+              -0.0014734551,
+              0.020711906,
+              0.0017687598,
+              0.027797814,
+              -0.078500465,
+              0.10791581,
+              0.02910256,
+              -0.05398749,
+              0.030513834,
+              0.07001416,
+              -0.034323946,
+              0.00986597,
+              0.034644563,
+              -0.04232179,
+              0.065106474,
+              0.026648693,
+              -0.032122962,
+              0.07616709,
+              0.020026332,
+              -0.030642457,
+              -0.07188906,
+              0.027189687,
+              -0.018678213,
+              -0.05416582,
+              0.07488992,
+              0.017753933,
+              0.03386007,
+              0.02414506,
+              0.09077034,
+              -0.052096054,
+              0.040722203,
+              -0.018450806,
+              -0.012474094,
+              -0.06403705,
+              -0.023205942,
+              -0.061878704,
+              0.053436812,
+              0.047876816,
+              -0.010608645,
+              0.07852118,
+              0.03579911,
+              0.027097313,
+              0.022424318,
+              -0.004912598,
+              -0.02455264,
+              0.003700777,
+              0.00039888592,
+              -0.008842094,
+              0.009365857,
+              2.05052e-34,
+              -0.03236592,
+              -0.024301885,
+              0.027186498,
+              0.021633558,
+              0.06519107,
+              -0.019539308,
+              0.05306087,
+              0.007985293,
+              -0.03927361,
+              -0.020062907,
+              0.008070545,
+              0.02382429,
+              0.015006528,
+              0.1128094,
+              0.06113956,
+              -0.011911169,
+              0.016901307,
+              0.045509744,
+              0.0013988831,
+              0.00907712,
+              0.01314859,
+              -0.012022324,
+              0.027043821,
+              0.0071581583,
+              0.022573117,
+              -0.013721936,
+              -0.004378743,
+              -0.0007087661,
+              0.033585846,
+              0.011227843,
+              -0.05136015,
+              -0.0739591,
+              -0.03094639,
+              0.01957863,
+              -0.010360539,
+              -0.0029881562,
+              -0.00480912,
+              -0.10446798,
+              0.034694213,
+              -0.02424012,
+              -0.047155295,
+              0.035451673,
+              0.037169226,
+              -0.016986743,
+              0.0056092087,
+              0.05057555,
+              -0.008601115,
+              0.0060349177,
+              -0.12273999,
+              0.036871877,
+              -0.022267655,
+              -0.009739047,
+              0.075974636,
+              0.08902226,
+              0.01647873,
+              0.044345584,
+              0.06792565,
+              0.06456903,
+              -0.050189856,
+              -0.0016995457,
+              -0.00090498856,
+              0.09925942,
+              0.09253569,
+              -0.011321612,
+              0.050309792,
+              0.07697773,
+              0.0100068,
+              0.101032645,
+              0.03268899,
+              0.06433435,
+              -0.044524822,
+              0.03860177,
+              -0.019314477,
+              0.037440598,
+              -0.0017394378,
+              0.011816814,
+              0.011359969,
+              -0.1040215,
+              0.06984421,
+              0.01910163,
+              -0.028409261,
+              -0.013704911,
+              0.048502754,
+              -0.015429918,
+              -0.03423058,
+              -0.055616368,
+              0.005001686,
+              0.026054256,
+              -0.0007700968,
+              -0.0041726283,
+              -0.0640977,
+              -0.05985385,
+              0.0813829,
+              0.014288322,
+              -0.038147252,
+              -2.1576616e-33,
+              -0.027279941,
+              -0.034765568,
+              -0.02465107,
+              0.026859807,
+              -0.090699576,
+              -0.045698144,
+              0.013666582,
+              0.002109106,
+              0.054007426,
+              0.032838397,
+              -0.029939773,
+              -0.058843046,
+              0.09825693,
+              0.03251322,
+              0.109977886,
+              0.020682266,
+              -0.0958973,
+              0.0005566991,
+              0.0018037638,
+              0.017544486,
+              -0.06843023,
+              0.06435102,
+              -0.050149646,
+              -0.048880838,
+              -0.027535524,
+              -0.014993001,
+              -0.1210176,
+              -0.04412877,
+              -0.011025324,
+              0.058610573,
+              -0.007498303,
+              0.038722932,
+              -0.07025986,
+              0.030281536,
+              0.055707317,
+              -0.001162887,
+              0.01707519,
+              -0.042081844,
+              -0.016578361,
+              -0.025714336,
+              0.117893435,
+              0.04196084,
+              0.064787276,
+              0.046081997,
+              0.014950138,
+              0.030026693,
+              -0.039077066,
+              0.087156676,
+              -0.012328571,
+              -0.035646956,
+              -0.048145168,
+              0.041394625,
+              0.038984135,
+              -0.025188481,
+              -0.028836856,
+              -0.02917782,
+              0.029690607,
+              0.051454436,
+              -0.08629761,
+              -0.06921346,
+              -0.07273269,
+              -0.05952071,
+              0.0050034616,
+              0.025693603,
+              -0.022103382,
+              0.024972659,
+              -0.09724792,
+              0.0062089814,
+              -0.04963219,
+              -0.13054384,
+              0.124669954,
+              -0.01361085,
+              -0.022798477,
+              0.039057832,
+              -0.07550591,
+              0.049364913,
+              0.0007779102,
+              0.004692535,
+              -0.040757872,
+              0.06355995,
+              0.110190175,
+              0.02015945,
+              -0.048807338,
+              0.05842704,
+              -0.066375315,
+              0.026938869,
+              -0.062775925,
+              -0.014049011,
+              0.023343485,
+              0.02358394,
+              -0.002172394,
+              0.07766165,
+              0.031056313,
+              0.020171564,
+              -0.020073414,
+              -2.4317085e-08,
+              0.020261949,
+              -0.008623839,
+              0.0621209,
+              -0.008334477,
+              0.02526615,
+              0.08902315,
+              -0.007958188,
+              -0.018911751,
+              -0.035572145,
+              0.06189234,
+              -0.017249323,
+              -0.030186126,
+              -0.10225455,
+              -0.06522741,
+              -0.004033112,
+              0.10897627,
+              -0.02168822,
+              -0.053784374,
+              0.011841631,
+              0.052263785,
+              0.058334205,
+              0.0052479547,
+              -0.06017166,
+              0.08723854,
+              -0.08275336,
+              -0.040676847,
+              0.065786876,
+              0.028317772,
+              -0.012168614,
+              -0.07196286,
+              0.014588226,
+              -0.03231537,
+              0.0028357722,
+              0.03868031,
+              0.055439528,
+              -0.015238348,
+              0.05482384,
+              -0.025080629,
+              -0.033771332,
+              0.0030752022,
+              -0.037511814,
+              0.015122315,
+              0.02292684,
+              0.012024873,
+              0.03559873,
+              0.006865039,
+              -0.04049267,
+              -0.049685854,
+              -0.05455341,
+              -0.073071465,
+              -0.024902396,
+              -0.002133957,
+              -0.013212662,
+              -0.06657236,
+              0.023245512,
+              0.046919,
+              -0.13278763,
+              -0.011092663,
+              -0.023939205,
+              0.043182902,
+              0.024406029,
+              0.06922961,
+              0.15658055,
+              0.017658537
             ],
             "index": 0,
             "object": "embedding"
diff --git a/tests/integration/recordings/responses/545d86510a80.json b/tests/integration/recordings/responses/545d86510a80.json
index 8126fd241..7cd718d56 100644
--- a/tests/integration/recordings/responses/545d86510a80.json
+++ b/tests/integration/recordings/responses/545d86510a80.json
@@ -22,7 +22,7 @@
         "__type__": "ollama._types.GenerateResponse",
         "__data__": {
           "model": "llama3.2:3b-instruct-fp16",
-          "created_at": "2025-08-01T23:14:38.59711Z",
+          "created_at": "2025-09-03T17:42:32.625862Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -40,7 +40,7 @@
         "__type__": "ollama._types.GenerateResponse",
         "__data__": {
           "model": "llama3.2:3b-instruct-fp16",
-          "created_at": "2025-08-01T23:14:38.671294Z",
+          "created_at": "2025-09-03T17:42:32.668885Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -58,7 +58,7 @@
         "__type__": "ollama._types.GenerateResponse",
         "__data__": {
           "model": "llama3.2:3b-instruct-fp16",
-          "created_at": "2025-08-01T23:14:38.736161Z",
+          "created_at": "2025-09-03T17:42:32.710947Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -76,7 +76,7 @@
         "__type__": "ollama._types.GenerateResponse",
         "__data__": {
           "model": "llama3.2:3b-instruct-fp16",
-          "created_at": "2025-08-01T23:14:38.809857Z",
+          "created_at": "2025-09-03T17:42:32.752286Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -94,7 +94,7 @@
         "__type__": "ollama._types.GenerateResponse",
         "__data__": {
           "model": "llama3.2:3b-instruct-fp16",
-          "created_at": "2025-08-01T23:14:38.883599Z",
+          "created_at": "2025-09-03T17:42:32.793309Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -112,7 +112,7 @@
         "__type__": "ollama._types.GenerateResponse",
         "__data__": {
           "model": "llama3.2:3b-instruct-fp16",
-          "created_at": "2025-08-01T23:14:38.942471Z",
+          "created_at": "2025-09-03T17:42:32.834578Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -130,7 +130,7 @@
         "__type__": "ollama._types.GenerateResponse",
         "__data__": {
           "model": "llama3.2:3b-instruct-fp16",
-          "created_at": "2025-08-01T23:14:38.999844Z",
+          "created_at": "2025-09-03T17:42:32.876536Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -148,7 +148,7 @@
         "__type__": "ollama._types.GenerateResponse",
         "__data__": {
           "model": "llama3.2:3b-instruct-fp16",
-          "created_at": "2025-08-01T23:14:39.050862Z",
+          "created_at": "2025-09-03T17:42:32.918807Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -166,7 +166,7 @@
         "__type__": "ollama._types.GenerateResponse",
         "__data__": {
           "model": "llama3.2:3b-instruct-fp16",
-          "created_at": "2025-08-01T23:14:39.104589Z",
+          "created_at": "2025-09-03T17:42:32.960101Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -184,7 +184,7 @@
         "__type__": "ollama._types.GenerateResponse",
         "__data__": {
           "model": "llama3.2:3b-instruct-fp16",
-          "created_at": "2025-08-01T23:14:39.158301Z",
+          "created_at": "2025-09-03T17:42:33.00196Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -202,7 +202,7 @@
         "__type__": "ollama._types.GenerateResponse",
         "__data__": {
           "model": "llama3.2:3b-instruct-fp16",
-          "created_at": "2025-08-01T23:14:39.210985Z",
+          "created_at": "2025-09-03T17:42:33.043876Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -220,7 +220,7 @@
         "__type__": "ollama._types.GenerateResponse",
         "__data__": {
           "model": "llama3.2:3b-instruct-fp16",
-          "created_at": "2025-08-01T23:14:39.263525Z",
+          "created_at": "2025-09-03T17:42:33.08756Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -238,15 +238,15 @@
         "__type__": "ollama._types.GenerateResponse",
         "__data__": {
           "model": "llama3.2:3b-instruct-fp16",
-          "created_at": "2025-08-01T23:14:39.314455Z",
+          "created_at": "2025-09-03T17:42:33.12966Z",
           "done": true,
           "done_reason": "stop",
-          "total_duration": 914060542,
-          "load_duration": 63705209,
+          "total_duration": 648814958,
+          "load_duration": 75300875,
           "prompt_eval_count": 408,
-          "prompt_eval_duration": 95000000,
+          "prompt_eval_duration": 66740291,
           "eval_count": 13,
-          "eval_duration": 753000000,
+          "eval_duration": 505313125,
           "response": "",
           "thinking": null,
           "context": null
diff --git a/tests/integration/recordings/responses/554de3cd986f.json b/tests/integration/recordings/responses/554de3cd986f.json
index 990de1928..7a359c50e 100644
--- a/tests/integration/recordings/responses/554de3cd986f.json
+++ b/tests/integration/recordings/responses/554de3cd986f.json
@@ -22,7 +22,7 @@
         "__type__": "ollama._types.GenerateResponse",
         "__data__": {
           "model": "llama3.2:3b-instruct-fp16",
-          "created_at": "2025-08-01T23:14:04.40585Z",
+          "created_at": "2025-09-03T17:37:51.805591Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -40,7 +40,7 @@
         "__type__": "ollama._types.GenerateResponse",
         "__data__": {
           "model": "llama3.2:3b-instruct-fp16",
-          "created_at": "2025-08-01T23:14:04.455647Z",
+          "created_at": "2025-09-03T17:37:51.850067Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -58,7 +58,7 @@
         "__type__": "ollama._types.GenerateResponse",
         "__data__": {
           "model": "llama3.2:3b-instruct-fp16",
-          "created_at": "2025-08-01T23:14:04.509581Z",
+          "created_at": "2025-09-03T17:37:51.892443Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -76,7 +76,7 @@
         "__type__": "ollama._types.GenerateResponse",
         "__data__": {
           "model": "llama3.2:3b-instruct-fp16",
-          "created_at": "2025-08-01T23:14:04.56592Z",
+          "created_at": "2025-09-03T17:37:51.934364Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -94,7 +94,7 @@
         "__type__": "ollama._types.GenerateResponse",
         "__data__": {
           "model": "llama3.2:3b-instruct-fp16",
-          "created_at": "2025-08-01T23:14:04.616979Z",
+          "created_at": "2025-09-03T17:37:51.978382Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -112,7 +112,7 @@
         "__type__": "ollama._types.GenerateResponse",
         "__data__": {
           "model": "llama3.2:3b-instruct-fp16",
-          "created_at": "2025-08-01T23:14:04.671413Z",
+          "created_at": "2025-09-03T17:37:52.019332Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -130,7 +130,7 @@
         "__type__": "ollama._types.GenerateResponse",
         "__data__": {
           "model": "llama3.2:3b-instruct-fp16",
-          "created_at": "2025-08-01T23:14:04.725494Z",
+          "created_at": "2025-09-03T17:37:52.060708Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -148,7 +148,7 @@
         "__type__": "ollama._types.GenerateResponse",
         "__data__": {
           "model": "llama3.2:3b-instruct-fp16",
-          "created_at": "2025-08-01T23:14:04.779905Z",
+          "created_at": "2025-09-03T17:37:52.102717Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -166,7 +166,7 @@
         "__type__": "ollama._types.GenerateResponse",
         "__data__": {
           "model": "llama3.2:3b-instruct-fp16",
-          "created_at": "2025-08-01T23:14:04.829791Z",
+          "created_at": "2025-09-03T17:37:52.143996Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -184,7 +184,7 @@
         "__type__": "ollama._types.GenerateResponse",
         "__data__": {
           "model": "llama3.2:3b-instruct-fp16",
-          "created_at": "2025-08-01T23:14:04.880729Z",
+          "created_at": "2025-09-03T17:37:52.185479Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -202,7 +202,7 @@
         "__type__": "ollama._types.GenerateResponse",
         "__data__": {
           "model": "llama3.2:3b-instruct-fp16",
-          "created_at": "2025-08-01T23:14:04.93338Z",
+          "created_at": "2025-09-03T17:37:52.227562Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -220,7 +220,7 @@
         "__type__": "ollama._types.GenerateResponse",
         "__data__": {
           "model": "llama3.2:3b-instruct-fp16",
-          "created_at": "2025-08-01T23:14:04.981714Z",
+          "created_at": "2025-09-03T17:37:52.270178Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -238,7 +238,7 @@
         "__type__": "ollama._types.GenerateResponse",
         "__data__": {
           "model": "llama3.2:3b-instruct-fp16",
-          "created_at": "2025-08-01T23:14:05.036068Z",
+          "created_at": "2025-09-03T17:37:52.31151Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -256,7 +256,7 @@
         "__type__": "ollama._types.GenerateResponse",
         "__data__": {
           "model": "llama3.2:3b-instruct-fp16",
-          "created_at": "2025-08-01T23:14:05.088069Z",
+          "created_at": "2025-09-03T17:37:52.35278Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -274,7 +274,7 @@
         "__type__": "ollama._types.GenerateResponse",
         "__data__": {
           "model": "llama3.2:3b-instruct-fp16",
-          "created_at": "2025-08-01T23:14:05.144485Z",
+          "created_at": "2025-09-03T17:37:52.393954Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -292,7 +292,7 @@
         "__type__": "ollama._types.GenerateResponse",
         "__data__": {
           "model": "llama3.2:3b-instruct-fp16",
-          "created_at": "2025-08-01T23:14:05.203042Z",
+          "created_at": "2025-09-03T17:37:52.435238Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -310,7 +310,7 @@
         "__type__": "ollama._types.GenerateResponse",
         "__data__": {
           "model": "llama3.2:3b-instruct-fp16",
-          "created_at": "2025-08-01T23:14:05.257133Z",
+          "created_at": "2025-09-03T17:37:52.476197Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -328,7 +328,7 @@
         "__type__": "ollama._types.GenerateResponse",
         "__data__": {
           "model": "llama3.2:3b-instruct-fp16",
-          "created_at": "2025-08-01T23:14:05.311623Z",
+          "created_at": "2025-09-03T17:37:52.517914Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -346,15 +346,15 @@
         "__type__": "ollama._types.GenerateResponse",
         "__data__": {
           "model": "llama3.2:3b-instruct-fp16",
-          "created_at": "2025-08-01T23:14:05.370124Z",
+          "created_at": "2025-09-03T17:37:52.55904Z",
           "done": true,
           "done_reason": "stop",
-          "total_duration": 1532801458,
-          "load_duration": 213911041,
+          "total_duration": 971882292,
+          "load_duration": 116634209,
           "prompt_eval_count": 376,
-          "prompt_eval_duration": 350000000,
+          "prompt_eval_duration": 99382958,
           "eval_count": 19,
-          "eval_duration": 967000000,
+          "eval_duration": 755260750,
           "response": "",
           "thinking": null,
           "context": null
diff --git a/tests/integration/recordings/responses/561746e1c8de.json b/tests/integration/recordings/responses/561746e1c8de.json
index 120f40661..1bb8a3345 100644
--- a/tests/integration/recordings/responses/561746e1c8de.json
+++ b/tests/integration/recordings/responses/561746e1c8de.json
@@ -21,7 +21,7 @@
         "__type__": "ollama._types.GenerateResponse",
         "__data__": {
           "model": "llama3.2:3b-instruct-fp16",
-          "created_at": "2025-08-15T20:24:49.18651486Z",
+          "created_at": "2025-09-03T17:36:20.465701Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -39,7 +39,7 @@
         "__type__": "ollama._types.GenerateResponse",
         "__data__": {
           "model": "llama3.2:3b-instruct-fp16",
-          "created_at": "2025-08-15T20:24:49.370611348Z",
+          "created_at": "2025-09-03T17:36:20.507671Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -57,7 +57,7 @@
         "__type__": "ollama._types.GenerateResponse",
         "__data__": {
           "model": "llama3.2:3b-instruct-fp16",
-          "created_at": "2025-08-15T20:24:49.557000029Z",
+          "created_at": "2025-09-03T17:36:20.549443Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -75,7 +75,7 @@
         "__type__": "ollama._types.GenerateResponse",
         "__data__": {
           "model": "llama3.2:3b-instruct-fp16",
-          "created_at": "2025-08-15T20:24:49.746777116Z",
+          "created_at": "2025-09-03T17:36:20.590803Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -93,7 +93,7 @@
         "__type__": "ollama._types.GenerateResponse",
         "__data__": {
           "model": "llama3.2:3b-instruct-fp16",
-          "created_at": "2025-08-15T20:24:49.942233333Z",
+          "created_at": "2025-09-03T17:36:20.631683Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -111,7 +111,7 @@
         "__type__": "ollama._types.GenerateResponse",
         "__data__": {
           "model": "llama3.2:3b-instruct-fp16",
-          "created_at": "2025-08-15T20:24:50.126788846Z",
+          "created_at": "2025-09-03T17:36:20.672443Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -129,7 +129,7 @@
         "__type__": "ollama._types.GenerateResponse",
         "__data__": {
           "model": "llama3.2:3b-instruct-fp16",
-          "created_at": "2025-08-15T20:24:50.311346131Z",
+          "created_at": "2025-09-03T17:36:20.713329Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -147,7 +147,7 @@
         "__type__": "ollama._types.GenerateResponse",
         "__data__": {
           "model": "llama3.2:3b-instruct-fp16",
-          "created_at": "2025-08-15T20:24:50.501507173Z",
+          "created_at": "2025-09-03T17:36:20.754254Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -165,7 +165,7 @@
         "__type__": "ollama._types.GenerateResponse",
         "__data__": {
           "model": "llama3.2:3b-instruct-fp16",
-          "created_at": "2025-08-15T20:24:50.692296777Z",
+          "created_at": "2025-09-03T17:36:20.795119Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -183,7 +183,7 @@
         "__type__": "ollama._types.GenerateResponse",
         "__data__": {
           "model": "llama3.2:3b-instruct-fp16",
-          "created_at": "2025-08-15T20:24:50.878846539Z",
+          "created_at": "2025-09-03T17:36:20.836145Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -201,15 +201,15 @@
         "__type__": "ollama._types.GenerateResponse",
         "__data__": {
           "model": "llama3.2:3b-instruct-fp16",
-          "created_at": "2025-08-15T20:24:51.063200561Z",
+          "created_at": "2025-09-03T17:36:20.877784Z",
           "done": true,
           "done_reason": "stop",
-          "total_duration": 33982453650,
-          "load_duration": 2909001805,
+          "total_duration": 612057417,
+          "load_duration": 97443583,
           "prompt_eval_count": 341,
-          "prompt_eval_duration": 29194357307,
+          "prompt_eval_duration": 100914750,
           "eval_count": 11,
-          "eval_duration": 1878247732,
+          "eval_duration": 413024250,
           "response": "",
           "thinking": null,
           "context": null
diff --git a/tests/integration/recordings/responses/563b994bb7d1.json b/tests/integration/recordings/responses/563b994bb7d1.json
index 9f3354cfa..62e38dc5c 100644
--- a/tests/integration/recordings/responses/563b994bb7d1.json
+++ b/tests/integration/recordings/responses/563b994bb7d1.json
@@ -20,15 +20,15 @@
       "__type__": "ollama._types.GenerateResponse",
       "__data__": {
         "model": "llama3.2:3b-instruct-fp16",
-        "created_at": "2025-08-04T22:55:13.25248Z",
+        "created_at": "2025-09-03T17:36:19.594923Z",
         "done": true,
         "done_reason": "stop",
-        "total_duration": 1344654917,
-        "load_duration": 200585375,
+        "total_duration": 988472417,
+        "load_duration": 117976625,
         "prompt_eval_count": 326,
-        "prompt_eval_duration": 564000000,
+        "prompt_eval_duration": 451625542,
         "eval_count": 11,
-        "eval_duration": 578000000,
+        "eval_duration": 418313417,
         "response": "[get_weather(location=\"San Francisco, CA\")]",
         "thinking": null,
         "context": null
diff --git a/tests/integration/recordings/responses/5f5d16afadb4.json b/tests/integration/recordings/responses/5f5d16afadb4.json
index 8b4061494..f93d688c4 100644
--- a/tests/integration/recordings/responses/5f5d16afadb4.json
+++ b/tests/integration/recordings/responses/5f5d16afadb4.json
@@ -21,7 +21,7 @@
         "__type__": "ollama._types.GenerateResponse",
         "__data__": {
           "model": "llama3.2:3b-instruct-fp16",
-          "created_at": "2025-08-04T22:55:13.354888Z",
+          "created_at": "2025-09-03T17:36:19.808372Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -39,7 +39,7 @@
         "__type__": "ollama._types.GenerateResponse",
         "__data__": {
           "model": "llama3.2:3b-instruct-fp16",
-          "created_at": "2025-08-04T22:55:13.427569Z",
+          "created_at": "2025-09-03T17:36:19.84991Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -57,7 +57,7 @@
         "__type__": "ollama._types.GenerateResponse",
         "__data__": {
           "model": "llama3.2:3b-instruct-fp16",
-          "created_at": "2025-08-04T22:55:13.486244Z",
+          "created_at": "2025-09-03T17:36:19.892111Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -75,7 +75,7 @@
         "__type__": "ollama._types.GenerateResponse",
         "__data__": {
           "model": "llama3.2:3b-instruct-fp16",
-          "created_at": "2025-08-04T22:55:13.540455Z",
+          "created_at": "2025-09-03T17:36:19.933857Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -93,7 +93,7 @@
         "__type__": "ollama._types.GenerateResponse",
         "__data__": {
           "model": "llama3.2:3b-instruct-fp16",
-          "created_at": "2025-08-04T22:55:13.594439Z",
+          "created_at": "2025-09-03T17:36:19.975148Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -111,7 +111,7 @@
         "__type__": "ollama._types.GenerateResponse",
         "__data__": {
           "model": "llama3.2:3b-instruct-fp16",
-          "created_at": "2025-08-04T22:55:13.649837Z",
+          "created_at": "2025-09-03T17:36:20.016641Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -129,7 +129,7 @@
         "__type__": "ollama._types.GenerateResponse",
         "__data__": {
           "model": "llama3.2:3b-instruct-fp16",
-          "created_at": "2025-08-04T22:55:13.703358Z",
+          "created_at": "2025-09-03T17:36:20.058229Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -147,7 +147,7 @@
         "__type__": "ollama._types.GenerateResponse",
         "__data__": {
           "model": "llama3.2:3b-instruct-fp16",
-          "created_at": "2025-08-04T22:55:13.7553Z",
+          "created_at": "2025-09-03T17:36:20.100222Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -165,7 +165,7 @@
         "__type__": "ollama._types.GenerateResponse",
         "__data__": {
           "model": "llama3.2:3b-instruct-fp16",
-          "created_at": "2025-08-04T22:55:13.807251Z",
+          "created_at": "2025-09-03T17:36:20.143456Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -183,7 +183,7 @@
         "__type__": "ollama._types.GenerateResponse",
         "__data__": {
           "model": "llama3.2:3b-instruct-fp16",
-          "created_at": "2025-08-04T22:55:13.857952Z",
+          "created_at": "2025-09-03T17:36:20.184657Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -201,15 +201,15 @@
         "__type__": "ollama._types.GenerateResponse",
         "__data__": {
           "model": "llama3.2:3b-instruct-fp16",
-          "created_at": "2025-08-04T22:55:13.918522Z",
+          "created_at": "2025-09-03T17:36:20.226017Z",
           "done": true,
           "done_reason": "stop",
-          "total_duration": 647785042,
-          "load_duration": 26355584,
+          "total_duration": 598395375,
+          "load_duration": 129432167,
           "prompt_eval_count": 326,
-          "prompt_eval_duration": 55000000,
+          "prompt_eval_duration": 50057334,
           "eval_count": 11,
-          "eval_duration": 557000000,
+          "eval_duration": 418284791,
           "response": "",
           "thinking": null,
           "context": null
diff --git a/tests/integration/recordings/responses/62aa454ea5f9.json b/tests/integration/recordings/responses/62aa454ea5f9.json
index 1e74bbbbb..38b8ffd3b 100644
--- a/tests/integration/recordings/responses/62aa454ea5f9.json
+++ b/tests/integration/recordings/responses/62aa454ea5f9.json
@@ -20,390 +20,390 @@
         "data": [
           {
             "embedding": [
-              -0.08570448,
-              -0.095600754,
-              0.04398704,
-              -0.016002586,
-              0.02937856,
-              0.07229825,
-              -0.0108823925,
-              -0.023841137,
-              0.073795915,
-              -0.057006016,
-              -0.033788595,
-              0.051158767,
-              0.0050739567,
-              0.014298775,
-              -0.07881352,
-              -0.012878745,
-              -0.041616067,
-              0.06878784,
-              -0.10782497,
-              -0.040376976,
-              0.026258128,
-              -0.001976873,
-              -0.011027494,
-              -0.0019720662,
-              0.0040587694,
-              0.088816345,
-              0.014071338,
-              -0.018417818,
-              0.032645598,
-              -0.034702033,
-              0.076144606,
-              -0.014125607,
-              -0.02493309,
-              0.03755479,
-              -0.10195466,
-              0.05470191,
-              -0.022550134,
-              0.024206808,
-              0.011727895,
-              -0.008955921,
-              -0.050100796,
-              0.0026504535,
-              0.05590394,
-              0.009941025,
-              0.12794785,
-              -0.025010481,
-              0.02435104,
-              -0.024520388,
-              -0.0022285185,
-              -0.024684334,
-              -0.104818396,
-              -0.059973124,
-              -0.055206526,
-              0.015273937,
-              0.034947917,
-              0.05265324,
-              -0.00064814935,
-              0.06637618,
-              -0.031795718,
-              -0.0072964546,
-              -0.0050489027,
-              -0.042481057,
-              -0.04087265,
-              0.02008772,
-              0.03870467,
-              0.022511596,
-              -0.028690359,
-              0.053362943,
-              0.022450354,
-              0.019296993,
-              0.12269906,
-              0.023923857,
-              -0.03728355,
-              0.005889267,
-              0.052346867,
-              0.054002233,
-              0.08020592,
-              -0.010999822,
-              0.029368848,
-              -0.06721461,
-              -0.0002297595,
-              -0.050588466,
-              -0.0095366035,
-              0.046173498,
-              0.07868036,
-              0.014159739,
-              -0.03324329,
-              0.0018601778,
-              -0.066629566,
-              -0.020975014,
-              -0.017125193,
-              -0.043948952,
-              -0.059707303,
-              -0.073459946,
-              -0.039868142,
-              -0.030861603,
-              -0.019913651,
-              -0.10752571,
-              -0.02664692,
-              0.0689932,
-              -0.0049655125,
-              0.026640149,
-              0.018917048,
-              0.022118697,
-              0.06419974,
-              -0.053135265,
-              0.061616186,
-              0.014025234,
-              0.11771526,
-              -0.05178239,
-              -0.07634793,
-              0.030905172,
-              -0.03857174,
-              -0.025236985,
-              0.039299082,
-              -0.06143655,
-              0.008370295,
-              0.016200868,
-              0.03228489,
-              0.066803135,
-              -0.06503229,
-              0.014640972,
-              -0.038513865,
-              0.018730285,
-              -0.03011228,
-              -0.028523602,
-              -0.14709216,
-              -3.454768e-33,
-              -0.04858036,
-              -0.024983805,
-              0.071692064,
-              0.03562587,
-              0.07928956,
-              -0.07811275,
-              0.02311943,
-              -0.047469147,
-              0.08866776,
-              -0.0009905098,
-              -0.11322911,
-              0.09129462,
-              0.023959681,
-              0.11371455,
-              0.042178337,
-              -0.057762112,
-              -0.07452438,
-              -0.0021433395,
-              -0.051525325,
-              -0.05095998,
-              -0.0016218564,
-              0.030707737,
-              0.04509054,
-              -0.039753992,
-              -0.058684282,
-              -0.03064905,
-              0.0017237811,
-              0.009109253,
-              -0.013751708,
-              0.023424868,
-              0.0017645947,
-              0.046604484,
-              -0.07229431,
-              -0.027867278,
-              0.016140861,
-              0.04446358,
-              -0.004325922,
-              -0.06178838,
-              0.06979857,
-              0.031267133,
-              -0.013667371,
-              -0.0074066212,
-              0.031622607,
-              -0.0236915,
-              0.07152246,
-              0.023948636,
-              0.009776826,
-              0.0071919537,
-              -0.03232169,
-              -0.049612403,
-              -0.050260104,
-              0.02150285,
-              0.015312771,
-              -0.06745535,
-              0.06546945,
-              -0.025536334,
-              0.03208605,
-              0.020402592,
-              0.011268207,
-              0.00021468061,
-              -0.02349139,
-              -0.004954465,
-              -0.014090667,
-              0.0014277936,
-              0.059316903,
-              0.039940886,
-              -0.032523617,
-              -0.023729,
-              0.05446682,
-              0.06422314,
-              -0.034017127,
-              0.08744712,
-              -0.08048706,
-              -0.090565994,
-              -0.06538303,
-              -0.00010127551,
-              -0.021434912,
-              -0.068461135,
-              -0.029138267,
-              0.03413734,
-              -0.07802728,
-              -0.05389643,
-              -0.035581492,
-              0.044851534,
-              -0.040098358,
-              0.07973631,
-              0.026042009,
-              -0.081827834,
-              0.0017979769,
-              -0.02764713,
-              -0.04310408,
-              -0.04207307,
-              0.08336723,
-              -0.0494554,
-              -0.09028882,
-              2.6716478e-33,
-              -0.091917306,
-              0.026388643,
-              -0.07020338,
-              0.075572066,
-              0.039003927,
-              0.027942013,
-              -0.054444574,
-              -0.036634557,
-              -0.048207656,
-              0.07556485,
-              0.046478804,
-              0.025872312,
-              0.05219267,
-              -0.00020983674,
-              0.010589843,
-              -0.040604923,
-              -0.028473163,
-              -0.02054734,
-              0.08885036,
-              -0.067588866,
-              0.04945189,
-              0.13227695,
-              -0.06998917,
-              -0.040121764,
-              0.044024557,
-              0.03420703,
-              -0.08647228,
-              0.057482626,
-              -0.007488546,
-              0.04904739,
-              -0.014908641,
-              -0.018117905,
-              -0.020271562,
-              0.03883485,
-              0.022270914,
-              0.13485505,
-              0.06897264,
-              -0.0026128246,
-              -0.016425159,
-              0.0033841128,
-              0.017271666,
-              0.013608802,
-              0.044169303,
-              0.049203753,
-              -0.008237051,
-              -0.04662037,
-              -0.04390372,
-              0.041557033,
-              -0.0354663,
-              0.04278537,
-              0.031310573,
-              0.017929101,
-              -0.02624033,
-              -0.0545814,
-              -0.042623743,
-              -0.004118359,
-              0.029068246,
-              0.001052956,
-              0.09042771,
-              0.014050165,
-              -0.06879308,
-              -0.071003124,
-              0.020317351,
-              0.004283492,
-              -0.046952303,
-              0.016503377,
-              -0.028376328,
-              0.1043668,
-              0.0028236075,
-              -0.08338905,
-              0.03736013,
-              0.058911674,
-              0.037606813,
-              0.09578536,
-              -0.12376857,
-              -0.054084644,
-              -0.014489054,
-              0.0013207535,
-              -0.04531095,
-              -0.089944325,
-              0.0017439555,
-              -0.05519527,
-              0.00056134106,
-              0.0005587594,
-              0.07862233,
-              0.104556754,
-              0.0035775604,
-              0.008373316,
-              0.04291439,
-              0.010107487,
-              0.025184723,
-              0.057374246,
-              -0.023012979,
-              0.054407477,
-              -0.049804952,
-              -1.32878e-08,
-              -0.053895604,
-              0.08075507,
-              0.03399497,
-              0.024384415,
-              0.090608515,
-              -0.07165007,
-              0.07552621,
-              0.017241832,
-              -0.061231323,
-              -0.03297735,
-              0.07829615,
-              0.0396499,
-              -0.03669638,
-              0.026653878,
-              0.10006404,
-              -0.014379535,
-              0.02066834,
-              -0.039198436,
-              0.008517119,
-              -0.0012403574,
-              0.06739532,
-              0.014030484,
-              -0.054005865,
-              -0.016788486,
-              0.076489784,
-              -0.035523314,
-              -0.050076444,
-              0.083784595,
-              -0.00999262,
-              0.081417,
-              0.019268963,
-              0.049931277,
-              0.0022461978,
-              -0.07805938,
-              0.01945713,
-              0.11157225,
-              -0.012694483,
-              -0.064655006,
-              -0.09344128,
-              -0.04999159,
-              -0.042193726,
-              0.059935458,
-              0.034836538,
-              -0.014958905,
-              0.014489057,
-              -0.022633748,
-              0.06917315,
-              -0.08858699,
-              0.02150387,
-              0.013796807,
-              -0.007545836,
-              0.027875464,
-              0.015522231,
-              0.0052421056,
-              0.01061417,
-              -0.022906043,
-              -0.025388915,
-              -0.04141604,
-              -0.08376164,
-              0.09259756,
-              0.051795125,
-              0.09296195,
-              0.0111989025,
-              -0.01673378
+              -0.08566708,
+              -0.09559047,
+              0.044014607,
+              -0.015974598,
+              0.029406257,
+              0.07229597,
+              -0.010901963,
+              -0.023829829,
+              0.07381301,
+              -0.05698464,
+              -0.033780586,
+              0.051200844,
+              0.0050912783,
+              0.014317088,
+              -0.07878143,
+              -0.012908666,
+              -0.041628323,
+              0.06881713,
+              -0.10783476,
+              -0.04042705,
+              0.026262026,
+              -0.0019893218,
+              -0.011008084,
+              -0.0019646112,
+              0.004033132,
+              0.08881656,
+              0.014049165,
+              -0.018416086,
+              0.032621212,
+              -0.034692146,
+              0.07614942,
+              -0.014122101,
+              -0.024901746,
+              0.03755059,
+              -0.10197354,
+              0.054705318,
+              -0.022539826,
+              0.024209768,
+              0.011698194,
+              -0.008956377,
+              -0.050146304,
+              0.0026327297,
+              0.055942897,
+              0.009974366,
+              0.12796965,
+              -0.025006283,
+              0.024338534,
+              -0.024487961,
+              -0.0022703854,
+              -0.024687177,
+              -0.10482094,
+              -0.05994297,
+              -0.055200897,
+              0.0152664175,
+              0.03496896,
+              0.052624088,
+              -0.0006445885,
+              0.06637695,
+              -0.031790398,
+              -0.007308742,
+              -0.0050764186,
+              -0.042508755,
+              -0.04089097,
+              0.020062948,
+              0.038683955,
+              0.022463562,
+              -0.02866933,
+              0.053370677,
+              0.022435635,
+              0.01934692,
+              0.12264713,
+              0.023911418,
+              -0.037264284,
+              0.0059156846,
+              0.05235448,
+              0.054004095,
+              0.08022169,
+              -0.010992806,
+              0.029295033,
+              -0.0672064,
+              -0.00021147476,
+              -0.050584126,
+              -0.0095251575,
+              0.04616498,
+              0.078677796,
+              0.01416309,
+              -0.033226117,
+              0.0018380182,
+              -0.06667651,
+              -0.020977372,
+              -0.017116925,
+              -0.04396714,
+              -0.05969979,
+              -0.07344942,
+              -0.03985366,
+              -0.030863814,
+              -0.019918729,
+              -0.1075161,
+              -0.026654154,
+              0.0689854,
+              -0.0049292273,
+              0.026645623,
+              0.018879393,
+              0.022113768,
+              0.064208575,
+              -0.053153764,
+              0.06160797,
+              0.014026719,
+              0.11772326,
+              -0.051769163,
+              -0.07634968,
+              0.03090975,
+              -0.038558383,
+              -0.025260162,
+              0.039262023,
+              -0.061449137,
+              0.008389126,
+              0.016175874,
+              0.032293033,
+              0.06679397,
+              -0.06503257,
+              0.014676881,
+              -0.038542666,
+              0.018718671,
+              -0.030111106,
+              -0.028481327,
+              -0.14707623,
+              -3.455443e-33,
+              -0.048577547,
+              -0.024983348,
+              0.071679614,
+              0.035652317,
+              0.07931413,
+              -0.07811974,
+              0.023085583,
+              -0.047467884,
+              0.08872273,
+              -0.0010074769,
+              -0.11320135,
+              0.091322996,
+              0.023978539,
+              0.11368158,
+              0.042203873,
+              -0.05773289,
+              -0.074543044,
+              -0.0021036167,
+              -0.051522236,
+              -0.050925426,
+              -0.0016557347,
+              0.030671587,
+              0.045119714,
+              -0.03974729,
+              -0.05871358,
+              -0.030611658,
+              0.0017253247,
+              0.009114429,
+              -0.013763352,
+              0.023424039,
+              0.0017495834,
+              0.046633217,
+              -0.07230643,
+              -0.027882291,
+              0.016182518,
+              0.044456217,
+              -0.004326421,
+              -0.061798126,
+              0.0697968,
+              0.031249145,
+              -0.013697079,
+              -0.007417679,
+              0.031665757,
+              -0.02367961,
+              0.07153089,
+              0.023938214,
+              0.009729952,
+              0.0071919435,
+              -0.03235391,
+              -0.04955071,
+              -0.050248373,
+              0.02151118,
+              0.015327139,
+              -0.0674203,
+              0.06544387,
+              -0.025547959,
+              0.03207046,
+              0.02038825,
+              0.0112230005,
+              0.00019493286,
+              -0.023462659,
+              -0.004949742,
+              -0.014066955,
+              0.0014178518,
+              0.059315395,
+              0.039931085,
+              -0.032498423,
+              -0.023698896,
+              0.05445033,
+              0.064231694,
+              -0.034013335,
+              0.08745776,
+              -0.080473825,
+              -0.090545714,
+              -0.065398656,
+              -8.2386265e-05,
+              -0.021441188,
+              -0.0684535,
+              -0.029121745,
+              0.034134887,
+              -0.07799698,
+              -0.05388711,
+              -0.035591345,
+              0.044826802,
+              -0.040090464,
+              0.07972004,
+              0.026058797,
+              -0.08184859,
+              0.0018106091,
+              -0.027676936,
+              -0.04312832,
+              -0.042090744,
+              0.08336437,
+              -0.049453646,
+              -0.0902778,
+              2.6716498e-33,
+              -0.091911495,
+              0.02641473,
+              -0.07022486,
+              0.075562105,
+              0.03900905,
+              0.027913846,
+              -0.05444872,
+              -0.036666486,
+              -0.048225258,
+              0.07551892,
+              0.046452336,
+              0.025874302,
+              0.052248206,
+              -0.00018527219,
+              0.010575236,
+              -0.040591337,
+              -0.028484622,
+              -0.020559357,
+              0.08882296,
+              -0.06755767,
+              0.04941752,
+              0.13231009,
+              -0.06998129,
+              -0.040112328,
+              0.044030365,
+              0.034218542,
+              -0.08650528,
+              0.05746921,
+              -0.0075130556,
+              0.049070083,
+              -0.0148686,
+              -0.018103259,
+              -0.020280316,
+              0.038828347,
+              0.022253176,
+              0.13486238,
+              0.06899369,
+              -0.002589861,
+              -0.016430879,
+              0.0033818923,
+              0.017275693,
+              0.013614936,
+              0.044220798,
+              0.049155377,
+              -0.008259856,
+              -0.046575654,
+              -0.043921605,
+              0.04156687,
+              -0.035468902,
+              0.042837795,
+              0.03131579,
+              0.017961076,
+              -0.026213305,
+              -0.05458616,
+              -0.04259084,
+              -0.004110002,
+              0.029035388,
+              0.0010451805,
+              0.09044077,
+              0.014110149,
+              -0.068820216,
+              -0.07098938,
+              0.020328037,
+              0.00433692,
+              -0.046977337,
+              0.016492791,
+              -0.028396707,
+              0.104340956,
+              0.002814702,
+              -0.08339559,
+              0.037326302,
+              0.058929898,
+              0.0376423,
+              0.09580634,
+              -0.12376848,
+              -0.054060236,
+              -0.014485116,
+              0.0013106487,
+              -0.04537336,
+              -0.0899294,
+              0.001730278,
+              -0.05520831,
+              0.000568523,
+              0.00053380145,
+              0.07856981,
+              0.104590714,
+              0.00355283,
+              0.008365939,
+              0.04291482,
+              0.010064388,
+              0.025177509,
+              0.05732803,
+              -0.023061136,
+              0.054399785,
+              -0.049828697,
+              -1.3290186e-08,
+              -0.0539168,
+              0.08074109,
+              0.03397028,
+              0.024365881,
+              0.0906225,
+              -0.07162824,
+              0.07550329,
+              0.017278913,
+              -0.061226364,
+              -0.03298407,
+              0.07829606,
+              0.03967995,
+              -0.036696997,
+              0.02665964,
+              0.1000655,
+              -0.014426734,
+              0.020708792,
+              -0.039230846,
+              0.0085029,
+              -0.0012509917,
+              0.06740856,
+              0.013992665,
+              -0.054007422,
+              -0.016785627,
+              0.07651403,
+              -0.035508703,
+              -0.050085396,
+              0.08382383,
+              -0.009957674,
+              0.08140875,
+              0.019287178,
+              0.049911316,
+              0.0022236605,
+              -0.07807412,
+              0.019454133,
+              0.111560374,
+              -0.01269702,
+              -0.06466137,
+              -0.09346588,
+              -0.050038446,
+              -0.042178612,
+              0.0599713,
+              0.034831088,
+              -0.014957726,
+              0.014484159,
+              -0.022619838,
+              0.06916277,
+              -0.088544875,
+              0.021478733,
+              0.01378541,
+              -0.0075770007,
+              0.027888266,
+              0.015526889,
+              0.0052174823,
+              0.010616002,
+              -0.022908956,
+              -0.02535865,
+              -0.04139556,
+              -0.08375561,
+              0.092626974,
+              0.051755503,
+              0.09296614,
+              0.011223383,
+              -0.016759252
             ],
             "index": 0,
             "object": "embedding"
diff --git a/tests/integration/recordings/responses/6906a6e71988.json b/tests/integration/recordings/responses/6906a6e71988.json
index 9d4125823..6574cab53 100644
--- a/tests/integration/recordings/responses/6906a6e71988.json
+++ b/tests/integration/recordings/responses/6906a6e71988.json
@@ -20,15 +20,15 @@
       "__type__": "ollama._types.GenerateResponse",
       "__data__": {
         "model": "llama-guard3:1b",
-        "created_at": "2025-08-01T23:14:18.886381Z",
+        "created_at": "2025-09-03T17:38:00.98692Z",
         "done": true,
         "done_reason": "stop",
-        "total_duration": 488566500,
-        "load_duration": 113477291,
+        "total_duration": 332473583,
+        "load_duration": 90611333,
         "prompt_eval_count": 317,
-        "prompt_eval_duration": 361000000,
+        "prompt_eval_duration": 229691000,
         "eval_count": 2,
-        "eval_duration": 12000000,
+        "eval_duration": 11571291,
         "response": "safe",
         "thinking": null,
         "context": null
diff --git a/tests/integration/recordings/responses/6cc063bbd7d3.json b/tests/integration/recordings/responses/6cc063bbd7d3.json
index 2e7841626..ab6e12602 100644
--- a/tests/integration/recordings/responses/6cc063bbd7d3.json
+++ b/tests/integration/recordings/responses/6cc063bbd7d3.json
@@ -21,7 +21,7 @@
         "__type__": "ollama._types.GenerateResponse",
         "__data__": {
           "model": "llama3.2:3b-instruct-fp16",
-          "created_at": "2025-08-04T22:55:55.9885Z",
+          "created_at": "2025-09-03T17:42:17.402486Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -39,7 +39,7 @@
         "__type__": "ollama._types.GenerateResponse",
         "__data__": {
           "model": "llama3.2:3b-instruct-fp16",
-          "created_at": "2025-08-04T22:55:56.054143Z",
+          "created_at": "2025-09-03T17:42:17.444334Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -57,7 +57,7 @@
         "__type__": "ollama._types.GenerateResponse",
         "__data__": {
           "model": "llama3.2:3b-instruct-fp16",
-          "created_at": "2025-08-04T22:55:56.117658Z",
+          "created_at": "2025-09-03T17:42:17.484625Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -75,7 +75,7 @@
         "__type__": "ollama._types.GenerateResponse",
         "__data__": {
           "model": "llama3.2:3b-instruct-fp16",
-          "created_at": "2025-08-04T22:55:56.179422Z",
+          "created_at": "2025-09-03T17:42:17.525063Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -93,7 +93,7 @@
         "__type__": "ollama._types.GenerateResponse",
         "__data__": {
           "model": "llama3.2:3b-instruct-fp16",
-          "created_at": "2025-08-04T22:55:56.240328Z",
+          "created_at": "2025-09-03T17:42:17.565015Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -111,7 +111,7 @@
         "__type__": "ollama._types.GenerateResponse",
         "__data__": {
           "model": "llama3.2:3b-instruct-fp16",
-          "created_at": "2025-08-04T22:55:56.295992Z",
+          "created_at": "2025-09-03T17:42:17.60499Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -129,7 +129,7 @@
         "__type__": "ollama._types.GenerateResponse",
         "__data__": {
           "model": "llama3.2:3b-instruct-fp16",
-          "created_at": "2025-08-04T22:55:56.355683Z",
+          "created_at": "2025-09-03T17:42:17.64509Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -147,7 +147,7 @@
         "__type__": "ollama._types.GenerateResponse",
         "__data__": {
           "model": "llama3.2:3b-instruct-fp16",
-          "created_at": "2025-08-04T22:55:56.412176Z",
+          "created_at": "2025-09-03T17:42:17.685566Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -165,7 +165,7 @@
         "__type__": "ollama._types.GenerateResponse",
         "__data__": {
           "model": "llama3.2:3b-instruct-fp16",
-          "created_at": "2025-08-04T22:55:56.466952Z",
+          "created_at": "2025-09-03T17:42:17.725855Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -183,7 +183,7 @@
         "__type__": "ollama._types.GenerateResponse",
         "__data__": {
           "model": "llama3.2:3b-instruct-fp16",
-          "created_at": "2025-08-04T22:55:56.517222Z",
+          "created_at": "2025-09-03T17:42:17.766056Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -201,7 +201,7 @@
         "__type__": "ollama._types.GenerateResponse",
         "__data__": {
           "model": "llama3.2:3b-instruct-fp16",
-          "created_at": "2025-08-04T22:55:56.570491Z",
+          "created_at": "2025-09-03T17:42:17.806415Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -219,7 +219,7 @@
         "__type__": "ollama._types.GenerateResponse",
         "__data__": {
           "model": "llama3.2:3b-instruct-fp16",
-          "created_at": "2025-08-04T22:55:56.623189Z",
+          "created_at": "2025-09-03T17:42:17.847273Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -237,7 +237,7 @@
         "__type__": "ollama._types.GenerateResponse",
         "__data__": {
           "model": "llama3.2:3b-instruct-fp16",
-          "created_at": "2025-08-04T22:55:56.679221Z",
+          "created_at": "2025-09-03T17:42:17.888576Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -255,7 +255,7 @@
         "__type__": "ollama._types.GenerateResponse",
         "__data__": {
           "model": "llama3.2:3b-instruct-fp16",
-          "created_at": "2025-08-04T22:55:56.731373Z",
+          "created_at": "2025-09-03T17:42:17.928952Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -273,7 +273,7 @@
         "__type__": "ollama._types.GenerateResponse",
         "__data__": {
           "model": "llama3.2:3b-instruct-fp16",
-          "created_at": "2025-08-04T22:55:56.781364Z",
+          "created_at": "2025-09-03T17:42:17.969744Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -291,7 +291,7 @@
         "__type__": "ollama._types.GenerateResponse",
         "__data__": {
           "model": "llama3.2:3b-instruct-fp16",
-          "created_at": "2025-08-04T22:55:56.831951Z",
+          "created_at": "2025-09-03T17:42:18.010869Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -309,7 +309,7 @@
         "__type__": "ollama._types.GenerateResponse",
         "__data__": {
           "model": "llama3.2:3b-instruct-fp16",
-          "created_at": "2025-08-04T22:55:56.888381Z",
+          "created_at": "2025-09-03T17:42:18.051109Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -327,7 +327,7 @@
         "__type__": "ollama._types.GenerateResponse",
         "__data__": {
           "model": "llama3.2:3b-instruct-fp16",
-          "created_at": "2025-08-04T22:55:56.943539Z",
+          "created_at": "2025-09-03T17:42:18.093266Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -345,7 +345,7 @@
         "__type__": "ollama._types.GenerateResponse",
         "__data__": {
           "model": "llama3.2:3b-instruct-fp16",
-          "created_at": "2025-08-04T22:55:56.997422Z",
+          "created_at": "2025-09-03T17:42:18.135749Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -363,15 +363,15 @@
         "__type__": "ollama._types.GenerateResponse",
         "__data__": {
           "model": "llama3.2:3b-instruct-fp16",
-          "created_at": "2025-08-04T22:55:57.056259Z",
+          "created_at": "2025-09-03T17:42:18.176649Z",
           "done": true,
           "done_reason": "stop",
-          "total_duration": 1289815458,
-          "load_duration": 119745583,
+          "total_duration": 907420000,
+          "load_duration": 66756750,
           "prompt_eval_count": 26,
-          "prompt_eval_duration": 98000000,
+          "prompt_eval_duration": 62900875,
           "eval_count": 20,
-          "eval_duration": 1071000000,
+          "eval_duration": 777306958,
           "response": "",
           "thinking": null,
           "context": null
diff --git a/tests/integration/recordings/responses/6d35c91287e2.json b/tests/integration/recordings/responses/6d35c91287e2.json
index 699493f45..a7af894e8 100644
--- a/tests/integration/recordings/responses/6d35c91287e2.json
+++ b/tests/integration/recordings/responses/6d35c91287e2.json
@@ -22,7 +22,7 @@
         "__type__": "ollama._types.GenerateResponse",
         "__data__": {
           "model": "llama3.2:3b-instruct-fp16",
-          "created_at": "2025-08-01T23:14:22.362667Z",
+          "created_at": "2025-09-03T17:38:03.549266Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -40,7 +40,7 @@
         "__type__": "ollama._types.GenerateResponse",
         "__data__": {
           "model": "llama3.2:3b-instruct-fp16",
-          "created_at": "2025-08-01T23:14:22.427435Z",
+          "created_at": "2025-09-03T17:38:03.592203Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -58,7 +58,7 @@
         "__type__": "ollama._types.GenerateResponse",
         "__data__": {
           "model": "llama3.2:3b-instruct-fp16",
-          "created_at": "2025-08-01T23:14:22.484198Z",
+          "created_at": "2025-09-03T17:38:03.63417Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -76,7 +76,7 @@
         "__type__": "ollama._types.GenerateResponse",
         "__data__": {
           "model": "llama3.2:3b-instruct-fp16",
-          "created_at": "2025-08-01T23:14:22.537031Z",
+          "created_at": "2025-09-03T17:38:03.677268Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -94,7 +94,7 @@
         "__type__": "ollama._types.GenerateResponse",
         "__data__": {
           "model": "llama3.2:3b-instruct-fp16",
-          "created_at": "2025-08-01T23:14:22.591198Z",
+          "created_at": "2025-09-03T17:38:03.719768Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -112,7 +112,7 @@
         "__type__": "ollama._types.GenerateResponse",
         "__data__": {
           "model": "llama3.2:3b-instruct-fp16",
-          "created_at": "2025-08-01T23:14:22.643336Z",
+          "created_at": "2025-09-03T17:38:03.762204Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -130,7 +130,7 @@
         "__type__": "ollama._types.GenerateResponse",
         "__data__": {
           "model": "llama3.2:3b-instruct-fp16",
-          "created_at": "2025-08-01T23:14:22.698589Z",
+          "created_at": "2025-09-03T17:38:03.80404Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -148,7 +148,7 @@
         "__type__": "ollama._types.GenerateResponse",
         "__data__": {
           "model": "llama3.2:3b-instruct-fp16",
-          "created_at": "2025-08-01T23:14:22.752904Z",
+          "created_at": "2025-09-03T17:38:03.845678Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -166,7 +166,7 @@
         "__type__": "ollama._types.GenerateResponse",
         "__data__": {
           "model": "llama3.2:3b-instruct-fp16",
-          "created_at": "2025-08-01T23:14:22.804Z",
+          "created_at": "2025-09-03T17:38:03.887086Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -184,7 +184,7 @@
         "__type__": "ollama._types.GenerateResponse",
         "__data__": {
           "model": "llama3.2:3b-instruct-fp16",
-          "created_at": "2025-08-01T23:14:22.855633Z",
+          "created_at": "2025-09-03T17:38:03.928422Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -202,7 +202,7 @@
         "__type__": "ollama._types.GenerateResponse",
         "__data__": {
           "model": "llama3.2:3b-instruct-fp16",
-          "created_at": "2025-08-01T23:14:22.906918Z",
+          "created_at": "2025-09-03T17:38:03.969641Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -220,7 +220,7 @@
         "__type__": "ollama._types.GenerateResponse",
         "__data__": {
           "model": "llama3.2:3b-instruct-fp16",
-          "created_at": "2025-08-01T23:14:22.958729Z",
+          "created_at": "2025-09-03T17:38:04.011212Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -238,15 +238,15 @@
         "__type__": "ollama._types.GenerateResponse",
         "__data__": {
           "model": "llama3.2:3b-instruct-fp16",
-          "created_at": "2025-08-01T23:14:23.011279Z",
+          "created_at": "2025-09-03T17:38:04.052626Z",
           "done": true,
           "done_reason": "stop",
-          "total_duration": 793500292,
-          "load_duration": 55339750,
+          "total_duration": 731936583,
+          "load_duration": 147334791,
           "prompt_eval_count": 417,
-          "prompt_eval_duration": 83000000,
+          "prompt_eval_duration": 79443792,
           "eval_count": 13,
-          "eval_duration": 653000000,
+          "eval_duration": 504352750,
           "response": "",
           "thinking": null,
           "context": null
diff --git a/tests/integration/recordings/responses/6f96090aa955.json b/tests/integration/recordings/responses/6f96090aa955.json
index d5131d389..d0ac20442 100644
--- a/tests/integration/recordings/responses/6f96090aa955.json
+++ b/tests/integration/recordings/responses/6f96090aa955.json
@@ -1,7 +1,7 @@
 {
   "request": {
     "method": "POST",
-    "url": "http://localhost:11434/v1/v1/chat/completions",
+    "url": "http://0.0.0.0:11434/v1/v1/chat/completions",
     "headers": {},
     "body": {
       "model": "llama3.2:3b-instruct-fp16",
@@ -21,7 +21,7 @@
       {
         "__type__": "openai.types.chat.chat_completion_chunk.ChatCompletionChunk",
         "__data__": {
-          "id": "chatcmpl-333",
+          "id": "chatcmpl-698",
           "choices": [
             {
               "delta": {
@@ -36,7 +36,7 @@
               "logprobs": null
             }
           ],
-          "created": 1754081849,
+          "created": 1756921359,
           "model": "llama3.2:3b-instruct-fp16",
           "object": "chat.completion.chunk",
           "service_tier": null,
@@ -47,7 +47,7 @@
       {
         "__type__": "openai.types.chat.chat_completion_chunk.ChatCompletionChunk",
         "__data__": {
-          "id": "chatcmpl-333",
+          "id": "chatcmpl-698",
           "choices": [
             {
               "delta": {
@@ -62,7 +62,7 @@
               "logprobs": null
             }
           ],
-          "created": 1754081849,
+          "created": 1756921359,
           "model": "llama3.2:3b-instruct-fp16",
           "object": "chat.completion.chunk",
           "service_tier": null,
@@ -73,11 +73,11 @@
       {
         "__type__": "openai.types.chat.chat_completion_chunk.ChatCompletionChunk",
         "__data__": {
-          "id": "chatcmpl-333",
+          "id": "chatcmpl-698",
           "choices": [
             {
               "delta": {
-                "content": " Welcome",
+                "content": " It",
                 "function_call": null,
                 "refusal": null,
                 "role": "assistant",
@@ -88,7 +88,7 @@
               "logprobs": null
             }
           ],
-          "created": 1754081849,
+          "created": 1756921359,
           "model": "llama3.2:3b-instruct-fp16",
           "object": "chat.completion.chunk",
           "service_tier": null,
@@ -99,7 +99,59 @@
       {
         "__type__": "openai.types.chat.chat_completion_chunk.ChatCompletionChunk",
         "__data__": {
-          "id": "chatcmpl-333",
+          "id": "chatcmpl-698",
+          "choices": [
+            {
+              "delta": {
+                "content": "'s",
+                "function_call": null,
+                "refusal": null,
+                "role": "assistant",
+                "tool_calls": null
+              },
+              "finish_reason": null,
+              "index": 0,
+              "logprobs": null
+            }
+          ],
+          "created": 1756921359,
+          "model": "llama3.2:3b-instruct-fp16",
+          "object": "chat.completion.chunk",
+          "service_tier": null,
+          "system_fingerprint": "fp_ollama",
+          "usage": null
+        }
+      },
+      {
+        "__type__": "openai.types.chat.chat_completion_chunk.ChatCompletionChunk",
+        "__data__": {
+          "id": "chatcmpl-698",
+          "choices": [
+            {
+              "delta": {
+                "content": " nice",
+                "function_call": null,
+                "refusal": null,
+                "role": "assistant",
+                "tool_calls": null
+              },
+              "finish_reason": null,
+              "index": 0,
+              "logprobs": null
+            }
+          ],
+          "created": 1756921359,
+          "model": "llama3.2:3b-instruct-fp16",
+          "object": "chat.completion.chunk",
+          "service_tier": null,
+          "system_fingerprint": "fp_ollama",
+          "usage": null
+        }
+      },
+      {
+        "__type__": "openai.types.chat.chat_completion_chunk.ChatCompletionChunk",
+        "__data__": {
+          "id": "chatcmpl-698",
           "choices": [
             {
               "delta": {
@@ -114,7 +166,7 @@
               "logprobs": null
             }
           ],
-          "created": 1754081849,
+          "created": 1756921359,
           "model": "llama3.2:3b-instruct-fp16",
           "object": "chat.completion.chunk",
           "service_tier": null,
@@ -125,11 +177,11 @@
       {
         "__type__": "openai.types.chat.chat_completion_chunk.ChatCompletionChunk",
         "__data__": {
-          "id": "chatcmpl-333",
+          "id": "chatcmpl-698",
           "choices": [
             {
               "delta": {
-                "content": " our",
+                "content": " meet",
                 "function_call": null,
                 "refusal": null,
                 "role": "assistant",
@@ -140,7 +192,7 @@
               "logprobs": null
             }
           ],
-          "created": 1754081849,
+          "created": 1756921359,
           "model": "llama3.2:3b-instruct-fp16",
           "object": "chat.completion.chunk",
           "service_tier": null,
@@ -151,11 +203,11 @@
       {
         "__type__": "openai.types.chat.chat_completion_chunk.ChatCompletionChunk",
         "__data__": {
-          "id": "chatcmpl-333",
+          "id": "chatcmpl-698",
           "choices": [
             {
               "delta": {
-                "content": " conversation",
+                "content": " you",
                 "function_call": null,
                 "refusal": null,
                 "role": "assistant",
@@ -166,7 +218,7 @@
               "logprobs": null
             }
           ],
-          "created": 1754081849,
+          "created": 1756921359,
           "model": "llama3.2:3b-instruct-fp16",
           "object": "chat.completion.chunk",
           "service_tier": null,
@@ -177,7 +229,7 @@
       {
         "__type__": "openai.types.chat.chat_completion_chunk.ChatCompletionChunk",
         "__data__": {
-          "id": "chatcmpl-333",
+          "id": "chatcmpl-698",
           "choices": [
             {
               "delta": {
@@ -192,7 +244,7 @@
               "logprobs": null
             }
           ],
-          "created": 1754081849,
+          "created": 1756921359,
           "model": "llama3.2:3b-instruct-fp16",
           "object": "chat.completion.chunk",
           "service_tier": null,
@@ -203,7 +255,7 @@
       {
         "__type__": "openai.types.chat.chat_completion_chunk.ChatCompletionChunk",
         "__data__": {
-          "id": "chatcmpl-333",
+          "id": "chatcmpl-698",
           "choices": [
             {
               "delta": {
@@ -218,7 +270,7 @@
               "logprobs": null
             }
           ],
-          "created": 1754081850,
+          "created": 1756921359,
           "model": "llama3.2:3b-instruct-fp16",
           "object": "chat.completion.chunk",
           "service_tier": null,
@@ -229,7 +281,7 @@
       {
         "__type__": "openai.types.chat.chat_completion_chunk.ChatCompletionChunk",
         "__data__": {
-          "id": "chatcmpl-333",
+          "id": "chatcmpl-698",
           "choices": [
             {
               "delta": {
@@ -244,7 +296,7 @@
               "logprobs": null
             }
           ],
-          "created": 1754081850,
+          "created": 1756921359,
           "model": "llama3.2:3b-instruct-fp16",
           "object": "chat.completion.chunk",
           "service_tier": null,
@@ -255,7 +307,7 @@
       {
         "__type__": "openai.types.chat.chat_completion_chunk.ChatCompletionChunk",
         "__data__": {
-          "id": "chatcmpl-333",
+          "id": "chatcmpl-698",
           "choices": [
             {
               "delta": {
@@ -270,7 +322,7 @@
               "logprobs": null
             }
           ],
-          "created": 1754081850,
+          "created": 1756921359,
           "model": "llama3.2:3b-instruct-fp16",
           "object": "chat.completion.chunk",
           "service_tier": null,
@@ -281,7 +333,7 @@
       {
         "__type__": "openai.types.chat.chat_completion_chunk.ChatCompletionChunk",
         "__data__": {
-          "id": "chatcmpl-333",
+          "id": "chatcmpl-698",
           "choices": [
             {
               "delta": {
@@ -296,7 +348,7 @@
               "logprobs": null
             }
           ],
-          "created": 1754081850,
+          "created": 1756921359,
           "model": "llama3.2:3b-instruct-fp16",
           "object": "chat.completion.chunk",
           "service_tier": null,
@@ -307,7 +359,7 @@
       {
         "__type__": "openai.types.chat.chat_completion_chunk.ChatCompletionChunk",
         "__data__": {
-          "id": "chatcmpl-333",
+          "id": "chatcmpl-698",
           "choices": [
             {
               "delta": {
@@ -322,7 +374,7 @@
               "logprobs": null
             }
           ],
-          "created": 1754081850,
+          "created": 1756921359,
           "model": "llama3.2:3b-instruct-fp16",
           "object": "chat.completion.chunk",
           "service_tier": null,
@@ -333,7 +385,7 @@
       {
         "__type__": "openai.types.chat.chat_completion_chunk.ChatCompletionChunk",
         "__data__": {
-          "id": "chatcmpl-333",
+          "id": "chatcmpl-698",
           "choices": [
             {
               "delta": {
@@ -348,7 +400,7 @@
               "logprobs": null
             }
           ],
-          "created": 1754081850,
+          "created": 1756921359,
           "model": "llama3.2:3b-instruct-fp16",
           "object": "chat.completion.chunk",
           "service_tier": null,
@@ -359,7 +411,7 @@
       {
         "__type__": "openai.types.chat.chat_completion_chunk.ChatCompletionChunk",
         "__data__": {
-          "id": "chatcmpl-333",
+          "id": "chatcmpl-698",
           "choices": [
             {
               "delta": {
@@ -374,7 +426,7 @@
               "logprobs": null
             }
           ],
-          "created": 1754081850,
+          "created": 1756921359,
           "model": "llama3.2:3b-instruct-fp16",
           "object": "chat.completion.chunk",
           "service_tier": null,
@@ -385,7 +437,7 @@
       {
         "__type__": "openai.types.chat.chat_completion_chunk.ChatCompletionChunk",
         "__data__": {
-          "id": "chatcmpl-333",
+          "id": "chatcmpl-698",
           "choices": [
             {
               "delta": {
@@ -400,7 +452,7 @@
               "logprobs": null
             }
           ],
-          "created": 1754081850,
+          "created": 1756921359,
           "model": "llama3.2:3b-instruct-fp16",
           "object": "chat.completion.chunk",
           "service_tier": null,
@@ -411,33 +463,7 @@
       {
         "__type__": "openai.types.chat.chat_completion_chunk.ChatCompletionChunk",
         "__data__": {
-          "id": "chatcmpl-333",
-          "choices": [
-            {
-              "delta": {
-                "content": ",",
-                "function_call": null,
-                "refusal": null,
-                "role": "assistant",
-                "tool_calls": null
-              },
-              "finish_reason": null,
-              "index": 0,
-              "logprobs": null
-            }
-          ],
-          "created": 1754081850,
-          "model": "llama3.2:3b-instruct-fp16",
-          "object": "chat.completion.chunk",
-          "service_tier": null,
-          "system_fingerprint": "fp_ollama",
-          "usage": null
-        }
-      },
-      {
-        "__type__": "openai.types.chat.chat_completion_chunk.ChatCompletionChunk",
-        "__data__": {
-          "id": "chatcmpl-333",
+          "id": "chatcmpl-698",
           "choices": [
             {
               "delta": {
@@ -452,7 +478,7 @@
               "logprobs": null
             }
           ],
-          "created": 1754081850,
+          "created": 1756921359,
           "model": "llama3.2:3b-instruct-fp16",
           "object": "chat.completion.chunk",
           "service_tier": null,
@@ -463,7 +489,7 @@
       {
         "__type__": "openai.types.chat.chat_completion_chunk.ChatCompletionChunk",
         "__data__": {
-          "id": "chatcmpl-333",
+          "id": "chatcmpl-698",
           "choices": [
             {
               "delta": {
@@ -478,7 +504,7 @@
               "logprobs": null
             }
           ],
-          "created": 1754081850,
+          "created": 1756921359,
           "model": "llama3.2:3b-instruct-fp16",
           "object": "chat.completion.chunk",
           "service_tier": null,
@@ -489,7 +515,7 @@
       {
         "__type__": "openai.types.chat.chat_completion_chunk.ChatCompletionChunk",
         "__data__": {
-          "id": "chatcmpl-333",
+          "id": "chatcmpl-698",
           "choices": [
             {
               "delta": {
@@ -504,7 +530,7 @@
               "logprobs": null
             }
           ],
-          "created": 1754081850,
+          "created": 1756921360,
           "model": "llama3.2:3b-instruct-fp16",
           "object": "chat.completion.chunk",
           "service_tier": null,
@@ -515,7 +541,7 @@
       {
         "__type__": "openai.types.chat.chat_completion_chunk.ChatCompletionChunk",
         "__data__": {
-          "id": "chatcmpl-333",
+          "id": "chatcmpl-698",
           "choices": [
             {
               "delta": {
@@ -530,7 +556,7 @@
               "logprobs": null
             }
           ],
-          "created": 1754081850,
+          "created": 1756921360,
           "model": "llama3.2:3b-instruct-fp16",
           "object": "chat.completion.chunk",
           "service_tier": null,
@@ -541,7 +567,7 @@
       {
         "__type__": "openai.types.chat.chat_completion_chunk.ChatCompletionChunk",
         "__data__": {
-          "id": "chatcmpl-333",
+          "id": "chatcmpl-698",
           "choices": [
             {
               "delta": {
@@ -556,7 +582,7 @@
               "logprobs": null
             }
           ],
-          "created": 1754081850,
+          "created": 1756921360,
           "model": "llama3.2:3b-instruct-fp16",
           "object": "chat.completion.chunk",
           "service_tier": null,
@@ -567,7 +593,7 @@
       {
         "__type__": "openai.types.chat.chat_completion_chunk.ChatCompletionChunk",
         "__data__": {
-          "id": "chatcmpl-333",
+          "id": "chatcmpl-698",
           "choices": [
             {
               "delta": {
@@ -582,7 +608,7 @@
               "logprobs": null
             }
           ],
-          "created": 1754081850,
+          "created": 1756921360,
           "model": "llama3.2:3b-instruct-fp16",
           "object": "chat.completion.chunk",
           "service_tier": null,
@@ -593,7 +619,7 @@
       {
         "__type__": "openai.types.chat.chat_completion_chunk.ChatCompletionChunk",
         "__data__": {
-          "id": "chatcmpl-333",
+          "id": "chatcmpl-698",
           "choices": [
             {
               "delta": {
@@ -608,7 +634,7 @@
               "logprobs": null
             }
           ],
-          "created": 1754081850,
+          "created": 1756921360,
           "model": "llama3.2:3b-instruct-fp16",
           "object": "chat.completion.chunk",
           "service_tier": null,
@@ -619,7 +645,7 @@
       {
         "__type__": "openai.types.chat.chat_completion_chunk.ChatCompletionChunk",
         "__data__": {
-          "id": "chatcmpl-333",
+          "id": "chatcmpl-698",
           "choices": [
             {
               "delta": {
@@ -634,7 +660,7 @@
               "logprobs": null
             }
           ],
-          "created": 1754081850,
+          "created": 1756921360,
           "model": "llama3.2:3b-instruct-fp16",
           "object": "chat.completion.chunk",
           "service_tier": null,
diff --git a/tests/integration/recordings/responses/6fbea1abca7c.json b/tests/integration/recordings/responses/6fbea1abca7c.json
index 576fc7de1..c16fe1268 100644
--- a/tests/integration/recordings/responses/6fbea1abca7c.json
+++ b/tests/integration/recordings/responses/6fbea1abca7c.json
@@ -22,7 +22,7 @@
         "__type__": "ollama._types.GenerateResponse",
         "__data__": {
           "model": "llama3.2:3b-instruct-fp16",
-          "created_at": "2025-08-01T23:14:20.337763Z",
+          "created_at": "2025-09-03T17:38:01.89965Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -40,7 +40,7 @@
         "__type__": "ollama._types.GenerateResponse",
         "__data__": {
           "model": "llama3.2:3b-instruct-fp16",
-          "created_at": "2025-08-01T23:14:20.394358Z",
+          "created_at": "2025-09-03T17:38:01.941253Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -58,7 +58,7 @@
         "__type__": "ollama._types.GenerateResponse",
         "__data__": {
           "model": "llama3.2:3b-instruct-fp16",
-          "created_at": "2025-08-01T23:14:20.451349Z",
+          "created_at": "2025-09-03T17:38:01.982621Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -76,7 +76,7 @@
         "__type__": "ollama._types.GenerateResponse",
         "__data__": {
           "model": "llama3.2:3b-instruct-fp16",
-          "created_at": "2025-08-01T23:14:20.504443Z",
+          "created_at": "2025-09-03T17:38:02.024144Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -94,7 +94,7 @@
         "__type__": "ollama._types.GenerateResponse",
         "__data__": {
           "model": "llama3.2:3b-instruct-fp16",
-          "created_at": "2025-08-01T23:14:20.555779Z",
+          "created_at": "2025-09-03T17:38:02.065495Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -112,7 +112,7 @@
         "__type__": "ollama._types.GenerateResponse",
         "__data__": {
           "model": "llama3.2:3b-instruct-fp16",
-          "created_at": "2025-08-01T23:14:20.607807Z",
+          "created_at": "2025-09-03T17:38:02.107529Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -130,7 +130,7 @@
         "__type__": "ollama._types.GenerateResponse",
         "__data__": {
           "model": "llama3.2:3b-instruct-fp16",
-          "created_at": "2025-08-01T23:14:20.660627Z",
+          "created_at": "2025-09-03T17:38:02.149217Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -148,7 +148,7 @@
         "__type__": "ollama._types.GenerateResponse",
         "__data__": {
           "model": "llama3.2:3b-instruct-fp16",
-          "created_at": "2025-08-01T23:14:20.711562Z",
+          "created_at": "2025-09-03T17:38:02.190357Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -166,7 +166,7 @@
         "__type__": "ollama._types.GenerateResponse",
         "__data__": {
           "model": "llama3.2:3b-instruct-fp16",
-          "created_at": "2025-08-01T23:14:20.761822Z",
+          "created_at": "2025-09-03T17:38:02.231501Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -184,7 +184,7 @@
         "__type__": "ollama._types.GenerateResponse",
         "__data__": {
           "model": "llama3.2:3b-instruct-fp16",
-          "created_at": "2025-08-01T23:14:20.81712Z",
+          "created_at": "2025-09-03T17:38:02.272546Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -202,7 +202,7 @@
         "__type__": "ollama._types.GenerateResponse",
         "__data__": {
           "model": "llama3.2:3b-instruct-fp16",
-          "created_at": "2025-08-01T23:14:20.868755Z",
+          "created_at": "2025-09-03T17:38:02.313561Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -220,7 +220,7 @@
         "__type__": "ollama._types.GenerateResponse",
         "__data__": {
           "model": "llama3.2:3b-instruct-fp16",
-          "created_at": "2025-08-01T23:14:20.921049Z",
+          "created_at": "2025-09-03T17:38:02.354563Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -238,7 +238,7 @@
         "__type__": "ollama._types.GenerateResponse",
         "__data__": {
           "model": "llama3.2:3b-instruct-fp16",
-          "created_at": "2025-08-01T23:14:20.973584Z",
+          "created_at": "2025-09-03T17:38:02.395585Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -256,7 +256,7 @@
         "__type__": "ollama._types.GenerateResponse",
         "__data__": {
           "model": "llama3.2:3b-instruct-fp16",
-          "created_at": "2025-08-01T23:14:21.030707Z",
+          "created_at": "2025-09-03T17:38:02.436854Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -274,7 +274,7 @@
         "__type__": "ollama._types.GenerateResponse",
         "__data__": {
           "model": "llama3.2:3b-instruct-fp16",
-          "created_at": "2025-08-01T23:14:21.082015Z",
+          "created_at": "2025-09-03T17:38:02.47814Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -292,7 +292,7 @@
         "__type__": "ollama._types.GenerateResponse",
         "__data__": {
           "model": "llama3.2:3b-instruct-fp16",
-          "created_at": "2025-08-01T23:14:21.132945Z",
+          "created_at": "2025-09-03T17:38:02.519661Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -310,7 +310,7 @@
         "__type__": "ollama._types.GenerateResponse",
         "__data__": {
           "model": "llama3.2:3b-instruct-fp16",
-          "created_at": "2025-08-01T23:14:21.187452Z",
+          "created_at": "2025-09-03T17:38:02.561119Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -328,7 +328,7 @@
         "__type__": "ollama._types.GenerateResponse",
         "__data__": {
           "model": "llama3.2:3b-instruct-fp16",
-          "created_at": "2025-08-01T23:14:21.239827Z",
+          "created_at": "2025-09-03T17:38:02.602821Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -346,15 +346,15 @@
         "__type__": "ollama._types.GenerateResponse",
         "__data__": {
           "model": "llama3.2:3b-instruct-fp16",
-          "created_at": "2025-08-01T23:14:21.294154Z",
+          "created_at": "2025-09-03T17:38:02.644633Z",
           "done": true,
           "done_reason": "stop",
-          "total_duration": 1929211666,
-          "load_duration": 61298666,
+          "total_duration": 1375629459,
+          "load_duration": 94090250,
           "prompt_eval_count": 386,
-          "prompt_eval_duration": 908000000,
+          "prompt_eval_duration": 535119167,
           "eval_count": 19,
-          "eval_duration": 959000000,
+          "eval_duration": 745684041,
           "response": "",
           "thinking": null,
           "context": null
diff --git a/tests/integration/recordings/responses/6fe1d4fedf12.json b/tests/integration/recordings/responses/6fe1d4fedf12.json
index 733c7bd55..8fd079a85 100644
--- a/tests/integration/recordings/responses/6fe1d4fedf12.json
+++ b/tests/integration/recordings/responses/6fe1d4fedf12.json
@@ -1,7 +1,7 @@
 {
   "request": {
     "method": "POST",
-    "url": "http://localhost:11434/v1/v1/chat/completions",
+    "url": "http://0.0.0.0:11434/v1/v1/chat/completions",
     "headers": {},
     "body": {
       "model": "llama3.2:3b-instruct-fp16",
@@ -24,7 +24,7 @@
       {
         "__type__": "openai.types.chat.chat_completion_chunk.ChatCompletionChunk",
         "__data__": {
-          "id": "chatcmpl-381",
+          "id": "chatcmpl-358",
           "choices": [
             {
               "delta": {
@@ -39,7 +39,7 @@
               "logprobs": null
             }
           ],
-          "created": 1755228961,
+          "created": 1756921324,
           "model": "llama3.2:3b-instruct-fp16",
           "object": "chat.completion.chunk",
           "service_tier": null,
@@ -50,11 +50,11 @@
       {
         "__type__": "openai.types.chat.chat_completion_chunk.ChatCompletionChunk",
         "__data__": {
-          "id": "chatcmpl-381",
+          "id": "chatcmpl-358",
           "choices": [
             {
               "delta": {
-                "content": " don",
+                "content": "'m",
                 "function_call": null,
                 "refusal": null,
                 "role": "assistant",
@@ -65,7 +65,7 @@
               "logprobs": null
             }
           ],
-          "created": 1755228961,
+          "created": 1756921324,
           "model": "llama3.2:3b-instruct-fp16",
           "object": "chat.completion.chunk",
           "service_tier": null,
@@ -76,11 +76,11 @@
       {
         "__type__": "openai.types.chat.chat_completion_chunk.ChatCompletionChunk",
         "__data__": {
-          "id": "chatcmpl-381",
+          "id": "chatcmpl-358",
           "choices": [
             {
               "delta": {
-                "content": "'t",
+                "content": " not",
                 "function_call": null,
                 "refusal": null,
                 "role": "assistant",
@@ -91,7 +91,7 @@
               "logprobs": null
             }
           ],
-          "created": 1755228961,
+          "created": 1756921324,
           "model": "llama3.2:3b-instruct-fp16",
           "object": "chat.completion.chunk",
           "service_tier": null,
@@ -102,11 +102,11 @@
       {
         "__type__": "openai.types.chat.chat_completion_chunk.ChatCompletionChunk",
         "__data__": {
-          "id": "chatcmpl-381",
+          "id": "chatcmpl-358",
           "choices": [
             {
               "delta": {
-                "content": " have",
+                "content": " able",
                 "function_call": null,
                 "refusal": null,
                 "role": "assistant",
@@ -117,7 +117,7 @@
               "logprobs": null
             }
           ],
-          "created": 1755228961,
+          "created": 1756921324,
           "model": "llama3.2:3b-instruct-fp16",
           "object": "chat.completion.chunk",
           "service_tier": null,
@@ -128,85 +128,7 @@
       {
         "__type__": "openai.types.chat.chat_completion_chunk.ChatCompletionChunk",
         "__data__": {
-          "id": "chatcmpl-381",
-          "choices": [
-            {
-              "delta": {
-                "content": " real",
-                "function_call": null,
-                "refusal": null,
-                "role": "assistant",
-                "tool_calls": null
-              },
-              "finish_reason": null,
-              "index": 0,
-              "logprobs": null
-            }
-          ],
-          "created": 1755228961,
-          "model": "llama3.2:3b-instruct-fp16",
-          "object": "chat.completion.chunk",
-          "service_tier": null,
-          "system_fingerprint": "fp_ollama",
-          "usage": null
-        }
-      },
-      {
-        "__type__": "openai.types.chat.chat_completion_chunk.ChatCompletionChunk",
-        "__data__": {
-          "id": "chatcmpl-381",
-          "choices": [
-            {
-              "delta": {
-                "content": "-time",
-                "function_call": null,
-                "refusal": null,
-                "role": "assistant",
-                "tool_calls": null
-              },
-              "finish_reason": null,
-              "index": 0,
-              "logprobs": null
-            }
-          ],
-          "created": 1755228961,
-          "model": "llama3.2:3b-instruct-fp16",
-          "object": "chat.completion.chunk",
-          "service_tier": null,
-          "system_fingerprint": "fp_ollama",
-          "usage": null
-        }
-      },
-      {
-        "__type__": "openai.types.chat.chat_completion_chunk.ChatCompletionChunk",
-        "__data__": {
-          "id": "chatcmpl-381",
-          "choices": [
-            {
-              "delta": {
-                "content": " access",
-                "function_call": null,
-                "refusal": null,
-                "role": "assistant",
-                "tool_calls": null
-              },
-              "finish_reason": null,
-              "index": 0,
-              "logprobs": null
-            }
-          ],
-          "created": 1755228961,
-          "model": "llama3.2:3b-instruct-fp16",
-          "object": "chat.completion.chunk",
-          "service_tier": null,
-          "system_fingerprint": "fp_ollama",
-          "usage": null
-        }
-      },
-      {
-        "__type__": "openai.types.chat.chat_completion_chunk.ChatCompletionChunk",
-        "__data__": {
-          "id": "chatcmpl-381",
+          "id": "chatcmpl-358",
           "choices": [
             {
               "delta": {
@@ -221,7 +143,7 @@
               "logprobs": null
             }
           ],
-          "created": 1755228962,
+          "created": 1756921324,
           "model": "llama3.2:3b-instruct-fp16",
           "object": "chat.completion.chunk",
           "service_tier": null,
@@ -232,215 +154,7 @@
       {
         "__type__": "openai.types.chat.chat_completion_chunk.ChatCompletionChunk",
         "__data__": {
-          "id": "chatcmpl-381",
-          "choices": [
-            {
-              "delta": {
-                "content": " current",
-                "function_call": null,
-                "refusal": null,
-                "role": "assistant",
-                "tool_calls": null
-              },
-              "finish_reason": null,
-              "index": 0,
-              "logprobs": null
-            }
-          ],
-          "created": 1755228962,
-          "model": "llama3.2:3b-instruct-fp16",
-          "object": "chat.completion.chunk",
-          "service_tier": null,
-          "system_fingerprint": "fp_ollama",
-          "usage": null
-        }
-      },
-      {
-        "__type__": "openai.types.chat.chat_completion_chunk.ChatCompletionChunk",
-        "__data__": {
-          "id": "chatcmpl-381",
-          "choices": [
-            {
-              "delta": {
-                "content": " weather",
-                "function_call": null,
-                "refusal": null,
-                "role": "assistant",
-                "tool_calls": null
-              },
-              "finish_reason": null,
-              "index": 0,
-              "logprobs": null
-            }
-          ],
-          "created": 1755228962,
-          "model": "llama3.2:3b-instruct-fp16",
-          "object": "chat.completion.chunk",
-          "service_tier": null,
-          "system_fingerprint": "fp_ollama",
-          "usage": null
-        }
-      },
-      {
-        "__type__": "openai.types.chat.chat_completion_chunk.ChatCompletionChunk",
-        "__data__": {
-          "id": "chatcmpl-381",
-          "choices": [
-            {
-              "delta": {
-                "content": " conditions",
-                "function_call": null,
-                "refusal": null,
-                "role": "assistant",
-                "tool_calls": null
-              },
-              "finish_reason": null,
-              "index": 0,
-              "logprobs": null
-            }
-          ],
-          "created": 1755228962,
-          "model": "llama3.2:3b-instruct-fp16",
-          "object": "chat.completion.chunk",
-          "service_tier": null,
-          "system_fingerprint": "fp_ollama",
-          "usage": null
-        }
-      },
-      {
-        "__type__": "openai.types.chat.chat_completion_chunk.ChatCompletionChunk",
-        "__data__": {
-          "id": "chatcmpl-381",
-          "choices": [
-            {
-              "delta": {
-                "content": ".",
-                "function_call": null,
-                "refusal": null,
-                "role": "assistant",
-                "tool_calls": null
-              },
-              "finish_reason": null,
-              "index": 0,
-              "logprobs": null
-            }
-          ],
-          "created": 1755228962,
-          "model": "llama3.2:3b-instruct-fp16",
-          "object": "chat.completion.chunk",
-          "service_tier": null,
-          "system_fingerprint": "fp_ollama",
-          "usage": null
-        }
-      },
-      {
-        "__type__": "openai.types.chat.chat_completion_chunk.ChatCompletionChunk",
-        "__data__": {
-          "id": "chatcmpl-381",
-          "choices": [
-            {
-              "delta": {
-                "content": " However",
-                "function_call": null,
-                "refusal": null,
-                "role": "assistant",
-                "tool_calls": null
-              },
-              "finish_reason": null,
-              "index": 0,
-              "logprobs": null
-            }
-          ],
-          "created": 1755228962,
-          "model": "llama3.2:3b-instruct-fp16",
-          "object": "chat.completion.chunk",
-          "service_tier": null,
-          "system_fingerprint": "fp_ollama",
-          "usage": null
-        }
-      },
-      {
-        "__type__": "openai.types.chat.chat_completion_chunk.ChatCompletionChunk",
-        "__data__": {
-          "id": "chatcmpl-381",
-          "choices": [
-            {
-              "delta": {
-                "content": ",",
-                "function_call": null,
-                "refusal": null,
-                "role": "assistant",
-                "tool_calls": null
-              },
-              "finish_reason": null,
-              "index": 0,
-              "logprobs": null
-            }
-          ],
-          "created": 1755228962,
-          "model": "llama3.2:3b-instruct-fp16",
-          "object": "chat.completion.chunk",
-          "service_tier": null,
-          "system_fingerprint": "fp_ollama",
-          "usage": null
-        }
-      },
-      {
-        "__type__": "openai.types.chat.chat_completion_chunk.ChatCompletionChunk",
-        "__data__": {
-          "id": "chatcmpl-381",
-          "choices": [
-            {
-              "delta": {
-                "content": " I",
-                "function_call": null,
-                "refusal": null,
-                "role": "assistant",
-                "tool_calls": null
-              },
-              "finish_reason": null,
-              "index": 0,
-              "logprobs": null
-            }
-          ],
-          "created": 1755228962,
-          "model": "llama3.2:3b-instruct-fp16",
-          "object": "chat.completion.chunk",
-          "service_tier": null,
-          "system_fingerprint": "fp_ollama",
-          "usage": null
-        }
-      },
-      {
-        "__type__": "openai.types.chat.chat_completion_chunk.ChatCompletionChunk",
-        "__data__": {
-          "id": "chatcmpl-381",
-          "choices": [
-            {
-              "delta": {
-                "content": " can",
-                "function_call": null,
-                "refusal": null,
-                "role": "assistant",
-                "tool_calls": null
-              },
-              "finish_reason": null,
-              "index": 0,
-              "logprobs": null
-            }
-          ],
-          "created": 1755228962,
-          "model": "llama3.2:3b-instruct-fp16",
-          "object": "chat.completion.chunk",
-          "service_tier": null,
-          "system_fingerprint": "fp_ollama",
-          "usage": null
-        }
-      },
-      {
-        "__type__": "openai.types.chat.chat_completion_chunk.ChatCompletionChunk",
-        "__data__": {
-          "id": "chatcmpl-381",
+          "id": "chatcmpl-358",
           "choices": [
             {
               "delta": {
@@ -455,7 +169,7 @@
               "logprobs": null
             }
           ],
-          "created": 1755228962,
+          "created": 1756921324,
           "model": "llama3.2:3b-instruct-fp16",
           "object": "chat.completion.chunk",
           "service_tier": null,
@@ -466,11 +180,11 @@
       {
         "__type__": "openai.types.chat.chat_completion_chunk.ChatCompletionChunk",
         "__data__": {
-          "id": "chatcmpl-381",
+          "id": "chatcmpl-358",
           "choices": [
             {
               "delta": {
-                "content": " you",
+                "content": " real",
                 "function_call": null,
                 "refusal": null,
                 "role": "assistant",
@@ -481,7 +195,7 @@
               "logprobs": null
             }
           ],
-          "created": 1755228962,
+          "created": 1756921324,
           "model": "llama3.2:3b-instruct-fp16",
           "object": "chat.completion.chunk",
           "service_tier": null,
@@ -492,11 +206,11 @@
       {
         "__type__": "openai.types.chat.chat_completion_chunk.ChatCompletionChunk",
         "__data__": {
-          "id": "chatcmpl-381",
+          "id": "chatcmpl-358",
           "choices": [
             {
               "delta": {
-                "content": " with",
+                "content": "-time",
                 "function_call": null,
                 "refusal": null,
                 "role": "assistant",
@@ -507,7 +221,7 @@
               "logprobs": null
             }
           ],
-          "created": 1755228962,
+          "created": 1756921324,
           "model": "llama3.2:3b-instruct-fp16",
           "object": "chat.completion.chunk",
           "service_tier": null,
@@ -518,189 +232,7 @@
       {
         "__type__": "openai.types.chat.chat_completion_chunk.ChatCompletionChunk",
         "__data__": {
-          "id": "chatcmpl-381",
-          "choices": [
-            {
-              "delta": {
-                "content": " information",
-                "function_call": null,
-                "refusal": null,
-                "role": "assistant",
-                "tool_calls": null
-              },
-              "finish_reason": null,
-              "index": 0,
-              "logprobs": null
-            }
-          ],
-          "created": 1755228962,
-          "model": "llama3.2:3b-instruct-fp16",
-          "object": "chat.completion.chunk",
-          "service_tier": null,
-          "system_fingerprint": "fp_ollama",
-          "usage": null
-        }
-      },
-      {
-        "__type__": "openai.types.chat.chat_completion_chunk.ChatCompletionChunk",
-        "__data__": {
-          "id": "chatcmpl-381",
-          "choices": [
-            {
-              "delta": {
-                "content": " on",
-                "function_call": null,
-                "refusal": null,
-                "role": "assistant",
-                "tool_calls": null
-              },
-              "finish_reason": null,
-              "index": 0,
-              "logprobs": null
-            }
-          ],
-          "created": 1755228962,
-          "model": "llama3.2:3b-instruct-fp16",
-          "object": "chat.completion.chunk",
-          "service_tier": null,
-          "system_fingerprint": "fp_ollama",
-          "usage": null
-        }
-      },
-      {
-        "__type__": "openai.types.chat.chat_completion_chunk.ChatCompletionChunk",
-        "__data__": {
-          "id": "chatcmpl-381",
-          "choices": [
-            {
-              "delta": {
-                "content": " the",
-                "function_call": null,
-                "refusal": null,
-                "role": "assistant",
-                "tool_calls": null
-              },
-              "finish_reason": null,
-              "index": 0,
-              "logprobs": null
-            }
-          ],
-          "created": 1755228962,
-          "model": "llama3.2:3b-instruct-fp16",
-          "object": "chat.completion.chunk",
-          "service_tier": null,
-          "system_fingerprint": "fp_ollama",
-          "usage": null
-        }
-      },
-      {
-        "__type__": "openai.types.chat.chat_completion_chunk.ChatCompletionChunk",
-        "__data__": {
-          "id": "chatcmpl-381",
-          "choices": [
-            {
-              "delta": {
-                "content": " typical",
-                "function_call": null,
-                "refusal": null,
-                "role": "assistant",
-                "tool_calls": null
-              },
-              "finish_reason": null,
-              "index": 0,
-              "logprobs": null
-            }
-          ],
-          "created": 1755228962,
-          "model": "llama3.2:3b-instruct-fp16",
-          "object": "chat.completion.chunk",
-          "service_tier": null,
-          "system_fingerprint": "fp_ollama",
-          "usage": null
-        }
-      },
-      {
-        "__type__": "openai.types.chat.chat_completion_chunk.ChatCompletionChunk",
-        "__data__": {
-          "id": "chatcmpl-381",
-          "choices": [
-            {
-              "delta": {
-                "content": " climate",
-                "function_call": null,
-                "refusal": null,
-                "role": "assistant",
-                "tool_calls": null
-              },
-              "finish_reason": null,
-              "index": 0,
-              "logprobs": null
-            }
-          ],
-          "created": 1755228962,
-          "model": "llama3.2:3b-instruct-fp16",
-          "object": "chat.completion.chunk",
-          "service_tier": null,
-          "system_fingerprint": "fp_ollama",
-          "usage": null
-        }
-      },
-      {
-        "__type__": "openai.types.chat.chat_completion_chunk.ChatCompletionChunk",
-        "__data__": {
-          "id": "chatcmpl-381",
-          "choices": [
-            {
-              "delta": {
-                "content": " of",
-                "function_call": null,
-                "refusal": null,
-                "role": "assistant",
-                "tool_calls": null
-              },
-              "finish_reason": null,
-              "index": 0,
-              "logprobs": null
-            }
-          ],
-          "created": 1755228962,
-          "model": "llama3.2:3b-instruct-fp16",
-          "object": "chat.completion.chunk",
-          "service_tier": null,
-          "system_fingerprint": "fp_ollama",
-          "usage": null
-        }
-      },
-      {
-        "__type__": "openai.types.chat.chat_completion_chunk.ChatCompletionChunk",
-        "__data__": {
-          "id": "chatcmpl-381",
-          "choices": [
-            {
-              "delta": {
-                "content": " Tokyo",
-                "function_call": null,
-                "refusal": null,
-                "role": "assistant",
-                "tool_calls": null
-              },
-              "finish_reason": null,
-              "index": 0,
-              "logprobs": null
-            }
-          ],
-          "created": 1755228962,
-          "model": "llama3.2:3b-instruct-fp16",
-          "object": "chat.completion.chunk",
-          "service_tier": null,
-          "system_fingerprint": "fp_ollama",
-          "usage": null
-        }
-      },
-      {
-        "__type__": "openai.types.chat.chat_completion_chunk.ChatCompletionChunk",
-        "__data__": {
-          "id": "chatcmpl-381",
+          "id": "chatcmpl-358",
           "choices": [
             {
               "delta": {
@@ -715,7 +247,7 @@
               "logprobs": null
             }
           ],
-          "created": 1755228962,
+          "created": 1756921324,
           "model": "llama3.2:3b-instruct-fp16",
           "object": "chat.completion.chunk",
           "service_tier": null,
@@ -726,215 +258,7 @@
       {
         "__type__": "openai.types.chat.chat_completion_chunk.ChatCompletionChunk",
         "__data__": {
-          "id": "chatcmpl-381",
-          "choices": [
-            {
-              "delta": {
-                "content": " suggest",
-                "function_call": null,
-                "refusal": null,
-                "role": "assistant",
-                "tool_calls": null
-              },
-              "finish_reason": null,
-              "index": 0,
-              "logprobs": null
-            }
-          ],
-          "created": 1755228962,
-          "model": "llama3.2:3b-instruct-fp16",
-          "object": "chat.completion.chunk",
-          "service_tier": null,
-          "system_fingerprint": "fp_ollama",
-          "usage": null
-        }
-      },
-      {
-        "__type__": "openai.types.chat.chat_completion_chunk.ChatCompletionChunk",
-        "__data__": {
-          "id": "chatcmpl-381",
-          "choices": [
-            {
-              "delta": {
-                "content": " ways",
-                "function_call": null,
-                "refusal": null,
-                "role": "assistant",
-                "tool_calls": null
-              },
-              "finish_reason": null,
-              "index": 0,
-              "logprobs": null
-            }
-          ],
-          "created": 1755228962,
-          "model": "llama3.2:3b-instruct-fp16",
-          "object": "chat.completion.chunk",
-          "service_tier": null,
-          "system_fingerprint": "fp_ollama",
-          "usage": null
-        }
-      },
-      {
-        "__type__": "openai.types.chat.chat_completion_chunk.ChatCompletionChunk",
-        "__data__": {
-          "id": "chatcmpl-381",
-          "choices": [
-            {
-              "delta": {
-                "content": " for",
-                "function_call": null,
-                "refusal": null,
-                "role": "assistant",
-                "tool_calls": null
-              },
-              "finish_reason": null,
-              "index": 0,
-              "logprobs": null
-            }
-          ],
-          "created": 1755228962,
-          "model": "llama3.2:3b-instruct-fp16",
-          "object": "chat.completion.chunk",
-          "service_tier": null,
-          "system_fingerprint": "fp_ollama",
-          "usage": null
-        }
-      },
-      {
-        "__type__": "openai.types.chat.chat_completion_chunk.ChatCompletionChunk",
-        "__data__": {
-          "id": "chatcmpl-381",
-          "choices": [
-            {
-              "delta": {
-                "content": " you",
-                "function_call": null,
-                "refusal": null,
-                "role": "assistant",
-                "tool_calls": null
-              },
-              "finish_reason": null,
-              "index": 0,
-              "logprobs": null
-            }
-          ],
-          "created": 1755228962,
-          "model": "llama3.2:3b-instruct-fp16",
-          "object": "chat.completion.chunk",
-          "service_tier": null,
-          "system_fingerprint": "fp_ollama",
-          "usage": null
-        }
-      },
-      {
-        "__type__": "openai.types.chat.chat_completion_chunk.ChatCompletionChunk",
-        "__data__": {
-          "id": "chatcmpl-381",
-          "choices": [
-            {
-              "delta": {
-                "content": " to",
-                "function_call": null,
-                "refusal": null,
-                "role": "assistant",
-                "tool_calls": null
-              },
-              "finish_reason": null,
-              "index": 0,
-              "logprobs": null
-            }
-          ],
-          "created": 1755228963,
-          "model": "llama3.2:3b-instruct-fp16",
-          "object": "chat.completion.chunk",
-          "service_tier": null,
-          "system_fingerprint": "fp_ollama",
-          "usage": null
-        }
-      },
-      {
-        "__type__": "openai.types.chat.chat_completion_chunk.ChatCompletionChunk",
-        "__data__": {
-          "id": "chatcmpl-381",
-          "choices": [
-            {
-              "delta": {
-                "content": " find",
-                "function_call": null,
-                "refusal": null,
-                "role": "assistant",
-                "tool_calls": null
-              },
-              "finish_reason": null,
-              "index": 0,
-              "logprobs": null
-            }
-          ],
-          "created": 1755228963,
-          "model": "llama3.2:3b-instruct-fp16",
-          "object": "chat.completion.chunk",
-          "service_tier": null,
-          "system_fingerprint": "fp_ollama",
-          "usage": null
-        }
-      },
-      {
-        "__type__": "openai.types.chat.chat_completion_chunk.ChatCompletionChunk",
-        "__data__": {
-          "id": "chatcmpl-381",
-          "choices": [
-            {
-              "delta": {
-                "content": " out",
-                "function_call": null,
-                "refusal": null,
-                "role": "assistant",
-                "tool_calls": null
-              },
-              "finish_reason": null,
-              "index": 0,
-              "logprobs": null
-            }
-          ],
-          "created": 1755228963,
-          "model": "llama3.2:3b-instruct-fp16",
-          "object": "chat.completion.chunk",
-          "service_tier": null,
-          "system_fingerprint": "fp_ollama",
-          "usage": null
-        }
-      },
-      {
-        "__type__": "openai.types.chat.chat_completion_chunk.ChatCompletionChunk",
-        "__data__": {
-          "id": "chatcmpl-381",
-          "choices": [
-            {
-              "delta": {
-                "content": " the",
-                "function_call": null,
-                "refusal": null,
-                "role": "assistant",
-                "tool_calls": null
-              },
-              "finish_reason": null,
-              "index": 0,
-              "logprobs": null
-            }
-          ],
-          "created": 1755228963,
-          "model": "llama3.2:3b-instruct-fp16",
-          "object": "chat.completion.chunk",
-          "service_tier": null,
-          "system_fingerprint": "fp_ollama",
-          "usage": null
-        }
-      },
-      {
-        "__type__": "openai.types.chat.chat_completion_chunk.ChatCompletionChunk",
-        "__data__": {
-          "id": "chatcmpl-381",
+          "id": "chatcmpl-358",
           "choices": [
             {
               "delta": {
@@ -949,7 +273,7 @@
               "logprobs": null
             }
           ],
-          "created": 1755228963,
+          "created": 1756921324,
           "model": "llama3.2:3b-instruct-fp16",
           "object": "chat.completion.chunk",
           "service_tier": null,
@@ -960,7 +284,7 @@
       {
         "__type__": "openai.types.chat.chat_completion_chunk.ChatCompletionChunk",
         "__data__": {
-          "id": "chatcmpl-381",
+          "id": "chatcmpl-358",
           "choices": [
             {
               "delta": {
@@ -975,7 +299,7 @@
               "logprobs": null
             }
           ],
-          "created": 1755228963,
+          "created": 1756921324,
           "model": "llama3.2:3b-instruct-fp16",
           "object": "chat.completion.chunk",
           "service_tier": null,
@@ -986,11 +310,11 @@
       {
         "__type__": "openai.types.chat.chat_completion_chunk.ChatCompletionChunk",
         "__data__": {
-          "id": "chatcmpl-381",
+          "id": "chatcmpl-358",
           "choices": [
             {
               "delta": {
-                "content": ".\n\n",
+                "content": " information",
                 "function_call": null,
                 "refusal": null,
                 "role": "assistant",
@@ -1001,7 +325,7 @@
               "logprobs": null
             }
           ],
-          "created": 1755228963,
+          "created": 1756921325,
           "model": "llama3.2:3b-instruct-fp16",
           "object": "chat.completion.chunk",
           "service_tier": null,
@@ -1012,657 +336,7 @@
       {
         "__type__": "openai.types.chat.chat_completion_chunk.ChatCompletionChunk",
         "__data__": {
-          "id": "chatcmpl-381",
-          "choices": [
-            {
-              "delta": {
-                "content": "Tok",
-                "function_call": null,
-                "refusal": null,
-                "role": "assistant",
-                "tool_calls": null
-              },
-              "finish_reason": null,
-              "index": 0,
-              "logprobs": null
-            }
-          ],
-          "created": 1755228963,
-          "model": "llama3.2:3b-instruct-fp16",
-          "object": "chat.completion.chunk",
-          "service_tier": null,
-          "system_fingerprint": "fp_ollama",
-          "usage": null
-        }
-      },
-      {
-        "__type__": "openai.types.chat.chat_completion_chunk.ChatCompletionChunk",
-        "__data__": {
-          "id": "chatcmpl-381",
-          "choices": [
-            {
-              "delta": {
-                "content": "yo",
-                "function_call": null,
-                "refusal": null,
-                "role": "assistant",
-                "tool_calls": null
-              },
-              "finish_reason": null,
-              "index": 0,
-              "logprobs": null
-            }
-          ],
-          "created": 1755228963,
-          "model": "llama3.2:3b-instruct-fp16",
-          "object": "chat.completion.chunk",
-          "service_tier": null,
-          "system_fingerprint": "fp_ollama",
-          "usage": null
-        }
-      },
-      {
-        "__type__": "openai.types.chat.chat_completion_chunk.ChatCompletionChunk",
-        "__data__": {
-          "id": "chatcmpl-381",
-          "choices": [
-            {
-              "delta": {
-                "content": " has",
-                "function_call": null,
-                "refusal": null,
-                "role": "assistant",
-                "tool_calls": null
-              },
-              "finish_reason": null,
-              "index": 0,
-              "logprobs": null
-            }
-          ],
-          "created": 1755228963,
-          "model": "llama3.2:3b-instruct-fp16",
-          "object": "chat.completion.chunk",
-          "service_tier": null,
-          "system_fingerprint": "fp_ollama",
-          "usage": null
-        }
-      },
-      {
-        "__type__": "openai.types.chat.chat_completion_chunk.ChatCompletionChunk",
-        "__data__": {
-          "id": "chatcmpl-381",
-          "choices": [
-            {
-              "delta": {
-                "content": " a",
-                "function_call": null,
-                "refusal": null,
-                "role": "assistant",
-                "tool_calls": null
-              },
-              "finish_reason": null,
-              "index": 0,
-              "logprobs": null
-            }
-          ],
-          "created": 1755228963,
-          "model": "llama3.2:3b-instruct-fp16",
-          "object": "chat.completion.chunk",
-          "service_tier": null,
-          "system_fingerprint": "fp_ollama",
-          "usage": null
-        }
-      },
-      {
-        "__type__": "openai.types.chat.chat_completion_chunk.ChatCompletionChunk",
-        "__data__": {
-          "id": "chatcmpl-381",
-          "choices": [
-            {
-              "delta": {
-                "content": " humid",
-                "function_call": null,
-                "refusal": null,
-                "role": "assistant",
-                "tool_calls": null
-              },
-              "finish_reason": null,
-              "index": 0,
-              "logprobs": null
-            }
-          ],
-          "created": 1755228963,
-          "model": "llama3.2:3b-instruct-fp16",
-          "object": "chat.completion.chunk",
-          "service_tier": null,
-          "system_fingerprint": "fp_ollama",
-          "usage": null
-        }
-      },
-      {
-        "__type__": "openai.types.chat.chat_completion_chunk.ChatCompletionChunk",
-        "__data__": {
-          "id": "chatcmpl-381",
-          "choices": [
-            {
-              "delta": {
-                "content": " subt",
-                "function_call": null,
-                "refusal": null,
-                "role": "assistant",
-                "tool_calls": null
-              },
-              "finish_reason": null,
-              "index": 0,
-              "logprobs": null
-            }
-          ],
-          "created": 1755228963,
-          "model": "llama3.2:3b-instruct-fp16",
-          "object": "chat.completion.chunk",
-          "service_tier": null,
-          "system_fingerprint": "fp_ollama",
-          "usage": null
-        }
-      },
-      {
-        "__type__": "openai.types.chat.chat_completion_chunk.ChatCompletionChunk",
-        "__data__": {
-          "id": "chatcmpl-381",
-          "choices": [
-            {
-              "delta": {
-                "content": "ropical",
-                "function_call": null,
-                "refusal": null,
-                "role": "assistant",
-                "tool_calls": null
-              },
-              "finish_reason": null,
-              "index": 0,
-              "logprobs": null
-            }
-          ],
-          "created": 1755228963,
-          "model": "llama3.2:3b-instruct-fp16",
-          "object": "chat.completion.chunk",
-          "service_tier": null,
-          "system_fingerprint": "fp_ollama",
-          "usage": null
-        }
-      },
-      {
-        "__type__": "openai.types.chat.chat_completion_chunk.ChatCompletionChunk",
-        "__data__": {
-          "id": "chatcmpl-381",
-          "choices": [
-            {
-              "delta": {
-                "content": " climate",
-                "function_call": null,
-                "refusal": null,
-                "role": "assistant",
-                "tool_calls": null
-              },
-              "finish_reason": null,
-              "index": 0,
-              "logprobs": null
-            }
-          ],
-          "created": 1755228963,
-          "model": "llama3.2:3b-instruct-fp16",
-          "object": "chat.completion.chunk",
-          "service_tier": null,
-          "system_fingerprint": "fp_ollama",
-          "usage": null
-        }
-      },
-      {
-        "__type__": "openai.types.chat.chat_completion_chunk.ChatCompletionChunk",
-        "__data__": {
-          "id": "chatcmpl-381",
-          "choices": [
-            {
-              "delta": {
-                "content": ",",
-                "function_call": null,
-                "refusal": null,
-                "role": "assistant",
-                "tool_calls": null
-              },
-              "finish_reason": null,
-              "index": 0,
-              "logprobs": null
-            }
-          ],
-          "created": 1755228963,
-          "model": "llama3.2:3b-instruct-fp16",
-          "object": "chat.completion.chunk",
-          "service_tier": null,
-          "system_fingerprint": "fp_ollama",
-          "usage": null
-        }
-      },
-      {
-        "__type__": "openai.types.chat.chat_completion_chunk.ChatCompletionChunk",
-        "__data__": {
-          "id": "chatcmpl-381",
-          "choices": [
-            {
-              "delta": {
-                "content": " characterized",
-                "function_call": null,
-                "refusal": null,
-                "role": "assistant",
-                "tool_calls": null
-              },
-              "finish_reason": null,
-              "index": 0,
-              "logprobs": null
-            }
-          ],
-          "created": 1755228963,
-          "model": "llama3.2:3b-instruct-fp16",
-          "object": "chat.completion.chunk",
-          "service_tier": null,
-          "system_fingerprint": "fp_ollama",
-          "usage": null
-        }
-      },
-      {
-        "__type__": "openai.types.chat.chat_completion_chunk.ChatCompletionChunk",
-        "__data__": {
-          "id": "chatcmpl-381",
-          "choices": [
-            {
-              "delta": {
-                "content": " by",
-                "function_call": null,
-                "refusal": null,
-                "role": "assistant",
-                "tool_calls": null
-              },
-              "finish_reason": null,
-              "index": 0,
-              "logprobs": null
-            }
-          ],
-          "created": 1755228963,
-          "model": "llama3.2:3b-instruct-fp16",
-          "object": "chat.completion.chunk",
-          "service_tier": null,
-          "system_fingerprint": "fp_ollama",
-          "usage": null
-        }
-      },
-      {
-        "__type__": "openai.types.chat.chat_completion_chunk.ChatCompletionChunk",
-        "__data__": {
-          "id": "chatcmpl-381",
-          "choices": [
-            {
-              "delta": {
-                "content": " hot",
-                "function_call": null,
-                "refusal": null,
-                "role": "assistant",
-                "tool_calls": null
-              },
-              "finish_reason": null,
-              "index": 0,
-              "logprobs": null
-            }
-          ],
-          "created": 1755228963,
-          "model": "llama3.2:3b-instruct-fp16",
-          "object": "chat.completion.chunk",
-          "service_tier": null,
-          "system_fingerprint": "fp_ollama",
-          "usage": null
-        }
-      },
-      {
-        "__type__": "openai.types.chat.chat_completion_chunk.ChatCompletionChunk",
-        "__data__": {
-          "id": "chatcmpl-381",
-          "choices": [
-            {
-              "delta": {
-                "content": " and",
-                "function_call": null,
-                "refusal": null,
-                "role": "assistant",
-                "tool_calls": null
-              },
-              "finish_reason": null,
-              "index": 0,
-              "logprobs": null
-            }
-          ],
-          "created": 1755228963,
-          "model": "llama3.2:3b-instruct-fp16",
-          "object": "chat.completion.chunk",
-          "service_tier": null,
-          "system_fingerprint": "fp_ollama",
-          "usage": null
-        }
-      },
-      {
-        "__type__": "openai.types.chat.chat_completion_chunk.ChatCompletionChunk",
-        "__data__": {
-          "id": "chatcmpl-381",
-          "choices": [
-            {
-              "delta": {
-                "content": " humid",
-                "function_call": null,
-                "refusal": null,
-                "role": "assistant",
-                "tool_calls": null
-              },
-              "finish_reason": null,
-              "index": 0,
-              "logprobs": null
-            }
-          ],
-          "created": 1755228963,
-          "model": "llama3.2:3b-instruct-fp16",
-          "object": "chat.completion.chunk",
-          "service_tier": null,
-          "system_fingerprint": "fp_ollama",
-          "usage": null
-        }
-      },
-      {
-        "__type__": "openai.types.chat.chat_completion_chunk.ChatCompletionChunk",
-        "__data__": {
-          "id": "chatcmpl-381",
-          "choices": [
-            {
-              "delta": {
-                "content": " summers",
-                "function_call": null,
-                "refusal": null,
-                "role": "assistant",
-                "tool_calls": null
-              },
-              "finish_reason": null,
-              "index": 0,
-              "logprobs": null
-            }
-          ],
-          "created": 1755228963,
-          "model": "llama3.2:3b-instruct-fp16",
-          "object": "chat.completion.chunk",
-          "service_tier": null,
-          "system_fingerprint": "fp_ollama",
-          "usage": null
-        }
-      },
-      {
-        "__type__": "openai.types.chat.chat_completion_chunk.ChatCompletionChunk",
-        "__data__": {
-          "id": "chatcmpl-381",
-          "choices": [
-            {
-              "delta": {
-                "content": ",",
-                "function_call": null,
-                "refusal": null,
-                "role": "assistant",
-                "tool_calls": null
-              },
-              "finish_reason": null,
-              "index": 0,
-              "logprobs": null
-            }
-          ],
-          "created": 1755228963,
-          "model": "llama3.2:3b-instruct-fp16",
-          "object": "chat.completion.chunk",
-          "service_tier": null,
-          "system_fingerprint": "fp_ollama",
-          "usage": null
-        }
-      },
-      {
-        "__type__": "openai.types.chat.chat_completion_chunk.ChatCompletionChunk",
-        "__data__": {
-          "id": "chatcmpl-381",
-          "choices": [
-            {
-              "delta": {
-                "content": " mild",
-                "function_call": null,
-                "refusal": null,
-                "role": "assistant",
-                "tool_calls": null
-              },
-              "finish_reason": null,
-              "index": 0,
-              "logprobs": null
-            }
-          ],
-          "created": 1755228963,
-          "model": "llama3.2:3b-instruct-fp16",
-          "object": "chat.completion.chunk",
-          "service_tier": null,
-          "system_fingerprint": "fp_ollama",
-          "usage": null
-        }
-      },
-      {
-        "__type__": "openai.types.chat.chat_completion_chunk.ChatCompletionChunk",
-        "__data__": {
-          "id": "chatcmpl-381",
-          "choices": [
-            {
-              "delta": {
-                "content": " winters",
-                "function_call": null,
-                "refusal": null,
-                "role": "assistant",
-                "tool_calls": null
-              },
-              "finish_reason": null,
-              "index": 0,
-              "logprobs": null
-            }
-          ],
-          "created": 1755228964,
-          "model": "llama3.2:3b-instruct-fp16",
-          "object": "chat.completion.chunk",
-          "service_tier": null,
-          "system_fingerprint": "fp_ollama",
-          "usage": null
-        }
-      },
-      {
-        "__type__": "openai.types.chat.chat_completion_chunk.ChatCompletionChunk",
-        "__data__": {
-          "id": "chatcmpl-381",
-          "choices": [
-            {
-              "delta": {
-                "content": ",",
-                "function_call": null,
-                "refusal": null,
-                "role": "assistant",
-                "tool_calls": null
-              },
-              "finish_reason": null,
-              "index": 0,
-              "logprobs": null
-            }
-          ],
-          "created": 1755228964,
-          "model": "llama3.2:3b-instruct-fp16",
-          "object": "chat.completion.chunk",
-          "service_tier": null,
-          "system_fingerprint": "fp_ollama",
-          "usage": null
-        }
-      },
-      {
-        "__type__": "openai.types.chat.chat_completion_chunk.ChatCompletionChunk",
-        "__data__": {
-          "id": "chatcmpl-381",
-          "choices": [
-            {
-              "delta": {
-                "content": " and",
-                "function_call": null,
-                "refusal": null,
-                "role": "assistant",
-                "tool_calls": null
-              },
-              "finish_reason": null,
-              "index": 0,
-              "logprobs": null
-            }
-          ],
-          "created": 1755228964,
-          "model": "llama3.2:3b-instruct-fp16",
-          "object": "chat.completion.chunk",
-          "service_tier": null,
-          "system_fingerprint": "fp_ollama",
-          "usage": null
-        }
-      },
-      {
-        "__type__": "openai.types.chat.chat_completion_chunk.ChatCompletionChunk",
-        "__data__": {
-          "id": "chatcmpl-381",
-          "choices": [
-            {
-              "delta": {
-                "content": " moderate",
-                "function_call": null,
-                "refusal": null,
-                "role": "assistant",
-                "tool_calls": null
-              },
-              "finish_reason": null,
-              "index": 0,
-              "logprobs": null
-            }
-          ],
-          "created": 1755228964,
-          "model": "llama3.2:3b-instruct-fp16",
-          "object": "chat.completion.chunk",
-          "service_tier": null,
-          "system_fingerprint": "fp_ollama",
-          "usage": null
-        }
-      },
-      {
-        "__type__": "openai.types.chat.chat_completion_chunk.ChatCompletionChunk",
-        "__data__": {
-          "id": "chatcmpl-381",
-          "choices": [
-            {
-              "delta": {
-                "content": " spring",
-                "function_call": null,
-                "refusal": null,
-                "role": "assistant",
-                "tool_calls": null
-              },
-              "finish_reason": null,
-              "index": 0,
-              "logprobs": null
-            }
-          ],
-          "created": 1755228964,
-          "model": "llama3.2:3b-instruct-fp16",
-          "object": "chat.completion.chunk",
-          "service_tier": null,
-          "system_fingerprint": "fp_ollama",
-          "usage": null
-        }
-      },
-      {
-        "__type__": "openai.types.chat.chat_completion_chunk.ChatCompletionChunk",
-        "__data__": {
-          "id": "chatcmpl-381",
-          "choices": [
-            {
-              "delta": {
-                "content": " and",
-                "function_call": null,
-                "refusal": null,
-                "role": "assistant",
-                "tool_calls": null
-              },
-              "finish_reason": null,
-              "index": 0,
-              "logprobs": null
-            }
-          ],
-          "created": 1755228964,
-          "model": "llama3.2:3b-instruct-fp16",
-          "object": "chat.completion.chunk",
-          "service_tier": null,
-          "system_fingerprint": "fp_ollama",
-          "usage": null
-        }
-      },
-      {
-        "__type__": "openai.types.chat.chat_completion_chunk.ChatCompletionChunk",
-        "__data__": {
-          "id": "chatcmpl-381",
-          "choices": [
-            {
-              "delta": {
-                "content": " autumn",
-                "function_call": null,
-                "refusal": null,
-                "role": "assistant",
-                "tool_calls": null
-              },
-              "finish_reason": null,
-              "index": 0,
-              "logprobs": null
-            }
-          ],
-          "created": 1755228964,
-          "model": "llama3.2:3b-instruct-fp16",
-          "object": "chat.completion.chunk",
-          "service_tier": null,
-          "system_fingerprint": "fp_ollama",
-          "usage": null
-        }
-      },
-      {
-        "__type__": "openai.types.chat.chat_completion_chunk.ChatCompletionChunk",
-        "__data__": {
-          "id": "chatcmpl-381",
-          "choices": [
-            {
-              "delta": {
-                "content": " seasons",
-                "function_call": null,
-                "refusal": null,
-                "role": "assistant",
-                "tool_calls": null
-              },
-              "finish_reason": null,
-              "index": 0,
-              "logprobs": null
-            }
-          ],
-          "created": 1755228964,
-          "model": "llama3.2:3b-instruct-fp16",
-          "object": "chat.completion.chunk",
-          "service_tier": null,
-          "system_fingerprint": "fp_ollama",
-          "usage": null
-        }
-      },
-      {
-        "__type__": "openai.types.chat.chat_completion_chunk.ChatCompletionChunk",
-        "__data__": {
-          "id": "chatcmpl-381",
+          "id": "chatcmpl-358",
           "choices": [
             {
               "delta": {
@@ -1677,7 +351,7 @@
               "logprobs": null
             }
           ],
-          "created": 1755228964,
+          "created": 1756921325,
           "model": "llama3.2:3b-instruct-fp16",
           "object": "chat.completion.chunk",
           "service_tier": null,
@@ -1688,11 +362,11 @@
       {
         "__type__": "openai.types.chat.chat_completion_chunk.ChatCompletionChunk",
         "__data__": {
-          "id": "chatcmpl-381",
+          "id": "chatcmpl-358",
           "choices": [
             {
               "delta": {
-                "content": " Here",
+                "content": " However",
                 "function_call": null,
                 "refusal": null,
                 "role": "assistant",
@@ -1703,7 +377,7 @@
               "logprobs": null
             }
           ],
-          "created": 1755228964,
+          "created": 1756921325,
           "model": "llama3.2:3b-instruct-fp16",
           "object": "chat.completion.chunk",
           "service_tier": null,
@@ -1714,527 +388,7 @@
       {
         "__type__": "openai.types.chat.chat_completion_chunk.ChatCompletionChunk",
         "__data__": {
-          "id": "chatcmpl-381",
-          "choices": [
-            {
-              "delta": {
-                "content": "'s",
-                "function_call": null,
-                "refusal": null,
-                "role": "assistant",
-                "tool_calls": null
-              },
-              "finish_reason": null,
-              "index": 0,
-              "logprobs": null
-            }
-          ],
-          "created": 1755228964,
-          "model": "llama3.2:3b-instruct-fp16",
-          "object": "chat.completion.chunk",
-          "service_tier": null,
-          "system_fingerprint": "fp_ollama",
-          "usage": null
-        }
-      },
-      {
-        "__type__": "openai.types.chat.chat_completion_chunk.ChatCompletionChunk",
-        "__data__": {
-          "id": "chatcmpl-381",
-          "choices": [
-            {
-              "delta": {
-                "content": " a",
-                "function_call": null,
-                "refusal": null,
-                "role": "assistant",
-                "tool_calls": null
-              },
-              "finish_reason": null,
-              "index": 0,
-              "logprobs": null
-            }
-          ],
-          "created": 1755228964,
-          "model": "llama3.2:3b-instruct-fp16",
-          "object": "chat.completion.chunk",
-          "service_tier": null,
-          "system_fingerprint": "fp_ollama",
-          "usage": null
-        }
-      },
-      {
-        "__type__": "openai.types.chat.chat_completion_chunk.ChatCompletionChunk",
-        "__data__": {
-          "id": "chatcmpl-381",
-          "choices": [
-            {
-              "delta": {
-                "content": " general",
-                "function_call": null,
-                "refusal": null,
-                "role": "assistant",
-                "tool_calls": null
-              },
-              "finish_reason": null,
-              "index": 0,
-              "logprobs": null
-            }
-          ],
-          "created": 1755228964,
-          "model": "llama3.2:3b-instruct-fp16",
-          "object": "chat.completion.chunk",
-          "service_tier": null,
-          "system_fingerprint": "fp_ollama",
-          "usage": null
-        }
-      },
-      {
-        "__type__": "openai.types.chat.chat_completion_chunk.ChatCompletionChunk",
-        "__data__": {
-          "id": "chatcmpl-381",
-          "choices": [
-            {
-              "delta": {
-                "content": " idea",
-                "function_call": null,
-                "refusal": null,
-                "role": "assistant",
-                "tool_calls": null
-              },
-              "finish_reason": null,
-              "index": 0,
-              "logprobs": null
-            }
-          ],
-          "created": 1755228964,
-          "model": "llama3.2:3b-instruct-fp16",
-          "object": "chat.completion.chunk",
-          "service_tier": null,
-          "system_fingerprint": "fp_ollama",
-          "usage": null
-        }
-      },
-      {
-        "__type__": "openai.types.chat.chat_completion_chunk.ChatCompletionChunk",
-        "__data__": {
-          "id": "chatcmpl-381",
-          "choices": [
-            {
-              "delta": {
-                "content": " of",
-                "function_call": null,
-                "refusal": null,
-                "role": "assistant",
-                "tool_calls": null
-              },
-              "finish_reason": null,
-              "index": 0,
-              "logprobs": null
-            }
-          ],
-          "created": 1755228964,
-          "model": "llama3.2:3b-instruct-fp16",
-          "object": "chat.completion.chunk",
-          "service_tier": null,
-          "system_fingerprint": "fp_ollama",
-          "usage": null
-        }
-      },
-      {
-        "__type__": "openai.types.chat.chat_completion_chunk.ChatCompletionChunk",
-        "__data__": {
-          "id": "chatcmpl-381",
-          "choices": [
-            {
-              "delta": {
-                "content": " what",
-                "function_call": null,
-                "refusal": null,
-                "role": "assistant",
-                "tool_calls": null
-              },
-              "finish_reason": null,
-              "index": 0,
-              "logprobs": null
-            }
-          ],
-          "created": 1755228964,
-          "model": "llama3.2:3b-instruct-fp16",
-          "object": "chat.completion.chunk",
-          "service_tier": null,
-          "system_fingerprint": "fp_ollama",
-          "usage": null
-        }
-      },
-      {
-        "__type__": "openai.types.chat.chat_completion_chunk.ChatCompletionChunk",
-        "__data__": {
-          "id": "chatcmpl-381",
-          "choices": [
-            {
-              "delta": {
-                "content": " you",
-                "function_call": null,
-                "refusal": null,
-                "role": "assistant",
-                "tool_calls": null
-              },
-              "finish_reason": null,
-              "index": 0,
-              "logprobs": null
-            }
-          ],
-          "created": 1755228964,
-          "model": "llama3.2:3b-instruct-fp16",
-          "object": "chat.completion.chunk",
-          "service_tier": null,
-          "system_fingerprint": "fp_ollama",
-          "usage": null
-        }
-      },
-      {
-        "__type__": "openai.types.chat.chat_completion_chunk.ChatCompletionChunk",
-        "__data__": {
-          "id": "chatcmpl-381",
-          "choices": [
-            {
-              "delta": {
-                "content": " might",
-                "function_call": null,
-                "refusal": null,
-                "role": "assistant",
-                "tool_calls": null
-              },
-              "finish_reason": null,
-              "index": 0,
-              "logprobs": null
-            }
-          ],
-          "created": 1755228964,
-          "model": "llama3.2:3b-instruct-fp16",
-          "object": "chat.completion.chunk",
-          "service_tier": null,
-          "system_fingerprint": "fp_ollama",
-          "usage": null
-        }
-      },
-      {
-        "__type__": "openai.types.chat.chat_completion_chunk.ChatCompletionChunk",
-        "__data__": {
-          "id": "chatcmpl-381",
-          "choices": [
-            {
-              "delta": {
-                "content": " expect",
-                "function_call": null,
-                "refusal": null,
-                "role": "assistant",
-                "tool_calls": null
-              },
-              "finish_reason": null,
-              "index": 0,
-              "logprobs": null
-            }
-          ],
-          "created": 1755228964,
-          "model": "llama3.2:3b-instruct-fp16",
-          "object": "chat.completion.chunk",
-          "service_tier": null,
-          "system_fingerprint": "fp_ollama",
-          "usage": null
-        }
-      },
-      {
-        "__type__": "openai.types.chat.chat_completion_chunk.ChatCompletionChunk",
-        "__data__": {
-          "id": "chatcmpl-381",
-          "choices": [
-            {
-              "delta": {
-                "content": ":\n\n",
-                "function_call": null,
-                "refusal": null,
-                "role": "assistant",
-                "tool_calls": null
-              },
-              "finish_reason": null,
-              "index": 0,
-              "logprobs": null
-            }
-          ],
-          "created": 1755228964,
-          "model": "llama3.2:3b-instruct-fp16",
-          "object": "chat.completion.chunk",
-          "service_tier": null,
-          "system_fingerprint": "fp_ollama",
-          "usage": null
-        }
-      },
-      {
-        "__type__": "openai.types.chat.chat_completion_chunk.ChatCompletionChunk",
-        "__data__": {
-          "id": "chatcmpl-381",
-          "choices": [
-            {
-              "delta": {
-                "content": "*",
-                "function_call": null,
-                "refusal": null,
-                "role": "assistant",
-                "tool_calls": null
-              },
-              "finish_reason": null,
-              "index": 0,
-              "logprobs": null
-            }
-          ],
-          "created": 1755228964,
-          "model": "llama3.2:3b-instruct-fp16",
-          "object": "chat.completion.chunk",
-          "service_tier": null,
-          "system_fingerprint": "fp_ollama",
-          "usage": null
-        }
-      },
-      {
-        "__type__": "openai.types.chat.chat_completion_chunk.ChatCompletionChunk",
-        "__data__": {
-          "id": "chatcmpl-381",
-          "choices": [
-            {
-              "delta": {
-                "content": " Summer",
-                "function_call": null,
-                "refusal": null,
-                "role": "assistant",
-                "tool_calls": null
-              },
-              "finish_reason": null,
-              "index": 0,
-              "logprobs": null
-            }
-          ],
-          "created": 1755228964,
-          "model": "llama3.2:3b-instruct-fp16",
-          "object": "chat.completion.chunk",
-          "service_tier": null,
-          "system_fingerprint": "fp_ollama",
-          "usage": null
-        }
-      },
-      {
-        "__type__": "openai.types.chat.chat_completion_chunk.ChatCompletionChunk",
-        "__data__": {
-          "id": "chatcmpl-381",
-          "choices": [
-            {
-              "delta": {
-                "content": " (",
-                "function_call": null,
-                "refusal": null,
-                "role": "assistant",
-                "tool_calls": null
-              },
-              "finish_reason": null,
-              "index": 0,
-              "logprobs": null
-            }
-          ],
-          "created": 1755228964,
-          "model": "llama3.2:3b-instruct-fp16",
-          "object": "chat.completion.chunk",
-          "service_tier": null,
-          "system_fingerprint": "fp_ollama",
-          "usage": null
-        }
-      },
-      {
-        "__type__": "openai.types.chat.chat_completion_chunk.ChatCompletionChunk",
-        "__data__": {
-          "id": "chatcmpl-381",
-          "choices": [
-            {
-              "delta": {
-                "content": "June",
-                "function_call": null,
-                "refusal": null,
-                "role": "assistant",
-                "tool_calls": null
-              },
-              "finish_reason": null,
-              "index": 0,
-              "logprobs": null
-            }
-          ],
-          "created": 1755228964,
-          "model": "llama3.2:3b-instruct-fp16",
-          "object": "chat.completion.chunk",
-          "service_tier": null,
-          "system_fingerprint": "fp_ollama",
-          "usage": null
-        }
-      },
-      {
-        "__type__": "openai.types.chat.chat_completion_chunk.ChatCompletionChunk",
-        "__data__": {
-          "id": "chatcmpl-381",
-          "choices": [
-            {
-              "delta": {
-                "content": " to",
-                "function_call": null,
-                "refusal": null,
-                "role": "assistant",
-                "tool_calls": null
-              },
-              "finish_reason": null,
-              "index": 0,
-              "logprobs": null
-            }
-          ],
-          "created": 1755228964,
-          "model": "llama3.2:3b-instruct-fp16",
-          "object": "chat.completion.chunk",
-          "service_tier": null,
-          "system_fingerprint": "fp_ollama",
-          "usage": null
-        }
-      },
-      {
-        "__type__": "openai.types.chat.chat_completion_chunk.ChatCompletionChunk",
-        "__data__": {
-          "id": "chatcmpl-381",
-          "choices": [
-            {
-              "delta": {
-                "content": " August",
-                "function_call": null,
-                "refusal": null,
-                "role": "assistant",
-                "tool_calls": null
-              },
-              "finish_reason": null,
-              "index": 0,
-              "logprobs": null
-            }
-          ],
-          "created": 1755228965,
-          "model": "llama3.2:3b-instruct-fp16",
-          "object": "chat.completion.chunk",
-          "service_tier": null,
-          "system_fingerprint": "fp_ollama",
-          "usage": null
-        }
-      },
-      {
-        "__type__": "openai.types.chat.chat_completion_chunk.ChatCompletionChunk",
-        "__data__": {
-          "id": "chatcmpl-381",
-          "choices": [
-            {
-              "delta": {
-                "content": "):",
-                "function_call": null,
-                "refusal": null,
-                "role": "assistant",
-                "tool_calls": null
-              },
-              "finish_reason": null,
-              "index": 0,
-              "logprobs": null
-            }
-          ],
-          "created": 1755228965,
-          "model": "llama3.2:3b-instruct-fp16",
-          "object": "chat.completion.chunk",
-          "service_tier": null,
-          "system_fingerprint": "fp_ollama",
-          "usage": null
-        }
-      },
-      {
-        "__type__": "openai.types.chat.chat_completion_chunk.ChatCompletionChunk",
-        "__data__": {
-          "id": "chatcmpl-381",
-          "choices": [
-            {
-              "delta": {
-                "content": " Hot",
-                "function_call": null,
-                "refusal": null,
-                "role": "assistant",
-                "tool_calls": null
-              },
-              "finish_reason": null,
-              "index": 0,
-              "logprobs": null
-            }
-          ],
-          "created": 1755228965,
-          "model": "llama3.2:3b-instruct-fp16",
-          "object": "chat.completion.chunk",
-          "service_tier": null,
-          "system_fingerprint": "fp_ollama",
-          "usage": null
-        }
-      },
-      {
-        "__type__": "openai.types.chat.chat_completion_chunk.ChatCompletionChunk",
-        "__data__": {
-          "id": "chatcmpl-381",
-          "choices": [
-            {
-              "delta": {
-                "content": " and",
-                "function_call": null,
-                "refusal": null,
-                "role": "assistant",
-                "tool_calls": null
-              },
-              "finish_reason": null,
-              "index": 0,
-              "logprobs": null
-            }
-          ],
-          "created": 1755228965,
-          "model": "llama3.2:3b-instruct-fp16",
-          "object": "chat.completion.chunk",
-          "service_tier": null,
-          "system_fingerprint": "fp_ollama",
-          "usage": null
-        }
-      },
-      {
-        "__type__": "openai.types.chat.chat_completion_chunk.ChatCompletionChunk",
-        "__data__": {
-          "id": "chatcmpl-381",
-          "choices": [
-            {
-              "delta": {
-                "content": " humid",
-                "function_call": null,
-                "refusal": null,
-                "role": "assistant",
-                "tool_calls": null
-              },
-              "finish_reason": null,
-              "index": 0,
-              "logprobs": null
-            }
-          ],
-          "created": 1755228965,
-          "model": "llama3.2:3b-instruct-fp16",
-          "object": "chat.completion.chunk",
-          "service_tier": null,
-          "system_fingerprint": "fp_ollama",
-          "usage": null
-        }
-      },
-      {
-        "__type__": "openai.types.chat.chat_completion_chunk.ChatCompletionChunk",
-        "__data__": {
-          "id": "chatcmpl-381",
+          "id": "chatcmpl-358",
           "choices": [
             {
               "delta": {
@@ -2249,7 +403,7 @@
               "logprobs": null
             }
           ],
-          "created": 1755228965,
+          "created": 1756921325,
           "model": "llama3.2:3b-instruct-fp16",
           "object": "chat.completion.chunk",
           "service_tier": null,
@@ -2260,1957 +414,7 @@
       {
         "__type__": "openai.types.chat.chat_completion_chunk.ChatCompletionChunk",
         "__data__": {
-          "id": "chatcmpl-381",
-          "choices": [
-            {
-              "delta": {
-                "content": " with",
-                "function_call": null,
-                "refusal": null,
-                "role": "assistant",
-                "tool_calls": null
-              },
-              "finish_reason": null,
-              "index": 0,
-              "logprobs": null
-            }
-          ],
-          "created": 1755228965,
-          "model": "llama3.2:3b-instruct-fp16",
-          "object": "chat.completion.chunk",
-          "service_tier": null,
-          "system_fingerprint": "fp_ollama",
-          "usage": null
-        }
-      },
-      {
-        "__type__": "openai.types.chat.chat_completion_chunk.ChatCompletionChunk",
-        "__data__": {
-          "id": "chatcmpl-381",
-          "choices": [
-            {
-              "delta": {
-                "content": " temperatures",
-                "function_call": null,
-                "refusal": null,
-                "role": "assistant",
-                "tool_calls": null
-              },
-              "finish_reason": null,
-              "index": 0,
-              "logprobs": null
-            }
-          ],
-          "created": 1755228965,
-          "model": "llama3.2:3b-instruct-fp16",
-          "object": "chat.completion.chunk",
-          "service_tier": null,
-          "system_fingerprint": "fp_ollama",
-          "usage": null
-        }
-      },
-      {
-        "__type__": "openai.types.chat.chat_completion_chunk.ChatCompletionChunk",
-        "__data__": {
-          "id": "chatcmpl-381",
-          "choices": [
-            {
-              "delta": {
-                "content": " often",
-                "function_call": null,
-                "refusal": null,
-                "role": "assistant",
-                "tool_calls": null
-              },
-              "finish_reason": null,
-              "index": 0,
-              "logprobs": null
-            }
-          ],
-          "created": 1755228965,
-          "model": "llama3.2:3b-instruct-fp16",
-          "object": "chat.completion.chunk",
-          "service_tier": null,
-          "system_fingerprint": "fp_ollama",
-          "usage": null
-        }
-      },
-      {
-        "__type__": "openai.types.chat.chat_completion_chunk.ChatCompletionChunk",
-        "__data__": {
-          "id": "chatcmpl-381",
-          "choices": [
-            {
-              "delta": {
-                "content": " reaching",
-                "function_call": null,
-                "refusal": null,
-                "role": "assistant",
-                "tool_calls": null
-              },
-              "finish_reason": null,
-              "index": 0,
-              "logprobs": null
-            }
-          ],
-          "created": 1755228965,
-          "model": "llama3.2:3b-instruct-fp16",
-          "object": "chat.completion.chunk",
-          "service_tier": null,
-          "system_fingerprint": "fp_ollama",
-          "usage": null
-        }
-      },
-      {
-        "__type__": "openai.types.chat.chat_completion_chunk.ChatCompletionChunk",
-        "__data__": {
-          "id": "chatcmpl-381",
-          "choices": [
-            {
-              "delta": {
-                "content": " ",
-                "function_call": null,
-                "refusal": null,
-                "role": "assistant",
-                "tool_calls": null
-              },
-              "finish_reason": null,
-              "index": 0,
-              "logprobs": null
-            }
-          ],
-          "created": 1755228965,
-          "model": "llama3.2:3b-instruct-fp16",
-          "object": "chat.completion.chunk",
-          "service_tier": null,
-          "system_fingerprint": "fp_ollama",
-          "usage": null
-        }
-      },
-      {
-        "__type__": "openai.types.chat.chat_completion_chunk.ChatCompletionChunk",
-        "__data__": {
-          "id": "chatcmpl-381",
-          "choices": [
-            {
-              "delta": {
-                "content": "30",
-                "function_call": null,
-                "refusal": null,
-                "role": "assistant",
-                "tool_calls": null
-              },
-              "finish_reason": null,
-              "index": 0,
-              "logprobs": null
-            }
-          ],
-          "created": 1755228965,
-          "model": "llama3.2:3b-instruct-fp16",
-          "object": "chat.completion.chunk",
-          "service_tier": null,
-          "system_fingerprint": "fp_ollama",
-          "usage": null
-        }
-      },
-      {
-        "__type__": "openai.types.chat.chat_completion_chunk.ChatCompletionChunk",
-        "__data__": {
-          "id": "chatcmpl-381",
-          "choices": [
-            {
-              "delta": {
-                "content": "\u00b0C",
-                "function_call": null,
-                "refusal": null,
-                "role": "assistant",
-                "tool_calls": null
-              },
-              "finish_reason": null,
-              "index": 0,
-              "logprobs": null
-            }
-          ],
-          "created": 1755228965,
-          "model": "llama3.2:3b-instruct-fp16",
-          "object": "chat.completion.chunk",
-          "service_tier": null,
-          "system_fingerprint": "fp_ollama",
-          "usage": null
-        }
-      },
-      {
-        "__type__": "openai.types.chat.chat_completion_chunk.ChatCompletionChunk",
-        "__data__": {
-          "id": "chatcmpl-381",
-          "choices": [
-            {
-              "delta": {
-                "content": " (",
-                "function_call": null,
-                "refusal": null,
-                "role": "assistant",
-                "tool_calls": null
-              },
-              "finish_reason": null,
-              "index": 0,
-              "logprobs": null
-            }
-          ],
-          "created": 1755228965,
-          "model": "llama3.2:3b-instruct-fp16",
-          "object": "chat.completion.chunk",
-          "service_tier": null,
-          "system_fingerprint": "fp_ollama",
-          "usage": null
-        }
-      },
-      {
-        "__type__": "openai.types.chat.chat_completion_chunk.ChatCompletionChunk",
-        "__data__": {
-          "id": "chatcmpl-381",
-          "choices": [
-            {
-              "delta": {
-                "content": "86",
-                "function_call": null,
-                "refusal": null,
-                "role": "assistant",
-                "tool_calls": null
-              },
-              "finish_reason": null,
-              "index": 0,
-              "logprobs": null
-            }
-          ],
-          "created": 1755228965,
-          "model": "llama3.2:3b-instruct-fp16",
-          "object": "chat.completion.chunk",
-          "service_tier": null,
-          "system_fingerprint": "fp_ollama",
-          "usage": null
-        }
-      },
-      {
-        "__type__": "openai.types.chat.chat_completion_chunk.ChatCompletionChunk",
-        "__data__": {
-          "id": "chatcmpl-381",
-          "choices": [
-            {
-              "delta": {
-                "content": "\u00b0F",
-                "function_call": null,
-                "refusal": null,
-                "role": "assistant",
-                "tool_calls": null
-              },
-              "finish_reason": null,
-              "index": 0,
-              "logprobs": null
-            }
-          ],
-          "created": 1755228965,
-          "model": "llama3.2:3b-instruct-fp16",
-          "object": "chat.completion.chunk",
-          "service_tier": null,
-          "system_fingerprint": "fp_ollama",
-          "usage": null
-        }
-      },
-      {
-        "__type__": "openai.types.chat.chat_completion_chunk.ChatCompletionChunk",
-        "__data__": {
-          "id": "chatcmpl-381",
-          "choices": [
-            {
-              "delta": {
-                "content": ")",
-                "function_call": null,
-                "refusal": null,
-                "role": "assistant",
-                "tool_calls": null
-              },
-              "finish_reason": null,
-              "index": 0,
-              "logprobs": null
-            }
-          ],
-          "created": 1755228965,
-          "model": "llama3.2:3b-instruct-fp16",
-          "object": "chat.completion.chunk",
-          "service_tier": null,
-          "system_fingerprint": "fp_ollama",
-          "usage": null
-        }
-      },
-      {
-        "__type__": "openai.types.chat.chat_completion_chunk.ChatCompletionChunk",
-        "__data__": {
-          "id": "chatcmpl-381",
-          "choices": [
-            {
-              "delta": {
-                "content": " or",
-                "function_call": null,
-                "refusal": null,
-                "role": "assistant",
-                "tool_calls": null
-              },
-              "finish_reason": null,
-              "index": 0,
-              "logprobs": null
-            }
-          ],
-          "created": 1755228965,
-          "model": "llama3.2:3b-instruct-fp16",
-          "object": "chat.completion.chunk",
-          "service_tier": null,
-          "system_fingerprint": "fp_ollama",
-          "usage": null
-        }
-      },
-      {
-        "__type__": "openai.types.chat.chat_completion_chunk.ChatCompletionChunk",
-        "__data__": {
-          "id": "chatcmpl-381",
-          "choices": [
-            {
-              "delta": {
-                "content": " higher",
-                "function_call": null,
-                "refusal": null,
-                "role": "assistant",
-                "tool_calls": null
-              },
-              "finish_reason": null,
-              "index": 0,
-              "logprobs": null
-            }
-          ],
-          "created": 1755228965,
-          "model": "llama3.2:3b-instruct-fp16",
-          "object": "chat.completion.chunk",
-          "service_tier": null,
-          "system_fingerprint": "fp_ollama",
-          "usage": null
-        }
-      },
-      {
-        "__type__": "openai.types.chat.chat_completion_chunk.ChatCompletionChunk",
-        "__data__": {
-          "id": "chatcmpl-381",
-          "choices": [
-            {
-              "delta": {
-                "content": ".\n",
-                "function_call": null,
-                "refusal": null,
-                "role": "assistant",
-                "tool_calls": null
-              },
-              "finish_reason": null,
-              "index": 0,
-              "logprobs": null
-            }
-          ],
-          "created": 1755228965,
-          "model": "llama3.2:3b-instruct-fp16",
-          "object": "chat.completion.chunk",
-          "service_tier": null,
-          "system_fingerprint": "fp_ollama",
-          "usage": null
-        }
-      },
-      {
-        "__type__": "openai.types.chat.chat_completion_chunk.ChatCompletionChunk",
-        "__data__": {
-          "id": "chatcmpl-381",
-          "choices": [
-            {
-              "delta": {
-                "content": "*",
-                "function_call": null,
-                "refusal": null,
-                "role": "assistant",
-                "tool_calls": null
-              },
-              "finish_reason": null,
-              "index": 0,
-              "logprobs": null
-            }
-          ],
-          "created": 1755228965,
-          "model": "llama3.2:3b-instruct-fp16",
-          "object": "chat.completion.chunk",
-          "service_tier": null,
-          "system_fingerprint": "fp_ollama",
-          "usage": null
-        }
-      },
-      {
-        "__type__": "openai.types.chat.chat_completion_chunk.ChatCompletionChunk",
-        "__data__": {
-          "id": "chatcmpl-381",
-          "choices": [
-            {
-              "delta": {
-                "content": " Autumn",
-                "function_call": null,
-                "refusal": null,
-                "role": "assistant",
-                "tool_calls": null
-              },
-              "finish_reason": null,
-              "index": 0,
-              "logprobs": null
-            }
-          ],
-          "created": 1755228965,
-          "model": "llama3.2:3b-instruct-fp16",
-          "object": "chat.completion.chunk",
-          "service_tier": null,
-          "system_fingerprint": "fp_ollama",
-          "usage": null
-        }
-      },
-      {
-        "__type__": "openai.types.chat.chat_completion_chunk.ChatCompletionChunk",
-        "__data__": {
-          "id": "chatcmpl-381",
-          "choices": [
-            {
-              "delta": {
-                "content": " (",
-                "function_call": null,
-                "refusal": null,
-                "role": "assistant",
-                "tool_calls": null
-              },
-              "finish_reason": null,
-              "index": 0,
-              "logprobs": null
-            }
-          ],
-          "created": 1755228965,
-          "model": "llama3.2:3b-instruct-fp16",
-          "object": "chat.completion.chunk",
-          "service_tier": null,
-          "system_fingerprint": "fp_ollama",
-          "usage": null
-        }
-      },
-      {
-        "__type__": "openai.types.chat.chat_completion_chunk.ChatCompletionChunk",
-        "__data__": {
-          "id": "chatcmpl-381",
-          "choices": [
-            {
-              "delta": {
-                "content": "September",
-                "function_call": null,
-                "refusal": null,
-                "role": "assistant",
-                "tool_calls": null
-              },
-              "finish_reason": null,
-              "index": 0,
-              "logprobs": null
-            }
-          ],
-          "created": 1755228965,
-          "model": "llama3.2:3b-instruct-fp16",
-          "object": "chat.completion.chunk",
-          "service_tier": null,
-          "system_fingerprint": "fp_ollama",
-          "usage": null
-        }
-      },
-      {
-        "__type__": "openai.types.chat.chat_completion_chunk.ChatCompletionChunk",
-        "__data__": {
-          "id": "chatcmpl-381",
-          "choices": [
-            {
-              "delta": {
-                "content": " to",
-                "function_call": null,
-                "refusal": null,
-                "role": "assistant",
-                "tool_calls": null
-              },
-              "finish_reason": null,
-              "index": 0,
-              "logprobs": null
-            }
-          ],
-          "created": 1755228966,
-          "model": "llama3.2:3b-instruct-fp16",
-          "object": "chat.completion.chunk",
-          "service_tier": null,
-          "system_fingerprint": "fp_ollama",
-          "usage": null
-        }
-      },
-      {
-        "__type__": "openai.types.chat.chat_completion_chunk.ChatCompletionChunk",
-        "__data__": {
-          "id": "chatcmpl-381",
-          "choices": [
-            {
-              "delta": {
-                "content": " November",
-                "function_call": null,
-                "refusal": null,
-                "role": "assistant",
-                "tool_calls": null
-              },
-              "finish_reason": null,
-              "index": 0,
-              "logprobs": null
-            }
-          ],
-          "created": 1755228966,
-          "model": "llama3.2:3b-instruct-fp16",
-          "object": "chat.completion.chunk",
-          "service_tier": null,
-          "system_fingerprint": "fp_ollama",
-          "usage": null
-        }
-      },
-      {
-        "__type__": "openai.types.chat.chat_completion_chunk.ChatCompletionChunk",
-        "__data__": {
-          "id": "chatcmpl-381",
-          "choices": [
-            {
-              "delta": {
-                "content": "):",
-                "function_call": null,
-                "refusal": null,
-                "role": "assistant",
-                "tool_calls": null
-              },
-              "finish_reason": null,
-              "index": 0,
-              "logprobs": null
-            }
-          ],
-          "created": 1755228966,
-          "model": "llama3.2:3b-instruct-fp16",
-          "object": "chat.completion.chunk",
-          "service_tier": null,
-          "system_fingerprint": "fp_ollama",
-          "usage": null
-        }
-      },
-      {
-        "__type__": "openai.types.chat.chat_completion_chunk.ChatCompletionChunk",
-        "__data__": {
-          "id": "chatcmpl-381",
-          "choices": [
-            {
-              "delta": {
-                "content": " Mild",
-                "function_call": null,
-                "refusal": null,
-                "role": "assistant",
-                "tool_calls": null
-              },
-              "finish_reason": null,
-              "index": 0,
-              "logprobs": null
-            }
-          ],
-          "created": 1755228966,
-          "model": "llama3.2:3b-instruct-fp16",
-          "object": "chat.completion.chunk",
-          "service_tier": null,
-          "system_fingerprint": "fp_ollama",
-          "usage": null
-        }
-      },
-      {
-        "__type__": "openai.types.chat.chat_completion_chunk.ChatCompletionChunk",
-        "__data__": {
-          "id": "chatcmpl-381",
-          "choices": [
-            {
-              "delta": {
-                "content": ",",
-                "function_call": null,
-                "refusal": null,
-                "role": "assistant",
-                "tool_calls": null
-              },
-              "finish_reason": null,
-              "index": 0,
-              "logprobs": null
-            }
-          ],
-          "created": 1755228966,
-          "model": "llama3.2:3b-instruct-fp16",
-          "object": "chat.completion.chunk",
-          "service_tier": null,
-          "system_fingerprint": "fp_ollama",
-          "usage": null
-        }
-      },
-      {
-        "__type__": "openai.types.chat.chat_completion_chunk.ChatCompletionChunk",
-        "__data__": {
-          "id": "chatcmpl-381",
-          "choices": [
-            {
-              "delta": {
-                "content": " with",
-                "function_call": null,
-                "refusal": null,
-                "role": "assistant",
-                "tool_calls": null
-              },
-              "finish_reason": null,
-              "index": 0,
-              "logprobs": null
-            }
-          ],
-          "created": 1755228966,
-          "model": "llama3.2:3b-instruct-fp16",
-          "object": "chat.completion.chunk",
-          "service_tier": null,
-          "system_fingerprint": "fp_ollama",
-          "usage": null
-        }
-      },
-      {
-        "__type__": "openai.types.chat.chat_completion_chunk.ChatCompletionChunk",
-        "__data__": {
-          "id": "chatcmpl-381",
-          "choices": [
-            {
-              "delta": {
-                "content": " temperatures",
-                "function_call": null,
-                "refusal": null,
-                "role": "assistant",
-                "tool_calls": null
-              },
-              "finish_reason": null,
-              "index": 0,
-              "logprobs": null
-            }
-          ],
-          "created": 1755228966,
-          "model": "llama3.2:3b-instruct-fp16",
-          "object": "chat.completion.chunk",
-          "service_tier": null,
-          "system_fingerprint": "fp_ollama",
-          "usage": null
-        }
-      },
-      {
-        "__type__": "openai.types.chat.chat_completion_chunk.ChatCompletionChunk",
-        "__data__": {
-          "id": "chatcmpl-381",
-          "choices": [
-            {
-              "delta": {
-                "content": " ranging",
-                "function_call": null,
-                "refusal": null,
-                "role": "assistant",
-                "tool_calls": null
-              },
-              "finish_reason": null,
-              "index": 0,
-              "logprobs": null
-            }
-          ],
-          "created": 1755228966,
-          "model": "llama3.2:3b-instruct-fp16",
-          "object": "chat.completion.chunk",
-          "service_tier": null,
-          "system_fingerprint": "fp_ollama",
-          "usage": null
-        }
-      },
-      {
-        "__type__": "openai.types.chat.chat_completion_chunk.ChatCompletionChunk",
-        "__data__": {
-          "id": "chatcmpl-381",
-          "choices": [
-            {
-              "delta": {
-                "content": " from",
-                "function_call": null,
-                "refusal": null,
-                "role": "assistant",
-                "tool_calls": null
-              },
-              "finish_reason": null,
-              "index": 0,
-              "logprobs": null
-            }
-          ],
-          "created": 1755228966,
-          "model": "llama3.2:3b-instruct-fp16",
-          "object": "chat.completion.chunk",
-          "service_tier": null,
-          "system_fingerprint": "fp_ollama",
-          "usage": null
-        }
-      },
-      {
-        "__type__": "openai.types.chat.chat_completion_chunk.ChatCompletionChunk",
-        "__data__": {
-          "id": "chatcmpl-381",
-          "choices": [
-            {
-              "delta": {
-                "content": " ",
-                "function_call": null,
-                "refusal": null,
-                "role": "assistant",
-                "tool_calls": null
-              },
-              "finish_reason": null,
-              "index": 0,
-              "logprobs": null
-            }
-          ],
-          "created": 1755228966,
-          "model": "llama3.2:3b-instruct-fp16",
-          "object": "chat.completion.chunk",
-          "service_tier": null,
-          "system_fingerprint": "fp_ollama",
-          "usage": null
-        }
-      },
-      {
-        "__type__": "openai.types.chat.chat_completion_chunk.ChatCompletionChunk",
-        "__data__": {
-          "id": "chatcmpl-381",
-          "choices": [
-            {
-              "delta": {
-                "content": "10",
-                "function_call": null,
-                "refusal": null,
-                "role": "assistant",
-                "tool_calls": null
-              },
-              "finish_reason": null,
-              "index": 0,
-              "logprobs": null
-            }
-          ],
-          "created": 1755228966,
-          "model": "llama3.2:3b-instruct-fp16",
-          "object": "chat.completion.chunk",
-          "service_tier": null,
-          "system_fingerprint": "fp_ollama",
-          "usage": null
-        }
-      },
-      {
-        "__type__": "openai.types.chat.chat_completion_chunk.ChatCompletionChunk",
-        "__data__": {
-          "id": "chatcmpl-381",
-          "choices": [
-            {
-              "delta": {
-                "content": "\u00b0C",
-                "function_call": null,
-                "refusal": null,
-                "role": "assistant",
-                "tool_calls": null
-              },
-              "finish_reason": null,
-              "index": 0,
-              "logprobs": null
-            }
-          ],
-          "created": 1755228966,
-          "model": "llama3.2:3b-instruct-fp16",
-          "object": "chat.completion.chunk",
-          "service_tier": null,
-          "system_fingerprint": "fp_ollama",
-          "usage": null
-        }
-      },
-      {
-        "__type__": "openai.types.chat.chat_completion_chunk.ChatCompletionChunk",
-        "__data__": {
-          "id": "chatcmpl-381",
-          "choices": [
-            {
-              "delta": {
-                "content": " (",
-                "function_call": null,
-                "refusal": null,
-                "role": "assistant",
-                "tool_calls": null
-              },
-              "finish_reason": null,
-              "index": 0,
-              "logprobs": null
-            }
-          ],
-          "created": 1755228966,
-          "model": "llama3.2:3b-instruct-fp16",
-          "object": "chat.completion.chunk",
-          "service_tier": null,
-          "system_fingerprint": "fp_ollama",
-          "usage": null
-        }
-      },
-      {
-        "__type__": "openai.types.chat.chat_completion_chunk.ChatCompletionChunk",
-        "__data__": {
-          "id": "chatcmpl-381",
-          "choices": [
-            {
-              "delta": {
-                "content": "50",
-                "function_call": null,
-                "refusal": null,
-                "role": "assistant",
-                "tool_calls": null
-              },
-              "finish_reason": null,
-              "index": 0,
-              "logprobs": null
-            }
-          ],
-          "created": 1755228966,
-          "model": "llama3.2:3b-instruct-fp16",
-          "object": "chat.completion.chunk",
-          "service_tier": null,
-          "system_fingerprint": "fp_ollama",
-          "usage": null
-        }
-      },
-      {
-        "__type__": "openai.types.chat.chat_completion_chunk.ChatCompletionChunk",
-        "__data__": {
-          "id": "chatcmpl-381",
-          "choices": [
-            {
-              "delta": {
-                "content": "\u00b0F",
-                "function_call": null,
-                "refusal": null,
-                "role": "assistant",
-                "tool_calls": null
-              },
-              "finish_reason": null,
-              "index": 0,
-              "logprobs": null
-            }
-          ],
-          "created": 1755228966,
-          "model": "llama3.2:3b-instruct-fp16",
-          "object": "chat.completion.chunk",
-          "service_tier": null,
-          "system_fingerprint": "fp_ollama",
-          "usage": null
-        }
-      },
-      {
-        "__type__": "openai.types.chat.chat_completion_chunk.ChatCompletionChunk",
-        "__data__": {
-          "id": "chatcmpl-381",
-          "choices": [
-            {
-              "delta": {
-                "content": ")",
-                "function_call": null,
-                "refusal": null,
-                "role": "assistant",
-                "tool_calls": null
-              },
-              "finish_reason": null,
-              "index": 0,
-              "logprobs": null
-            }
-          ],
-          "created": 1755228966,
-          "model": "llama3.2:3b-instruct-fp16",
-          "object": "chat.completion.chunk",
-          "service_tier": null,
-          "system_fingerprint": "fp_ollama",
-          "usage": null
-        }
-      },
-      {
-        "__type__": "openai.types.chat.chat_completion_chunk.ChatCompletionChunk",
-        "__data__": {
-          "id": "chatcmpl-381",
-          "choices": [
-            {
-              "delta": {
-                "content": " to",
-                "function_call": null,
-                "refusal": null,
-                "role": "assistant",
-                "tool_calls": null
-              },
-              "finish_reason": null,
-              "index": 0,
-              "logprobs": null
-            }
-          ],
-          "created": 1755228966,
-          "model": "llama3.2:3b-instruct-fp16",
-          "object": "chat.completion.chunk",
-          "service_tier": null,
-          "system_fingerprint": "fp_ollama",
-          "usage": null
-        }
-      },
-      {
-        "__type__": "openai.types.chat.chat_completion_chunk.ChatCompletionChunk",
-        "__data__": {
-          "id": "chatcmpl-381",
-          "choices": [
-            {
-              "delta": {
-                "content": " ",
-                "function_call": null,
-                "refusal": null,
-                "role": "assistant",
-                "tool_calls": null
-              },
-              "finish_reason": null,
-              "index": 0,
-              "logprobs": null
-            }
-          ],
-          "created": 1755228966,
-          "model": "llama3.2:3b-instruct-fp16",
-          "object": "chat.completion.chunk",
-          "service_tier": null,
-          "system_fingerprint": "fp_ollama",
-          "usage": null
-        }
-      },
-      {
-        "__type__": "openai.types.chat.chat_completion_chunk.ChatCompletionChunk",
-        "__data__": {
-          "id": "chatcmpl-381",
-          "choices": [
-            {
-              "delta": {
-                "content": "20",
-                "function_call": null,
-                "refusal": null,
-                "role": "assistant",
-                "tool_calls": null
-              },
-              "finish_reason": null,
-              "index": 0,
-              "logprobs": null
-            }
-          ],
-          "created": 1755228966,
-          "model": "llama3.2:3b-instruct-fp16",
-          "object": "chat.completion.chunk",
-          "service_tier": null,
-          "system_fingerprint": "fp_ollama",
-          "usage": null
-        }
-      },
-      {
-        "__type__": "openai.types.chat.chat_completion_chunk.ChatCompletionChunk",
-        "__data__": {
-          "id": "chatcmpl-381",
-          "choices": [
-            {
-              "delta": {
-                "content": "\u00b0C",
-                "function_call": null,
-                "refusal": null,
-                "role": "assistant",
-                "tool_calls": null
-              },
-              "finish_reason": null,
-              "index": 0,
-              "logprobs": null
-            }
-          ],
-          "created": 1755228966,
-          "model": "llama3.2:3b-instruct-fp16",
-          "object": "chat.completion.chunk",
-          "service_tier": null,
-          "system_fingerprint": "fp_ollama",
-          "usage": null
-        }
-      },
-      {
-        "__type__": "openai.types.chat.chat_completion_chunk.ChatCompletionChunk",
-        "__data__": {
-          "id": "chatcmpl-381",
-          "choices": [
-            {
-              "delta": {
-                "content": " (",
-                "function_call": null,
-                "refusal": null,
-                "role": "assistant",
-                "tool_calls": null
-              },
-              "finish_reason": null,
-              "index": 0,
-              "logprobs": null
-            }
-          ],
-          "created": 1755228966,
-          "model": "llama3.2:3b-instruct-fp16",
-          "object": "chat.completion.chunk",
-          "service_tier": null,
-          "system_fingerprint": "fp_ollama",
-          "usage": null
-        }
-      },
-      {
-        "__type__": "openai.types.chat.chat_completion_chunk.ChatCompletionChunk",
-        "__data__": {
-          "id": "chatcmpl-381",
-          "choices": [
-            {
-              "delta": {
-                "content": "68",
-                "function_call": null,
-                "refusal": null,
-                "role": "assistant",
-                "tool_calls": null
-              },
-              "finish_reason": null,
-              "index": 0,
-              "logprobs": null
-            }
-          ],
-          "created": 1755228966,
-          "model": "llama3.2:3b-instruct-fp16",
-          "object": "chat.completion.chunk",
-          "service_tier": null,
-          "system_fingerprint": "fp_ollama",
-          "usage": null
-        }
-      },
-      {
-        "__type__": "openai.types.chat.chat_completion_chunk.ChatCompletionChunk",
-        "__data__": {
-          "id": "chatcmpl-381",
-          "choices": [
-            {
-              "delta": {
-                "content": "\u00b0F",
-                "function_call": null,
-                "refusal": null,
-                "role": "assistant",
-                "tool_calls": null
-              },
-              "finish_reason": null,
-              "index": 0,
-              "logprobs": null
-            }
-          ],
-          "created": 1755228966,
-          "model": "llama3.2:3b-instruct-fp16",
-          "object": "chat.completion.chunk",
-          "service_tier": null,
-          "system_fingerprint": "fp_ollama",
-          "usage": null
-        }
-      },
-      {
-        "__type__": "openai.types.chat.chat_completion_chunk.ChatCompletionChunk",
-        "__data__": {
-          "id": "chatcmpl-381",
-          "choices": [
-            {
-              "delta": {
-                "content": ").\n",
-                "function_call": null,
-                "refusal": null,
-                "role": "assistant",
-                "tool_calls": null
-              },
-              "finish_reason": null,
-              "index": 0,
-              "logprobs": null
-            }
-          ],
-          "created": 1755228966,
-          "model": "llama3.2:3b-instruct-fp16",
-          "object": "chat.completion.chunk",
-          "service_tier": null,
-          "system_fingerprint": "fp_ollama",
-          "usage": null
-        }
-      },
-      {
-        "__type__": "openai.types.chat.chat_completion_chunk.ChatCompletionChunk",
-        "__data__": {
-          "id": "chatcmpl-381",
-          "choices": [
-            {
-              "delta": {
-                "content": "*",
-                "function_call": null,
-                "refusal": null,
-                "role": "assistant",
-                "tool_calls": null
-              },
-              "finish_reason": null,
-              "index": 0,
-              "logprobs": null
-            }
-          ],
-          "created": 1755228967,
-          "model": "llama3.2:3b-instruct-fp16",
-          "object": "chat.completion.chunk",
-          "service_tier": null,
-          "system_fingerprint": "fp_ollama",
-          "usage": null
-        }
-      },
-      {
-        "__type__": "openai.types.chat.chat_completion_chunk.ChatCompletionChunk",
-        "__data__": {
-          "id": "chatcmpl-381",
-          "choices": [
-            {
-              "delta": {
-                "content": " Spring",
-                "function_call": null,
-                "refusal": null,
-                "role": "assistant",
-                "tool_calls": null
-              },
-              "finish_reason": null,
-              "index": 0,
-              "logprobs": null
-            }
-          ],
-          "created": 1755228967,
-          "model": "llama3.2:3b-instruct-fp16",
-          "object": "chat.completion.chunk",
-          "service_tier": null,
-          "system_fingerprint": "fp_ollama",
-          "usage": null
-        }
-      },
-      {
-        "__type__": "openai.types.chat.chat_completion_chunk.ChatCompletionChunk",
-        "__data__": {
-          "id": "chatcmpl-381",
-          "choices": [
-            {
-              "delta": {
-                "content": " (",
-                "function_call": null,
-                "refusal": null,
-                "role": "assistant",
-                "tool_calls": null
-              },
-              "finish_reason": null,
-              "index": 0,
-              "logprobs": null
-            }
-          ],
-          "created": 1755228967,
-          "model": "llama3.2:3b-instruct-fp16",
-          "object": "chat.completion.chunk",
-          "service_tier": null,
-          "system_fingerprint": "fp_ollama",
-          "usage": null
-        }
-      },
-      {
-        "__type__": "openai.types.chat.chat_completion_chunk.ChatCompletionChunk",
-        "__data__": {
-          "id": "chatcmpl-381",
-          "choices": [
-            {
-              "delta": {
-                "content": "March",
-                "function_call": null,
-                "refusal": null,
-                "role": "assistant",
-                "tool_calls": null
-              },
-              "finish_reason": null,
-              "index": 0,
-              "logprobs": null
-            }
-          ],
-          "created": 1755228967,
-          "model": "llama3.2:3b-instruct-fp16",
-          "object": "chat.completion.chunk",
-          "service_tier": null,
-          "system_fingerprint": "fp_ollama",
-          "usage": null
-        }
-      },
-      {
-        "__type__": "openai.types.chat.chat_completion_chunk.ChatCompletionChunk",
-        "__data__": {
-          "id": "chatcmpl-381",
-          "choices": [
-            {
-              "delta": {
-                "content": " to",
-                "function_call": null,
-                "refusal": null,
-                "role": "assistant",
-                "tool_calls": null
-              },
-              "finish_reason": null,
-              "index": 0,
-              "logprobs": null
-            }
-          ],
-          "created": 1755228967,
-          "model": "llama3.2:3b-instruct-fp16",
-          "object": "chat.completion.chunk",
-          "service_tier": null,
-          "system_fingerprint": "fp_ollama",
-          "usage": null
-        }
-      },
-      {
-        "__type__": "openai.types.chat.chat_completion_chunk.ChatCompletionChunk",
-        "__data__": {
-          "id": "chatcmpl-381",
-          "choices": [
-            {
-              "delta": {
-                "content": " May",
-                "function_call": null,
-                "refusal": null,
-                "role": "assistant",
-                "tool_calls": null
-              },
-              "finish_reason": null,
-              "index": 0,
-              "logprobs": null
-            }
-          ],
-          "created": 1755228967,
-          "model": "llama3.2:3b-instruct-fp16",
-          "object": "chat.completion.chunk",
-          "service_tier": null,
-          "system_fingerprint": "fp_ollama",
-          "usage": null
-        }
-      },
-      {
-        "__type__": "openai.types.chat.chat_completion_chunk.ChatCompletionChunk",
-        "__data__": {
-          "id": "chatcmpl-381",
-          "choices": [
-            {
-              "delta": {
-                "content": ")",
-                "function_call": null,
-                "refusal": null,
-                "role": "assistant",
-                "tool_calls": null
-              },
-              "finish_reason": null,
-              "index": 0,
-              "logprobs": null
-            }
-          ],
-          "created": 1755228967,
-          "model": "llama3.2:3b-instruct-fp16",
-          "object": "chat.completion.chunk",
-          "service_tier": null,
-          "system_fingerprint": "fp_ollama",
-          "usage": null
-        }
-      },
-      {
-        "__type__": "openai.types.chat.chat_completion_chunk.ChatCompletionChunk",
-        "__data__": {
-          "id": "chatcmpl-381",
-          "choices": [
-            {
-              "delta": {
-                "content": " and",
-                "function_call": null,
-                "refusal": null,
-                "role": "assistant",
-                "tool_calls": null
-              },
-              "finish_reason": null,
-              "index": 0,
-              "logprobs": null
-            }
-          ],
-          "created": 1755228967,
-          "model": "llama3.2:3b-instruct-fp16",
-          "object": "chat.completion.chunk",
-          "service_tier": null,
-          "system_fingerprint": "fp_ollama",
-          "usage": null
-        }
-      },
-      {
-        "__type__": "openai.types.chat.chat_completion_chunk.ChatCompletionChunk",
-        "__data__": {
-          "id": "chatcmpl-381",
-          "choices": [
-            {
-              "delta": {
-                "content": " Winter",
-                "function_call": null,
-                "refusal": null,
-                "role": "assistant",
-                "tool_calls": null
-              },
-              "finish_reason": null,
-              "index": 0,
-              "logprobs": null
-            }
-          ],
-          "created": 1755228967,
-          "model": "llama3.2:3b-instruct-fp16",
-          "object": "chat.completion.chunk",
-          "service_tier": null,
-          "system_fingerprint": "fp_ollama",
-          "usage": null
-        }
-      },
-      {
-        "__type__": "openai.types.chat.chat_completion_chunk.ChatCompletionChunk",
-        "__data__": {
-          "id": "chatcmpl-381",
-          "choices": [
-            {
-              "delta": {
-                "content": " (",
-                "function_call": null,
-                "refusal": null,
-                "role": "assistant",
-                "tool_calls": null
-              },
-              "finish_reason": null,
-              "index": 0,
-              "logprobs": null
-            }
-          ],
-          "created": 1755228967,
-          "model": "llama3.2:3b-instruct-fp16",
-          "object": "chat.completion.chunk",
-          "service_tier": null,
-          "system_fingerprint": "fp_ollama",
-          "usage": null
-        }
-      },
-      {
-        "__type__": "openai.types.chat.chat_completion_chunk.ChatCompletionChunk",
-        "__data__": {
-          "id": "chatcmpl-381",
-          "choices": [
-            {
-              "delta": {
-                "content": "December",
-                "function_call": null,
-                "refusal": null,
-                "role": "assistant",
-                "tool_calls": null
-              },
-              "finish_reason": null,
-              "index": 0,
-              "logprobs": null
-            }
-          ],
-          "created": 1755228967,
-          "model": "llama3.2:3b-instruct-fp16",
-          "object": "chat.completion.chunk",
-          "service_tier": null,
-          "system_fingerprint": "fp_ollama",
-          "usage": null
-        }
-      },
-      {
-        "__type__": "openai.types.chat.chat_completion_chunk.ChatCompletionChunk",
-        "__data__": {
-          "id": "chatcmpl-381",
-          "choices": [
-            {
-              "delta": {
-                "content": " to",
-                "function_call": null,
-                "refusal": null,
-                "role": "assistant",
-                "tool_calls": null
-              },
-              "finish_reason": null,
-              "index": 0,
-              "logprobs": null
-            }
-          ],
-          "created": 1755228967,
-          "model": "llama3.2:3b-instruct-fp16",
-          "object": "chat.completion.chunk",
-          "service_tier": null,
-          "system_fingerprint": "fp_ollama",
-          "usage": null
-        }
-      },
-      {
-        "__type__": "openai.types.chat.chat_completion_chunk.ChatCompletionChunk",
-        "__data__": {
-          "id": "chatcmpl-381",
-          "choices": [
-            {
-              "delta": {
-                "content": " February",
-                "function_call": null,
-                "refusal": null,
-                "role": "assistant",
-                "tool_calls": null
-              },
-              "finish_reason": null,
-              "index": 0,
-              "logprobs": null
-            }
-          ],
-          "created": 1755228967,
-          "model": "llama3.2:3b-instruct-fp16",
-          "object": "chat.completion.chunk",
-          "service_tier": null,
-          "system_fingerprint": "fp_ollama",
-          "usage": null
-        }
-      },
-      {
-        "__type__": "openai.types.chat.chat_completion_chunk.ChatCompletionChunk",
-        "__data__": {
-          "id": "chatcmpl-381",
-          "choices": [
-            {
-              "delta": {
-                "content": "):",
-                "function_call": null,
-                "refusal": null,
-                "role": "assistant",
-                "tool_calls": null
-              },
-              "finish_reason": null,
-              "index": 0,
-              "logprobs": null
-            }
-          ],
-          "created": 1755228967,
-          "model": "llama3.2:3b-instruct-fp16",
-          "object": "chat.completion.chunk",
-          "service_tier": null,
-          "system_fingerprint": "fp_ollama",
-          "usage": null
-        }
-      },
-      {
-        "__type__": "openai.types.chat.chat_completion_chunk.ChatCompletionChunk",
-        "__data__": {
-          "id": "chatcmpl-381",
-          "choices": [
-            {
-              "delta": {
-                "content": " Cool",
-                "function_call": null,
-                "refusal": null,
-                "role": "assistant",
-                "tool_calls": null
-              },
-              "finish_reason": null,
-              "index": 0,
-              "logprobs": null
-            }
-          ],
-          "created": 1755228967,
-          "model": "llama3.2:3b-instruct-fp16",
-          "object": "chat.completion.chunk",
-          "service_tier": null,
-          "system_fingerprint": "fp_ollama",
-          "usage": null
-        }
-      },
-      {
-        "__type__": "openai.types.chat.chat_completion_chunk.ChatCompletionChunk",
-        "__data__": {
-          "id": "chatcmpl-381",
-          "choices": [
-            {
-              "delta": {
-                "content": " and",
-                "function_call": null,
-                "refusal": null,
-                "role": "assistant",
-                "tool_calls": null
-              },
-              "finish_reason": null,
-              "index": 0,
-              "logprobs": null
-            }
-          ],
-          "created": 1755228967,
-          "model": "llama3.2:3b-instruct-fp16",
-          "object": "chat.completion.chunk",
-          "service_tier": null,
-          "system_fingerprint": "fp_ollama",
-          "usage": null
-        }
-      },
-      {
-        "__type__": "openai.types.chat.chat_completion_chunk.ChatCompletionChunk",
-        "__data__": {
-          "id": "chatcmpl-381",
-          "choices": [
-            {
-              "delta": {
-                "content": " sometimes",
-                "function_call": null,
-                "refusal": null,
-                "role": "assistant",
-                "tool_calls": null
-              },
-              "finish_reason": null,
-              "index": 0,
-              "logprobs": null
-            }
-          ],
-          "created": 1755228967,
-          "model": "llama3.2:3b-instruct-fp16",
-          "object": "chat.completion.chunk",
-          "service_tier": null,
-          "system_fingerprint": "fp_ollama",
-          "usage": null
-        }
-      },
-      {
-        "__type__": "openai.types.chat.chat_completion_chunk.ChatCompletionChunk",
-        "__data__": {
-          "id": "chatcmpl-381",
-          "choices": [
-            {
-              "delta": {
-                "content": " rainy",
-                "function_call": null,
-                "refusal": null,
-                "role": "assistant",
-                "tool_calls": null
-              },
-              "finish_reason": null,
-              "index": 0,
-              "logprobs": null
-            }
-          ],
-          "created": 1755228967,
-          "model": "llama3.2:3b-instruct-fp16",
-          "object": "chat.completion.chunk",
-          "service_tier": null,
-          "system_fingerprint": "fp_ollama",
-          "usage": null
-        }
-      },
-      {
-        "__type__": "openai.types.chat.chat_completion_chunk.ChatCompletionChunk",
-        "__data__": {
-          "id": "chatcmpl-381",
-          "choices": [
-            {
-              "delta": {
-                "content": ".\n\n",
-                "function_call": null,
-                "refusal": null,
-                "role": "assistant",
-                "tool_calls": null
-              },
-              "finish_reason": null,
-              "index": 0,
-              "logprobs": null
-            }
-          ],
-          "created": 1755228967,
-          "model": "llama3.2:3b-instruct-fp16",
-          "object": "chat.completion.chunk",
-          "service_tier": null,
-          "system_fingerprint": "fp_ollama",
-          "usage": null
-        }
-      },
-      {
-        "__type__": "openai.types.chat.chat_completion_chunk.ChatCompletionChunk",
-        "__data__": {
-          "id": "chatcmpl-381",
-          "choices": [
-            {
-              "delta": {
-                "content": "If",
-                "function_call": null,
-                "refusal": null,
-                "role": "assistant",
-                "tool_calls": null
-              },
-              "finish_reason": null,
-              "index": 0,
-              "logprobs": null
-            }
-          ],
-          "created": 1755228967,
-          "model": "llama3.2:3b-instruct-fp16",
-          "object": "chat.completion.chunk",
-          "service_tier": null,
-          "system_fingerprint": "fp_ollama",
-          "usage": null
-        }
-      },
-      {
-        "__type__": "openai.types.chat.chat_completion_chunk.ChatCompletionChunk",
-        "__data__": {
-          "id": "chatcmpl-381",
-          "choices": [
-            {
-              "delta": {
-                "content": " you",
-                "function_call": null,
-                "refusal": null,
-                "role": "assistant",
-                "tool_calls": null
-              },
-              "finish_reason": null,
-              "index": 0,
-              "logprobs": null
-            }
-          ],
-          "created": 1755228967,
-          "model": "llama3.2:3b-instruct-fp16",
-          "object": "chat.completion.chunk",
-          "service_tier": null,
-          "system_fingerprint": "fp_ollama",
-          "usage": null
-        }
-      },
-      {
-        "__type__": "openai.types.chat.chat_completion_chunk.ChatCompletionChunk",
-        "__data__": {
-          "id": "chatcmpl-381",
-          "choices": [
-            {
-              "delta": {
-                "content": " need",
-                "function_call": null,
-                "refusal": null,
-                "role": "assistant",
-                "tool_calls": null
-              },
-              "finish_reason": null,
-              "index": 0,
-              "logprobs": null
-            }
-          ],
-          "created": 1755228967,
-          "model": "llama3.2:3b-instruct-fp16",
-          "object": "chat.completion.chunk",
-          "service_tier": null,
-          "system_fingerprint": "fp_ollama",
-          "usage": null
-        }
-      },
-      {
-        "__type__": "openai.types.chat.chat_completion_chunk.ChatCompletionChunk",
-        "__data__": {
-          "id": "chatcmpl-381",
-          "choices": [
-            {
-              "delta": {
-                "content": " up",
-                "function_call": null,
-                "refusal": null,
-                "role": "assistant",
-                "tool_calls": null
-              },
-              "finish_reason": null,
-              "index": 0,
-              "logprobs": null
-            }
-          ],
-          "created": 1755228967,
-          "model": "llama3.2:3b-instruct-fp16",
-          "object": "chat.completion.chunk",
-          "service_tier": null,
-          "system_fingerprint": "fp_ollama",
-          "usage": null
-        }
-      },
-      {
-        "__type__": "openai.types.chat.chat_completion_chunk.ChatCompletionChunk",
-        "__data__": {
-          "id": "chatcmpl-381",
-          "choices": [
-            {
-              "delta": {
-                "content": "-to",
-                "function_call": null,
-                "refusal": null,
-                "role": "assistant",
-                "tool_calls": null
-              },
-              "finish_reason": null,
-              "index": 0,
-              "logprobs": null
-            }
-          ],
-          "created": 1755228967,
-          "model": "llama3.2:3b-instruct-fp16",
-          "object": "chat.completion.chunk",
-          "service_tier": null,
-          "system_fingerprint": "fp_ollama",
-          "usage": null
-        }
-      },
-      {
-        "__type__": "openai.types.chat.chat_completion_chunk.ChatCompletionChunk",
-        "__data__": {
-          "id": "chatcmpl-381",
-          "choices": [
-            {
-              "delta": {
-                "content": "-date",
-                "function_call": null,
-                "refusal": null,
-                "role": "assistant",
-                "tool_calls": null
-              },
-              "finish_reason": null,
-              "index": 0,
-              "logprobs": null
-            }
-          ],
-          "created": 1755228968,
-          "model": "llama3.2:3b-instruct-fp16",
-          "object": "chat.completion.chunk",
-          "service_tier": null,
-          "system_fingerprint": "fp_ollama",
-          "usage": null
-        }
-      },
-      {
-        "__type__": "openai.types.chat.chat_completion_chunk.ChatCompletionChunk",
-        "__data__": {
-          "id": "chatcmpl-381",
-          "choices": [
-            {
-              "delta": {
-                "content": " information",
-                "function_call": null,
-                "refusal": null,
-                "role": "assistant",
-                "tool_calls": null
-              },
-              "finish_reason": null,
-              "index": 0,
-              "logprobs": null
-            }
-          ],
-          "created": 1755228968,
-          "model": "llama3.2:3b-instruct-fp16",
-          "object": "chat.completion.chunk",
-          "service_tier": null,
-          "system_fingerprint": "fp_ollama",
-          "usage": null
-        }
-      },
-      {
-        "__type__": "openai.types.chat.chat_completion_chunk.ChatCompletionChunk",
-        "__data__": {
-          "id": "chatcmpl-381",
-          "choices": [
-            {
-              "delta": {
-                "content": " on",
-                "function_call": null,
-                "refusal": null,
-                "role": "assistant",
-                "tool_calls": null
-              },
-              "finish_reason": null,
-              "index": 0,
-              "logprobs": null
-            }
-          ],
-          "created": 1755228968,
-          "model": "llama3.2:3b-instruct-fp16",
-          "object": "chat.completion.chunk",
-          "service_tier": null,
-          "system_fingerprint": "fp_ollama",
-          "usage": null
-        }
-      },
-      {
-        "__type__": "openai.types.chat.chat_completion_chunk.ChatCompletionChunk",
-        "__data__": {
-          "id": "chatcmpl-381",
-          "choices": [
-            {
-              "delta": {
-                "content": " the",
-                "function_call": null,
-                "refusal": null,
-                "role": "assistant",
-                "tool_calls": null
-              },
-              "finish_reason": null,
-              "index": 0,
-              "logprobs": null
-            }
-          ],
-          "created": 1755228968,
-          "model": "llama3.2:3b-instruct-fp16",
-          "object": "chat.completion.chunk",
-          "service_tier": null,
-          "system_fingerprint": "fp_ollama",
-          "usage": null
-        }
-      },
-      {
-        "__type__": "openai.types.chat.chat_completion_chunk.ChatCompletionChunk",
-        "__data__": {
-          "id": "chatcmpl-381",
-          "choices": [
-            {
-              "delta": {
-                "content": " current",
-                "function_call": null,
-                "refusal": null,
-                "role": "assistant",
-                "tool_calls": null
-              },
-              "finish_reason": null,
-              "index": 0,
-              "logprobs": null
-            }
-          ],
-          "created": 1755228968,
-          "model": "llama3.2:3b-instruct-fp16",
-          "object": "chat.completion.chunk",
-          "service_tier": null,
-          "system_fingerprint": "fp_ollama",
-          "usage": null
-        }
-      },
-      {
-        "__type__": "openai.types.chat.chat_completion_chunk.ChatCompletionChunk",
-        "__data__": {
-          "id": "chatcmpl-381",
-          "choices": [
-            {
-              "delta": {
-                "content": " weather",
-                "function_call": null,
-                "refusal": null,
-                "role": "assistant",
-                "tool_calls": null
-              },
-              "finish_reason": null,
-              "index": 0,
-              "logprobs": null
-            }
-          ],
-          "created": 1755228968,
-          "model": "llama3.2:3b-instruct-fp16",
-          "object": "chat.completion.chunk",
-          "service_tier": null,
-          "system_fingerprint": "fp_ollama",
-          "usage": null
-        }
-      },
-      {
-        "__type__": "openai.types.chat.chat_completion_chunk.ChatCompletionChunk",
-        "__data__": {
-          "id": "chatcmpl-381",
-          "choices": [
-            {
-              "delta": {
-                "content": " in",
-                "function_call": null,
-                "refusal": null,
-                "role": "assistant",
-                "tool_calls": null
-              },
-              "finish_reason": null,
-              "index": 0,
-              "logprobs": null
-            }
-          ],
-          "created": 1755228968,
-          "model": "llama3.2:3b-instruct-fp16",
-          "object": "chat.completion.chunk",
-          "service_tier": null,
-          "system_fingerprint": "fp_ollama",
-          "usage": null
-        }
-      },
-      {
-        "__type__": "openai.types.chat.chat_completion_chunk.ChatCompletionChunk",
-        "__data__": {
-          "id": "chatcmpl-381",
-          "choices": [
-            {
-              "delta": {
-                "content": " Tokyo",
-                "function_call": null,
-                "refusal": null,
-                "role": "assistant",
-                "tool_calls": null
-              },
-              "finish_reason": null,
-              "index": 0,
-              "logprobs": null
-            }
-          ],
-          "created": 1755228968,
-          "model": "llama3.2:3b-instruct-fp16",
-          "object": "chat.completion.chunk",
-          "service_tier": null,
-          "system_fingerprint": "fp_ollama",
-          "usage": null
-        }
-      },
-      {
-        "__type__": "openai.types.chat.chat_completion_chunk.ChatCompletionChunk",
-        "__data__": {
-          "id": "chatcmpl-381",
-          "choices": [
-            {
-              "delta": {
-                "content": ",",
-                "function_call": null,
-                "refusal": null,
-                "role": "assistant",
-                "tool_calls": null
-              },
-              "finish_reason": null,
-              "index": 0,
-              "logprobs": null
-            }
-          ],
-          "created": 1755228968,
-          "model": "llama3.2:3b-instruct-fp16",
-          "object": "chat.completion.chunk",
-          "service_tier": null,
-          "system_fingerprint": "fp_ollama",
-          "usage": null
-        }
-      },
-      {
-        "__type__": "openai.types.chat.chat_completion_chunk.ChatCompletionChunk",
-        "__data__": {
-          "id": "chatcmpl-381",
+          "id": "chatcmpl-358",
           "choices": [
             {
               "delta": {
@@ -4225,7 +429,7 @@
               "logprobs": null
             }
           ],
-          "created": 1755228968,
+          "created": 1756921325,
           "model": "llama3.2:3b-instruct-fp16",
           "object": "chat.completion.chunk",
           "service_tier": null,
@@ -4236,683 +440,7 @@
       {
         "__type__": "openai.types.chat.chat_completion_chunk.ChatCompletionChunk",
         "__data__": {
-          "id": "chatcmpl-381",
-          "choices": [
-            {
-              "delta": {
-                "content": " recommend",
-                "function_call": null,
-                "refusal": null,
-                "role": "assistant",
-                "tool_calls": null
-              },
-              "finish_reason": null,
-              "index": 0,
-              "logprobs": null
-            }
-          ],
-          "created": 1755228968,
-          "model": "llama3.2:3b-instruct-fp16",
-          "object": "chat.completion.chunk",
-          "service_tier": null,
-          "system_fingerprint": "fp_ollama",
-          "usage": null
-        }
-      },
-      {
-        "__type__": "openai.types.chat.chat_completion_chunk.ChatCompletionChunk",
-        "__data__": {
-          "id": "chatcmpl-381",
-          "choices": [
-            {
-              "delta": {
-                "content": " checking",
-                "function_call": null,
-                "refusal": null,
-                "role": "assistant",
-                "tool_calls": null
-              },
-              "finish_reason": null,
-              "index": 0,
-              "logprobs": null
-            }
-          ],
-          "created": 1755228968,
-          "model": "llama3.2:3b-instruct-fp16",
-          "object": "chat.completion.chunk",
-          "service_tier": null,
-          "system_fingerprint": "fp_ollama",
-          "usage": null
-        }
-      },
-      {
-        "__type__": "openai.types.chat.chat_completion_chunk.ChatCompletionChunk",
-        "__data__": {
-          "id": "chatcmpl-381",
-          "choices": [
-            {
-              "delta": {
-                "content": " a",
-                "function_call": null,
-                "refusal": null,
-                "role": "assistant",
-                "tool_calls": null
-              },
-              "finish_reason": null,
-              "index": 0,
-              "logprobs": null
-            }
-          ],
-          "created": 1755228968,
-          "model": "llama3.2:3b-instruct-fp16",
-          "object": "chat.completion.chunk",
-          "service_tier": null,
-          "system_fingerprint": "fp_ollama",
-          "usage": null
-        }
-      },
-      {
-        "__type__": "openai.types.chat.chat_completion_chunk.ChatCompletionChunk",
-        "__data__": {
-          "id": "chatcmpl-381",
-          "choices": [
-            {
-              "delta": {
-                "content": " reliable",
-                "function_call": null,
-                "refusal": null,
-                "role": "assistant",
-                "tool_calls": null
-              },
-              "finish_reason": null,
-              "index": 0,
-              "logprobs": null
-            }
-          ],
-          "created": 1755228968,
-          "model": "llama3.2:3b-instruct-fp16",
-          "object": "chat.completion.chunk",
-          "service_tier": null,
-          "system_fingerprint": "fp_ollama",
-          "usage": null
-        }
-      },
-      {
-        "__type__": "openai.types.chat.chat_completion_chunk.ChatCompletionChunk",
-        "__data__": {
-          "id": "chatcmpl-381",
-          "choices": [
-            {
-              "delta": {
-                "content": " online",
-                "function_call": null,
-                "refusal": null,
-                "role": "assistant",
-                "tool_calls": null
-              },
-              "finish_reason": null,
-              "index": 0,
-              "logprobs": null
-            }
-          ],
-          "created": 1755228968,
-          "model": "llama3.2:3b-instruct-fp16",
-          "object": "chat.completion.chunk",
-          "service_tier": null,
-          "system_fingerprint": "fp_ollama",
-          "usage": null
-        }
-      },
-      {
-        "__type__": "openai.types.chat.chat_completion_chunk.ChatCompletionChunk",
-        "__data__": {
-          "id": "chatcmpl-381",
-          "choices": [
-            {
-              "delta": {
-                "content": " weather",
-                "function_call": null,
-                "refusal": null,
-                "role": "assistant",
-                "tool_calls": null
-              },
-              "finish_reason": null,
-              "index": 0,
-              "logprobs": null
-            }
-          ],
-          "created": 1755228968,
-          "model": "llama3.2:3b-instruct-fp16",
-          "object": "chat.completion.chunk",
-          "service_tier": null,
-          "system_fingerprint": "fp_ollama",
-          "usage": null
-        }
-      },
-      {
-        "__type__": "openai.types.chat.chat_completion_chunk.ChatCompletionChunk",
-        "__data__": {
-          "id": "chatcmpl-381",
-          "choices": [
-            {
-              "delta": {
-                "content": " source",
-                "function_call": null,
-                "refusal": null,
-                "role": "assistant",
-                "tool_calls": null
-              },
-              "finish_reason": null,
-              "index": 0,
-              "logprobs": null
-            }
-          ],
-          "created": 1755228968,
-          "model": "llama3.2:3b-instruct-fp16",
-          "object": "chat.completion.chunk",
-          "service_tier": null,
-          "system_fingerprint": "fp_ollama",
-          "usage": null
-        }
-      },
-      {
-        "__type__": "openai.types.chat.chat_completion_chunk.ChatCompletionChunk",
-        "__data__": {
-          "id": "chatcmpl-381",
-          "choices": [
-            {
-              "delta": {
-                "content": " such",
-                "function_call": null,
-                "refusal": null,
-                "role": "assistant",
-                "tool_calls": null
-              },
-              "finish_reason": null,
-              "index": 0,
-              "logprobs": null
-            }
-          ],
-          "created": 1755228968,
-          "model": "llama3.2:3b-instruct-fp16",
-          "object": "chat.completion.chunk",
-          "service_tier": null,
-          "system_fingerprint": "fp_ollama",
-          "usage": null
-        }
-      },
-      {
-        "__type__": "openai.types.chat.chat_completion_chunk.ChatCompletionChunk",
-        "__data__": {
-          "id": "chatcmpl-381",
-          "choices": [
-            {
-              "delta": {
-                "content": " as",
-                "function_call": null,
-                "refusal": null,
-                "role": "assistant",
-                "tool_calls": null
-              },
-              "finish_reason": null,
-              "index": 0,
-              "logprobs": null
-            }
-          ],
-          "created": 1755228968,
-          "model": "llama3.2:3b-instruct-fp16",
-          "object": "chat.completion.chunk",
-          "service_tier": null,
-          "system_fingerprint": "fp_ollama",
-          "usage": null
-        }
-      },
-      {
-        "__type__": "openai.types.chat.chat_completion_chunk.ChatCompletionChunk",
-        "__data__": {
-          "id": "chatcmpl-381",
-          "choices": [
-            {
-              "delta": {
-                "content": ":\n\n",
-                "function_call": null,
-                "refusal": null,
-                "role": "assistant",
-                "tool_calls": null
-              },
-              "finish_reason": null,
-              "index": 0,
-              "logprobs": null
-            }
-          ],
-          "created": 1755228968,
-          "model": "llama3.2:3b-instruct-fp16",
-          "object": "chat.completion.chunk",
-          "service_tier": null,
-          "system_fingerprint": "fp_ollama",
-          "usage": null
-        }
-      },
-      {
-        "__type__": "openai.types.chat.chat_completion_chunk.ChatCompletionChunk",
-        "__data__": {
-          "id": "chatcmpl-381",
-          "choices": [
-            {
-              "delta": {
-                "content": "-",
-                "function_call": null,
-                "refusal": null,
-                "role": "assistant",
-                "tool_calls": null
-              },
-              "finish_reason": null,
-              "index": 0,
-              "logprobs": null
-            }
-          ],
-          "created": 1755228968,
-          "model": "llama3.2:3b-instruct-fp16",
-          "object": "chat.completion.chunk",
-          "service_tier": null,
-          "system_fingerprint": "fp_ollama",
-          "usage": null
-        }
-      },
-      {
-        "__type__": "openai.types.chat.chat_completion_chunk.ChatCompletionChunk",
-        "__data__": {
-          "id": "chatcmpl-381",
-          "choices": [
-            {
-              "delta": {
-                "content": " Acc",
-                "function_call": null,
-                "refusal": null,
-                "role": "assistant",
-                "tool_calls": null
-              },
-              "finish_reason": null,
-              "index": 0,
-              "logprobs": null
-            }
-          ],
-          "created": 1755228968,
-          "model": "llama3.2:3b-instruct-fp16",
-          "object": "chat.completion.chunk",
-          "service_tier": null,
-          "system_fingerprint": "fp_ollama",
-          "usage": null
-        }
-      },
-      {
-        "__type__": "openai.types.chat.chat_completion_chunk.ChatCompletionChunk",
-        "__data__": {
-          "id": "chatcmpl-381",
-          "choices": [
-            {
-              "delta": {
-                "content": "u",
-                "function_call": null,
-                "refusal": null,
-                "role": "assistant",
-                "tool_calls": null
-              },
-              "finish_reason": null,
-              "index": 0,
-              "logprobs": null
-            }
-          ],
-          "created": 1755228968,
-          "model": "llama3.2:3b-instruct-fp16",
-          "object": "chat.completion.chunk",
-          "service_tier": null,
-          "system_fingerprint": "fp_ollama",
-          "usage": null
-        }
-      },
-      {
-        "__type__": "openai.types.chat.chat_completion_chunk.ChatCompletionChunk",
-        "__data__": {
-          "id": "chatcmpl-381",
-          "choices": [
-            {
-              "delta": {
-                "content": "Weather",
-                "function_call": null,
-                "refusal": null,
-                "role": "assistant",
-                "tool_calls": null
-              },
-              "finish_reason": null,
-              "index": 0,
-              "logprobs": null
-            }
-          ],
-          "created": 1755228968,
-          "model": "llama3.2:3b-instruct-fp16",
-          "object": "chat.completion.chunk",
-          "service_tier": null,
-          "system_fingerprint": "fp_ollama",
-          "usage": null
-        }
-      },
-      {
-        "__type__": "openai.types.chat.chat_completion_chunk.ChatCompletionChunk",
-        "__data__": {
-          "id": "chatcmpl-381",
-          "choices": [
-            {
-              "delta": {
-                "content": "\n",
-                "function_call": null,
-                "refusal": null,
-                "role": "assistant",
-                "tool_calls": null
-              },
-              "finish_reason": null,
-              "index": 0,
-              "logprobs": null
-            }
-          ],
-          "created": 1755228969,
-          "model": "llama3.2:3b-instruct-fp16",
-          "object": "chat.completion.chunk",
-          "service_tier": null,
-          "system_fingerprint": "fp_ollama",
-          "usage": null
-        }
-      },
-      {
-        "__type__": "openai.types.chat.chat_completion_chunk.ChatCompletionChunk",
-        "__data__": {
-          "id": "chatcmpl-381",
-          "choices": [
-            {
-              "delta": {
-                "content": "-",
-                "function_call": null,
-                "refusal": null,
-                "role": "assistant",
-                "tool_calls": null
-              },
-              "finish_reason": null,
-              "index": 0,
-              "logprobs": null
-            }
-          ],
-          "created": 1755228969,
-          "model": "llama3.2:3b-instruct-fp16",
-          "object": "chat.completion.chunk",
-          "service_tier": null,
-          "system_fingerprint": "fp_ollama",
-          "usage": null
-        }
-      },
-      {
-        "__type__": "openai.types.chat.chat_completion_chunk.ChatCompletionChunk",
-        "__data__": {
-          "id": "chatcmpl-381",
-          "choices": [
-            {
-              "delta": {
-                "content": " BBC",
-                "function_call": null,
-                "refusal": null,
-                "role": "assistant",
-                "tool_calls": null
-              },
-              "finish_reason": null,
-              "index": 0,
-              "logprobs": null
-            }
-          ],
-          "created": 1755228969,
-          "model": "llama3.2:3b-instruct-fp16",
-          "object": "chat.completion.chunk",
-          "service_tier": null,
-          "system_fingerprint": "fp_ollama",
-          "usage": null
-        }
-      },
-      {
-        "__type__": "openai.types.chat.chat_completion_chunk.ChatCompletionChunk",
-        "__data__": {
-          "id": "chatcmpl-381",
-          "choices": [
-            {
-              "delta": {
-                "content": " Weather",
-                "function_call": null,
-                "refusal": null,
-                "role": "assistant",
-                "tool_calls": null
-              },
-              "finish_reason": null,
-              "index": 0,
-              "logprobs": null
-            }
-          ],
-          "created": 1755228969,
-          "model": "llama3.2:3b-instruct-fp16",
-          "object": "chat.completion.chunk",
-          "service_tier": null,
-          "system_fingerprint": "fp_ollama",
-          "usage": null
-        }
-      },
-      {
-        "__type__": "openai.types.chat.chat_completion_chunk.ChatCompletionChunk",
-        "__data__": {
-          "id": "chatcmpl-381",
-          "choices": [
-            {
-              "delta": {
-                "content": "\n",
-                "function_call": null,
-                "refusal": null,
-                "role": "assistant",
-                "tool_calls": null
-              },
-              "finish_reason": null,
-              "index": 0,
-              "logprobs": null
-            }
-          ],
-          "created": 1755228969,
-          "model": "llama3.2:3b-instruct-fp16",
-          "object": "chat.completion.chunk",
-          "service_tier": null,
-          "system_fingerprint": "fp_ollama",
-          "usage": null
-        }
-      },
-      {
-        "__type__": "openai.types.chat.chat_completion_chunk.ChatCompletionChunk",
-        "__data__": {
-          "id": "chatcmpl-381",
-          "choices": [
-            {
-              "delta": {
-                "content": "-",
-                "function_call": null,
-                "refusal": null,
-                "role": "assistant",
-                "tool_calls": null
-              },
-              "finish_reason": null,
-              "index": 0,
-              "logprobs": null
-            }
-          ],
-          "created": 1755228969,
-          "model": "llama3.2:3b-instruct-fp16",
-          "object": "chat.completion.chunk",
-          "service_tier": null,
-          "system_fingerprint": "fp_ollama",
-          "usage": null
-        }
-      },
-      {
-        "__type__": "openai.types.chat.chat_completion_chunk.ChatCompletionChunk",
-        "__data__": {
-          "id": "chatcmpl-381",
-          "choices": [
-            {
-              "delta": {
-                "content": " The",
-                "function_call": null,
-                "refusal": null,
-                "role": "assistant",
-                "tool_calls": null
-              },
-              "finish_reason": null,
-              "index": 0,
-              "logprobs": null
-            }
-          ],
-          "created": 1755228969,
-          "model": "llama3.2:3b-instruct-fp16",
-          "object": "chat.completion.chunk",
-          "service_tier": null,
-          "system_fingerprint": "fp_ollama",
-          "usage": null
-        }
-      },
-      {
-        "__type__": "openai.types.chat.chat_completion_chunk.ChatCompletionChunk",
-        "__data__": {
-          "id": "chatcmpl-381",
-          "choices": [
-            {
-              "delta": {
-                "content": " Weather",
-                "function_call": null,
-                "refusal": null,
-                "role": "assistant",
-                "tool_calls": null
-              },
-              "finish_reason": null,
-              "index": 0,
-              "logprobs": null
-            }
-          ],
-          "created": 1755228969,
-          "model": "llama3.2:3b-instruct-fp16",
-          "object": "chat.completion.chunk",
-          "service_tier": null,
-          "system_fingerprint": "fp_ollama",
-          "usage": null
-        }
-      },
-      {
-        "__type__": "openai.types.chat.chat_completion_chunk.ChatCompletionChunk",
-        "__data__": {
-          "id": "chatcmpl-381",
-          "choices": [
-            {
-              "delta": {
-                "content": " Channel",
-                "function_call": null,
-                "refusal": null,
-                "role": "assistant",
-                "tool_calls": null
-              },
-              "finish_reason": null,
-              "index": 0,
-              "logprobs": null
-            }
-          ],
-          "created": 1755228969,
-          "model": "llama3.2:3b-instruct-fp16",
-          "object": "chat.completion.chunk",
-          "service_tier": null,
-          "system_fingerprint": "fp_ollama",
-          "usage": null
-        }
-      },
-      {
-        "__type__": "openai.types.chat.chat_completion_chunk.ChatCompletionChunk",
-        "__data__": {
-          "id": "chatcmpl-381",
-          "choices": [
-            {
-              "delta": {
-                "content": "\n\n",
-                "function_call": null,
-                "refusal": null,
-                "role": "assistant",
-                "tool_calls": null
-              },
-              "finish_reason": null,
-              "index": 0,
-              "logprobs": null
-            }
-          ],
-          "created": 1755228969,
-          "model": "llama3.2:3b-instruct-fp16",
-          "object": "chat.completion.chunk",
-          "service_tier": null,
-          "system_fingerprint": "fp_ollama",
-          "usage": null
-        }
-      },
-      {
-        "__type__": "openai.types.chat.chat_completion_chunk.ChatCompletionChunk",
-        "__data__": {
-          "id": "chatcmpl-381",
-          "choices": [
-            {
-              "delta": {
-                "content": "Or",
-                "function_call": null,
-                "refusal": null,
-                "role": "assistant",
-                "tool_calls": null
-              },
-              "finish_reason": null,
-              "index": 0,
-              "logprobs": null
-            }
-          ],
-          "created": 1755228969,
-          "model": "llama3.2:3b-instruct-fp16",
-          "object": "chat.completion.chunk",
-          "service_tier": null,
-          "system_fingerprint": "fp_ollama",
-          "usage": null
-        }
-      },
-      {
-        "__type__": "openai.types.chat.chat_completion_chunk.ChatCompletionChunk",
-        "__data__": {
-          "id": "chatcmpl-381",
-          "choices": [
-            {
-              "delta": {
-                "content": " you",
-                "function_call": null,
-                "refusal": null,
-                "role": "assistant",
-                "tool_calls": null
-              },
-              "finish_reason": null,
-              "index": 0,
-              "logprobs": null
-            }
-          ],
-          "created": 1755228969,
-          "model": "llama3.2:3b-instruct-fp16",
-          "object": "chat.completion.chunk",
-          "service_tier": null,
-          "system_fingerprint": "fp_ollama",
-          "usage": null
-        }
-      },
-      {
-        "__type__": "openai.types.chat.chat_completion_chunk.ChatCompletionChunk",
-        "__data__": {
-          "id": "chatcmpl-381",
+          "id": "chatcmpl-358",
           "choices": [
             {
               "delta": {
@@ -4927,7 +455,7 @@
               "logprobs": null
             }
           ],
-          "created": 1755228969,
+          "created": 1756921325,
           "model": "llama3.2:3b-instruct-fp16",
           "object": "chat.completion.chunk",
           "service_tier": null,
@@ -4938,11 +466,11 @@
       {
         "__type__": "openai.types.chat.chat_completion_chunk.ChatCompletionChunk",
         "__data__": {
-          "id": "chatcmpl-381",
+          "id": "chatcmpl-358",
           "choices": [
             {
               "delta": {
-                "content": " check",
+                "content": " tell",
                 "function_call": null,
                 "refusal": null,
                 "role": "assistant",
@@ -4953,7 +481,7 @@
               "logprobs": null
             }
           ],
-          "created": 1755228969,
+          "created": 1756921325,
           "model": "llama3.2:3b-instruct-fp16",
           "object": "chat.completion.chunk",
           "service_tier": null,
@@ -4964,11 +492,11 @@
       {
         "__type__": "openai.types.chat.chat_completion_chunk.ChatCompletionChunk",
         "__data__": {
-          "id": "chatcmpl-381",
+          "id": "chatcmpl-358",
           "choices": [
             {
               "delta": {
-                "content": " local",
+                "content": " you",
                 "function_call": null,
                 "refusal": null,
                 "role": "assistant",
@@ -4979,7 +507,7 @@
               "logprobs": null
             }
           ],
-          "created": 1755228969,
+          "created": 1756921325,
           "model": "llama3.2:3b-instruct-fp16",
           "object": "chat.completion.chunk",
           "service_tier": null,
@@ -4990,11 +518,11 @@
       {
         "__type__": "openai.types.chat.chat_completion_chunk.ChatCompletionChunk",
         "__data__": {
-          "id": "chatcmpl-381",
+          "id": "chatcmpl-358",
           "choices": [
             {
               "delta": {
-                "content": " news",
+                "content": " that",
                 "function_call": null,
                 "refusal": null,
                 "role": "assistant",
@@ -5005,7 +533,7 @@
               "logprobs": null
             }
           ],
-          "created": 1755228969,
+          "created": 1756921325,
           "model": "llama3.2:3b-instruct-fp16",
           "object": "chat.completion.chunk",
           "service_tier": null,
@@ -5016,11 +544,11 @@
       {
         "__type__": "openai.types.chat.chat_completion_chunk.ChatCompletionChunk",
         "__data__": {
-          "id": "chatcmpl-381",
+          "id": "chatcmpl-358",
           "choices": [
             {
               "delta": {
-                "content": " websites",
+                "content": " Tokyo",
                 "function_call": null,
                 "refusal": null,
                 "role": "assistant",
@@ -5031,7 +559,7 @@
               "logprobs": null
             }
           ],
-          "created": 1755228969,
+          "created": 1756921325,
           "model": "llama3.2:3b-instruct-fp16",
           "object": "chat.completion.chunk",
           "service_tier": null,
@@ -5042,11 +570,11 @@
       {
         "__type__": "openai.types.chat.chat_completion_chunk.ChatCompletionChunk",
         "__data__": {
-          "id": "chatcmpl-381",
+          "id": "chatcmpl-358",
           "choices": [
             {
               "delta": {
-                "content": " or",
+                "content": " has",
                 "function_call": null,
                 "refusal": null,
                 "role": "assistant",
@@ -5057,7 +585,7 @@
               "logprobs": null
             }
           ],
-          "created": 1755228969,
+          "created": 1756921325,
           "model": "llama3.2:3b-instruct-fp16",
           "object": "chat.completion.chunk",
           "service_tier": null,
@@ -5068,11 +596,11 @@
       {
         "__type__": "openai.types.chat.chat_completion_chunk.ChatCompletionChunk",
         "__data__": {
-          "id": "chatcmpl-381",
+          "id": "chatcmpl-358",
           "choices": [
             {
               "delta": {
-                "content": " mobile",
+                "content": " a",
                 "function_call": null,
                 "refusal": null,
                 "role": "assistant",
@@ -5083,7 +611,7 @@
               "logprobs": null
             }
           ],
-          "created": 1755228969,
+          "created": 1756921325,
           "model": "llama3.2:3b-instruct-fp16",
           "object": "chat.completion.chunk",
           "service_tier": null,
@@ -5094,11 +622,11 @@
       {
         "__type__": "openai.types.chat.chat_completion_chunk.ChatCompletionChunk",
         "__data__": {
-          "id": "chatcmpl-381",
+          "id": "chatcmpl-358",
           "choices": [
             {
               "delta": {
-                "content": " apps",
+                "content": " humid",
                 "function_call": null,
                 "refusal": null,
                 "role": "assistant",
@@ -5109,7 +637,7 @@
               "logprobs": null
             }
           ],
-          "created": 1755228969,
+          "created": 1756921325,
           "model": "llama3.2:3b-instruct-fp16",
           "object": "chat.completion.chunk",
           "service_tier": null,
@@ -5120,11 +648,11 @@
       {
         "__type__": "openai.types.chat.chat_completion_chunk.ChatCompletionChunk",
         "__data__": {
-          "id": "chatcmpl-381",
+          "id": "chatcmpl-358",
           "choices": [
             {
               "delta": {
-                "content": " for",
+                "content": " subt",
                 "function_call": null,
                 "refusal": null,
                 "role": "assistant",
@@ -5135,7 +663,7 @@
               "logprobs": null
             }
           ],
-          "created": 1755228969,
+          "created": 1756921325,
           "model": "llama3.2:3b-instruct-fp16",
           "object": "chat.completion.chunk",
           "service_tier": null,
@@ -5146,11 +674,11 @@
       {
         "__type__": "openai.types.chat.chat_completion_chunk.ChatCompletionChunk",
         "__data__": {
-          "id": "chatcmpl-381",
+          "id": "chatcmpl-358",
           "choices": [
             {
               "delta": {
-                "content": " the",
+                "content": "ropical",
                 "function_call": null,
                 "refusal": null,
                 "role": "assistant",
@@ -5161,7 +689,7 @@
               "logprobs": null
             }
           ],
-          "created": 1755228969,
+          "created": 1756921325,
           "model": "llama3.2:3b-instruct-fp16",
           "object": "chat.completion.chunk",
           "service_tier": null,
@@ -5172,11 +700,11 @@
       {
         "__type__": "openai.types.chat.chat_completion_chunk.ChatCompletionChunk",
         "__data__": {
-          "id": "chatcmpl-381",
+          "id": "chatcmpl-358",
           "choices": [
             {
               "delta": {
-                "content": " latest",
+                "content": " climate",
                 "function_call": null,
                 "refusal": null,
                 "role": "assistant",
@@ -5187,7 +715,7 @@
               "logprobs": null
             }
           ],
-          "created": 1755228969,
+          "created": 1756921325,
           "model": "llama3.2:3b-instruct-fp16",
           "object": "chat.completion.chunk",
           "service_tier": null,
@@ -5198,11 +726,11 @@
       {
         "__type__": "openai.types.chat.chat_completion_chunk.ChatCompletionChunk",
         "__data__": {
-          "id": "chatcmpl-381",
+          "id": "chatcmpl-358",
           "choices": [
             {
               "delta": {
-                "content": " forecast",
+                "content": " with",
                 "function_call": null,
                 "refusal": null,
                 "role": "assistant",
@@ -5213,7 +741,7 @@
               "logprobs": null
             }
           ],
-          "created": 1755228969,
+          "created": 1756921325,
           "model": "llama3.2:3b-instruct-fp16",
           "object": "chat.completion.chunk",
           "service_tier": null,
@@ -5224,7 +752,111 @@
       {
         "__type__": "openai.types.chat.chat_completion_chunk.ChatCompletionChunk",
         "__data__": {
-          "id": "chatcmpl-381",
+          "id": "chatcmpl-358",
+          "choices": [
+            {
+              "delta": {
+                "content": " hot",
+                "function_call": null,
+                "refusal": null,
+                "role": "assistant",
+                "tool_calls": null
+              },
+              "finish_reason": null,
+              "index": 0,
+              "logprobs": null
+            }
+          ],
+          "created": 1756921325,
+          "model": "llama3.2:3b-instruct-fp16",
+          "object": "chat.completion.chunk",
+          "service_tier": null,
+          "system_fingerprint": "fp_ollama",
+          "usage": null
+        }
+      },
+      {
+        "__type__": "openai.types.chat.chat_completion_chunk.ChatCompletionChunk",
+        "__data__": {
+          "id": "chatcmpl-358",
+          "choices": [
+            {
+              "delta": {
+                "content": " and",
+                "function_call": null,
+                "refusal": null,
+                "role": "assistant",
+                "tool_calls": null
+              },
+              "finish_reason": null,
+              "index": 0,
+              "logprobs": null
+            }
+          ],
+          "created": 1756921325,
+          "model": "llama3.2:3b-instruct-fp16",
+          "object": "chat.completion.chunk",
+          "service_tier": null,
+          "system_fingerprint": "fp_ollama",
+          "usage": null
+        }
+      },
+      {
+        "__type__": "openai.types.chat.chat_completion_chunk.ChatCompletionChunk",
+        "__data__": {
+          "id": "chatcmpl-358",
+          "choices": [
+            {
+              "delta": {
+                "content": " humid",
+                "function_call": null,
+                "refusal": null,
+                "role": "assistant",
+                "tool_calls": null
+              },
+              "finish_reason": null,
+              "index": 0,
+              "logprobs": null
+            }
+          ],
+          "created": 1756921325,
+          "model": "llama3.2:3b-instruct-fp16",
+          "object": "chat.completion.chunk",
+          "service_tier": null,
+          "system_fingerprint": "fp_ollama",
+          "usage": null
+        }
+      },
+      {
+        "__type__": "openai.types.chat.chat_completion_chunk.ChatCompletionChunk",
+        "__data__": {
+          "id": "chatcmpl-358",
+          "choices": [
+            {
+              "delta": {
+                "content": " summers",
+                "function_call": null,
+                "refusal": null,
+                "role": "assistant",
+                "tool_calls": null
+              },
+              "finish_reason": null,
+              "index": 0,
+              "logprobs": null
+            }
+          ],
+          "created": 1756921325,
+          "model": "llama3.2:3b-instruct-fp16",
+          "object": "chat.completion.chunk",
+          "service_tier": null,
+          "system_fingerprint": "fp_ollama",
+          "usage": null
+        }
+      },
+      {
+        "__type__": "openai.types.chat.chat_completion_chunk.ChatCompletionChunk",
+        "__data__": {
+          "id": "chatcmpl-358",
           "choices": [
             {
               "delta": {
@@ -5239,7 +871,7 @@
               "logprobs": null
             }
           ],
-          "created": 1755228970,
+          "created": 1756921325,
           "model": "llama3.2:3b-instruct-fp16",
           "object": "chat.completion.chunk",
           "service_tier": null,
@@ -5250,7 +882,4843 @@
       {
         "__type__": "openai.types.chat.chat_completion_chunk.ChatCompletionChunk",
         "__data__": {
-          "id": "chatcmpl-381",
+          "id": "chatcmpl-358",
+          "choices": [
+            {
+              "delta": {
+                "content": " Here",
+                "function_call": null,
+                "refusal": null,
+                "role": "assistant",
+                "tool_calls": null
+              },
+              "finish_reason": null,
+              "index": 0,
+              "logprobs": null
+            }
+          ],
+          "created": 1756921325,
+          "model": "llama3.2:3b-instruct-fp16",
+          "object": "chat.completion.chunk",
+          "service_tier": null,
+          "system_fingerprint": "fp_ollama",
+          "usage": null
+        }
+      },
+      {
+        "__type__": "openai.types.chat.chat_completion_chunk.ChatCompletionChunk",
+        "__data__": {
+          "id": "chatcmpl-358",
+          "choices": [
+            {
+              "delta": {
+                "content": "'s",
+                "function_call": null,
+                "refusal": null,
+                "role": "assistant",
+                "tool_calls": null
+              },
+              "finish_reason": null,
+              "index": 0,
+              "logprobs": null
+            }
+          ],
+          "created": 1756921325,
+          "model": "llama3.2:3b-instruct-fp16",
+          "object": "chat.completion.chunk",
+          "service_tier": null,
+          "system_fingerprint": "fp_ollama",
+          "usage": null
+        }
+      },
+      {
+        "__type__": "openai.types.chat.chat_completion_chunk.ChatCompletionChunk",
+        "__data__": {
+          "id": "chatcmpl-358",
+          "choices": [
+            {
+              "delta": {
+                "content": " an",
+                "function_call": null,
+                "refusal": null,
+                "role": "assistant",
+                "tool_calls": null
+              },
+              "finish_reason": null,
+              "index": 0,
+              "logprobs": null
+            }
+          ],
+          "created": 1756921326,
+          "model": "llama3.2:3b-instruct-fp16",
+          "object": "chat.completion.chunk",
+          "service_tier": null,
+          "system_fingerprint": "fp_ollama",
+          "usage": null
+        }
+      },
+      {
+        "__type__": "openai.types.chat.chat_completion_chunk.ChatCompletionChunk",
+        "__data__": {
+          "id": "chatcmpl-358",
+          "choices": [
+            {
+              "delta": {
+                "content": " overview",
+                "function_call": null,
+                "refusal": null,
+                "role": "assistant",
+                "tool_calls": null
+              },
+              "finish_reason": null,
+              "index": 0,
+              "logprobs": null
+            }
+          ],
+          "created": 1756921326,
+          "model": "llama3.2:3b-instruct-fp16",
+          "object": "chat.completion.chunk",
+          "service_tier": null,
+          "system_fingerprint": "fp_ollama",
+          "usage": null
+        }
+      },
+      {
+        "__type__": "openai.types.chat.chat_completion_chunk.ChatCompletionChunk",
+        "__data__": {
+          "id": "chatcmpl-358",
+          "choices": [
+            {
+              "delta": {
+                "content": " of",
+                "function_call": null,
+                "refusal": null,
+                "role": "assistant",
+                "tool_calls": null
+              },
+              "finish_reason": null,
+              "index": 0,
+              "logprobs": null
+            }
+          ],
+          "created": 1756921326,
+          "model": "llama3.2:3b-instruct-fp16",
+          "object": "chat.completion.chunk",
+          "service_tier": null,
+          "system_fingerprint": "fp_ollama",
+          "usage": null
+        }
+      },
+      {
+        "__type__": "openai.types.chat.chat_completion_chunk.ChatCompletionChunk",
+        "__data__": {
+          "id": "chatcmpl-358",
+          "choices": [
+            {
+              "delta": {
+                "content": " typical",
+                "function_call": null,
+                "refusal": null,
+                "role": "assistant",
+                "tool_calls": null
+              },
+              "finish_reason": null,
+              "index": 0,
+              "logprobs": null
+            }
+          ],
+          "created": 1756921326,
+          "model": "llama3.2:3b-instruct-fp16",
+          "object": "chat.completion.chunk",
+          "service_tier": null,
+          "system_fingerprint": "fp_ollama",
+          "usage": null
+        }
+      },
+      {
+        "__type__": "openai.types.chat.chat_completion_chunk.ChatCompletionChunk",
+        "__data__": {
+          "id": "chatcmpl-358",
+          "choices": [
+            {
+              "delta": {
+                "content": " seasonal",
+                "function_call": null,
+                "refusal": null,
+                "role": "assistant",
+                "tool_calls": null
+              },
+              "finish_reason": null,
+              "index": 0,
+              "logprobs": null
+            }
+          ],
+          "created": 1756921326,
+          "model": "llama3.2:3b-instruct-fp16",
+          "object": "chat.completion.chunk",
+          "service_tier": null,
+          "system_fingerprint": "fp_ollama",
+          "usage": null
+        }
+      },
+      {
+        "__type__": "openai.types.chat.chat_completion_chunk.ChatCompletionChunk",
+        "__data__": {
+          "id": "chatcmpl-358",
+          "choices": [
+            {
+              "delta": {
+                "content": " weather",
+                "function_call": null,
+                "refusal": null,
+                "role": "assistant",
+                "tool_calls": null
+              },
+              "finish_reason": null,
+              "index": 0,
+              "logprobs": null
+            }
+          ],
+          "created": 1756921326,
+          "model": "llama3.2:3b-instruct-fp16",
+          "object": "chat.completion.chunk",
+          "service_tier": null,
+          "system_fingerprint": "fp_ollama",
+          "usage": null
+        }
+      },
+      {
+        "__type__": "openai.types.chat.chat_completion_chunk.ChatCompletionChunk",
+        "__data__": {
+          "id": "chatcmpl-358",
+          "choices": [
+            {
+              "delta": {
+                "content": " patterns",
+                "function_call": null,
+                "refusal": null,
+                "role": "assistant",
+                "tool_calls": null
+              },
+              "finish_reason": null,
+              "index": 0,
+              "logprobs": null
+            }
+          ],
+          "created": 1756921326,
+          "model": "llama3.2:3b-instruct-fp16",
+          "object": "chat.completion.chunk",
+          "service_tier": null,
+          "system_fingerprint": "fp_ollama",
+          "usage": null
+        }
+      },
+      {
+        "__type__": "openai.types.chat.chat_completion_chunk.ChatCompletionChunk",
+        "__data__": {
+          "id": "chatcmpl-358",
+          "choices": [
+            {
+              "delta": {
+                "content": ":\n\n",
+                "function_call": null,
+                "refusal": null,
+                "role": "assistant",
+                "tool_calls": null
+              },
+              "finish_reason": null,
+              "index": 0,
+              "logprobs": null
+            }
+          ],
+          "created": 1756921326,
+          "model": "llama3.2:3b-instruct-fp16",
+          "object": "chat.completion.chunk",
+          "service_tier": null,
+          "system_fingerprint": "fp_ollama",
+          "usage": null
+        }
+      },
+      {
+        "__type__": "openai.types.chat.chat_completion_chunk.ChatCompletionChunk",
+        "__data__": {
+          "id": "chatcmpl-358",
+          "choices": [
+            {
+              "delta": {
+                "content": "1",
+                "function_call": null,
+                "refusal": null,
+                "role": "assistant",
+                "tool_calls": null
+              },
+              "finish_reason": null,
+              "index": 0,
+              "logprobs": null
+            }
+          ],
+          "created": 1756921326,
+          "model": "llama3.2:3b-instruct-fp16",
+          "object": "chat.completion.chunk",
+          "service_tier": null,
+          "system_fingerprint": "fp_ollama",
+          "usage": null
+        }
+      },
+      {
+        "__type__": "openai.types.chat.chat_completion_chunk.ChatCompletionChunk",
+        "__data__": {
+          "id": "chatcmpl-358",
+          "choices": [
+            {
+              "delta": {
+                "content": ".",
+                "function_call": null,
+                "refusal": null,
+                "role": "assistant",
+                "tool_calls": null
+              },
+              "finish_reason": null,
+              "index": 0,
+              "logprobs": null
+            }
+          ],
+          "created": 1756921326,
+          "model": "llama3.2:3b-instruct-fp16",
+          "object": "chat.completion.chunk",
+          "service_tier": null,
+          "system_fingerprint": "fp_ollama",
+          "usage": null
+        }
+      },
+      {
+        "__type__": "openai.types.chat.chat_completion_chunk.ChatCompletionChunk",
+        "__data__": {
+          "id": "chatcmpl-358",
+          "choices": [
+            {
+              "delta": {
+                "content": " **",
+                "function_call": null,
+                "refusal": null,
+                "role": "assistant",
+                "tool_calls": null
+              },
+              "finish_reason": null,
+              "index": 0,
+              "logprobs": null
+            }
+          ],
+          "created": 1756921326,
+          "model": "llama3.2:3b-instruct-fp16",
+          "object": "chat.completion.chunk",
+          "service_tier": null,
+          "system_fingerprint": "fp_ollama",
+          "usage": null
+        }
+      },
+      {
+        "__type__": "openai.types.chat.chat_completion_chunk.ChatCompletionChunk",
+        "__data__": {
+          "id": "chatcmpl-358",
+          "choices": [
+            {
+              "delta": {
+                "content": "Spring",
+                "function_call": null,
+                "refusal": null,
+                "role": "assistant",
+                "tool_calls": null
+              },
+              "finish_reason": null,
+              "index": 0,
+              "logprobs": null
+            }
+          ],
+          "created": 1756921326,
+          "model": "llama3.2:3b-instruct-fp16",
+          "object": "chat.completion.chunk",
+          "service_tier": null,
+          "system_fingerprint": "fp_ollama",
+          "usage": null
+        }
+      },
+      {
+        "__type__": "openai.types.chat.chat_completion_chunk.ChatCompletionChunk",
+        "__data__": {
+          "id": "chatcmpl-358",
+          "choices": [
+            {
+              "delta": {
+                "content": " (",
+                "function_call": null,
+                "refusal": null,
+                "role": "assistant",
+                "tool_calls": null
+              },
+              "finish_reason": null,
+              "index": 0,
+              "logprobs": null
+            }
+          ],
+          "created": 1756921326,
+          "model": "llama3.2:3b-instruct-fp16",
+          "object": "chat.completion.chunk",
+          "service_tier": null,
+          "system_fingerprint": "fp_ollama",
+          "usage": null
+        }
+      },
+      {
+        "__type__": "openai.types.chat.chat_completion_chunk.ChatCompletionChunk",
+        "__data__": {
+          "id": "chatcmpl-358",
+          "choices": [
+            {
+              "delta": {
+                "content": "March",
+                "function_call": null,
+                "refusal": null,
+                "role": "assistant",
+                "tool_calls": null
+              },
+              "finish_reason": null,
+              "index": 0,
+              "logprobs": null
+            }
+          ],
+          "created": 1756921326,
+          "model": "llama3.2:3b-instruct-fp16",
+          "object": "chat.completion.chunk",
+          "service_tier": null,
+          "system_fingerprint": "fp_ollama",
+          "usage": null
+        }
+      },
+      {
+        "__type__": "openai.types.chat.chat_completion_chunk.ChatCompletionChunk",
+        "__data__": {
+          "id": "chatcmpl-358",
+          "choices": [
+            {
+              "delta": {
+                "content": " to",
+                "function_call": null,
+                "refusal": null,
+                "role": "assistant",
+                "tool_calls": null
+              },
+              "finish_reason": null,
+              "index": 0,
+              "logprobs": null
+            }
+          ],
+          "created": 1756921326,
+          "model": "llama3.2:3b-instruct-fp16",
+          "object": "chat.completion.chunk",
+          "service_tier": null,
+          "system_fingerprint": "fp_ollama",
+          "usage": null
+        }
+      },
+      {
+        "__type__": "openai.types.chat.chat_completion_chunk.ChatCompletionChunk",
+        "__data__": {
+          "id": "chatcmpl-358",
+          "choices": [
+            {
+              "delta": {
+                "content": " May",
+                "function_call": null,
+                "refusal": null,
+                "role": "assistant",
+                "tool_calls": null
+              },
+              "finish_reason": null,
+              "index": 0,
+              "logprobs": null
+            }
+          ],
+          "created": 1756921326,
+          "model": "llama3.2:3b-instruct-fp16",
+          "object": "chat.completion.chunk",
+          "service_tier": null,
+          "system_fingerprint": "fp_ollama",
+          "usage": null
+        }
+      },
+      {
+        "__type__": "openai.types.chat.chat_completion_chunk.ChatCompletionChunk",
+        "__data__": {
+          "id": "chatcmpl-358",
+          "choices": [
+            {
+              "delta": {
+                "content": ")**",
+                "function_call": null,
+                "refusal": null,
+                "role": "assistant",
+                "tool_calls": null
+              },
+              "finish_reason": null,
+              "index": 0,
+              "logprobs": null
+            }
+          ],
+          "created": 1756921326,
+          "model": "llama3.2:3b-instruct-fp16",
+          "object": "chat.completion.chunk",
+          "service_tier": null,
+          "system_fingerprint": "fp_ollama",
+          "usage": null
+        }
+      },
+      {
+        "__type__": "openai.types.chat.chat_completion_chunk.ChatCompletionChunk",
+        "__data__": {
+          "id": "chatcmpl-358",
+          "choices": [
+            {
+              "delta": {
+                "content": ":",
+                "function_call": null,
+                "refusal": null,
+                "role": "assistant",
+                "tool_calls": null
+              },
+              "finish_reason": null,
+              "index": 0,
+              "logprobs": null
+            }
+          ],
+          "created": 1756921326,
+          "model": "llama3.2:3b-instruct-fp16",
+          "object": "chat.completion.chunk",
+          "service_tier": null,
+          "system_fingerprint": "fp_ollama",
+          "usage": null
+        }
+      },
+      {
+        "__type__": "openai.types.chat.chat_completion_chunk.ChatCompletionChunk",
+        "__data__": {
+          "id": "chatcmpl-358",
+          "choices": [
+            {
+              "delta": {
+                "content": " Mild",
+                "function_call": null,
+                "refusal": null,
+                "role": "assistant",
+                "tool_calls": null
+              },
+              "finish_reason": null,
+              "index": 0,
+              "logprobs": null
+            }
+          ],
+          "created": 1756921326,
+          "model": "llama3.2:3b-instruct-fp16",
+          "object": "chat.completion.chunk",
+          "service_tier": null,
+          "system_fingerprint": "fp_ollama",
+          "usage": null
+        }
+      },
+      {
+        "__type__": "openai.types.chat.chat_completion_chunk.ChatCompletionChunk",
+        "__data__": {
+          "id": "chatcmpl-358",
+          "choices": [
+            {
+              "delta": {
+                "content": " temperatures",
+                "function_call": null,
+                "refusal": null,
+                "role": "assistant",
+                "tool_calls": null
+              },
+              "finish_reason": null,
+              "index": 0,
+              "logprobs": null
+            }
+          ],
+          "created": 1756921326,
+          "model": "llama3.2:3b-instruct-fp16",
+          "object": "chat.completion.chunk",
+          "service_tier": null,
+          "system_fingerprint": "fp_ollama",
+          "usage": null
+        }
+      },
+      {
+        "__type__": "openai.types.chat.chat_completion_chunk.ChatCompletionChunk",
+        "__data__": {
+          "id": "chatcmpl-358",
+          "choices": [
+            {
+              "delta": {
+                "content": ",",
+                "function_call": null,
+                "refusal": null,
+                "role": "assistant",
+                "tool_calls": null
+              },
+              "finish_reason": null,
+              "index": 0,
+              "logprobs": null
+            }
+          ],
+          "created": 1756921326,
+          "model": "llama3.2:3b-instruct-fp16",
+          "object": "chat.completion.chunk",
+          "service_tier": null,
+          "system_fingerprint": "fp_ollama",
+          "usage": null
+        }
+      },
+      {
+        "__type__": "openai.types.chat.chat_completion_chunk.ChatCompletionChunk",
+        "__data__": {
+          "id": "chatcmpl-358",
+          "choices": [
+            {
+              "delta": {
+                "content": " ranging",
+                "function_call": null,
+                "refusal": null,
+                "role": "assistant",
+                "tool_calls": null
+              },
+              "finish_reason": null,
+              "index": 0,
+              "logprobs": null
+            }
+          ],
+          "created": 1756921326,
+          "model": "llama3.2:3b-instruct-fp16",
+          "object": "chat.completion.chunk",
+          "service_tier": null,
+          "system_fingerprint": "fp_ollama",
+          "usage": null
+        }
+      },
+      {
+        "__type__": "openai.types.chat.chat_completion_chunk.ChatCompletionChunk",
+        "__data__": {
+          "id": "chatcmpl-358",
+          "choices": [
+            {
+              "delta": {
+                "content": " from",
+                "function_call": null,
+                "refusal": null,
+                "role": "assistant",
+                "tool_calls": null
+              },
+              "finish_reason": null,
+              "index": 0,
+              "logprobs": null
+            }
+          ],
+          "created": 1756921326,
+          "model": "llama3.2:3b-instruct-fp16",
+          "object": "chat.completion.chunk",
+          "service_tier": null,
+          "system_fingerprint": "fp_ollama",
+          "usage": null
+        }
+      },
+      {
+        "__type__": "openai.types.chat.chat_completion_chunk.ChatCompletionChunk",
+        "__data__": {
+          "id": "chatcmpl-358",
+          "choices": [
+            {
+              "delta": {
+                "content": " ",
+                "function_call": null,
+                "refusal": null,
+                "role": "assistant",
+                "tool_calls": null
+              },
+              "finish_reason": null,
+              "index": 0,
+              "logprobs": null
+            }
+          ],
+          "created": 1756921326,
+          "model": "llama3.2:3b-instruct-fp16",
+          "object": "chat.completion.chunk",
+          "service_tier": null,
+          "system_fingerprint": "fp_ollama",
+          "usage": null
+        }
+      },
+      {
+        "__type__": "openai.types.chat.chat_completion_chunk.ChatCompletionChunk",
+        "__data__": {
+          "id": "chatcmpl-358",
+          "choices": [
+            {
+              "delta": {
+                "content": "15",
+                "function_call": null,
+                "refusal": null,
+                "role": "assistant",
+                "tool_calls": null
+              },
+              "finish_reason": null,
+              "index": 0,
+              "logprobs": null
+            }
+          ],
+          "created": 1756921327,
+          "model": "llama3.2:3b-instruct-fp16",
+          "object": "chat.completion.chunk",
+          "service_tier": null,
+          "system_fingerprint": "fp_ollama",
+          "usage": null
+        }
+      },
+      {
+        "__type__": "openai.types.chat.chat_completion_chunk.ChatCompletionChunk",
+        "__data__": {
+          "id": "chatcmpl-358",
+          "choices": [
+            {
+              "delta": {
+                "content": "\u00b0C",
+                "function_call": null,
+                "refusal": null,
+                "role": "assistant",
+                "tool_calls": null
+              },
+              "finish_reason": null,
+              "index": 0,
+              "logprobs": null
+            }
+          ],
+          "created": 1756921327,
+          "model": "llama3.2:3b-instruct-fp16",
+          "object": "chat.completion.chunk",
+          "service_tier": null,
+          "system_fingerprint": "fp_ollama",
+          "usage": null
+        }
+      },
+      {
+        "__type__": "openai.types.chat.chat_completion_chunk.ChatCompletionChunk",
+        "__data__": {
+          "id": "chatcmpl-358",
+          "choices": [
+            {
+              "delta": {
+                "content": " (",
+                "function_call": null,
+                "refusal": null,
+                "role": "assistant",
+                "tool_calls": null
+              },
+              "finish_reason": null,
+              "index": 0,
+              "logprobs": null
+            }
+          ],
+          "created": 1756921327,
+          "model": "llama3.2:3b-instruct-fp16",
+          "object": "chat.completion.chunk",
+          "service_tier": null,
+          "system_fingerprint": "fp_ollama",
+          "usage": null
+        }
+      },
+      {
+        "__type__": "openai.types.chat.chat_completion_chunk.ChatCompletionChunk",
+        "__data__": {
+          "id": "chatcmpl-358",
+          "choices": [
+            {
+              "delta": {
+                "content": "59",
+                "function_call": null,
+                "refusal": null,
+                "role": "assistant",
+                "tool_calls": null
+              },
+              "finish_reason": null,
+              "index": 0,
+              "logprobs": null
+            }
+          ],
+          "created": 1756921327,
+          "model": "llama3.2:3b-instruct-fp16",
+          "object": "chat.completion.chunk",
+          "service_tier": null,
+          "system_fingerprint": "fp_ollama",
+          "usage": null
+        }
+      },
+      {
+        "__type__": "openai.types.chat.chat_completion_chunk.ChatCompletionChunk",
+        "__data__": {
+          "id": "chatcmpl-358",
+          "choices": [
+            {
+              "delta": {
+                "content": "\u00b0F",
+                "function_call": null,
+                "refusal": null,
+                "role": "assistant",
+                "tool_calls": null
+              },
+              "finish_reason": null,
+              "index": 0,
+              "logprobs": null
+            }
+          ],
+          "created": 1756921327,
+          "model": "llama3.2:3b-instruct-fp16",
+          "object": "chat.completion.chunk",
+          "service_tier": null,
+          "system_fingerprint": "fp_ollama",
+          "usage": null
+        }
+      },
+      {
+        "__type__": "openai.types.chat.chat_completion_chunk.ChatCompletionChunk",
+        "__data__": {
+          "id": "chatcmpl-358",
+          "choices": [
+            {
+              "delta": {
+                "content": ")",
+                "function_call": null,
+                "refusal": null,
+                "role": "assistant",
+                "tool_calls": null
+              },
+              "finish_reason": null,
+              "index": 0,
+              "logprobs": null
+            }
+          ],
+          "created": 1756921327,
+          "model": "llama3.2:3b-instruct-fp16",
+          "object": "chat.completion.chunk",
+          "service_tier": null,
+          "system_fingerprint": "fp_ollama",
+          "usage": null
+        }
+      },
+      {
+        "__type__": "openai.types.chat.chat_completion_chunk.ChatCompletionChunk",
+        "__data__": {
+          "id": "chatcmpl-358",
+          "choices": [
+            {
+              "delta": {
+                "content": " to",
+                "function_call": null,
+                "refusal": null,
+                "role": "assistant",
+                "tool_calls": null
+              },
+              "finish_reason": null,
+              "index": 0,
+              "logprobs": null
+            }
+          ],
+          "created": 1756921327,
+          "model": "llama3.2:3b-instruct-fp16",
+          "object": "chat.completion.chunk",
+          "service_tier": null,
+          "system_fingerprint": "fp_ollama",
+          "usage": null
+        }
+      },
+      {
+        "__type__": "openai.types.chat.chat_completion_chunk.ChatCompletionChunk",
+        "__data__": {
+          "id": "chatcmpl-358",
+          "choices": [
+            {
+              "delta": {
+                "content": " ",
+                "function_call": null,
+                "refusal": null,
+                "role": "assistant",
+                "tool_calls": null
+              },
+              "finish_reason": null,
+              "index": 0,
+              "logprobs": null
+            }
+          ],
+          "created": 1756921327,
+          "model": "llama3.2:3b-instruct-fp16",
+          "object": "chat.completion.chunk",
+          "service_tier": null,
+          "system_fingerprint": "fp_ollama",
+          "usage": null
+        }
+      },
+      {
+        "__type__": "openai.types.chat.chat_completion_chunk.ChatCompletionChunk",
+        "__data__": {
+          "id": "chatcmpl-358",
+          "choices": [
+            {
+              "delta": {
+                "content": "20",
+                "function_call": null,
+                "refusal": null,
+                "role": "assistant",
+                "tool_calls": null
+              },
+              "finish_reason": null,
+              "index": 0,
+              "logprobs": null
+            }
+          ],
+          "created": 1756921327,
+          "model": "llama3.2:3b-instruct-fp16",
+          "object": "chat.completion.chunk",
+          "service_tier": null,
+          "system_fingerprint": "fp_ollama",
+          "usage": null
+        }
+      },
+      {
+        "__type__": "openai.types.chat.chat_completion_chunk.ChatCompletionChunk",
+        "__data__": {
+          "id": "chatcmpl-358",
+          "choices": [
+            {
+              "delta": {
+                "content": "\u00b0C",
+                "function_call": null,
+                "refusal": null,
+                "role": "assistant",
+                "tool_calls": null
+              },
+              "finish_reason": null,
+              "index": 0,
+              "logprobs": null
+            }
+          ],
+          "created": 1756921327,
+          "model": "llama3.2:3b-instruct-fp16",
+          "object": "chat.completion.chunk",
+          "service_tier": null,
+          "system_fingerprint": "fp_ollama",
+          "usage": null
+        }
+      },
+      {
+        "__type__": "openai.types.chat.chat_completion_chunk.ChatCompletionChunk",
+        "__data__": {
+          "id": "chatcmpl-358",
+          "choices": [
+            {
+              "delta": {
+                "content": " (",
+                "function_call": null,
+                "refusal": null,
+                "role": "assistant",
+                "tool_calls": null
+              },
+              "finish_reason": null,
+              "index": 0,
+              "logprobs": null
+            }
+          ],
+          "created": 1756921327,
+          "model": "llama3.2:3b-instruct-fp16",
+          "object": "chat.completion.chunk",
+          "service_tier": null,
+          "system_fingerprint": "fp_ollama",
+          "usage": null
+        }
+      },
+      {
+        "__type__": "openai.types.chat.chat_completion_chunk.ChatCompletionChunk",
+        "__data__": {
+          "id": "chatcmpl-358",
+          "choices": [
+            {
+              "delta": {
+                "content": "68",
+                "function_call": null,
+                "refusal": null,
+                "role": "assistant",
+                "tool_calls": null
+              },
+              "finish_reason": null,
+              "index": 0,
+              "logprobs": null
+            }
+          ],
+          "created": 1756921327,
+          "model": "llama3.2:3b-instruct-fp16",
+          "object": "chat.completion.chunk",
+          "service_tier": null,
+          "system_fingerprint": "fp_ollama",
+          "usage": null
+        }
+      },
+      {
+        "__type__": "openai.types.chat.chat_completion_chunk.ChatCompletionChunk",
+        "__data__": {
+          "id": "chatcmpl-358",
+          "choices": [
+            {
+              "delta": {
+                "content": "\u00b0F",
+                "function_call": null,
+                "refusal": null,
+                "role": "assistant",
+                "tool_calls": null
+              },
+              "finish_reason": null,
+              "index": 0,
+              "logprobs": null
+            }
+          ],
+          "created": 1756921327,
+          "model": "llama3.2:3b-instruct-fp16",
+          "object": "chat.completion.chunk",
+          "service_tier": null,
+          "system_fingerprint": "fp_ollama",
+          "usage": null
+        }
+      },
+      {
+        "__type__": "openai.types.chat.chat_completion_chunk.ChatCompletionChunk",
+        "__data__": {
+          "id": "chatcmpl-358",
+          "choices": [
+            {
+              "delta": {
+                "content": "),",
+                "function_call": null,
+                "refusal": null,
+                "role": "assistant",
+                "tool_calls": null
+              },
+              "finish_reason": null,
+              "index": 0,
+              "logprobs": null
+            }
+          ],
+          "created": 1756921327,
+          "model": "llama3.2:3b-instruct-fp16",
+          "object": "chat.completion.chunk",
+          "service_tier": null,
+          "system_fingerprint": "fp_ollama",
+          "usage": null
+        }
+      },
+      {
+        "__type__": "openai.types.chat.chat_completion_chunk.ChatCompletionChunk",
+        "__data__": {
+          "id": "chatcmpl-358",
+          "choices": [
+            {
+              "delta": {
+                "content": " with",
+                "function_call": null,
+                "refusal": null,
+                "role": "assistant",
+                "tool_calls": null
+              },
+              "finish_reason": null,
+              "index": 0,
+              "logprobs": null
+            }
+          ],
+          "created": 1756921327,
+          "model": "llama3.2:3b-instruct-fp16",
+          "object": "chat.completion.chunk",
+          "service_tier": null,
+          "system_fingerprint": "fp_ollama",
+          "usage": null
+        }
+      },
+      {
+        "__type__": "openai.types.chat.chat_completion_chunk.ChatCompletionChunk",
+        "__data__": {
+          "id": "chatcmpl-358",
+          "choices": [
+            {
+              "delta": {
+                "content": " gentle",
+                "function_call": null,
+                "refusal": null,
+                "role": "assistant",
+                "tool_calls": null
+              },
+              "finish_reason": null,
+              "index": 0,
+              "logprobs": null
+            }
+          ],
+          "created": 1756921327,
+          "model": "llama3.2:3b-instruct-fp16",
+          "object": "chat.completion.chunk",
+          "service_tier": null,
+          "system_fingerprint": "fp_ollama",
+          "usage": null
+        }
+      },
+      {
+        "__type__": "openai.types.chat.chat_completion_chunk.ChatCompletionChunk",
+        "__data__": {
+          "id": "chatcmpl-358",
+          "choices": [
+            {
+              "delta": {
+                "content": " humidity",
+                "function_call": null,
+                "refusal": null,
+                "role": "assistant",
+                "tool_calls": null
+              },
+              "finish_reason": null,
+              "index": 0,
+              "logprobs": null
+            }
+          ],
+          "created": 1756921327,
+          "model": "llama3.2:3b-instruct-fp16",
+          "object": "chat.completion.chunk",
+          "service_tier": null,
+          "system_fingerprint": "fp_ollama",
+          "usage": null
+        }
+      },
+      {
+        "__type__": "openai.types.chat.chat_completion_chunk.ChatCompletionChunk",
+        "__data__": {
+          "id": "chatcmpl-358",
+          "choices": [
+            {
+              "delta": {
+                "content": ".\n\n",
+                "function_call": null,
+                "refusal": null,
+                "role": "assistant",
+                "tool_calls": null
+              },
+              "finish_reason": null,
+              "index": 0,
+              "logprobs": null
+            }
+          ],
+          "created": 1756921327,
+          "model": "llama3.2:3b-instruct-fp16",
+          "object": "chat.completion.chunk",
+          "service_tier": null,
+          "system_fingerprint": "fp_ollama",
+          "usage": null
+        }
+      },
+      {
+        "__type__": "openai.types.chat.chat_completion_chunk.ChatCompletionChunk",
+        "__data__": {
+          "id": "chatcmpl-358",
+          "choices": [
+            {
+              "delta": {
+                "content": "2",
+                "function_call": null,
+                "refusal": null,
+                "role": "assistant",
+                "tool_calls": null
+              },
+              "finish_reason": null,
+              "index": 0,
+              "logprobs": null
+            }
+          ],
+          "created": 1756921327,
+          "model": "llama3.2:3b-instruct-fp16",
+          "object": "chat.completion.chunk",
+          "service_tier": null,
+          "system_fingerprint": "fp_ollama",
+          "usage": null
+        }
+      },
+      {
+        "__type__": "openai.types.chat.chat_completion_chunk.ChatCompletionChunk",
+        "__data__": {
+          "id": "chatcmpl-358",
+          "choices": [
+            {
+              "delta": {
+                "content": ".",
+                "function_call": null,
+                "refusal": null,
+                "role": "assistant",
+                "tool_calls": null
+              },
+              "finish_reason": null,
+              "index": 0,
+              "logprobs": null
+            }
+          ],
+          "created": 1756921327,
+          "model": "llama3.2:3b-instruct-fp16",
+          "object": "chat.completion.chunk",
+          "service_tier": null,
+          "system_fingerprint": "fp_ollama",
+          "usage": null
+        }
+      },
+      {
+        "__type__": "openai.types.chat.chat_completion_chunk.ChatCompletionChunk",
+        "__data__": {
+          "id": "chatcmpl-358",
+          "choices": [
+            {
+              "delta": {
+                "content": " **",
+                "function_call": null,
+                "refusal": null,
+                "role": "assistant",
+                "tool_calls": null
+              },
+              "finish_reason": null,
+              "index": 0,
+              "logprobs": null
+            }
+          ],
+          "created": 1756921327,
+          "model": "llama3.2:3b-instruct-fp16",
+          "object": "chat.completion.chunk",
+          "service_tier": null,
+          "system_fingerprint": "fp_ollama",
+          "usage": null
+        }
+      },
+      {
+        "__type__": "openai.types.chat.chat_completion_chunk.ChatCompletionChunk",
+        "__data__": {
+          "id": "chatcmpl-358",
+          "choices": [
+            {
+              "delta": {
+                "content": "Summer",
+                "function_call": null,
+                "refusal": null,
+                "role": "assistant",
+                "tool_calls": null
+              },
+              "finish_reason": null,
+              "index": 0,
+              "logprobs": null
+            }
+          ],
+          "created": 1756921327,
+          "model": "llama3.2:3b-instruct-fp16",
+          "object": "chat.completion.chunk",
+          "service_tier": null,
+          "system_fingerprint": "fp_ollama",
+          "usage": null
+        }
+      },
+      {
+        "__type__": "openai.types.chat.chat_completion_chunk.ChatCompletionChunk",
+        "__data__": {
+          "id": "chatcmpl-358",
+          "choices": [
+            {
+              "delta": {
+                "content": " (",
+                "function_call": null,
+                "refusal": null,
+                "role": "assistant",
+                "tool_calls": null
+              },
+              "finish_reason": null,
+              "index": 0,
+              "logprobs": null
+            }
+          ],
+          "created": 1756921327,
+          "model": "llama3.2:3b-instruct-fp16",
+          "object": "chat.completion.chunk",
+          "service_tier": null,
+          "system_fingerprint": "fp_ollama",
+          "usage": null
+        }
+      },
+      {
+        "__type__": "openai.types.chat.chat_completion_chunk.ChatCompletionChunk",
+        "__data__": {
+          "id": "chatcmpl-358",
+          "choices": [
+            {
+              "delta": {
+                "content": "June",
+                "function_call": null,
+                "refusal": null,
+                "role": "assistant",
+                "tool_calls": null
+              },
+              "finish_reason": null,
+              "index": 0,
+              "logprobs": null
+            }
+          ],
+          "created": 1756921327,
+          "model": "llama3.2:3b-instruct-fp16",
+          "object": "chat.completion.chunk",
+          "service_tier": null,
+          "system_fingerprint": "fp_ollama",
+          "usage": null
+        }
+      },
+      {
+        "__type__": "openai.types.chat.chat_completion_chunk.ChatCompletionChunk",
+        "__data__": {
+          "id": "chatcmpl-358",
+          "choices": [
+            {
+              "delta": {
+                "content": " to",
+                "function_call": null,
+                "refusal": null,
+                "role": "assistant",
+                "tool_calls": null
+              },
+              "finish_reason": null,
+              "index": 0,
+              "logprobs": null
+            }
+          ],
+          "created": 1756921327,
+          "model": "llama3.2:3b-instruct-fp16",
+          "object": "chat.completion.chunk",
+          "service_tier": null,
+          "system_fingerprint": "fp_ollama",
+          "usage": null
+        }
+      },
+      {
+        "__type__": "openai.types.chat.chat_completion_chunk.ChatCompletionChunk",
+        "__data__": {
+          "id": "chatcmpl-358",
+          "choices": [
+            {
+              "delta": {
+                "content": " August",
+                "function_call": null,
+                "refusal": null,
+                "role": "assistant",
+                "tool_calls": null
+              },
+              "finish_reason": null,
+              "index": 0,
+              "logprobs": null
+            }
+          ],
+          "created": 1756921328,
+          "model": "llama3.2:3b-instruct-fp16",
+          "object": "chat.completion.chunk",
+          "service_tier": null,
+          "system_fingerprint": "fp_ollama",
+          "usage": null
+        }
+      },
+      {
+        "__type__": "openai.types.chat.chat_completion_chunk.ChatCompletionChunk",
+        "__data__": {
+          "id": "chatcmpl-358",
+          "choices": [
+            {
+              "delta": {
+                "content": ")**",
+                "function_call": null,
+                "refusal": null,
+                "role": "assistant",
+                "tool_calls": null
+              },
+              "finish_reason": null,
+              "index": 0,
+              "logprobs": null
+            }
+          ],
+          "created": 1756921328,
+          "model": "llama3.2:3b-instruct-fp16",
+          "object": "chat.completion.chunk",
+          "service_tier": null,
+          "system_fingerprint": "fp_ollama",
+          "usage": null
+        }
+      },
+      {
+        "__type__": "openai.types.chat.chat_completion_chunk.ChatCompletionChunk",
+        "__data__": {
+          "id": "chatcmpl-358",
+          "choices": [
+            {
+              "delta": {
+                "content": ":",
+                "function_call": null,
+                "refusal": null,
+                "role": "assistant",
+                "tool_calls": null
+              },
+              "finish_reason": null,
+              "index": 0,
+              "logprobs": null
+            }
+          ],
+          "created": 1756921328,
+          "model": "llama3.2:3b-instruct-fp16",
+          "object": "chat.completion.chunk",
+          "service_tier": null,
+          "system_fingerprint": "fp_ollama",
+          "usage": null
+        }
+      },
+      {
+        "__type__": "openai.types.chat.chat_completion_chunk.ChatCompletionChunk",
+        "__data__": {
+          "id": "chatcmpl-358",
+          "choices": [
+            {
+              "delta": {
+                "content": " Hot",
+                "function_call": null,
+                "refusal": null,
+                "role": "assistant",
+                "tool_calls": null
+              },
+              "finish_reason": null,
+              "index": 0,
+              "logprobs": null
+            }
+          ],
+          "created": 1756921328,
+          "model": "llama3.2:3b-instruct-fp16",
+          "object": "chat.completion.chunk",
+          "service_tier": null,
+          "system_fingerprint": "fp_ollama",
+          "usage": null
+        }
+      },
+      {
+        "__type__": "openai.types.chat.chat_completion_chunk.ChatCompletionChunk",
+        "__data__": {
+          "id": "chatcmpl-358",
+          "choices": [
+            {
+              "delta": {
+                "content": " and",
+                "function_call": null,
+                "refusal": null,
+                "role": "assistant",
+                "tool_calls": null
+              },
+              "finish_reason": null,
+              "index": 0,
+              "logprobs": null
+            }
+          ],
+          "created": 1756921328,
+          "model": "llama3.2:3b-instruct-fp16",
+          "object": "chat.completion.chunk",
+          "service_tier": null,
+          "system_fingerprint": "fp_ollama",
+          "usage": null
+        }
+      },
+      {
+        "__type__": "openai.types.chat.chat_completion_chunk.ChatCompletionChunk",
+        "__data__": {
+          "id": "chatcmpl-358",
+          "choices": [
+            {
+              "delta": {
+                "content": " humid",
+                "function_call": null,
+                "refusal": null,
+                "role": "assistant",
+                "tool_calls": null
+              },
+              "finish_reason": null,
+              "index": 0,
+              "logprobs": null
+            }
+          ],
+          "created": 1756921328,
+          "model": "llama3.2:3b-instruct-fp16",
+          "object": "chat.completion.chunk",
+          "service_tier": null,
+          "system_fingerprint": "fp_ollama",
+          "usage": null
+        }
+      },
+      {
+        "__type__": "openai.types.chat.chat_completion_chunk.ChatCompletionChunk",
+        "__data__": {
+          "id": "chatcmpl-358",
+          "choices": [
+            {
+              "delta": {
+                "content": ",",
+                "function_call": null,
+                "refusal": null,
+                "role": "assistant",
+                "tool_calls": null
+              },
+              "finish_reason": null,
+              "index": 0,
+              "logprobs": null
+            }
+          ],
+          "created": 1756921328,
+          "model": "llama3.2:3b-instruct-fp16",
+          "object": "chat.completion.chunk",
+          "service_tier": null,
+          "system_fingerprint": "fp_ollama",
+          "usage": null
+        }
+      },
+      {
+        "__type__": "openai.types.chat.chat_completion_chunk.ChatCompletionChunk",
+        "__data__": {
+          "id": "chatcmpl-358",
+          "choices": [
+            {
+              "delta": {
+                "content": " with",
+                "function_call": null,
+                "refusal": null,
+                "role": "assistant",
+                "tool_calls": null
+              },
+              "finish_reason": null,
+              "index": 0,
+              "logprobs": null
+            }
+          ],
+          "created": 1756921328,
+          "model": "llama3.2:3b-instruct-fp16",
+          "object": "chat.completion.chunk",
+          "service_tier": null,
+          "system_fingerprint": "fp_ollama",
+          "usage": null
+        }
+      },
+      {
+        "__type__": "openai.types.chat.chat_completion_chunk.ChatCompletionChunk",
+        "__data__": {
+          "id": "chatcmpl-358",
+          "choices": [
+            {
+              "delta": {
+                "content": " temperatures",
+                "function_call": null,
+                "refusal": null,
+                "role": "assistant",
+                "tool_calls": null
+              },
+              "finish_reason": null,
+              "index": 0,
+              "logprobs": null
+            }
+          ],
+          "created": 1756921328,
+          "model": "llama3.2:3b-instruct-fp16",
+          "object": "chat.completion.chunk",
+          "service_tier": null,
+          "system_fingerprint": "fp_ollama",
+          "usage": null
+        }
+      },
+      {
+        "__type__": "openai.types.chat.chat_completion_chunk.ChatCompletionChunk",
+        "__data__": {
+          "id": "chatcmpl-358",
+          "choices": [
+            {
+              "delta": {
+                "content": " generally",
+                "function_call": null,
+                "refusal": null,
+                "role": "assistant",
+                "tool_calls": null
+              },
+              "finish_reason": null,
+              "index": 0,
+              "logprobs": null
+            }
+          ],
+          "created": 1756921328,
+          "model": "llama3.2:3b-instruct-fp16",
+          "object": "chat.completion.chunk",
+          "service_tier": null,
+          "system_fingerprint": "fp_ollama",
+          "usage": null
+        }
+      },
+      {
+        "__type__": "openai.types.chat.chat_completion_chunk.ChatCompletionChunk",
+        "__data__": {
+          "id": "chatcmpl-358",
+          "choices": [
+            {
+              "delta": {
+                "content": " between",
+                "function_call": null,
+                "refusal": null,
+                "role": "assistant",
+                "tool_calls": null
+              },
+              "finish_reason": null,
+              "index": 0,
+              "logprobs": null
+            }
+          ],
+          "created": 1756921328,
+          "model": "llama3.2:3b-instruct-fp16",
+          "object": "chat.completion.chunk",
+          "service_tier": null,
+          "system_fingerprint": "fp_ollama",
+          "usage": null
+        }
+      },
+      {
+        "__type__": "openai.types.chat.chat_completion_chunk.ChatCompletionChunk",
+        "__data__": {
+          "id": "chatcmpl-358",
+          "choices": [
+            {
+              "delta": {
+                "content": " ",
+                "function_call": null,
+                "refusal": null,
+                "role": "assistant",
+                "tool_calls": null
+              },
+              "finish_reason": null,
+              "index": 0,
+              "logprobs": null
+            }
+          ],
+          "created": 1756921328,
+          "model": "llama3.2:3b-instruct-fp16",
+          "object": "chat.completion.chunk",
+          "service_tier": null,
+          "system_fingerprint": "fp_ollama",
+          "usage": null
+        }
+      },
+      {
+        "__type__": "openai.types.chat.chat_completion_chunk.ChatCompletionChunk",
+        "__data__": {
+          "id": "chatcmpl-358",
+          "choices": [
+            {
+              "delta": {
+                "content": "25",
+                "function_call": null,
+                "refusal": null,
+                "role": "assistant",
+                "tool_calls": null
+              },
+              "finish_reason": null,
+              "index": 0,
+              "logprobs": null
+            }
+          ],
+          "created": 1756921328,
+          "model": "llama3.2:3b-instruct-fp16",
+          "object": "chat.completion.chunk",
+          "service_tier": null,
+          "system_fingerprint": "fp_ollama",
+          "usage": null
+        }
+      },
+      {
+        "__type__": "openai.types.chat.chat_completion_chunk.ChatCompletionChunk",
+        "__data__": {
+          "id": "chatcmpl-358",
+          "choices": [
+            {
+              "delta": {
+                "content": "\u00b0C",
+                "function_call": null,
+                "refusal": null,
+                "role": "assistant",
+                "tool_calls": null
+              },
+              "finish_reason": null,
+              "index": 0,
+              "logprobs": null
+            }
+          ],
+          "created": 1756921328,
+          "model": "llama3.2:3b-instruct-fp16",
+          "object": "chat.completion.chunk",
+          "service_tier": null,
+          "system_fingerprint": "fp_ollama",
+          "usage": null
+        }
+      },
+      {
+        "__type__": "openai.types.chat.chat_completion_chunk.ChatCompletionChunk",
+        "__data__": {
+          "id": "chatcmpl-358",
+          "choices": [
+            {
+              "delta": {
+                "content": " (",
+                "function_call": null,
+                "refusal": null,
+                "role": "assistant",
+                "tool_calls": null
+              },
+              "finish_reason": null,
+              "index": 0,
+              "logprobs": null
+            }
+          ],
+          "created": 1756921328,
+          "model": "llama3.2:3b-instruct-fp16",
+          "object": "chat.completion.chunk",
+          "service_tier": null,
+          "system_fingerprint": "fp_ollama",
+          "usage": null
+        }
+      },
+      {
+        "__type__": "openai.types.chat.chat_completion_chunk.ChatCompletionChunk",
+        "__data__": {
+          "id": "chatcmpl-358",
+          "choices": [
+            {
+              "delta": {
+                "content": "77",
+                "function_call": null,
+                "refusal": null,
+                "role": "assistant",
+                "tool_calls": null
+              },
+              "finish_reason": null,
+              "index": 0,
+              "logprobs": null
+            }
+          ],
+          "created": 1756921328,
+          "model": "llama3.2:3b-instruct-fp16",
+          "object": "chat.completion.chunk",
+          "service_tier": null,
+          "system_fingerprint": "fp_ollama",
+          "usage": null
+        }
+      },
+      {
+        "__type__": "openai.types.chat.chat_completion_chunk.ChatCompletionChunk",
+        "__data__": {
+          "id": "chatcmpl-358",
+          "choices": [
+            {
+              "delta": {
+                "content": "\u00b0F",
+                "function_call": null,
+                "refusal": null,
+                "role": "assistant",
+                "tool_calls": null
+              },
+              "finish_reason": null,
+              "index": 0,
+              "logprobs": null
+            }
+          ],
+          "created": 1756921328,
+          "model": "llama3.2:3b-instruct-fp16",
+          "object": "chat.completion.chunk",
+          "service_tier": null,
+          "system_fingerprint": "fp_ollama",
+          "usage": null
+        }
+      },
+      {
+        "__type__": "openai.types.chat.chat_completion_chunk.ChatCompletionChunk",
+        "__data__": {
+          "id": "chatcmpl-358",
+          "choices": [
+            {
+              "delta": {
+                "content": ")",
+                "function_call": null,
+                "refusal": null,
+                "role": "assistant",
+                "tool_calls": null
+              },
+              "finish_reason": null,
+              "index": 0,
+              "logprobs": null
+            }
+          ],
+          "created": 1756921328,
+          "model": "llama3.2:3b-instruct-fp16",
+          "object": "chat.completion.chunk",
+          "service_tier": null,
+          "system_fingerprint": "fp_ollama",
+          "usage": null
+        }
+      },
+      {
+        "__type__": "openai.types.chat.chat_completion_chunk.ChatCompletionChunk",
+        "__data__": {
+          "id": "chatcmpl-358",
+          "choices": [
+            {
+              "delta": {
+                "content": " and",
+                "function_call": null,
+                "refusal": null,
+                "role": "assistant",
+                "tool_calls": null
+              },
+              "finish_reason": null,
+              "index": 0,
+              "logprobs": null
+            }
+          ],
+          "created": 1756921328,
+          "model": "llama3.2:3b-instruct-fp16",
+          "object": "chat.completion.chunk",
+          "service_tier": null,
+          "system_fingerprint": "fp_ollama",
+          "usage": null
+        }
+      },
+      {
+        "__type__": "openai.types.chat.chat_completion_chunk.ChatCompletionChunk",
+        "__data__": {
+          "id": "chatcmpl-358",
+          "choices": [
+            {
+              "delta": {
+                "content": " ",
+                "function_call": null,
+                "refusal": null,
+                "role": "assistant",
+                "tool_calls": null
+              },
+              "finish_reason": null,
+              "index": 0,
+              "logprobs": null
+            }
+          ],
+          "created": 1756921328,
+          "model": "llama3.2:3b-instruct-fp16",
+          "object": "chat.completion.chunk",
+          "service_tier": null,
+          "system_fingerprint": "fp_ollama",
+          "usage": null
+        }
+      },
+      {
+        "__type__": "openai.types.chat.chat_completion_chunk.ChatCompletionChunk",
+        "__data__": {
+          "id": "chatcmpl-358",
+          "choices": [
+            {
+              "delta": {
+                "content": "35",
+                "function_call": null,
+                "refusal": null,
+                "role": "assistant",
+                "tool_calls": null
+              },
+              "finish_reason": null,
+              "index": 0,
+              "logprobs": null
+            }
+          ],
+          "created": 1756921328,
+          "model": "llama3.2:3b-instruct-fp16",
+          "object": "chat.completion.chunk",
+          "service_tier": null,
+          "system_fingerprint": "fp_ollama",
+          "usage": null
+        }
+      },
+      {
+        "__type__": "openai.types.chat.chat_completion_chunk.ChatCompletionChunk",
+        "__data__": {
+          "id": "chatcmpl-358",
+          "choices": [
+            {
+              "delta": {
+                "content": "\u00b0C",
+                "function_call": null,
+                "refusal": null,
+                "role": "assistant",
+                "tool_calls": null
+              },
+              "finish_reason": null,
+              "index": 0,
+              "logprobs": null
+            }
+          ],
+          "created": 1756921328,
+          "model": "llama3.2:3b-instruct-fp16",
+          "object": "chat.completion.chunk",
+          "service_tier": null,
+          "system_fingerprint": "fp_ollama",
+          "usage": null
+        }
+      },
+      {
+        "__type__": "openai.types.chat.chat_completion_chunk.ChatCompletionChunk",
+        "__data__": {
+          "id": "chatcmpl-358",
+          "choices": [
+            {
+              "delta": {
+                "content": " (",
+                "function_call": null,
+                "refusal": null,
+                "role": "assistant",
+                "tool_calls": null
+              },
+              "finish_reason": null,
+              "index": 0,
+              "logprobs": null
+            }
+          ],
+          "created": 1756921328,
+          "model": "llama3.2:3b-instruct-fp16",
+          "object": "chat.completion.chunk",
+          "service_tier": null,
+          "system_fingerprint": "fp_ollama",
+          "usage": null
+        }
+      },
+      {
+        "__type__": "openai.types.chat.chat_completion_chunk.ChatCompletionChunk",
+        "__data__": {
+          "id": "chatcmpl-358",
+          "choices": [
+            {
+              "delta": {
+                "content": "95",
+                "function_call": null,
+                "refusal": null,
+                "role": "assistant",
+                "tool_calls": null
+              },
+              "finish_reason": null,
+              "index": 0,
+              "logprobs": null
+            }
+          ],
+          "created": 1756921328,
+          "model": "llama3.2:3b-instruct-fp16",
+          "object": "chat.completion.chunk",
+          "service_tier": null,
+          "system_fingerprint": "fp_ollama",
+          "usage": null
+        }
+      },
+      {
+        "__type__": "openai.types.chat.chat_completion_chunk.ChatCompletionChunk",
+        "__data__": {
+          "id": "chatcmpl-358",
+          "choices": [
+            {
+              "delta": {
+                "content": "\u00b0F",
+                "function_call": null,
+                "refusal": null,
+                "role": "assistant",
+                "tool_calls": null
+              },
+              "finish_reason": null,
+              "index": 0,
+              "logprobs": null
+            }
+          ],
+          "created": 1756921329,
+          "model": "llama3.2:3b-instruct-fp16",
+          "object": "chat.completion.chunk",
+          "service_tier": null,
+          "system_fingerprint": "fp_ollama",
+          "usage": null
+        }
+      },
+      {
+        "__type__": "openai.types.chat.chat_completion_chunk.ChatCompletionChunk",
+        "__data__": {
+          "id": "chatcmpl-358",
+          "choices": [
+            {
+              "delta": {
+                "content": ").",
+                "function_call": null,
+                "refusal": null,
+                "role": "assistant",
+                "tool_calls": null
+              },
+              "finish_reason": null,
+              "index": 0,
+              "logprobs": null
+            }
+          ],
+          "created": 1756921329,
+          "model": "llama3.2:3b-instruct-fp16",
+          "object": "chat.completion.chunk",
+          "service_tier": null,
+          "system_fingerprint": "fp_ollama",
+          "usage": null
+        }
+      },
+      {
+        "__type__": "openai.types.chat.chat_completion_chunk.ChatCompletionChunk",
+        "__data__": {
+          "id": "chatcmpl-358",
+          "choices": [
+            {
+              "delta": {
+                "content": " Heat",
+                "function_call": null,
+                "refusal": null,
+                "role": "assistant",
+                "tool_calls": null
+              },
+              "finish_reason": null,
+              "index": 0,
+              "logprobs": null
+            }
+          ],
+          "created": 1756921329,
+          "model": "llama3.2:3b-instruct-fp16",
+          "object": "chat.completion.chunk",
+          "service_tier": null,
+          "system_fingerprint": "fp_ollama",
+          "usage": null
+        }
+      },
+      {
+        "__type__": "openai.types.chat.chat_completion_chunk.ChatCompletionChunk",
+        "__data__": {
+          "id": "chatcmpl-358",
+          "choices": [
+            {
+              "delta": {
+                "content": "waves",
+                "function_call": null,
+                "refusal": null,
+                "role": "assistant",
+                "tool_calls": null
+              },
+              "finish_reason": null,
+              "index": 0,
+              "logprobs": null
+            }
+          ],
+          "created": 1756921329,
+          "model": "llama3.2:3b-instruct-fp16",
+          "object": "chat.completion.chunk",
+          "service_tier": null,
+          "system_fingerprint": "fp_ollama",
+          "usage": null
+        }
+      },
+      {
+        "__type__": "openai.types.chat.chat_completion_chunk.ChatCompletionChunk",
+        "__data__": {
+          "id": "chatcmpl-358",
+          "choices": [
+            {
+              "delta": {
+                "content": " are",
+                "function_call": null,
+                "refusal": null,
+                "role": "assistant",
+                "tool_calls": null
+              },
+              "finish_reason": null,
+              "index": 0,
+              "logprobs": null
+            }
+          ],
+          "created": 1756921329,
+          "model": "llama3.2:3b-instruct-fp16",
+          "object": "chat.completion.chunk",
+          "service_tier": null,
+          "system_fingerprint": "fp_ollama",
+          "usage": null
+        }
+      },
+      {
+        "__type__": "openai.types.chat.chat_completion_chunk.ChatCompletionChunk",
+        "__data__": {
+          "id": "chatcmpl-358",
+          "choices": [
+            {
+              "delta": {
+                "content": " common",
+                "function_call": null,
+                "refusal": null,
+                "role": "assistant",
+                "tool_calls": null
+              },
+              "finish_reason": null,
+              "index": 0,
+              "logprobs": null
+            }
+          ],
+          "created": 1756921329,
+          "model": "llama3.2:3b-instruct-fp16",
+          "object": "chat.completion.chunk",
+          "service_tier": null,
+          "system_fingerprint": "fp_ollama",
+          "usage": null
+        }
+      },
+      {
+        "__type__": "openai.types.chat.chat_completion_chunk.ChatCompletionChunk",
+        "__data__": {
+          "id": "chatcmpl-358",
+          "choices": [
+            {
+              "delta": {
+                "content": " during",
+                "function_call": null,
+                "refusal": null,
+                "role": "assistant",
+                "tool_calls": null
+              },
+              "finish_reason": null,
+              "index": 0,
+              "logprobs": null
+            }
+          ],
+          "created": 1756921329,
+          "model": "llama3.2:3b-instruct-fp16",
+          "object": "chat.completion.chunk",
+          "service_tier": null,
+          "system_fingerprint": "fp_ollama",
+          "usage": null
+        }
+      },
+      {
+        "__type__": "openai.types.chat.chat_completion_chunk.ChatCompletionChunk",
+        "__data__": {
+          "id": "chatcmpl-358",
+          "choices": [
+            {
+              "delta": {
+                "content": " this",
+                "function_call": null,
+                "refusal": null,
+                "role": "assistant",
+                "tool_calls": null
+              },
+              "finish_reason": null,
+              "index": 0,
+              "logprobs": null
+            }
+          ],
+          "created": 1756921329,
+          "model": "llama3.2:3b-instruct-fp16",
+          "object": "chat.completion.chunk",
+          "service_tier": null,
+          "system_fingerprint": "fp_ollama",
+          "usage": null
+        }
+      },
+      {
+        "__type__": "openai.types.chat.chat_completion_chunk.ChatCompletionChunk",
+        "__data__": {
+          "id": "chatcmpl-358",
+          "choices": [
+            {
+              "delta": {
+                "content": " period",
+                "function_call": null,
+                "refusal": null,
+                "role": "assistant",
+                "tool_calls": null
+              },
+              "finish_reason": null,
+              "index": 0,
+              "logprobs": null
+            }
+          ],
+          "created": 1756921329,
+          "model": "llama3.2:3b-instruct-fp16",
+          "object": "chat.completion.chunk",
+          "service_tier": null,
+          "system_fingerprint": "fp_ollama",
+          "usage": null
+        }
+      },
+      {
+        "__type__": "openai.types.chat.chat_completion_chunk.ChatCompletionChunk",
+        "__data__": {
+          "id": "chatcmpl-358",
+          "choices": [
+            {
+              "delta": {
+                "content": ".\n\n",
+                "function_call": null,
+                "refusal": null,
+                "role": "assistant",
+                "tool_calls": null
+              },
+              "finish_reason": null,
+              "index": 0,
+              "logprobs": null
+            }
+          ],
+          "created": 1756921329,
+          "model": "llama3.2:3b-instruct-fp16",
+          "object": "chat.completion.chunk",
+          "service_tier": null,
+          "system_fingerprint": "fp_ollama",
+          "usage": null
+        }
+      },
+      {
+        "__type__": "openai.types.chat.chat_completion_chunk.ChatCompletionChunk",
+        "__data__": {
+          "id": "chatcmpl-358",
+          "choices": [
+            {
+              "delta": {
+                "content": "3",
+                "function_call": null,
+                "refusal": null,
+                "role": "assistant",
+                "tool_calls": null
+              },
+              "finish_reason": null,
+              "index": 0,
+              "logprobs": null
+            }
+          ],
+          "created": 1756921329,
+          "model": "llama3.2:3b-instruct-fp16",
+          "object": "chat.completion.chunk",
+          "service_tier": null,
+          "system_fingerprint": "fp_ollama",
+          "usage": null
+        }
+      },
+      {
+        "__type__": "openai.types.chat.chat_completion_chunk.ChatCompletionChunk",
+        "__data__": {
+          "id": "chatcmpl-358",
+          "choices": [
+            {
+              "delta": {
+                "content": ".",
+                "function_call": null,
+                "refusal": null,
+                "role": "assistant",
+                "tool_calls": null
+              },
+              "finish_reason": null,
+              "index": 0,
+              "logprobs": null
+            }
+          ],
+          "created": 1756921329,
+          "model": "llama3.2:3b-instruct-fp16",
+          "object": "chat.completion.chunk",
+          "service_tier": null,
+          "system_fingerprint": "fp_ollama",
+          "usage": null
+        }
+      },
+      {
+        "__type__": "openai.types.chat.chat_completion_chunk.ChatCompletionChunk",
+        "__data__": {
+          "id": "chatcmpl-358",
+          "choices": [
+            {
+              "delta": {
+                "content": " **",
+                "function_call": null,
+                "refusal": null,
+                "role": "assistant",
+                "tool_calls": null
+              },
+              "finish_reason": null,
+              "index": 0,
+              "logprobs": null
+            }
+          ],
+          "created": 1756921329,
+          "model": "llama3.2:3b-instruct-fp16",
+          "object": "chat.completion.chunk",
+          "service_tier": null,
+          "system_fingerprint": "fp_ollama",
+          "usage": null
+        }
+      },
+      {
+        "__type__": "openai.types.chat.chat_completion_chunk.ChatCompletionChunk",
+        "__data__": {
+          "id": "chatcmpl-358",
+          "choices": [
+            {
+              "delta": {
+                "content": "Aut",
+                "function_call": null,
+                "refusal": null,
+                "role": "assistant",
+                "tool_calls": null
+              },
+              "finish_reason": null,
+              "index": 0,
+              "logprobs": null
+            }
+          ],
+          "created": 1756921329,
+          "model": "llama3.2:3b-instruct-fp16",
+          "object": "chat.completion.chunk",
+          "service_tier": null,
+          "system_fingerprint": "fp_ollama",
+          "usage": null
+        }
+      },
+      {
+        "__type__": "openai.types.chat.chat_completion_chunk.ChatCompletionChunk",
+        "__data__": {
+          "id": "chatcmpl-358",
+          "choices": [
+            {
+              "delta": {
+                "content": "umn",
+                "function_call": null,
+                "refusal": null,
+                "role": "assistant",
+                "tool_calls": null
+              },
+              "finish_reason": null,
+              "index": 0,
+              "logprobs": null
+            }
+          ],
+          "created": 1756921329,
+          "model": "llama3.2:3b-instruct-fp16",
+          "object": "chat.completion.chunk",
+          "service_tier": null,
+          "system_fingerprint": "fp_ollama",
+          "usage": null
+        }
+      },
+      {
+        "__type__": "openai.types.chat.chat_completion_chunk.ChatCompletionChunk",
+        "__data__": {
+          "id": "chatcmpl-358",
+          "choices": [
+            {
+              "delta": {
+                "content": " (",
+                "function_call": null,
+                "refusal": null,
+                "role": "assistant",
+                "tool_calls": null
+              },
+              "finish_reason": null,
+              "index": 0,
+              "logprobs": null
+            }
+          ],
+          "created": 1756921329,
+          "model": "llama3.2:3b-instruct-fp16",
+          "object": "chat.completion.chunk",
+          "service_tier": null,
+          "system_fingerprint": "fp_ollama",
+          "usage": null
+        }
+      },
+      {
+        "__type__": "openai.types.chat.chat_completion_chunk.ChatCompletionChunk",
+        "__data__": {
+          "id": "chatcmpl-358",
+          "choices": [
+            {
+              "delta": {
+                "content": "September",
+                "function_call": null,
+                "refusal": null,
+                "role": "assistant",
+                "tool_calls": null
+              },
+              "finish_reason": null,
+              "index": 0,
+              "logprobs": null
+            }
+          ],
+          "created": 1756921329,
+          "model": "llama3.2:3b-instruct-fp16",
+          "object": "chat.completion.chunk",
+          "service_tier": null,
+          "system_fingerprint": "fp_ollama",
+          "usage": null
+        }
+      },
+      {
+        "__type__": "openai.types.chat.chat_completion_chunk.ChatCompletionChunk",
+        "__data__": {
+          "id": "chatcmpl-358",
+          "choices": [
+            {
+              "delta": {
+                "content": " to",
+                "function_call": null,
+                "refusal": null,
+                "role": "assistant",
+                "tool_calls": null
+              },
+              "finish_reason": null,
+              "index": 0,
+              "logprobs": null
+            }
+          ],
+          "created": 1756921329,
+          "model": "llama3.2:3b-instruct-fp16",
+          "object": "chat.completion.chunk",
+          "service_tier": null,
+          "system_fingerprint": "fp_ollama",
+          "usage": null
+        }
+      },
+      {
+        "__type__": "openai.types.chat.chat_completion_chunk.ChatCompletionChunk",
+        "__data__": {
+          "id": "chatcmpl-358",
+          "choices": [
+            {
+              "delta": {
+                "content": " November",
+                "function_call": null,
+                "refusal": null,
+                "role": "assistant",
+                "tool_calls": null
+              },
+              "finish_reason": null,
+              "index": 0,
+              "logprobs": null
+            }
+          ],
+          "created": 1756921329,
+          "model": "llama3.2:3b-instruct-fp16",
+          "object": "chat.completion.chunk",
+          "service_tier": null,
+          "system_fingerprint": "fp_ollama",
+          "usage": null
+        }
+      },
+      {
+        "__type__": "openai.types.chat.chat_completion_chunk.ChatCompletionChunk",
+        "__data__": {
+          "id": "chatcmpl-358",
+          "choices": [
+            {
+              "delta": {
+                "content": ")**",
+                "function_call": null,
+                "refusal": null,
+                "role": "assistant",
+                "tool_calls": null
+              },
+              "finish_reason": null,
+              "index": 0,
+              "logprobs": null
+            }
+          ],
+          "created": 1756921329,
+          "model": "llama3.2:3b-instruct-fp16",
+          "object": "chat.completion.chunk",
+          "service_tier": null,
+          "system_fingerprint": "fp_ollama",
+          "usage": null
+        }
+      },
+      {
+        "__type__": "openai.types.chat.chat_completion_chunk.ChatCompletionChunk",
+        "__data__": {
+          "id": "chatcmpl-358",
+          "choices": [
+            {
+              "delta": {
+                "content": ":",
+                "function_call": null,
+                "refusal": null,
+                "role": "assistant",
+                "tool_calls": null
+              },
+              "finish_reason": null,
+              "index": 0,
+              "logprobs": null
+            }
+          ],
+          "created": 1756921329,
+          "model": "llama3.2:3b-instruct-fp16",
+          "object": "chat.completion.chunk",
+          "service_tier": null,
+          "system_fingerprint": "fp_ollama",
+          "usage": null
+        }
+      },
+      {
+        "__type__": "openai.types.chat.chat_completion_chunk.ChatCompletionChunk",
+        "__data__": {
+          "id": "chatcmpl-358",
+          "choices": [
+            {
+              "delta": {
+                "content": " Comfort",
+                "function_call": null,
+                "refusal": null,
+                "role": "assistant",
+                "tool_calls": null
+              },
+              "finish_reason": null,
+              "index": 0,
+              "logprobs": null
+            }
+          ],
+          "created": 1756921329,
+          "model": "llama3.2:3b-instruct-fp16",
+          "object": "chat.completion.chunk",
+          "service_tier": null,
+          "system_fingerprint": "fp_ollama",
+          "usage": null
+        }
+      },
+      {
+        "__type__": "openai.types.chat.chat_completion_chunk.ChatCompletionChunk",
+        "__data__": {
+          "id": "chatcmpl-358",
+          "choices": [
+            {
+              "delta": {
+                "content": "able",
+                "function_call": null,
+                "refusal": null,
+                "role": "assistant",
+                "tool_calls": null
+              },
+              "finish_reason": null,
+              "index": 0,
+              "logprobs": null
+            }
+          ],
+          "created": 1756921329,
+          "model": "llama3.2:3b-instruct-fp16",
+          "object": "chat.completion.chunk",
+          "service_tier": null,
+          "system_fingerprint": "fp_ollama",
+          "usage": null
+        }
+      },
+      {
+        "__type__": "openai.types.chat.chat_completion_chunk.ChatCompletionChunk",
+        "__data__": {
+          "id": "chatcmpl-358",
+          "choices": [
+            {
+              "delta": {
+                "content": " temperatures",
+                "function_call": null,
+                "refusal": null,
+                "role": "assistant",
+                "tool_calls": null
+              },
+              "finish_reason": null,
+              "index": 0,
+              "logprobs": null
+            }
+          ],
+          "created": 1756921329,
+          "model": "llama3.2:3b-instruct-fp16",
+          "object": "chat.completion.chunk",
+          "service_tier": null,
+          "system_fingerprint": "fp_ollama",
+          "usage": null
+        }
+      },
+      {
+        "__type__": "openai.types.chat.chat_completion_chunk.ChatCompletionChunk",
+        "__data__": {
+          "id": "chatcmpl-358",
+          "choices": [
+            {
+              "delta": {
+                "content": " of",
+                "function_call": null,
+                "refusal": null,
+                "role": "assistant",
+                "tool_calls": null
+              },
+              "finish_reason": null,
+              "index": 0,
+              "logprobs": null
+            }
+          ],
+          "created": 1756921329,
+          "model": "llama3.2:3b-instruct-fp16",
+          "object": "chat.completion.chunk",
+          "service_tier": null,
+          "system_fingerprint": "fp_ollama",
+          "usage": null
+        }
+      },
+      {
+        "__type__": "openai.types.chat.chat_completion_chunk.ChatCompletionChunk",
+        "__data__": {
+          "id": "chatcmpl-358",
+          "choices": [
+            {
+              "delta": {
+                "content": " about",
+                "function_call": null,
+                "refusal": null,
+                "role": "assistant",
+                "tool_calls": null
+              },
+              "finish_reason": null,
+              "index": 0,
+              "logprobs": null
+            }
+          ],
+          "created": 1756921330,
+          "model": "llama3.2:3b-instruct-fp16",
+          "object": "chat.completion.chunk",
+          "service_tier": null,
+          "system_fingerprint": "fp_ollama",
+          "usage": null
+        }
+      },
+      {
+        "__type__": "openai.types.chat.chat_completion_chunk.ChatCompletionChunk",
+        "__data__": {
+          "id": "chatcmpl-358",
+          "choices": [
+            {
+              "delta": {
+                "content": " ",
+                "function_call": null,
+                "refusal": null,
+                "role": "assistant",
+                "tool_calls": null
+              },
+              "finish_reason": null,
+              "index": 0,
+              "logprobs": null
+            }
+          ],
+          "created": 1756921330,
+          "model": "llama3.2:3b-instruct-fp16",
+          "object": "chat.completion.chunk",
+          "service_tier": null,
+          "system_fingerprint": "fp_ollama",
+          "usage": null
+        }
+      },
+      {
+        "__type__": "openai.types.chat.chat_completion_chunk.ChatCompletionChunk",
+        "__data__": {
+          "id": "chatcmpl-358",
+          "choices": [
+            {
+              "delta": {
+                "content": "15",
+                "function_call": null,
+                "refusal": null,
+                "role": "assistant",
+                "tool_calls": null
+              },
+              "finish_reason": null,
+              "index": 0,
+              "logprobs": null
+            }
+          ],
+          "created": 1756921330,
+          "model": "llama3.2:3b-instruct-fp16",
+          "object": "chat.completion.chunk",
+          "service_tier": null,
+          "system_fingerprint": "fp_ollama",
+          "usage": null
+        }
+      },
+      {
+        "__type__": "openai.types.chat.chat_completion_chunk.ChatCompletionChunk",
+        "__data__": {
+          "id": "chatcmpl-358",
+          "choices": [
+            {
+              "delta": {
+                "content": "\u00b0C",
+                "function_call": null,
+                "refusal": null,
+                "role": "assistant",
+                "tool_calls": null
+              },
+              "finish_reason": null,
+              "index": 0,
+              "logprobs": null
+            }
+          ],
+          "created": 1756921330,
+          "model": "llama3.2:3b-instruct-fp16",
+          "object": "chat.completion.chunk",
+          "service_tier": null,
+          "system_fingerprint": "fp_ollama",
+          "usage": null
+        }
+      },
+      {
+        "__type__": "openai.types.chat.chat_completion_chunk.ChatCompletionChunk",
+        "__data__": {
+          "id": "chatcmpl-358",
+          "choices": [
+            {
+              "delta": {
+                "content": " (",
+                "function_call": null,
+                "refusal": null,
+                "role": "assistant",
+                "tool_calls": null
+              },
+              "finish_reason": null,
+              "index": 0,
+              "logprobs": null
+            }
+          ],
+          "created": 1756921330,
+          "model": "llama3.2:3b-instruct-fp16",
+          "object": "chat.completion.chunk",
+          "service_tier": null,
+          "system_fingerprint": "fp_ollama",
+          "usage": null
+        }
+      },
+      {
+        "__type__": "openai.types.chat.chat_completion_chunk.ChatCompletionChunk",
+        "__data__": {
+          "id": "chatcmpl-358",
+          "choices": [
+            {
+              "delta": {
+                "content": "59",
+                "function_call": null,
+                "refusal": null,
+                "role": "assistant",
+                "tool_calls": null
+              },
+              "finish_reason": null,
+              "index": 0,
+              "logprobs": null
+            }
+          ],
+          "created": 1756921330,
+          "model": "llama3.2:3b-instruct-fp16",
+          "object": "chat.completion.chunk",
+          "service_tier": null,
+          "system_fingerprint": "fp_ollama",
+          "usage": null
+        }
+      },
+      {
+        "__type__": "openai.types.chat.chat_completion_chunk.ChatCompletionChunk",
+        "__data__": {
+          "id": "chatcmpl-358",
+          "choices": [
+            {
+              "delta": {
+                "content": "\u00b0F",
+                "function_call": null,
+                "refusal": null,
+                "role": "assistant",
+                "tool_calls": null
+              },
+              "finish_reason": null,
+              "index": 0,
+              "logprobs": null
+            }
+          ],
+          "created": 1756921330,
+          "model": "llama3.2:3b-instruct-fp16",
+          "object": "chat.completion.chunk",
+          "service_tier": null,
+          "system_fingerprint": "fp_ollama",
+          "usage": null
+        }
+      },
+      {
+        "__type__": "openai.types.chat.chat_completion_chunk.ChatCompletionChunk",
+        "__data__": {
+          "id": "chatcmpl-358",
+          "choices": [
+            {
+              "delta": {
+                "content": ")",
+                "function_call": null,
+                "refusal": null,
+                "role": "assistant",
+                "tool_calls": null
+              },
+              "finish_reason": null,
+              "index": 0,
+              "logprobs": null
+            }
+          ],
+          "created": 1756921330,
+          "model": "llama3.2:3b-instruct-fp16",
+          "object": "chat.completion.chunk",
+          "service_tier": null,
+          "system_fingerprint": "fp_ollama",
+          "usage": null
+        }
+      },
+      {
+        "__type__": "openai.types.chat.chat_completion_chunk.ChatCompletionChunk",
+        "__data__": {
+          "id": "chatcmpl-358",
+          "choices": [
+            {
+              "delta": {
+                "content": " to",
+                "function_call": null,
+                "refusal": null,
+                "role": "assistant",
+                "tool_calls": null
+              },
+              "finish_reason": null,
+              "index": 0,
+              "logprobs": null
+            }
+          ],
+          "created": 1756921330,
+          "model": "llama3.2:3b-instruct-fp16",
+          "object": "chat.completion.chunk",
+          "service_tier": null,
+          "system_fingerprint": "fp_ollama",
+          "usage": null
+        }
+      },
+      {
+        "__type__": "openai.types.chat.chat_completion_chunk.ChatCompletionChunk",
+        "__data__": {
+          "id": "chatcmpl-358",
+          "choices": [
+            {
+              "delta": {
+                "content": " ",
+                "function_call": null,
+                "refusal": null,
+                "role": "assistant",
+                "tool_calls": null
+              },
+              "finish_reason": null,
+              "index": 0,
+              "logprobs": null
+            }
+          ],
+          "created": 1756921330,
+          "model": "llama3.2:3b-instruct-fp16",
+          "object": "chat.completion.chunk",
+          "service_tier": null,
+          "system_fingerprint": "fp_ollama",
+          "usage": null
+        }
+      },
+      {
+        "__type__": "openai.types.chat.chat_completion_chunk.ChatCompletionChunk",
+        "__data__": {
+          "id": "chatcmpl-358",
+          "choices": [
+            {
+              "delta": {
+                "content": "20",
+                "function_call": null,
+                "refusal": null,
+                "role": "assistant",
+                "tool_calls": null
+              },
+              "finish_reason": null,
+              "index": 0,
+              "logprobs": null
+            }
+          ],
+          "created": 1756921330,
+          "model": "llama3.2:3b-instruct-fp16",
+          "object": "chat.completion.chunk",
+          "service_tier": null,
+          "system_fingerprint": "fp_ollama",
+          "usage": null
+        }
+      },
+      {
+        "__type__": "openai.types.chat.chat_completion_chunk.ChatCompletionChunk",
+        "__data__": {
+          "id": "chatcmpl-358",
+          "choices": [
+            {
+              "delta": {
+                "content": "\u00b0C",
+                "function_call": null,
+                "refusal": null,
+                "role": "assistant",
+                "tool_calls": null
+              },
+              "finish_reason": null,
+              "index": 0,
+              "logprobs": null
+            }
+          ],
+          "created": 1756921330,
+          "model": "llama3.2:3b-instruct-fp16",
+          "object": "chat.completion.chunk",
+          "service_tier": null,
+          "system_fingerprint": "fp_ollama",
+          "usage": null
+        }
+      },
+      {
+        "__type__": "openai.types.chat.chat_completion_chunk.ChatCompletionChunk",
+        "__data__": {
+          "id": "chatcmpl-358",
+          "choices": [
+            {
+              "delta": {
+                "content": " (",
+                "function_call": null,
+                "refusal": null,
+                "role": "assistant",
+                "tool_calls": null
+              },
+              "finish_reason": null,
+              "index": 0,
+              "logprobs": null
+            }
+          ],
+          "created": 1756921330,
+          "model": "llama3.2:3b-instruct-fp16",
+          "object": "chat.completion.chunk",
+          "service_tier": null,
+          "system_fingerprint": "fp_ollama",
+          "usage": null
+        }
+      },
+      {
+        "__type__": "openai.types.chat.chat_completion_chunk.ChatCompletionChunk",
+        "__data__": {
+          "id": "chatcmpl-358",
+          "choices": [
+            {
+              "delta": {
+                "content": "68",
+                "function_call": null,
+                "refusal": null,
+                "role": "assistant",
+                "tool_calls": null
+              },
+              "finish_reason": null,
+              "index": 0,
+              "logprobs": null
+            }
+          ],
+          "created": 1756921330,
+          "model": "llama3.2:3b-instruct-fp16",
+          "object": "chat.completion.chunk",
+          "service_tier": null,
+          "system_fingerprint": "fp_ollama",
+          "usage": null
+        }
+      },
+      {
+        "__type__": "openai.types.chat.chat_completion_chunk.ChatCompletionChunk",
+        "__data__": {
+          "id": "chatcmpl-358",
+          "choices": [
+            {
+              "delta": {
+                "content": "\u00b0F",
+                "function_call": null,
+                "refusal": null,
+                "role": "assistant",
+                "tool_calls": null
+              },
+              "finish_reason": null,
+              "index": 0,
+              "logprobs": null
+            }
+          ],
+          "created": 1756921330,
+          "model": "llama3.2:3b-instruct-fp16",
+          "object": "chat.completion.chunk",
+          "service_tier": null,
+          "system_fingerprint": "fp_ollama",
+          "usage": null
+        }
+      },
+      {
+        "__type__": "openai.types.chat.chat_completion_chunk.ChatCompletionChunk",
+        "__data__": {
+          "id": "chatcmpl-358",
+          "choices": [
+            {
+              "delta": {
+                "content": "),",
+                "function_call": null,
+                "refusal": null,
+                "role": "assistant",
+                "tool_calls": null
+              },
+              "finish_reason": null,
+              "index": 0,
+              "logprobs": null
+            }
+          ],
+          "created": 1756921330,
+          "model": "llama3.2:3b-instruct-fp16",
+          "object": "chat.completion.chunk",
+          "service_tier": null,
+          "system_fingerprint": "fp_ollama",
+          "usage": null
+        }
+      },
+      {
+        "__type__": "openai.types.chat.chat_completion_chunk.ChatCompletionChunk",
+        "__data__": {
+          "id": "chatcmpl-358",
+          "choices": [
+            {
+              "delta": {
+                "content": " making",
+                "function_call": null,
+                "refusal": null,
+                "role": "assistant",
+                "tool_calls": null
+              },
+              "finish_reason": null,
+              "index": 0,
+              "logprobs": null
+            }
+          ],
+          "created": 1756921330,
+          "model": "llama3.2:3b-instruct-fp16",
+          "object": "chat.completion.chunk",
+          "service_tier": null,
+          "system_fingerprint": "fp_ollama",
+          "usage": null
+        }
+      },
+      {
+        "__type__": "openai.types.chat.chat_completion_chunk.ChatCompletionChunk",
+        "__data__": {
+          "id": "chatcmpl-358",
+          "choices": [
+            {
+              "delta": {
+                "content": " it",
+                "function_call": null,
+                "refusal": null,
+                "role": "assistant",
+                "tool_calls": null
+              },
+              "finish_reason": null,
+              "index": 0,
+              "logprobs": null
+            }
+          ],
+          "created": 1756921330,
+          "model": "llama3.2:3b-instruct-fp16",
+          "object": "chat.completion.chunk",
+          "service_tier": null,
+          "system_fingerprint": "fp_ollama",
+          "usage": null
+        }
+      },
+      {
+        "__type__": "openai.types.chat.chat_completion_chunk.ChatCompletionChunk",
+        "__data__": {
+          "id": "chatcmpl-358",
+          "choices": [
+            {
+              "delta": {
+                "content": " a",
+                "function_call": null,
+                "refusal": null,
+                "role": "assistant",
+                "tool_calls": null
+              },
+              "finish_reason": null,
+              "index": 0,
+              "logprobs": null
+            }
+          ],
+          "created": 1756921330,
+          "model": "llama3.2:3b-instruct-fp16",
+          "object": "chat.completion.chunk",
+          "service_tier": null,
+          "system_fingerprint": "fp_ollama",
+          "usage": null
+        }
+      },
+      {
+        "__type__": "openai.types.chat.chat_completion_chunk.ChatCompletionChunk",
+        "__data__": {
+          "id": "chatcmpl-358",
+          "choices": [
+            {
+              "delta": {
+                "content": " lovely",
+                "function_call": null,
+                "refusal": null,
+                "role": "assistant",
+                "tool_calls": null
+              },
+              "finish_reason": null,
+              "index": 0,
+              "logprobs": null
+            }
+          ],
+          "created": 1756921330,
+          "model": "llama3.2:3b-instruct-fp16",
+          "object": "chat.completion.chunk",
+          "service_tier": null,
+          "system_fingerprint": "fp_ollama",
+          "usage": null
+        }
+      },
+      {
+        "__type__": "openai.types.chat.chat_completion_chunk.ChatCompletionChunk",
+        "__data__": {
+          "id": "chatcmpl-358",
+          "choices": [
+            {
+              "delta": {
+                "content": " season",
+                "function_call": null,
+                "refusal": null,
+                "role": "assistant",
+                "tool_calls": null
+              },
+              "finish_reason": null,
+              "index": 0,
+              "logprobs": null
+            }
+          ],
+          "created": 1756921330,
+          "model": "llama3.2:3b-instruct-fp16",
+          "object": "chat.completion.chunk",
+          "service_tier": null,
+          "system_fingerprint": "fp_ollama",
+          "usage": null
+        }
+      },
+      {
+        "__type__": "openai.types.chat.chat_completion_chunk.ChatCompletionChunk",
+        "__data__": {
+          "id": "chatcmpl-358",
+          "choices": [
+            {
+              "delta": {
+                "content": " for",
+                "function_call": null,
+                "refusal": null,
+                "role": "assistant",
+                "tool_calls": null
+              },
+              "finish_reason": null,
+              "index": 0,
+              "logprobs": null
+            }
+          ],
+          "created": 1756921330,
+          "model": "llama3.2:3b-instruct-fp16",
+          "object": "chat.completion.chunk",
+          "service_tier": null,
+          "system_fingerprint": "fp_ollama",
+          "usage": null
+        }
+      },
+      {
+        "__type__": "openai.types.chat.chat_completion_chunk.ChatCompletionChunk",
+        "__data__": {
+          "id": "chatcmpl-358",
+          "choices": [
+            {
+              "delta": {
+                "content": " sight",
+                "function_call": null,
+                "refusal": null,
+                "role": "assistant",
+                "tool_calls": null
+              },
+              "finish_reason": null,
+              "index": 0,
+              "logprobs": null
+            }
+          ],
+          "created": 1756921330,
+          "model": "llama3.2:3b-instruct-fp16",
+          "object": "chat.completion.chunk",
+          "service_tier": null,
+          "system_fingerprint": "fp_ollama",
+          "usage": null
+        }
+      },
+      {
+        "__type__": "openai.types.chat.chat_completion_chunk.ChatCompletionChunk",
+        "__data__": {
+          "id": "chatcmpl-358",
+          "choices": [
+            {
+              "delta": {
+                "content": "seeing",
+                "function_call": null,
+                "refusal": null,
+                "role": "assistant",
+                "tool_calls": null
+              },
+              "finish_reason": null,
+              "index": 0,
+              "logprobs": null
+            }
+          ],
+          "created": 1756921330,
+          "model": "llama3.2:3b-instruct-fp16",
+          "object": "chat.completion.chunk",
+          "service_tier": null,
+          "system_fingerprint": "fp_ollama",
+          "usage": null
+        }
+      },
+      {
+        "__type__": "openai.types.chat.chat_completion_chunk.ChatCompletionChunk",
+        "__data__": {
+          "id": "chatcmpl-358",
+          "choices": [
+            {
+              "delta": {
+                "content": ".\n\n",
+                "function_call": null,
+                "refusal": null,
+                "role": "assistant",
+                "tool_calls": null
+              },
+              "finish_reason": null,
+              "index": 0,
+              "logprobs": null
+            }
+          ],
+          "created": 1756921331,
+          "model": "llama3.2:3b-instruct-fp16",
+          "object": "chat.completion.chunk",
+          "service_tier": null,
+          "system_fingerprint": "fp_ollama",
+          "usage": null
+        }
+      },
+      {
+        "__type__": "openai.types.chat.chat_completion_chunk.ChatCompletionChunk",
+        "__data__": {
+          "id": "chatcmpl-358",
+          "choices": [
+            {
+              "delta": {
+                "content": "4",
+                "function_call": null,
+                "refusal": null,
+                "role": "assistant",
+                "tool_calls": null
+              },
+              "finish_reason": null,
+              "index": 0,
+              "logprobs": null
+            }
+          ],
+          "created": 1756921331,
+          "model": "llama3.2:3b-instruct-fp16",
+          "object": "chat.completion.chunk",
+          "service_tier": null,
+          "system_fingerprint": "fp_ollama",
+          "usage": null
+        }
+      },
+      {
+        "__type__": "openai.types.chat.chat_completion_chunk.ChatCompletionChunk",
+        "__data__": {
+          "id": "chatcmpl-358",
+          "choices": [
+            {
+              "delta": {
+                "content": ".",
+                "function_call": null,
+                "refusal": null,
+                "role": "assistant",
+                "tool_calls": null
+              },
+              "finish_reason": null,
+              "index": 0,
+              "logprobs": null
+            }
+          ],
+          "created": 1756921331,
+          "model": "llama3.2:3b-instruct-fp16",
+          "object": "chat.completion.chunk",
+          "service_tier": null,
+          "system_fingerprint": "fp_ollama",
+          "usage": null
+        }
+      },
+      {
+        "__type__": "openai.types.chat.chat_completion_chunk.ChatCompletionChunk",
+        "__data__": {
+          "id": "chatcmpl-358",
+          "choices": [
+            {
+              "delta": {
+                "content": " **",
+                "function_call": null,
+                "refusal": null,
+                "role": "assistant",
+                "tool_calls": null
+              },
+              "finish_reason": null,
+              "index": 0,
+              "logprobs": null
+            }
+          ],
+          "created": 1756921331,
+          "model": "llama3.2:3b-instruct-fp16",
+          "object": "chat.completion.chunk",
+          "service_tier": null,
+          "system_fingerprint": "fp_ollama",
+          "usage": null
+        }
+      },
+      {
+        "__type__": "openai.types.chat.chat_completion_chunk.ChatCompletionChunk",
+        "__data__": {
+          "id": "chatcmpl-358",
+          "choices": [
+            {
+              "delta": {
+                "content": "Winter",
+                "function_call": null,
+                "refusal": null,
+                "role": "assistant",
+                "tool_calls": null
+              },
+              "finish_reason": null,
+              "index": 0,
+              "logprobs": null
+            }
+          ],
+          "created": 1756921331,
+          "model": "llama3.2:3b-instruct-fp16",
+          "object": "chat.completion.chunk",
+          "service_tier": null,
+          "system_fingerprint": "fp_ollama",
+          "usage": null
+        }
+      },
+      {
+        "__type__": "openai.types.chat.chat_completion_chunk.ChatCompletionChunk",
+        "__data__": {
+          "id": "chatcmpl-358",
+          "choices": [
+            {
+              "delta": {
+                "content": " (",
+                "function_call": null,
+                "refusal": null,
+                "role": "assistant",
+                "tool_calls": null
+              },
+              "finish_reason": null,
+              "index": 0,
+              "logprobs": null
+            }
+          ],
+          "created": 1756921331,
+          "model": "llama3.2:3b-instruct-fp16",
+          "object": "chat.completion.chunk",
+          "service_tier": null,
+          "system_fingerprint": "fp_ollama",
+          "usage": null
+        }
+      },
+      {
+        "__type__": "openai.types.chat.chat_completion_chunk.ChatCompletionChunk",
+        "__data__": {
+          "id": "chatcmpl-358",
+          "choices": [
+            {
+              "delta": {
+                "content": "December",
+                "function_call": null,
+                "refusal": null,
+                "role": "assistant",
+                "tool_calls": null
+              },
+              "finish_reason": null,
+              "index": 0,
+              "logprobs": null
+            }
+          ],
+          "created": 1756921331,
+          "model": "llama3.2:3b-instruct-fp16",
+          "object": "chat.completion.chunk",
+          "service_tier": null,
+          "system_fingerprint": "fp_ollama",
+          "usage": null
+        }
+      },
+      {
+        "__type__": "openai.types.chat.chat_completion_chunk.ChatCompletionChunk",
+        "__data__": {
+          "id": "chatcmpl-358",
+          "choices": [
+            {
+              "delta": {
+                "content": " to",
+                "function_call": null,
+                "refusal": null,
+                "role": "assistant",
+                "tool_calls": null
+              },
+              "finish_reason": null,
+              "index": 0,
+              "logprobs": null
+            }
+          ],
+          "created": 1756921331,
+          "model": "llama3.2:3b-instruct-fp16",
+          "object": "chat.completion.chunk",
+          "service_tier": null,
+          "system_fingerprint": "fp_ollama",
+          "usage": null
+        }
+      },
+      {
+        "__type__": "openai.types.chat.chat_completion_chunk.ChatCompletionChunk",
+        "__data__": {
+          "id": "chatcmpl-358",
+          "choices": [
+            {
+              "delta": {
+                "content": " February",
+                "function_call": null,
+                "refusal": null,
+                "role": "assistant",
+                "tool_calls": null
+              },
+              "finish_reason": null,
+              "index": 0,
+              "logprobs": null
+            }
+          ],
+          "created": 1756921331,
+          "model": "llama3.2:3b-instruct-fp16",
+          "object": "chat.completion.chunk",
+          "service_tier": null,
+          "system_fingerprint": "fp_ollama",
+          "usage": null
+        }
+      },
+      {
+        "__type__": "openai.types.chat.chat_completion_chunk.ChatCompletionChunk",
+        "__data__": {
+          "id": "chatcmpl-358",
+          "choices": [
+            {
+              "delta": {
+                "content": ")**",
+                "function_call": null,
+                "refusal": null,
+                "role": "assistant",
+                "tool_calls": null
+              },
+              "finish_reason": null,
+              "index": 0,
+              "logprobs": null
+            }
+          ],
+          "created": 1756921331,
+          "model": "llama3.2:3b-instruct-fp16",
+          "object": "chat.completion.chunk",
+          "service_tier": null,
+          "system_fingerprint": "fp_ollama",
+          "usage": null
+        }
+      },
+      {
+        "__type__": "openai.types.chat.chat_completion_chunk.ChatCompletionChunk",
+        "__data__": {
+          "id": "chatcmpl-358",
+          "choices": [
+            {
+              "delta": {
+                "content": ":",
+                "function_call": null,
+                "refusal": null,
+                "role": "assistant",
+                "tool_calls": null
+              },
+              "finish_reason": null,
+              "index": 0,
+              "logprobs": null
+            }
+          ],
+          "created": 1756921331,
+          "model": "llama3.2:3b-instruct-fp16",
+          "object": "chat.completion.chunk",
+          "service_tier": null,
+          "system_fingerprint": "fp_ollama",
+          "usage": null
+        }
+      },
+      {
+        "__type__": "openai.types.chat.chat_completion_chunk.ChatCompletionChunk",
+        "__data__": {
+          "id": "chatcmpl-358",
+          "choices": [
+            {
+              "delta": {
+                "content": " Cool",
+                "function_call": null,
+                "refusal": null,
+                "role": "assistant",
+                "tool_calls": null
+              },
+              "finish_reason": null,
+              "index": 0,
+              "logprobs": null
+            }
+          ],
+          "created": 1756921331,
+          "model": "llama3.2:3b-instruct-fp16",
+          "object": "chat.completion.chunk",
+          "service_tier": null,
+          "system_fingerprint": "fp_ollama",
+          "usage": null
+        }
+      },
+      {
+        "__type__": "openai.types.chat.chat_completion_chunk.ChatCompletionChunk",
+        "__data__": {
+          "id": "chatcmpl-358",
+          "choices": [
+            {
+              "delta": {
+                "content": " and",
+                "function_call": null,
+                "refusal": null,
+                "role": "assistant",
+                "tool_calls": null
+              },
+              "finish_reason": null,
+              "index": 0,
+              "logprobs": null
+            }
+          ],
+          "created": 1756921331,
+          "model": "llama3.2:3b-instruct-fp16",
+          "object": "chat.completion.chunk",
+          "service_tier": null,
+          "system_fingerprint": "fp_ollama",
+          "usage": null
+        }
+      },
+      {
+        "__type__": "openai.types.chat.chat_completion_chunk.ChatCompletionChunk",
+        "__data__": {
+          "id": "chatcmpl-358",
+          "choices": [
+            {
+              "delta": {
+                "content": " relatively",
+                "function_call": null,
+                "refusal": null,
+                "role": "assistant",
+                "tool_calls": null
+              },
+              "finish_reason": null,
+              "index": 0,
+              "logprobs": null
+            }
+          ],
+          "created": 1756921331,
+          "model": "llama3.2:3b-instruct-fp16",
+          "object": "chat.completion.chunk",
+          "service_tier": null,
+          "system_fingerprint": "fp_ollama",
+          "usage": null
+        }
+      },
+      {
+        "__type__": "openai.types.chat.chat_completion_chunk.ChatCompletionChunk",
+        "__data__": {
+          "id": "chatcmpl-358",
+          "choices": [
+            {
+              "delta": {
+                "content": " dry",
+                "function_call": null,
+                "refusal": null,
+                "role": "assistant",
+                "tool_calls": null
+              },
+              "finish_reason": null,
+              "index": 0,
+              "logprobs": null
+            }
+          ],
+          "created": 1756921331,
+          "model": "llama3.2:3b-instruct-fp16",
+          "object": "chat.completion.chunk",
+          "service_tier": null,
+          "system_fingerprint": "fp_ollama",
+          "usage": null
+        }
+      },
+      {
+        "__type__": "openai.types.chat.chat_completion_chunk.ChatCompletionChunk",
+        "__data__": {
+          "id": "chatcmpl-358",
+          "choices": [
+            {
+              "delta": {
+                "content": ",",
+                "function_call": null,
+                "refusal": null,
+                "role": "assistant",
+                "tool_calls": null
+              },
+              "finish_reason": null,
+              "index": 0,
+              "logprobs": null
+            }
+          ],
+          "created": 1756921331,
+          "model": "llama3.2:3b-instruct-fp16",
+          "object": "chat.completion.chunk",
+          "service_tier": null,
+          "system_fingerprint": "fp_ollama",
+          "usage": null
+        }
+      },
+      {
+        "__type__": "openai.types.chat.chat_completion_chunk.ChatCompletionChunk",
+        "__data__": {
+          "id": "chatcmpl-358",
+          "choices": [
+            {
+              "delta": {
+                "content": " with",
+                "function_call": null,
+                "refusal": null,
+                "role": "assistant",
+                "tool_calls": null
+              },
+              "finish_reason": null,
+              "index": 0,
+              "logprobs": null
+            }
+          ],
+          "created": 1756921331,
+          "model": "llama3.2:3b-instruct-fp16",
+          "object": "chat.completion.chunk",
+          "service_tier": null,
+          "system_fingerprint": "fp_ollama",
+          "usage": null
+        }
+      },
+      {
+        "__type__": "openai.types.chat.chat_completion_chunk.ChatCompletionChunk",
+        "__data__": {
+          "id": "chatcmpl-358",
+          "choices": [
+            {
+              "delta": {
+                "content": " average",
+                "function_call": null,
+                "refusal": null,
+                "role": "assistant",
+                "tool_calls": null
+              },
+              "finish_reason": null,
+              "index": 0,
+              "logprobs": null
+            }
+          ],
+          "created": 1756921331,
+          "model": "llama3.2:3b-instruct-fp16",
+          "object": "chat.completion.chunk",
+          "service_tier": null,
+          "system_fingerprint": "fp_ollama",
+          "usage": null
+        }
+      },
+      {
+        "__type__": "openai.types.chat.chat_completion_chunk.ChatCompletionChunk",
+        "__data__": {
+          "id": "chatcmpl-358",
+          "choices": [
+            {
+              "delta": {
+                "content": " temperatures",
+                "function_call": null,
+                "refusal": null,
+                "role": "assistant",
+                "tool_calls": null
+              },
+              "finish_reason": null,
+              "index": 0,
+              "logprobs": null
+            }
+          ],
+          "created": 1756921331,
+          "model": "llama3.2:3b-instruct-fp16",
+          "object": "chat.completion.chunk",
+          "service_tier": null,
+          "system_fingerprint": "fp_ollama",
+          "usage": null
+        }
+      },
+      {
+        "__type__": "openai.types.chat.chat_completion_chunk.ChatCompletionChunk",
+        "__data__": {
+          "id": "chatcmpl-358",
+          "choices": [
+            {
+              "delta": {
+                "content": " ranging",
+                "function_call": null,
+                "refusal": null,
+                "role": "assistant",
+                "tool_calls": null
+              },
+              "finish_reason": null,
+              "index": 0,
+              "logprobs": null
+            }
+          ],
+          "created": 1756921331,
+          "model": "llama3.2:3b-instruct-fp16",
+          "object": "chat.completion.chunk",
+          "service_tier": null,
+          "system_fingerprint": "fp_ollama",
+          "usage": null
+        }
+      },
+      {
+        "__type__": "openai.types.chat.chat_completion_chunk.ChatCompletionChunk",
+        "__data__": {
+          "id": "chatcmpl-358",
+          "choices": [
+            {
+              "delta": {
+                "content": " from",
+                "function_call": null,
+                "refusal": null,
+                "role": "assistant",
+                "tool_calls": null
+              },
+              "finish_reason": null,
+              "index": 0,
+              "logprobs": null
+            }
+          ],
+          "created": 1756921331,
+          "model": "llama3.2:3b-instruct-fp16",
+          "object": "chat.completion.chunk",
+          "service_tier": null,
+          "system_fingerprint": "fp_ollama",
+          "usage": null
+        }
+      },
+      {
+        "__type__": "openai.types.chat.chat_completion_chunk.ChatCompletionChunk",
+        "__data__": {
+          "id": "chatcmpl-358",
+          "choices": [
+            {
+              "delta": {
+                "content": " -",
+                "function_call": null,
+                "refusal": null,
+                "role": "assistant",
+                "tool_calls": null
+              },
+              "finish_reason": null,
+              "index": 0,
+              "logprobs": null
+            }
+          ],
+          "created": 1756921331,
+          "model": "llama3.2:3b-instruct-fp16",
+          "object": "chat.completion.chunk",
+          "service_tier": null,
+          "system_fingerprint": "fp_ollama",
+          "usage": null
+        }
+      },
+      {
+        "__type__": "openai.types.chat.chat_completion_chunk.ChatCompletionChunk",
+        "__data__": {
+          "id": "chatcmpl-358",
+          "choices": [
+            {
+              "delta": {
+                "content": "2",
+                "function_call": null,
+                "refusal": null,
+                "role": "assistant",
+                "tool_calls": null
+              },
+              "finish_reason": null,
+              "index": 0,
+              "logprobs": null
+            }
+          ],
+          "created": 1756921331,
+          "model": "llama3.2:3b-instruct-fp16",
+          "object": "chat.completion.chunk",
+          "service_tier": null,
+          "system_fingerprint": "fp_ollama",
+          "usage": null
+        }
+      },
+      {
+        "__type__": "openai.types.chat.chat_completion_chunk.ChatCompletionChunk",
+        "__data__": {
+          "id": "chatcmpl-358",
+          "choices": [
+            {
+              "delta": {
+                "content": "\u00b0C",
+                "function_call": null,
+                "refusal": null,
+                "role": "assistant",
+                "tool_calls": null
+              },
+              "finish_reason": null,
+              "index": 0,
+              "logprobs": null
+            }
+          ],
+          "created": 1756921331,
+          "model": "llama3.2:3b-instruct-fp16",
+          "object": "chat.completion.chunk",
+          "service_tier": null,
+          "system_fingerprint": "fp_ollama",
+          "usage": null
+        }
+      },
+      {
+        "__type__": "openai.types.chat.chat_completion_chunk.ChatCompletionChunk",
+        "__data__": {
+          "id": "chatcmpl-358",
+          "choices": [
+            {
+              "delta": {
+                "content": " (",
+                "function_call": null,
+                "refusal": null,
+                "role": "assistant",
+                "tool_calls": null
+              },
+              "finish_reason": null,
+              "index": 0,
+              "logprobs": null
+            }
+          ],
+          "created": 1756921332,
+          "model": "llama3.2:3b-instruct-fp16",
+          "object": "chat.completion.chunk",
+          "service_tier": null,
+          "system_fingerprint": "fp_ollama",
+          "usage": null
+        }
+      },
+      {
+        "__type__": "openai.types.chat.chat_completion_chunk.ChatCompletionChunk",
+        "__data__": {
+          "id": "chatcmpl-358",
+          "choices": [
+            {
+              "delta": {
+                "content": "28",
+                "function_call": null,
+                "refusal": null,
+                "role": "assistant",
+                "tool_calls": null
+              },
+              "finish_reason": null,
+              "index": 0,
+              "logprobs": null
+            }
+          ],
+          "created": 1756921332,
+          "model": "llama3.2:3b-instruct-fp16",
+          "object": "chat.completion.chunk",
+          "service_tier": null,
+          "system_fingerprint": "fp_ollama",
+          "usage": null
+        }
+      },
+      {
+        "__type__": "openai.types.chat.chat_completion_chunk.ChatCompletionChunk",
+        "__data__": {
+          "id": "chatcmpl-358",
+          "choices": [
+            {
+              "delta": {
+                "content": "\u00b0F",
+                "function_call": null,
+                "refusal": null,
+                "role": "assistant",
+                "tool_calls": null
+              },
+              "finish_reason": null,
+              "index": 0,
+              "logprobs": null
+            }
+          ],
+          "created": 1756921332,
+          "model": "llama3.2:3b-instruct-fp16",
+          "object": "chat.completion.chunk",
+          "service_tier": null,
+          "system_fingerprint": "fp_ollama",
+          "usage": null
+        }
+      },
+      {
+        "__type__": "openai.types.chat.chat_completion_chunk.ChatCompletionChunk",
+        "__data__": {
+          "id": "chatcmpl-358",
+          "choices": [
+            {
+              "delta": {
+                "content": ")",
+                "function_call": null,
+                "refusal": null,
+                "role": "assistant",
+                "tool_calls": null
+              },
+              "finish_reason": null,
+              "index": 0,
+              "logprobs": null
+            }
+          ],
+          "created": 1756921332,
+          "model": "llama3.2:3b-instruct-fp16",
+          "object": "chat.completion.chunk",
+          "service_tier": null,
+          "system_fingerprint": "fp_ollama",
+          "usage": null
+        }
+      },
+      {
+        "__type__": "openai.types.chat.chat_completion_chunk.ChatCompletionChunk",
+        "__data__": {
+          "id": "chatcmpl-358",
+          "choices": [
+            {
+              "delta": {
+                "content": " to",
+                "function_call": null,
+                "refusal": null,
+                "role": "assistant",
+                "tool_calls": null
+              },
+              "finish_reason": null,
+              "index": 0,
+              "logprobs": null
+            }
+          ],
+          "created": 1756921332,
+          "model": "llama3.2:3b-instruct-fp16",
+          "object": "chat.completion.chunk",
+          "service_tier": null,
+          "system_fingerprint": "fp_ollama",
+          "usage": null
+        }
+      },
+      {
+        "__type__": "openai.types.chat.chat_completion_chunk.ChatCompletionChunk",
+        "__data__": {
+          "id": "chatcmpl-358",
+          "choices": [
+            {
+              "delta": {
+                "content": " ",
+                "function_call": null,
+                "refusal": null,
+                "role": "assistant",
+                "tool_calls": null
+              },
+              "finish_reason": null,
+              "index": 0,
+              "logprobs": null
+            }
+          ],
+          "created": 1756921332,
+          "model": "llama3.2:3b-instruct-fp16",
+          "object": "chat.completion.chunk",
+          "service_tier": null,
+          "system_fingerprint": "fp_ollama",
+          "usage": null
+        }
+      },
+      {
+        "__type__": "openai.types.chat.chat_completion_chunk.ChatCompletionChunk",
+        "__data__": {
+          "id": "chatcmpl-358",
+          "choices": [
+            {
+              "delta": {
+                "content": "10",
+                "function_call": null,
+                "refusal": null,
+                "role": "assistant",
+                "tool_calls": null
+              },
+              "finish_reason": null,
+              "index": 0,
+              "logprobs": null
+            }
+          ],
+          "created": 1756921332,
+          "model": "llama3.2:3b-instruct-fp16",
+          "object": "chat.completion.chunk",
+          "service_tier": null,
+          "system_fingerprint": "fp_ollama",
+          "usage": null
+        }
+      },
+      {
+        "__type__": "openai.types.chat.chat_completion_chunk.ChatCompletionChunk",
+        "__data__": {
+          "id": "chatcmpl-358",
+          "choices": [
+            {
+              "delta": {
+                "content": "\u00b0C",
+                "function_call": null,
+                "refusal": null,
+                "role": "assistant",
+                "tool_calls": null
+              },
+              "finish_reason": null,
+              "index": 0,
+              "logprobs": null
+            }
+          ],
+          "created": 1756921332,
+          "model": "llama3.2:3b-instruct-fp16",
+          "object": "chat.completion.chunk",
+          "service_tier": null,
+          "system_fingerprint": "fp_ollama",
+          "usage": null
+        }
+      },
+      {
+        "__type__": "openai.types.chat.chat_completion_chunk.ChatCompletionChunk",
+        "__data__": {
+          "id": "chatcmpl-358",
+          "choices": [
+            {
+              "delta": {
+                "content": " (",
+                "function_call": null,
+                "refusal": null,
+                "role": "assistant",
+                "tool_calls": null
+              },
+              "finish_reason": null,
+              "index": 0,
+              "logprobs": null
+            }
+          ],
+          "created": 1756921332,
+          "model": "llama3.2:3b-instruct-fp16",
+          "object": "chat.completion.chunk",
+          "service_tier": null,
+          "system_fingerprint": "fp_ollama",
+          "usage": null
+        }
+      },
+      {
+        "__type__": "openai.types.chat.chat_completion_chunk.ChatCompletionChunk",
+        "__data__": {
+          "id": "chatcmpl-358",
+          "choices": [
+            {
+              "delta": {
+                "content": "50",
+                "function_call": null,
+                "refusal": null,
+                "role": "assistant",
+                "tool_calls": null
+              },
+              "finish_reason": null,
+              "index": 0,
+              "logprobs": null
+            }
+          ],
+          "created": 1756921332,
+          "model": "llama3.2:3b-instruct-fp16",
+          "object": "chat.completion.chunk",
+          "service_tier": null,
+          "system_fingerprint": "fp_ollama",
+          "usage": null
+        }
+      },
+      {
+        "__type__": "openai.types.chat.chat_completion_chunk.ChatCompletionChunk",
+        "__data__": {
+          "id": "chatcmpl-358",
+          "choices": [
+            {
+              "delta": {
+                "content": "\u00b0F",
+                "function_call": null,
+                "refusal": null,
+                "role": "assistant",
+                "tool_calls": null
+              },
+              "finish_reason": null,
+              "index": 0,
+              "logprobs": null
+            }
+          ],
+          "created": 1756921332,
+          "model": "llama3.2:3b-instruct-fp16",
+          "object": "chat.completion.chunk",
+          "service_tier": null,
+          "system_fingerprint": "fp_ollama",
+          "usage": null
+        }
+      },
+      {
+        "__type__": "openai.types.chat.chat_completion_chunk.ChatCompletionChunk",
+        "__data__": {
+          "id": "chatcmpl-358",
+          "choices": [
+            {
+              "delta": {
+                "content": ").\n\n",
+                "function_call": null,
+                "refusal": null,
+                "role": "assistant",
+                "tool_calls": null
+              },
+              "finish_reason": null,
+              "index": 0,
+              "logprobs": null
+            }
+          ],
+          "created": 1756921332,
+          "model": "llama3.2:3b-instruct-fp16",
+          "object": "chat.completion.chunk",
+          "service_tier": null,
+          "system_fingerprint": "fp_ollama",
+          "usage": null
+        }
+      },
+      {
+        "__type__": "openai.types.chat.chat_completion_chunk.ChatCompletionChunk",
+        "__data__": {
+          "id": "chatcmpl-358",
+          "choices": [
+            {
+              "delta": {
+                "content": "To",
+                "function_call": null,
+                "refusal": null,
+                "role": "assistant",
+                "tool_calls": null
+              },
+              "finish_reason": null,
+              "index": 0,
+              "logprobs": null
+            }
+          ],
+          "created": 1756921332,
+          "model": "llama3.2:3b-instruct-fp16",
+          "object": "chat.completion.chunk",
+          "service_tier": null,
+          "system_fingerprint": "fp_ollama",
+          "usage": null
+        }
+      },
+      {
+        "__type__": "openai.types.chat.chat_completion_chunk.ChatCompletionChunk",
+        "__data__": {
+          "id": "chatcmpl-358",
+          "choices": [
+            {
+              "delta": {
+                "content": " get",
+                "function_call": null,
+                "refusal": null,
+                "role": "assistant",
+                "tool_calls": null
+              },
+              "finish_reason": null,
+              "index": 0,
+              "logprobs": null
+            }
+          ],
+          "created": 1756921332,
+          "model": "llama3.2:3b-instruct-fp16",
+          "object": "chat.completion.chunk",
+          "service_tier": null,
+          "system_fingerprint": "fp_ollama",
+          "usage": null
+        }
+      },
+      {
+        "__type__": "openai.types.chat.chat_completion_chunk.ChatCompletionChunk",
+        "__data__": {
+          "id": "chatcmpl-358",
+          "choices": [
+            {
+              "delta": {
+                "content": " the",
+                "function_call": null,
+                "refusal": null,
+                "role": "assistant",
+                "tool_calls": null
+              },
+              "finish_reason": null,
+              "index": 0,
+              "logprobs": null
+            }
+          ],
+          "created": 1756921332,
+          "model": "llama3.2:3b-instruct-fp16",
+          "object": "chat.completion.chunk",
+          "service_tier": null,
+          "system_fingerprint": "fp_ollama",
+          "usage": null
+        }
+      },
+      {
+        "__type__": "openai.types.chat.chat_completion_chunk.ChatCompletionChunk",
+        "__data__": {
+          "id": "chatcmpl-358",
+          "choices": [
+            {
+              "delta": {
+                "content": " current",
+                "function_call": null,
+                "refusal": null,
+                "role": "assistant",
+                "tool_calls": null
+              },
+              "finish_reason": null,
+              "index": 0,
+              "logprobs": null
+            }
+          ],
+          "created": 1756921332,
+          "model": "llama3.2:3b-instruct-fp16",
+          "object": "chat.completion.chunk",
+          "service_tier": null,
+          "system_fingerprint": "fp_ollama",
+          "usage": null
+        }
+      },
+      {
+        "__type__": "openai.types.chat.chat_completion_chunk.ChatCompletionChunk",
+        "__data__": {
+          "id": "chatcmpl-358",
+          "choices": [
+            {
+              "delta": {
+                "content": " weather",
+                "function_call": null,
+                "refusal": null,
+                "role": "assistant",
+                "tool_calls": null
+              },
+              "finish_reason": null,
+              "index": 0,
+              "logprobs": null
+            }
+          ],
+          "created": 1756921332,
+          "model": "llama3.2:3b-instruct-fp16",
+          "object": "chat.completion.chunk",
+          "service_tier": null,
+          "system_fingerprint": "fp_ollama",
+          "usage": null
+        }
+      },
+      {
+        "__type__": "openai.types.chat.chat_completion_chunk.ChatCompletionChunk",
+        "__data__": {
+          "id": "chatcmpl-358",
+          "choices": [
+            {
+              "delta": {
+                "content": " in",
+                "function_call": null,
+                "refusal": null,
+                "role": "assistant",
+                "tool_calls": null
+              },
+              "finish_reason": null,
+              "index": 0,
+              "logprobs": null
+            }
+          ],
+          "created": 1756921332,
+          "model": "llama3.2:3b-instruct-fp16",
+          "object": "chat.completion.chunk",
+          "service_tier": null,
+          "system_fingerprint": "fp_ollama",
+          "usage": null
+        }
+      },
+      {
+        "__type__": "openai.types.chat.chat_completion_chunk.ChatCompletionChunk",
+        "__data__": {
+          "id": "chatcmpl-358",
+          "choices": [
+            {
+              "delta": {
+                "content": " Tokyo",
+                "function_call": null,
+                "refusal": null,
+                "role": "assistant",
+                "tool_calls": null
+              },
+              "finish_reason": null,
+              "index": 0,
+              "logprobs": null
+            }
+          ],
+          "created": 1756921332,
+          "model": "llama3.2:3b-instruct-fp16",
+          "object": "chat.completion.chunk",
+          "service_tier": null,
+          "system_fingerprint": "fp_ollama",
+          "usage": null
+        }
+      },
+      {
+        "__type__": "openai.types.chat.chat_completion_chunk.ChatCompletionChunk",
+        "__data__": {
+          "id": "chatcmpl-358",
+          "choices": [
+            {
+              "delta": {
+                "content": ",",
+                "function_call": null,
+                "refusal": null,
+                "role": "assistant",
+                "tool_calls": null
+              },
+              "finish_reason": null,
+              "index": 0,
+              "logprobs": null
+            }
+          ],
+          "created": 1756921332,
+          "model": "llama3.2:3b-instruct-fp16",
+          "object": "chat.completion.chunk",
+          "service_tier": null,
+          "system_fingerprint": "fp_ollama",
+          "usage": null
+        }
+      },
+      {
+        "__type__": "openai.types.chat.chat_completion_chunk.ChatCompletionChunk",
+        "__data__": {
+          "id": "chatcmpl-358",
+          "choices": [
+            {
+              "delta": {
+                "content": " I",
+                "function_call": null,
+                "refusal": null,
+                "role": "assistant",
+                "tool_calls": null
+              },
+              "finish_reason": null,
+              "index": 0,
+              "logprobs": null
+            }
+          ],
+          "created": 1756921332,
+          "model": "llama3.2:3b-instruct-fp16",
+          "object": "chat.completion.chunk",
+          "service_tier": null,
+          "system_fingerprint": "fp_ollama",
+          "usage": null
+        }
+      },
+      {
+        "__type__": "openai.types.chat.chat_completion_chunk.ChatCompletionChunk",
+        "__data__": {
+          "id": "chatcmpl-358",
+          "choices": [
+            {
+              "delta": {
+                "content": " recommend",
+                "function_call": null,
+                "refusal": null,
+                "role": "assistant",
+                "tool_calls": null
+              },
+              "finish_reason": null,
+              "index": 0,
+              "logprobs": null
+            }
+          ],
+          "created": 1756921332,
+          "model": "llama3.2:3b-instruct-fp16",
+          "object": "chat.completion.chunk",
+          "service_tier": null,
+          "system_fingerprint": "fp_ollama",
+          "usage": null
+        }
+      },
+      {
+        "__type__": "openai.types.chat.chat_completion_chunk.ChatCompletionChunk",
+        "__data__": {
+          "id": "chatcmpl-358",
+          "choices": [
+            {
+              "delta": {
+                "content": " checking",
+                "function_call": null,
+                "refusal": null,
+                "role": "assistant",
+                "tool_calls": null
+              },
+              "finish_reason": null,
+              "index": 0,
+              "logprobs": null
+            }
+          ],
+          "created": 1756921332,
+          "model": "llama3.2:3b-instruct-fp16",
+          "object": "chat.completion.chunk",
+          "service_tier": null,
+          "system_fingerprint": "fp_ollama",
+          "usage": null
+        }
+      },
+      {
+        "__type__": "openai.types.chat.chat_completion_chunk.ChatCompletionChunk",
+        "__data__": {
+          "id": "chatcmpl-358",
+          "choices": [
+            {
+              "delta": {
+                "content": " online",
+                "function_call": null,
+                "refusal": null,
+                "role": "assistant",
+                "tool_calls": null
+              },
+              "finish_reason": null,
+              "index": 0,
+              "logprobs": null
+            }
+          ],
+          "created": 1756921332,
+          "model": "llama3.2:3b-instruct-fp16",
+          "object": "chat.completion.chunk",
+          "service_tier": null,
+          "system_fingerprint": "fp_ollama",
+          "usage": null
+        }
+      },
+      {
+        "__type__": "openai.types.chat.chat_completion_chunk.ChatCompletionChunk",
+        "__data__": {
+          "id": "chatcmpl-358",
+          "choices": [
+            {
+              "delta": {
+                "content": " resources",
+                "function_call": null,
+                "refusal": null,
+                "role": "assistant",
+                "tool_calls": null
+              },
+              "finish_reason": null,
+              "index": 0,
+              "logprobs": null
+            }
+          ],
+          "created": 1756921332,
+          "model": "llama3.2:3b-instruct-fp16",
+          "object": "chat.completion.chunk",
+          "service_tier": null,
+          "system_fingerprint": "fp_ollama",
+          "usage": null
+        }
+      },
+      {
+        "__type__": "openai.types.chat.chat_completion_chunk.ChatCompletionChunk",
+        "__data__": {
+          "id": "chatcmpl-358",
+          "choices": [
+            {
+              "delta": {
+                "content": " such",
+                "function_call": null,
+                "refusal": null,
+                "role": "assistant",
+                "tool_calls": null
+              },
+              "finish_reason": null,
+              "index": 0,
+              "logprobs": null
+            }
+          ],
+          "created": 1756921333,
+          "model": "llama3.2:3b-instruct-fp16",
+          "object": "chat.completion.chunk",
+          "service_tier": null,
+          "system_fingerprint": "fp_ollama",
+          "usage": null
+        }
+      },
+      {
+        "__type__": "openai.types.chat.chat_completion_chunk.ChatCompletionChunk",
+        "__data__": {
+          "id": "chatcmpl-358",
+          "choices": [
+            {
+              "delta": {
+                "content": " as",
+                "function_call": null,
+                "refusal": null,
+                "role": "assistant",
+                "tool_calls": null
+              },
+              "finish_reason": null,
+              "index": 0,
+              "logprobs": null
+            }
+          ],
+          "created": 1756921333,
+          "model": "llama3.2:3b-instruct-fp16",
+          "object": "chat.completion.chunk",
+          "service_tier": null,
+          "system_fingerprint": "fp_ollama",
+          "usage": null
+        }
+      },
+      {
+        "__type__": "openai.types.chat.chat_completion_chunk.ChatCompletionChunk",
+        "__data__": {
+          "id": "chatcmpl-358",
+          "choices": [
+            {
+              "delta": {
+                "content": " Acc",
+                "function_call": null,
+                "refusal": null,
+                "role": "assistant",
+                "tool_calls": null
+              },
+              "finish_reason": null,
+              "index": 0,
+              "logprobs": null
+            }
+          ],
+          "created": 1756921333,
+          "model": "llama3.2:3b-instruct-fp16",
+          "object": "chat.completion.chunk",
+          "service_tier": null,
+          "system_fingerprint": "fp_ollama",
+          "usage": null
+        }
+      },
+      {
+        "__type__": "openai.types.chat.chat_completion_chunk.ChatCompletionChunk",
+        "__data__": {
+          "id": "chatcmpl-358",
+          "choices": [
+            {
+              "delta": {
+                "content": "u",
+                "function_call": null,
+                "refusal": null,
+                "role": "assistant",
+                "tool_calls": null
+              },
+              "finish_reason": null,
+              "index": 0,
+              "logprobs": null
+            }
+          ],
+          "created": 1756921333,
+          "model": "llama3.2:3b-instruct-fp16",
+          "object": "chat.completion.chunk",
+          "service_tier": null,
+          "system_fingerprint": "fp_ollama",
+          "usage": null
+        }
+      },
+      {
+        "__type__": "openai.types.chat.chat_completion_chunk.ChatCompletionChunk",
+        "__data__": {
+          "id": "chatcmpl-358",
+          "choices": [
+            {
+              "delta": {
+                "content": "Weather",
+                "function_call": null,
+                "refusal": null,
+                "role": "assistant",
+                "tool_calls": null
+              },
+              "finish_reason": null,
+              "index": 0,
+              "logprobs": null
+            }
+          ],
+          "created": 1756921333,
+          "model": "llama3.2:3b-instruct-fp16",
+          "object": "chat.completion.chunk",
+          "service_tier": null,
+          "system_fingerprint": "fp_ollama",
+          "usage": null
+        }
+      },
+      {
+        "__type__": "openai.types.chat.chat_completion_chunk.ChatCompletionChunk",
+        "__data__": {
+          "id": "chatcmpl-358",
+          "choices": [
+            {
+              "delta": {
+                "content": ",",
+                "function_call": null,
+                "refusal": null,
+                "role": "assistant",
+                "tool_calls": null
+              },
+              "finish_reason": null,
+              "index": 0,
+              "logprobs": null
+            }
+          ],
+          "created": 1756921333,
+          "model": "llama3.2:3b-instruct-fp16",
+          "object": "chat.completion.chunk",
+          "service_tier": null,
+          "system_fingerprint": "fp_ollama",
+          "usage": null
+        }
+      },
+      {
+        "__type__": "openai.types.chat.chat_completion_chunk.ChatCompletionChunk",
+        "__data__": {
+          "id": "chatcmpl-358",
+          "choices": [
+            {
+              "delta": {
+                "content": " Weather",
+                "function_call": null,
+                "refusal": null,
+                "role": "assistant",
+                "tool_calls": null
+              },
+              "finish_reason": null,
+              "index": 0,
+              "logprobs": null
+            }
+          ],
+          "created": 1756921333,
+          "model": "llama3.2:3b-instruct-fp16",
+          "object": "chat.completion.chunk",
+          "service_tier": null,
+          "system_fingerprint": "fp_ollama",
+          "usage": null
+        }
+      },
+      {
+        "__type__": "openai.types.chat.chat_completion_chunk.ChatCompletionChunk",
+        "__data__": {
+          "id": "chatcmpl-358",
+          "choices": [
+            {
+              "delta": {
+                "content": ".com",
+                "function_call": null,
+                "refusal": null,
+                "role": "assistant",
+                "tool_calls": null
+              },
+              "finish_reason": null,
+              "index": 0,
+              "logprobs": null
+            }
+          ],
+          "created": 1756921333,
+          "model": "llama3.2:3b-instruct-fp16",
+          "object": "chat.completion.chunk",
+          "service_tier": null,
+          "system_fingerprint": "fp_ollama",
+          "usage": null
+        }
+      },
+      {
+        "__type__": "openai.types.chat.chat_completion_chunk.ChatCompletionChunk",
+        "__data__": {
+          "id": "chatcmpl-358",
+          "choices": [
+            {
+              "delta": {
+                "content": " or",
+                "function_call": null,
+                "refusal": null,
+                "role": "assistant",
+                "tool_calls": null
+              },
+              "finish_reason": null,
+              "index": 0,
+              "logprobs": null
+            }
+          ],
+          "created": 1756921333,
+          "model": "llama3.2:3b-instruct-fp16",
+          "object": "chat.completion.chunk",
+          "service_tier": null,
+          "system_fingerprint": "fp_ollama",
+          "usage": null
+        }
+      },
+      {
+        "__type__": "openai.types.chat.chat_completion_chunk.ChatCompletionChunk",
+        "__data__": {
+          "id": "chatcmpl-358",
+          "choices": [
+            {
+              "delta": {
+                "content": " Met",
+                "function_call": null,
+                "refusal": null,
+                "role": "assistant",
+                "tool_calls": null
+              },
+              "finish_reason": null,
+              "index": 0,
+              "logprobs": null
+            }
+          ],
+          "created": 1756921333,
+          "model": "llama3.2:3b-instruct-fp16",
+          "object": "chat.completion.chunk",
+          "service_tier": null,
+          "system_fingerprint": "fp_ollama",
+          "usage": null
+        }
+      },
+      {
+        "__type__": "openai.types.chat.chat_completion_chunk.ChatCompletionChunk",
+        "__data__": {
+          "id": "chatcmpl-358",
+          "choices": [
+            {
+              "delta": {
+                "content": "e",
+                "function_call": null,
+                "refusal": null,
+                "role": "assistant",
+                "tool_calls": null
+              },
+              "finish_reason": null,
+              "index": 0,
+              "logprobs": null
+            }
+          ],
+          "created": 1756921333,
+          "model": "llama3.2:3b-instruct-fp16",
+          "object": "chat.completion.chunk",
+          "service_tier": null,
+          "system_fingerprint": "fp_ollama",
+          "usage": null
+        }
+      },
+      {
+        "__type__": "openai.types.chat.chat_completion_chunk.ChatCompletionChunk",
+        "__data__": {
+          "id": "chatcmpl-358",
+          "choices": [
+            {
+              "delta": {
+                "content": "ors",
+                "function_call": null,
+                "refusal": null,
+                "role": "assistant",
+                "tool_calls": null
+              },
+              "finish_reason": null,
+              "index": 0,
+              "logprobs": null
+            }
+          ],
+          "created": 1756921333,
+          "model": "llama3.2:3b-instruct-fp16",
+          "object": "chat.completion.chunk",
+          "service_tier": null,
+          "system_fingerprint": "fp_ollama",
+          "usage": null
+        }
+      },
+      {
+        "__type__": "openai.types.chat.chat_completion_chunk.ChatCompletionChunk",
+        "__data__": {
+          "id": "chatcmpl-358",
+          "choices": [
+            {
+              "delta": {
+                "content": ".",
+                "function_call": null,
+                "refusal": null,
+                "role": "assistant",
+                "tool_calls": null
+              },
+              "finish_reason": null,
+              "index": 0,
+              "logprobs": null
+            }
+          ],
+          "created": 1756921333,
+          "model": "llama3.2:3b-instruct-fp16",
+          "object": "chat.completion.chunk",
+          "service_tier": null,
+          "system_fingerprint": "fp_ollama",
+          "usage": null
+        }
+      },
+      {
+        "__type__": "openai.types.chat.chat_completion_chunk.ChatCompletionChunk",
+        "__data__": {
+          "id": "chatcmpl-358",
           "choices": [
             {
               "delta": {
@@ -5265,7 +5733,7 @@
               "logprobs": null
             }
           ],
-          "created": 1755228970,
+          "created": 1756921333,
           "model": "llama3.2:3b-instruct-fp16",
           "object": "chat.completion.chunk",
           "service_tier": null,
diff --git a/tests/integration/recordings/responses/70adef2c30c4.json b/tests/integration/recordings/responses/70adef2c30c4.json
index c17f21631..f8f3ce7df 100644
--- a/tests/integration/recordings/responses/70adef2c30c4.json
+++ b/tests/integration/recordings/responses/70adef2c30c4.json
@@ -20,15 +20,15 @@
       "__type__": "ollama._types.GenerateResponse",
       "__data__": {
         "model": "llama3.2:3b-instruct-fp16",
-        "created_at": "2025-08-04T22:55:55.720345Z",
+        "created_at": "2025-09-03T17:42:17.227488Z",
         "done": true,
         "done_reason": "stop",
-        "total_duration": 3865701084,
-        "load_duration": 52435459,
+        "total_duration": 3003964916,
+        "load_duration": 111221916,
         "prompt_eval_count": 30,
-        "prompt_eval_duration": 99000000,
+        "prompt_eval_duration": 72578583,
         "eval_count": 70,
-        "eval_duration": 3712000000,
+        "eval_duration": 2819555375,
         "response": "The answer is Saturn! Saturn's ring system is one of the most iconic and well-known in our solar system. The rings are made up of ice particles, rock debris, and dust that orbit around the planet due to its gravitational pull.\n\nWould you like to know more about Saturn's rings or is there something else I can help you with?",
         "thinking": null,
         "context": null
diff --git a/tests/integration/recordings/responses/72c1126ff2f9.json b/tests/integration/recordings/responses/72c1126ff2f9.json
index b474c7e21..f50c68953 100644
--- a/tests/integration/recordings/responses/72c1126ff2f9.json
+++ b/tests/integration/recordings/responses/72c1126ff2f9.json
@@ -20,390 +20,390 @@
         "data": [
           {
             "embedding": [
-              -0.024362812,
-              0.016713308,
-              0.03763492,
-              -0.009156733,
-              -0.030551745,
-              -0.017125947,
-              0.07426094,
-              0.045657348,
-              -0.0093097305,
-              0.009920903,
-              -0.005690781,
-              0.0076895193,
-              0.039548296,
-              0.015248784,
-              -0.083151944,
-              0.019454934,
-              -0.02207085,
-              -0.033246633,
-              -0.1810784,
-              -0.1302997,
-              -0.0022484967,
-              0.013480844,
-              -0.024304103,
-              -0.03698983,
-              0.001961629,
-              0.08568096,
-              0.004767316,
-              -0.0034146819,
-              -0.0060834372,
-              -0.11571087,
-              0.06683183,
-              -0.01873301,
-              0.08783993,
-              -0.0074664783,
-              -0.09357002,
-              0.061450087,
-              -0.0810802,
-              0.012219781,
-              0.039706405,
-              -0.002647126,
-              -0.046620198,
-              -0.081851535,
-              0.039566126,
-              0.015464555,
-              0.043695353,
-              0.10368333,
-              -0.058397062,
-              0.03668824,
-              -0.052697357,
-              0.04057381,
-              -0.12580334,
-              0.0065060873,
-              -0.035828654,
-              -0.010048116,
-              -0.023825277,
-              0.045975305,
-              0.014622974,
-              0.019410197,
-              0.028452095,
-              -0.05502182,
-              0.024185732,
-              -0.052869923,
-              0.015245502,
-              -0.00438015,
-              0.09234898,
-              0.033873633,
-              -0.047367375,
-              0.032001555,
-              0.0013095026,
-              -0.051196218,
-              0.025864813,
-              0.081560105,
-              0.040911082,
-              0.019192263,
-              0.056467537,
-              -0.052748967,
-              0.030553715,
-              -0.016636984,
-              0.07878182,
-              -0.054208696,
-              -0.042150352,
-              -0.045420144,
-              -0.05269096,
-              0.11224785,
-              0.019874783,
-              -0.0423623,
-              -0.011692426,
-              0.024343297,
-              0.01916104,
-              -0.016559148,
-              -0.010328452,
-              -0.085476756,
-              0.02384857,
-              -0.042118136,
-              -0.024980163,
-              0.062104426,
-              -0.004581602,
-              -0.15367238,
-              0.001102325,
-              0.19421555,
-              -0.03386706,
-              0.026160223,
-              -0.020320892,
-              0.0012947157,
-              -0.0010485641,
-              -0.024099724,
-              0.017537115,
-              -0.009841853,
-              0.070402764,
-              -0.13768643,
-              -0.111146465,
-              -0.017362772,
-              0.06603636,
-              -0.051869333,
-              0.0019475558,
-              0.014572362,
-              0.060779307,
-              0.09626945,
-              0.0135371,
-              0.019355945,
-              -8.543184e-05,
-              -0.026694054,
-              -0.009353406,
-              0.07085975,
-              -0.0034419452,
-              -0.062405273,
-              -0.044579133,
-              -8.80938e-34,
-              -0.11187708,
-              -0.04253664,
-              0.027483786,
-              0.06572092,
-              0.0028295182,
-              -0.044070996,
-              0.0052582966,
-              -0.036901183,
-              -0.015558772,
-              0.020610636,
-              -0.059269626,
-              0.0072413837,
-              -0.028733822,
-              0.04047375,
-              0.13381885,
-              0.0068082553,
-              -0.016386433,
-              0.08218299,
-              -0.022658324,
-              -0.036435697,
-              0.06526089,
-              0.021031637,
-              -0.0054843347,
-              -0.038373824,
-              0.0014984249,
-              0.007331966,
-              0.01677609,
-              -0.06269722,
-              0.035417397,
-              -0.014398793,
-              0.027875954,
-              0.08376195,
-              -0.02777757,
-              -0.0036516306,
-              0.03904687,
-              -0.026841529,
-              -0.018736342,
-              0.01903094,
-              0.0651818,
-              0.0070574977,
-              0.0047951937,
-              -0.002987134,
-              0.04006833,
-              0.028001927,
-              -0.004688176,
-              0.012248329,
-              0.08704812,
-              -0.0070376135,
-              -0.037495255,
-              0.011267182,
-              0.015406452,
-              0.013771707,
-              0.017957818,
-              -0.009838073,
-              0.09011513,
-              0.051697087,
-              -0.034220304,
-              0.0043991045,
-              -0.018898288,
-              -0.031457234,
-              0.08212252,
-              0.016876385,
-              -0.022177191,
-              0.06844393,
-              0.015856383,
-              0.0203176,
-              0.0063723125,
-              0.016462969,
-              0.12720266,
-              0.014975143,
-              -0.010839063,
-              0.0017705995,
-              0.031662926,
-              -0.04433757,
-              -0.052297786,
-              0.022821713,
-              0.050960623,
-              -0.018954914,
-              0.0027527376,
-              -0.033637978,
-              -0.13569047,
-              -0.027035592,
-              -0.035660848,
-              -0.03351404,
-              0.047857523,
-              -0.0054172846,
-              0.02130265,
-              -0.040015485,
-              0.019387608,
-              0.012020892,
-              -0.043413315,
-              0.0005315479,
-              0.03484659,
-              0.017950043,
-              -0.062462628,
-              8.226272e-34,
-              -0.09449095,
-              0.013739951,
-              -0.025383765,
-              0.09899241,
-              0.04552389,
-              -0.020521628,
-              -0.029724384,
-              -0.059252843,
-              0.042447623,
-              0.08444559,
-              -0.043226957,
-              -0.0077667157,
-              0.049366944,
-              0.042077936,
-              -0.03653644,
-              0.014414636,
-              0.04032418,
-              -0.05892782,
-              0.010031362,
-              0.059879642,
-              -0.02792402,
-              0.03490713,
-              -0.08760264,
-              -0.060620386,
-              -0.0048639597,
-              0.087776646,
-              -0.005353071,
-              -0.02175546,
-              -0.048133314,
-              0.046915755,
-              0.008341115,
-              -0.05175852,
-              -0.02040021,
-              0.085782945,
-              -0.0226071,
-              0.034415677,
-              -0.014505325,
-              0.0030903826,
-              -0.046515204,
-              0.030268563,
-              0.039748456,
-              0.029745733,
-              -0.093127884,
-              0.051514212,
-              0.007829255,
-              -0.057012733,
-              -0.041812178,
-              0.089898124,
-              -0.008121904,
-              -0.040828798,
-              -0.05349857,
-              -0.034339238,
-              -0.045287646,
-              -0.097146384,
-              -0.058177214,
-              0.060921844,
-              -0.009064236,
-              0.0069495556,
-              0.012338063,
-              0.062054638,
-              -0.0060062264,
-              -0.08641508,
-              0.058708947,
-              0.053361338,
-              -0.05353899,
-              0.03950934,
-              -0.044963278,
-              0.07279474,
-              -0.0396003,
-              -0.051377922,
-              0.10337406,
-              0.021824561,
-              0.00013547574,
-              0.009485335,
-              0.021997929,
-              -0.0069047622,
-              -0.12891105,
-              -0.009861611,
-              -0.03639449,
-              -0.04249355,
-              0.0044484157,
-              -0.04767584,
-              0.0065166815,
-              0.1026327,
-              -0.053176586,
-              0.073318355,
-              0.015824493,
-              -0.029136809,
-              0.02512151,
-              -0.06307736,
-              -0.043478984,
-              0.067193694,
-              0.014923451,
-              -0.0011417158,
-              -0.098718524,
-              -1.4681537e-08,
-              0.00463343,
-              -0.06712206,
-              0.076443635,
-              -0.019814128,
-              0.0673915,
-              0.044810813,
-              -0.051008355,
-              -0.0077217882,
-              -0.02932436,
-              0.028841449,
-              0.018885555,
-              -0.024309436,
-              0.044141307,
-              0.044167083,
-              0.03432404,
-              0.046535607,
-              0.021588394,
-              -0.0017551337,
-              -0.0029986037,
-              0.014399799,
-              0.12530664,
-              0.034310702,
-              -0.0146423085,
-              0.03919942,
-              -0.002325517,
-              -0.014395083,
-              0.0100815315,
-              0.024295514,
-              -0.04172604,
-              0.08835341,
-              -0.031463772,
-              0.030068664,
-              -0.0029138532,
-              0.0048975134,
-              0.09590149,
-              0.09393541,
-              0.0141605595,
-              -0.07715167,
-              -0.039247666,
-              -0.010700626,
-              -0.008573732,
-              0.06410113,
-              -0.03301776,
-              -0.030493528,
-              0.09457071,
-              -0.008976579,
-              -0.029922878,
-              -0.13298088,
-              0.059931017,
-              -0.011697307,
-              0.007152748,
-              0.03558696,
-              0.0040925406,
-              0.056160007,
-              0.07656515,
-              -0.010041294,
-              0.0567585,
-              0.023536174,
-              -0.06379649,
-              0.08937482,
-              0.04375676,
-              0.043407574,
-              0.04633825,
-              -0.07037851
+              -0.024330618,
+              0.016706783,
+              0.037677176,
+              -0.00915746,
+              -0.030534461,
+              -0.017140884,
+              0.074272,
+              0.0456916,
+              -0.009377196,
+              0.009883053,
+              -0.0056895507,
+              0.007668296,
+              0.039537333,
+              0.015226257,
+              -0.083189555,
+              0.019439526,
+              -0.022046678,
+              -0.033254813,
+              -0.18105465,
+              -0.13025087,
+              -0.0022671346,
+              0.013451522,
+              -0.024325468,
+              -0.0370128,
+              0.0020083552,
+              0.08566712,
+              0.0047639925,
+              -0.0033431018,
+              -0.006082307,
+              -0.11575565,
+              0.06682902,
+              -0.018777572,
+              0.08786827,
+              -0.0074177794,
+              -0.093573004,
+              0.06146399,
+              -0.08110609,
+              0.012222862,
+              0.03971064,
+              -0.0026197461,
+              -0.04657111,
+              -0.08183902,
+              0.03959615,
+              0.015451151,
+              0.04370617,
+              0.103643835,
+              -0.058421485,
+              0.036699355,
+              -0.052699573,
+              0.040590122,
+              -0.12578927,
+              0.006500531,
+              -0.03583627,
+              -0.010050973,
+              -0.023851713,
+              0.045972254,
+              0.014605586,
+              0.019414552,
+              0.028465148,
+              -0.055030964,
+              0.024210233,
+              -0.052867457,
+              0.015230711,
+              -0.0043921247,
+              0.092372045,
+              0.033849865,
+              -0.04737281,
+              0.03204496,
+              0.001322036,
+              -0.051211488,
+              0.025862284,
+              0.08155327,
+              0.04092595,
+              0.019154705,
+              0.056453932,
+              -0.052758913,
+              0.030533386,
+              -0.01663434,
+              0.07877244,
+              -0.054262977,
+              -0.042149354,
+              -0.045443602,
+              -0.052689902,
+              0.11225497,
+              0.01989102,
+              -0.042375352,
+              -0.01168115,
+              0.024315914,
+              0.01915792,
+              -0.016550383,
+              -0.01030883,
+              -0.08545277,
+              0.023834355,
+              -0.042181373,
+              -0.02503509,
+              0.062114798,
+              -0.0045557353,
+              -0.15369569,
+              0.001106691,
+              0.19423288,
+              -0.0338511,
+              0.026152972,
+              -0.02032091,
+              0.0012884078,
+              -0.0010269672,
+              -0.02411262,
+              0.017495485,
+              -0.009808713,
+              0.07037937,
+              -0.13769862,
+              -0.11118059,
+              -0.01736481,
+              0.06603106,
+              -0.05188892,
+              0.0019610007,
+              0.014606686,
+              0.060775463,
+              0.096280165,
+              0.013551965,
+              0.019343173,
+              -0.00010512453,
+              -0.026652312,
+              -0.009341819,
+              0.07083247,
+              -0.0034617546,
+              -0.062412772,
+              -0.044611085,
+              -8.796679e-34,
+              -0.111884,
+              -0.04256611,
+              0.027425196,
+              0.06574074,
+              0.002830377,
+              -0.044104468,
+              0.005238822,
+              -0.036899913,
+              -0.015583552,
+              0.0206543,
+              -0.059225976,
+              0.007236511,
+              -0.028716031,
+              0.040467348,
+              0.13387093,
+              0.006795838,
+              -0.01636956,
+              0.082198486,
+              -0.02261007,
+              -0.03641293,
+              0.06524453,
+              0.021011814,
+              -0.005472363,
+              -0.038433436,
+              0.001462021,
+              0.0073671984,
+              0.016773427,
+              -0.062663026,
+              0.035388503,
+              -0.014395795,
+              0.027888605,
+              0.0837546,
+              -0.027772024,
+              -0.0036210797,
+              0.03903557,
+              -0.026879627,
+              -0.018737236,
+              0.019059159,
+              0.06522148,
+              0.0070414003,
+              0.004749159,
+              -0.0030224407,
+              0.040062208,
+              0.028016094,
+              -0.004660955,
+              0.012264517,
+              0.08708117,
+              -0.0070171114,
+              -0.03749808,
+              0.011326775,
+              0.015419708,
+              0.013775354,
+              0.017958472,
+              -0.009817919,
+              0.09011542,
+              0.05170552,
+              -0.034259036,
+              0.0043903207,
+              -0.01884889,
+              -0.031481344,
+              0.08216297,
+              0.016875258,
+              -0.022163702,
+              0.06844141,
+              0.01581623,
+              0.020322658,
+              0.0063856863,
+              0.016461994,
+              0.12718283,
+              0.014996434,
+              -0.010813858,
+              0.0017669421,
+              0.03166716,
+              -0.044353984,
+              -0.05225622,
+              0.022843942,
+              0.050988898,
+              -0.018916955,
+              0.0027930918,
+              -0.033645593,
+              -0.13571611,
+              -0.027015164,
+              -0.035672266,
+              -0.033537813,
+              0.047864296,
+              -0.0054381513,
+              0.021346755,
+              -0.040034927,
+              0.019374551,
+              0.012011466,
+              -0.04336231,
+              0.00054701004,
+              0.034879614,
+              0.017960642,
+              -0.062501945,
+              8.224154e-34,
+              -0.09450138,
+              0.013776636,
+              -0.025351105,
+              0.098992504,
+              0.045503527,
+              -0.02053458,
+              -0.029694881,
+              -0.059200566,
+              0.042453792,
+              0.0844487,
+              -0.043211546,
+              -0.0077362363,
+              0.049354795,
+              0.04203366,
+              -0.036539596,
+              0.014424774,
+              0.040357023,
+              -0.058971472,
+              0.010022987,
+              0.059877146,
+              -0.02790864,
+              0.034927685,
+              -0.087597504,
+              -0.060616262,
+              -0.0048867166,
+              0.08776906,
+              -0.0053599468,
+              -0.021816833,
+              -0.048162397,
+              0.046919785,
+              0.0083988905,
+              -0.0517289,
+              -0.020422187,
+              0.08581073,
+              -0.022597926,
+              0.034425046,
+              -0.014506674,
+              0.0031332907,
+              -0.04651877,
+              0.030281488,
+              0.039713897,
+              0.02969227,
+              -0.09310218,
+              0.051527865,
+              0.007809,
+              -0.05700871,
+              -0.041792583,
+              0.08987064,
+              -0.00813404,
+              -0.04082285,
+              -0.053487595,
+              -0.034378976,
+              -0.045253906,
+              -0.09715307,
+              -0.058194414,
+              0.06093547,
+              -0.009079956,
+              0.006918499,
+              0.012345728,
+              0.062036473,
+              -0.0060238577,
+              -0.0864295,
+              0.05872831,
+              0.053304974,
+              -0.05352623,
+              0.039521407,
+              -0.04498403,
+              0.0727911,
+              -0.039616212,
+              -0.05134442,
+              0.10334881,
+              0.02176773,
+              0.00016648973,
+              0.009423309,
+              0.022016358,
+              -0.006902813,
+              -0.128883,
+              -0.009864072,
+              -0.036396757,
+              -0.042481646,
+              0.004420737,
+              -0.047660243,
+              0.0065179355,
+              0.102602735,
+              -0.053166825,
+              0.07328581,
+              0.015810944,
+              -0.029149039,
+              0.025130944,
+              -0.063055776,
+              -0.043462534,
+              0.06719971,
+              0.014921177,
+              -0.0010985207,
+              -0.09869465,
+              -1.4682753e-08,
+              0.004611013,
+              -0.06715223,
+              0.07644809,
+              -0.019802453,
+              0.06737909,
+              0.044783685,
+              -0.050963327,
+              -0.0077186874,
+              -0.029319718,
+              0.028867716,
+              0.018877175,
+              -0.024279349,
+              0.04412064,
+              0.04416273,
+              0.03432814,
+              0.046517964,
+              0.02158077,
+              -0.001748483,
+              -0.0029956794,
+              0.014355785,
+              0.12525895,
+              0.03431845,
+              -0.014617591,
+              0.039184693,
+              -0.0023036227,
+              -0.014352919,
+              0.01010173,
+              0.02430961,
+              -0.041730728,
+              0.08832413,
+              -0.031459343,
+              0.030073628,
+              -0.0029376182,
+              0.0049478672,
+              0.09588392,
+              0.09396655,
+              0.01412568,
+              -0.077148266,
+              -0.039246846,
+              -0.01064901,
+              -0.008556093,
+              0.06409403,
+              -0.033037152,
+              -0.03049978,
+              0.0945846,
+              -0.008954658,
+              -0.029921891,
+              -0.132985,
+              0.059934624,
+              -0.011668423,
+              0.0071737366,
+              0.035627652,
+              0.0041028745,
+              0.056198087,
+              0.07656151,
+              -0.010067092,
+              0.05678312,
+              0.023536043,
+              -0.063770495,
+              0.08934554,
+              0.043756966,
+              0.04337246,
+              0.046287052,
+              -0.07039028
             ],
             "index": 0,
             "object": "embedding"
diff --git a/tests/integration/recordings/responses/7354ec181984.json b/tests/integration/recordings/responses/7354ec181984.json
index 0404c6a6a..b73a7cd50 100644
--- a/tests/integration/recordings/responses/7354ec181984.json
+++ b/tests/integration/recordings/responses/7354ec181984.json
@@ -20,15 +20,15 @@
       "__type__": "ollama._types.GenerateResponse",
       "__data__": {
         "model": "llama3.2:3b-instruct-fp16",
-        "created_at": "2025-07-31T17:51:16.201313167Z",
+        "created_at": "2025-09-03T17:39:54.374714Z",
         "done": true,
         "done_reason": "stop",
-        "total_duration": 27475921912,
-        "load_duration": 40564716,
+        "total_duration": 6321793333,
+        "load_duration": 182255958,
         "prompt_eval_count": 25,
-        "prompt_eval_duration": 964907432,
+        "prompt_eval_duration": 67964459,
         "eval_count": 150,
-        "eval_duration": 26469935419,
+        "eval_duration": 6070867875,
         "response": "The smallest country in the world is the Vatican City, which has a total area of approximately 0.44 km\u00b2 (0.17 sq mi). It is an independent city-state located within Rome, Italy, and is home to the Pope and the central government of the Catholic Church.\n\nTo put that into perspective, the Vatican City is smaller than a golf course! Despite its tiny size, it has its own government, currency, postal system, and even its own police force. It's also home to numerous iconic landmarks like St. Peter's Basilica and the Sistine Chapel.\n\nInterestingly, the Vatican City is not only the smallest country in the world but also the most densely populated, with a population of just over 800 people!",
         "thinking": null,
         "context": null
diff --git a/tests/integration/recordings/responses/75d0dd9d0fa3.json b/tests/integration/recordings/responses/75d0dd9d0fa3.json
index 52c5d574d..561fa1e67 100644
--- a/tests/integration/recordings/responses/75d0dd9d0fa3.json
+++ b/tests/integration/recordings/responses/75d0dd9d0fa3.json
@@ -45,15 +45,15 @@
       "__type__": "ollama._types.GenerateResponse",
       "__data__": {
         "model": "llama3.2:3b-instruct-fp16",
-        "created_at": "2025-08-04T22:55:10.58267Z",
+        "created_at": "2025-09-03T17:36:17.508028Z",
         "done": true,
         "done_reason": "stop",
-        "total_duration": 1981967792,
-        "load_duration": 63184458,
+        "total_duration": 1529591917,
+        "load_duration": 84990667,
         "prompt_eval_count": 119,
-        "prompt_eval_duration": 259000000,
+        "prompt_eval_duration": 189045583,
         "eval_count": 29,
-        "eval_duration": 1582000000,
+        "eval_duration": 1254813583,
         "response": "{ \"name\": \"Michael Jordan\", \"year_born\": \"1963\", \"year_retired\": \"2003\"}\n    ",
         "thinking": null,
         "context": null
diff --git a/tests/integration/recordings/responses/7b25b702ea18.json b/tests/integration/recordings/responses/7b25b702ea18.json
index bf8fb73d9..29a978e07 100644
--- a/tests/integration/recordings/responses/7b25b702ea18.json
+++ b/tests/integration/recordings/responses/7b25b702ea18.json
@@ -20,390 +20,390 @@
         "data": [
           {
             "embedding": [
-              0.06829144,
-              0.061772227,
-              -0.0064161597,
-              0.082678765,
-              -0.07824987,
-              0.026521353,
-              0.13125585,
-              0.041369338,
-              -0.019540362,
-              -0.02709599,
-              0.0887907,
-              -0.10275329,
-              0.050712623,
-              -0.07134879,
-              -0.009282846,
-              -0.039247703,
-              0.028860288,
-              -0.01049117,
-              -0.024684245,
-              -0.035460133,
-              -0.04094595,
-              -0.009883736,
-              -0.026154075,
-              0.057957783,
-              -0.00061253883,
-              0.0076184087,
-              0.013905776,
-              -0.0016500223,
-              0.044650607,
-              -0.05900644,
-              -0.037936445,
-              0.037789088,
-              -0.03326097,
-              0.07172011,
-              0.09720765,
-              -0.082623295,
-              0.027609807,
-              -0.014166528,
-              0.018201344,
-              -0.0026497827,
-              -0.024251994,
-              -0.114919275,
-              0.08516042,
-              -0.01674906,
-              -0.0063111004,
-              0.06525075,
-              -0.058014978,
-              0.09666779,
-              -0.014186084,
-              -0.006836795,
-              -0.09889106,
-              -0.015126775,
-              -0.0783394,
-              -0.03557229,
-              -0.008273864,
-              -0.013632112,
-              -0.07621237,
-              -0.03039195,
-              -0.0135569805,
-              0.050146695,
-              -0.01059567,
-              -0.03840819,
-              0.0674032,
-              0.035650622,
-              0.010801949,
-              -0.07822949,
-              -0.0068962453,
-              -0.03009482,
-              0.055947337,
-              -0.07680802,
-              -0.009078504,
-              -0.002788809,
-              -0.02937109,
-              0.06879565,
-              0.013748122,
-              0.030850956,
-              -0.03644146,
-              -0.07147028,
-              0.05473256,
-              -0.028970802,
-              -0.064664625,
-              -0.059753876,
-              -0.067655295,
-              0.022762805,
-              0.07949517,
-              0.051779337,
-              0.14793634,
-              -0.0025083658,
-              -0.05545431,
-              -0.027768994,
-              0.019383226,
-              0.06685648,
-              -0.0795505,
-              0.01904091,
-              -0.00094253226,
-              0.0134609025,
-              0.03820869,
-              -0.040206373,
-              0.0649827,
-              0.13925305,
-              0.059302386,
-              0.018050361,
-              -0.049063586,
-              -0.057463937,
-              -0.17034325,
-              0.0098234955,
-              0.04479311,
-              -0.08709996,
-              0.046848226,
-              -0.02031104,
-              -0.062256135,
-              0.030291956,
-              0.04995267,
-              -0.03062274,
-              -0.007244306,
-              -0.06063938,
-              -0.0057327296,
-              0.028709931,
-              -0.055921447,
-              -0.006099839,
-              0.07552849,
-              0.073059924,
-              -0.031967085,
-              -0.027995033,
-              -0.0013227675,
-              0.0237769,
-              0.08236448,
-              -2.0790976e-33,
-              0.014696224,
-              -0.0849667,
-              0.05938996,
-              -0.007827523,
-              -0.015969144,
-              0.025970377,
-              0.03762491,
-              0.1256464,
-              -0.04001108,
-              0.024740757,
-              0.014459392,
-              -0.063038975,
-              0.0340931,
-              -0.0076668505,
-              0.008167134,
-              0.10462719,
-              0.018821232,
-              -0.021525906,
-              -0.04383254,
-              0.05684103,
-              0.016244315,
-              -0.07351815,
-              0.02012839,
-              0.05243149,
-              0.015002977,
-              -0.06589196,
-              -0.032537818,
-              0.024986163,
-              0.018428918,
-              -0.0003134351,
-              -0.06270619,
-              -0.0061910586,
-              -0.16043852,
-              0.028163772,
-              0.033009354,
-              0.03727067,
-              0.05406701,
-              -0.007932531,
-              -0.008608034,
-              0.054109853,
-              -0.046951395,
-              -0.03869324,
-              0.084930494,
-              -0.005905675,
-              0.021937586,
-              -0.052074514,
-              -0.047481276,
-              -0.054886986,
-              0.034032077,
-              -0.02832154,
-              -0.032060325,
-              -0.0013834401,
-              -0.040383566,
-              -0.017775834,
-              0.05222146,
-              0.0038051854,
-              0.008726582,
-              0.032692313,
-              0.010791591,
-              0.11194475,
-              -0.019752404,
-              -0.045764305,
-              -0.0020202047,
-              0.020939285,
-              -0.006159919,
-              -0.0017409867,
-              -0.0068266885,
-              -0.081341885,
-              0.091841556,
-              0.048661314,
-              0.07770758,
-              -0.058719456,
-              0.0063417573,
-              0.0036042097,
-              -0.071244255,
-              0.022036737,
-              0.019486615,
-              0.101281255,
-              0.0066442927,
-              -0.044674896,
-              0.06144362,
-              -0.09196092,
-              -0.0133002605,
-              0.014585881,
-              -0.017600225,
-              0.007354116,
-              0.006177494,
-              -0.048051644,
-              0.013157643,
-              -0.07767093,
-              0.014147597,
-              0.035391673,
-              -0.026176892,
-              0.002718191,
-              0.08641935,
-              9.148517e-34,
-              -0.022012252,
-              0.05088286,
-              -0.02727955,
-              0.028613139,
-              0.013718326,
-              -0.07109317,
-              0.09039982,
-              -0.090625234,
-              -0.06567498,
-              0.06685471,
-              0.066993244,
-              -0.05015442,
-              0.019033352,
-              -0.041487213,
-              0.012605603,
-              0.06907699,
-              0.0281946,
-              -0.070972204,
-              -0.061149873,
-              0.031668104,
-              -0.09625139,
-              0.13133687,
-              -0.0035538,
-              -0.027149519,
-              -0.06298852,
-              -0.0009207272,
-              -0.008693039,
-              -0.031348817,
-              -0.018568903,
-              0.011527607,
-              0.07185478,
-              -0.071952716,
-              -0.0059043416,
-              0.09352268,
-              0.046653684,
-              -0.031974927,
-              0.069581434,
-              -0.045875963,
-              0.010133493,
-              0.064104505,
-              0.07243221,
-              0.04723149,
-              0.04880478,
-              0.06762142,
-              0.005496453,
-              0.035764992,
-              0.01831371,
-              -0.038210426,
-              0.050088413,
-              0.041379653,
-              -0.02544787,
-              0.021565115,
-              0.014279919,
-              -0.0071081445,
-              -0.014286643,
-              -0.010122217,
-              -0.091654085,
-              0.009356054,
-              0.0043320316,
-              -0.009591156,
-              -0.029850187,
-              0.17471492,
-              -0.0045922897,
-              0.05783941,
-              -0.044838578,
-              -0.051453117,
-              -0.045911513,
-              0.007451434,
-              0.0054590874,
-              0.039563954,
-              -0.05625489,
-              -0.0022330268,
-              0.047820278,
-              -0.039598763,
-              0.027334856,
-              0.039694488,
-              -0.07971524,
-              0.03508072,
-              0.029276432,
-              0.010155507,
-              -0.039020576,
-              -0.027874392,
-              -0.040846046,
-              0.046112783,
-              -0.069308,
-              0.061977327,
-              0.039240442,
-              0.025863856,
-              0.0064374707,
-              0.053631745,
-              0.06962397,
-              -0.008001055,
-              -0.03827026,
-              -0.10952415,
-              0.018512232,
-              -1.3332562e-08,
-              -0.025684418,
-              -0.07470214,
-              -0.019860886,
-              0.0385072,
-              0.027302178,
-              -0.010903615,
-              -0.03522558,
-              0.036009304,
-              -0.06320341,
-              0.011506822,
-              0.03339635,
-              -0.012044345,
-              0.004013396,
-              0.016582591,
-              -0.007978201,
-              -0.041656163,
-              -0.07090684,
-              0.008757652,
-              0.004474724,
-              -0.038768765,
-              -0.05130229,
-              0.017759493,
-              -0.018255858,
-              0.043951545,
-              -0.04284978,
-              0.08247418,
-              0.015467272,
-              0.022083104,
-              0.044421837,
-              0.022857197,
-              0.08298176,
-              -0.012647776,
-              0.013097686,
-              -0.06692538,
-              0.047861587,
-              -0.04503364,
-              0.006510086,
-              0.0056154854,
-              -0.019552445,
-              -0.017313117,
-              -0.038419757,
-              -0.00048296133,
-              -0.008638455,
-              -0.026783587,
-              -0.06596831,
-              -0.14337558,
-              0.041494913,
-              -0.04859091,
-              0.012739855,
-              -0.085007615,
-              -0.010923813,
-              -0.03816371,
-              0.03006815,
-              -0.03887654,
-              -0.036665756,
-              0.046499304,
-              0.036260363,
-              0.052359663,
-              -0.09627654,
-              -0.041531097,
-              0.05020932,
-              -7.9168685e-06,
-              0.0019163007,
-              0.0195528
+              0.06829306,
+              0.061738,
+              -0.0064223274,
+              0.08267553,
+              -0.07827752,
+              0.026546001,
+              0.13129343,
+              0.041391023,
+              -0.01950488,
+              -0.027131394,
+              0.08875853,
+              -0.10276945,
+              0.05070562,
+              -0.07138499,
+              -0.0092889285,
+              -0.039247777,
+              0.028884362,
+              -0.010484688,
+              -0.02469515,
+              -0.0354649,
+              -0.04093021,
+              -0.009903105,
+              -0.026185337,
+              0.057967436,
+              -0.00060980336,
+              0.007659294,
+              0.013928803,
+              -0.0016587646,
+              0.044655163,
+              -0.058990903,
+              -0.037958965,
+              0.037799176,
+              -0.033270117,
+              0.071682036,
+              0.09722083,
+              -0.08261939,
+              0.027622383,
+              -0.014190519,
+              0.01816939,
+              -0.002717151,
+              -0.02426505,
+              -0.11493204,
+              0.0851599,
+              -0.016752614,
+              -0.006310121,
+              0.065255314,
+              -0.058001935,
+              0.096675195,
+              -0.01419834,
+              -0.0068260576,
+              -0.09889976,
+              -0.015109596,
+              -0.07833432,
+              -0.035589334,
+              -0.008278154,
+              -0.013655421,
+              -0.07625151,
+              -0.030405698,
+              -0.013589333,
+              0.050117858,
+              -0.010591754,
+              -0.038398717,
+              0.067407176,
+              0.03565695,
+              0.010748793,
+              -0.0782303,
+              -0.006898065,
+              -0.03009224,
+              0.05595709,
+              -0.076849714,
+              -0.009063107,
+              -0.0028242348,
+              -0.02941444,
+              0.06881705,
+              0.013745148,
+              0.03078439,
+              -0.036471423,
+              -0.07147355,
+              0.054742936,
+              -0.028959772,
+              -0.06466119,
+              -0.05974295,
+              -0.06766193,
+              0.022777116,
+              0.079530336,
+              0.051767077,
+              0.14789894,
+              -0.0024908637,
+              -0.05542459,
+              -0.027760198,
+              0.019384151,
+              0.06692773,
+              -0.07952434,
+              0.019047031,
+              -0.00097613735,
+              0.013479467,
+              0.038207904,
+              -0.040212464,
+              0.06499357,
+              0.13929029,
+              0.0592868,
+              0.018087199,
+              -0.04910378,
+              -0.057469312,
+              -0.17034933,
+              0.009854021,
+              0.04478709,
+              -0.08707103,
+              0.046889827,
+              -0.020303966,
+              -0.062274974,
+              0.030287566,
+              0.04991786,
+              -0.030625034,
+              -0.007196787,
+              -0.060630832,
+              -0.0057445914,
+              0.028697284,
+              -0.055902485,
+              -0.0060850815,
+              0.075516894,
+              0.07304865,
+              -0.03200336,
+              -0.027994294,
+              -0.0013179975,
+              0.02373418,
+              0.082337655,
+              -2.0787389e-33,
+              0.014712573,
+              -0.084956154,
+              0.059368864,
+              -0.00785449,
+              -0.015981624,
+              0.02598549,
+              0.037614744,
+              0.12561654,
+              -0.04002324,
+              0.02472032,
+              0.014450717,
+              -0.06304021,
+              0.034111217,
+              -0.00766782,
+              0.008186535,
+              0.10461876,
+              0.018852819,
+              -0.021535609,
+              -0.04381762,
+              0.05679568,
+              0.01621111,
+              -0.0734938,
+              0.020150887,
+              0.05246773,
+              0.015011716,
+              -0.06588331,
+              -0.03257114,
+              0.025002314,
+              0.018430108,
+              -0.00030111038,
+              -0.06266604,
+              -0.006196726,
+              -0.16044672,
+              0.028114004,
+              0.032982383,
+              0.037261836,
+              0.0540566,
+              -0.0079226745,
+              -0.008597091,
+              0.054075282,
+              -0.046998158,
+              -0.03870267,
+              0.08493371,
+              -0.005938313,
+              0.021924777,
+              -0.05206361,
+              -0.047436308,
+              -0.054906387,
+              0.03400277,
+              -0.028335828,
+              -0.032045983,
+              -0.0013805287,
+              -0.04042137,
+              -0.017744336,
+              0.052251115,
+              0.0038320236,
+              0.008692022,
+              0.03270182,
+              0.010805367,
+              0.11194987,
+              -0.019722551,
+              -0.04577441,
+              -0.002028829,
+              0.020897591,
+              -0.006168528,
+              -0.0017238662,
+              -0.006808375,
+              -0.08133367,
+              0.091827765,
+              0.048646383,
+              0.07771223,
+              -0.05870435,
+              0.006373254,
+              0.0036029797,
+              -0.071249805,
+              0.022061123,
+              0.019477166,
+              0.10132688,
+              0.006618212,
+              -0.044631813,
+              0.06139753,
+              -0.09197761,
+              -0.013284173,
+              0.014608393,
+              -0.01761416,
+              0.0073858253,
+              0.0062043094,
+              -0.048021033,
+              0.013127433,
+              -0.077592075,
+              0.014133566,
+              0.035386372,
+              -0.02616333,
+              0.0027075391,
+              0.08635036,
+              9.132231e-34,
+              -0.022040669,
+              0.05085595,
+              -0.027267562,
+              0.02862394,
+              0.0137278,
+              -0.07108621,
+              0.09040417,
+              -0.09064723,
+              -0.0656353,
+              0.06688156,
+              0.06701843,
+              -0.05015593,
+              0.01906404,
+              -0.04147956,
+              0.012601856,
+              0.06909683,
+              0.028203059,
+              -0.0709644,
+              -0.061153468,
+              0.031663477,
+              -0.09626921,
+              0.13134153,
+              -0.003593543,
+              -0.027185699,
+              -0.06297406,
+              -0.00092433795,
+              -0.008680087,
+              -0.031325806,
+              -0.018586429,
+              0.011512126,
+              0.071864344,
+              -0.071975954,
+              -0.005884031,
+              0.09355209,
+              0.046686243,
+              -0.031970512,
+              0.06956754,
+              -0.045880646,
+              0.010095539,
+              0.064092614,
+              0.07247815,
+              0.04723167,
+              0.048781574,
+              0.06763336,
+              0.0054456857,
+              0.035764687,
+              0.018254038,
+              -0.03819517,
+              0.050082564,
+              0.04140595,
+              -0.025459196,
+              0.021584416,
+              0.014274055,
+              -0.007126868,
+              -0.014268015,
+              -0.010105026,
+              -0.09164537,
+              0.009354007,
+              0.004333732,
+              -0.009582354,
+              -0.029860867,
+              0.17471065,
+              -0.0045884773,
+              0.05782756,
+              -0.044819925,
+              -0.051430847,
+              -0.045887176,
+              0.0074449414,
+              0.0054387357,
+              0.039599653,
+              -0.056232683,
+              -0.002221041,
+              0.047835752,
+              -0.039582185,
+              0.027316216,
+              0.039718047,
+              -0.07969795,
+              0.03511298,
+              0.029242206,
+              0.010144028,
+              -0.03904501,
+              -0.027879883,
+              -0.040858228,
+              0.04611512,
+              -0.06931006,
+              0.061977647,
+              0.03922111,
+              0.025860278,
+              0.0064425017,
+              0.053613506,
+              0.069628745,
+              -0.007990142,
+              -0.038263973,
+              -0.10954397,
+              0.018542184,
+              -1.33346125e-08,
+              -0.025668526,
+              -0.07473254,
+              -0.019855365,
+              0.0384919,
+              0.027314084,
+              -0.010875396,
+              -0.035207637,
+              0.036075134,
+              -0.063237526,
+              0.011492366,
+              0.03342596,
+              -0.012063488,
+              0.0039839908,
+              0.016522188,
+              -0.008002217,
+              -0.04168924,
+              -0.07092195,
+              0.008746656,
+              0.004452133,
+              -0.03877822,
+              -0.051253635,
+              0.01774984,
+              -0.018253444,
+              0.04394154,
+              -0.042883426,
+              0.08245372,
+              0.015452854,
+              0.022076968,
+              0.04442366,
+              0.022832815,
+              0.08296971,
+              -0.01261236,
+              0.013092747,
+              -0.06689178,
+              0.0478462,
+              -0.04507667,
+              0.006519156,
+              0.0055980994,
+              -0.019575223,
+              -0.01730519,
+              -0.03837497,
+              -0.00043787624,
+              -0.008650636,
+              -0.026787039,
+              -0.06598753,
+              -0.14336495,
+              0.041543495,
+              -0.048590284,
+              0.012749011,
+              -0.08499328,
+              -0.010950221,
+              -0.038154602,
+              0.030090204,
+              -0.03886871,
+              -0.03670644,
+              0.046492297,
+              0.03623469,
+              0.052362714,
+              -0.09623828,
+              -0.04149126,
+              0.050219554,
+              -2.084757e-05,
+              0.0019338154,
+              0.019553935
             ],
             "index": 0,
             "object": "embedding"
diff --git a/tests/integration/recordings/responses/7b4815aba6c5.json b/tests/integration/recordings/responses/7b4815aba6c5.json
index 2843b8a9c..f1e8e7165 100644
--- a/tests/integration/recordings/responses/7b4815aba6c5.json
+++ b/tests/integration/recordings/responses/7b4815aba6c5.json
@@ -22,7 +22,7 @@
         "__type__": "ollama._types.GenerateResponse",
         "__data__": {
           "model": "llama3.2:3b-instruct-fp16",
-          "created_at": "2025-08-01T23:13:59.222059Z",
+          "created_at": "2025-09-03T17:37:48.840898Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -40,7 +40,7 @@
         "__type__": "ollama._types.GenerateResponse",
         "__data__": {
           "model": "llama3.2:3b-instruct-fp16",
-          "created_at": "2025-08-01T23:13:59.273466Z",
+          "created_at": "2025-09-03T17:37:48.883619Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -58,7 +58,7 @@
         "__type__": "ollama._types.GenerateResponse",
         "__data__": {
           "model": "llama3.2:3b-instruct-fp16",
-          "created_at": "2025-08-01T23:13:59.325562Z",
+          "created_at": "2025-09-03T17:37:48.92504Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -76,7 +76,7 @@
         "__type__": "ollama._types.GenerateResponse",
         "__data__": {
           "model": "llama3.2:3b-instruct-fp16",
-          "created_at": "2025-08-01T23:13:59.379223Z",
+          "created_at": "2025-09-03T17:37:48.966274Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -94,7 +94,7 @@
         "__type__": "ollama._types.GenerateResponse",
         "__data__": {
           "model": "llama3.2:3b-instruct-fp16",
-          "created_at": "2025-08-01T23:13:59.436435Z",
+          "created_at": "2025-09-03T17:37:49.007525Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -112,7 +112,7 @@
         "__type__": "ollama._types.GenerateResponse",
         "__data__": {
           "model": "llama3.2:3b-instruct-fp16",
-          "created_at": "2025-08-01T23:13:59.48928Z",
+          "created_at": "2025-09-03T17:37:49.049125Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -130,7 +130,7 @@
         "__type__": "ollama._types.GenerateResponse",
         "__data__": {
           "model": "llama3.2:3b-instruct-fp16",
-          "created_at": "2025-08-01T23:13:59.547102Z",
+          "created_at": "2025-09-03T17:37:49.090893Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -148,7 +148,7 @@
         "__type__": "ollama._types.GenerateResponse",
         "__data__": {
           "model": "llama3.2:3b-instruct-fp16",
-          "created_at": "2025-08-01T23:13:59.60579Z",
+          "created_at": "2025-09-03T17:37:49.132101Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -166,7 +166,7 @@
         "__type__": "ollama._types.GenerateResponse",
         "__data__": {
           "model": "llama3.2:3b-instruct-fp16",
-          "created_at": "2025-08-01T23:13:59.660149Z",
+          "created_at": "2025-09-03T17:37:49.17401Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -184,7 +184,7 @@
         "__type__": "ollama._types.GenerateResponse",
         "__data__": {
           "model": "llama3.2:3b-instruct-fp16",
-          "created_at": "2025-08-01T23:13:59.719166Z",
+          "created_at": "2025-09-03T17:37:49.216115Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -202,7 +202,7 @@
         "__type__": "ollama._types.GenerateResponse",
         "__data__": {
           "model": "llama3.2:3b-instruct-fp16",
-          "created_at": "2025-08-01T23:13:59.773893Z",
+          "created_at": "2025-09-03T17:37:49.257109Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -220,7 +220,7 @@
         "__type__": "ollama._types.GenerateResponse",
         "__data__": {
           "model": "llama3.2:3b-instruct-fp16",
-          "created_at": "2025-08-01T23:13:59.827636Z",
+          "created_at": "2025-09-03T17:37:49.298731Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -238,7 +238,7 @@
         "__type__": "ollama._types.GenerateResponse",
         "__data__": {
           "model": "llama3.2:3b-instruct-fp16",
-          "created_at": "2025-08-01T23:13:59.905205Z",
+          "created_at": "2025-09-03T17:37:49.338833Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -256,7 +256,7 @@
         "__type__": "ollama._types.GenerateResponse",
         "__data__": {
           "model": "llama3.2:3b-instruct-fp16",
-          "created_at": "2025-08-01T23:13:59.959347Z",
+          "created_at": "2025-09-03T17:37:49.38053Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -274,7 +274,7 @@
         "__type__": "ollama._types.GenerateResponse",
         "__data__": {
           "model": "llama3.2:3b-instruct-fp16",
-          "created_at": "2025-08-01T23:14:00.037904Z",
+          "created_at": "2025-09-03T17:37:49.421378Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -292,7 +292,7 @@
         "__type__": "ollama._types.GenerateResponse",
         "__data__": {
           "model": "llama3.2:3b-instruct-fp16",
-          "created_at": "2025-08-01T23:14:00.093527Z",
+          "created_at": "2025-09-03T17:37:49.462646Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -310,7 +310,7 @@
         "__type__": "ollama._types.GenerateResponse",
         "__data__": {
           "model": "llama3.2:3b-instruct-fp16",
-          "created_at": "2025-08-01T23:14:00.151329Z",
+          "created_at": "2025-09-03T17:37:49.503814Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -328,7 +328,7 @@
         "__type__": "ollama._types.GenerateResponse",
         "__data__": {
           "model": "llama3.2:3b-instruct-fp16",
-          "created_at": "2025-08-01T23:14:00.209463Z",
+          "created_at": "2025-09-03T17:37:49.545397Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -346,15 +346,15 @@
         "__type__": "ollama._types.GenerateResponse",
         "__data__": {
           "model": "llama3.2:3b-instruct-fp16",
-          "created_at": "2025-08-01T23:14:00.268012Z",
+          "created_at": "2025-09-03T17:37:49.586834Z",
           "done": true,
           "done_reason": "stop",
-          "total_duration": 1981034959,
-          "load_duration": 53445084,
+          "total_duration": 1409239209,
+          "load_duration": 118889250,
           "prompt_eval_count": 368,
-          "prompt_eval_duration": 880000000,
+          "prompt_eval_duration": 543077166,
           "eval_count": 19,
-          "eval_duration": 1046000000,
+          "eval_duration": 746733584,
           "response": "",
           "thinking": null,
           "context": null
diff --git a/tests/integration/recordings/responses/7e6806cba34a.json b/tests/integration/recordings/responses/7e6806cba34a.json
index 7b1d5261e..e2e32da73 100644
--- a/tests/integration/recordings/responses/7e6806cba34a.json
+++ b/tests/integration/recordings/responses/7e6806cba34a.json
@@ -21,7 +21,7 @@
         "__type__": "ollama._types.GenerateResponse",
         "__data__": {
           "model": "llama3.2:3b-instruct-fp16",
-          "created_at": "2025-07-31T17:59:14.382398152Z",
+          "created_at": "2025-09-03T17:41:43.22891Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -39,7 +39,7 @@
         "__type__": "ollama._types.GenerateResponse",
         "__data__": {
           "model": "llama3.2:3b-instruct-fp16",
-          "created_at": "2025-07-31T17:59:14.561084788Z",
+          "created_at": "2025-09-03T17:41:43.268911Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -57,7 +57,7 @@
         "__type__": "ollama._types.GenerateResponse",
         "__data__": {
           "model": "llama3.2:3b-instruct-fp16",
-          "created_at": "2025-07-31T17:59:14.743154167Z",
+          "created_at": "2025-09-03T17:41:43.310121Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -75,7 +75,7 @@
         "__type__": "ollama._types.GenerateResponse",
         "__data__": {
           "model": "llama3.2:3b-instruct-fp16",
-          "created_at": "2025-07-31T17:59:14.920818124Z",
+          "created_at": "2025-09-03T17:41:43.35053Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -93,7 +93,7 @@
         "__type__": "ollama._types.GenerateResponse",
         "__data__": {
           "model": "llama3.2:3b-instruct-fp16",
-          "created_at": "2025-07-31T17:59:15.099067906Z",
+          "created_at": "2025-09-03T17:41:43.391033Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -111,7 +111,7 @@
         "__type__": "ollama._types.GenerateResponse",
         "__data__": {
           "model": "llama3.2:3b-instruct-fp16",
-          "created_at": "2025-07-31T17:59:15.274401879Z",
+          "created_at": "2025-09-03T17:41:43.431414Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -129,7 +129,7 @@
         "__type__": "ollama._types.GenerateResponse",
         "__data__": {
           "model": "llama3.2:3b-instruct-fp16",
-          "created_at": "2025-07-31T17:59:15.449669669Z",
+          "created_at": "2025-09-03T17:41:43.471553Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -147,7 +147,7 @@
         "__type__": "ollama._types.GenerateResponse",
         "__data__": {
           "model": "llama3.2:3b-instruct-fp16",
-          "created_at": "2025-07-31T17:59:15.626501213Z",
+          "created_at": "2025-09-03T17:41:43.512029Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -165,7 +165,7 @@
         "__type__": "ollama._types.GenerateResponse",
         "__data__": {
           "model": "llama3.2:3b-instruct-fp16",
-          "created_at": "2025-07-31T17:59:15.802614623Z",
+          "created_at": "2025-09-03T17:41:43.55268Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -183,7 +183,7 @@
         "__type__": "ollama._types.GenerateResponse",
         "__data__": {
           "model": "llama3.2:3b-instruct-fp16",
-          "created_at": "2025-07-31T17:59:15.978698104Z",
+          "created_at": "2025-09-03T17:41:43.594309Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -201,7 +201,7 @@
         "__type__": "ollama._types.GenerateResponse",
         "__data__": {
           "model": "llama3.2:3b-instruct-fp16",
-          "created_at": "2025-07-31T17:59:16.160654179Z",
+          "created_at": "2025-09-03T17:41:43.635445Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -219,7 +219,7 @@
         "__type__": "ollama._types.GenerateResponse",
         "__data__": {
           "model": "llama3.2:3b-instruct-fp16",
-          "created_at": "2025-07-31T17:59:16.338412914Z",
+          "created_at": "2025-09-03T17:41:43.676541Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -237,15 +237,15 @@
         "__type__": "ollama._types.GenerateResponse",
         "__data__": {
           "model": "llama3.2:3b-instruct-fp16",
-          "created_at": "2025-07-31T17:59:16.521646436Z",
+          "created_at": "2025-09-03T17:41:43.717809Z",
           "done": true,
           "done_reason": "stop",
-          "total_duration": 4555044563,
-          "load_duration": 43101307,
+          "total_duration": 820540625,
+          "load_duration": 111045959,
           "prompt_eval_count": 29,
-          "prompt_eval_duration": 2371036213,
+          "prompt_eval_duration": 219693291,
           "eval_count": 13,
-          "eval_duration": 2140342701,
+          "eval_duration": 489282542,
           "response": "",
           "thinking": null,
           "context": null
diff --git a/tests/integration/recordings/responses/802f60021837.json b/tests/integration/recordings/responses/802f60021837.json
index 7ba0466c4..a17aa4af3 100644
--- a/tests/integration/recordings/responses/802f60021837.json
+++ b/tests/integration/recordings/responses/802f60021837.json
@@ -20,390 +20,390 @@
         "data": [
           {
             "embedding": [
-              -0.0623061,
-              0.043155346,
-              -0.056864023,
-              0.03486763,
-              -0.045145836,
-              -0.13253546,
-              0.021805322,
-              0.039048277,
-              -0.04841761,
-              -0.031872153,
-              -0.039334167,
-              0.0063758655,
-              0.07872078,
-              -0.0042740484,
-              0.023612525,
-              -0.02170506,
-              -0.055740308,
-              -0.0094528515,
-              0.039697133,
-              -0.11445638,
-              -0.011568856,
-              0.06161228,
-              -0.02625024,
-              0.024374798,
-              0.029430348,
-              -0.0035586308,
-              -0.0014398397,
-              -0.00313635,
-              0.013770647,
-              -0.0002185752,
-              -0.014788754,
-              0.084392585,
-              0.06679723,
-              0.042302314,
-              0.007701145,
-              0.073157564,
-              -0.008342027,
-              -0.09463514,
-              -0.09247907,
-              0.00763349,
-              -0.07390047,
-              0.015466744,
-              -0.04406345,
-              -0.044970937,
-              -0.041317657,
-              0.06967893,
-              -0.02747757,
-              0.014388817,
-              -0.036104802,
-              -0.006673772,
-              -0.08029175,
-              -6.000176e-05,
-              -0.038977537,
-              -0.049003445,
-              0.017844146,
-              -0.0064918958,
-              0.059797343,
-              -0.003170151,
-              -0.024797099,
-              -0.11498058,
-              -0.047404848,
-              0.0185016,
-              -0.009826349,
-              0.09572491,
-              -0.009429792,
-              -0.03576324,
-              -0.031269584,
-              -0.0032131649,
-              0.07714364,
-              -0.07617566,
-              -0.118788,
-              -0.06321078,
-              -0.0046245204,
-              0.06524506,
-              0.04577385,
-              -0.13796814,
-              0.04598187,
-              -0.03355735,
-              -0.013584839,
-              0.0045000566,
-              0.017061453,
-              -0.0016859988,
-              -0.051290352,
-              0.102515854,
-              0.015375054,
-              -0.053396687,
-              0.046739385,
-              0.11428208,
-              -0.0060018655,
-              0.010324239,
-              -0.031606395,
-              -0.051939677,
-              0.020962074,
-              0.008873621,
-              -0.06903091,
-              0.08133413,
-              0.012089255,
-              -0.06411361,
-              -0.03635769,
-              0.046689924,
-              0.011246541,
-              -0.05031814,
-              0.073784724,
-              -0.021187203,
-              0.03246321,
-              -0.026193537,
-              0.06816752,
-              -0.03795416,
-              0.030822705,
-              -0.0371306,
-              -0.03693002,
-              -0.029442247,
-              -0.032879222,
-              -0.005807539,
-              0.04255175,
-              0.054692194,
-              -0.0192783,
-              0.12276652,
-              0.0037922377,
-              0.0320851,
-              0.023700258,
-              0.019210111,
-              0.019973421,
-              -0.012249867,
-              -0.03246148,
-              -0.0044806604,
-              -0.035679862,
-              -6.954278e-33,
-              -0.0220099,
-              -0.06862265,
-              -0.03537707,
-              0.008910154,
-              0.071089186,
-              -0.025226729,
-              0.091465496,
-              -0.009329111,
-              -0.05951072,
-              -0.034704443,
-              0.04334736,
-              0.03334519,
-              0.024234882,
-              0.08795047,
-              0.020609507,
-              -0.0008948477,
-              -0.013011299,
-              0.08836162,
-              0.045687113,
-              0.025813619,
-              0.0542986,
-              0.09676311,
-              0.023140479,
-              0.024307383,
-              0.014198938,
-              -0.018661225,
-              -0.024505567,
-              -0.03258764,
-              0.025222383,
-              0.016810626,
-              -0.07629099,
-              0.012676406,
-              -0.021304907,
-              0.006898141,
-              0.030808464,
-              -0.000315505,
-              0.0005437531,
-              -0.08589918,
-              0.04053157,
-              0.006305948,
-              -0.010008999,
-              0.0015841384,
-              0.012631508,
-              -0.036505677,
-              -0.023090534,
-              0.012400456,
-              -0.00514819,
-              0.020243159,
-              -0.08760989,
-              0.045204975,
-              -0.0012632157,
-              -0.06573619,
-              0.07478642,
-              0.08402555,
-              -0.013935989,
-              0.05592361,
-              0.019318154,
-              -0.019661061,
-              -0.016006675,
-              -0.02916137,
-              0.0373911,
-              0.06808347,
-              0.06916834,
-              -0.0076644514,
-              0.02114384,
-              0.04043145,
-              0.03511955,
-              0.08206532,
-              0.08808922,
-              0.050526854,
-              -0.059352025,
-              0.04576268,
-              -0.025140414,
-              0.03584363,
-              -0.02806783,
-              0.019853832,
-              0.033893492,
-              -0.07974513,
-              0.023001093,
-              0.062465888,
-              -0.034909748,
-              -0.05390039,
-              -0.016120961,
-              -0.0057214363,
-              -0.030499708,
-              -0.02269443,
-              -0.010363369,
-              0.067623645,
-              -0.010582917,
-              -0.09608072,
-              -0.07854503,
-              -0.085294046,
-              0.029974943,
-              -0.005945623,
-              -0.039578382,
-              2.9788035e-33,
-              0.0114961,
-              0.010420429,
-              -0.06988839,
-              0.019277215,
-              -0.08453786,
-              -0.085693836,
-              0.06625677,
-              0.063027605,
-              0.050445113,
-              0.033733714,
-              -0.0058911345,
-              -0.06960736,
-              0.12548403,
-              0.021376437,
-              0.07414455,
-              0.034223642,
-              -0.045840543,
-              0.014842206,
-              -0.0126910545,
-              0.003648386,
-              -0.08023818,
-              0.06729063,
-              -0.056022517,
-              -0.08669063,
-              -0.027885731,
-              -0.033907417,
-              -0.038715098,
-              -0.07791038,
-              -0.017792802,
-              0.061793778,
-              0.014706543,
-              0.020005805,
-              -0.08145671,
-              0.05236086,
-              0.06286303,
-              -0.0015804858,
-              0.040509794,
-              -0.027593212,
-              -0.009631841,
-              -0.017296297,
-              0.11391202,
-              0.04420345,
-              0.03534961,
-              0.12113969,
-              0.018799841,
-              0.049258087,
-              -0.036080077,
-              0.07791577,
-              -0.029658308,
-              -0.070674755,
-              -0.0067282193,
-              0.006079021,
-              0.04225839,
-              -0.039644253,
-              -0.04860991,
-              -0.039792407,
-              0.032389786,
-              0.033703297,
-              -0.0924961,
-              -0.04988354,
-              -0.06596082,
-              -0.04236528,
-              0.03126068,
-              0.011825378,
-              -0.044250805,
-              0.046862055,
-              -0.123014495,
-              -0.034661833,
-              -0.01387497,
-              -0.13120808,
-              0.14482524,
-              0.0056040953,
-              -0.0031055296,
-              0.022885982,
-              -0.07644984,
-              0.016439024,
-              -0.019532247,
-              -0.024956707,
-              -0.0685838,
-              0.07072798,
-              0.026639467,
-              -0.0351677,
-              -0.0015660838,
-              0.02932653,
-              -0.089445055,
-              -0.022545021,
-              -0.03112053,
-              0.053812344,
-              0.007873327,
-              0.023094172,
-              -0.0043896562,
-              0.05380028,
-              0.017278776,
-              0.056359384,
-              -0.05330339,
-              -1.3478282e-08,
-              -0.039658625,
-              0.013374887,
-              0.03682183,
-              0.009698332,
-              0.0046835328,
-              0.06660773,
-              0.022911774,
-              -0.047426622,
-              -0.040507935,
-              0.006813708,
-              0.0086692255,
-              -0.0063030533,
-              -0.04566467,
-              -0.06387448,
-              -0.013173488,
-              0.11698006,
-              0.016895978,
-              -0.0013877428,
-              0.02321246,
-              0.022267532,
-              0.078508325,
-              -0.045089863,
-              -0.009183129,
-              0.066403426,
-              -0.06653049,
-              -0.0154824555,
-              0.054102156,
-              0.07644729,
-              0.008254354,
-              -0.124090366,
-              0.012699053,
-              -0.017593145,
-              -0.020621033,
-              0.032500766,
-              -0.012999753,
-              0.022328354,
-              0.010528125,
-              -0.08832318,
-              0.02148152,
-              -0.0029870127,
-              -0.03183275,
-              0.07181985,
-              0.01038717,
-              0.0036043858,
-              0.048932884,
-              0.07041019,
-              -0.036562778,
-              -0.03517641,
-              -0.03654687,
-              -0.07017274,
-              -0.03033558,
-              0.02860758,
-              -0.019075464,
-              -0.002551204,
-              0.02127327,
-              0.074368805,
-              -0.11424493,
-              -0.027312418,
-              -0.010811127,
-              0.010405173,
-              -0.02275616,
-              0.11514236,
-              0.18532485,
-              -0.026541265
+              -0.062304743,
+              0.04315718,
+              -0.056847535,
+              0.03486019,
+              -0.045148205,
+              -0.1325256,
+              0.021795923,
+              0.039035086,
+              -0.048403695,
+              -0.03187157,
+              -0.03934502,
+              0.006355416,
+              0.07870429,
+              -0.004275144,
+              0.023635335,
+              -0.02171452,
+              -0.055756103,
+              -0.009452624,
+              0.03968397,
+              -0.11446917,
+              -0.011574315,
+              0.06161675,
+              -0.026243819,
+              0.024376081,
+              0.029439807,
+              -0.0035745306,
+              -0.0014413354,
+              -0.0031348146,
+              0.0137771955,
+              -0.00021878166,
+              -0.0148119675,
+              0.08438267,
+              0.06679146,
+              0.042289164,
+              0.0077238376,
+              0.073178865,
+              -0.008341517,
+              -0.094652176,
+              -0.09245101,
+              0.0075944075,
+              -0.07389992,
+              0.015481098,
+              -0.04405396,
+              -0.04497366,
+              -0.041315924,
+              0.06968346,
+              -0.027464444,
+              0.014380017,
+              -0.036109854,
+              -0.006690219,
+              -0.080297194,
+              -5.8296577e-05,
+              -0.03897778,
+              -0.049029846,
+              0.017797105,
+              -0.0064906515,
+              0.05977029,
+              -0.0031445406,
+              -0.024804324,
+              -0.114971094,
+              -0.047434244,
+              0.018489277,
+              -0.009801151,
+              0.09573786,
+              -0.009445709,
+              -0.035714474,
+              -0.031265706,
+              -0.0032087746,
+              0.07714283,
+              -0.076175354,
+              -0.11878057,
+              -0.06322687,
+              -0.0045974515,
+              0.06524851,
+              0.045755487,
+              -0.13797933,
+              0.045973603,
+              -0.03356543,
+              -0.013575197,
+              0.004536992,
+              0.01706251,
+              -0.0016689816,
+              -0.051292486,
+              0.10251468,
+              0.015364908,
+              -0.05339754,
+              0.046751976,
+              0.11428272,
+              -0.0060051866,
+              0.010296865,
+              -0.03160346,
+              -0.051935352,
+              0.02092994,
+              0.008887596,
+              -0.069010794,
+              0.08132733,
+              0.012102074,
+              -0.06409327,
+              -0.036342084,
+              0.046690084,
+              0.011248327,
+              -0.050334014,
+              0.073782355,
+              -0.02119414,
+              0.0324611,
+              -0.026148362,
+              0.06814877,
+              -0.03795885,
+              0.030811384,
+              -0.037118603,
+              -0.036956605,
+              -0.02943471,
+              -0.0328876,
+              -0.00579801,
+              0.04255975,
+              0.05469473,
+              -0.01927437,
+              0.12277417,
+              0.0037985598,
+              0.032079652,
+              0.023717156,
+              0.019211154,
+              0.019987307,
+              -0.012261412,
+              -0.032464176,
+              -0.004472998,
+              -0.03568547,
+              -6.953471e-33,
+              -0.02200053,
+              -0.06861985,
+              -0.035355665,
+              0.008892092,
+              0.07110619,
+              -0.02524488,
+              0.091491714,
+              -0.009333656,
+              -0.059515916,
+              -0.03471947,
+              0.04331791,
+              0.033350475,
+              0.02423151,
+              0.08795865,
+              0.020580785,
+              -0.00087637454,
+              -0.012995603,
+              0.088356934,
+              0.04568453,
+              0.025818799,
+              0.054319557,
+              0.09676607,
+              0.02314351,
+              0.024316499,
+              0.014192086,
+              -0.01867069,
+              -0.024500258,
+              -0.032566376,
+              0.025218401,
+              0.016804473,
+              -0.07628905,
+              0.012665322,
+              -0.021314982,
+              0.006895667,
+              0.030793479,
+              -0.00033363912,
+              0.0005291749,
+              -0.08589274,
+              0.040542576,
+              0.0062958263,
+              -0.009977536,
+              0.0016065374,
+              0.012649728,
+              -0.036491103,
+              -0.023085777,
+              0.012404348,
+              -0.0051287347,
+              0.020217113,
+              -0.08761001,
+              0.0451902,
+              -0.0012827619,
+              -0.06574815,
+              0.07477121,
+              0.08403992,
+              -0.01390955,
+              0.05589554,
+              0.019330526,
+              -0.019641383,
+              -0.016001293,
+              -0.02915193,
+              0.037374426,
+              0.068089314,
+              0.069200926,
+              -0.007668733,
+              0.021160824,
+              0.040417258,
+              0.035068225,
+              0.082075246,
+              0.08809441,
+              0.05050193,
+              -0.059343174,
+              0.04576526,
+              -0.025118835,
+              0.03583576,
+              -0.028081506,
+              0.019838363,
+              0.033905286,
+              -0.07977674,
+              0.023003135,
+              0.062460173,
+              -0.034886148,
+              -0.05390937,
+              -0.016114287,
+              -0.0057315156,
+              -0.03051132,
+              -0.02269694,
+              -0.010376983,
+              0.06762264,
+              -0.010560655,
+              -0.09605588,
+              -0.07854035,
+              -0.08528194,
+              0.029969428,
+              -0.0059528793,
+              -0.039581347,
+              2.9781768e-33,
+              0.011482255,
+              0.010417832,
+              -0.0698601,
+              0.019292813,
+              -0.08453582,
+              -0.08570265,
+              0.06624837,
+              0.063025005,
+              0.050434116,
+              0.033736084,
+              -0.0058885855,
+              -0.069622226,
+              0.12551048,
+              0.021380005,
+              0.07413853,
+              0.0342258,
+              -0.045818888,
+              0.014834041,
+              -0.012672501,
+              0.0036430089,
+              -0.08024709,
+              0.06730083,
+              -0.056032285,
+              -0.086702436,
+              -0.027874194,
+              -0.03391202,
+              -0.03872441,
+              -0.07792124,
+              -0.017794719,
+              0.061800934,
+              0.014696384,
+              0.019996569,
+              -0.08146178,
+              0.052340467,
+              0.06287676,
+              -0.0015751559,
+              0.040512506,
+              -0.027605608,
+              -0.009630798,
+              -0.017303543,
+              0.11392578,
+              0.044186074,
+              0.035317622,
+              0.12113664,
+              0.018812222,
+              0.049269576,
+              -0.036081262,
+              0.07789768,
+              -0.0296637,
+              -0.07068735,
+              -0.006731622,
+              0.0060941395,
+              0.042274125,
+              -0.039680813,
+              -0.048600707,
+              -0.03980193,
+              0.032409266,
+              0.03371183,
+              -0.092499994,
+              -0.049876206,
+              -0.06597403,
+              -0.042388365,
+              0.031259395,
+              0.011791109,
+              -0.04424881,
+              0.04685171,
+              -0.12302249,
+              -0.034650978,
+              -0.01387166,
+              -0.13122807,
+              0.1448325,
+              0.0056148693,
+              -0.0031096544,
+              0.022904772,
+              -0.07642485,
+              0.016454488,
+              -0.019540928,
+              -0.024970472,
+              -0.068574235,
+              0.07073104,
+              0.026643677,
+              -0.035163663,
+              -0.0015607082,
+              0.029314166,
+              -0.08943546,
+              -0.022545528,
+              -0.031130569,
+              0.053781237,
+              0.007896568,
+              0.023091432,
+              -0.0043701245,
+              0.05380369,
+              0.01729408,
+              0.05636822,
+              -0.05328019,
+              -1.3478804e-08,
+              -0.039678477,
+              0.013365443,
+              0.036817312,
+              0.009736139,
+              0.004703614,
+              0.06661744,
+              0.02291141,
+              -0.047423527,
+              -0.04049001,
+              0.0068159057,
+              0.008662143,
+              -0.006292634,
+              -0.045681197,
+              -0.06387613,
+              -0.013174571,
+              0.11696965,
+              0.016895585,
+              -0.0013498863,
+              0.023227682,
+              0.022274282,
+              0.07852807,
+              -0.04508963,
+              -0.009177306,
+              0.06640095,
+              -0.06651727,
+              -0.015498115,
+              0.054094598,
+              0.07642527,
+              0.0082470365,
+              -0.12409585,
+              0.01265297,
+              -0.017635401,
+              -0.020622984,
+              0.03250185,
+              -0.012997484,
+              0.022324847,
+              0.010529934,
+              -0.0883164,
+              0.021471445,
+              -0.0029947716,
+              -0.03183814,
+              0.0718419,
+              0.010377949,
+              0.0035974192,
+              0.048932698,
+              0.07039089,
+              -0.03657371,
+              -0.035186097,
+              -0.03655875,
+              -0.07017832,
+              -0.030322824,
+              0.028595895,
+              -0.019070871,
+              -0.0025186248,
+              0.021279149,
+              0.07436103,
+              -0.114249244,
+              -0.027311146,
+              -0.0107884705,
+              0.010422842,
+              -0.022787437,
+              0.11515081,
+              0.18532182,
+              -0.026544156
             ],
             "index": 0,
             "object": "embedding"
diff --git a/tests/integration/recordings/responses/80e4404d8987.json b/tests/integration/recordings/responses/80e4404d8987.json
index 8cfe1836d..7eabfc363 100644
--- a/tests/integration/recordings/responses/80e4404d8987.json
+++ b/tests/integration/recordings/responses/80e4404d8987.json
@@ -22,7 +22,7 @@
         "__type__": "ollama._types.GenerateResponse",
         "__data__": {
           "model": "llama3.2:3b-instruct-fp16",
-          "created_at": "2025-08-01T23:13:56.463658Z",
+          "created_at": "2025-09-03T17:37:46.708948Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -40,7 +40,7 @@
         "__type__": "ollama._types.GenerateResponse",
         "__data__": {
           "model": "llama3.2:3b-instruct-fp16",
-          "created_at": "2025-08-01T23:13:56.51846Z",
+          "created_at": "2025-09-03T17:37:46.749031Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -58,7 +58,7 @@
         "__type__": "ollama._types.GenerateResponse",
         "__data__": {
           "model": "llama3.2:3b-instruct-fp16",
-          "created_at": "2025-08-01T23:13:56.569676Z",
+          "created_at": "2025-09-03T17:37:46.790192Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -76,7 +76,7 @@
         "__type__": "ollama._types.GenerateResponse",
         "__data__": {
           "model": "llama3.2:3b-instruct-fp16",
-          "created_at": "2025-08-01T23:13:56.621666Z",
+          "created_at": "2025-09-03T17:37:46.831093Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -94,7 +94,7 @@
         "__type__": "ollama._types.GenerateResponse",
         "__data__": {
           "model": "llama3.2:3b-instruct-fp16",
-          "created_at": "2025-08-01T23:13:56.675114Z",
+          "created_at": "2025-09-03T17:37:46.873135Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -112,7 +112,7 @@
         "__type__": "ollama._types.GenerateResponse",
         "__data__": {
           "model": "llama3.2:3b-instruct-fp16",
-          "created_at": "2025-08-01T23:13:56.727649Z",
+          "created_at": "2025-09-03T17:37:46.91375Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -130,7 +130,7 @@
         "__type__": "ollama._types.GenerateResponse",
         "__data__": {
           "model": "llama3.2:3b-instruct-fp16",
-          "created_at": "2025-08-01T23:13:56.780249Z",
+          "created_at": "2025-09-03T17:37:46.95439Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -148,7 +148,7 @@
         "__type__": "ollama._types.GenerateResponse",
         "__data__": {
           "model": "llama3.2:3b-instruct-fp16",
-          "created_at": "2025-08-01T23:13:56.834148Z",
+          "created_at": "2025-09-03T17:37:46.995224Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -166,7 +166,7 @@
         "__type__": "ollama._types.GenerateResponse",
         "__data__": {
           "model": "llama3.2:3b-instruct-fp16",
-          "created_at": "2025-08-01T23:13:56.885509Z",
+          "created_at": "2025-09-03T17:37:47.035887Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -184,15 +184,15 @@
         "__type__": "ollama._types.GenerateResponse",
         "__data__": {
           "model": "llama3.2:3b-instruct-fp16",
-          "created_at": "2025-08-01T23:13:56.936635Z",
+          "created_at": "2025-09-03T17:37:47.076806Z",
           "done": true,
           "done_reason": "stop",
-          "total_duration": 1572591291,
-          "load_duration": 77121041,
+          "total_duration": 2069654958,
+          "load_duration": 177579833,
           "prompt_eval_count": 31,
-          "prompt_eval_duration": 1019000000,
+          "prompt_eval_duration": 1521851250,
           "eval_count": 10,
-          "eval_duration": 474000000,
+          "eval_duration": 369478042,
           "response": "",
           "thinking": null,
           "context": null
diff --git a/tests/integration/recordings/responses/8295382a8e7c.json b/tests/integration/recordings/responses/8295382a8e7c.json
index 6e1dc793d..6a38dde20 100644
--- a/tests/integration/recordings/responses/8295382a8e7c.json
+++ b/tests/integration/recordings/responses/8295382a8e7c.json
@@ -1,7 +1,7 @@
 {
   "request": {
     "method": "POST",
-    "url": "http://localhost:11434/v1/v1/chat/completions",
+    "url": "http://0.0.0.0:11434/v1/v1/chat/completions",
     "headers": {},
     "body": {
       "model": "llama3.2:3b-instruct-fp16",
@@ -20,14 +20,14 @@
     "body": {
       "__type__": "openai.types.chat.chat_completion.ChatCompletion",
       "__data__": {
-        "id": "chatcmpl-99",
+        "id": "chatcmpl-713",
         "choices": [
           {
             "finish_reason": "stop",
             "index": 0,
             "logprobs": null,
             "message": {
-              "content": "I'd be happy to help you test the OpenAI 2 architecture!\n\nOpenAI 2 is a neural network model developed by OpenAI, and it's not exactly possible for me to directly \"test\" it. However, I can guide you through a simplified example of how to verify if OpenAI 2 has been implemented correctly in a specific codebase.\n\nHere's an outline of the steps:\n\n1. **Understand the basics**: Before we dive into testing, make sure you understand the architectural and functional details of OpenAI 2.\n2. **Get access to the model**: You'll need to obtain a trained OpenAI 2 model or implement it from scratch using a language like PyTorch or TensorFlow.\n3. **Implement a validation framework**: Create a simple validation framework that uses common tasks, such as classification on the GLUE benchmark, to evaluate the performance of your OpenAI 2 model.\n\nHere's a simplified code example in PyTorch:\n```python\nimport torch\nfrom transformers import AutoModelForSequenceClassification, AutoTokenizer\n\n# Load pre-trained OpenAI 2 Model(s)\nmodel_name = \"github/openai/OpenAIAccelerated-Text-To-Speech\"\nmodel_class = AutoModelForSequenceClassification\ntokenizer = AutoTokenizer.from_pretrained(model_name)\n\n# Initialize the model and tokenizer\nmodel = model_class(pretrained=True, num_labels=8)  # adjust label number according to your task\ntokenizer = tokenizer\n\ndef evaluate_model():\n    batch_size = 100\n    device = torch.device(\"cuda\" if torch.cuda.is_available() else \"cpu\")\n\n    # Create a validation dataset from the GLUE benchmark\n    glue_datasets = [ datasets[\"glue\"][\"sst2\"], datasets[\"glue\"][\"mnli\"] ]\n    val_dataset = []\n    for i, gds in enumerate(glue_datasets):\n        data = gds[:10000]  # take only first few examples to speed up evaluation\n        input_ids = tokenizer encodings(data[\"sentence1\"], \n                                        attention_mask=data[\"attention_mask\"],\n                                        max_length=512,\n                                        padding=\"max_length\",\n                                        truncation=True,\n                                        return_tensors=\"pt\")\n\n        for example in data:\n            for sentence in [example['sentence1'], example['sentence2']]:\n                input_ids = input_ids.to(device)\n                outputs = model(input_ids, labels=None)  # adjust label to empty\n              \n\n    # Compute evaluation metrics\n    predictions = []\n    labels = []\n    accuracy = torch.zeros(8).to(device)\n\n    for sentence in data.values():\n        sentenceids = [input_ids[\"input_ids\"].flatten()]\n        _, pred_labels = model(sentenceids)\n        if len(predictions) == 0:\n            labels.extend([1, 2])\n        else:\n            assert len(labels)==len(sentences), 'error'\n            labels.append(preds[-1]) \n\n        # Append the prediction to the list\n        predictions.append(pred)\n\n    return accuracy\n\naccuracy = evaluate_model()\nprint(\"Accuracy:\", accuracy)\n```\n\nAfter running this code, you should get an estimate of the model's performance on the GLUE benchmark. Keep in mind that this is a simplified example and real-world openai 2 testing may require more involved validation processes.\n\nI hope this helps! Let me know if you have any further questions or if there are any specific areas where you'd like more information.",
+              "content": "I'd be happy to help you test the Transformer-XL (denoted as \"Test Trace OpenAI 2\") model, but first I need to clarify a few things:\n\n1. **Transformer-XL** is not an official name from OpenAI. It's actually a variant of the Transformer model proposed in the paper \"Long-Short Term Memory Are General: A Study on The Curvature of Time\" (2017) by Jinyu Chen, et al.\n2. **Trace OpenAI 2** sounds like a specific version or configuration of the Transformer-XL model, possibly developed by OpenAI.\n\nGiven these clarifications, I'll provide you with a general idea of how to test the Transformer-XL (or \"Test Trace OpenAI 2\") model using popular frameworks and libraries. Please note that this is not an exhaustive or definitive guide.\n\nTo test the Transformer-XL model, you can follow these steps:\n\n1. **Install the necessary dependencies**: You'll need a deep learning framework like TensorFlow or PyTorch, as well as a library for natural language processing (NLP) like Hugging Face's transformers.\n2. **Load the pre-trained weights**: You can use a pre-trained model checkpoint from Hugging Face's Transformers library or load your own weights trained on a specific task or dataset.\n3. **Prepare your data**: Load your text data into tokens, such as words or characters, and preprocess it according to the specific requirements of the Transformer-XL architecture (e.g., tokenization, padding, etc.).\n4. **Configure the model**: Adjust the hyperparameters to suit your specific test case, including the model's configuration, batch size, learning rate, etc.\n5. **Run the inference**: Use the loaded pre-trained weights to perform inference on your test data.\n\nHere's some sample Python code using PyTorch and Hugging Face's Transformers library to get you started:\n```python\nimport torch\nfrom transformers import LongformerForSequenceClassification, LongformerTokenizer\n\n# Load pre-trained weights\nmodel = LongformerForSequenceClassification.from_pretrained('test-trace-openai-2')\n\n# Prepare data\ntokenizer = model.tokenizer\ntext = \"This is a test sentence\"\ninputs = tokenizer(text, return_tensors='pt')\noutput = model(inputs['input_ids'], attention_mask=inputs['attention_mask'])\n\n# Print the results\nprint(output.logits)\n```\nPlease note that this code snippet is just an example and may not work as-is. You'll need to adapt it to your specific requirements and test data.\n\nKeep in mind that testing a model's performance on a specific task or dataset requires careful consideration of factors like:\n\n* **Test data quality**: Your test data should accurately represent the underlying distribution of your target dataset.\n* **Model evaluation metrics**: Choose relevant evaluation metrics that measure the model's performance on your specific task, such as accuracy, precision, recall, F1-score, etc.\n\nFeel free to ask if you have any further questions or need more guidance!",
               "refusal": null,
               "role": "assistant",
               "annotations": null,
@@ -37,15 +37,15 @@
             }
           }
         ],
-        "created": 1754510064,
+        "created": 1756921250,
         "model": "llama3.2:3b-instruct-fp16",
         "object": "chat.completion",
         "service_tier": null,
         "system_fingerprint": "fp_ollama",
         "usage": {
-          "completion_tokens": 694,
+          "completion_tokens": 614,
           "prompt_tokens": 31,
-          "total_tokens": 725,
+          "total_tokens": 645,
           "completion_tokens_details": null,
           "prompt_tokens_details": null
         }
diff --git a/tests/integration/recordings/responses/836f51dfb3c5.json b/tests/integration/recordings/responses/836f51dfb3c5.json
index 833545737..85f3aff00 100644
--- a/tests/integration/recordings/responses/836f51dfb3c5.json
+++ b/tests/integration/recordings/responses/836f51dfb3c5.json
@@ -20,15 +20,15 @@
       "__type__": "ollama._types.GenerateResponse",
       "__data__": {
         "model": "llama-guard3:1b",
-        "created_at": "2025-08-01T23:14:03.770002Z",
+        "created_at": "2025-09-03T17:37:51.562847Z",
         "done": true,
         "done_reason": "stop",
-        "total_duration": 395965875,
-        "load_duration": 178888708,
+        "total_duration": 272296250,
+        "load_duration": 131747125,
         "prompt_eval_count": 214,
-        "prompt_eval_duration": 170000000,
+        "prompt_eval_duration": 124006709,
         "eval_count": 2,
-        "eval_duration": 44000000,
+        "eval_duration": 15572291,
         "response": "safe",
         "thinking": null,
         "context": null
diff --git a/tests/integration/recordings/responses/840fbb380b73.json b/tests/integration/recordings/responses/840fbb380b73.json
index a3fb7ccd8..4367d8788 100644
--- a/tests/integration/recordings/responses/840fbb380b73.json
+++ b/tests/integration/recordings/responses/840fbb380b73.json
@@ -20,15 +20,15 @@
       "__type__": "ollama._types.GenerateResponse",
       "__data__": {
         "model": "llama-guard3:1b",
-        "created_at": "2025-08-01T23:13:57.935921Z",
+        "created_at": "2025-09-03T17:37:47.871962Z",
         "done": true,
         "done_reason": "stop",
-        "total_duration": 313787333,
-        "load_duration": 89797542,
+        "total_duration": 301629042,
+        "load_duration": 102832917,
         "prompt_eval_count": 233,
-        "prompt_eval_duration": 167000000,
+        "prompt_eval_duration": 154806625,
         "eval_count": 5,
-        "eval_duration": 55000000,
+        "eval_duration": 43361542,
         "response": "unsafe\nS1",
         "thinking": null,
         "context": null
diff --git a/tests/integration/recordings/responses/84cab42e1f5c.json b/tests/integration/recordings/responses/84cab42e1f5c.json
index 423dd16da..611e67218 100644
--- a/tests/integration/recordings/responses/84cab42e1f5c.json
+++ b/tests/integration/recordings/responses/84cab42e1f5c.json
@@ -17,7 +17,7 @@
       {
         "__type__": "openai.types.completion.Completion",
         "__data__": {
-          "id": "cmpl-905",
+          "id": "cmpl-374",
           "choices": [
             {
               "finish_reason": null,
@@ -26,7 +26,7 @@
               "text": "Blue"
             }
           ],
-          "created": 1754348148,
+          "created": 1756921025,
           "model": "llama3.2:3b-instruct-fp16",
           "object": "text_completion",
           "system_fingerprint": "fp_ollama",
@@ -36,7 +36,7 @@
       {
         "__type__": "openai.types.completion.Completion",
         "__data__": {
-          "id": "cmpl-905",
+          "id": "cmpl-374",
           "choices": [
             {
               "finish_reason": null,
@@ -45,7 +45,7 @@
               "text": ".\n\n"
             }
           ],
-          "created": 1754348148,
+          "created": 1756921025,
           "model": "llama3.2:3b-instruct-fp16",
           "object": "text_completion",
           "system_fingerprint": "fp_ollama",
@@ -55,7 +55,7 @@
       {
         "__type__": "openai.types.completion.Completion",
         "__data__": {
-          "id": "cmpl-905",
+          "id": "cmpl-374",
           "choices": [
             {
               "finish_reason": null,
@@ -64,7 +64,7 @@
               "text": "My"
             }
           ],
-          "created": 1754348148,
+          "created": 1756921025,
           "model": "llama3.2:3b-instruct-fp16",
           "object": "text_completion",
           "system_fingerprint": "fp_ollama",
@@ -74,16 +74,16 @@
       {
         "__type__": "openai.types.completion.Completion",
         "__data__": {
-          "id": "cmpl-905",
+          "id": "cmpl-374",
           "choices": [
             {
               "finish_reason": null,
               "index": 0,
               "logprobs": null,
-              "text": " response"
+              "text": " answer"
             }
           ],
-          "created": 1754348148,
+          "created": 1756921025,
           "model": "llama3.2:3b-instruct-fp16",
           "object": "text_completion",
           "system_fingerprint": "fp_ollama",
@@ -93,7 +93,7 @@
       {
         "__type__": "openai.types.completion.Completion",
         "__data__": {
-          "id": "cmpl-905",
+          "id": "cmpl-374",
           "choices": [
             {
               "finish_reason": null,
@@ -102,7 +102,7 @@
               "text": " is"
             }
           ],
-          "created": 1754348148,
+          "created": 1756921025,
           "model": "llama3.2:3b-instruct-fp16",
           "object": "text_completion",
           "system_fingerprint": "fp_ollama",
@@ -112,634 +112,7 @@
       {
         "__type__": "openai.types.completion.Completion",
         "__data__": {
-          "id": "cmpl-905",
-          "choices": [
-            {
-              "finish_reason": null,
-              "index": 0,
-              "logprobs": null,
-              "text": " based"
-            }
-          ],
-          "created": 1754348149,
-          "model": "llama3.2:3b-instruct-fp16",
-          "object": "text_completion",
-          "system_fingerprint": "fp_ollama",
-          "usage": null
-        }
-      },
-      {
-        "__type__": "openai.types.completion.Completion",
-        "__data__": {
-          "id": "cmpl-905",
-          "choices": [
-            {
-              "finish_reason": null,
-              "index": 0,
-              "logprobs": null,
-              "text": " on"
-            }
-          ],
-          "created": 1754348149,
-          "model": "llama3.2:3b-instruct-fp16",
-          "object": "text_completion",
-          "system_fingerprint": "fp_ollama",
-          "usage": null
-        }
-      },
-      {
-        "__type__": "openai.types.completion.Completion",
-        "__data__": {
-          "id": "cmpl-905",
-          "choices": [
-            {
-              "finish_reason": null,
-              "index": 0,
-              "logprobs": null,
-              "text": " a"
-            }
-          ],
-          "created": 1754348149,
-          "model": "llama3.2:3b-instruct-fp16",
-          "object": "text_completion",
-          "system_fingerprint": "fp_ollama",
-          "usage": null
-        }
-      },
-      {
-        "__type__": "openai.types.completion.Completion",
-        "__data__": {
-          "id": "cmpl-905",
-          "choices": [
-            {
-              "finish_reason": null,
-              "index": 0,
-              "logprobs": null,
-              "text": " common"
-            }
-          ],
-          "created": 1754348149,
-          "model": "llama3.2:3b-instruct-fp16",
-          "object": "text_completion",
-          "system_fingerprint": "fp_ollama",
-          "usage": null
-        }
-      },
-      {
-        "__type__": "openai.types.completion.Completion",
-        "__data__": {
-          "id": "cmpl-905",
-          "choices": [
-            {
-              "finish_reason": null,
-              "index": 0,
-              "logprobs": null,
-              "text": " English"
-            }
-          ],
-          "created": 1754348149,
-          "model": "llama3.2:3b-instruct-fp16",
-          "object": "text_completion",
-          "system_fingerprint": "fp_ollama",
-          "usage": null
-        }
-      },
-      {
-        "__type__": "openai.types.completion.Completion",
-        "__data__": {
-          "id": "cmpl-905",
-          "choices": [
-            {
-              "finish_reason": null,
-              "index": 0,
-              "logprobs": null,
-              "text": " rhyme"
-            }
-          ],
-          "created": 1754348149,
-          "model": "llama3.2:3b-instruct-fp16",
-          "object": "text_completion",
-          "system_fingerprint": "fp_ollama",
-          "usage": null
-        }
-      },
-      {
-        "__type__": "openai.types.completion.Completion",
-        "__data__": {
-          "id": "cmpl-905",
-          "choices": [
-            {
-              "finish_reason": null,
-              "index": 0,
-              "logprobs": null,
-              "text": " or"
-            }
-          ],
-          "created": 1754348149,
-          "model": "llama3.2:3b-instruct-fp16",
-          "object": "text_completion",
-          "system_fingerprint": "fp_ollama",
-          "usage": null
-        }
-      },
-      {
-        "__type__": "openai.types.completion.Completion",
-        "__data__": {
-          "id": "cmpl-905",
-          "choices": [
-            {
-              "finish_reason": null,
-              "index": 0,
-              "logprobs": null,
-              "text": " poem"
-            }
-          ],
-          "created": 1754348149,
-          "model": "llama3.2:3b-instruct-fp16",
-          "object": "text_completion",
-          "system_fingerprint": "fp_ollama",
-          "usage": null
-        }
-      },
-      {
-        "__type__": "openai.types.completion.Completion",
-        "__data__": {
-          "id": "cmpl-905",
-          "choices": [
-            {
-              "finish_reason": null,
-              "index": 0,
-              "logprobs": null,
-              "text": " that"
-            }
-          ],
-          "created": 1754348149,
-          "model": "llama3.2:3b-instruct-fp16",
-          "object": "text_completion",
-          "system_fingerprint": "fp_ollama",
-          "usage": null
-        }
-      },
-      {
-        "__type__": "openai.types.completion.Completion",
-        "__data__": {
-          "id": "cmpl-905",
-          "choices": [
-            {
-              "finish_reason": null,
-              "index": 0,
-              "logprobs": null,
-              "text": " completes"
-            }
-          ],
-          "created": 1754348149,
-          "model": "llama3.2:3b-instruct-fp16",
-          "object": "text_completion",
-          "system_fingerprint": "fp_ollama",
-          "usage": null
-        }
-      },
-      {
-        "__type__": "openai.types.completion.Completion",
-        "__data__": {
-          "id": "cmpl-905",
-          "choices": [
-            {
-              "finish_reason": null,
-              "index": 0,
-              "logprobs": null,
-              "text": " the"
-            }
-          ],
-          "created": 1754348149,
-          "model": "llama3.2:3b-instruct-fp16",
-          "object": "text_completion",
-          "system_fingerprint": "fp_ollama",
-          "usage": null
-        }
-      },
-      {
-        "__type__": "openai.types.completion.Completion",
-        "__data__": {
-          "id": "cmpl-905",
-          "choices": [
-            {
-              "finish_reason": null,
-              "index": 0,
-              "logprobs": null,
-              "text": " sentence"
-            }
-          ],
-          "created": 1754348149,
-          "model": "llama3.2:3b-instruct-fp16",
-          "object": "text_completion",
-          "system_fingerprint": "fp_ollama",
-          "usage": null
-        }
-      },
-      {
-        "__type__": "openai.types.completion.Completion",
-        "__data__": {
-          "id": "cmpl-905",
-          "choices": [
-            {
-              "finish_reason": null,
-              "index": 0,
-              "logprobs": null,
-              "text": " with"
-            }
-          ],
-          "created": 1754348149,
-          "model": "llama3.2:3b-instruct-fp16",
-          "object": "text_completion",
-          "system_fingerprint": "fp_ollama",
-          "usage": null
-        }
-      },
-      {
-        "__type__": "openai.types.completion.Completion",
-        "__data__": {
-          "id": "cmpl-905",
-          "choices": [
-            {
-              "finish_reason": null,
-              "index": 0,
-              "logprobs": null,
-              "text": " the"
-            }
-          ],
-          "created": 1754348149,
-          "model": "llama3.2:3b-instruct-fp16",
-          "object": "text_completion",
-          "system_fingerprint": "fp_ollama",
-          "usage": null
-        }
-      },
-      {
-        "__type__": "openai.types.completion.Completion",
-        "__data__": {
-          "id": "cmpl-905",
-          "choices": [
-            {
-              "finish_reason": null,
-              "index": 0,
-              "logprobs": null,
-              "text": " word"
-            }
-          ],
-          "created": 1754348149,
-          "model": "llama3.2:3b-instruct-fp16",
-          "object": "text_completion",
-          "system_fingerprint": "fp_ollama",
-          "usage": null
-        }
-      },
-      {
-        "__type__": "openai.types.completion.Completion",
-        "__data__": {
-          "id": "cmpl-905",
-          "choices": [
-            {
-              "finish_reason": null,
-              "index": 0,
-              "logprobs": null,
-              "text": " \""
-            }
-          ],
-          "created": 1754348149,
-          "model": "llama3.2:3b-instruct-fp16",
-          "object": "text_completion",
-          "system_fingerprint": "fp_ollama",
-          "usage": null
-        }
-      },
-      {
-        "__type__": "openai.types.completion.Completion",
-        "__data__": {
-          "id": "cmpl-905",
-          "choices": [
-            {
-              "finish_reason": null,
-              "index": 0,
-              "logprobs": null,
-              "text": "blue"
-            }
-          ],
-          "created": 1754348149,
-          "model": "llama3.2:3b-instruct-fp16",
-          "object": "text_completion",
-          "system_fingerprint": "fp_ollama",
-          "usage": null
-        }
-      },
-      {
-        "__type__": "openai.types.completion.Completion",
-        "__data__": {
-          "id": "cmpl-905",
-          "choices": [
-            {
-              "finish_reason": null,
-              "index": 0,
-              "logprobs": null,
-              "text": "\"."
-            }
-          ],
-          "created": 1754348149,
-          "model": "llama3.2:3b-instruct-fp16",
-          "object": "text_completion",
-          "system_fingerprint": "fp_ollama",
-          "usage": null
-        }
-      },
-      {
-        "__type__": "openai.types.completion.Completion",
-        "__data__": {
-          "id": "cmpl-905",
-          "choices": [
-            {
-              "finish_reason": null,
-              "index": 0,
-              "logprobs": null,
-              "text": " The"
-            }
-          ],
-          "created": 1754348149,
-          "model": "llama3.2:3b-instruct-fp16",
-          "object": "text_completion",
-          "system_fingerprint": "fp_ollama",
-          "usage": null
-        }
-      },
-      {
-        "__type__": "openai.types.completion.Completion",
-        "__data__": {
-          "id": "cmpl-905",
-          "choices": [
-            {
-              "finish_reason": null,
-              "index": 0,
-              "logprobs": null,
-              "text": " complete"
-            }
-          ],
-          "created": 1754348150,
-          "model": "llama3.2:3b-instruct-fp16",
-          "object": "text_completion",
-          "system_fingerprint": "fp_ollama",
-          "usage": null
-        }
-      },
-      {
-        "__type__": "openai.types.completion.Completion",
-        "__data__": {
-          "id": "cmpl-905",
-          "choices": [
-            {
-              "finish_reason": null,
-              "index": 0,
-              "logprobs": null,
-              "text": " phrase"
-            }
-          ],
-          "created": 1754348150,
-          "model": "llama3.2:3b-instruct-fp16",
-          "object": "text_completion",
-          "system_fingerprint": "fp_ollama",
-          "usage": null
-        }
-      },
-      {
-        "__type__": "openai.types.completion.Completion",
-        "__data__": {
-          "id": "cmpl-905",
-          "choices": [
-            {
-              "finish_reason": null,
-              "index": 0,
-              "logprobs": null,
-              "text": " is"
-            }
-          ],
-          "created": 1754348150,
-          "model": "llama3.2:3b-instruct-fp16",
-          "object": "text_completion",
-          "system_fingerprint": "fp_ollama",
-          "usage": null
-        }
-      },
-      {
-        "__type__": "openai.types.completion.Completion",
-        "__data__": {
-          "id": "cmpl-905",
-          "choices": [
-            {
-              "finish_reason": null,
-              "index": 0,
-              "logprobs": null,
-              "text": ":"
-            }
-          ],
-          "created": 1754348150,
-          "model": "llama3.2:3b-instruct-fp16",
-          "object": "text_completion",
-          "system_fingerprint": "fp_ollama",
-          "usage": null
-        }
-      },
-      {
-        "__type__": "openai.types.completion.Completion",
-        "__data__": {
-          "id": "cmpl-905",
-          "choices": [
-            {
-              "finish_reason": null,
-              "index": 0,
-              "logprobs": null,
-              "text": " \""
-            }
-          ],
-          "created": 1754348150,
-          "model": "llama3.2:3b-instruct-fp16",
-          "object": "text_completion",
-          "system_fingerprint": "fp_ollama",
-          "usage": null
-        }
-      },
-      {
-        "__type__": "openai.types.completion.Completion",
-        "__data__": {
-          "id": "cmpl-905",
-          "choices": [
-            {
-              "finish_reason": null,
-              "index": 0,
-              "logprobs": null,
-              "text": "R"
-            }
-          ],
-          "created": 1754348150,
-          "model": "llama3.2:3b-instruct-fp16",
-          "object": "text_completion",
-          "system_fingerprint": "fp_ollama",
-          "usage": null
-        }
-      },
-      {
-        "__type__": "openai.types.completion.Completion",
-        "__data__": {
-          "id": "cmpl-905",
-          "choices": [
-            {
-              "finish_reason": null,
-              "index": 0,
-              "logprobs": null,
-              "text": "oses"
-            }
-          ],
-          "created": 1754348150,
-          "model": "llama3.2:3b-instruct-fp16",
-          "object": "text_completion",
-          "system_fingerprint": "fp_ollama",
-          "usage": null
-        }
-      },
-      {
-        "__type__": "openai.types.completion.Completion",
-        "__data__": {
-          "id": "cmpl-905",
-          "choices": [
-            {
-              "finish_reason": null,
-              "index": 0,
-              "logprobs": null,
-              "text": " are"
-            }
-          ],
-          "created": 1754348150,
-          "model": "llama3.2:3b-instruct-fp16",
-          "object": "text_completion",
-          "system_fingerprint": "fp_ollama",
-          "usage": null
-        }
-      },
-      {
-        "__type__": "openai.types.completion.Completion",
-        "__data__": {
-          "id": "cmpl-905",
-          "choices": [
-            {
-              "finish_reason": null,
-              "index": 0,
-              "logprobs": null,
-              "text": " red"
-            }
-          ],
-          "created": 1754348150,
-          "model": "llama3.2:3b-instruct-fp16",
-          "object": "text_completion",
-          "system_fingerprint": "fp_ollama",
-          "usage": null
-        }
-      },
-      {
-        "__type__": "openai.types.completion.Completion",
-        "__data__": {
-          "id": "cmpl-905",
-          "choices": [
-            {
-              "finish_reason": null,
-              "index": 0,
-              "logprobs": null,
-              "text": ","
-            }
-          ],
-          "created": 1754348150,
-          "model": "llama3.2:3b-instruct-fp16",
-          "object": "text_completion",
-          "system_fingerprint": "fp_ollama",
-          "usage": null
-        }
-      },
-      {
-        "__type__": "openai.types.completion.Completion",
-        "__data__": {
-          "id": "cmpl-905",
-          "choices": [
-            {
-              "finish_reason": null,
-              "index": 0,
-              "logprobs": null,
-              "text": " v"
-            }
-          ],
-          "created": 1754348150,
-          "model": "llama3.2:3b-instruct-fp16",
-          "object": "text_completion",
-          "system_fingerprint": "fp_ollama",
-          "usage": null
-        }
-      },
-      {
-        "__type__": "openai.types.completion.Completion",
-        "__data__": {
-          "id": "cmpl-905",
-          "choices": [
-            {
-              "finish_reason": null,
-              "index": 0,
-              "logprobs": null,
-              "text": "io"
-            }
-          ],
-          "created": 1754348150,
-          "model": "llama3.2:3b-instruct-fp16",
-          "object": "text_completion",
-          "system_fingerprint": "fp_ollama",
-          "usage": null
-        }
-      },
-      {
-        "__type__": "openai.types.completion.Completion",
-        "__data__": {
-          "id": "cmpl-905",
-          "choices": [
-            {
-              "finish_reason": null,
-              "index": 0,
-              "logprobs": null,
-              "text": "lets"
-            }
-          ],
-          "created": 1754348150,
-          "model": "llama3.2:3b-instruct-fp16",
-          "object": "text_completion",
-          "system_fingerprint": "fp_ollama",
-          "usage": null
-        }
-      },
-      {
-        "__type__": "openai.types.completion.Completion",
-        "__data__": {
-          "id": "cmpl-905",
-          "choices": [
-            {
-              "finish_reason": null,
-              "index": 0,
-              "logprobs": null,
-              "text": " are"
-            }
-          ],
-          "created": 1754348150,
-          "model": "llama3.2:3b-instruct-fp16",
-          "object": "text_completion",
-          "system_fingerprint": "fp_ollama",
-          "usage": null
-        }
-      },
-      {
-        "__type__": "openai.types.completion.Completion",
-        "__data__": {
-          "id": "cmpl-905",
+          "id": "cmpl-374",
           "choices": [
             {
               "finish_reason": null,
@@ -748,7 +121,7 @@
               "text": " blue"
             }
           ],
-          "created": 1754348150,
+          "created": 1756921025,
           "model": "llama3.2:3b-instruct-fp16",
           "object": "text_completion",
           "system_fingerprint": "fp_ollama",
@@ -758,16 +131,16 @@
       {
         "__type__": "openai.types.completion.Completion",
         "__data__": {
-          "id": "cmpl-905",
+          "id": "cmpl-374",
           "choices": [
             {
               "finish_reason": null,
               "index": 0,
               "logprobs": null,
-              "text": "\".\n\n"
+              "text": " because"
             }
           ],
-          "created": 1754348150,
+          "created": 1756921025,
           "model": "llama3.2:3b-instruct-fp16",
           "object": "text_completion",
           "system_fingerprint": "fp_ollama",
@@ -777,16 +150,16 @@
       {
         "__type__": "openai.types.completion.Completion",
         "__data__": {
-          "id": "cmpl-905",
+          "id": "cmpl-374",
           "choices": [
             {
               "finish_reason": null,
               "index": 0,
               "logprobs": null,
-              "text": "The"
+              "text": " it"
             }
           ],
-          "created": 1754348150,
+          "created": 1756921025,
           "model": "llama3.2:3b-instruct-fp16",
           "object": "text_completion",
           "system_fingerprint": "fp_ollama",
@@ -796,16 +169,16 @@
       {
         "__type__": "openai.types.completion.Completion",
         "__data__": {
-          "id": "cmpl-905",
+          "id": "cmpl-374",
           "choices": [
             {
               "finish_reason": null,
               "index": 0,
               "logprobs": null,
-              "text": " use"
+              "text": "'s"
             }
           ],
-          "created": 1754348150,
+          "created": 1756921025,
           "model": "llama3.2:3b-instruct-fp16",
           "object": "text_completion",
           "system_fingerprint": "fp_ollama",
@@ -815,7 +188,121 @@
       {
         "__type__": "openai.types.completion.Completion",
         "__data__": {
-          "id": "cmpl-905",
+          "id": "cmpl-374",
+          "choices": [
+            {
+              "finish_reason": null,
+              "index": 0,
+              "logprobs": null,
+              "text": " a"
+            }
+          ],
+          "created": 1756921025,
+          "model": "llama3.2:3b-instruct-fp16",
+          "object": "text_completion",
+          "system_fingerprint": "fp_ollama",
+          "usage": null
+        }
+      },
+      {
+        "__type__": "openai.types.completion.Completion",
+        "__data__": {
+          "id": "cmpl-374",
+          "choices": [
+            {
+              "finish_reason": null,
+              "index": 0,
+              "logprobs": null,
+              "text": " common"
+            }
+          ],
+          "created": 1756921025,
+          "model": "llama3.2:3b-instruct-fp16",
+          "object": "text_completion",
+          "system_fingerprint": "fp_ollama",
+          "usage": null
+        }
+      },
+      {
+        "__type__": "openai.types.completion.Completion",
+        "__data__": {
+          "id": "cmpl-374",
+          "choices": [
+            {
+              "finish_reason": null,
+              "index": 0,
+              "logprobs": null,
+              "text": " and"
+            }
+          ],
+          "created": 1756921025,
+          "model": "llama3.2:3b-instruct-fp16",
+          "object": "text_completion",
+          "system_fingerprint": "fp_ollama",
+          "usage": null
+        }
+      },
+      {
+        "__type__": "openai.types.completion.Completion",
+        "__data__": {
+          "id": "cmpl-374",
+          "choices": [
+            {
+              "finish_reason": null,
+              "index": 0,
+              "logprobs": null,
+              "text": " well"
+            }
+          ],
+          "created": 1756921025,
+          "model": "llama3.2:3b-instruct-fp16",
+          "object": "text_completion",
+          "system_fingerprint": "fp_ollama",
+          "usage": null
+        }
+      },
+      {
+        "__type__": "openai.types.completion.Completion",
+        "__data__": {
+          "id": "cmpl-374",
+          "choices": [
+            {
+              "finish_reason": null,
+              "index": 0,
+              "logprobs": null,
+              "text": "-known"
+            }
+          ],
+          "created": 1756921025,
+          "model": "llama3.2:3b-instruct-fp16",
+          "object": "text_completion",
+          "system_fingerprint": "fp_ollama",
+          "usage": null
+        }
+      },
+      {
+        "__type__": "openai.types.completion.Completion",
+        "__data__": {
+          "id": "cmpl-374",
+          "choices": [
+            {
+              "finish_reason": null,
+              "index": 0,
+              "logprobs": null,
+              "text": " completion"
+            }
+          ],
+          "created": 1756921025,
+          "model": "llama3.2:3b-instruct-fp16",
+          "object": "text_completion",
+          "system_fingerprint": "fp_ollama",
+          "usage": null
+        }
+      },
+      {
+        "__type__": "openai.types.completion.Completion",
+        "__data__": {
+          "id": "cmpl-374",
           "choices": [
             {
               "finish_reason": null,
@@ -824,7 +311,7 @@
               "text": " of"
             }
           ],
-          "created": 1754348151,
+          "created": 1756921026,
           "model": "llama3.2:3b-instruct-fp16",
           "object": "text_completion",
           "system_fingerprint": "fp_ollama",
@@ -834,7 +321,7 @@
       {
         "__type__": "openai.types.completion.Completion",
         "__data__": {
-          "id": "cmpl-905",
+          "id": "cmpl-374",
           "choices": [
             {
               "finish_reason": null,
@@ -843,7 +330,7 @@
               "text": " the"
             }
           ],
-          "created": 1754348151,
+          "created": 1756921026,
           "model": "llama3.2:3b-instruct-fp16",
           "object": "text_completion",
           "system_fingerprint": "fp_ollama",
@@ -853,16 +340,16 @@
       {
         "__type__": "openai.types.completion.Completion",
         "__data__": {
-          "id": "cmpl-905",
+          "id": "cmpl-374",
           "choices": [
             {
               "finish_reason": null,
               "index": 0,
               "logprobs": null,
-              "text": " word"
+              "text": " classic"
             }
           ],
-          "created": 1754348151,
+          "created": 1756921026,
           "model": "llama3.2:3b-instruct-fp16",
           "object": "text_completion",
           "system_fingerprint": "fp_ollama",
@@ -872,7 +359,64 @@
       {
         "__type__": "openai.types.completion.Completion",
         "__data__": {
-          "id": "cmpl-905",
+          "id": "cmpl-374",
+          "choices": [
+            {
+              "finish_reason": null,
+              "index": 0,
+              "logprobs": null,
+              "text": " tongue"
+            }
+          ],
+          "created": 1756921026,
+          "model": "llama3.2:3b-instruct-fp16",
+          "object": "text_completion",
+          "system_fingerprint": "fp_ollama",
+          "usage": null
+        }
+      },
+      {
+        "__type__": "openai.types.completion.Completion",
+        "__data__": {
+          "id": "cmpl-374",
+          "choices": [
+            {
+              "finish_reason": null,
+              "index": 0,
+              "logprobs": null,
+              "text": "-tw"
+            }
+          ],
+          "created": 1756921026,
+          "model": "llama3.2:3b-instruct-fp16",
+          "object": "text_completion",
+          "system_fingerprint": "fp_ollama",
+          "usage": null
+        }
+      },
+      {
+        "__type__": "openai.types.completion.Completion",
+        "__data__": {
+          "id": "cmpl-374",
+          "choices": [
+            {
+              "finish_reason": null,
+              "index": 0,
+              "logprobs": null,
+              "text": "ister"
+            }
+          ],
+          "created": 1756921026,
+          "model": "llama3.2:3b-instruct-fp16",
+          "object": "text_completion",
+          "system_fingerprint": "fp_ollama",
+          "usage": null
+        }
+      },
+      {
+        "__type__": "openai.types.completion.Completion",
+        "__data__": {
+          "id": "cmpl-374",
           "choices": [
             {
               "finish_reason": null,
@@ -881,7 +425,7 @@
               "text": " \""
             }
           ],
-          "created": 1754348151,
+          "created": 1756921026,
           "model": "llama3.2:3b-instruct-fp16",
           "object": "text_completion",
           "system_fingerprint": "fp_ollama",
@@ -891,16 +435,16 @@
       {
         "__type__": "openai.types.completion.Completion",
         "__data__": {
-          "id": "cmpl-905",
+          "id": "cmpl-374",
           "choices": [
             {
               "finish_reason": null,
               "index": 0,
               "logprobs": null,
-              "text": "blue"
+              "text": "R"
             }
           ],
-          "created": 1754348151,
+          "created": 1756921026,
           "model": "llama3.2:3b-instruct-fp16",
           "object": "text_completion",
           "system_fingerprint": "fp_ollama",
@@ -910,7 +454,159 @@
       {
         "__type__": "openai.types.completion.Completion",
         "__data__": {
-          "id": "cmpl-905",
+          "id": "cmpl-374",
+          "choices": [
+            {
+              "finish_reason": null,
+              "index": 0,
+              "logprobs": null,
+              "text": "oses"
+            }
+          ],
+          "created": 1756921026,
+          "model": "llama3.2:3b-instruct-fp16",
+          "object": "text_completion",
+          "system_fingerprint": "fp_ollama",
+          "usage": null
+        }
+      },
+      {
+        "__type__": "openai.types.completion.Completion",
+        "__data__": {
+          "id": "cmpl-374",
+          "choices": [
+            {
+              "finish_reason": null,
+              "index": 0,
+              "logprobs": null,
+              "text": " are"
+            }
+          ],
+          "created": 1756921026,
+          "model": "llama3.2:3b-instruct-fp16",
+          "object": "text_completion",
+          "system_fingerprint": "fp_ollama",
+          "usage": null
+        }
+      },
+      {
+        "__type__": "openai.types.completion.Completion",
+        "__data__": {
+          "id": "cmpl-374",
+          "choices": [
+            {
+              "finish_reason": null,
+              "index": 0,
+              "logprobs": null,
+              "text": " red"
+            }
+          ],
+          "created": 1756921026,
+          "model": "llama3.2:3b-instruct-fp16",
+          "object": "text_completion",
+          "system_fingerprint": "fp_ollama",
+          "usage": null
+        }
+      },
+      {
+        "__type__": "openai.types.completion.Completion",
+        "__data__": {
+          "id": "cmpl-374",
+          "choices": [
+            {
+              "finish_reason": null,
+              "index": 0,
+              "logprobs": null,
+              "text": ","
+            }
+          ],
+          "created": 1756921026,
+          "model": "llama3.2:3b-instruct-fp16",
+          "object": "text_completion",
+          "system_fingerprint": "fp_ollama",
+          "usage": null
+        }
+      },
+      {
+        "__type__": "openai.types.completion.Completion",
+        "__data__": {
+          "id": "cmpl-374",
+          "choices": [
+            {
+              "finish_reason": null,
+              "index": 0,
+              "logprobs": null,
+              "text": " v"
+            }
+          ],
+          "created": 1756921026,
+          "model": "llama3.2:3b-instruct-fp16",
+          "object": "text_completion",
+          "system_fingerprint": "fp_ollama",
+          "usage": null
+        }
+      },
+      {
+        "__type__": "openai.types.completion.Completion",
+        "__data__": {
+          "id": "cmpl-374",
+          "choices": [
+            {
+              "finish_reason": null,
+              "index": 0,
+              "logprobs": null,
+              "text": "io"
+            }
+          ],
+          "created": 1756921026,
+          "model": "llama3.2:3b-instruct-fp16",
+          "object": "text_completion",
+          "system_fingerprint": "fp_ollama",
+          "usage": null
+        }
+      },
+      {
+        "__type__": "openai.types.completion.Completion",
+        "__data__": {
+          "id": "cmpl-374",
+          "choices": [
+            {
+              "finish_reason": null,
+              "index": 0,
+              "logprobs": null,
+              "text": "lets"
+            }
+          ],
+          "created": 1756921026,
+          "model": "llama3.2:3b-instruct-fp16",
+          "object": "text_completion",
+          "system_fingerprint": "fp_ollama",
+          "usage": null
+        }
+      },
+      {
+        "__type__": "openai.types.completion.Completion",
+        "__data__": {
+          "id": "cmpl-374",
+          "choices": [
+            {
+              "finish_reason": null,
+              "index": 0,
+              "logprobs": null,
+              "text": " are"
+            }
+          ],
+          "created": 1756921026,
+          "model": "llama3.2:3b-instruct-fp16",
+          "object": "text_completion",
+          "system_fingerprint": "fp_ollama",
+          "usage": null
+        }
+      },
+      {
+        "__type__": "openai.types.completion.Completion",
+        "__data__": {
+          "id": "cmpl-374",
           "choices": [
             {
               "finish_reason": null,
@@ -919,7 +615,7 @@
               "text": "\""
             }
           ],
-          "created": 1754348151,
+          "created": 1756921026,
           "model": "llama3.2:3b-instruct-fp16",
           "object": "text_completion",
           "system_fingerprint": "fp_ollama",
@@ -929,7 +625,292 @@
       {
         "__type__": "openai.types.completion.Completion",
         "__data__": {
-          "id": "cmpl-905",
+          "id": "cmpl-374",
+          "choices": [
+            {
+              "finish_reason": null,
+              "index": 0,
+              "logprobs": null,
+              "text": " \u2013"
+            }
+          ],
+          "created": 1756921026,
+          "model": "llama3.2:3b-instruct-fp16",
+          "object": "text_completion",
+          "system_fingerprint": "fp_ollama",
+          "usage": null
+        }
+      },
+      {
+        "__type__": "openai.types.completion.Completion",
+        "__data__": {
+          "id": "cmpl-374",
+          "choices": [
+            {
+              "finish_reason": null,
+              "index": 0,
+              "logprobs": null,
+              "text": " often"
+            }
+          ],
+          "created": 1756921026,
+          "model": "llama3.2:3b-instruct-fp16",
+          "object": "text_completion",
+          "system_fingerprint": "fp_ollama",
+          "usage": null
+        }
+      },
+      {
+        "__type__": "openai.types.completion.Completion",
+        "__data__": {
+          "id": "cmpl-374",
+          "choices": [
+            {
+              "finish_reason": null,
+              "index": 0,
+              "logprobs": null,
+              "text": " followed"
+            }
+          ],
+          "created": 1756921026,
+          "model": "llama3.2:3b-instruct-fp16",
+          "object": "text_completion",
+          "system_fingerprint": "fp_ollama",
+          "usage": null
+        }
+      },
+      {
+        "__type__": "openai.types.completion.Completion",
+        "__data__": {
+          "id": "cmpl-374",
+          "choices": [
+            {
+              "finish_reason": null,
+              "index": 0,
+              "logprobs": null,
+              "text": " by"
+            }
+          ],
+          "created": 1756921026,
+          "model": "llama3.2:3b-instruct-fp16",
+          "object": "text_completion",
+          "system_fingerprint": "fp_ollama",
+          "usage": null
+        }
+      },
+      {
+        "__type__": "openai.types.completion.Completion",
+        "__data__": {
+          "id": "cmpl-374",
+          "choices": [
+            {
+              "finish_reason": null,
+              "index": 0,
+              "logprobs": null,
+              "text": " the"
+            }
+          ],
+          "created": 1756921026,
+          "model": "llama3.2:3b-instruct-fp16",
+          "object": "text_completion",
+          "system_fingerprint": "fp_ollama",
+          "usage": null
+        }
+      },
+      {
+        "__type__": "openai.types.completion.Completion",
+        "__data__": {
+          "id": "cmpl-374",
+          "choices": [
+            {
+              "finish_reason": null,
+              "index": 0,
+              "logprobs": null,
+              "text": " phrase"
+            }
+          ],
+          "created": 1756921026,
+          "model": "llama3.2:3b-instruct-fp16",
+          "object": "text_completion",
+          "system_fingerprint": "fp_ollama",
+          "usage": null
+        }
+      },
+      {
+        "__type__": "openai.types.completion.Completion",
+        "__data__": {
+          "id": "cmpl-374",
+          "choices": [
+            {
+              "finish_reason": null,
+              "index": 0,
+              "logprobs": null,
+              "text": " \""
+            }
+          ],
+          "created": 1756921026,
+          "model": "llama3.2:3b-instruct-fp16",
+          "object": "text_completion",
+          "system_fingerprint": "fp_ollama",
+          "usage": null
+        }
+      },
+      {
+        "__type__": "openai.types.completion.Completion",
+        "__data__": {
+          "id": "cmpl-374",
+          "choices": [
+            {
+              "finish_reason": null,
+              "index": 0,
+              "logprobs": null,
+              "text": "blue"
+            }
+          ],
+          "created": 1756921027,
+          "model": "llama3.2:3b-instruct-fp16",
+          "object": "text_completion",
+          "system_fingerprint": "fp_ollama",
+          "usage": null
+        }
+      },
+      {
+        "__type__": "openai.types.completion.Completion",
+        "__data__": {
+          "id": "cmpl-374",
+          "choices": [
+            {
+              "finish_reason": null,
+              "index": 0,
+              "logprobs": null,
+              "text": ".\""
+            }
+          ],
+          "created": 1756921027,
+          "model": "llama3.2:3b-instruct-fp16",
+          "object": "text_completion",
+          "system_fingerprint": "fp_ollama",
+          "usage": null
+        }
+      },
+      {
+        "__type__": "openai.types.completion.Completion",
+        "__data__": {
+          "id": "cmpl-374",
+          "choices": [
+            {
+              "finish_reason": null,
+              "index": 0,
+              "logprobs": null,
+              "text": " This"
+            }
+          ],
+          "created": 1756921027,
+          "model": "llama3.2:3b-instruct-fp16",
+          "object": "text_completion",
+          "system_fingerprint": "fp_ollama",
+          "usage": null
+        }
+      },
+      {
+        "__type__": "openai.types.completion.Completion",
+        "__data__": {
+          "id": "cmpl-374",
+          "choices": [
+            {
+              "finish_reason": null,
+              "index": 0,
+              "logprobs": null,
+              "text": " rhyme"
+            }
+          ],
+          "created": 1756921027,
+          "model": "llama3.2:3b-instruct-fp16",
+          "object": "text_completion",
+          "system_fingerprint": "fp_ollama",
+          "usage": null
+        }
+      },
+      {
+        "__type__": "openai.types.completion.Completion",
+        "__data__": {
+          "id": "cmpl-374",
+          "choices": [
+            {
+              "finish_reason": null,
+              "index": 0,
+              "logprobs": null,
+              "text": " has"
+            }
+          ],
+          "created": 1756921027,
+          "model": "llama3.2:3b-instruct-fp16",
+          "object": "text_completion",
+          "system_fingerprint": "fp_ollama",
+          "usage": null
+        }
+      },
+      {
+        "__type__": "openai.types.completion.Completion",
+        "__data__": {
+          "id": "cmpl-374",
+          "choices": [
+            {
+              "finish_reason": null,
+              "index": 0,
+              "logprobs": null,
+              "text": " been"
+            }
+          ],
+          "created": 1756921027,
+          "model": "llama3.2:3b-instruct-fp16",
+          "object": "text_completion",
+          "system_fingerprint": "fp_ollama",
+          "usage": null
+        }
+      },
+      {
+        "__type__": "openai.types.completion.Completion",
+        "__data__": {
+          "id": "cmpl-374",
+          "choices": [
+            {
+              "finish_reason": null,
+              "index": 0,
+              "logprobs": null,
+              "text": " widely"
+            }
+          ],
+          "created": 1756921027,
+          "model": "llama3.2:3b-instruct-fp16",
+          "object": "text_completion",
+          "system_fingerprint": "fp_ollama",
+          "usage": null
+        }
+      },
+      {
+        "__type__": "openai.types.completion.Completion",
+        "__data__": {
+          "id": "cmpl-374",
+          "choices": [
+            {
+              "finish_reason": null,
+              "index": 0,
+              "logprobs": null,
+              "text": " used"
+            }
+          ],
+          "created": 1756921027,
+          "model": "llama3.2:3b-instruct-fp16",
+          "object": "text_completion",
+          "system_fingerprint": "fp_ollama",
+          "usage": null
+        }
+      },
+      {
+        "__type__": "openai.types.completion.Completion",
+        "__data__": {
+          "id": "cmpl-374",
           "choices": [
             {
               "finish_reason": null,
@@ -938,7 +919,7 @@
               "text": " in"
             }
           ],
-          "created": 1754348151,
+          "created": 1756921027,
           "model": "llama3.2:3b-instruct-fp16",
           "object": "text_completion",
           "system_fingerprint": "fp_ollama",
@@ -948,16 +929,16 @@
       {
         "__type__": "openai.types.completion.Completion",
         "__data__": {
-          "id": "cmpl-905",
+          "id": "cmpl-374",
           "choices": [
             {
               "finish_reason": null,
               "index": 0,
               "logprobs": null,
-              "text": " this"
+              "text": " literature"
             }
           ],
-          "created": 1754348151,
+          "created": 1756921027,
           "model": "llama3.2:3b-instruct-fp16",
           "object": "text_completion",
           "system_fingerprint": "fp_ollama",
@@ -967,7 +948,26 @@
       {
         "__type__": "openai.types.completion.Completion",
         "__data__": {
-          "id": "cmpl-905",
+          "id": "cmpl-374",
+          "choices": [
+            {
+              "finish_reason": null,
+              "index": 0,
+              "logprobs": null,
+              "text": ","
+            }
+          ],
+          "created": 1756921027,
+          "model": "llama3.2:3b-instruct-fp16",
+          "object": "text_completion",
+          "system_fingerprint": "fp_ollama",
+          "usage": null
+        }
+      },
+      {
+        "__type__": "openai.types.completion.Completion",
+        "__data__": {
+          "id": "cmpl-374",
           "choices": [
             {
               "finish_reason": "length",
@@ -976,7 +976,7 @@
               "text": ""
             }
           ],
-          "created": 1754348151,
+          "created": 1756921027,
           "model": "llama3.2:3b-instruct-fp16",
           "object": "text_completion",
           "system_fingerprint": "fp_ollama",
diff --git a/tests/integration/recordings/responses/85594a69d74a.json b/tests/integration/recordings/responses/85594a69d74a.json
index 286b8da11..c4a01bc33 100644
--- a/tests/integration/recordings/responses/85594a69d74a.json
+++ b/tests/integration/recordings/responses/85594a69d74a.json
@@ -20,15 +20,15 @@
       "__type__": "ollama._types.GenerateResponse",
       "__data__": {
         "model": "llama-guard3:1b",
-        "created_at": "2025-08-01T23:12:54.634929Z",
+        "created_at": "2025-09-03T17:37:36.046489Z",
         "done": true,
         "done_reason": "stop",
-        "total_duration": 233222375,
-        "load_duration": 136303125,
+        "total_duration": 198969250,
+        "load_duration": 110421000,
         "prompt_eval_count": 213,
-        "prompt_eval_duration": 78000000,
+        "prompt_eval_duration": 76196541,
         "eval_count": 2,
-        "eval_duration": 17000000,
+        "eval_duration": 11832042,
         "response": "safe",
         "thinking": null,
         "context": null
diff --git a/tests/integration/recordings/responses/97d3812bfccb.json b/tests/integration/recordings/responses/97d3812bfccb.json
index 8a9b076fd..11e0fb402 100644
--- a/tests/integration/recordings/responses/97d3812bfccb.json
+++ b/tests/integration/recordings/responses/97d3812bfccb.json
@@ -20,15 +20,15 @@
       "__type__": "ollama._types.GenerateResponse",
       "__data__": {
         "model": "llama-guard3:1b",
-        "created_at": "2025-08-01T23:14:06.082832Z",
+        "created_at": "2025-09-03T17:37:52.965106Z",
         "done": true,
         "done_reason": "stop",
-        "total_duration": 421905083,
-        "load_duration": 88557750,
+        "total_duration": 376594792,
+        "load_duration": 158273792,
         "prompt_eval_count": 217,
-        "prompt_eval_duration": 278000000,
+        "prompt_eval_duration": 177001375,
         "eval_count": 5,
-        "eval_duration": 54000000,
+        "eval_duration": 40927500,
         "response": "unsafe\nS1",
         "thinking": null,
         "context": null
diff --git a/tests/integration/recordings/responses/97e259c0d3e5.json b/tests/integration/recordings/responses/97e259c0d3e5.json
index cd083c9a8..2e47bca80 100644
--- a/tests/integration/recordings/responses/97e259c0d3e5.json
+++ b/tests/integration/recordings/responses/97e259c0d3e5.json
@@ -22,7 +22,7 @@
         "__type__": "ollama._types.GenerateResponse",
         "__data__": {
           "model": "llama3.2:3b-instruct-fp16",
-          "created_at": "2025-08-01T23:14:07.138696Z",
+          "created_at": "2025-09-03T17:37:53.505006Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -40,7 +40,7 @@
         "__type__": "ollama._types.GenerateResponse",
         "__data__": {
           "model": "llama3.2:3b-instruct-fp16",
-          "created_at": "2025-08-01T23:14:07.195013Z",
+          "created_at": "2025-09-03T17:37:53.547032Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -58,7 +58,7 @@
         "__type__": "ollama._types.GenerateResponse",
         "__data__": {
           "model": "llama3.2:3b-instruct-fp16",
-          "created_at": "2025-08-01T23:14:07.246591Z",
+          "created_at": "2025-09-03T17:37:53.588985Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -76,7 +76,7 @@
         "__type__": "ollama._types.GenerateResponse",
         "__data__": {
           "model": "llama3.2:3b-instruct-fp16",
-          "created_at": "2025-08-01T23:14:07.29736Z",
+          "created_at": "2025-09-03T17:37:53.631139Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -94,7 +94,7 @@
         "__type__": "ollama._types.GenerateResponse",
         "__data__": {
           "model": "llama3.2:3b-instruct-fp16",
-          "created_at": "2025-08-01T23:14:07.347941Z",
+          "created_at": "2025-09-03T17:37:53.67269Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -112,7 +112,7 @@
         "__type__": "ollama._types.GenerateResponse",
         "__data__": {
           "model": "llama3.2:3b-instruct-fp16",
-          "created_at": "2025-08-01T23:14:07.399151Z",
+          "created_at": "2025-09-03T17:37:53.714798Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -130,7 +130,7 @@
         "__type__": "ollama._types.GenerateResponse",
         "__data__": {
           "model": "llama3.2:3b-instruct-fp16",
-          "created_at": "2025-08-01T23:14:07.452488Z",
+          "created_at": "2025-09-03T17:37:53.756492Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -148,7 +148,7 @@
         "__type__": "ollama._types.GenerateResponse",
         "__data__": {
           "model": "llama3.2:3b-instruct-fp16",
-          "created_at": "2025-08-01T23:14:07.50538Z",
+          "created_at": "2025-09-03T17:37:53.798115Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -166,7 +166,7 @@
         "__type__": "ollama._types.GenerateResponse",
         "__data__": {
           "model": "llama3.2:3b-instruct-fp16",
-          "created_at": "2025-08-01T23:14:07.558656Z",
+          "created_at": "2025-09-03T17:37:53.840012Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -184,7 +184,7 @@
         "__type__": "ollama._types.GenerateResponse",
         "__data__": {
           "model": "llama3.2:3b-instruct-fp16",
-          "created_at": "2025-08-01T23:14:07.610408Z",
+          "created_at": "2025-09-03T17:37:53.882555Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -202,7 +202,7 @@
         "__type__": "ollama._types.GenerateResponse",
         "__data__": {
           "model": "llama3.2:3b-instruct-fp16",
-          "created_at": "2025-08-01T23:14:07.66358Z",
+          "created_at": "2025-09-03T17:37:53.924566Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -220,7 +220,7 @@
         "__type__": "ollama._types.GenerateResponse",
         "__data__": {
           "model": "llama3.2:3b-instruct-fp16",
-          "created_at": "2025-08-01T23:14:07.717638Z",
+          "created_at": "2025-09-03T17:37:53.966279Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -238,7 +238,7 @@
         "__type__": "ollama._types.GenerateResponse",
         "__data__": {
           "model": "llama3.2:3b-instruct-fp16",
-          "created_at": "2025-08-01T23:14:07.769423Z",
+          "created_at": "2025-09-03T17:37:54.008483Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -256,7 +256,7 @@
         "__type__": "ollama._types.GenerateResponse",
         "__data__": {
           "model": "llama3.2:3b-instruct-fp16",
-          "created_at": "2025-08-01T23:14:07.819395Z",
+          "created_at": "2025-09-03T17:37:54.050042Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -274,7 +274,7 @@
         "__type__": "ollama._types.GenerateResponse",
         "__data__": {
           "model": "llama3.2:3b-instruct-fp16",
-          "created_at": "2025-08-01T23:14:07.871391Z",
+          "created_at": "2025-09-03T17:37:54.092416Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -292,7 +292,7 @@
         "__type__": "ollama._types.GenerateResponse",
         "__data__": {
           "model": "llama3.2:3b-instruct-fp16",
-          "created_at": "2025-08-01T23:14:07.924892Z",
+          "created_at": "2025-09-03T17:37:54.134857Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -310,7 +310,7 @@
         "__type__": "ollama._types.GenerateResponse",
         "__data__": {
           "model": "llama3.2:3b-instruct-fp16",
-          "created_at": "2025-08-01T23:14:07.976557Z",
+          "created_at": "2025-09-03T17:37:54.176408Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -328,7 +328,7 @@
         "__type__": "ollama._types.GenerateResponse",
         "__data__": {
           "model": "llama3.2:3b-instruct-fp16",
-          "created_at": "2025-08-01T23:14:08.029579Z",
+          "created_at": "2025-09-03T17:37:54.217553Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -346,15 +346,15 @@
         "__type__": "ollama._types.GenerateResponse",
         "__data__": {
           "model": "llama3.2:3b-instruct-fp16",
-          "created_at": "2025-08-01T23:14:08.082749Z",
+          "created_at": "2025-09-03T17:37:54.259141Z",
           "done": true,
           "done_reason": "stop",
-          "total_duration": 1425800209,
-          "load_duration": 138858459,
+          "total_duration": 1008303875,
+          "load_duration": 119709875,
           "prompt_eval_count": 384,
-          "prompt_eval_duration": 340000000,
+          "prompt_eval_duration": 132645959,
           "eval_count": 19,
-          "eval_duration": 945000000,
+          "eval_duration": 755215708,
           "response": "",
           "thinking": null,
           "context": null
diff --git a/tests/integration/recordings/responses/9c140a29ae09.json b/tests/integration/recordings/responses/9c140a29ae09.json
index 41b070cc5..a436484d7 100644
--- a/tests/integration/recordings/responses/9c140a29ae09.json
+++ b/tests/integration/recordings/responses/9c140a29ae09.json
@@ -22,7 +22,7 @@
         "__type__": "ollama._types.GenerateResponse",
         "__data__": {
           "model": "llama3.2:3b-instruct-fp16",
-          "created_at": "2025-08-01T23:14:09.83858Z",
+          "created_at": "2025-09-03T17:37:55.13567Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -40,7 +40,7 @@
         "__type__": "ollama._types.GenerateResponse",
         "__data__": {
           "model": "llama3.2:3b-instruct-fp16",
-          "created_at": "2025-08-01T23:14:09.891488Z",
+          "created_at": "2025-09-03T17:37:55.17774Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -58,7 +58,7 @@
         "__type__": "ollama._types.GenerateResponse",
         "__data__": {
           "model": "llama3.2:3b-instruct-fp16",
-          "created_at": "2025-08-01T23:14:09.945656Z",
+          "created_at": "2025-09-03T17:37:55.220061Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -76,7 +76,7 @@
         "__type__": "ollama._types.GenerateResponse",
         "__data__": {
           "model": "llama3.2:3b-instruct-fp16",
-          "created_at": "2025-08-01T23:14:09.996898Z",
+          "created_at": "2025-09-03T17:37:55.261406Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -94,7 +94,7 @@
         "__type__": "ollama._types.GenerateResponse",
         "__data__": {
           "model": "llama3.2:3b-instruct-fp16",
-          "created_at": "2025-08-01T23:14:10.053632Z",
+          "created_at": "2025-09-03T17:37:55.302615Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -112,7 +112,7 @@
         "__type__": "ollama._types.GenerateResponse",
         "__data__": {
           "model": "llama3.2:3b-instruct-fp16",
-          "created_at": "2025-08-01T23:14:10.105753Z",
+          "created_at": "2025-09-03T17:37:55.343879Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -130,7 +130,7 @@
         "__type__": "ollama._types.GenerateResponse",
         "__data__": {
           "model": "llama3.2:3b-instruct-fp16",
-          "created_at": "2025-08-01T23:14:10.157953Z",
+          "created_at": "2025-09-03T17:37:55.384951Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -148,7 +148,7 @@
         "__type__": "ollama._types.GenerateResponse",
         "__data__": {
           "model": "llama3.2:3b-instruct-fp16",
-          "created_at": "2025-08-01T23:14:10.210869Z",
+          "created_at": "2025-09-03T17:37:55.426563Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -166,7 +166,7 @@
         "__type__": "ollama._types.GenerateResponse",
         "__data__": {
           "model": "llama3.2:3b-instruct-fp16",
-          "created_at": "2025-08-01T23:14:10.263387Z",
+          "created_at": "2025-09-03T17:37:55.467648Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -184,7 +184,7 @@
         "__type__": "ollama._types.GenerateResponse",
         "__data__": {
           "model": "llama3.2:3b-instruct-fp16",
-          "created_at": "2025-08-01T23:14:10.317794Z",
+          "created_at": "2025-09-03T17:37:55.509469Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -202,7 +202,7 @@
         "__type__": "ollama._types.GenerateResponse",
         "__data__": {
           "model": "llama3.2:3b-instruct-fp16",
-          "created_at": "2025-08-01T23:14:10.373978Z",
+          "created_at": "2025-09-03T17:37:55.552302Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -220,7 +220,7 @@
         "__type__": "ollama._types.GenerateResponse",
         "__data__": {
           "model": "llama3.2:3b-instruct-fp16",
-          "created_at": "2025-08-01T23:14:10.429702Z",
+          "created_at": "2025-09-03T17:37:55.596236Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -238,15 +238,15 @@
         "__type__": "ollama._types.GenerateResponse",
         "__data__": {
           "model": "llama3.2:3b-instruct-fp16",
-          "created_at": "2025-08-01T23:14:10.483762Z",
+          "created_at": "2025-09-03T17:37:55.637816Z",
           "done": true,
           "done_reason": "stop",
-          "total_duration": 1041142084,
-          "load_duration": 110407459,
+          "total_duration": 726849208,
+          "load_duration": 147625750,
           "prompt_eval_count": 415,
-          "prompt_eval_duration": 283000000,
+          "prompt_eval_duration": 75722709,
           "eval_count": 13,
-          "eval_duration": 646000000,
+          "eval_duration": 502787333,
           "response": "",
           "thinking": null,
           "context": null
diff --git a/tests/integration/recordings/responses/9c28ec9ac338.json b/tests/integration/recordings/responses/9c28ec9ac338.json
index c71e798d2..45bfebee5 100644
--- a/tests/integration/recordings/responses/9c28ec9ac338.json
+++ b/tests/integration/recordings/responses/9c28ec9ac338.json
@@ -21,7 +21,7 @@
         "__type__": "ollama._types.GenerateResponse",
         "__data__": {
           "model": "llama3.2:3b-instruct-fp16",
-          "created_at": "2025-07-29T23:46:36.316207Z",
+          "created_at": "2025-09-03T17:34:23.434819Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -39,7 +39,7 @@
         "__type__": "ollama._types.GenerateResponse",
         "__data__": {
           "model": "llama3.2:3b-instruct-fp16",
-          "created_at": "2025-07-29T23:46:36.358611Z",
+          "created_at": "2025-09-03T17:34:23.477986Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -57,7 +57,7 @@
         "__type__": "ollama._types.GenerateResponse",
         "__data__": {
           "model": "llama3.2:3b-instruct-fp16",
-          "created_at": "2025-07-29T23:46:36.401272Z",
+          "created_at": "2025-09-03T17:34:23.520282Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -75,7 +75,7 @@
         "__type__": "ollama._types.GenerateResponse",
         "__data__": {
           "model": "llama3.2:3b-instruct-fp16",
-          "created_at": "2025-07-29T23:46:36.444321Z",
+          "created_at": "2025-09-03T17:34:23.561947Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -93,7 +93,7 @@
         "__type__": "ollama._types.GenerateResponse",
         "__data__": {
           "model": "llama3.2:3b-instruct-fp16",
-          "created_at": "2025-07-29T23:46:36.48795Z",
+          "created_at": "2025-09-03T17:34:23.603986Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -111,7 +111,7 @@
         "__type__": "ollama._types.GenerateResponse",
         "__data__": {
           "model": "llama3.2:3b-instruct-fp16",
-          "created_at": "2025-07-29T23:46:36.530158Z",
+          "created_at": "2025-09-03T17:34:23.646447Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -129,7 +129,7 @@
         "__type__": "ollama._types.GenerateResponse",
         "__data__": {
           "model": "llama3.2:3b-instruct-fp16",
-          "created_at": "2025-07-29T23:46:36.573318Z",
+          "created_at": "2025-09-03T17:34:23.688452Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -147,7 +147,7 @@
         "__type__": "ollama._types.GenerateResponse",
         "__data__": {
           "model": "llama3.2:3b-instruct-fp16",
-          "created_at": "2025-07-29T23:46:36.616297Z",
+          "created_at": "2025-09-03T17:34:23.730147Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -165,7 +165,7 @@
         "__type__": "ollama._types.GenerateResponse",
         "__data__": {
           "model": "llama3.2:3b-instruct-fp16",
-          "created_at": "2025-07-29T23:46:36.659527Z",
+          "created_at": "2025-09-03T17:34:23.772004Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -183,7 +183,7 @@
         "__type__": "ollama._types.GenerateResponse",
         "__data__": {
           "model": "llama3.2:3b-instruct-fp16",
-          "created_at": "2025-07-29T23:46:36.702422Z",
+          "created_at": "2025-09-03T17:34:23.813913Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -201,7 +201,7 @@
         "__type__": "ollama._types.GenerateResponse",
         "__data__": {
           "model": "llama3.2:3b-instruct-fp16",
-          "created_at": "2025-07-29T23:46:36.745894Z",
+          "created_at": "2025-09-03T17:34:23.856Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -219,7 +219,7 @@
         "__type__": "ollama._types.GenerateResponse",
         "__data__": {
           "model": "llama3.2:3b-instruct-fp16",
-          "created_at": "2025-07-29T23:46:36.788811Z",
+          "created_at": "2025-09-03T17:34:23.897939Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -237,7 +237,7 @@
         "__type__": "ollama._types.GenerateResponse",
         "__data__": {
           "model": "llama3.2:3b-instruct-fp16",
-          "created_at": "2025-07-29T23:46:36.831618Z",
+          "created_at": "2025-09-03T17:34:23.939953Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -255,7 +255,7 @@
         "__type__": "ollama._types.GenerateResponse",
         "__data__": {
           "model": "llama3.2:3b-instruct-fp16",
-          "created_at": "2025-07-29T23:46:36.874469Z",
+          "created_at": "2025-09-03T17:34:23.982033Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -273,7 +273,7 @@
         "__type__": "ollama._types.GenerateResponse",
         "__data__": {
           "model": "llama3.2:3b-instruct-fp16",
-          "created_at": "2025-07-29T23:46:36.917372Z",
+          "created_at": "2025-09-03T17:34:24.026067Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -291,7 +291,7 @@
         "__type__": "ollama._types.GenerateResponse",
         "__data__": {
           "model": "llama3.2:3b-instruct-fp16",
-          "created_at": "2025-07-29T23:46:36.960558Z",
+          "created_at": "2025-09-03T17:34:24.069083Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -309,7 +309,7 @@
         "__type__": "ollama._types.GenerateResponse",
         "__data__": {
           "model": "llama3.2:3b-instruct-fp16",
-          "created_at": "2025-07-29T23:46:37.004223Z",
+          "created_at": "2025-09-03T17:34:24.112349Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -327,15 +327,15 @@
         "__type__": "ollama._types.GenerateResponse",
         "__data__": {
           "model": "llama3.2:3b-instruct-fp16",
-          "created_at": "2025-07-29T23:46:37.046563Z",
+          "created_at": "2025-09-03T17:34:24.155424Z",
           "done": true,
           "done_reason": "stop",
-          "total_duration": 845522667,
-          "load_duration": 47784875,
+          "total_duration": 896931125,
+          "load_duration": 89697291,
           "prompt_eval_count": 511,
-          "prompt_eval_duration": 66135292,
+          "prompt_eval_duration": 83876750,
           "eval_count": 18,
-          "eval_duration": 730999291,
+          "eval_duration": 722156292,
           "response": "",
           "thinking": null,
           "context": null
diff --git a/tests/integration/recordings/responses/9e651e5fcfe2.json b/tests/integration/recordings/responses/9e651e5fcfe2.json
index f510f3a6e..6accc38fa 100644
--- a/tests/integration/recordings/responses/9e651e5fcfe2.json
+++ b/tests/integration/recordings/responses/9e651e5fcfe2.json
@@ -23,1560 +23,1560 @@
         "data": [
           {
             "embedding": [
-              -0.07449307,
-              0.027951928,
-              -0.026060246,
-              0.028483065,
-              -0.048791632,
-              -0.12451073,
-              -0.037688024,
-              0.041220777,
-              -0.048782747,
-              -0.027790926,
-              -0.092681944,
-              0.052037407,
-              0.08095267,
-              0.023185384,
-              0.10326959,
-              -0.061368585,
-              -0.046598755,
-              0.031270534,
-              -0.009005052,
-              -0.111023106,
-              -0.020844607,
-              0.0365254,
-              -0.013400216,
-              0.007603707,
-              0.019496046,
-              0.004319023,
-              -0.012447805,
-              -0.04465679,
-              -9.841689e-05,
-              0.027754154,
-              -0.052329242,
-              0.06209096,
-              0.019665342,
-              0.022347461,
-              -0.018723859,
-              0.06644313,
-              -0.037004728,
-              -0.09444654,
-              -0.050066303,
-              -0.016110398,
-              -0.089189,
-              0.07288855,
-              -0.07318861,
-              -0.027522061,
-              -0.066324726,
-              0.015509758,
-              -0.0042457446,
-              -0.03252355,
-              -0.035831843,
-              -0.026272034,
-              -0.09124794,
-              0.022858502,
-              -0.056080233,
-              -0.103500344,
-              -0.023473406,
-              -0.016338969,
-              0.06030296,
-              -0.0120581165,
-              -0.009729192,
-              -0.15205215,
-              -0.07315331,
-              0.022419574,
-              0.08820763,
-              0.062114313,
-              -0.04762322,
-              -0.05541787,
-              -0.036066234,
-              0.017759612,
-              0.08481655,
-              -0.05053196,
-              -0.09962307,
-              -0.029446559,
-              -0.0021580544,
-              0.08140918,
-              0.03067005,
-              -0.12171203,
-              0.046307985,
-              0.005336976,
-              -0.0076234527,
-              0.049193826,
-              0.0009906195,
-              0.018153494,
-              -0.056338865,
-              0.0908365,
-              0.03551559,
-              -0.062860996,
-              0.0518074,
-              0.071721554,
-              -0.045374844,
-              0.009667945,
-              0.030433532,
-              -0.05885662,
-              0.03727969,
-              0.0041508353,
-              -0.014315319,
-              0.062025562,
-              0.026427185,
-              -0.054075267,
-              -0.04068261,
-              0.010823117,
-              -0.0032635517,
-              -0.077452675,
-              0.055320397,
-              0.011208057,
-              0.049934894,
-              0.011137414,
-              0.044191435,
-              -0.08876309,
-              0.04791029,
-              -0.029189063,
-              -0.021350788,
-              -0.058955453,
-              -0.0060216836,
-              -0.03632618,
-              0.045660086,
-              0.07383026,
-              -0.0043607675,
-              0.07589455,
-              -0.0005572796,
-              0.0063479175,
-              0.019868094,
-              -0.008913204,
-              -0.007406098,
-              -0.014949887,
-              0.012402974,
-              0.0032334107,
-              -0.009926773,
-              1.525028e-33,
-              -0.03028342,
-              -0.05685508,
-              -0.009895807,
-              0.022367567,
-              0.05730986,
-              -0.018540345,
-              0.078504145,
-              -0.0036667767,
-              -0.031108411,
-              -0.0333193,
-              0.019241981,
-              0.037178107,
-              0.030919006,
-              0.13797465,
-              -0.0026615814,
-              0.00626278,
-              0.023982357,
-              0.02884277,
-              0.011378185,
-              0.003017119,
-              0.009753849,
-              -0.010310673,
-              0.025471263,
-              0.04401538,
-              0.008264411,
-              -0.023294613,
-              -0.02543755,
-              -0.022366447,
-              0.016387654,
-              0.0039752712,
-              -0.06696038,
-              -0.059061013,
-              -0.026061574,
-              0.025640154,
-              -0.024006085,
-              -0.015399723,
-              -0.013001841,
-              -0.08129873,
-              0.029804442,
-              -0.0047991537,
-              -0.021450322,
-              0.025900915,
-              0.0044511827,
-              -0.013483615,
-              -0.014909116,
-              0.0462146,
-              -0.0003121182,
-              0.017148994,
-              -0.121784754,
-              0.02112702,
-              -0.009525965,
-              -0.035118576,
-              0.08002826,
-              0.08460527,
-              0.0020599784,
-              0.051269483,
-              0.052960806,
-              0.032629956,
-              -0.04172868,
-              -0.055450223,
-              0.014603321,
-              0.034458637,
-              0.095163934,
-              0.004940245,
-              0.038055513,
-              0.064066105,
-              0.037084144,
-              0.117337674,
-              0.04749384,
-              0.062727995,
-              -0.043873455,
-              0.03940274,
-              -0.041489355,
-              0.045208808,
-              -0.005673402,
-              0.028298998,
-              0.035084575,
-              -0.11161549,
-              0.06762898,
-              0.025535477,
-              -0.016374003,
-              -0.023129083,
-              0.025620162,
-              -0.034770124,
-              -0.014257682,
-              -0.04390796,
-              -0.006200332,
-              0.04474309,
-              -0.0072586853,
-              -0.038618132,
-              -0.06358841,
-              -0.05306046,
-              0.044273335,
-              0.024379753,
-              -0.013372279,
-              -5.162782e-33,
-              -0.01137177,
-              -0.0038401731,
-              -0.046551347,
-              0.0008104445,
-              -0.09031019,
-              -0.06308892,
-              0.009730625,
-              0.00016963277,
-              0.043050725,
-              0.022217263,
-              -0.04910803,
-              -0.08518463,
-              0.11067566,
-              0.017678969,
-              0.05608959,
-              0.037217773,
-              -0.11399499,
-              0.011297513,
-              0.010620838,
-              0.035015386,
-              -0.074024685,
-              0.015696649,
-              -0.032765005,
-              -0.06483389,
-              -0.010750767,
-              -0.04140643,
-              -0.09720136,
-              -0.07026117,
-              0.021630345,
-              0.050262064,
-              -0.01796077,
-              0.03200972,
-              -0.03785568,
-              0.031321034,
-              0.07589453,
-              -0.00090503925,
-              0.035030376,
-              -0.06255562,
-              -0.006917408,
-              -0.026772378,
-              0.116618186,
-              0.050241243,
-              0.06521753,
-              0.06511879,
-              0.025131317,
-              0.031826124,
-              -0.059561018,
-              0.08187109,
-              -0.027979838,
-              -0.04847714,
-              -0.034865912,
-              0.03014605,
-              0.035055622,
-              -0.018549602,
-              -0.038735136,
-              -0.04888224,
-              0.02115399,
-              0.08302824,
-              -0.06755719,
-              -0.053532355,
-              -0.08100928,
-              -0.06342726,
-              0.01134464,
-              0.020696267,
-              -0.06569805,
-              0.02215437,
-              -0.107759416,
-              -0.011531022,
-              -0.052023083,
-              -0.15014696,
-              0.11523642,
-              -0.030628026,
-              -0.018693298,
-              0.05293893,
-              -0.066821866,
-              0.040430665,
-              -0.028188393,
-              -0.016445817,
-              -0.025638778,
-              0.065690935,
-              0.08657344,
-              0.010824949,
-              -0.038753588,
-              0.027475704,
-              -0.06717005,
-              -0.015260354,
-              -0.05266386,
-              0.02095537,
-              0.0314708,
-              0.0028445746,
-              0.010277572,
-              0.04829579,
-              0.02202069,
-              0.01687653,
-              -0.022683937,
-              -4.070874e-08,
-              -0.0068096938,
-              0.0014505221,
-              0.0538663,
-              0.015128973,
-              0.017920515,
-              0.08120387,
-              0.0054989015,
-              -0.037012283,
-              -0.018747889,
-              0.051839896,
-              -0.01485388,
-              -0.04494068,
-              -0.092807755,
-              -0.07264074,
-              -0.0042969217,
-              0.14135452,
-              -0.022500824,
-              -0.0304894,
-              0.047428515,
-              0.06622567,
-              0.07943656,
-              -0.022952257,
-              -0.053804893,
-              0.10411883,
-              -0.08483286,
-              -0.03217885,
-              0.058469053,
-              0.0037233643,
-              -0.029061304,
-              -0.093473285,
-              -0.0041507743,
-              -0.035646018,
-              0.007173623,
-              0.040360082,
-              0.04552733,
-              0.018294893,
-              0.021491595,
-              -0.05992459,
-              -0.02806498,
-              0.018094081,
-              -0.02130419,
-              -0.003922083,
-              0.012168674,
-              -0.016664261,
-              0.021637399,
-              0.02437987,
-              -0.044396017,
-              -0.047764827,
-              -0.057788223,
-              -0.0577456,
-              -0.0060329973,
-              -0.010019745,
-              -0.016522264,
-              -0.049803738,
-              0.020510556,
-              0.07658504,
-              -0.1371851,
-              0.008845452,
-              -0.032027397,
-              0.035882812,
-              -0.0063640904,
-              0.11211461,
-              0.15690215,
-              -0.00068062195
+              -0.07448108,
+              0.027982691,
+              -0.025962545,
+              0.028414156,
+              -0.04874927,
+              -0.124489374,
+              -0.03775365,
+              0.041172747,
+              -0.048783444,
+              -0.027774421,
+              -0.09272271,
+              0.051921174,
+              0.08087506,
+              0.023085767,
+              0.103185095,
+              -0.06142812,
+              -0.046623003,
+              0.031264473,
+              -0.009095788,
+              -0.110987656,
+              -0.020735977,
+              0.036462996,
+              -0.013348663,
+              0.007442654,
+              0.019446686,
+              0.0043880027,
+              -0.0123794135,
+              -0.04474342,
+              -0.00010696763,
+              0.027796188,
+              -0.05249273,
+              0.062042117,
+              0.019623421,
+              0.022298045,
+              -0.01876838,
+              0.06636658,
+              -0.036940884,
+              -0.09439301,
+              -0.04989112,
+              -0.016055813,
+              -0.08934105,
+              0.07278765,
+              -0.073312856,
+              -0.027571253,
+              -0.06639977,
+              0.015506035,
+              -0.004176694,
+              -0.032542672,
+              -0.035769954,
+              -0.026245229,
+              -0.09129098,
+              0.022831371,
+              -0.05601971,
+              -0.103505865,
+              -0.023430603,
+              -0.01617043,
+              0.060298156,
+              -0.011999374,
+              -0.00982143,
+              -0.15203232,
+              -0.07311755,
+              0.022391053,
+              0.08800625,
+              0.062195398,
+              -0.04764835,
+              -0.05545306,
+              -0.036078423,
+              0.017782934,
+              0.08492913,
+              -0.050706394,
+              -0.09958507,
+              -0.029495796,
+              -0.002121337,
+              0.08148674,
+              0.030521393,
+              -0.12159759,
+              0.04639748,
+              0.0054555144,
+              -0.0076237656,
+              0.04930283,
+              0.001018987,
+              0.01823945,
+              -0.056388717,
+              0.09080432,
+              0.03544767,
+              -0.062846325,
+              0.05177355,
+              0.07175976,
+              -0.045391884,
+              0.009686718,
+              0.030302709,
+              -0.058896482,
+              0.03719664,
+              0.004174063,
+              -0.014313601,
+              0.06214871,
+              0.026443055,
+              -0.054081496,
+              -0.04056011,
+              0.010876058,
+              -0.0033277434,
+              -0.07736001,
+              0.055489365,
+              0.011366925,
+              0.049955327,
+              0.011093621,
+              0.044155005,
+              -0.08873286,
+              0.04789806,
+              -0.029256178,
+              -0.021238709,
+              -0.059048988,
+              -0.006010105,
+              -0.036286995,
+              0.045776833,
+              0.07393597,
+              -0.0043319017,
+              0.07591234,
+              -0.0006300352,
+              0.0063326987,
+              0.019833053,
+              -0.008920521,
+              -0.0074224886,
+              -0.014964156,
+              0.012450781,
+              0.003317517,
+              -0.009942644,
+              1.525195e-33,
+              -0.030182399,
+              -0.056817565,
+              -0.009954876,
+              0.02231213,
+              0.057156544,
+              -0.018560076,
+              0.07843683,
+              -0.003509288,
+              -0.031122614,
+              -0.0333474,
+              0.019342642,
+              0.03716782,
+              0.030942772,
+              0.13801146,
+              -0.0026788223,
+              0.0060844175,
+              0.024037478,
+              0.028806396,
+              0.0114514725,
+              0.0028755309,
+              0.009741409,
+              -0.010365574,
+              0.025636459,
+              0.04402703,
+              0.00824972,
+              -0.023288164,
+              -0.025415357,
+              -0.02247272,
+              0.016395057,
+              0.0039686435,
+              -0.06683203,
+              -0.058984432,
+              -0.026139224,
+              0.02571613,
+              -0.023981044,
+              -0.01542635,
+              -0.013025425,
+              -0.08132036,
+              0.029904919,
+              -0.0048653325,
+              -0.02163821,
+              0.025880665,
+              0.004492511,
+              -0.013551861,
+              -0.014834658,
+              0.046109095,
+              -0.00031146017,
+              0.016851023,
+              -0.12182429,
+              0.021024965,
+              -0.009434213,
+              -0.03510208,
+              0.080137864,
+              0.08463277,
+              0.0019426581,
+              0.051176246,
+              0.05314091,
+              0.032667853,
+              -0.041880205,
+              -0.05545038,
+              0.014655727,
+              0.034564327,
+              0.09517278,
+              0.0048721586,
+              0.038064517,
+              0.064016655,
+              0.036886543,
+              0.11732628,
+              0.04750395,
+              0.062849574,
+              -0.043793496,
+              0.039535545,
+              -0.0414883,
+              0.045276705,
+              -0.005626682,
+              0.028326502,
+              0.03510831,
+              -0.11158364,
+              0.067508236,
+              0.025473768,
+              -0.016454473,
+              -0.023138152,
+              0.02560681,
+              -0.03489655,
+              -0.0143142305,
+              -0.043763783,
+              -0.006103266,
+              0.044694975,
+              -0.007177529,
+              -0.038755096,
+              -0.06350946,
+              -0.05295245,
+              0.044151388,
+              0.024555689,
+              -0.01345332,
+              -5.1627547e-33,
+              -0.011461753,
+              -0.003969141,
+              -0.04658726,
+              0.0008026091,
+              -0.090269305,
+              -0.0629358,
+              0.009687034,
+              0.00015354449,
+              0.043152034,
+              0.022057066,
+              -0.049155302,
+              -0.08511033,
+              0.110782035,
+              0.017681966,
+              0.056186423,
+              0.03724774,
+              -0.114085265,
+              0.011197734,
+              0.010572792,
+              0.03503156,
+              -0.07397689,
+              0.0156148635,
+              -0.032688703,
+              -0.06490581,
+              -0.010675779,
+              -0.041401856,
+              -0.097037986,
+              -0.07025277,
+              0.021750104,
+              0.05030694,
+              -0.017832309,
+              0.032031614,
+              -0.03788665,
+              0.03141082,
+              0.07613352,
+              -0.0007763451,
+              0.034961626,
+              -0.06256205,
+              -0.006801991,
+              -0.026741587,
+              0.11656076,
+              0.05023973,
+              0.06515106,
+              0.06511257,
+              0.025219081,
+              0.03180813,
+              -0.05966658,
+              0.08190675,
+              -0.028054262,
+              -0.048548922,
+              -0.03486897,
+              0.03020514,
+              0.035033725,
+              -0.018610824,
+              -0.038684692,
+              -0.048875436,
+              0.021133669,
+              0.08319505,
+              -0.06746284,
+              -0.053462982,
+              -0.08098418,
+              -0.06340421,
+              0.011191566,
+              0.020785637,
+              -0.06575731,
+              0.02211741,
+              -0.10775702,
+              -0.011597437,
+              -0.051947355,
+              -0.1501959,
+              0.11516611,
+              -0.030521782,
+              -0.018723903,
+              0.052845538,
+              -0.06679985,
+              0.040416736,
+              -0.028146135,
+              -0.01644884,
+              -0.025731068,
+              0.06570538,
+              0.0866128,
+              0.010937938,
+              -0.03865133,
+              0.027389226,
+              -0.06712724,
+              -0.015267271,
+              -0.05265448,
+              0.020899015,
+              0.031420153,
+              0.002802588,
+              0.010436373,
+              0.048363067,
+              0.021981295,
+              0.01690293,
+              -0.022728851,
+              -4.0744272e-08,
+              -0.0065167644,
+              0.0014059767,
+              0.05391456,
+              0.015178632,
+              0.018086514,
+              0.08112959,
+              0.005525823,
+              -0.037069544,
+              -0.01871401,
+              0.051793523,
+              -0.014797383,
+              -0.044994324,
+              -0.09279006,
+              -0.07259356,
+              -0.004214306,
+              0.14136177,
+              -0.022566888,
+              -0.030480398,
+              0.047431417,
+              0.06623071,
+              0.07947818,
+              -0.023033215,
+              -0.05389834,
+              0.10418305,
+              -0.08498801,
+              -0.032223985,
+              0.058419,
+              0.0036608635,
+              -0.02912376,
+              -0.09348434,
+              -0.004131768,
+              -0.035598896,
+              0.007222825,
+              0.040373847,
+              0.04553802,
+              0.018402338,
+              0.021517321,
+              -0.06000489,
+              -0.028075347,
+              0.018188315,
+              -0.021463133,
+              -0.003939297,
+              0.012185079,
+              -0.016664179,
+              0.021595497,
+              0.02443412,
+              -0.044382285,
+              -0.047587246,
+              -0.057701204,
+              -0.057771184,
+              -0.0060019926,
+              -0.0099875815,
+              -0.016420204,
+              -0.049889106,
+              0.020464808,
+              0.076619074,
+              -0.13720629,
+              0.00883673,
+              -0.032044746,
+              0.035911836,
+              -0.006365476,
+              0.11197782,
+              0.15684035,
+              -0.00079191517
             ],
             "index": 0,
             "object": "embedding"
           },
           {
             "embedding": [
-              -0.0011845493,
-              0.013266878,
-              0.03609042,
-              0.047072034,
-              -0.008352954,
-              -0.0122682275,
-              0.017132185,
-              -0.014473443,
-              -0.06756814,
-              0.013247742,
-              -0.07102911,
-              0.021882167,
-              0.048140433,
-              -0.06663474,
-              -0.029968074,
-              0.0146699,
-              0.042884044,
-              0.031221654,
-              -0.06519409,
-              -0.07393237,
-              0.017278695,
-              -0.015300585,
-              -0.052712914,
-              0.063471325,
-              0.005261093,
-              0.026454475,
-              0.036750335,
-              0.048913635,
-              -0.0043701017,
-              0.010404101,
-              -0.00899726,
-              -0.07210333,
-              0.0508586,
-              0.017407527,
-              -0.06129139,
-              -0.010193845,
-              -0.06584968,
-              0.06993935,
-              0.028308308,
-              -0.037110034,
-              -0.05215759,
-              -0.07382648,
-              0.023526125,
-              -0.025393125,
-              0.061842058,
-              0.115891784,
-              -0.08308006,
-              -0.088689096,
-              -0.045506753,
-              0.021837203,
-              -0.12331834,
-              -0.02362818,
-              -0.0015319391,
-              -0.013698963,
-              -0.056246556,
-              0.088307984,
-              0.03336545,
-              0.051764306,
-              0.007479521,
-              -0.025192864,
-              0.023220513,
-              -0.15522671,
-              -0.010666595,
-              0.016220143,
-              0.034197047,
-              0.020141115,
-              -0.02228778,
-              0.050806805,
-              -0.0054491716,
-              -0.04010184,
-              -0.020381475,
-              0.101001725,
-              0.0030050839,
-              0.066215865,
-              0.040159617,
-              -0.019853236,
-              -0.059809405,
-              -0.06364045,
-              0.08465813,
-              0.023686064,
-              -0.017249556,
-              -0.005799871,
-              -0.02653176,
-              0.092887536,
-              0.048390586,
-              -0.068729825,
-              -0.022274029,
-              -0.01541849,
-              -0.011106163,
-              -0.017558511,
-              0.025275087,
-              -0.039419167,
-              -0.0013605524,
-              -0.040891252,
-              -0.03210248,
-              0.04157447,
-              0.009033561,
-              -0.1375085,
-              0.0302998,
-              0.058144268,
-              0.010614374,
-              0.09235676,
-              -0.035921294,
-              -0.0035614434,
-              0.056328356,
-              -0.003870427,
-              0.035673276,
-              0.014662149,
-              0.106206276,
-              -0.13588227,
-              -0.05821538,
-              0.045162544,
-              -0.069754794,
-              -0.05015353,
-              -0.04111925,
-              0.012403055,
-              -0.040746994,
-              0.028958116,
-              -0.022099715,
-              0.08722799,
-              -0.009660439,
-              -0.02553313,
-              0.011424866,
-              0.03355087,
-              0.021934206,
-              -0.08680693,
-              -0.07095944,
-              1.7813879e-33,
-              -0.041105658,
-              -0.10025705,
-              0.0064499485,
-              0.0037606815,
-              0.029249465,
-              -0.08724099,
-              -0.042814564,
-              -0.065751046,
-              0.01803772,
-              0.022158695,
-              -0.03251517,
-              -0.023311423,
-              0.021312106,
-              0.09513294,
-              0.08325624,
-              0.042880148,
-              0.0038685675,
-              0.037857197,
-              0.019852297,
-              -0.033418458,
-              0.10195742,
-              -0.014400936,
-              0.021739826,
-              -0.02148512,
-              -0.0074825305,
-              0.046198383,
-              0.06668454,
-              0.064343214,
-              -0.010934716,
-              0.016144961,
-              0.030755335,
-              0.017353602,
-              -0.07630945,
-              0.02787306,
-              0.053113766,
-              -0.061461076,
-              0.0071374113,
-              0.005771103,
-              0.05516302,
-              0.06909889,
-              -0.027851412,
-              -0.045708418,
-              0.09470951,
-              -0.029809639,
-              -0.0450938,
-              0.017276933,
-              0.016100975,
-              -0.06285931,
-              -0.045057483,
-              -0.045170058,
-              -0.005335317,
-              -0.019424338,
-              -0.04570747,
-              -0.026393251,
-              0.012418678,
-              0.08569869,
-              -0.0033635902,
-              0.0035900169,
-              -0.0119453,
-              0.00669384,
-              0.033529036,
-              -0.0011266738,
-              0.042164367,
-              0.055857047,
-              0.017889913,
-              0.07058827,
-              0.1045626,
-              0.06235585,
-              0.044550747,
-              -0.0027960828,
-              0.025605692,
-              -0.0020889128,
-              0.04055551,
-              -0.012159332,
-              0.05225918,
-              -0.0015176827,
-              0.053381234,
-              -0.007923704,
-              -0.028188763,
-              0.018261831,
-              -0.04613833,
-              -0.043358967,
-              -0.026370697,
-              -0.110958725,
-              0.008541168,
-              0.0056487373,
-              -0.034883622,
-              -0.05653664,
-              -0.030319579,
-              0.0053387904,
-              -0.08992194,
-              -0.0313816,
-              -0.06223965,
-              0.09973829,
-              -0.032821275,
-              -3.3483957e-33,
-              -0.027244257,
-              0.0105603505,
-              -0.022050971,
-              0.12673026,
-              0.031783704,
-              0.03317703,
-              -0.0515448,
-              -0.030908447,
-              -0.046472445,
-              -0.0022395607,
-              -0.056245685,
-              0.007864777,
-              0.06504396,
-              0.038899444,
-              -0.06833807,
-              0.07752775,
-              -0.0679177,
-              0.0064592003,
-              -0.04089174,
-              0.037315972,
-              -0.072344616,
-              0.0632527,
-              0.014409584,
-              -0.058710277,
-              0.030982593,
-              -0.019495374,
-              -0.07455309,
-              0.03753421,
-              -0.026329445,
-              0.020833284,
-              -0.031074857,
-              0.0059377784,
-              -0.047568988,
-              -0.010903666,
-              0.0353143,
-              0.054745093,
-              0.070084415,
-              -0.056538608,
-              -0.017365856,
-              0.07531329,
-              0.05383335,
-              0.0026772518,
-              -0.07281682,
-              -0.0755028,
-              -0.012854154,
-              0.011568236,
-              -0.08559846,
-              -0.0015188414,
-              0.036308214,
-              -0.062071785,
-              -0.0050686314,
-              0.023929637,
-              -0.008095938,
-              -0.03611622,
-              -0.034135558,
-              0.00030859755,
-              -0.057838384,
-              0.021293137,
-              0.056338087,
-              0.10234655,
-              -0.076837495,
-              -0.096356064,
-              0.029131278,
-              0.001004221,
-              -0.010381513,
-              0.055196848,
-              -0.021404155,
-              0.048181012,
-              -0.009104861,
-              0.0044043055,
-              0.002918874,
-              0.04924864,
-              -0.049854394,
-              0.0710729,
-              -0.048272487,
-              -0.07305892,
-              -0.026601639,
-              -0.06437188,
-              -0.034527853,
-              -0.005951345,
-              0.018712144,
-              -0.077793844,
-              -0.004720919,
-              0.045758806,
-              -0.04379248,
-              0.0121709565,
-              0.024249863,
-              0.03526606,
-              0.0062171146,
-              -0.08686959,
-              -0.014602414,
-              0.048708588,
-              -0.069689915,
-              0.04758633,
-              -0.096403375,
-              -3.885784e-08,
-              0.020160066,
-              -0.0060397363,
-              0.10671191,
-              -0.0073609953,
-              0.1113298,
-              0.07655439,
-              -0.08989872,
-              0.10998299,
-              -0.060445502,
-              -0.061076436,
-              0.046950154,
-              -0.016442984,
-              0.016685285,
-              -0.012291731,
-              0.0034336923,
-              0.031462166,
-              0.018294413,
-              0.037974738,
-              -0.00058906816,
-              0.0199562,
-              0.11084883,
-              -0.02309312,
-              0.04923742,
-              -0.04922855,
-              0.03767353,
-              -0.102210835,
-              0.0213937,
-              0.0049329796,
-              -0.026793618,
-              0.04147558,
-              -0.03789522,
-              0.029213108,
-              0.037435144,
-              -0.01592795,
-              0.095913775,
-              0.14336638,
-              0.049839716,
-              -0.112729535,
-              -0.06265318,
-              -0.03857694,
-              -0.03080216,
-              0.08552668,
-              -0.04825808,
-              0.04012672,
-              0.014288913,
-              -0.021062234,
-              0.048812427,
-              -0.05777949,
-              0.009785274,
-              0.0027342755,
-              0.07962631,
-              0.017954743,
-              0.022360845,
-              0.08985347,
-              0.066461965,
-              0.021893978,
-              0.059404697,
-              -0.061141845,
-              0.015304087,
-              0.08356255,
-              -0.0017417142,
-              0.08870375,
-              -0.027489252,
-              -0.060387574
+              -0.0012923438,
+              0.013419649,
+              0.03603258,
+              0.046982195,
+              -0.008386184,
+              -0.012245008,
+              0.017257063,
+              -0.014495833,
+              -0.06755615,
+              0.013220825,
+              -0.071046636,
+              0.022029007,
+              0.04805814,
+              -0.06659013,
+              -0.030023778,
+              0.014715108,
+              0.04294596,
+              0.031195298,
+              -0.06522679,
+              -0.07396746,
+              0.017329818,
+              -0.0151756415,
+              -0.052758723,
+              0.06344977,
+              0.005364444,
+              0.02631366,
+              0.03665044,
+              0.048812985,
+              -0.0044375616,
+              0.0103826355,
+              -0.0089511005,
+              -0.07216287,
+              0.05088121,
+              0.017377803,
+              -0.061182447,
+              -0.010244597,
+              -0.06587784,
+              0.069840916,
+              0.028359821,
+              -0.037131228,
+              -0.052071016,
+              -0.07370394,
+              0.0233667,
+              -0.02532014,
+              0.06171828,
+              0.11584273,
+              -0.08307468,
+              -0.08872316,
+              -0.04554565,
+              0.02177065,
+              -0.12324151,
+              -0.023568366,
+              -0.0015541487,
+              -0.013532973,
+              -0.056209136,
+              0.0880576,
+              0.03321554,
+              0.05171784,
+              0.0074756956,
+              -0.025275769,
+              0.023162214,
+              -0.15517598,
+              -0.010777206,
+              0.016303454,
+              0.034188252,
+              0.020134093,
+              -0.022240352,
+              0.050957076,
+              -0.005396301,
+              -0.04007687,
+              -0.020301744,
+              0.10113998,
+              0.002977471,
+              0.06617704,
+              0.040134214,
+              -0.02005319,
+              -0.059682623,
+              -0.06369068,
+              0.08473604,
+              0.023557685,
+              -0.017191878,
+              -0.005820709,
+              -0.026404407,
+              0.09280466,
+              0.04844145,
+              -0.06875489,
+              -0.022161635,
+              -0.015402431,
+              -0.0111024445,
+              -0.017707076,
+              0.025355583,
+              -0.039296508,
+              -0.001362202,
+              -0.040884525,
+              -0.03204941,
+              0.04150212,
+              0.008948646,
+              -0.13776794,
+              0.030302526,
+              0.058231197,
+              0.010572606,
+              0.09247389,
+              -0.035872795,
+              -0.0036602807,
+              0.056347203,
+              -0.003996722,
+              0.035537403,
+              0.014696888,
+              0.10615937,
+              -0.13590123,
+              -0.05810754,
+              0.04527657,
+              -0.06982519,
+              -0.049982276,
+              -0.041045085,
+              0.01247287,
+              -0.040934183,
+              0.028955987,
+              -0.02226216,
+              0.08722953,
+              -0.009548719,
+              -0.025511682,
+              0.0114325285,
+              0.03363939,
+              0.021809513,
+              -0.08675585,
+              -0.07089411,
+              1.7909231e-33,
+              -0.04121751,
+              -0.1001688,
+              0.006345352,
+              0.0037210584,
+              0.029166285,
+              -0.0872215,
+              -0.04271259,
+              -0.06566409,
+              0.017946582,
+              0.022238955,
+              -0.03249184,
+              -0.02349789,
+              0.021466883,
+              0.09511927,
+              0.08346572,
+              0.042806614,
+              0.0038908664,
+              0.037915263,
+              0.020043708,
+              -0.033399176,
+              0.10208849,
+              -0.014397545,
+              0.021684645,
+              -0.021582458,
+              -0.0074115414,
+              0.046073515,
+              0.06664795,
+              0.06434497,
+              -0.010910654,
+              0.016172478,
+              0.030913299,
+              0.017434347,
+              -0.0762684,
+              0.027927354,
+              0.053165767,
+              -0.061656844,
+              0.007082498,
+              0.0057526245,
+              0.055203717,
+              0.069314696,
+              -0.027693065,
+              -0.045786254,
+              0.094618365,
+              -0.02984729,
+              -0.045069296,
+              0.01723317,
+              0.016129777,
+              -0.06281533,
+              -0.045081936,
+              -0.045089465,
+              -0.0053253355,
+              -0.019320533,
+              -0.045810748,
+              -0.02639149,
+              0.012412514,
+              0.08566385,
+              -0.0034776065,
+              0.0035142878,
+              -0.012017715,
+              0.006649936,
+              0.033606175,
+              -0.0012646043,
+              0.042252455,
+              0.055928096,
+              0.017948387,
+              0.07064788,
+              0.10451079,
+              0.062350754,
+              0.04458121,
+              -0.0028225682,
+              0.02566386,
+              -0.0021405003,
+              0.040477417,
+              -0.012259745,
+              0.052335545,
+              -0.0017080541,
+              0.05346329,
+              -0.007733562,
+              -0.028276777,
+              0.018282998,
+              -0.046343774,
+              -0.043290336,
+              -0.026471136,
+              -0.11104024,
+              0.008576623,
+              0.005548108,
+              -0.034847535,
+              -0.056416124,
+              -0.030293388,
+              0.0053394907,
+              -0.09004081,
+              -0.03141982,
+              -0.062330373,
+              0.09981983,
+              -0.032840475,
+              -3.3540373e-33,
+              -0.027300175,
+              0.010525057,
+              -0.021980286,
+              0.12664026,
+              0.031588834,
+              0.033247624,
+              -0.05148502,
+              -0.03101089,
+              -0.0465964,
+              -0.0022529345,
+              -0.056195565,
+              0.007953736,
+              0.064945616,
+              0.03884713,
+              -0.06837888,
+              0.077476665,
+              -0.06788635,
+              0.0064428714,
+              -0.040736765,
+              0.037416343,
+              -0.07232494,
+              0.063321635,
+              0.014398016,
+              -0.05871896,
+              0.031005096,
+              -0.019561818,
+              -0.07452502,
+              0.037396118,
+              -0.026255993,
+              0.020780139,
+              -0.031075457,
+              0.0058948854,
+              -0.047562398,
+              -0.010866235,
+              0.0352409,
+              0.0549852,
+              0.07012556,
+              -0.056673322,
+              -0.017415406,
+              0.07528239,
+              0.05387259,
+              0.0028653517,
+              -0.07284915,
+              -0.07543174,
+              -0.012900278,
+              0.011457189,
+              -0.08563738,
+              -0.0015463261,
+              0.036361244,
+              -0.062004283,
+              -0.0050084046,
+              0.023846988,
+              -0.008083734,
+              -0.03593437,
+              -0.034260865,
+              0.000298229,
+              -0.0578704,
+              0.021156322,
+              0.056237947,
+              0.102285825,
+              -0.07694436,
+              -0.096381366,
+              0.029115336,
+              0.001019501,
+              -0.010235284,
+              0.055199094,
+              -0.021333022,
+              0.04801045,
+              -0.008948923,
+              0.0043332377,
+              0.002985581,
+              0.049172573,
+              -0.049805593,
+              0.07117998,
+              -0.04823976,
+              -0.072981454,
+              -0.026498413,
+              -0.06437876,
+              -0.0346269,
+              -0.0060303714,
+              0.018713593,
+              -0.07784192,
+              -0.0046854415,
+              0.04578587,
+              -0.043880597,
+              0.012154217,
+              0.024205454,
+              0.0352363,
+              0.0063410155,
+              -0.086736806,
+              -0.014489626,
+              0.048670504,
+              -0.06944819,
+              0.047556538,
+              -0.096405424,
+              -3.8881783e-08,
+              0.020024363,
+              -0.0060733794,
+              0.10675529,
+              -0.0072445725,
+              0.11130468,
+              0.0766799,
+              -0.089739904,
+              0.10989663,
+              -0.060538583,
+              -0.061066266,
+              0.046883732,
+              -0.016365182,
+              0.016547771,
+              -0.012390388,
+              0.0035057077,
+              0.031388927,
+              0.018324051,
+              0.038030062,
+              -0.0005554988,
+              0.019816065,
+              0.110884875,
+              -0.023082083,
+              0.049298774,
+              -0.049228016,
+              0.03771876,
+              -0.10209589,
+              0.021328293,
+              0.0048561115,
+              -0.026669646,
+              0.04161308,
+              -0.037887473,
+              0.029118432,
+              0.03738528,
+              -0.015714107,
+              0.0959638,
+              0.1434109,
+              0.049922757,
+              -0.11274395,
+              -0.06264596,
+              -0.038560014,
+              -0.03071335,
+              0.08555022,
+              -0.048136428,
+              0.0401538,
+              0.014374478,
+              -0.021280114,
+              0.04872567,
+              -0.057720494,
+              0.009963986,
+              0.002822142,
+              0.079809405,
+              0.017903175,
+              0.022365756,
+              0.08987974,
+              0.06651197,
+              0.022014199,
+              0.059419304,
+              -0.06117766,
+              0.015350715,
+              0.08376493,
+              -0.0017018274,
+              0.08864588,
+              -0.027652979,
+              -0.060420066
             ],
             "index": 1,
             "object": "embedding"
           },
           {
             "embedding": [
-              -0.01909185,
-              0.08210908,
-              -0.031697396,
-              -0.037725717,
-              -0.013948411,
-              -0.15075137,
-              -0.054330785,
-              0.013774222,
-              0.022384442,
-              0.025810372,
-              -0.018899407,
-              0.016055057,
-              0.04682177,
-              -0.009026702,
-              0.042360768,
-              0.015625892,
-              -0.08302362,
-              0.01837326,
-              -0.016616724,
-              -0.032981716,
-              -0.021160135,
-              -0.04206737,
-              -0.10867114,
-              0.019524219,
-              -0.0218146,
-              0.14237456,
-              -0.0013471643,
-              -0.058096632,
-              0.005461365,
-              -0.03999384,
-              0.012291773,
-              -0.014425554,
-              0.10419223,
-              0.0867777,
-              -0.07383953,
-              0.031295475,
-              0.077625275,
-              -0.041881,
-              -0.092624,
-              0.01998734,
-              -0.095912896,
-              0.063472316,
-              0.003484427,
-              0.038539667,
-              -0.022530979,
-              0.04934113,
-              -0.026355578,
-              -0.049568307,
-              -0.013252214,
-              0.012179733,
-              -0.11694328,
-              0.045149647,
-              -0.029160414,
-              0.025387803,
-              0.042368047,
-              0.070710085,
-              0.070657425,
-              0.0035213856,
-              -0.06036566,
-              0.042079538,
-              0.016191904,
-              -0.07189093,
-              0.01456738,
-              -0.0062431092,
-              0.029964449,
-              0.04743292,
-              0.011312341,
-              0.013767268,
-              0.0437025,
-              -0.021806497,
-              0.022327632,
-              0.047793407,
-              -0.040208474,
-              0.09488345,
-              0.031709157,
-              0.013329832,
-              -0.039763663,
-              -0.021771243,
-              0.028142115,
-              -0.034374766,
-              0.019633956,
-              0.04357714,
-              -0.042946506,
-              0.054137547,
-              0.02298205,
-              -0.056623355,
-              0.016670695,
-              -0.026936218,
-              -0.039648514,
-              0.022648802,
-              0.074515395,
-              -0.014122732,
-              -0.008389847,
-              0.008296867,
-              -0.024172261,
-              -0.020115776,
-              0.024380524,
-              -0.025786858,
-              0.103464104,
-              -0.016478091,
-              0.052223783,
-              0.043333497,
-              0.024358233,
-              0.016022986,
-              -0.05042404,
-              -0.11150191,
-              0.05203884,
-              -0.017846802,
-              -0.037723143,
-              -0.06778183,
-              -0.016054656,
-              0.052769117,
-              -0.08858154,
-              -0.085411474,
-              -0.07678483,
-              -0.093204886,
-              -0.12648286,
-              0.0137771405,
-              -0.0304395,
-              0.009822453,
-              0.03967907,
-              -0.019339666,
-              -0.028843539,
-              0.008771393,
-              0.017766763,
-              -0.117280774,
-              -0.12130908,
-              1.3469411e-33,
-              -0.035681557,
-              -0.023190562,
-              -0.017074129,
-              -1.6205338e-05,
-              0.007204496,
-              -0.029650006,
-              0.022068633,
-              -0.010598994,
-              -0.069006644,
-              0.04264849,
-              -0.034409285,
-              0.041181736,
-              0.017070102,
-              0.038193207,
-              0.13750355,
-              -0.008732008,
-              -0.0023180074,
-              0.083727285,
-              -0.024649868,
-              -0.028474895,
-              0.09694714,
-              -0.021191066,
-              0.06053226,
-              -0.041405093,
-              0.07370928,
-              0.01850027,
-              -0.01971475,
-              0.007999736,
-              -0.012563452,
-              -0.0052131964,
-              -0.020111304,
-              -0.011468107,
-              0.0026756013,
-              0.036281988,
-              0.12377738,
-              0.02956046,
-              0.026860835,
-              -0.06579819,
-              0.02606916,
-              -0.062286723,
-              0.03685007,
-              0.030303163,
-              0.034121655,
-              0.035232946,
-              -0.06362426,
-              -0.016618941,
-              -0.020203734,
-              -0.007140921,
-              0.004051276,
-              -0.07790596,
-              0.06898834,
-              0.012174228,
-              0.02399248,
-              0.07704281,
-              0.027410457,
-              0.03527179,
-              -0.045968123,
-              -0.061433975,
-              -0.026718443,
-              0.08237309,
-              -0.06257907,
-              0.009975696,
-              0.03466846,
-              0.023707619,
-              -0.005923376,
-              0.021586487,
-              -0.026310347,
-              -0.021010567,
-              0.113740906,
-              0.03669437,
-              -0.008125993,
-              0.0025199307,
-              -0.032581042,
-              0.013843451,
-              -0.018476631,
-              -0.006003686,
-              -0.012653546,
-              -0.049709707,
-              -0.048699785,
-              0.027735613,
-              -0.08145447,
-              0.012676274,
-              0.045807578,
-              0.013233746,
-              0.002309172,
-              -0.05062278,
-              0.041730475,
-              -0.015777566,
-              -0.07134252,
-              -0.01638618,
-              -0.018929252,
-              -0.0037979293,
-              0.033871777,
-              -0.009268418,
-              0.0058128047,
-              -4.559954e-33,
-              0.023730619,
-              -0.024401154,
-              -0.00841481,
-              -0.00066814705,
-              -0.021580337,
-              0.012711025,
-              -0.025765585,
-              -0.103677936,
-              -0.040020734,
-              0.011981005,
-              -0.015193463,
-              0.020232921,
-              0.04560608,
-              -0.070537254,
-              0.03442731,
-              0.056372125,
-              -0.015020648,
-              -0.084235705,
-              -0.049507406,
-              -0.038237974,
-              -0.0559059,
-              0.04445899,
-              -0.0019443573,
-              -0.07633201,
-              0.03479357,
-              -0.042617764,
-              -0.07321345,
-              -0.08922806,
-              0.08394847,
-              0.03421326,
-              -0.055690773,
-              -0.017199906,
-              -0.0023083915,
-              -0.01934703,
-              0.034031216,
-              -0.006698058,
-              0.070640974,
-              -0.01372546,
-              0.03538893,
-              -0.011788179,
-              -0.011852313,
-              0.08166145,
-              0.011479538,
-              -0.049201284,
-              0.04615006,
-              0.029843343,
-              -0.03588677,
-              0.13095836,
-              -0.072135866,
-              -0.053584475,
-              0.047869757,
-              -0.03287441,
-              0.03326261,
-              -0.053389616,
-              0.11908374,
-              -0.013321548,
-              -0.08042228,
-              0.018044744,
-              0.028799541,
-              0.012628236,
-              -0.08251972,
-              -0.079905055,
-              0.036529243,
-              0.048085902,
-              -0.045983046,
-              -0.03986574,
-              -0.019302275,
-              -0.11115848,
-              -0.12231937,
-              -0.08230352,
-              0.014421084,
-              0.04155652,
-              -0.054012556,
-              0.120470405,
-              -0.1052826,
-              -0.033725824,
-              -0.04631211,
-              0.015635889,
-              0.031605463,
-              0.08958995,
-              0.06221735,
-              0.023502862,
-              0.013489683,
-              0.043624874,
-              0.017064072,
-              0.030997539,
-              0.052865345,
-              -0.056004714,
-              0.015898803,
-              -0.043719135,
-              -0.039004944,
-              -0.020523861,
-              -0.01858906,
-              0.08363329,
-              -0.017366229,
-              -3.8721744e-08,
-              -0.05206802,
-              -0.09438689,
-              0.009355713,
-              -0.024583869,
-              0.045587633,
-              0.0018443449,
-              -0.01947225,
-              0.14300145,
-              -0.0009495537,
-              -0.01863899,
-              0.060845647,
-              -0.022184245,
-              -0.06662406,
-              -0.042786483,
-              0.07611814,
-              0.0522471,
-              0.08175813,
-              -0.13221133,
-              0.015135053,
-              0.07540032,
-              0.016381217,
-              0.0029628049,
-              -0.06187796,
-              0.0788501,
-              0.041752115,
-              -0.043685306,
-              0.05732324,
-              0.013885361,
-              -0.015759919,
-              0.002782697,
-              -0.002972652,
-              -0.027957972,
-              0.03508128,
-              0.073690735,
-              0.115438506,
-              0.007924459,
-              0.054716144,
-              0.07080589,
-              -0.04037572,
-              -0.07577974,
-              0.015341726,
-              -0.014179411,
-              -0.03881855,
-              0.029368779,
-              0.061343305,
-              0.025503315,
-              -0.039556272,
-              0.113217,
-              -0.028291667,
-              0.032105908,
-              -0.038683154,
-              0.02992647,
-              -0.02093155,
-              -0.0045508672,
-              -0.06038734,
-              0.010602616,
-              -0.0069765793,
-              -0.04628652,
-              0.040670633,
-              0.039827973,
-              -0.015934473,
-              0.025722258,
-              0.035333917,
-              -0.026775397
+              -0.019089537,
+              0.08206227,
+              -0.031629756,
+              -0.037748322,
+              -0.013907723,
+              -0.15086435,
+              -0.054227855,
+              0.013812081,
+              0.022318492,
+              0.025760967,
+              -0.018970305,
+              0.0159997,
+              0.046886247,
+              -0.008989786,
+              0.042260803,
+              0.01563633,
+              -0.08306234,
+              0.018418225,
+              -0.016524842,
+              -0.033054315,
+              -0.021094276,
+              -0.04198475,
+              -0.108629815,
+              0.019558346,
+              -0.021839257,
+              0.14248955,
+              -0.0012803682,
+              -0.058087774,
+              0.005395786,
+              -0.040014874,
+              0.012412929,
+              -0.014448109,
+              0.10412988,
+              0.08678136,
+              -0.07392144,
+              0.031378184,
+              0.077501394,
+              -0.04197698,
+              -0.092644565,
+              0.019878637,
+              -0.09584833,
+              0.06355258,
+              0.0034316017,
+              0.03860985,
+              -0.022438047,
+              0.04932071,
+              -0.026379092,
+              -0.049524873,
+              -0.013308545,
+              0.012192514,
+              -0.11695286,
+              0.04510036,
+              -0.029017858,
+              0.025516428,
+              0.04245081,
+              0.070753604,
+              0.07057494,
+              0.003524953,
+              -0.06010962,
+              0.041959174,
+              0.016197778,
+              -0.07186037,
+              0.014555853,
+              -0.006213116,
+              0.030063417,
+              0.047432736,
+              0.011306432,
+              0.013843393,
+              0.0436187,
+              -0.021850524,
+              0.022346757,
+              0.047835413,
+              -0.04025223,
+              0.09492459,
+              0.03155159,
+              0.013348888,
+              -0.039819352,
+              -0.021837216,
+              0.028181475,
+              -0.03434981,
+              0.019666592,
+              0.043579087,
+              -0.042940862,
+              0.054164745,
+              0.02308801,
+              -0.056740467,
+              0.016757911,
+              -0.02701336,
+              -0.039681926,
+              0.022773864,
+              0.074453875,
+              -0.01407503,
+              -0.008249863,
+              0.008273288,
+              -0.024091411,
+              -0.020071099,
+              0.024399305,
+              -0.025779521,
+              0.1035294,
+              -0.016452465,
+              0.05220051,
+              0.043400586,
+              0.024392875,
+              0.0160118,
+              -0.050395392,
+              -0.11149879,
+              0.05203916,
+              -0.017942373,
+              -0.03793447,
+              -0.06775703,
+              -0.01611577,
+              0.05274979,
+              -0.08863033,
+              -0.085470706,
+              -0.076794446,
+              -0.09332248,
+              -0.1264284,
+              0.013839316,
+              -0.030490262,
+              0.009920159,
+              0.03968685,
+              -0.01939706,
+              -0.028892461,
+              0.008741198,
+              0.017886965,
+              -0.117217556,
+              -0.1212998,
+              1.35733635e-33,
+              -0.035622492,
+              -0.023267707,
+              -0.017018162,
+              0.00010073695,
+              0.007257954,
+              -0.029587401,
+              0.022087794,
+              -0.010561547,
+              -0.06912062,
+              0.04277785,
+              -0.034413584,
+              0.041110493,
+              0.017055655,
+              0.038174715,
+              0.13757399,
+              -0.008806284,
+              -0.0023235404,
+              0.08372674,
+              -0.024748268,
+              -0.028528849,
+              0.096861266,
+              -0.02111509,
+              0.06039901,
+              -0.041284908,
+              0.07366366,
+              0.018533891,
+              -0.019621244,
+              0.00789655,
+              -0.012412154,
+              -0.005184189,
+              -0.0202234,
+              -0.011487718,
+              0.0026882978,
+              0.036282968,
+              0.12384692,
+              0.029563135,
+              0.02673901,
+              -0.06578298,
+              0.02610267,
+              -0.062275145,
+              0.036926493,
+              0.030272253,
+              0.034105044,
+              0.03516919,
+              -0.06365454,
+              -0.016557874,
+              -0.020214476,
+              -0.007219471,
+              0.004009068,
+              -0.07774858,
+              0.06894675,
+              0.012156706,
+              0.024095584,
+              0.07716194,
+              0.027376112,
+              0.03524163,
+              -0.046042208,
+              -0.061379924,
+              -0.026633548,
+              0.08248479,
+              -0.06261388,
+              0.009910456,
+              0.034668844,
+              0.023772387,
+              -0.005869554,
+              0.02162769,
+              -0.026385942,
+              -0.02100117,
+              0.11375441,
+              0.03666832,
+              -0.008121711,
+              0.0026215075,
+              -0.032531988,
+              0.01391055,
+              -0.018540533,
+              -0.0059300573,
+              -0.012669122,
+              -0.04971856,
+              -0.048864197,
+              0.027610987,
+              -0.08137648,
+              0.012624587,
+              0.045806322,
+              0.01336533,
+              0.002328637,
+              -0.050664812,
+              0.041695803,
+              -0.015773693,
+              -0.07136885,
+              -0.016258836,
+              -0.018871423,
+              -0.0038626953,
+              0.03402061,
+              -0.009335479,
+              0.005747506,
+              -4.5611018e-33,
+              0.023689948,
+              -0.02445775,
+              -0.00834689,
+              -0.00063168275,
+              -0.021578811,
+              0.012567475,
+              -0.025760869,
+              -0.10368349,
+              -0.03997725,
+              0.01210385,
+              -0.015231519,
+              0.02017564,
+              0.045654193,
+              -0.07050829,
+              0.034459736,
+              0.056491707,
+              -0.014989821,
+              -0.08433123,
+              -0.049400527,
+              -0.03832157,
+              -0.055948768,
+              0.044390477,
+              -0.001941214,
+              -0.0763155,
+              0.034730915,
+              -0.04243297,
+              -0.07322386,
+              -0.08912488,
+              0.083965875,
+              0.034240186,
+              -0.055734336,
+              -0.017151177,
+              -0.0023456868,
+              -0.019274496,
+              0.03401833,
+              -0.006712739,
+              0.070724845,
+              -0.013663151,
+              0.035358265,
+              -0.011840785,
+              -0.011920096,
+              0.081632204,
+              0.011438198,
+              -0.04905726,
+              0.04624871,
+              0.029794158,
+              -0.035954632,
+              0.1309978,
+              -0.0722,
+              -0.053626865,
+              0.047662914,
+              -0.032893717,
+              0.03320312,
+              -0.053293463,
+              0.11909418,
+              -0.013308413,
+              -0.08026765,
+              0.018056376,
+              0.028816566,
+              0.012597203,
+              -0.082487956,
+              -0.07992265,
+              0.03653938,
+              0.048042614,
+              -0.04597376,
+              -0.039927375,
+              -0.019282784,
+              -0.11115308,
+              -0.12229221,
+              -0.08222088,
+              0.014523922,
+              0.041549023,
+              -0.054067343,
+              0.12032739,
+              -0.10513437,
+              -0.03352011,
+              -0.046141136,
+              0.015660388,
+              0.03162219,
+              0.089564346,
+              0.06229127,
+              0.02344754,
+              0.013432015,
+              0.04364802,
+              0.017062847,
+              0.030911682,
+              0.052861545,
+              -0.05597565,
+              0.015810143,
+              -0.04374839,
+              -0.039106574,
+              -0.020592151,
+              -0.01868341,
+              0.08352379,
+              -0.017375095,
+              -3.8713683e-08,
+              -0.052152414,
+              -0.09442023,
+              0.009305927,
+              -0.024598995,
+              0.04574071,
+              0.0017779457,
+              -0.019384999,
+              0.14307584,
+              -0.00092140987,
+              -0.018639628,
+              0.06094085,
+              -0.022180414,
+              -0.06670714,
+              -0.042788457,
+              0.07614433,
+              0.052368972,
+              0.08171796,
+              -0.13214965,
+              0.015069824,
+              0.07545052,
+              0.016364794,
+              0.0030805927,
+              -0.06188439,
+              0.07879054,
+              0.04179921,
+              -0.043787137,
+              0.05729686,
+              0.013950966,
+              -0.01580636,
+              0.002741003,
+              -0.002896178,
+              -0.027976623,
+              0.0352471,
+              0.07360851,
+              0.11537727,
+              0.008016604,
+              0.054790642,
+              0.070841216,
+              -0.040544577,
+              -0.07585315,
+              0.015317468,
+              -0.014144724,
+              -0.03884744,
+              0.029432015,
+              0.061295677,
+              0.025552604,
+              -0.03950773,
+              0.1131327,
+              -0.028318027,
+              0.031907115,
+              -0.038748857,
+              0.029967804,
+              -0.020923622,
+              -0.0045868345,
+              -0.060423743,
+              0.01062511,
+              -0.006921613,
+              -0.046255972,
+              0.04074385,
+              0.039824147,
+              -0.016014125,
+              0.025676023,
+              0.03524506,
+              -0.0267346
             ],
             "index": 2,
             "object": "embedding"
           },
           {
             "embedding": [
-              -0.053183872,
-              -0.047788426,
-              0.04972303,
-              -0.009334505,
-              -0.056231733,
-              -0.037002083,
-              0.015224726,
-              0.0033988354,
-              0.04447645,
-              0.016588705,
-              -0.06540302,
-              0.04653401,
-              0.012623523,
-              0.025223762,
-              -0.11425605,
-              0.027273744,
-              -0.052391008,
-              0.06020533,
-              -0.045948613,
-              -0.022937857,
-              0.016519869,
-              0.014322256,
-              -0.07750287,
-              0.016460732,
-              -0.06725244,
-              0.120790765,
-              -0.0022636163,
-              -0.0005024785,
-              0.031048942,
-              0.031126363,
-              0.105009794,
-              -0.06930837,
-              -0.013206138,
-              0.028933082,
-              -0.08795337,
-              0.05555298,
-              -0.09165988,
-              -0.018175907,
-              -0.024678476,
-              -0.020182805,
-              0.013178067,
-              -0.0007228829,
-              0.0018159959,
-              0.006769804,
-              0.0860061,
-              0.06185969,
-              -0.077463284,
-              -0.047084846,
-              -0.0498773,
-              -0.008899272,
-              -0.08812909,
-              0.00094635173,
-              -0.014987473,
-              -0.007606875,
-              0.08516766,
-              0.059840705,
-              0.024647623,
-              0.03781936,
-              -0.051698226,
-              0.03140343,
-              0.113696024,
-              -0.044227768,
-              0.009882869,
-              0.006037432,
-              0.030196855,
-              0.071224906,
-              -0.013819336,
-              0.036284678,
-              0.0047479654,
-              -0.074841194,
-              0.09735655,
-              0.0715865,
-              -0.009209204,
-              -0.009545715,
-              0.042258147,
-              0.01176989,
-              0.032883737,
-              0.01871987,
-              0.012600867,
-              -0.009270322,
-              -0.03493854,
-              0.0165816,
-              0.005335793,
-              0.03813737,
-              0.09589841,
-              -0.0021022737,
-              -0.020831643,
-              0.018148199,
-              -0.032354474,
-              0.012446273,
-              -0.014385681,
-              -0.0669802,
-              -0.095483646,
-              -0.10348357,
-              -0.0010490393,
-              -0.0031702255,
-              0.027040303,
-              -0.033902746,
-              0.0011530715,
-              -0.009055597,
-              -0.048646227,
-              0.002960075,
-              -0.04150261,
-              -0.03958488,
-              0.07510442,
-              0.031126844,
-              0.030005287,
-              0.03351958,
-              0.11425093,
-              -0.08292283,
-              -0.10923656,
-              0.03011645,
-              -0.041837137,
-              0.042389642,
-              0.03338184,
-              -0.038825653,
-              0.02099903,
-              0.02824791,
-              0.054426163,
-              0.09631318,
-              -0.0034680578,
-              -0.015158154,
-              -0.09265031,
-              -0.056172263,
-              -0.0032930053,
-              -0.029391458,
-              -0.11419404,
-              1.5047121e-33,
-              -0.045322943,
-              -0.073544085,
-              0.034601163,
-              -0.067317046,
-              0.023250451,
-              -0.050395396,
-              -0.01739104,
-              -0.0057262457,
-              0.05205013,
-              -0.018088019,
-              -0.10174609,
-              0.016569315,
-              -0.005840307,
-              0.08825027,
-              0.04746817,
-              -0.06267444,
-              -0.037124775,
-              -0.04898983,
-              0.061778635,
-              -0.11774465,
-              0.015096424,
-              -0.071004175,
-              0.073210604,
-              -0.01007678,
-              -0.004525406,
-              0.0014324179,
-              0.012293256,
-              -0.018664367,
-              0.019014336,
-              -0.007747823,
-              -0.008599073,
-              0.023763629,
-              -0.0075268243,
-              -0.04203368,
-              -0.008033764,
-              -0.009042761,
-              0.11055124,
-              -0.02855999,
-              0.03761048,
-              0.047079824,
-              0.06257789,
-              -0.049527515,
-              0.06296901,
-              0.005405868,
-              0.024098972,
-              0.03435228,
-              -0.01710498,
-              -0.03391623,
-              0.012577585,
-              -0.05742578,
-              -0.04634173,
-              -0.00025635032,
-              0.022637868,
-              -0.11001833,
-              0.09246783,
-              0.049007315,
-              -0.04402184,
-              0.054414723,
-              -0.0058709052,
-              0.04826815,
-              0.035579093,
-              -0.015419815,
-              -0.008092566,
-              0.09276399,
-              0.11231051,
-              0.04793964,
-              -0.01756467,
-              -0.009571233,
-              0.062215857,
-              -0.003897838,
-              0.0039975815,
-              0.09544971,
-              -0.05662297,
-              -0.058832105,
-              -0.013788285,
-              0.009673877,
-              -0.047247868,
-              -0.06171914,
-              -0.08586089,
-              0.050003,
-              -0.027761148,
-              -0.007729704,
-              -0.068465404,
-              0.03243531,
-              0.015467505,
-              0.08288645,
-              0.063559495,
-              -0.005212987,
-              -0.011866209,
-              -0.051806632,
-              -0.008613721,
-              -0.031797357,
-              0.04311073,
-              0.00030667474,
-              -0.0012307463,
-              -2.3338469e-33,
-              -0.084895805,
-              0.02345889,
-              -0.055576142,
-              0.028851906,
-              0.059744447,
-              0.044220533,
-              -0.06970062,
-              -0.08749075,
-              -0.023501378,
-              0.07671297,
-              0.015147405,
-              0.019593416,
-              -0.05839991,
-              0.018738003,
-              0.0077306163,
-              -0.016015125,
-              -0.057336047,
-              -0.042650495,
-              0.100997806,
-              -0.04004008,
-              -0.031775918,
-              0.031698614,
-              -0.057948347,
-              -0.036700245,
-              0.027361931,
-              -0.007076578,
-              -0.07529461,
-              0.049506873,
-              0.012840347,
-              0.1000292,
-              -0.036281507,
-              -0.04813614,
-              0.029130226,
-              0.017983682,
-              0.045438614,
-              0.10252733,
-              0.00496251,
-              -0.055316452,
-              0.008405219,
-              -0.05972534,
-              0.020135194,
-              0.0093700085,
-              -0.06655473,
-              -0.029796828,
-              0.043222178,
-              -0.06824294,
-              -0.07651206,
-              0.03997172,
-              -0.06478741,
-              0.072208196,
-              0.046655826,
-              -0.016924199,
-              -0.048682548,
-              -0.08449499,
-              -0.05253414,
-              0.032000206,
-              0.024684923,
-              0.023903653,
-              0.07640757,
-              -0.04118769,
-              -0.03387857,
-              -0.114066795,
-              0.06797275,
-              0.009583203,
-              -0.06417275,
-              0.02440743,
-              0.025039174,
-              -0.004076159,
-              0.018739574,
-              -0.038113788,
-              0.014584011,
-              0.06845566,
-              0.018653333,
-              0.05947389,
-              0.02376919,
-              -0.009693411,
-              -0.066522814,
-              0.020966992,
-              -0.01941947,
-              0.014822965,
-              0.022724027,
-              -0.022646833,
-              0.010568073,
-              0.056872703,
-              0.07259132,
-              0.06503742,
-              -0.010027183,
-              0.079110056,
-              0.03518498,
-              -0.023728298,
-              0.017138498,
-              0.08788164,
-              0.0060143326,
-              0.0074335723,
-              -0.1092527,
-              -2.8781574e-08,
-              -0.05242197,
-              -0.087604366,
-              0.06664988,
-              0.014051439,
-              0.0998947,
-              -0.022531891,
-              0.062183738,
-              0.027777275,
-              -0.064255044,
-              -0.03866553,
-              0.024992257,
-              0.007985698,
-              -0.024069482,
-              0.012068325,
-              0.087151505,
-              0.012454641,
-              0.06475363,
-              -0.027938146,
-              0.03995433,
-              -0.01226524,
-              0.023152042,
-              -0.032571565,
-              -0.04254354,
-              0.10729923,
-              0.037443064,
-              -0.06624038,
-              -0.05680355,
-              -0.005158616,
-              -0.069514066,
-              0.10108567,
-              -0.03336937,
-              0.02180458,
-              0.017406454,
-              0.018036628,
-              0.026380124,
-              0.06607102,
-              0.059448373,
-              -0.06540129,
-              -0.11567981,
-              -0.07119791,
-              -0.023404302,
-              0.04258733,
-              0.04359592,
-              -0.03663909,
-              0.050169207,
-              0.0029874544,
-              0.05701757,
-              -0.034646694,
-              0.025559898,
-              -0.046218865,
-              -0.06721346,
-              0.060566954,
-              -0.041338935,
-              -0.019814374,
-              -0.013770683,
-              -0.061239764,
-              0.01488027,
-              -0.07664038,
-              -0.05666399,
-              0.050506476,
-              -0.0359506,
-              0.12227603,
-              0.06429049,
-              -0.038193453
+              -0.053171553,
+              -0.047855794,
+              0.04959839,
+              -0.009352584,
+              -0.056259144,
+              -0.036997948,
+              0.01525368,
+              0.0033788579,
+              0.04453428,
+              0.016438372,
+              -0.065293424,
+              0.04655176,
+              0.012637792,
+              0.025149647,
+              -0.11436081,
+              0.027283441,
+              -0.052422393,
+              0.060236752,
+              -0.046064522,
+              -0.022863738,
+              0.016536511,
+              0.014447978,
+              -0.07744467,
+              0.016475804,
+              -0.067145765,
+              0.120901324,
+              -0.0022643541,
+              -0.0005619333,
+              0.03098974,
+              0.03116176,
+              0.10501578,
+              -0.06940328,
+              -0.013246061,
+              0.029016647,
+              -0.08779694,
+              0.055636257,
+              -0.09158273,
+              -0.018188708,
+              -0.024831342,
+              -0.020263424,
+              0.013102336,
+              -0.0007477728,
+              0.0018712403,
+              0.0068353964,
+              0.08601601,
+              0.061896168,
+              -0.07733195,
+              -0.047134392,
+              -0.04994557,
+              -0.008955441,
+              -0.08808325,
+              0.0011078792,
+              -0.015078675,
+              -0.007628681,
+              0.08530312,
+              0.059783977,
+              0.024557464,
+              0.037825108,
+              -0.05171798,
+              0.03148071,
+              0.11377193,
+              -0.04417297,
+              0.009659848,
+              0.0060449084,
+              0.030134702,
+              0.07118153,
+              -0.013864897,
+              0.03624278,
+              0.0049465275,
+              -0.07480586,
+              0.09733932,
+              0.071613275,
+              -0.009146446,
+              -0.009571701,
+              0.042258315,
+              0.011740325,
+              0.032803785,
+              0.018631615,
+              0.012556345,
+              -0.009346388,
+              -0.03489368,
+              0.01649207,
+              0.005488214,
+              0.03819102,
+              0.09597803,
+              -0.002047146,
+              -0.020768773,
+              0.018077927,
+              -0.032444023,
+              0.012474241,
+              -0.014445184,
+              -0.0670006,
+              -0.095488854,
+              -0.10345397,
+              -0.0009862595,
+              -0.0030658073,
+              0.027003448,
+              -0.033961065,
+              0.0011482734,
+              -0.009025799,
+              -0.048620287,
+              0.0029769312,
+              -0.04154341,
+              -0.0395945,
+              0.07520094,
+              0.031153427,
+              0.030031031,
+              0.03353441,
+              0.11403943,
+              -0.082912125,
+              -0.109138384,
+              0.030059446,
+              -0.041853014,
+              0.042241115,
+              0.033335667,
+              -0.038876496,
+              0.02092849,
+              0.028346559,
+              0.054482125,
+              0.09627962,
+              -0.0035115955,
+              -0.015083763,
+              -0.092599295,
+              -0.056257337,
+              -0.00332258,
+              -0.02934002,
+              -0.11417531,
+              1.5075675e-33,
+              -0.04527847,
+              -0.07345357,
+              0.034714583,
+              -0.067186035,
+              0.023143126,
+              -0.05054431,
+              -0.017398916,
+              -0.0058387746,
+              0.052131217,
+              -0.017985696,
+              -0.10168014,
+              0.016505243,
+              -0.005961273,
+              0.08834502,
+              0.047341425,
+              -0.06262999,
+              -0.03724901,
+              -0.0490674,
+              0.061806694,
+              -0.117662214,
+              0.014966754,
+              -0.07085228,
+              0.07317225,
+              -0.010064827,
+              -0.004601465,
+              0.0014379362,
+              0.0122654615,
+              -0.018565418,
+              0.018996973,
+              -0.0076706754,
+              -0.0085447915,
+              0.023833418,
+              -0.0074106916,
+              -0.04202295,
+              -0.008097604,
+              -0.0089935325,
+              0.11068735,
+              -0.028457392,
+              0.037548065,
+              0.04710371,
+              0.062597714,
+              -0.049594503,
+              0.06267496,
+              0.005339454,
+              0.024064569,
+              0.034303125,
+              -0.016984673,
+              -0.03375307,
+              0.012577206,
+              -0.05741818,
+              -0.046267692,
+              -0.00036155691,
+              0.02268587,
+              -0.109952465,
+              0.09230675,
+              0.048918508,
+              -0.044157643,
+              0.05441931,
+              -0.0058244704,
+              0.04833069,
+              0.035635386,
+              -0.015495411,
+              -0.008146981,
+              0.092891365,
+              0.112310715,
+              0.047900427,
+              -0.017513819,
+              -0.009520781,
+              0.06212363,
+              -0.0040008924,
+              0.00397841,
+              0.09532846,
+              -0.05659656,
+              -0.058885954,
+              -0.013697212,
+              0.009742546,
+              -0.04745855,
+              -0.061571207,
+              -0.085869245,
+              0.05009574,
+              -0.027810305,
+              -0.007983068,
+              -0.06844095,
+              0.032406274,
+              0.015316275,
+              0.0830624,
+              0.063605405,
+              -0.005157704,
+              -0.011889667,
+              -0.05187598,
+              -0.0087124705,
+              -0.031850815,
+              0.043204896,
+              0.00032051498,
+              -0.0012597291,
+              -2.3328516e-33,
+              -0.08486178,
+              0.023463517,
+              -0.05558325,
+              0.028823433,
+              0.0598007,
+              0.044241305,
+              -0.06976774,
+              -0.08749109,
+              -0.023545535,
+              0.0767821,
+              0.015185076,
+              0.019631226,
+              -0.058358442,
+              0.018799065,
+              0.0076146126,
+              -0.015977694,
+              -0.057259887,
+              -0.042667117,
+              0.101026215,
+              -0.03983678,
+              -0.03180352,
+              0.03177619,
+              -0.057957705,
+              -0.036778692,
+              0.027305948,
+              -0.0069477605,
+              -0.0753,
+              0.049428534,
+              0.012732314,
+              0.10010171,
+              -0.036260307,
+              -0.048061043,
+              0.029081684,
+              0.01795974,
+              0.045303203,
+              0.102590606,
+              0.005036657,
+              -0.05526093,
+              0.008327211,
+              -0.05970527,
+              0.020131486,
+              0.009408121,
+              -0.06648779,
+              -0.029893365,
+              0.0434368,
+              -0.0683305,
+              -0.07649664,
+              0.039999247,
+              -0.06477932,
+              0.07227491,
+              0.046653986,
+              -0.016773192,
+              -0.048649658,
+              -0.08454509,
+              -0.05255037,
+              0.0319589,
+              0.024662357,
+              0.023793997,
+              0.076360136,
+              -0.040995322,
+              -0.033935655,
+              -0.11416756,
+              0.06787201,
+              0.009610846,
+              -0.064101316,
+              0.024561828,
+              0.024906442,
+              -0.0041048713,
+              0.018717252,
+              -0.038110614,
+              0.0145301875,
+              0.068478055,
+              0.018691448,
+              0.05943308,
+              0.023695862,
+              -0.009747667,
+              -0.066519946,
+              0.0209059,
+              -0.019389415,
+              0.014860701,
+              0.022718104,
+              -0.022605024,
+              0.0105253365,
+              0.05693715,
+              0.07257885,
+              0.06504599,
+              -0.010055237,
+              0.07908256,
+              0.035240322,
+              -0.02378674,
+              0.017134566,
+              0.0878081,
+              0.005987074,
+              0.007431842,
+              -0.10935983,
+              -2.8794002e-08,
+              -0.05234688,
+              -0.08765063,
+              0.06662866,
+              0.013907749,
+              0.0999487,
+              -0.022422735,
+              0.06214868,
+              0.027856557,
+              -0.06424995,
+              -0.038701627,
+              0.025059296,
+              0.00807731,
+              -0.024077412,
+              0.011949065,
+              0.08715261,
+              0.012486595,
+              0.06470489,
+              -0.027933354,
+              0.039985545,
+              -0.012295149,
+              0.02333007,
+              -0.03250732,
+              -0.04260915,
+              0.10736886,
+              0.037696708,
+              -0.06628188,
+              -0.056817852,
+              -0.005238912,
+              -0.069547325,
+              0.100934796,
+              -0.033363372,
+              0.021774344,
+              0.017414633,
+              0.018075803,
+              0.026276791,
+              0.066073745,
+              0.059642654,
+              -0.065390244,
+              -0.115749314,
+              -0.07125786,
+              -0.023382567,
+              0.042660285,
+              0.043636538,
+              -0.03665277,
+              0.050204884,
+              0.0030947176,
+              0.057122562,
+              -0.034636553,
+              0.025459053,
+              -0.046185397,
+              -0.067215376,
+              0.06057241,
+              -0.041255984,
+              -0.019857686,
+              -0.013778329,
+              -0.06125949,
+              0.014752149,
+              -0.07630465,
+              -0.056748062,
+              0.0505062,
+              -0.036068004,
+              0.12241577,
+              0.06429002,
+              -0.038303368
             ],
             "index": 3,
             "object": "embedding"
diff --git a/tests/integration/recordings/responses/9e7a83d3d596.json b/tests/integration/recordings/responses/9e7a83d3d596.json
index 4965aa3c7..a9054d729 100644
--- a/tests/integration/recordings/responses/9e7a83d3d596.json
+++ b/tests/integration/recordings/responses/9e7a83d3d596.json
@@ -15,23 +15,23 @@
     "body": {
       "__type__": "openai.types.completion.Completion",
       "__data__": {
-        "id": "cmpl-43",
+        "id": "cmpl-775",
         "choices": [
           {
             "finish_reason": "stop",
             "index": 0,
             "logprobs": null,
-            "text": "Blue.\n\nMy response is based on the traditional English rhyme that pairs the colors of roses (red) with violets in a poetic and somewhat whimsical way. This specific version of the rhyme goes like this:\n\n\"Roses are red,\nViolets are blue,\nSugar is sweet,\nAnd so are you.\"\n\nIn modern times, variations of this rhyme can deviate from the original \"blue\" for violets, but in my complete sentence as requested, sticking with a widely recognized completion adds an air of timelessness and familiarity to the phrase."
+            "text": "Blue.\n\nMy response is based on the traditional rhyme \"Roses are Red, Violets are Blue,\" which is a well-known poem or phrase often used as a greeting or way to express affection. The exact wording may vary slightly depending on the source, but the general meaning remains the same: violets are typically depicted as blue-colored flowers in this rhyme."
           }
         ],
-        "created": 1754348148,
+        "created": 1756921025,
         "model": "llama3.2:3b-instruct-fp16",
         "object": "text_completion",
         "system_fingerprint": "fp_ollama",
         "usage": {
-          "completion_tokens": 113,
+          "completion_tokens": 75,
           "prompt_tokens": 50,
-          "total_tokens": 163,
+          "total_tokens": 125,
           "completion_tokens_details": null,
           "prompt_tokens_details": null
         }
diff --git a/tests/integration/recordings/responses/9fadf5a3d68f.json b/tests/integration/recordings/responses/9fadf5a3d68f.json
index bc3c3ca22..aba45bcd3 100644
--- a/tests/integration/recordings/responses/9fadf5a3d68f.json
+++ b/tests/integration/recordings/responses/9fadf5a3d68f.json
@@ -20,15 +20,15 @@
       "__type__": "ollama._types.GenerateResponse",
       "__data__": {
         "model": "llama-guard3:1b",
-        "created_at": "2025-08-01T23:14:22.168612Z",
+        "created_at": "2025-09-03T17:38:03.270261Z",
         "done": true,
         "done_reason": "stop",
-        "total_duration": 198446125,
-        "load_duration": 31859666,
+        "total_duration": 244051875,
+        "load_duration": 111239500,
         "prompt_eval_count": 224,
-        "prompt_eval_duration": 151000000,
+        "prompt_eval_duration": 120962791,
         "eval_count": 2,
-        "eval_duration": 13000000,
+        "eval_duration": 11306292,
         "response": "safe",
         "thinking": null,
         "context": null
diff --git a/tests/integration/recordings/responses/a0c4df33879f.json b/tests/integration/recordings/responses/a0c4df33879f.json
index f134e0bed..7898e5b02 100644
--- a/tests/integration/recordings/responses/a0c4df33879f.json
+++ b/tests/integration/recordings/responses/a0c4df33879f.json
@@ -1,7 +1,7 @@
 {
   "request": {
     "method": "POST",
-    "url": "http://localhost:11434/v1/v1/chat/completions",
+    "url": "http://0.0.0.0:11434/v1/v1/chat/completions",
     "headers": {},
     "body": {
       "model": "llama3.2:3b-instruct-fp16",
@@ -21,7 +21,7 @@
       {
         "__type__": "openai.types.chat.chat_completion_chunk.ChatCompletionChunk",
         "__data__": {
-          "id": "chatcmpl-458",
+          "id": "chatcmpl-792",
           "choices": [
             {
               "delta": {
@@ -36,7 +36,7 @@
               "logprobs": null
             }
           ],
-          "created": 1754081845,
+          "created": 1756921356,
           "model": "llama3.2:3b-instruct-fp16",
           "object": "chat.completion.chunk",
           "service_tier": null,
@@ -47,7 +47,7 @@
       {
         "__type__": "openai.types.chat.chat_completion_chunk.ChatCompletionChunk",
         "__data__": {
-          "id": "chatcmpl-458",
+          "id": "chatcmpl-792",
           "choices": [
             {
               "delta": {
@@ -62,7 +62,7 @@
               "logprobs": null
             }
           ],
-          "created": 1754081845,
+          "created": 1756921356,
           "model": "llama3.2:3b-instruct-fp16",
           "object": "chat.completion.chunk",
           "service_tier": null,
@@ -73,319 +73,7 @@
       {
         "__type__": "openai.types.chat.chat_completion_chunk.ChatCompletionChunk",
         "__data__": {
-          "id": "chatcmpl-458",
-          "choices": [
-            {
-              "delta": {
-                "content": " word",
-                "function_call": null,
-                "refusal": null,
-                "role": "assistant",
-                "tool_calls": null
-              },
-              "finish_reason": null,
-              "index": 0,
-              "logprobs": null
-            }
-          ],
-          "created": 1754081845,
-          "model": "llama3.2:3b-instruct-fp16",
-          "object": "chat.completion.chunk",
-          "service_tier": null,
-          "system_fingerprint": "fp_ollama",
-          "usage": null
-        }
-      },
-      {
-        "__type__": "openai.types.chat.chat_completion_chunk.ChatCompletionChunk",
-        "__data__": {
-          "id": "chatcmpl-458",
-          "choices": [
-            {
-              "delta": {
-                "content": " for",
-                "function_call": null,
-                "refusal": null,
-                "role": "assistant",
-                "tool_calls": null
-              },
-              "finish_reason": null,
-              "index": 0,
-              "logprobs": null
-            }
-          ],
-          "created": 1754081845,
-          "model": "llama3.2:3b-instruct-fp16",
-          "object": "chat.completion.chunk",
-          "service_tier": null,
-          "system_fingerprint": "fp_ollama",
-          "usage": null
-        }
-      },
-      {
-        "__type__": "openai.types.chat.chat_completion_chunk.ChatCompletionChunk",
-        "__data__": {
-          "id": "chatcmpl-458",
-          "choices": [
-            {
-              "delta": {
-                "content": " the",
-                "function_call": null,
-                "refusal": null,
-                "role": "assistant",
-                "tool_calls": null
-              },
-              "finish_reason": null,
-              "index": 0,
-              "logprobs": null
-            }
-          ],
-          "created": 1754081845,
-          "model": "llama3.2:3b-instruct-fp16",
-          "object": "chat.completion.chunk",
-          "service_tier": null,
-          "system_fingerprint": "fp_ollama",
-          "usage": null
-        }
-      },
-      {
-        "__type__": "openai.types.chat.chat_completion_chunk.ChatCompletionChunk",
-        "__data__": {
-          "id": "chatcmpl-458",
-          "choices": [
-            {
-              "delta": {
-                "content": " Sun",
-                "function_call": null,
-                "refusal": null,
-                "role": "assistant",
-                "tool_calls": null
-              },
-              "finish_reason": null,
-              "index": 0,
-              "logprobs": null
-            }
-          ],
-          "created": 1754081845,
-          "model": "llama3.2:3b-instruct-fp16",
-          "object": "chat.completion.chunk",
-          "service_tier": null,
-          "system_fingerprint": "fp_ollama",
-          "usage": null
-        }
-      },
-      {
-        "__type__": "openai.types.chat.chat_completion_chunk.ChatCompletionChunk",
-        "__data__": {
-          "id": "chatcmpl-458",
-          "choices": [
-            {
-              "delta": {
-                "content": " is",
-                "function_call": null,
-                "refusal": null,
-                "role": "assistant",
-                "tool_calls": null
-              },
-              "finish_reason": null,
-              "index": 0,
-              "logprobs": null
-            }
-          ],
-          "created": 1754081845,
-          "model": "llama3.2:3b-instruct-fp16",
-          "object": "chat.completion.chunk",
-          "service_tier": null,
-          "system_fingerprint": "fp_ollama",
-          "usage": null
-        }
-      },
-      {
-        "__type__": "openai.types.chat.chat_completion_chunk.ChatCompletionChunk",
-        "__data__": {
-          "id": "chatcmpl-458",
-          "choices": [
-            {
-              "delta": {
-                "content": " \"",
-                "function_call": null,
-                "refusal": null,
-                "role": "assistant",
-                "tool_calls": null
-              },
-              "finish_reason": null,
-              "index": 0,
-              "logprobs": null
-            }
-          ],
-          "created": 1754081845,
-          "model": "llama3.2:3b-instruct-fp16",
-          "object": "chat.completion.chunk",
-          "service_tier": null,
-          "system_fingerprint": "fp_ollama",
-          "usage": null
-        }
-      },
-      {
-        "__type__": "openai.types.chat.chat_completion_chunk.ChatCompletionChunk",
-        "__data__": {
-          "id": "chatcmpl-458",
-          "choices": [
-            {
-              "delta": {
-                "content": "Sol",
-                "function_call": null,
-                "refusal": null,
-                "role": "assistant",
-                "tool_calls": null
-              },
-              "finish_reason": null,
-              "index": 0,
-              "logprobs": null
-            }
-          ],
-          "created": 1754081845,
-          "model": "llama3.2:3b-instruct-fp16",
-          "object": "chat.completion.chunk",
-          "service_tier": null,
-          "system_fingerprint": "fp_ollama",
-          "usage": null
-        }
-      },
-      {
-        "__type__": "openai.types.chat.chat_completion_chunk.ChatCompletionChunk",
-        "__data__": {
-          "id": "chatcmpl-458",
-          "choices": [
-            {
-              "delta": {
-                "content": ".\"",
-                "function_call": null,
-                "refusal": null,
-                "role": "assistant",
-                "tool_calls": null
-              },
-              "finish_reason": null,
-              "index": 0,
-              "logprobs": null
-            }
-          ],
-          "created": 1754081845,
-          "model": "llama3.2:3b-instruct-fp16",
-          "object": "chat.completion.chunk",
-          "service_tier": null,
-          "system_fingerprint": "fp_ollama",
-          "usage": null
-        }
-      },
-      {
-        "__type__": "openai.types.chat.chat_completion_chunk.ChatCompletionChunk",
-        "__data__": {
-          "id": "chatcmpl-458",
-          "choices": [
-            {
-              "delta": {
-                "content": " This",
-                "function_call": null,
-                "refusal": null,
-                "role": "assistant",
-                "tool_calls": null
-              },
-              "finish_reason": null,
-              "index": 0,
-              "logprobs": null
-            }
-          ],
-          "created": 1754081845,
-          "model": "llama3.2:3b-instruct-fp16",
-          "object": "chat.completion.chunk",
-          "service_tier": null,
-          "system_fingerprint": "fp_ollama",
-          "usage": null
-        }
-      },
-      {
-        "__type__": "openai.types.chat.chat_completion_chunk.ChatCompletionChunk",
-        "__data__": {
-          "id": "chatcmpl-458",
-          "choices": [
-            {
-              "delta": {
-                "content": " is",
-                "function_call": null,
-                "refusal": null,
-                "role": "assistant",
-                "tool_calls": null
-              },
-              "finish_reason": null,
-              "index": 0,
-              "logprobs": null
-            }
-          ],
-          "created": 1754081845,
-          "model": "llama3.2:3b-instruct-fp16",
-          "object": "chat.completion.chunk",
-          "service_tier": null,
-          "system_fingerprint": "fp_ollama",
-          "usage": null
-        }
-      },
-      {
-        "__type__": "openai.types.chat.chat_completion_chunk.ChatCompletionChunk",
-        "__data__": {
-          "id": "chatcmpl-458",
-          "choices": [
-            {
-              "delta": {
-                "content": " the",
-                "function_call": null,
-                "refusal": null,
-                "role": "assistant",
-                "tool_calls": null
-              },
-              "finish_reason": null,
-              "index": 0,
-              "logprobs": null
-            }
-          ],
-          "created": 1754081845,
-          "model": "llama3.2:3b-instruct-fp16",
-          "object": "chat.completion.chunk",
-          "service_tier": null,
-          "system_fingerprint": "fp_ollama",
-          "usage": null
-        }
-      },
-      {
-        "__type__": "openai.types.chat.chat_completion_chunk.ChatCompletionChunk",
-        "__data__": {
-          "id": "chatcmpl-458",
-          "choices": [
-            {
-              "delta": {
-                "content": " Roman",
-                "function_call": null,
-                "refusal": null,
-                "role": "assistant",
-                "tool_calls": null
-              },
-              "finish_reason": null,
-              "index": 0,
-              "logprobs": null
-            }
-          ],
-          "created": 1754081846,
-          "model": "llama3.2:3b-instruct-fp16",
-          "object": "chat.completion.chunk",
-          "service_tier": null,
-          "system_fingerprint": "fp_ollama",
-          "usage": null
-        }
-      },
-      {
-        "__type__": "openai.types.chat.chat_completion_chunk.ChatCompletionChunk",
-        "__data__": {
-          "id": "chatcmpl-458",
+          "id": "chatcmpl-792",
           "choices": [
             {
               "delta": {
@@ -400,7 +88,7 @@
               "logprobs": null
             }
           ],
-          "created": 1754081846,
+          "created": 1756921356,
           "model": "llama3.2:3b-instruct-fp16",
           "object": "chat.completion.chunk",
           "service_tier": null,
@@ -411,7 +99,7 @@
       {
         "__type__": "openai.types.chat.chat_completion_chunk.ChatCompletionChunk",
         "__data__": {
-          "id": "chatcmpl-458",
+          "id": "chatcmpl-792",
           "choices": [
             {
               "delta": {
@@ -426,7 +114,7 @@
               "logprobs": null
             }
           ],
-          "created": 1754081846,
+          "created": 1756921356,
           "model": "llama3.2:3b-instruct-fp16",
           "object": "chat.completion.chunk",
           "service_tier": null,
@@ -437,7 +125,7 @@
       {
         "__type__": "openai.types.chat.chat_completion_chunk.ChatCompletionChunk",
         "__data__": {
-          "id": "chatcmpl-458",
+          "id": "chatcmpl-792",
           "choices": [
             {
               "delta": {
@@ -452,7 +140,7 @@
               "logprobs": null
             }
           ],
-          "created": 1754081846,
+          "created": 1756921356,
           "model": "llama3.2:3b-instruct-fp16",
           "object": "chat.completion.chunk",
           "service_tier": null,
@@ -463,7 +151,7 @@
       {
         "__type__": "openai.types.chat.chat_completion_chunk.ChatCompletionChunk",
         "__data__": {
-          "id": "chatcmpl-458",
+          "id": "chatcmpl-792",
           "choices": [
             {
               "delta": {
@@ -478,7 +166,7 @@
               "logprobs": null
             }
           ],
-          "created": 1754081846,
+          "created": 1756921356,
           "model": "llama3.2:3b-instruct-fp16",
           "object": "chat.completion.chunk",
           "service_tier": null,
@@ -489,11 +177,11 @@
       {
         "__type__": "openai.types.chat.chat_completion_chunk.ChatCompletionChunk",
         "__data__": {
-          "id": "chatcmpl-458",
+          "id": "chatcmpl-792",
           "choices": [
             {
               "delta": {
-                "content": ",",
+                "content": " is",
                 "function_call": null,
                 "refusal": null,
                 "role": "assistant",
@@ -504,7 +192,7 @@
               "logprobs": null
             }
           ],
-          "created": 1754081846,
+          "created": 1756921356,
           "model": "llama3.2:3b-instruct-fp16",
           "object": "chat.completion.chunk",
           "service_tier": null,
@@ -515,11 +203,11 @@
       {
         "__type__": "openai.types.chat.chat_completion_chunk.ChatCompletionChunk",
         "__data__": {
-          "id": "chatcmpl-458",
+          "id": "chatcmpl-792",
           "choices": [
             {
               "delta": {
-                "content": " which",
+                "content": " Sol",
                 "function_call": null,
                 "refusal": null,
                 "role": "assistant",
@@ -530,7 +218,7 @@
               "logprobs": null
             }
           ],
-          "created": 1754081846,
+          "created": 1756921356,
           "model": "llama3.2:3b-instruct-fp16",
           "object": "chat.completion.chunk",
           "service_tier": null,
@@ -541,163 +229,7 @@
       {
         "__type__": "openai.types.chat.chat_completion_chunk.ChatCompletionChunk",
         "__data__": {
-          "id": "chatcmpl-458",
-          "choices": [
-            {
-              "delta": {
-                "content": " was",
-                "function_call": null,
-                "refusal": null,
-                "role": "assistant",
-                "tool_calls": null
-              },
-              "finish_reason": null,
-              "index": 0,
-              "logprobs": null
-            }
-          ],
-          "created": 1754081846,
-          "model": "llama3.2:3b-instruct-fp16",
-          "object": "chat.completion.chunk",
-          "service_tier": null,
-          "system_fingerprint": "fp_ollama",
-          "usage": null
-        }
-      },
-      {
-        "__type__": "openai.types.chat.chat_completion_chunk.ChatCompletionChunk",
-        "__data__": {
-          "id": "chatcmpl-458",
-          "choices": [
-            {
-              "delta": {
-                "content": " later",
-                "function_call": null,
-                "refusal": null,
-                "role": "assistant",
-                "tool_calls": null
-              },
-              "finish_reason": null,
-              "index": 0,
-              "logprobs": null
-            }
-          ],
-          "created": 1754081846,
-          "model": "llama3.2:3b-instruct-fp16",
-          "object": "chat.completion.chunk",
-          "service_tier": null,
-          "system_fingerprint": "fp_ollama",
-          "usage": null
-        }
-      },
-      {
-        "__type__": "openai.types.chat.chat_completion_chunk.ChatCompletionChunk",
-        "__data__": {
-          "id": "chatcmpl-458",
-          "choices": [
-            {
-              "delta": {
-                "content": " adopted",
-                "function_call": null,
-                "refusal": null,
-                "role": "assistant",
-                "tool_calls": null
-              },
-              "finish_reason": null,
-              "index": 0,
-              "logprobs": null
-            }
-          ],
-          "created": 1754081846,
-          "model": "llama3.2:3b-instruct-fp16",
-          "object": "chat.completion.chunk",
-          "service_tier": null,
-          "system_fingerprint": "fp_ollama",
-          "usage": null
-        }
-      },
-      {
-        "__type__": "openai.types.chat.chat_completion_chunk.ChatCompletionChunk",
-        "__data__": {
-          "id": "chatcmpl-458",
-          "choices": [
-            {
-              "delta": {
-                "content": " into",
-                "function_call": null,
-                "refusal": null,
-                "role": "assistant",
-                "tool_calls": null
-              },
-              "finish_reason": null,
-              "index": 0,
-              "logprobs": null
-            }
-          ],
-          "created": 1754081846,
-          "model": "llama3.2:3b-instruct-fp16",
-          "object": "chat.completion.chunk",
-          "service_tier": null,
-          "system_fingerprint": "fp_ollama",
-          "usage": null
-        }
-      },
-      {
-        "__type__": "openai.types.chat.chat_completion_chunk.ChatCompletionChunk",
-        "__data__": {
-          "id": "chatcmpl-458",
-          "choices": [
-            {
-              "delta": {
-                "content": " many",
-                "function_call": null,
-                "refusal": null,
-                "role": "assistant",
-                "tool_calls": null
-              },
-              "finish_reason": null,
-              "index": 0,
-              "logprobs": null
-            }
-          ],
-          "created": 1754081846,
-          "model": "llama3.2:3b-instruct-fp16",
-          "object": "chat.completion.chunk",
-          "service_tier": null,
-          "system_fingerprint": "fp_ollama",
-          "usage": null
-        }
-      },
-      {
-        "__type__": "openai.types.chat.chat_completion_chunk.ChatCompletionChunk",
-        "__data__": {
-          "id": "chatcmpl-458",
-          "choices": [
-            {
-              "delta": {
-                "content": " languages",
-                "function_call": null,
-                "refusal": null,
-                "role": "assistant",
-                "tool_calls": null
-              },
-              "finish_reason": null,
-              "index": 0,
-              "logprobs": null
-            }
-          ],
-          "created": 1754081846,
-          "model": "llama3.2:3b-instruct-fp16",
-          "object": "chat.completion.chunk",
-          "service_tier": null,
-          "system_fingerprint": "fp_ollama",
-          "usage": null
-        }
-      },
-      {
-        "__type__": "openai.types.chat.chat_completion_chunk.ChatCompletionChunk",
-        "__data__": {
-          "id": "chatcmpl-458",
+          "id": "chatcmpl-792",
           "choices": [
             {
               "delta": {
@@ -712,7 +244,7 @@
               "logprobs": null
             }
           ],
-          "created": 1754081846,
+          "created": 1756921356,
           "model": "llama3.2:3b-instruct-fp16",
           "object": "chat.completion.chunk",
           "service_tier": null,
@@ -723,7 +255,7 @@
       {
         "__type__": "openai.types.chat.chat_completion_chunk.ChatCompletionChunk",
         "__data__": {
-          "id": "chatcmpl-458",
+          "id": "chatcmpl-792",
           "choices": [
             {
               "delta": {
@@ -738,7 +270,7 @@
               "logprobs": null
             }
           ],
-          "created": 1754081846,
+          "created": 1756921356,
           "model": "llama3.2:3b-instruct-fp16",
           "object": "chat.completion.chunk",
           "service_tier": null,
@@ -749,11 +281,11 @@
       {
         "__type__": "openai.types.chat.chat_completion_chunk.ChatCompletionChunk",
         "__data__": {
-          "id": "chatcmpl-458",
+          "id": "chatcmpl-792",
           "choices": [
             {
               "delta": {
-                "content": " scientific",
+                "content": " ancient",
                 "function_call": null,
                 "refusal": null,
                 "role": "assistant",
@@ -764,7 +296,7 @@
               "logprobs": null
             }
           ],
-          "created": 1754081846,
+          "created": 1756921356,
           "model": "llama3.2:3b-instruct-fp16",
           "object": "chat.completion.chunk",
           "service_tier": null,
@@ -775,11 +307,11 @@
       {
         "__type__": "openai.types.chat.chat_completion_chunk.ChatCompletionChunk",
         "__data__": {
-          "id": "chatcmpl-458",
+          "id": "chatcmpl-792",
           "choices": [
             {
               "delta": {
-                "content": " contexts",
+                "content": " Roman",
                 "function_call": null,
                 "refusal": null,
                 "role": "assistant",
@@ -790,7 +322,7 @@
               "logprobs": null
             }
           ],
-          "created": 1754081846,
+          "created": 1756921356,
           "model": "llama3.2:3b-instruct-fp16",
           "object": "chat.completion.chunk",
           "service_tier": null,
@@ -801,7 +333,33 @@
       {
         "__type__": "openai.types.chat.chat_completion_chunk.ChatCompletionChunk",
         "__data__": {
-          "id": "chatcmpl-458",
+          "id": "chatcmpl-792",
+          "choices": [
+            {
+              "delta": {
+                "content": " mythology",
+                "function_call": null,
+                "refusal": null,
+                "role": "assistant",
+                "tool_calls": null
+              },
+              "finish_reason": null,
+              "index": 0,
+              "logprobs": null
+            }
+          ],
+          "created": 1756921356,
+          "model": "llama3.2:3b-instruct-fp16",
+          "object": "chat.completion.chunk",
+          "service_tier": null,
+          "system_fingerprint": "fp_ollama",
+          "usage": null
+        }
+      },
+      {
+        "__type__": "openai.types.chat.chat_completion_chunk.ChatCompletionChunk",
+        "__data__": {
+          "id": "chatcmpl-792",
           "choices": [
             {
               "delta": {
@@ -816,7 +374,7 @@
               "logprobs": null
             }
           ],
-          "created": 1754081846,
+          "created": 1756921356,
           "model": "llama3.2:3b-instruct-fp16",
           "object": "chat.completion.chunk",
           "service_tier": null,
@@ -827,11 +385,11 @@
       {
         "__type__": "openai.types.chat.chat_completion_chunk.ChatCompletionChunk",
         "__data__": {
-          "id": "chatcmpl-458",
+          "id": "chatcmpl-792",
           "choices": [
             {
               "delta": {
-                "content": " the",
+                "content": " Sol",
                 "function_call": null,
                 "refusal": null,
                 "role": "assistant",
@@ -842,7 +400,7 @@
               "logprobs": null
             }
           ],
-          "created": 1754081846,
+          "created": 1756921356,
           "model": "llama3.2:3b-instruct-fp16",
           "object": "chat.completion.chunk",
           "service_tier": null,
@@ -853,11 +411,11 @@
       {
         "__type__": "openai.types.chat.chat_completion_chunk.ChatCompletionChunk",
         "__data__": {
-          "id": "chatcmpl-458",
+          "id": "chatcmpl-792",
           "choices": [
             {
               "delta": {
-                "content": " official",
+                "content": " was",
                 "function_call": null,
                 "refusal": null,
                 "role": "assistant",
@@ -868,7 +426,7 @@
               "logprobs": null
             }
           ],
-          "created": 1754081847,
+          "created": 1756921356,
           "model": "llama3.2:3b-instruct-fp16",
           "object": "chat.completion.chunk",
           "service_tier": null,
@@ -879,579 +437,7 @@
       {
         "__type__": "openai.types.chat.chat_completion_chunk.ChatCompletionChunk",
         "__data__": {
-          "id": "chatcmpl-458",
-          "choices": [
-            {
-              "delta": {
-                "content": " name",
-                "function_call": null,
-                "refusal": null,
-                "role": "assistant",
-                "tool_calls": null
-              },
-              "finish_reason": null,
-              "index": 0,
-              "logprobs": null
-            }
-          ],
-          "created": 1754081847,
-          "model": "llama3.2:3b-instruct-fp16",
-          "object": "chat.completion.chunk",
-          "service_tier": null,
-          "system_fingerprint": "fp_ollama",
-          "usage": null
-        }
-      },
-      {
-        "__type__": "openai.types.chat.chat_completion_chunk.ChatCompletionChunk",
-        "__data__": {
-          "id": "chatcmpl-458",
-          "choices": [
-            {
-              "delta": {
-                "content": " for",
-                "function_call": null,
-                "refusal": null,
-                "role": "assistant",
-                "tool_calls": null
-              },
-              "finish_reason": null,
-              "index": 0,
-              "logprobs": null
-            }
-          ],
-          "created": 1754081847,
-          "model": "llama3.2:3b-instruct-fp16",
-          "object": "chat.completion.chunk",
-          "service_tier": null,
-          "system_fingerprint": "fp_ollama",
-          "usage": null
-        }
-      },
-      {
-        "__type__": "openai.types.chat.chat_completion_chunk.ChatCompletionChunk",
-        "__data__": {
-          "id": "chatcmpl-458",
-          "choices": [
-            {
-              "delta": {
-                "content": " the",
-                "function_call": null,
-                "refusal": null,
-                "role": "assistant",
-                "tool_calls": null
-              },
-              "finish_reason": null,
-              "index": 0,
-              "logprobs": null
-            }
-          ],
-          "created": 1754081847,
-          "model": "llama3.2:3b-instruct-fp16",
-          "object": "chat.completion.chunk",
-          "service_tier": null,
-          "system_fingerprint": "fp_ollama",
-          "usage": null
-        }
-      },
-      {
-        "__type__": "openai.types.chat.chat_completion_chunk.ChatCompletionChunk",
-        "__data__": {
-          "id": "chatcmpl-458",
-          "choices": [
-            {
-              "delta": {
-                "content": " star",
-                "function_call": null,
-                "refusal": null,
-                "role": "assistant",
-                "tool_calls": null
-              },
-              "finish_reason": null,
-              "index": 0,
-              "logprobs": null
-            }
-          ],
-          "created": 1754081847,
-          "model": "llama3.2:3b-instruct-fp16",
-          "object": "chat.completion.chunk",
-          "service_tier": null,
-          "system_fingerprint": "fp_ollama",
-          "usage": null
-        }
-      },
-      {
-        "__type__": "openai.types.chat.chat_completion_chunk.ChatCompletionChunk",
-        "__data__": {
-          "id": "chatcmpl-458",
-          "choices": [
-            {
-              "delta": {
-                "content": " at",
-                "function_call": null,
-                "refusal": null,
-                "role": "assistant",
-                "tool_calls": null
-              },
-              "finish_reason": null,
-              "index": 0,
-              "logprobs": null
-            }
-          ],
-          "created": 1754081847,
-          "model": "llama3.2:3b-instruct-fp16",
-          "object": "chat.completion.chunk",
-          "service_tier": null,
-          "system_fingerprint": "fp_ollama",
-          "usage": null
-        }
-      },
-      {
-        "__type__": "openai.types.chat.chat_completion_chunk.ChatCompletionChunk",
-        "__data__": {
-          "id": "chatcmpl-458",
-          "choices": [
-            {
-              "delta": {
-                "content": " the",
-                "function_call": null,
-                "refusal": null,
-                "role": "assistant",
-                "tool_calls": null
-              },
-              "finish_reason": null,
-              "index": 0,
-              "logprobs": null
-            }
-          ],
-          "created": 1754081847,
-          "model": "llama3.2:3b-instruct-fp16",
-          "object": "chat.completion.chunk",
-          "service_tier": null,
-          "system_fingerprint": "fp_ollama",
-          "usage": null
-        }
-      },
-      {
-        "__type__": "openai.types.chat.chat_completion_chunk.ChatCompletionChunk",
-        "__data__": {
-          "id": "chatcmpl-458",
-          "choices": [
-            {
-              "delta": {
-                "content": " center",
-                "function_call": null,
-                "refusal": null,
-                "role": "assistant",
-                "tool_calls": null
-              },
-              "finish_reason": null,
-              "index": 0,
-              "logprobs": null
-            }
-          ],
-          "created": 1754081847,
-          "model": "llama3.2:3b-instruct-fp16",
-          "object": "chat.completion.chunk",
-          "service_tier": null,
-          "system_fingerprint": "fp_ollama",
-          "usage": null
-        }
-      },
-      {
-        "__type__": "openai.types.chat.chat_completion_chunk.ChatCompletionChunk",
-        "__data__": {
-          "id": "chatcmpl-458",
-          "choices": [
-            {
-              "delta": {
-                "content": " of",
-                "function_call": null,
-                "refusal": null,
-                "role": "assistant",
-                "tool_calls": null
-              },
-              "finish_reason": null,
-              "index": 0,
-              "logprobs": null
-            }
-          ],
-          "created": 1754081847,
-          "model": "llama3.2:3b-instruct-fp16",
-          "object": "chat.completion.chunk",
-          "service_tier": null,
-          "system_fingerprint": "fp_ollama",
-          "usage": null
-        }
-      },
-      {
-        "__type__": "openai.types.chat.chat_completion_chunk.ChatCompletionChunk",
-        "__data__": {
-          "id": "chatcmpl-458",
-          "choices": [
-            {
-              "delta": {
-                "content": " our",
-                "function_call": null,
-                "refusal": null,
-                "role": "assistant",
-                "tool_calls": null
-              },
-              "finish_reason": null,
-              "index": 0,
-              "logprobs": null
-            }
-          ],
-          "created": 1754081847,
-          "model": "llama3.2:3b-instruct-fp16",
-          "object": "chat.completion.chunk",
-          "service_tier": null,
-          "system_fingerprint": "fp_ollama",
-          "usage": null
-        }
-      },
-      {
-        "__type__": "openai.types.chat.chat_completion_chunk.ChatCompletionChunk",
-        "__data__": {
-          "id": "chatcmpl-458",
-          "choices": [
-            {
-              "delta": {
-                "content": " solar",
-                "function_call": null,
-                "refusal": null,
-                "role": "assistant",
-                "tool_calls": null
-              },
-              "finish_reason": null,
-              "index": 0,
-              "logprobs": null
-            }
-          ],
-          "created": 1754081847,
-          "model": "llama3.2:3b-instruct-fp16",
-          "object": "chat.completion.chunk",
-          "service_tier": null,
-          "system_fingerprint": "fp_ollama",
-          "usage": null
-        }
-      },
-      {
-        "__type__": "openai.types.chat.chat_completion_chunk.ChatCompletionChunk",
-        "__data__": {
-          "id": "chatcmpl-458",
-          "choices": [
-            {
-              "delta": {
-                "content": " system",
-                "function_call": null,
-                "refusal": null,
-                "role": "assistant",
-                "tool_calls": null
-              },
-              "finish_reason": null,
-              "index": 0,
-              "logprobs": null
-            }
-          ],
-          "created": 1754081847,
-          "model": "llama3.2:3b-instruct-fp16",
-          "object": "chat.completion.chunk",
-          "service_tier": null,
-          "system_fingerprint": "fp_ollama",
-          "usage": null
-        }
-      },
-      {
-        "__type__": "openai.types.chat.chat_completion_chunk.ChatCompletionChunk",
-        "__data__": {
-          "id": "chatcmpl-458",
-          "choices": [
-            {
-              "delta": {
-                "content": " is",
-                "function_call": null,
-                "refusal": null,
-                "role": "assistant",
-                "tool_calls": null
-              },
-              "finish_reason": null,
-              "index": 0,
-              "logprobs": null
-            }
-          ],
-          "created": 1754081847,
-          "model": "llama3.2:3b-instruct-fp16",
-          "object": "chat.completion.chunk",
-          "service_tier": null,
-          "system_fingerprint": "fp_ollama",
-          "usage": null
-        }
-      },
-      {
-        "__type__": "openai.types.chat.chat_completion_chunk.ChatCompletionChunk",
-        "__data__": {
-          "id": "chatcmpl-458",
-          "choices": [
-            {
-              "delta": {
-                "content": " simply",
-                "function_call": null,
-                "refusal": null,
-                "role": "assistant",
-                "tool_calls": null
-              },
-              "finish_reason": null,
-              "index": 0,
-              "logprobs": null
-            }
-          ],
-          "created": 1754081847,
-          "model": "llama3.2:3b-instruct-fp16",
-          "object": "chat.completion.chunk",
-          "service_tier": null,
-          "system_fingerprint": "fp_ollama",
-          "usage": null
-        }
-      },
-      {
-        "__type__": "openai.types.chat.chat_completion_chunk.ChatCompletionChunk",
-        "__data__": {
-          "id": "chatcmpl-458",
-          "choices": [
-            {
-              "delta": {
-                "content": " \"",
-                "function_call": null,
-                "refusal": null,
-                "role": "assistant",
-                "tool_calls": null
-              },
-              "finish_reason": null,
-              "index": 0,
-              "logprobs": null
-            }
-          ],
-          "created": 1754081847,
-          "model": "llama3.2:3b-instruct-fp16",
-          "object": "chat.completion.chunk",
-          "service_tier": null,
-          "system_fingerprint": "fp_ollama",
-          "usage": null
-        }
-      },
-      {
-        "__type__": "openai.types.chat.chat_completion_chunk.ChatCompletionChunk",
-        "__data__": {
-          "id": "chatcmpl-458",
-          "choices": [
-            {
-              "delta": {
-                "content": "the",
-                "function_call": null,
-                "refusal": null,
-                "role": "assistant",
-                "tool_calls": null
-              },
-              "finish_reason": null,
-              "index": 0,
-              "logprobs": null
-            }
-          ],
-          "created": 1754081847,
-          "model": "llama3.2:3b-instruct-fp16",
-          "object": "chat.completion.chunk",
-          "service_tier": null,
-          "system_fingerprint": "fp_ollama",
-          "usage": null
-        }
-      },
-      {
-        "__type__": "openai.types.chat.chat_completion_chunk.ChatCompletionChunk",
-        "__data__": {
-          "id": "chatcmpl-458",
-          "choices": [
-            {
-              "delta": {
-                "content": " Sun",
-                "function_call": null,
-                "refusal": null,
-                "role": "assistant",
-                "tool_calls": null
-              },
-              "finish_reason": null,
-              "index": 0,
-              "logprobs": null
-            }
-          ],
-          "created": 1754081847,
-          "model": "llama3.2:3b-instruct-fp16",
-          "object": "chat.completion.chunk",
-          "service_tier": null,
-          "system_fingerprint": "fp_ollama",
-          "usage": null
-        }
-      },
-      {
-        "__type__": "openai.types.chat.chat_completion_chunk.ChatCompletionChunk",
-        "__data__": {
-          "id": "chatcmpl-458",
-          "choices": [
-            {
-              "delta": {
-                "content": ",\"",
-                "function_call": null,
-                "refusal": null,
-                "role": "assistant",
-                "tool_calls": null
-              },
-              "finish_reason": null,
-              "index": 0,
-              "logprobs": null
-            }
-          ],
-          "created": 1754081847,
-          "model": "llama3.2:3b-instruct-fp16",
-          "object": "chat.completion.chunk",
-          "service_tier": null,
-          "system_fingerprint": "fp_ollama",
-          "usage": null
-        }
-      },
-      {
-        "__type__": "openai.types.chat.chat_completion_chunk.ChatCompletionChunk",
-        "__data__": {
-          "id": "chatcmpl-458",
-          "choices": [
-            {
-              "delta": {
-                "content": " but",
-                "function_call": null,
-                "refusal": null,
-                "role": "assistant",
-                "tool_calls": null
-              },
-              "finish_reason": null,
-              "index": 0,
-              "logprobs": null
-            }
-          ],
-          "created": 1754081847,
-          "model": "llama3.2:3b-instruct-fp16",
-          "object": "chat.completion.chunk",
-          "service_tier": null,
-          "system_fingerprint": "fp_ollama",
-          "usage": null
-        }
-      },
-      {
-        "__type__": "openai.types.chat.chat_completion_chunk.ChatCompletionChunk",
-        "__data__": {
-          "id": "chatcmpl-458",
-          "choices": [
-            {
-              "delta": {
-                "content": " \"",
-                "function_call": null,
-                "refusal": null,
-                "role": "assistant",
-                "tool_calls": null
-              },
-              "finish_reason": null,
-              "index": 0,
-              "logprobs": null
-            }
-          ],
-          "created": 1754081847,
-          "model": "llama3.2:3b-instruct-fp16",
-          "object": "chat.completion.chunk",
-          "service_tier": null,
-          "system_fingerprint": "fp_ollama",
-          "usage": null
-        }
-      },
-      {
-        "__type__": "openai.types.chat.chat_completion_chunk.ChatCompletionChunk",
-        "__data__": {
-          "id": "chatcmpl-458",
-          "choices": [
-            {
-              "delta": {
-                "content": "Sol",
-                "function_call": null,
-                "refusal": null,
-                "role": "assistant",
-                "tool_calls": null
-              },
-              "finish_reason": null,
-              "index": 0,
-              "logprobs": null
-            }
-          ],
-          "created": 1754081847,
-          "model": "llama3.2:3b-instruct-fp16",
-          "object": "chat.completion.chunk",
-          "service_tier": null,
-          "system_fingerprint": "fp_ollama",
-          "usage": null
-        }
-      },
-      {
-        "__type__": "openai.types.chat.chat_completion_chunk.ChatCompletionChunk",
-        "__data__": {
-          "id": "chatcmpl-458",
-          "choices": [
-            {
-              "delta": {
-                "content": "\"",
-                "function_call": null,
-                "refusal": null,
-                "role": "assistant",
-                "tool_calls": null
-              },
-              "finish_reason": null,
-              "index": 0,
-              "logprobs": null
-            }
-          ],
-          "created": 1754081847,
-          "model": "llama3.2:3b-instruct-fp16",
-          "object": "chat.completion.chunk",
-          "service_tier": null,
-          "system_fingerprint": "fp_ollama",
-          "usage": null
-        }
-      },
-      {
-        "__type__": "openai.types.chat.chat_completion_chunk.ChatCompletionChunk",
-        "__data__": {
-          "id": "chatcmpl-458",
-          "choices": [
-            {
-              "delta": {
-                "content": " remains",
-                "function_call": null,
-                "refusal": null,
-                "role": "assistant",
-                "tool_calls": null
-              },
-              "finish_reason": null,
-              "index": 0,
-              "logprobs": null
-            }
-          ],
-          "created": 1754081848,
-          "model": "llama3.2:3b-instruct-fp16",
-          "object": "chat.completion.chunk",
-          "service_tier": null,
-          "system_fingerprint": "fp_ollama",
-          "usage": null
-        }
-      },
-      {
-        "__type__": "openai.types.chat.chat_completion_chunk.ChatCompletionChunk",
-        "__data__": {
-          "id": "chatcmpl-458",
+          "id": "chatcmpl-792",
           "choices": [
             {
               "delta": {
@@ -1466,7 +452,7 @@
               "logprobs": null
             }
           ],
-          "created": 1754081848,
+          "created": 1756921356,
           "model": "llama3.2:3b-instruct-fp16",
           "object": "chat.completion.chunk",
           "service_tier": null,
@@ -1477,11 +463,11 @@
       {
         "__type__": "openai.types.chat.chat_completion_chunk.ChatCompletionChunk",
         "__data__": {
-          "id": "chatcmpl-458",
+          "id": "chatcmpl-792",
           "choices": [
             {
               "delta": {
-                "content": " commonly",
+                "content": " god",
                 "function_call": null,
                 "refusal": null,
                 "role": "assistant",
@@ -1492,7 +478,7 @@
               "logprobs": null
             }
           ],
-          "created": 1754081848,
+          "created": 1756921356,
           "model": "llama3.2:3b-instruct-fp16",
           "object": "chat.completion.chunk",
           "service_tier": null,
@@ -1503,11 +489,11 @@
       {
         "__type__": "openai.types.chat.chat_completion_chunk.ChatCompletionChunk",
         "__data__": {
-          "id": "chatcmpl-458",
+          "id": "chatcmpl-792",
           "choices": [
             {
               "delta": {
-                "content": " used",
+                "content": " equivalent",
                 "function_call": null,
                 "refusal": null,
                 "role": "assistant",
@@ -1518,7 +504,7 @@
               "logprobs": null
             }
           ],
-          "created": 1754081848,
+          "created": 1756921356,
           "model": "llama3.2:3b-instruct-fp16",
           "object": "chat.completion.chunk",
           "service_tier": null,
@@ -1529,11 +515,11 @@
       {
         "__type__": "openai.types.chat.chat_completion_chunk.ChatCompletionChunk",
         "__data__": {
-          "id": "chatcmpl-458",
+          "id": "chatcmpl-792",
           "choices": [
             {
               "delta": {
-                "content": " term",
+                "content": " to",
                 "function_call": null,
                 "refusal": null,
                 "role": "assistant",
@@ -1544,7 +530,7 @@
               "logprobs": null
             }
           ],
-          "created": 1754081848,
+          "created": 1756921356,
           "model": "llama3.2:3b-instruct-fp16",
           "object": "chat.completion.chunk",
           "service_tier": null,
@@ -1555,11 +541,11 @@
       {
         "__type__": "openai.types.chat.chat_completion_chunk.ChatCompletionChunk",
         "__data__": {
-          "id": "chatcmpl-458",
+          "id": "chatcmpl-792",
           "choices": [
             {
               "delta": {
-                "content": " in",
+                "content": " the",
                 "function_call": null,
                 "refusal": null,
                 "role": "assistant",
@@ -1570,7 +556,7 @@
               "logprobs": null
             }
           ],
-          "created": 1754081848,
+          "created": 1756921356,
           "model": "llama3.2:3b-instruct-fp16",
           "object": "chat.completion.chunk",
           "service_tier": null,
@@ -1581,11 +567,11 @@
       {
         "__type__": "openai.types.chat.chat_completion_chunk.ChatCompletionChunk",
         "__data__": {
-          "id": "chatcmpl-458",
+          "id": "chatcmpl-792",
           "choices": [
             {
               "delta": {
-                "content": " astronomy",
+                "content": " Greek",
                 "function_call": null,
                 "refusal": null,
                 "role": "assistant",
@@ -1596,7 +582,7 @@
               "logprobs": null
             }
           ],
-          "created": 1754081848,
+          "created": 1756921356,
           "model": "llama3.2:3b-instruct-fp16",
           "object": "chat.completion.chunk",
           "service_tier": null,
@@ -1607,7 +593,111 @@
       {
         "__type__": "openai.types.chat.chat_completion_chunk.ChatCompletionChunk",
         "__data__": {
-          "id": "chatcmpl-458",
+          "id": "chatcmpl-792",
+          "choices": [
+            {
+              "delta": {
+                "content": " god",
+                "function_call": null,
+                "refusal": null,
+                "role": "assistant",
+                "tool_calls": null
+              },
+              "finish_reason": null,
+              "index": 0,
+              "logprobs": null
+            }
+          ],
+          "created": 1756921356,
+          "model": "llama3.2:3b-instruct-fp16",
+          "object": "chat.completion.chunk",
+          "service_tier": null,
+          "system_fingerprint": "fp_ollama",
+          "usage": null
+        }
+      },
+      {
+        "__type__": "openai.types.chat.chat_completion_chunk.ChatCompletionChunk",
+        "__data__": {
+          "id": "chatcmpl-792",
+          "choices": [
+            {
+              "delta": {
+                "content": " Hel",
+                "function_call": null,
+                "refusal": null,
+                "role": "assistant",
+                "tool_calls": null
+              },
+              "finish_reason": null,
+              "index": 0,
+              "logprobs": null
+            }
+          ],
+          "created": 1756921356,
+          "model": "llama3.2:3b-instruct-fp16",
+          "object": "chat.completion.chunk",
+          "service_tier": null,
+          "system_fingerprint": "fp_ollama",
+          "usage": null
+        }
+      },
+      {
+        "__type__": "openai.types.chat.chat_completion_chunk.ChatCompletionChunk",
+        "__data__": {
+          "id": "chatcmpl-792",
+          "choices": [
+            {
+              "delta": {
+                "content": "ios",
+                "function_call": null,
+                "refusal": null,
+                "role": "assistant",
+                "tool_calls": null
+              },
+              "finish_reason": null,
+              "index": 0,
+              "logprobs": null
+            }
+          ],
+          "created": 1756921357,
+          "model": "llama3.2:3b-instruct-fp16",
+          "object": "chat.completion.chunk",
+          "service_tier": null,
+          "system_fingerprint": "fp_ollama",
+          "usage": null
+        }
+      },
+      {
+        "__type__": "openai.types.chat.chat_completion_chunk.ChatCompletionChunk",
+        "__data__": {
+          "id": "chatcmpl-792",
+          "choices": [
+            {
+              "delta": {
+                "content": ",",
+                "function_call": null,
+                "refusal": null,
+                "role": "assistant",
+                "tool_calls": null
+              },
+              "finish_reason": null,
+              "index": 0,
+              "logprobs": null
+            }
+          ],
+          "created": 1756921357,
+          "model": "llama3.2:3b-instruct-fp16",
+          "object": "chat.completion.chunk",
+          "service_tier": null,
+          "system_fingerprint": "fp_ollama",
+          "usage": null
+        }
+      },
+      {
+        "__type__": "openai.types.chat.chat_completion_chunk.ChatCompletionChunk",
+        "__data__": {
+          "id": "chatcmpl-792",
           "choices": [
             {
               "delta": {
@@ -1622,7 +712,7 @@
               "logprobs": null
             }
           ],
-          "created": 1754081848,
+          "created": 1756921357,
           "model": "llama3.2:3b-instruct-fp16",
           "object": "chat.completion.chunk",
           "service_tier": null,
@@ -1633,11 +723,11 @@
       {
         "__type__": "openai.types.chat.chat_completion_chunk.ChatCompletionChunk",
         "__data__": {
-          "id": "chatcmpl-458",
+          "id": "chatcmpl-792",
           "choices": [
             {
               "delta": {
-                "content": " classical",
+                "content": " he",
                 "function_call": null,
                 "refusal": null,
                 "role": "assistant",
@@ -1648,7 +738,7 @@
               "logprobs": null
             }
           ],
-          "created": 1754081848,
+          "created": 1756921357,
           "model": "llama3.2:3b-instruct-fp16",
           "object": "chat.completion.chunk",
           "service_tier": null,
@@ -1659,11 +749,11 @@
       {
         "__type__": "openai.types.chat.chat_completion_chunk.ChatCompletionChunk",
         "__data__": {
-          "id": "chatcmpl-458",
+          "id": "chatcmpl-792",
           "choices": [
             {
               "delta": {
-                "content": " studies",
+                "content": " was",
                 "function_call": null,
                 "refusal": null,
                 "role": "assistant",
@@ -1674,7 +764,7 @@
               "logprobs": null
             }
           ],
-          "created": 1754081848,
+          "created": 1756921357,
           "model": "llama3.2:3b-instruct-fp16",
           "object": "chat.completion.chunk",
           "service_tier": null,
@@ -1685,7 +775,371 @@
       {
         "__type__": "openai.types.chat.chat_completion_chunk.ChatCompletionChunk",
         "__data__": {
-          "id": "chatcmpl-458",
+          "id": "chatcmpl-792",
+          "choices": [
+            {
+              "delta": {
+                "content": " often",
+                "function_call": null,
+                "refusal": null,
+                "role": "assistant",
+                "tool_calls": null
+              },
+              "finish_reason": null,
+              "index": 0,
+              "logprobs": null
+            }
+          ],
+          "created": 1756921357,
+          "model": "llama3.2:3b-instruct-fp16",
+          "object": "chat.completion.chunk",
+          "service_tier": null,
+          "system_fingerprint": "fp_ollama",
+          "usage": null
+        }
+      },
+      {
+        "__type__": "openai.types.chat.chat_completion_chunk.ChatCompletionChunk",
+        "__data__": {
+          "id": "chatcmpl-792",
+          "choices": [
+            {
+              "delta": {
+                "content": " depicted",
+                "function_call": null,
+                "refusal": null,
+                "role": "assistant",
+                "tool_calls": null
+              },
+              "finish_reason": null,
+              "index": 0,
+              "logprobs": null
+            }
+          ],
+          "created": 1756921357,
+          "model": "llama3.2:3b-instruct-fp16",
+          "object": "chat.completion.chunk",
+          "service_tier": null,
+          "system_fingerprint": "fp_ollama",
+          "usage": null
+        }
+      },
+      {
+        "__type__": "openai.types.chat.chat_completion_chunk.ChatCompletionChunk",
+        "__data__": {
+          "id": "chatcmpl-792",
+          "choices": [
+            {
+              "delta": {
+                "content": " as",
+                "function_call": null,
+                "refusal": null,
+                "role": "assistant",
+                "tool_calls": null
+              },
+              "finish_reason": null,
+              "index": 0,
+              "logprobs": null
+            }
+          ],
+          "created": 1756921357,
+          "model": "llama3.2:3b-instruct-fp16",
+          "object": "chat.completion.chunk",
+          "service_tier": null,
+          "system_fingerprint": "fp_ollama",
+          "usage": null
+        }
+      },
+      {
+        "__type__": "openai.types.chat.chat_completion_chunk.ChatCompletionChunk",
+        "__data__": {
+          "id": "chatcmpl-792",
+          "choices": [
+            {
+              "delta": {
+                "content": " a",
+                "function_call": null,
+                "refusal": null,
+                "role": "assistant",
+                "tool_calls": null
+              },
+              "finish_reason": null,
+              "index": 0,
+              "logprobs": null
+            }
+          ],
+          "created": 1756921357,
+          "model": "llama3.2:3b-instruct-fp16",
+          "object": "chat.completion.chunk",
+          "service_tier": null,
+          "system_fingerprint": "fp_ollama",
+          "usage": null
+        }
+      },
+      {
+        "__type__": "openai.types.chat.chat_completion_chunk.ChatCompletionChunk",
+        "__data__": {
+          "id": "chatcmpl-792",
+          "choices": [
+            {
+              "delta": {
+                "content": " radi",
+                "function_call": null,
+                "refusal": null,
+                "role": "assistant",
+                "tool_calls": null
+              },
+              "finish_reason": null,
+              "index": 0,
+              "logprobs": null
+            }
+          ],
+          "created": 1756921357,
+          "model": "llama3.2:3b-instruct-fp16",
+          "object": "chat.completion.chunk",
+          "service_tier": null,
+          "system_fingerprint": "fp_ollama",
+          "usage": null
+        }
+      },
+      {
+        "__type__": "openai.types.chat.chat_completion_chunk.ChatCompletionChunk",
+        "__data__": {
+          "id": "chatcmpl-792",
+          "choices": [
+            {
+              "delta": {
+                "content": "ating",
+                "function_call": null,
+                "refusal": null,
+                "role": "assistant",
+                "tool_calls": null
+              },
+              "finish_reason": null,
+              "index": 0,
+              "logprobs": null
+            }
+          ],
+          "created": 1756921357,
+          "model": "llama3.2:3b-instruct-fp16",
+          "object": "chat.completion.chunk",
+          "service_tier": null,
+          "system_fingerprint": "fp_ollama",
+          "usage": null
+        }
+      },
+      {
+        "__type__": "openai.types.chat.chat_completion_chunk.ChatCompletionChunk",
+        "__data__": {
+          "id": "chatcmpl-792",
+          "choices": [
+            {
+              "delta": {
+                "content": " sun",
+                "function_call": null,
+                "refusal": null,
+                "role": "assistant",
+                "tool_calls": null
+              },
+              "finish_reason": null,
+              "index": 0,
+              "logprobs": null
+            }
+          ],
+          "created": 1756921357,
+          "model": "llama3.2:3b-instruct-fp16",
+          "object": "chat.completion.chunk",
+          "service_tier": null,
+          "system_fingerprint": "fp_ollama",
+          "usage": null
+        }
+      },
+      {
+        "__type__": "openai.types.chat.chat_completion_chunk.ChatCompletionChunk",
+        "__data__": {
+          "id": "chatcmpl-792",
+          "choices": [
+            {
+              "delta": {
+                "content": " with",
+                "function_call": null,
+                "refusal": null,
+                "role": "assistant",
+                "tool_calls": null
+              },
+              "finish_reason": null,
+              "index": 0,
+              "logprobs": null
+            }
+          ],
+          "created": 1756921357,
+          "model": "llama3.2:3b-instruct-fp16",
+          "object": "chat.completion.chunk",
+          "service_tier": null,
+          "system_fingerprint": "fp_ollama",
+          "usage": null
+        }
+      },
+      {
+        "__type__": "openai.types.chat.chat_completion_chunk.ChatCompletionChunk",
+        "__data__": {
+          "id": "chatcmpl-792",
+          "choices": [
+            {
+              "delta": {
+                "content": " rays",
+                "function_call": null,
+                "refusal": null,
+                "role": "assistant",
+                "tool_calls": null
+              },
+              "finish_reason": null,
+              "index": 0,
+              "logprobs": null
+            }
+          ],
+          "created": 1756921357,
+          "model": "llama3.2:3b-instruct-fp16",
+          "object": "chat.completion.chunk",
+          "service_tier": null,
+          "system_fingerprint": "fp_ollama",
+          "usage": null
+        }
+      },
+      {
+        "__type__": "openai.types.chat.chat_completion_chunk.ChatCompletionChunk",
+        "__data__": {
+          "id": "chatcmpl-792",
+          "choices": [
+            {
+              "delta": {
+                "content": " eman",
+                "function_call": null,
+                "refusal": null,
+                "role": "assistant",
+                "tool_calls": null
+              },
+              "finish_reason": null,
+              "index": 0,
+              "logprobs": null
+            }
+          ],
+          "created": 1756921357,
+          "model": "llama3.2:3b-instruct-fp16",
+          "object": "chat.completion.chunk",
+          "service_tier": null,
+          "system_fingerprint": "fp_ollama",
+          "usage": null
+        }
+      },
+      {
+        "__type__": "openai.types.chat.chat_completion_chunk.ChatCompletionChunk",
+        "__data__": {
+          "id": "chatcmpl-792",
+          "choices": [
+            {
+              "delta": {
+                "content": "ating",
+                "function_call": null,
+                "refusal": null,
+                "role": "assistant",
+                "tool_calls": null
+              },
+              "finish_reason": null,
+              "index": 0,
+              "logprobs": null
+            }
+          ],
+          "created": 1756921357,
+          "model": "llama3.2:3b-instruct-fp16",
+          "object": "chat.completion.chunk",
+          "service_tier": null,
+          "system_fingerprint": "fp_ollama",
+          "usage": null
+        }
+      },
+      {
+        "__type__": "openai.types.chat.chat_completion_chunk.ChatCompletionChunk",
+        "__data__": {
+          "id": "chatcmpl-792",
+          "choices": [
+            {
+              "delta": {
+                "content": " from",
+                "function_call": null,
+                "refusal": null,
+                "role": "assistant",
+                "tool_calls": null
+              },
+              "finish_reason": null,
+              "index": 0,
+              "logprobs": null
+            }
+          ],
+          "created": 1756921357,
+          "model": "llama3.2:3b-instruct-fp16",
+          "object": "chat.completion.chunk",
+          "service_tier": null,
+          "system_fingerprint": "fp_ollama",
+          "usage": null
+        }
+      },
+      {
+        "__type__": "openai.types.chat.chat_completion_chunk.ChatCompletionChunk",
+        "__data__": {
+          "id": "chatcmpl-792",
+          "choices": [
+            {
+              "delta": {
+                "content": " his",
+                "function_call": null,
+                "refusal": null,
+                "role": "assistant",
+                "tool_calls": null
+              },
+              "finish_reason": null,
+              "index": 0,
+              "logprobs": null
+            }
+          ],
+          "created": 1756921357,
+          "model": "llama3.2:3b-instruct-fp16",
+          "object": "chat.completion.chunk",
+          "service_tier": null,
+          "system_fingerprint": "fp_ollama",
+          "usage": null
+        }
+      },
+      {
+        "__type__": "openai.types.chat.chat_completion_chunk.ChatCompletionChunk",
+        "__data__": {
+          "id": "chatcmpl-792",
+          "choices": [
+            {
+              "delta": {
+                "content": " body",
+                "function_call": null,
+                "refusal": null,
+                "role": "assistant",
+                "tool_calls": null
+              },
+              "finish_reason": null,
+              "index": 0,
+              "logprobs": null
+            }
+          ],
+          "created": 1756921357,
+          "model": "llama3.2:3b-instruct-fp16",
+          "object": "chat.completion.chunk",
+          "service_tier": null,
+          "system_fingerprint": "fp_ollama",
+          "usage": null
+        }
+      },
+      {
+        "__type__": "openai.types.chat.chat_completion_chunk.ChatCompletionChunk",
+        "__data__": {
+          "id": "chatcmpl-792",
           "choices": [
             {
               "delta": {
@@ -1700,7 +1154,7 @@
               "logprobs": null
             }
           ],
-          "created": 1754081848,
+          "created": 1756921357,
           "model": "llama3.2:3b-instruct-fp16",
           "object": "chat.completion.chunk",
           "service_tier": null,
@@ -1711,7 +1165,709 @@
       {
         "__type__": "openai.types.chat.chat_completion_chunk.ChatCompletionChunk",
         "__data__": {
-          "id": "chatcmpl-458",
+          "id": "chatcmpl-792",
+          "choices": [
+            {
+              "delta": {
+                "content": " The",
+                "function_call": null,
+                "refusal": null,
+                "role": "assistant",
+                "tool_calls": null
+              },
+              "finish_reason": null,
+              "index": 0,
+              "logprobs": null
+            }
+          ],
+          "created": 1756921357,
+          "model": "llama3.2:3b-instruct-fp16",
+          "object": "chat.completion.chunk",
+          "service_tier": null,
+          "system_fingerprint": "fp_ollama",
+          "usage": null
+        }
+      },
+      {
+        "__type__": "openai.types.chat.chat_completion_chunk.ChatCompletionChunk",
+        "__data__": {
+          "id": "chatcmpl-792",
+          "choices": [
+            {
+              "delta": {
+                "content": " term",
+                "function_call": null,
+                "refusal": null,
+                "role": "assistant",
+                "tool_calls": null
+              },
+              "finish_reason": null,
+              "index": 0,
+              "logprobs": null
+            }
+          ],
+          "created": 1756921357,
+          "model": "llama3.2:3b-instruct-fp16",
+          "object": "chat.completion.chunk",
+          "service_tier": null,
+          "system_fingerprint": "fp_ollama",
+          "usage": null
+        }
+      },
+      {
+        "__type__": "openai.types.chat.chat_completion_chunk.ChatCompletionChunk",
+        "__data__": {
+          "id": "chatcmpl-792",
+          "choices": [
+            {
+              "delta": {
+                "content": " \"",
+                "function_call": null,
+                "refusal": null,
+                "role": "assistant",
+                "tool_calls": null
+              },
+              "finish_reason": null,
+              "index": 0,
+              "logprobs": null
+            }
+          ],
+          "created": 1756921357,
+          "model": "llama3.2:3b-instruct-fp16",
+          "object": "chat.completion.chunk",
+          "service_tier": null,
+          "system_fingerprint": "fp_ollama",
+          "usage": null
+        }
+      },
+      {
+        "__type__": "openai.types.chat.chat_completion_chunk.ChatCompletionChunk",
+        "__data__": {
+          "id": "chatcmpl-792",
+          "choices": [
+            {
+              "delta": {
+                "content": "s",
+                "function_call": null,
+                "refusal": null,
+                "role": "assistant",
+                "tool_calls": null
+              },
+              "finish_reason": null,
+              "index": 0,
+              "logprobs": null
+            }
+          ],
+          "created": 1756921357,
+          "model": "llama3.2:3b-instruct-fp16",
+          "object": "chat.completion.chunk",
+          "service_tier": null,
+          "system_fingerprint": "fp_ollama",
+          "usage": null
+        }
+      },
+      {
+        "__type__": "openai.types.chat.chat_completion_chunk.ChatCompletionChunk",
+        "__data__": {
+          "id": "chatcmpl-792",
+          "choices": [
+            {
+              "delta": {
+                "content": "olar",
+                "function_call": null,
+                "refusal": null,
+                "role": "assistant",
+                "tool_calls": null
+              },
+              "finish_reason": null,
+              "index": 0,
+              "logprobs": null
+            }
+          ],
+          "created": 1756921357,
+          "model": "llama3.2:3b-instruct-fp16",
+          "object": "chat.completion.chunk",
+          "service_tier": null,
+          "system_fingerprint": "fp_ollama",
+          "usage": null
+        }
+      },
+      {
+        "__type__": "openai.types.chat.chat_completion_chunk.ChatCompletionChunk",
+        "__data__": {
+          "id": "chatcmpl-792",
+          "choices": [
+            {
+              "delta": {
+                "content": "\"",
+                "function_call": null,
+                "refusal": null,
+                "role": "assistant",
+                "tool_calls": null
+              },
+              "finish_reason": null,
+              "index": 0,
+              "logprobs": null
+            }
+          ],
+          "created": 1756921358,
+          "model": "llama3.2:3b-instruct-fp16",
+          "object": "chat.completion.chunk",
+          "service_tier": null,
+          "system_fingerprint": "fp_ollama",
+          "usage": null
+        }
+      },
+      {
+        "__type__": "openai.types.chat.chat_completion_chunk.ChatCompletionChunk",
+        "__data__": {
+          "id": "chatcmpl-792",
+          "choices": [
+            {
+              "delta": {
+                "content": " is",
+                "function_call": null,
+                "refusal": null,
+                "role": "assistant",
+                "tool_calls": null
+              },
+              "finish_reason": null,
+              "index": 0,
+              "logprobs": null
+            }
+          ],
+          "created": 1756921358,
+          "model": "llama3.2:3b-instruct-fp16",
+          "object": "chat.completion.chunk",
+          "service_tier": null,
+          "system_fingerprint": "fp_ollama",
+          "usage": null
+        }
+      },
+      {
+        "__type__": "openai.types.chat.chat_completion_chunk.ChatCompletionChunk",
+        "__data__": {
+          "id": "chatcmpl-792",
+          "choices": [
+            {
+              "delta": {
+                "content": " still",
+                "function_call": null,
+                "refusal": null,
+                "role": "assistant",
+                "tool_calls": null
+              },
+              "finish_reason": null,
+              "index": 0,
+              "logprobs": null
+            }
+          ],
+          "created": 1756921358,
+          "model": "llama3.2:3b-instruct-fp16",
+          "object": "chat.completion.chunk",
+          "service_tier": null,
+          "system_fingerprint": "fp_ollama",
+          "usage": null
+        }
+      },
+      {
+        "__type__": "openai.types.chat.chat_completion_chunk.ChatCompletionChunk",
+        "__data__": {
+          "id": "chatcmpl-792",
+          "choices": [
+            {
+              "delta": {
+                "content": " used",
+                "function_call": null,
+                "refusal": null,
+                "role": "assistant",
+                "tool_calls": null
+              },
+              "finish_reason": null,
+              "index": 0,
+              "logprobs": null
+            }
+          ],
+          "created": 1756921358,
+          "model": "llama3.2:3b-instruct-fp16",
+          "object": "chat.completion.chunk",
+          "service_tier": null,
+          "system_fingerprint": "fp_ollama",
+          "usage": null
+        }
+      },
+      {
+        "__type__": "openai.types.chat.chat_completion_chunk.ChatCompletionChunk",
+        "__data__": {
+          "id": "chatcmpl-792",
+          "choices": [
+            {
+              "delta": {
+                "content": " in",
+                "function_call": null,
+                "refusal": null,
+                "role": "assistant",
+                "tool_calls": null
+              },
+              "finish_reason": null,
+              "index": 0,
+              "logprobs": null
+            }
+          ],
+          "created": 1756921358,
+          "model": "llama3.2:3b-instruct-fp16",
+          "object": "chat.completion.chunk",
+          "service_tier": null,
+          "system_fingerprint": "fp_ollama",
+          "usage": null
+        }
+      },
+      {
+        "__type__": "openai.types.chat.chat_completion_chunk.ChatCompletionChunk",
+        "__data__": {
+          "id": "chatcmpl-792",
+          "choices": [
+            {
+              "delta": {
+                "content": " scientific",
+                "function_call": null,
+                "refusal": null,
+                "role": "assistant",
+                "tool_calls": null
+              },
+              "finish_reason": null,
+              "index": 0,
+              "logprobs": null
+            }
+          ],
+          "created": 1756921358,
+          "model": "llama3.2:3b-instruct-fp16",
+          "object": "chat.completion.chunk",
+          "service_tier": null,
+          "system_fingerprint": "fp_ollama",
+          "usage": null
+        }
+      },
+      {
+        "__type__": "openai.types.chat.chat_completion_chunk.ChatCompletionChunk",
+        "__data__": {
+          "id": "chatcmpl-792",
+          "choices": [
+            {
+              "delta": {
+                "content": " and",
+                "function_call": null,
+                "refusal": null,
+                "role": "assistant",
+                "tool_calls": null
+              },
+              "finish_reason": null,
+              "index": 0,
+              "logprobs": null
+            }
+          ],
+          "created": 1756921358,
+          "model": "llama3.2:3b-instruct-fp16",
+          "object": "chat.completion.chunk",
+          "service_tier": null,
+          "system_fingerprint": "fp_ollama",
+          "usage": null
+        }
+      },
+      {
+        "__type__": "openai.types.chat.chat_completion_chunk.ChatCompletionChunk",
+        "__data__": {
+          "id": "chatcmpl-792",
+          "choices": [
+            {
+              "delta": {
+                "content": " astronomical",
+                "function_call": null,
+                "refusal": null,
+                "role": "assistant",
+                "tool_calls": null
+              },
+              "finish_reason": null,
+              "index": 0,
+              "logprobs": null
+            }
+          ],
+          "created": 1756921358,
+          "model": "llama3.2:3b-instruct-fp16",
+          "object": "chat.completion.chunk",
+          "service_tier": null,
+          "system_fingerprint": "fp_ollama",
+          "usage": null
+        }
+      },
+      {
+        "__type__": "openai.types.chat.chat_completion_chunk.ChatCompletionChunk",
+        "__data__": {
+          "id": "chatcmpl-792",
+          "choices": [
+            {
+              "delta": {
+                "content": " contexts",
+                "function_call": null,
+                "refusal": null,
+                "role": "assistant",
+                "tool_calls": null
+              },
+              "finish_reason": null,
+              "index": 0,
+              "logprobs": null
+            }
+          ],
+          "created": 1756921358,
+          "model": "llama3.2:3b-instruct-fp16",
+          "object": "chat.completion.chunk",
+          "service_tier": null,
+          "system_fingerprint": "fp_ollama",
+          "usage": null
+        }
+      },
+      {
+        "__type__": "openai.types.chat.chat_completion_chunk.ChatCompletionChunk",
+        "__data__": {
+          "id": "chatcmpl-792",
+          "choices": [
+            {
+              "delta": {
+                "content": " to",
+                "function_call": null,
+                "refusal": null,
+                "role": "assistant",
+                "tool_calls": null
+              },
+              "finish_reason": null,
+              "index": 0,
+              "logprobs": null
+            }
+          ],
+          "created": 1756921358,
+          "model": "llama3.2:3b-instruct-fp16",
+          "object": "chat.completion.chunk",
+          "service_tier": null,
+          "system_fingerprint": "fp_ollama",
+          "usage": null
+        }
+      },
+      {
+        "__type__": "openai.types.chat.chat_completion_chunk.ChatCompletionChunk",
+        "__data__": {
+          "id": "chatcmpl-792",
+          "choices": [
+            {
+              "delta": {
+                "content": " refer",
+                "function_call": null,
+                "refusal": null,
+                "role": "assistant",
+                "tool_calls": null
+              },
+              "finish_reason": null,
+              "index": 0,
+              "logprobs": null
+            }
+          ],
+          "created": 1756921358,
+          "model": "llama3.2:3b-instruct-fp16",
+          "object": "chat.completion.chunk",
+          "service_tier": null,
+          "system_fingerprint": "fp_ollama",
+          "usage": null
+        }
+      },
+      {
+        "__type__": "openai.types.chat.chat_completion_chunk.ChatCompletionChunk",
+        "__data__": {
+          "id": "chatcmpl-792",
+          "choices": [
+            {
+              "delta": {
+                "content": " to",
+                "function_call": null,
+                "refusal": null,
+                "role": "assistant",
+                "tool_calls": null
+              },
+              "finish_reason": null,
+              "index": 0,
+              "logprobs": null
+            }
+          ],
+          "created": 1756921358,
+          "model": "llama3.2:3b-instruct-fp16",
+          "object": "chat.completion.chunk",
+          "service_tier": null,
+          "system_fingerprint": "fp_ollama",
+          "usage": null
+        }
+      },
+      {
+        "__type__": "openai.types.chat.chat_completion_chunk.ChatCompletionChunk",
+        "__data__": {
+          "id": "chatcmpl-792",
+          "choices": [
+            {
+              "delta": {
+                "content": " phenomena",
+                "function_call": null,
+                "refusal": null,
+                "role": "assistant",
+                "tool_calls": null
+              },
+              "finish_reason": null,
+              "index": 0,
+              "logprobs": null
+            }
+          ],
+          "created": 1756921358,
+          "model": "llama3.2:3b-instruct-fp16",
+          "object": "chat.completion.chunk",
+          "service_tier": null,
+          "system_fingerprint": "fp_ollama",
+          "usage": null
+        }
+      },
+      {
+        "__type__": "openai.types.chat.chat_completion_chunk.ChatCompletionChunk",
+        "__data__": {
+          "id": "chatcmpl-792",
+          "choices": [
+            {
+              "delta": {
+                "content": " related",
+                "function_call": null,
+                "refusal": null,
+                "role": "assistant",
+                "tool_calls": null
+              },
+              "finish_reason": null,
+              "index": 0,
+              "logprobs": null
+            }
+          ],
+          "created": 1756921358,
+          "model": "llama3.2:3b-instruct-fp16",
+          "object": "chat.completion.chunk",
+          "service_tier": null,
+          "system_fingerprint": "fp_ollama",
+          "usage": null
+        }
+      },
+      {
+        "__type__": "openai.types.chat.chat_completion_chunk.ChatCompletionChunk",
+        "__data__": {
+          "id": "chatcmpl-792",
+          "choices": [
+            {
+              "delta": {
+                "content": " to",
+                "function_call": null,
+                "refusal": null,
+                "role": "assistant",
+                "tool_calls": null
+              },
+              "finish_reason": null,
+              "index": 0,
+              "logprobs": null
+            }
+          ],
+          "created": 1756921358,
+          "model": "llama3.2:3b-instruct-fp16",
+          "object": "chat.completion.chunk",
+          "service_tier": null,
+          "system_fingerprint": "fp_ollama",
+          "usage": null
+        }
+      },
+      {
+        "__type__": "openai.types.chat.chat_completion_chunk.ChatCompletionChunk",
+        "__data__": {
+          "id": "chatcmpl-792",
+          "choices": [
+            {
+              "delta": {
+                "content": " the",
+                "function_call": null,
+                "refusal": null,
+                "role": "assistant",
+                "tool_calls": null
+              },
+              "finish_reason": null,
+              "index": 0,
+              "logprobs": null
+            }
+          ],
+          "created": 1756921358,
+          "model": "llama3.2:3b-instruct-fp16",
+          "object": "chat.completion.chunk",
+          "service_tier": null,
+          "system_fingerprint": "fp_ollama",
+          "usage": null
+        }
+      },
+      {
+        "__type__": "openai.types.chat.chat_completion_chunk.ChatCompletionChunk",
+        "__data__": {
+          "id": "chatcmpl-792",
+          "choices": [
+            {
+              "delta": {
+                "content": " Sun",
+                "function_call": null,
+                "refusal": null,
+                "role": "assistant",
+                "tool_calls": null
+              },
+              "finish_reason": null,
+              "index": 0,
+              "logprobs": null
+            }
+          ],
+          "created": 1756921358,
+          "model": "llama3.2:3b-instruct-fp16",
+          "object": "chat.completion.chunk",
+          "service_tier": null,
+          "system_fingerprint": "fp_ollama",
+          "usage": null
+        }
+      },
+      {
+        "__type__": "openai.types.chat.chat_completion_chunk.ChatCompletionChunk",
+        "__data__": {
+          "id": "chatcmpl-792",
+          "choices": [
+            {
+              "delta": {
+                "content": " or",
+                "function_call": null,
+                "refusal": null,
+                "role": "assistant",
+                "tool_calls": null
+              },
+              "finish_reason": null,
+              "index": 0,
+              "logprobs": null
+            }
+          ],
+          "created": 1756921358,
+          "model": "llama3.2:3b-instruct-fp16",
+          "object": "chat.completion.chunk",
+          "service_tier": null,
+          "system_fingerprint": "fp_ollama",
+          "usage": null
+        }
+      },
+      {
+        "__type__": "openai.types.chat.chat_completion_chunk.ChatCompletionChunk",
+        "__data__": {
+          "id": "chatcmpl-792",
+          "choices": [
+            {
+              "delta": {
+                "content": " the",
+                "function_call": null,
+                "refusal": null,
+                "role": "assistant",
+                "tool_calls": null
+              },
+              "finish_reason": null,
+              "index": 0,
+              "logprobs": null
+            }
+          ],
+          "created": 1756921358,
+          "model": "llama3.2:3b-instruct-fp16",
+          "object": "chat.completion.chunk",
+          "service_tier": null,
+          "system_fingerprint": "fp_ollama",
+          "usage": null
+        }
+      },
+      {
+        "__type__": "openai.types.chat.chat_completion_chunk.ChatCompletionChunk",
+        "__data__": {
+          "id": "chatcmpl-792",
+          "choices": [
+            {
+              "delta": {
+                "content": " solar",
+                "function_call": null,
+                "refusal": null,
+                "role": "assistant",
+                "tool_calls": null
+              },
+              "finish_reason": null,
+              "index": 0,
+              "logprobs": null
+            }
+          ],
+          "created": 1756921358,
+          "model": "llama3.2:3b-instruct-fp16",
+          "object": "chat.completion.chunk",
+          "service_tier": null,
+          "system_fingerprint": "fp_ollama",
+          "usage": null
+        }
+      },
+      {
+        "__type__": "openai.types.chat.chat_completion_chunk.ChatCompletionChunk",
+        "__data__": {
+          "id": "chatcmpl-792",
+          "choices": [
+            {
+              "delta": {
+                "content": " system",
+                "function_call": null,
+                "refusal": null,
+                "role": "assistant",
+                "tool_calls": null
+              },
+              "finish_reason": null,
+              "index": 0,
+              "logprobs": null
+            }
+          ],
+          "created": 1756921358,
+          "model": "llama3.2:3b-instruct-fp16",
+          "object": "chat.completion.chunk",
+          "service_tier": null,
+          "system_fingerprint": "fp_ollama",
+          "usage": null
+        }
+      },
+      {
+        "__type__": "openai.types.chat.chat_completion_chunk.ChatCompletionChunk",
+        "__data__": {
+          "id": "chatcmpl-792",
+          "choices": [
+            {
+              "delta": {
+                "content": ".",
+                "function_call": null,
+                "refusal": null,
+                "role": "assistant",
+                "tool_calls": null
+              },
+              "finish_reason": null,
+              "index": 0,
+              "logprobs": null
+            }
+          ],
+          "created": 1756921358,
+          "model": "llama3.2:3b-instruct-fp16",
+          "object": "chat.completion.chunk",
+          "service_tier": null,
+          "system_fingerprint": "fp_ollama",
+          "usage": null
+        }
+      },
+      {
+        "__type__": "openai.types.chat.chat_completion_chunk.ChatCompletionChunk",
+        "__data__": {
+          "id": "chatcmpl-792",
           "choices": [
             {
               "delta": {
@@ -1726,7 +1882,7 @@
               "logprobs": null
             }
           ],
-          "created": 1754081848,
+          "created": 1756921358,
           "model": "llama3.2:3b-instruct-fp16",
           "object": "chat.completion.chunk",
           "service_tier": null,
diff --git a/tests/integration/recordings/responses/a4c8d19bb1eb.json b/tests/integration/recordings/responses/a4c8d19bb1eb.json
index a3aba2bff..89f52f82e 100644
--- a/tests/integration/recordings/responses/a4c8d19bb1eb.json
+++ b/tests/integration/recordings/responses/a4c8d19bb1eb.json
@@ -1,7 +1,7 @@
 {
   "request": {
     "method": "POST",
-    "url": "http://localhost:11434/v1/v1/chat/completions",
+    "url": "http://0.0.0.0:11434/v1/v1/chat/completions",
     "headers": {},
     "body": {
       "model": "llama3.2:3b-instruct-fp16",
@@ -20,14 +20,14 @@
     "body": {
       "__type__": "openai.types.chat.chat_completion.ChatCompletion",
       "__data__": {
-        "id": "chatcmpl-560",
+        "id": "chatcmpl-715",
         "choices": [
           {
             "finish_reason": "stop",
             "index": 0,
             "logprobs": null,
             "message": {
-              "content": "Hello! It's nice to meet you. How can I assist you today?",
+              "content": "Hello! It's nice to meet you. Is there something I can help you with or would you like to chat?",
               "refusal": null,
               "role": "assistant",
               "annotations": null,
@@ -37,15 +37,15 @@
             }
           }
         ],
-        "created": 1754081856,
+        "created": 1756921367,
         "model": "llama3.2:3b-instruct-fp16",
         "object": "chat.completion",
         "service_tier": null,
         "system_fingerprint": "fp_ollama",
         "usage": {
-          "completion_tokens": 17,
+          "completion_tokens": 25,
           "prompt_tokens": 29,
-          "total_tokens": 46,
+          "total_tokens": 54,
           "completion_tokens_details": null,
           "prompt_tokens_details": null
         }
diff --git a/tests/integration/recordings/responses/a5187d9d5057.json b/tests/integration/recordings/responses/a5187d9d5057.json
index 0dedba066..edacd5fa6 100644
--- a/tests/integration/recordings/responses/a5187d9d5057.json
+++ b/tests/integration/recordings/responses/a5187d9d5057.json
@@ -1,7 +1,7 @@
 {
   "request": {
     "method": "POST",
-    "url": "http://localhost:11434/v1/v1/chat/completions",
+    "url": "http://0.0.0.0:11434/v1/v1/chat/completions",
     "headers": {},
     "body": {
       "model": "llama3.2:3b-instruct-fp16",
@@ -20,14 +20,14 @@
     "body": {
       "__type__": "openai.types.chat.chat_completion.ChatCompletion",
       "__data__": {
-        "id": "chatcmpl-64",
+        "id": "chatcmpl-376",
         "choices": [
           {
             "finish_reason": "stop",
             "index": 0,
             "logprobs": null,
             "message": {
-              "content": "You want to test the capabilities of the OpenAI Text-to-Text model (also known as T0).\n\nPlease note that I'll be using a pre-trained model, so my responses might not be entirely customized to your specific prompt or context. That being said, I'll do my best to mimic the behavior of the original model.\n\nWhat would you like to test or ask? Please provide a prompt or question, and I'll respond accordingly.\n\n(Note: if you'd like to run a longer experiment or try out specific models like text completion or code generation, feel free to let me know and we can figure out a way to collaborate.)",
+              "content": "I'll simulate a test for the LA-1030/5B linear accelerator, specifically for the H8 (High Voltage) model found in early models of the test rail. Note that this is not meant to be taken as actual test results but rather a demonstration.\n\n### Introduction:\nThe LA-1030/5B was used primarily for high-energy physics and nuclear research during the 1970s and 1980s. This linear accelerator was capable of producing proton beams with energies up to several GeV. The H8 model, also known as the 'High Voltage' component, is a series of power supplies that drive the high voltage DC (HV) accelerators.\n\n### Test Setup:\n\n- **Test Goal:** Measure the output of the LA-1030/5B H8 model linear accelerator and assess its ability to generate stable, high-voltage direct current (HVDC) to power it properly.\n  \n  - The setup consists of a single test rail containing one of these H8 modules. A precise DC voltage is supplied to the linear accelerator via an external DC source.\n\n### Operating Parameters:\n\n- **Input Voltage:** To ensure the linear accelerator operates within its safe operating parameters, input voltages will be varied from 20KV to 140KV.\n- **Current Delivery:** Monitoring current at these different output levels requires a precise multimeter or oscilloscope. \n- **Voltage Level and Current Stability:** The voltage should stabilize as close as possible to the desired output level.\n\n### Potential Issues\n\n1.) Over-Pressure in H8 Modules\n    - During high voltage levels, there's a risk of over-pressurization in the component casing due to the vacuum properties within the modules.\n    - Check for any external signs of stress or leakage.\n2.) Current Limitation and Arcing\n    - High current requirements demand close monitoring of the accelerator components and associated connections.\n    - An excessive arc can be detrimental to electronics connected to the system.\n3.) Interlocks and Safe Guards\n\n- **Ensure alignment:** Prevent accidental triggering.\n\n4.) Insulation integrity \n    - Potential risks from faulty or non-insulated components\n\n### Results Analysis:\n\nBased on this hypothetical test, some potential results could include:\n1.  Output voltage stability for the chosen input voltages\n2.  Ability to exceed the accelerator's highest voltage ratings.\n3. Consistency between different current levels at various output voltage tests.\n\nThis exercise is a general simulation and might not reflect real-world conditions or performance specifications of an actual LA-1030/5B linear accelerator. The focus here was on demonstrating how one could analyze data from such a system, given typical components involved in linear accelerators at that time period.",
               "refusal": null,
               "role": "assistant",
               "annotations": null,
@@ -37,15 +37,15 @@
             }
           }
         ],
-        "created": 1754510052,
+        "created": 1756921225,
         "model": "llama3.2:3b-instruct-fp16",
         "object": "chat.completion",
         "service_tier": null,
         "system_fingerprint": "fp_ollama",
         "usage": {
-          "completion_tokens": 129,
+          "completion_tokens": 547,
           "prompt_tokens": 31,
-          "total_tokens": 160,
+          "total_tokens": 578,
           "completion_tokens_details": null,
           "prompt_tokens_details": null
         }
diff --git a/tests/integration/recordings/responses/a59d0d7c1485.json b/tests/integration/recordings/responses/a59d0d7c1485.json
index 80e2462d5..c951596ce 100644
--- a/tests/integration/recordings/responses/a59d0d7c1485.json
+++ b/tests/integration/recordings/responses/a59d0d7c1485.json
@@ -20,15 +20,15 @@
       "__type__": "ollama._types.GenerateResponse",
       "__data__": {
         "model": "llama-guard3:1b",
-        "created_at": "2025-08-01T23:14:23.46316Z",
+        "created_at": "2025-09-03T17:38:04.367295Z",
         "done": true,
         "done_reason": "stop",
-        "total_duration": 270313833,
-        "load_duration": 71668791,
+        "total_duration": 276503250,
+        "load_duration": 125852000,
         "prompt_eval_count": 238,
-        "prompt_eval_duration": 169000000,
+        "prompt_eval_duration": 138575125,
         "eval_count": 2,
-        "eval_duration": 25000000,
+        "eval_duration": 11277208,
         "response": "safe",
         "thinking": null,
         "context": null
diff --git a/tests/integration/recordings/responses/a6810c23eda8.json b/tests/integration/recordings/responses/a6810c23eda8.json
index 6d9747d28..d5b5c5a6d 100644
--- a/tests/integration/recordings/responses/a6810c23eda8.json
+++ b/tests/integration/recordings/responses/a6810c23eda8.json
@@ -23,7 +23,7 @@
         "__type__": "ollama._types.GenerateResponse",
         "__data__": {
           "model": "llama3.2:3b-instruct-fp16",
-          "created_at": "2025-08-04T22:55:05.992185Z",
+          "created_at": "2025-09-03T17:36:13.985194Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -41,7 +41,7 @@
         "__type__": "ollama._types.GenerateResponse",
         "__data__": {
           "model": "llama3.2:3b-instruct-fp16",
-          "created_at": "2025-08-04T22:55:06.047726Z",
+          "created_at": "2025-09-03T17:36:14.027686Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -59,7 +59,7 @@
         "__type__": "ollama._types.GenerateResponse",
         "__data__": {
           "model": "llama3.2:3b-instruct-fp16",
-          "created_at": "2025-08-04T22:55:06.123375Z",
+          "created_at": "2025-09-03T17:36:14.068694Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -77,7 +77,7 @@
         "__type__": "ollama._types.GenerateResponse",
         "__data__": {
           "model": "llama3.2:3b-instruct-fp16",
-          "created_at": "2025-08-04T22:55:06.182233Z",
+          "created_at": "2025-09-03T17:36:14.10959Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -95,7 +95,7 @@
         "__type__": "ollama._types.GenerateResponse",
         "__data__": {
           "model": "llama3.2:3b-instruct-fp16",
-          "created_at": "2025-08-04T22:55:06.244655Z",
+          "created_at": "2025-09-03T17:36:14.150266Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -113,7 +113,7 @@
         "__type__": "ollama._types.GenerateResponse",
         "__data__": {
           "model": "llama3.2:3b-instruct-fp16",
-          "created_at": "2025-08-04T22:55:06.304777Z",
+          "created_at": "2025-09-03T17:36:14.190959Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -131,7 +131,7 @@
         "__type__": "ollama._types.GenerateResponse",
         "__data__": {
           "model": "llama3.2:3b-instruct-fp16",
-          "created_at": "2025-08-04T22:55:06.361584Z",
+          "created_at": "2025-09-03T17:36:14.231689Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -149,7 +149,7 @@
         "__type__": "ollama._types.GenerateResponse",
         "__data__": {
           "model": "llama3.2:3b-instruct-fp16",
-          "created_at": "2025-08-04T22:55:06.419647Z",
+          "created_at": "2025-09-03T17:36:14.272328Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -167,7 +167,7 @@
         "__type__": "ollama._types.GenerateResponse",
         "__data__": {
           "model": "llama3.2:3b-instruct-fp16",
-          "created_at": "2025-08-04T22:55:06.477037Z",
+          "created_at": "2025-09-03T17:36:14.312774Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -185,7 +185,7 @@
         "__type__": "ollama._types.GenerateResponse",
         "__data__": {
           "model": "llama3.2:3b-instruct-fp16",
-          "created_at": "2025-08-04T22:55:06.534717Z",
+          "created_at": "2025-09-03T17:36:14.353348Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -203,7 +203,7 @@
         "__type__": "ollama._types.GenerateResponse",
         "__data__": {
           "model": "llama3.2:3b-instruct-fp16",
-          "created_at": "2025-08-04T22:55:06.600289Z",
+          "created_at": "2025-09-03T17:36:14.393886Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -221,7 +221,7 @@
         "__type__": "ollama._types.GenerateResponse",
         "__data__": {
           "model": "llama3.2:3b-instruct-fp16",
-          "created_at": "2025-08-04T22:55:06.658769Z",
+          "created_at": "2025-09-03T17:36:14.434753Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -239,7 +239,7 @@
         "__type__": "ollama._types.GenerateResponse",
         "__data__": {
           "model": "llama3.2:3b-instruct-fp16",
-          "created_at": "2025-08-04T22:55:06.71323Z",
+          "created_at": "2025-09-03T17:36:14.474992Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -257,7 +257,7 @@
         "__type__": "ollama._types.GenerateResponse",
         "__data__": {
           "model": "llama3.2:3b-instruct-fp16",
-          "created_at": "2025-08-04T22:55:06.764206Z",
+          "created_at": "2025-09-03T17:36:14.515133Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -275,7 +275,7 @@
         "__type__": "ollama._types.GenerateResponse",
         "__data__": {
           "model": "llama3.2:3b-instruct-fp16",
-          "created_at": "2025-08-04T22:55:06.815428Z",
+          "created_at": "2025-09-03T17:36:14.555579Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -293,7 +293,7 @@
         "__type__": "ollama._types.GenerateResponse",
         "__data__": {
           "model": "llama3.2:3b-instruct-fp16",
-          "created_at": "2025-08-04T22:55:06.86906Z",
+          "created_at": "2025-09-03T17:36:14.596355Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -311,7 +311,7 @@
         "__type__": "ollama._types.GenerateResponse",
         "__data__": {
           "model": "llama3.2:3b-instruct-fp16",
-          "created_at": "2025-08-04T22:55:06.92191Z",
+          "created_at": "2025-09-03T17:36:14.637241Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -329,7 +329,7 @@
         "__type__": "ollama._types.GenerateResponse",
         "__data__": {
           "model": "llama3.2:3b-instruct-fp16",
-          "created_at": "2025-08-04T22:55:06.97464Z",
+          "created_at": "2025-09-03T17:36:14.679196Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -347,7 +347,7 @@
         "__type__": "ollama._types.GenerateResponse",
         "__data__": {
           "model": "llama3.2:3b-instruct-fp16",
-          "created_at": "2025-08-04T22:55:07.026686Z",
+          "created_at": "2025-09-03T17:36:14.719878Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -365,7 +365,7 @@
         "__type__": "ollama._types.GenerateResponse",
         "__data__": {
           "model": "llama3.2:3b-instruct-fp16",
-          "created_at": "2025-08-04T22:55:07.078382Z",
+          "created_at": "2025-09-03T17:36:14.759719Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -383,7 +383,7 @@
         "__type__": "ollama._types.GenerateResponse",
         "__data__": {
           "model": "llama3.2:3b-instruct-fp16",
-          "created_at": "2025-08-04T22:55:07.131717Z",
+          "created_at": "2025-09-03T17:36:14.79997Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -401,7 +401,7 @@
         "__type__": "ollama._types.GenerateResponse",
         "__data__": {
           "model": "llama3.2:3b-instruct-fp16",
-          "created_at": "2025-08-04T22:55:07.188206Z",
+          "created_at": "2025-09-03T17:36:14.84053Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -419,7 +419,7 @@
         "__type__": "ollama._types.GenerateResponse",
         "__data__": {
           "model": "llama3.2:3b-instruct-fp16",
-          "created_at": "2025-08-04T22:55:07.243218Z",
+          "created_at": "2025-09-03T17:36:14.881964Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -437,7 +437,7 @@
         "__type__": "ollama._types.GenerateResponse",
         "__data__": {
           "model": "llama3.2:3b-instruct-fp16",
-          "created_at": "2025-08-04T22:55:07.298542Z",
+          "created_at": "2025-09-03T17:36:14.921986Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -455,7 +455,7 @@
         "__type__": "ollama._types.GenerateResponse",
         "__data__": {
           "model": "llama3.2:3b-instruct-fp16",
-          "created_at": "2025-08-04T22:55:07.355167Z",
+          "created_at": "2025-09-03T17:36:14.962551Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -473,7 +473,7 @@
         "__type__": "ollama._types.GenerateResponse",
         "__data__": {
           "model": "llama3.2:3b-instruct-fp16",
-          "created_at": "2025-08-04T22:55:07.41078Z",
+          "created_at": "2025-09-03T17:36:15.003226Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -491,7 +491,7 @@
         "__type__": "ollama._types.GenerateResponse",
         "__data__": {
           "model": "llama3.2:3b-instruct-fp16",
-          "created_at": "2025-08-04T22:55:07.463639Z",
+          "created_at": "2025-09-03T17:36:15.043676Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -509,7 +509,7 @@
         "__type__": "ollama._types.GenerateResponse",
         "__data__": {
           "model": "llama3.2:3b-instruct-fp16",
-          "created_at": "2025-08-04T22:55:07.515619Z",
+          "created_at": "2025-09-03T17:36:15.083952Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -527,7 +527,7 @@
         "__type__": "ollama._types.GenerateResponse",
         "__data__": {
           "model": "llama3.2:3b-instruct-fp16",
-          "created_at": "2025-08-04T22:55:07.572461Z",
+          "created_at": "2025-09-03T17:36:15.124797Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -545,7 +545,7 @@
         "__type__": "ollama._types.GenerateResponse",
         "__data__": {
           "model": "llama3.2:3b-instruct-fp16",
-          "created_at": "2025-08-04T22:55:07.626345Z",
+          "created_at": "2025-09-03T17:36:15.165202Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -563,7 +563,7 @@
         "__type__": "ollama._types.GenerateResponse",
         "__data__": {
           "model": "llama3.2:3b-instruct-fp16",
-          "created_at": "2025-08-04T22:55:07.680673Z",
+          "created_at": "2025-09-03T17:36:15.205416Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -581,7 +581,7 @@
         "__type__": "ollama._types.GenerateResponse",
         "__data__": {
           "model": "llama3.2:3b-instruct-fp16",
-          "created_at": "2025-08-04T22:55:07.736803Z",
+          "created_at": "2025-09-03T17:36:15.245854Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -599,7 +599,7 @@
         "__type__": "ollama._types.GenerateResponse",
         "__data__": {
           "model": "llama3.2:3b-instruct-fp16",
-          "created_at": "2025-08-04T22:55:07.789556Z",
+          "created_at": "2025-09-03T17:36:15.286352Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -617,7 +617,7 @@
         "__type__": "ollama._types.GenerateResponse",
         "__data__": {
           "model": "llama3.2:3b-instruct-fp16",
-          "created_at": "2025-08-04T22:55:07.841142Z",
+          "created_at": "2025-09-03T17:36:15.326952Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -635,7 +635,7 @@
         "__type__": "ollama._types.GenerateResponse",
         "__data__": {
           "model": "llama3.2:3b-instruct-fp16",
-          "created_at": "2025-08-04T22:55:07.896607Z",
+          "created_at": "2025-09-03T17:36:15.367575Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -653,7 +653,7 @@
         "__type__": "ollama._types.GenerateResponse",
         "__data__": {
           "model": "llama3.2:3b-instruct-fp16",
-          "created_at": "2025-08-04T22:55:07.953628Z",
+          "created_at": "2025-09-03T17:36:15.408069Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -671,7 +671,7 @@
         "__type__": "ollama._types.GenerateResponse",
         "__data__": {
           "model": "llama3.2:3b-instruct-fp16",
-          "created_at": "2025-08-04T22:55:08.007575Z",
+          "created_at": "2025-09-03T17:36:15.448413Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -689,7 +689,7 @@
         "__type__": "ollama._types.GenerateResponse",
         "__data__": {
           "model": "llama3.2:3b-instruct-fp16",
-          "created_at": "2025-08-04T22:55:08.061895Z",
+          "created_at": "2025-09-03T17:36:15.489223Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -707,7 +707,7 @@
         "__type__": "ollama._types.GenerateResponse",
         "__data__": {
           "model": "llama3.2:3b-instruct-fp16",
-          "created_at": "2025-08-04T22:55:08.121698Z",
+          "created_at": "2025-09-03T17:36:15.530477Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -725,7 +725,7 @@
         "__type__": "ollama._types.GenerateResponse",
         "__data__": {
           "model": "llama3.2:3b-instruct-fp16",
-          "created_at": "2025-08-04T22:55:08.175866Z",
+          "created_at": "2025-09-03T17:36:15.571317Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -743,7 +743,7 @@
         "__type__": "ollama._types.GenerateResponse",
         "__data__": {
           "model": "llama3.2:3b-instruct-fp16",
-          "created_at": "2025-08-04T22:55:08.231661Z",
+          "created_at": "2025-09-03T17:36:15.612263Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -761,7 +761,7 @@
         "__type__": "ollama._types.GenerateResponse",
         "__data__": {
           "model": "llama3.2:3b-instruct-fp16",
-          "created_at": "2025-08-04T22:55:08.285188Z",
+          "created_at": "2025-09-03T17:36:15.652533Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -779,15 +779,15 @@
         "__type__": "ollama._types.GenerateResponse",
         "__data__": {
           "model": "llama3.2:3b-instruct-fp16",
-          "created_at": "2025-08-04T22:55:08.334914Z",
+          "created_at": "2025-09-03T17:36:15.692748Z",
           "done": true,
           "done_reason": "stop",
-          "total_duration": 2543128958,
-          "load_duration": 133497375,
+          "total_duration": 1808812333,
+          "load_duration": 57887042,
           "prompt_eval_count": 18,
-          "prompt_eval_duration": 62000000,
+          "prompt_eval_duration": 42042750,
           "eval_count": 43,
-          "eval_duration": 2346000000,
+          "eval_duration": 1708293042,
           "response": "",
           "thinking": null,
           "context": null
diff --git a/tests/integration/recordings/responses/ae1c22f18ecc.json b/tests/integration/recordings/responses/ae1c22f18ecc.json
index 595b6668d..c9a47657b 100644
--- a/tests/integration/recordings/responses/ae1c22f18ecc.json
+++ b/tests/integration/recordings/responses/ae1c22f18ecc.json
@@ -20,15 +20,15 @@
       "__type__": "ollama._types.GenerateResponse",
       "__data__": {
         "model": "llama3.2:3b-instruct-fp16",
-        "created_at": "2025-07-31T17:59:32.661124541Z",
+        "created_at": "2025-09-03T17:41:47.144448Z",
         "done": true,
         "done_reason": "stop",
-        "total_duration": 11391290133,
-        "load_duration": 42154800,
+        "total_duration": 2462760250,
+        "load_duration": 83668541,
         "prompt_eval_count": 20,
-        "prompt_eval_duration": 1208581216,
+        "prompt_eval_duration": 74227125,
         "eval_count": 58,
-        "eval_duration": 10140044676,
+        "eval_duration": 2304346166,
         "response": "I'm happy to help you with your test, but I don't see what kind of test we are testing. Could you please provide more context or clarify what kind of test you would like me to perform? Is it a programming test, a language proficiency test, or something else?",
         "thinking": null,
         "context": null
diff --git a/tests/integration/recordings/responses/ae6835cfe70e.json b/tests/integration/recordings/responses/ae6835cfe70e.json
index 1bc383707..9766c6023 100644
--- a/tests/integration/recordings/responses/ae6835cfe70e.json
+++ b/tests/integration/recordings/responses/ae6835cfe70e.json
@@ -20,15 +20,15 @@
       "__type__": "ollama._types.GenerateResponse",
       "__data__": {
         "model": "llama3.2:3b-instruct-fp16",
-        "created_at": "2025-08-04T22:55:57.955211Z",
+        "created_at": "2025-09-03T17:42:18.871277Z",
         "done": true,
         "done_reason": "stop",
-        "total_duration": 842946458,
-        "load_duration": 91343000,
+        "total_duration": 644170416,
+        "load_duration": 69749500,
         "prompt_eval_count": 386,
-        "prompt_eval_duration": 685000000,
+        "prompt_eval_duration": 531218583,
         "eval_count": 2,
-        "eval_duration": 64000000,
+        "eval_duration": 42446084,
         "response": "[]",
         "thinking": null,
         "context": null
diff --git a/tests/integration/recordings/responses/b14ff438ca99.json b/tests/integration/recordings/responses/b14ff438ca99.json
index c445e7d42..180ec3286 100644
--- a/tests/integration/recordings/responses/b14ff438ca99.json
+++ b/tests/integration/recordings/responses/b14ff438ca99.json
@@ -20,15 +20,15 @@
       "__type__": "ollama._types.GenerateResponse",
       "__data__": {
         "model": "llama3.2:3b-instruct-fp16",
-        "created_at": "2025-07-31T17:51:39.104140157Z",
+        "created_at": "2025-09-03T17:39:59.708499Z",
         "done": true,
         "done_reason": "stop",
-        "total_duration": 22895811031,
-        "load_duration": 41692686,
+        "total_duration": 5293681583,
+        "load_duration": 196095541,
         "prompt_eval_count": 23,
-        "prompt_eval_duration": 793961939,
+        "prompt_eval_duration": 72668042,
         "eval_count": 124,
-        "eval_duration": 22059637137,
+        "eval_duration": 5024327166,
         "response": "The official currency of Japan is the Japanese yen (\u00a5). It is abbreviated as \"JPY\" and its symbol is \u00a5. The yen is divided into 100 sen, although the sen has been officially discontinued since 1967.\n\nYou can exchange your money for yen at banks, currency exchange offices, or use ATMs to withdraw cash from an ATM. Credit cards are also widely accepted in Japan, especially among major retailers and restaurants.\n\nIt's worth noting that some businesses may not accept foreign currencies other than US dollars, so it's a good idea to have some local currency on hand when traveling to Japan.",
         "thinking": null,
         "context": null
diff --git a/tests/integration/recordings/responses/b5e3ed420986.json b/tests/integration/recordings/responses/b5e3ed420986.json
index 871708ea0..f5a6e2400 100644
--- a/tests/integration/recordings/responses/b5e3ed420986.json
+++ b/tests/integration/recordings/responses/b5e3ed420986.json
@@ -20,390 +20,390 @@
         "data": [
           {
             "embedding": [
-              -0.054539014,
-              -0.016468922,
-              -0.010608761,
-              0.02301095,
-              0.011758054,
-              -0.11193683,
-              -0.0096305525,
-              0.019113416,
-              0.048967674,
-              -0.040160257,
-              -0.022335947,
-              0.016229406,
-              0.009204825,
-              0.05479278,
-              0.049229205,
-              -0.09585555,
-              -0.031133035,
-              -0.010217964,
-              -0.029166166,
-              -0.08954575,
-              -0.0006925836,
-              0.034955315,
-              0.016062167,
-              0.0034184188,
-              0.039653763,
-              -0.016046634,
-              -0.02841708,
-              0.021410936,
-              0.046111625,
-              -0.062207576,
-              -0.023055006,
-              0.1013955,
-              0.025184965,
-              -0.03625098,
-              -0.032918476,
-              0.03443538,
-              -0.01667641,
-              -0.066225745,
-              -0.06069369,
-              0.0005895856,
-              -0.063880995,
-              0.0077826553,
-              -0.0051208152,
-              -0.03670025,
-              -0.023568328,
-              0.07426548,
-              -0.017221872,
-              0.064796105,
-              -0.009619924,
-              -0.0011168239,
-              -0.0946396,
-              0.029776908,
-              -0.082821324,
-              -0.053136017,
-              -0.014514815,
-              -0.015186634,
-              0.03710505,
-              0.07176102,
-              -0.01892326,
-              -0.11193171,
-              -0.11862717,
-              0.029721867,
-              0.030640045,
-              0.103079796,
-              -0.02800051,
-              -0.045588907,
-              0.0014006048,
-              0.0046053855,
-              0.03230686,
-              -0.027150096,
-              -0.06602394,
-              -0.015831675,
-              0.019209974,
-              0.06880736,
-              0.04709176,
-              -0.105855644,
-              0.046280492,
-              -0.03096076,
-              -0.069832,
-              -0.014894174,
-              -0.0014720439,
-              0.026728554,
-              -0.04701634,
-              0.07608865,
-              0.05755428,
-              -0.020295804,
-              0.038703557,
-              0.06851399,
-              -0.068138964,
-              -0.017405631,
-              0.057037257,
-              -0.07952873,
-              -0.014248788,
-              0.0036484832,
-              -0.052898604,
-              0.049604755,
-              0.021487204,
-              0.035027836,
-              0.02545877,
-              -0.004785061,
-              0.051205274,
-              -0.08541501,
-              0.07143089,
-              0.04468161,
-              0.03930722,
-              -0.0135141155,
-              0.07088695,
-              -0.0660048,
-              0.0592439,
-              -0.023046793,
-              -0.027459674,
-              -0.04689379,
-              -0.037509903,
-              -0.0084943585,
-              0.05313619,
-              0.0038019137,
-              -0.02021957,
-              0.043566354,
-              -0.034341905,
-              0.042827673,
-              -0.007318655,
-              -0.0016014964,
-              0.04183553,
-              -0.025132777,
-              -0.03014748,
-              0.056046948,
-              -0.03387941,
-              -4.800238e-33,
-              0.008938797,
-              -0.105446324,
-              -0.022468172,
-              -0.0046421383,
-              0.10120766,
-              -0.024071503,
-              0.0720334,
-              0.00824967,
-              -0.017588114,
-              -0.012572595,
-              0.011187751,
-              0.09430494,
-              0.025195174,
-              0.061279986,
-              0.028598385,
-              0.07013615,
-              -0.028032323,
-              0.042044032,
-              0.012670473,
-              0.05118446,
-              0.069872275,
-              0.113011226,
-              0.06393332,
-              0.046133682,
-              0.00069346296,
-              -0.04742425,
-              -0.0076766815,
-              -0.016270984,
-              -0.03935856,
-              -0.0060400777,
-              -0.057824753,
-              -0.032809503,
-              0.030087646,
-              0.04949177,
-              0.0065082232,
-              -0.015118406,
-              0.027426325,
-              -0.13929617,
-              0.04686397,
-              -0.0001376871,
-              0.023311358,
-              0.014268379,
-              0.0005033175,
-              -0.019155173,
-              -0.021629533,
-              0.012334637,
-              -0.035448097,
-              -0.015012808,
-              -0.12478333,
-              0.017866643,
-              -0.015385203,
-              -0.030914769,
-              0.07756115,
-              0.067938074,
-              -0.0029891697,
-              0.03446983,
-              0.072096206,
-              -0.008727331,
-              -0.0039063273,
-              -0.048090436,
-              0.021224795,
-              0.065839365,
-              0.07848987,
-              0.014581675,
-              0.06676033,
-              0.07221585,
-              0.033575963,
-              0.08418111,
-              0.016567666,
-              0.042123966,
-              -0.05935007,
-              0.020415181,
-              -0.06571829,
-              0.04579863,
-              0.002951678,
-              0.0034759378,
-              -0.008463108,
-              -0.14008056,
-              0.056221444,
-              0.05469431,
-              -0.060425404,
-              -0.035049956,
-              -0.05707458,
-              -0.010413291,
-              -0.08953148,
-              -0.023625003,
-              0.034471046,
-              0.033661205,
-              0.06720743,
-              -0.07255193,
-              -0.041828338,
-              -0.08223931,
-              0.010640704,
-              -0.042891644,
-              -0.0014475408,
-              8.39199e-34,
-              -0.07032797,
-              0.0070702634,
-              -0.035070483,
-              0.021509597,
-              -0.11257678,
-              -0.04567272,
-              0.08481507,
-              0.050335176,
-              0.053387776,
-              0.012060723,
-              -0.0019196937,
-              -0.08608223,
-              0.09600442,
-              0.0037239613,
-              0.060983595,
-              0.015279161,
-              -0.040586337,
-              0.10490671,
-              0.07111468,
-              -0.0050306814,
-              -0.048980962,
-              0.09183541,
-              -0.09862482,
-              -0.012065119,
-              -0.016891332,
-              -0.028088856,
-              -0.12471142,
-              -0.078602985,
-              -0.018680012,
-              0.021758018,
-              0.005759521,
-              0.051118605,
-              -0.082707904,
-              0.072964445,
-              0.0141024105,
-              0.0010097212,
-              -0.03685827,
-              0.00568948,
-              0.017905025,
-              0.013780462,
-              0.04993993,
-              0.021444008,
-              0.110891685,
-              0.061709184,
-              0.01853852,
-              0.036215156,
-              -0.06684297,
-              0.036332514,
-              -0.021102918,
-              -0.07972151,
-              0.065229,
-              0.0030138723,
-              0.018853001,
-              -0.008725459,
-              -0.058164038,
-              -0.040056095,
-              0.051841468,
-              0.016301498,
-              -0.08781288,
-              -0.02227259,
-              -0.013245076,
-              -0.03801183,
-              0.025480323,
-              0.030531729,
-              -0.054035358,
-              0.04038695,
-              -0.116109855,
-              -0.026073342,
-              -0.0043725744,
-              -0.15029478,
-              0.08059584,
-              -0.05766878,
-              0.02516043,
-              -0.0038830324,
-              -0.064506546,
-              0.020497749,
-              -0.034779944,
-              -0.02932536,
-              -0.052795924,
-              0.05048031,
-              -0.036627516,
-              -0.009295713,
-              -0.03128295,
-              -0.0010504925,
-              -0.089731686,
-              0.044538505,
-              -0.058741618,
-              0.028392328,
-              0.05705406,
-              -0.021216048,
-              0.024795407,
-              0.023279097,
-              -0.025490018,
-              0.066466905,
-              0.011147595,
-              -1.57812e-08,
-              -0.043579992,
-              0.050845813,
-              0.009048856,
-              0.036609128,
-              0.0027812773,
-              0.03891625,
-              -0.013210705,
-              0.0068475637,
-              -0.0067914757,
-              0.020505553,
-              -0.029885264,
-              -0.0055864784,
-              -0.06776668,
-              -0.054356683,
-              0.024375776,
-              0.13760787,
-              -0.07139099,
-              0.007762989,
-              0.051617414,
-              0.05973323,
-              0.042459413,
-              -0.03560275,
-              -0.05791632,
-              0.04441552,
-              -0.10566783,
-              0.009725281,
-              -0.016063722,
-              0.035676833,
-              0.023308199,
-              -0.079277165,
-              0.0054484066,
-              -0.060464006,
-              -0.044717573,
-              0.013122884,
-              -0.015911829,
-              -0.012086337,
-              0.005874884,
-              -0.070992075,
-              0.017624497,
-              0.036101837,
-              0.023521954,
-              -0.007950616,
-              -0.036010865,
-              0.0059945653,
-              0.059922658,
-              0.0058807023,
-              -0.058820717,
-              -0.04119291,
-              -0.038226888,
-              -0.03001563,
-              0.019165142,
-              -0.020903448,
-              -0.0089449985,
-              -0.02588891,
-              0.08723996,
-              0.04226809,
-              -0.09462471,
-              -0.0349857,
-              0.05150947,
-              0.04254913,
-              -0.01820297,
-              0.06036542,
-              0.19380692,
-              0.014680669
+              -0.054516047,
+              -0.016456056,
+              -0.010628294,
+              0.022998175,
+              0.011771307,
+              -0.11192805,
+              -0.009638266,
+              0.019111464,
+              0.048958372,
+              -0.040184658,
+              -0.022362057,
+              0.016236247,
+              0.009179422,
+              0.054799747,
+              0.049246185,
+              -0.095869735,
+              -0.031108288,
+              -0.010185289,
+              -0.02914681,
+              -0.08954776,
+              -0.0006788293,
+              0.03496997,
+              0.016079746,
+              0.003440155,
+              0.039660316,
+              -0.016080642,
+              -0.028411511,
+              0.021429215,
+              0.046082154,
+              -0.062199906,
+              -0.023051145,
+              0.10141082,
+              0.025186997,
+              -0.03625052,
+              -0.032918967,
+              0.034433577,
+              -0.016646268,
+              -0.066217534,
+              -0.06070787,
+              0.0006243064,
+              -0.06383077,
+              0.0077886702,
+              -0.005127284,
+              -0.036702275,
+              -0.023532037,
+              0.074247204,
+              -0.017199293,
+              0.064781435,
+              -0.00963324,
+              -0.0011216484,
+              -0.094671436,
+              0.029772488,
+              -0.0828219,
+              -0.053136364,
+              -0.014507852,
+              -0.015170829,
+              0.03712605,
+              0.071739994,
+              -0.018907284,
+              -0.11193762,
+              -0.11859575,
+              0.029719124,
+              0.030655412,
+              0.10308374,
+              -0.027978238,
+              -0.045611758,
+              0.0013704232,
+              0.004602404,
+              0.032320693,
+              -0.027153788,
+              -0.06603313,
+              -0.015827695,
+              0.01920783,
+              0.06879109,
+              0.047088612,
+              -0.1058506,
+              0.046279814,
+              -0.030967912,
+              -0.06984916,
+              -0.014879451,
+              -0.0014568317,
+              0.026731879,
+              -0.04702097,
+              0.076069675,
+              0.05755153,
+              -0.020301627,
+              0.038702164,
+              0.06855233,
+              -0.06817319,
+              -0.017392006,
+              0.057020444,
+              -0.0795406,
+              -0.014256318,
+              0.0036161602,
+              -0.05289696,
+              0.049625576,
+              0.021482797,
+              0.034989595,
+              0.025457244,
+              -0.004806878,
+              0.051217325,
+              -0.085426696,
+              0.07142323,
+              0.04465428,
+              0.039311107,
+              -0.013488202,
+              0.07088864,
+              -0.06598805,
+              0.05922822,
+              -0.023026757,
+              -0.027465338,
+              -0.046879534,
+              -0.03751372,
+              -0.0085191075,
+              0.05315477,
+              0.0037932945,
+              -0.020239882,
+              0.043557003,
+              -0.03434906,
+              0.04282584,
+              -0.007332412,
+              -0.0016165953,
+              0.041878954,
+              -0.025151564,
+              -0.0301328,
+              0.05601688,
+              -0.03388191,
+              -4.802144e-33,
+              0.008930927,
+              -0.10549414,
+              -0.022485359,
+              -0.00461374,
+              0.10122854,
+              -0.024063904,
+              0.072040126,
+              0.00826307,
+              -0.017573163,
+              -0.012551788,
+              0.011197847,
+              0.09432378,
+              0.025232295,
+              0.061275084,
+              0.028605146,
+              0.070148624,
+              -0.028050693,
+              0.042055413,
+              0.012653081,
+              0.051212482,
+              0.06987365,
+              0.113007665,
+              0.063927636,
+              0.04614841,
+              0.00071471,
+              -0.04746817,
+              -0.007670411,
+              -0.016275087,
+              -0.039374933,
+              -0.0060473024,
+              -0.057836913,
+              -0.032802302,
+              0.030103875,
+              0.049495216,
+              0.006514002,
+              -0.015127479,
+              0.027406687,
+              -0.13926439,
+              0.04688173,
+              -0.00014261098,
+              0.023295157,
+              0.014260961,
+              0.00048042598,
+              -0.019151432,
+              -0.02166308,
+              0.012344319,
+              -0.03541818,
+              -0.014996304,
+              -0.12476534,
+              0.017857043,
+              -0.015367026,
+              -0.030933712,
+              0.0775453,
+              0.067932405,
+              -0.002991927,
+              0.034482367,
+              0.07207725,
+              -0.008732087,
+              -0.0038812195,
+              -0.048092995,
+              0.021236168,
+              0.06584243,
+              0.07847724,
+              0.014562048,
+              0.066736475,
+              0.07221872,
+              0.03357779,
+              0.084165,
+              0.01657892,
+              0.04212138,
+              -0.059364557,
+              0.020403123,
+              -0.065706775,
+              0.045810685,
+              0.0029439582,
+              0.0034878643,
+              -0.008467763,
+              -0.14005418,
+              0.056226924,
+              0.05473064,
+              -0.060421,
+              -0.035074305,
+              -0.05707729,
+              -0.0104098,
+              -0.089569785,
+              -0.023614792,
+              0.0344653,
+              0.033663824,
+              0.06720568,
+              -0.0725603,
+              -0.04185905,
+              -0.08224899,
+              0.010631505,
+              -0.042881776,
+              -0.0014539668,
+              8.40692e-34,
+              -0.07032476,
+              0.0070766173,
+              -0.03506184,
+              0.021500606,
+              -0.11258514,
+              -0.045659322,
+              0.08482931,
+              0.050339974,
+              0.0533988,
+              0.01208183,
+              -0.0019384808,
+              -0.0860773,
+              0.09599927,
+              0.0037235345,
+              0.060938608,
+              0.015288853,
+              -0.040593054,
+              0.10491757,
+              0.07109598,
+              -0.0050172145,
+              -0.049021836,
+              0.091859885,
+              -0.09862007,
+              -0.012040684,
+              -0.016914355,
+              -0.028067894,
+              -0.12471722,
+              -0.078632146,
+              -0.018693453,
+              0.021743925,
+              0.0057838396,
+              0.051090635,
+              -0.08270728,
+              0.07299018,
+              0.014088154,
+              0.0010067249,
+              -0.03681869,
+              0.005664378,
+              0.017898101,
+              0.01379136,
+              0.049959406,
+              0.021462437,
+              0.11088524,
+              0.061694097,
+              0.018546695,
+              0.036211833,
+              -0.06682083,
+              0.036322806,
+              -0.021121122,
+              -0.079697676,
+              0.065231666,
+              0.002995329,
+              0.0188468,
+              -0.008694769,
+              -0.058170997,
+              -0.040058907,
+              0.051831294,
+              0.016280394,
+              -0.08779952,
+              -0.022270929,
+              -0.013231236,
+              -0.03801554,
+              0.0254927,
+              0.030549657,
+              -0.054053955,
+              0.040396415,
+              -0.116118245,
+              -0.026093038,
+              -0.004378966,
+              -0.15024145,
+              0.08058958,
+              -0.05766716,
+              0.02520104,
+              -0.0038984206,
+              -0.06448939,
+              0.020477816,
+              -0.034754846,
+              -0.029315596,
+              -0.052802563,
+              0.050487537,
+              -0.03663958,
+              -0.009309272,
+              -0.031305738,
+              -0.0010610216,
+              -0.089741714,
+              0.0445201,
+              -0.058746234,
+              0.028397618,
+              0.057035178,
+              -0.021242462,
+              0.024774676,
+              0.023253858,
+              -0.025503494,
+              0.066465355,
+              0.011176001,
+              -1.5780694e-08,
+              -0.043592602,
+              0.050871234,
+              0.009062051,
+              0.03658537,
+              0.002769079,
+              0.038917493,
+              -0.013205564,
+              0.006855097,
+              -0.006784634,
+              0.020516934,
+              -0.029890155,
+              -0.005596517,
+              -0.06777992,
+              -0.05436433,
+              0.02436097,
+              0.13761573,
+              -0.07139558,
+              0.007746665,
+              0.051632155,
+              0.059728563,
+              0.0424793,
+              -0.035606194,
+              -0.05791164,
+              0.044417217,
+              -0.105627485,
+              0.009701339,
+              -0.016052725,
+              0.03566595,
+              0.023313522,
+              -0.079250954,
+              0.0054293363,
+              -0.060480006,
+              -0.044735,
+              0.013152052,
+              -0.015912784,
+              -0.012098195,
+              0.0058634495,
+              -0.070984975,
+              0.017616477,
+              0.03611389,
+              0.023517592,
+              -0.007936504,
+              -0.03601146,
+              0.0059993765,
+              0.059939068,
+              0.0058700717,
+              -0.05880679,
+              -0.04119574,
+              -0.038231015,
+              -0.030013425,
+              0.01916342,
+              -0.020920184,
+              -0.008940394,
+              -0.025874808,
+              0.08722286,
+              0.042265054,
+              -0.09463029,
+              -0.034977533,
+              0.05149754,
+              0.042541843,
+              -0.01818799,
+              0.06035198,
+              0.1938343,
+              0.01467125
             ],
             "index": 0,
             "object": "embedding"
diff --git a/tests/integration/recordings/responses/b612debbd3bf.json b/tests/integration/recordings/responses/b612debbd3bf.json
index 0b73eaf31..4c39a78f1 100644
--- a/tests/integration/recordings/responses/b612debbd3bf.json
+++ b/tests/integration/recordings/responses/b612debbd3bf.json
@@ -20,390 +20,390 @@
         "data": [
           {
             "embedding": [
-              -0.003989132,
-              0.051404107,
-              -0.00056249514,
-              -0.038048144,
-              0.00023617804,
-              -0.07165115,
-              -0.032934345,
-              0.029131265,
-              0.089478746,
-              0.027012052,
-              0.022988115,
-              0.029467529,
-              0.013449345,
-              0.02187333,
-              0.024701167,
-              0.02318687,
-              -0.067904875,
-              0.042214446,
-              -0.06686454,
-              -0.044817198,
-              -0.019499827,
-              -0.017647728,
-              -0.047033403,
-              0.01010371,
-              -0.035198584,
-              0.1279292,
-              -0.03992792,
-              -0.03702997,
-              0.021821143,
-              -0.06663628,
-              0.020529605,
-              0.03141518,
-              0.121698014,
-              0.037880983,
-              -0.07562467,
-              0.035962664,
-              0.11100028,
-              -0.025674157,
-              -0.0779127,
-              0.016963888,
-              -0.0807954,
-              0.042507604,
-              0.00820509,
-              0.07316419,
-              0.01111272,
-              0.01623341,
-              0.019468198,
-              -0.05727617,
-              -0.026948903,
-              0.02756721,
-              -0.10366233,
-              0.061819006,
-              -0.02805692,
-              0.04555006,
-              0.038514387,
-              0.102219224,
-              0.010187554,
-              0.0038878673,
-              -0.07438772,
-              -0.009772767,
-              -0.014589378,
-              0.005427063,
-              -0.04896932,
-              0.024673788,
-              0.08042059,
-              -0.0013942291,
-              0.0008588407,
-              0.0016949617,
-              0.016265066,
-              0.0036070896,
-              0.05801152,
-              -0.010051563,
-              -0.008403578,
-              0.06814287,
-              0.03398574,
-              -0.011672763,
-              -0.049353864,
-              -0.034604926,
-              0.022498535,
-              0.016111419,
-              0.02527047,
-              0.03502525,
-              -0.018208683,
-              0.068031214,
-              0.059953574,
-              -0.025391363,
-              0.04580482,
-              -0.04296594,
-              -0.10485879,
-              -0.028135728,
-              0.079018995,
-              -0.01712349,
-              0.012407565,
-              0.04061926,
-              -0.020135157,
-              0.026930887,
-              0.041811634,
-              -0.04416108,
-              0.080970354,
-              0.021775935,
-              0.081765614,
-              0.033288363,
-              0.021744251,
-              0.0920779,
-              -0.052091073,
-              -0.13620377,
-              0.01355201,
-              -0.019836528,
-              -0.03622741,
-              -0.050273415,
-              -0.03297705,
-              0.046637394,
-              -0.062427662,
-              -0.05683662,
-              -0.027652364,
-              -0.15121156,
-              -0.09399186,
-              -0.011023118,
-              -0.024265675,
-              -0.046763826,
-              -0.002908067,
-              -0.066486366,
-              -0.025612496,
-              0.018278103,
-              0.0020231954,
-              -0.062278572,
-              -0.11748546,
-              -4.4292726e-33,
-              -0.009130088,
-              -0.037159156,
-              -0.026047857,
-              0.052019667,
-              0.00085722556,
-              0.006592443,
-              -0.0045248135,
-              -0.04015857,
-              0.004117024,
-              0.0428665,
-              -0.049716696,
-              0.045335494,
-              0.042848498,
-              0.044919603,
-              0.11100728,
-              0.021570923,
-              -0.031257298,
-              0.07225882,
-              -0.01912497,
-              -0.034713253,
-              0.06771385,
-              -0.016151445,
-              0.05971066,
-              -0.022954458,
-              0.028852448,
-              0.015406495,
-              -0.00031955744,
-              -0.012751747,
-              -0.03327897,
-              -0.00012636236,
-              -0.02479355,
-              -0.042213496,
-              -0.002454921,
-              0.041260865,
-              0.0919246,
-              0.06857511,
-              -0.0152807245,
-              -0.12649235,
-              0.016997697,
-              -0.08620996,
-              0.055064507,
-              0.030273788,
-              0.00431866,
-              0.031995468,
-              -0.03225614,
-              0.004922506,
-              0.009020533,
-              -0.023137338,
-              -0.040697925,
-              -0.09105851,
-              0.03639921,
-              0.024429396,
-              0.013554936,
-              0.032427397,
-              0.04099883,
-              0.037522644,
-              -0.041546755,
-              -0.079021014,
-              -0.053779483,
-              0.06449904,
-              -0.08023162,
-              0.021288263,
-              0.062299646,
-              0.0457609,
-              0.03245626,
-              0.08930955,
-              -0.040566627,
-              -0.031877786,
-              0.09784694,
-              0.018440586,
-              0.0055373674,
-              0.033386778,
-              -0.069314316,
-              0.0050042598,
-              -0.011121069,
-              0.04041817,
-              -0.018704956,
-              -0.06160915,
-              -0.019937823,
-              0.05572433,
-              -0.033941865,
-              -0.03284764,
-              0.039774805,
-              0.032533348,
-              -0.014803814,
-              -0.04081455,
-              0.090428285,
-              -0.07119735,
-              -0.045317948,
-              0.0044284705,
-              -0.011297022,
-              0.010466631,
-              -0.0050936122,
-              -0.032272205,
-              -0.014571677,
-              1.9730937e-33,
-              -0.014730757,
-              -0.011375904,
-              -0.018987043,
-              -0.030017996,
-              -0.03238378,
-              0.00021963792,
-              -0.012572021,
-              -0.121466525,
-              0.0020859565,
-              0.031917855,
-              -0.0047694035,
-              0.009451863,
-              0.07091064,
-              -0.10059175,
-              0.025064182,
-              0.06191513,
-              -0.0040704445,
-              -0.09924964,
-              -0.011796679,
-              -0.047690243,
-              -0.030504584,
-              0.06266709,
-              -0.07385124,
-              -0.0061550937,
-              -0.01423386,
-              0.0073556406,
-              -0.12380783,
-              -0.12357105,
-              0.049844977,
-              0.013651552,
-              -0.042339053,
-              -0.05773099,
-              0.008854461,
-              -0.039381962,
-              -0.010391537,
-              0.01995317,
-              0.06865881,
-              -0.0034758614,
-              0.034933414,
-              0.016901772,
-              -0.041236185,
-              0.1275965,
-              -0.010944973,
-              -0.038379222,
-              0.03352998,
-              0.024260346,
-              -0.009189018,
-              0.08945688,
-              -0.037322775,
-              -0.033685952,
-              0.083590224,
-              0.024379434,
-              0.013052954,
-              -0.082478285,
-              0.081726134,
-              0.025851976,
-              -0.040732652,
-              0.011625263,
-              0.045134045,
-              0.05800952,
-              -0.043148052,
-              -0.02189082,
-              0.0076365937,
-              0.07503425,
-              -0.0371004,
-              -0.04029487,
-              -0.044494897,
-              -0.10995023,
-              -0.024031844,
-              -0.08961193,
-              0.020242436,
-              0.030619737,
-              -0.021178389,
-              0.04682225,
-              -0.08384518,
-              -0.04420498,
-              -0.041840017,
-              0.031129008,
-              0.010757745,
-              0.06393576,
-              -0.0031622013,
-              -0.012325239,
-              0.03960315,
-              0.038744513,
-              0.04009258,
-              0.012087899,
-              0.060512736,
-              -0.04624927,
-              0.00929668,
-              -0.051231515,
-              -0.0496359,
-              -0.015559894,
-              -0.08582702,
-              0.07392022,
-              -0.02927744,
-              -1.4551534e-08,
-              -0.060233776,
-              -0.056502644,
-              -0.0039323824,
-              -0.030575769,
-              0.033688147,
-              -0.051516674,
-              0.011328192,
-              0.14126065,
-              0.02396768,
-              0.019315943,
-              0.06601706,
-              0.030757405,
-              -0.106958,
-              0.0033853063,
-              0.073158585,
-              0.024177559,
-              0.08089344,
-              -0.078784004,
-              -0.032134753,
-              0.07526011,
-              0.054319587,
-              0.009856976,
-              -0.12708029,
-              0.06313889,
-              0.09004333,
-              -0.0015960654,
-              0.058387086,
-              0.059561662,
-              -0.0047651688,
-              0.0229759,
-              0.03569084,
-              -0.034010228,
-              0.07279012,
-              0.07974487,
-              0.091203436,
-              0.022210982,
-              0.04596847,
-              0.044025153,
-              -0.083589375,
-              -0.10002216,
-              0.020842535,
-              0.023079954,
-              -0.04795557,
-              0.08441458,
-              0.0771154,
-              0.009332128,
-              -0.08095578,
-              0.092889085,
-              -0.020154007,
-              -0.0008010522,
-              -0.03861009,
-              0.016097447,
-              0.0070208795,
-              -0.017685603,
-              -0.002207989,
-              -0.02192508,
-              0.033382397,
-              -0.03214206,
-              -0.012332422,
-              -0.002134471,
-              0.021111421,
-              0.016544258,
-              0.017546006,
-              -0.07716502
+              -0.003961408,
+              0.051414188,
+              -0.00058039324,
+              -0.03805786,
+              0.00026862609,
+              -0.07164569,
+              -0.032947958,
+              0.029143414,
+              0.0895043,
+              0.027018296,
+              0.022992423,
+              0.029479899,
+              0.013462918,
+              0.021877697,
+              0.024697151,
+              0.023186686,
+              -0.06790505,
+              0.042193525,
+              -0.0668863,
+              -0.04484601,
+              -0.019504927,
+              -0.017638002,
+              -0.047011577,
+              0.010105266,
+              -0.035193082,
+              0.12793653,
+              -0.03992006,
+              -0.03702981,
+              0.021819357,
+              -0.06665871,
+              0.020533124,
+              0.03142357,
+              0.121719204,
+              0.037876442,
+              -0.075640336,
+              0.0359664,
+              0.11100785,
+              -0.02567441,
+              -0.07788109,
+              0.016981006,
+              -0.08081605,
+              0.042523988,
+              0.008232587,
+              0.0731737,
+              0.011123085,
+              0.016207846,
+              0.01944517,
+              -0.057269264,
+              -0.026940528,
+              0.027561199,
+              -0.103662655,
+              0.06181235,
+              -0.028062372,
+              0.04553612,
+              0.038513146,
+              0.10225101,
+              0.010200513,
+              0.003872203,
+              -0.074381135,
+              -0.0097752875,
+              -0.014599097,
+              0.0054576746,
+              -0.04897588,
+              0.024681844,
+              0.08043012,
+              -0.0014103616,
+              0.0008604012,
+              0.0016741438,
+              0.016251745,
+              0.00360708,
+              0.058014695,
+              -0.010049014,
+              -0.0084027,
+              0.06814959,
+              0.033971835,
+              -0.011656133,
+              -0.04935883,
+              -0.03459291,
+              0.022477727,
+              0.01610207,
+              0.025287844,
+              0.03501659,
+              -0.018194117,
+              0.06807382,
+              0.059983365,
+              -0.025374522,
+              0.04583719,
+              -0.04297365,
+              -0.104865946,
+              -0.028109012,
+              0.079001896,
+              -0.017114554,
+              0.012419278,
+              0.04061318,
+              -0.020101532,
+              0.026956845,
+              0.041828763,
+              -0.044170532,
+              0.08095696,
+              0.021788325,
+              0.081747636,
+              0.033276387,
+              0.021741632,
+              0.092068955,
+              -0.05207143,
+              -0.13620017,
+              0.013549487,
+              -0.019821124,
+              -0.036206715,
+              -0.050286006,
+              -0.032959178,
+              0.04662646,
+              -0.062424622,
+              -0.056837536,
+              -0.027646665,
+              -0.15120761,
+              -0.093959294,
+              -0.010999317,
+              -0.02427833,
+              -0.046769585,
+              -0.002897303,
+              -0.06647176,
+              -0.025597623,
+              0.018255977,
+              0.0020313214,
+              -0.06226326,
+              -0.117481604,
+              -4.4295206e-33,
+              -0.009129055,
+              -0.037181977,
+              -0.02604801,
+              0.052037112,
+              0.00087297254,
+              0.0065994835,
+              -0.0045263134,
+              -0.040167294,
+              0.0041152886,
+              0.042845216,
+              -0.049708433,
+              0.045345027,
+              0.04285296,
+              0.044911012,
+              0.11100636,
+              0.021593297,
+              -0.03125754,
+              0.072277226,
+              -0.01916381,
+              -0.03471753,
+              0.06770263,
+              -0.016145714,
+              0.05970865,
+              -0.02298266,
+              0.028831182,
+              0.015415605,
+              -0.00031274176,
+              -0.012733097,
+              -0.03328956,
+              -0.00013622487,
+              -0.024770694,
+              -0.042212497,
+              -0.0024302523,
+              0.04124051,
+              0.09191475,
+              0.06856497,
+              -0.015284932,
+              -0.12650564,
+              0.017038988,
+              -0.086213395,
+              0.05503028,
+              0.030287316,
+              0.0043085497,
+              0.03199775,
+              -0.032243066,
+              0.004920853,
+              0.009013211,
+              -0.023148343,
+              -0.04070659,
+              -0.091041416,
+              0.036388315,
+              0.024427423,
+              0.013590955,
+              0.032416057,
+              0.040976506,
+              0.037508775,
+              -0.041537814,
+              -0.0790035,
+              -0.05377612,
+              0.06448428,
+              -0.080218546,
+              0.021294411,
+              0.062302276,
+              0.045776673,
+              0.032483075,
+              0.08931608,
+              -0.04060625,
+              -0.031852096,
+              0.09785858,
+              0.01842136,
+              0.005539284,
+              0.033401128,
+              -0.069316946,
+              0.0050071795,
+              -0.01113226,
+              0.04040353,
+              -0.018702384,
+              -0.061634906,
+              -0.019955046,
+              0.055725593,
+              -0.0339558,
+              -0.03284888,
+              0.039789777,
+              0.032518264,
+              -0.014831044,
+              -0.040828414,
+              0.09042645,
+              -0.07117855,
+              -0.0452999,
+              0.004429679,
+              -0.011286574,
+              0.010456636,
+              -0.005107356,
+              -0.03228427,
+              -0.014561991,
+              1.973978e-33,
+              -0.014741807,
+              -0.011373571,
+              -0.018968971,
+              -0.030024195,
+              -0.032379575,
+              0.00021643718,
+              -0.012567692,
+              -0.121494584,
+              0.0020773544,
+              0.03192013,
+              -0.004760303,
+              0.0094626825,
+              0.070903994,
+              -0.10057645,
+              0.025073227,
+              0.0619163,
+              -0.0040503214,
+              -0.099229865,
+              -0.011797051,
+              -0.04770035,
+              -0.030485118,
+              0.06268395,
+              -0.073855996,
+              -0.0061467164,
+              -0.01423362,
+              0.0073681897,
+              -0.12381955,
+              -0.12358002,
+              0.049814835,
+              0.013639601,
+              -0.04231122,
+              -0.057728436,
+              0.008867639,
+              -0.03936158,
+              -0.010378862,
+              0.01995126,
+              0.06864242,
+              -0.0034683226,
+              0.034935873,
+              0.01691657,
+              -0.041248,
+              0.12756771,
+              -0.0109369,
+              -0.038407195,
+              0.03351686,
+              0.024284633,
+              -0.009186648,
+              0.089450404,
+              -0.037300985,
+              -0.033677705,
+              0.083595864,
+              0.024388704,
+              0.013052032,
+              -0.082466476,
+              0.08174954,
+              0.025851287,
+              -0.0407412,
+              0.011634866,
+              0.045149248,
+              0.057999264,
+              -0.043137826,
+              -0.0218611,
+              0.007614091,
+              0.075013876,
+              -0.037117332,
+              -0.040271968,
+              -0.044543337,
+              -0.10995435,
+              -0.024011672,
+              -0.08962033,
+              0.020206504,
+              0.030622963,
+              -0.021175418,
+              0.046819735,
+              -0.08388905,
+              -0.04419095,
+              -0.041822553,
+              0.031128531,
+              0.010744972,
+              0.06392119,
+              -0.0031621107,
+              -0.012324199,
+              0.039583333,
+              0.03872388,
+              0.04003792,
+              0.012126796,
+              0.060538515,
+              -0.046224117,
+              0.009284271,
+              -0.051235553,
+              -0.049639463,
+              -0.015559349,
+              -0.08584357,
+              0.07390804,
+              -0.029281551,
+              -1.4552155e-08,
+              -0.060234137,
+              -0.05653537,
+              -0.003924483,
+              -0.030553697,
+              0.033688337,
+              -0.051516354,
+              0.011325061,
+              0.14125879,
+              0.0239569,
+              0.01933575,
+              0.066012196,
+              0.030753234,
+              -0.10696803,
+              0.0034088665,
+              0.073148385,
+              0.02414587,
+              0.080867074,
+              -0.07877004,
+              -0.032145467,
+              0.07524812,
+              0.0542984,
+              0.009829384,
+              -0.1270656,
+              0.06314169,
+              0.09003407,
+              -0.0016169662,
+              0.058391552,
+              0.059590362,
+              -0.0047688517,
+              0.022996303,
+              0.035714924,
+              -0.034012605,
+              0.07277301,
+              0.0797266,
+              0.0912049,
+              0.022215161,
+              0.045965668,
+              0.04404474,
+              -0.083592154,
+              -0.10004596,
+              0.020836696,
+              0.023092525,
+              -0.047950342,
+              0.08443384,
+              0.0771323,
+              0.009310225,
+              -0.080956854,
+              0.09289323,
+              -0.020150434,
+              -0.00083508895,
+              -0.038630493,
+              0.01606296,
+              0.007031474,
+              -0.01770303,
+              -0.0022343053,
+              -0.021911092,
+              0.03337036,
+              -0.032134622,
+              -0.012314019,
+              -0.0021285508,
+              0.021125747,
+              0.016543584,
+              0.01756058,
+              -0.0771557
             ],
             "index": 0,
             "object": "embedding"
diff --git a/tests/integration/recordings/responses/bd356b27a085.json b/tests/integration/recordings/responses/bd356b27a085.json
index 58da672f0..f372e5af9 100644
--- a/tests/integration/recordings/responses/bd356b27a085.json
+++ b/tests/integration/recordings/responses/bd356b27a085.json
@@ -21,7 +21,7 @@
         "__type__": "ollama._types.GenerateResponse",
         "__data__": {
           "model": "llama3.2:3b-instruct-fp16",
-          "created_at": "2025-07-29T23:46:35.850399Z",
+          "created_at": "2025-09-03T17:34:22.916043Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -39,7 +39,7 @@
         "__type__": "ollama._types.GenerateResponse",
         "__data__": {
           "model": "llama3.2:3b-instruct-fp16",
-          "created_at": "2025-07-29T23:46:35.89419Z",
+          "created_at": "2025-09-03T17:34:22.957379Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -57,7 +57,7 @@
         "__type__": "ollama._types.GenerateResponse",
         "__data__": {
           "model": "llama3.2:3b-instruct-fp16",
-          "created_at": "2025-07-29T23:46:35.938049Z",
+          "created_at": "2025-09-03T17:34:23.00029Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -75,7 +75,7 @@
         "__type__": "ollama._types.GenerateResponse",
         "__data__": {
           "model": "llama3.2:3b-instruct-fp16",
-          "created_at": "2025-07-29T23:46:35.980392Z",
+          "created_at": "2025-09-03T17:34:23.043332Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -93,7 +93,7 @@
         "__type__": "ollama._types.GenerateResponse",
         "__data__": {
           "model": "llama3.2:3b-instruct-fp16",
-          "created_at": "2025-07-29T23:46:36.023004Z",
+          "created_at": "2025-09-03T17:34:23.085324Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -111,7 +111,7 @@
         "__type__": "ollama._types.GenerateResponse",
         "__data__": {
           "model": "llama3.2:3b-instruct-fp16",
-          "created_at": "2025-07-29T23:46:36.065467Z",
+          "created_at": "2025-09-03T17:34:23.128181Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -129,7 +129,7 @@
         "__type__": "ollama._types.GenerateResponse",
         "__data__": {
           "model": "llama3.2:3b-instruct-fp16",
-          "created_at": "2025-07-29T23:46:36.108189Z",
+          "created_at": "2025-09-03T17:34:23.172026Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -147,15 +147,15 @@
         "__type__": "ollama._types.GenerateResponse",
         "__data__": {
           "model": "llama3.2:3b-instruct-fp16",
-          "created_at": "2025-07-29T23:46:36.150902Z",
+          "created_at": "2025-09-03T17:34:23.216706Z",
           "done": true,
           "done_reason": "stop",
-          "total_duration": 468910417,
-          "load_duration": 93969000,
+          "total_duration": 516060000,
+          "load_duration": 127260334,
           "prompt_eval_count": 479,
-          "prompt_eval_duration": 72596750,
+          "prompt_eval_duration": 87107292,
           "eval_count": 8,
-          "eval_duration": 301590375,
+          "eval_duration": 299381042,
           "response": "",
           "thinking": null,
           "context": null
diff --git a/tests/integration/recordings/responses/c2199d6064db.json b/tests/integration/recordings/responses/c2199d6064db.json
index 73194cc00..ff7298e86 100644
--- a/tests/integration/recordings/responses/c2199d6064db.json
+++ b/tests/integration/recordings/responses/c2199d6064db.json
@@ -20,390 +20,390 @@
         "data": [
           {
             "embedding": [
-              -0.021827588,
-              0.08818103,
-              -0.10864717,
-              0.0027738505,
-              0.049183175,
-              -0.030155653,
-              -0.015535575,
-              0.027562236,
-              -0.025055608,
-              0.016142149,
-              0.12481904,
-              0.0027390872,
-              -0.033304155,
-              -0.007155499,
-              -0.07006565,
-              -0.028012667,
-              -0.0974939,
-              -0.09156265,
-              0.013381448,
-              0.08751534,
-              0.013976399,
-              0.036656633,
-              -0.0363098,
-              -0.019737098,
-              0.04459191,
-              -0.009628102,
-              -0.018323021,
-              0.048807826,
-              -0.015294308,
-              -0.071472056,
-              0.04096934,
-              0.08271212,
-              0.06394962,
-              0.014480425,
-              0.13194743,
-              0.030426797,
-              0.10103986,
-              -0.030337727,
-              -0.047615312,
-              0.044662375,
-              0.027032219,
-              -0.029383352,
-              0.038528103,
-              0.005350361,
-              0.014771562,
-              0.02561623,
-              0.0041866824,
-              0.0035074751,
-              0.029762248,
-              -0.036631253,
-              -0.045908086,
-              0.031111827,
-              -0.07789252,
-              -0.019519411,
-              0.053894877,
-              -0.015229676,
-              -0.0016866667,
-              0.016928526,
-              0.019906636,
-              0.071048684,
-              0.009945389,
-              0.031127382,
-              -0.010339295,
-              0.029969081,
-              0.1150558,
-              0.0257364,
-              -0.05285643,
-              -0.042424288,
-              0.00530526,
-              -0.09986522,
-              -0.12739678,
-              -0.012008937,
-              -0.013796879,
-              0.052672364,
-              -0.017240625,
-              0.009655106,
-              -0.07752442,
-              0.001446598,
-              0.06974642,
-              -0.084652565,
-              -0.06148656,
-              -0.1424512,
-              0.00971367,
-              -0.008617611,
-              -0.03184207,
-              0.12822424,
-              0.05323436,
-              0.021975016,
-              0.0026292745,
-              0.015444466,
-              -0.042529456,
-              0.031529475,
-              -0.062093526,
-              0.044023193,
-              -0.006063745,
-              0.06960859,
-              0.0050675236,
-              0.05936227,
-              0.006593922,
-              0.08395398,
-              -0.0067747384,
-              -0.041917052,
-              0.027087294,
-              0.1064389,
-              -0.03939661,
-              -0.053915743,
-              0.0969116,
-              -0.008478297,
-              0.03400473,
-              -0.033850323,
-              0.0022322247,
-              -0.08182309,
-              -0.008227045,
-              -0.112729885,
-              0.0058874753,
-              -0.09516338,
-              -0.07956543,
-              0.0528746,
-              -0.08121418,
-              0.034270033,
-              0.079010375,
-              -0.026773734,
-              -0.043880418,
-              0.0067898994,
-              -0.054401524,
-              -0.021739269,
-              0.08060149,
-              -3.9385423e-33,
-              -0.0072775874,
-              -0.07965713,
-              0.024867468,
-              0.115594625,
-              0.035952598,
-              -0.07256428,
-              0.01264772,
-              0.05078877,
-              -0.1001076,
-              0.019520493,
-              0.003609843,
-              -0.07002774,
-              0.00796547,
-              0.029297192,
-              -0.017813923,
-              0.026997875,
-              0.016828112,
-              0.035944253,
-              -0.020945141,
-              -0.032345034,
-              0.056713093,
-              -0.009717346,
-              -0.059717353,
-              -0.053816583,
-              -0.055860512,
-              0.0652541,
-              -0.024728304,
-              -0.07780815,
-              0.038602088,
-              0.008995879,
-              0.009711051,
-              -0.02800488,
-              -0.02488407,
-              -0.001753672,
-              0.025541821,
-              0.03461599,
-              3.1180356e-05,
-              0.0034299733,
-              -0.04524332,
-              0.034621477,
-              -0.025317375,
-              -0.029820684,
-              -0.019064484,
-              -0.023168772,
-              0.049378216,
-              -0.0614278,
-              0.00038631904,
-              0.0028947273,
-              0.027602436,
-              0.0069355685,
-              -0.020665208,
-              0.0607627,
-              0.015200459,
-              0.038925096,
-              -0.025373906,
-              -0.0017942133,
-              -0.019378444,
-              -0.005707356,
-              -0.01781858,
-              0.03804118,
-              0.032033492,
-              0.039991416,
-              -0.096098565,
-              0.0007088372,
-              -0.018460834,
-              -0.06865977,
-              -0.007682667,
-              -0.083552696,
-              0.10225278,
-              0.05144313,
-              -0.033060983,
-              -0.05033815,
-              0.043931242,
-              0.017761385,
-              -0.006623071,
-              -0.018680306,
-              0.012787289,
-              0.016647147,
-              -0.095078625,
-              -0.023556676,
-              0.0068797185,
-              -0.07225466,
-              -0.0030222975,
-              -0.06930809,
-              -0.027324349,
-              -0.06728827,
-              -0.0066746464,
-              -0.06802411,
-              0.044557177,
-              -0.09791178,
-              0.05094532,
-              0.010023194,
-              -0.04618695,
-              -0.067631915,
-              0.044459086,
-              2.564085e-33,
-              0.0148239555,
-              0.071699664,
-              -0.05235211,
-              0.011046101,
-              -0.01389393,
-              0.07070217,
-              0.09194932,
-              -0.019197263,
-              -0.01579352,
-              0.14807871,
-              0.03188067,
-              0.022338957,
-              0.070754,
-              -0.037077773,
-              0.08807045,
-              -0.018151604,
-              -0.013233297,
-              -0.04176197,
-              -0.05230764,
-              -0.0027928778,
-              -0.024819419,
-              0.13973284,
-              0.07498215,
-              0.05643386,
-              -0.02942886,
-              0.017126264,
-              0.03372573,
-              0.068746336,
-              0.020448433,
-              -0.018980682,
-              0.081244655,
-              0.06527421,
-              -0.09341324,
-              0.0037619828,
-              0.06348108,
-              -0.08774056,
-              0.092889525,
-              -0.024263546,
-              0.029117694,
-              0.0034306366,
-              0.055297706,
-              0.102015935,
-              -0.023556657,
-              0.065803,
-              0.015247541,
-              0.034352973,
-              0.105588056,
-              0.011606838,
-              0.04098301,
-              -0.056642916,
-              0.037729684,
-              -0.04976193,
-              0.047909457,
-              0.0042117573,
-              -0.014169,
-              0.07561971,
-              -0.0096767275,
-              0.055205546,
-              -0.031133024,
-              0.019914651,
-              -0.025017431,
-              0.031833746,
-              -0.019527186,
-              -0.009863273,
-              -0.020237885,
-              -0.033213306,
-              -0.026289295,
-              0.038861252,
-              0.012964407,
-              -0.041289695,
-              0.012831493,
-              0.028716395,
-              -0.054101057,
-              -0.07626151,
-              0.021948934,
-              -0.023362676,
-              -0.026700463,
-              -0.029420532,
-              0.0052917786,
-              0.012322609,
-              0.052309964,
-              0.005428001,
-              -0.0063846395,
-              0.046033006,
-              0.042387757,
-              -0.018442502,
-              0.012625506,
-              0.093027025,
-              -0.0059689214,
-              -0.015190377,
-              -0.011668946,
-              0.048090797,
-              0.025912488,
-              0.050898798,
-              0.005562451,
-              -1.5056784e-08,
-              -0.030993447,
-              -0.07005236,
-              -0.032605737,
-              -0.00874509,
-              -0.004551062,
-              0.07593507,
-              -0.032746524,
-              -0.08790053,
-              -0.032251474,
-              -0.024588991,
-              0.051248234,
-              -0.0345528,
-              -0.08264784,
-              0.013345202,
-              -0.020562632,
-              -0.05624872,
-              -0.009445643,
-              -0.015907064,
-              -0.036610577,
-              0.010109376,
-              -0.0343682,
-              0.0315048,
-              -0.00014384133,
-              0.010448328,
-              0.017060373,
-              0.015475448,
-              0.074810885,
-              0.07080812,
-              -0.050022244,
-              -0.047005255,
-              0.013738294,
-              0.060728636,
-              -0.009370956,
-              -0.015692767,
-              -0.01834865,
-              0.12297243,
-              0.11857768,
-              0.123661466,
-              0.022802081,
-              -0.019996397,
-              -0.07401723,
-              -0.004714934,
-              -0.02488245,
-              0.006072489,
-              -0.066606365,
-              -0.081319734,
-              -0.08740771,
-              -0.06348687,
-              -0.039211858,
-              -0.11271469,
-              -0.030644065,
-              0.026577946,
-              -0.06322251,
-              0.042043004,
-              -0.03901968,
-              -0.009200455,
-              0.0050292667,
-              0.001581719,
-              -0.058653522,
-              0.04309485,
-              0.066819645,
-              0.062200524,
-              0.021176148,
-              -0.04108276
+              -0.021802,
+              0.088129535,
+              -0.10867403,
+              0.0027561262,
+              0.04917365,
+              -0.030165128,
+              -0.0155558735,
+              0.027549915,
+              -0.025064131,
+              0.016137881,
+              0.124836035,
+              0.0027821937,
+              -0.033310093,
+              -0.0071708336,
+              -0.07004796,
+              -0.027996853,
+              -0.09748515,
+              -0.091607764,
+              0.013367206,
+              0.08752305,
+              0.013990884,
+              0.03663788,
+              -0.036330026,
+              -0.019752761,
+              0.04456914,
+              -0.009629443,
+              -0.01832647,
+              0.048832405,
+              -0.015315298,
+              -0.07147843,
+              0.04094573,
+              0.082709365,
+              0.063961774,
+              0.01448001,
+              0.13194442,
+              0.0303949,
+              0.101027474,
+              -0.030359762,
+              -0.047630757,
+              0.044637363,
+              0.027034018,
+              -0.029368822,
+              0.038537122,
+              0.0053882804,
+              0.01478374,
+              0.025617138,
+              0.0041860593,
+              0.0034900715,
+              0.029765956,
+              -0.036669906,
+              -0.04589116,
+              0.031120853,
+              -0.07786974,
+              -0.019517597,
+              0.053876307,
+              -0.0152282175,
+              -0.0016955235,
+              0.016938528,
+              0.019939963,
+              0.07106882,
+              0.009938938,
+              0.03114348,
+              -0.010335175,
+              0.029952966,
+              0.115054145,
+              0.025746102,
+              -0.052842245,
+              -0.042447682,
+              0.0053093657,
+              -0.09987591,
+              -0.12741813,
+              -0.012022532,
+              -0.013787561,
+              0.05265948,
+              -0.01723935,
+              0.009638554,
+              -0.0775266,
+              0.0014047497,
+              0.06974368,
+              -0.08465856,
+              -0.061480872,
+              -0.14244927,
+              0.0096944375,
+              -0.008611519,
+              -0.0318523,
+              0.12823504,
+              0.053257603,
+              0.021978743,
+              0.0026468195,
+              0.015444479,
+              -0.042528655,
+              0.031551417,
+              -0.06209267,
+              0.044017885,
+              -0.0060390937,
+              0.06959196,
+              0.0050514904,
+              0.059341036,
+              0.00658094,
+              0.08397857,
+              -0.0067914296,
+              -0.041901726,
+              0.027081704,
+              0.106456675,
+              -0.039408114,
+              -0.053899165,
+              0.09689717,
+              -0.0084604705,
+              0.03398384,
+              -0.033843804,
+              0.002225838,
+              -0.08180734,
+              -0.008216738,
+              -0.11271415,
+              0.0058824755,
+              -0.095151186,
+              -0.07958445,
+              0.052868627,
+              -0.08120183,
+              0.034291897,
+              0.07903789,
+              -0.02675632,
+              -0.04391073,
+              0.0067707864,
+              -0.05438546,
+              -0.021719433,
+              0.080597855,
+              -3.9388086e-33,
+              -0.0072714644,
+              -0.079664536,
+              0.024838887,
+              0.115598045,
+              0.03591746,
+              -0.07254434,
+              0.012642099,
+              0.050809097,
+              -0.100082524,
+              0.019521356,
+              0.0035883472,
+              -0.07001022,
+              0.007977421,
+              0.029305879,
+              -0.017785804,
+              0.02702277,
+              0.016827941,
+              0.035956737,
+              -0.0209356,
+              -0.032321777,
+              0.056705642,
+              -0.009747762,
+              -0.059722506,
+              -0.053817417,
+              -0.055837773,
+              0.06526892,
+              -0.024752634,
+              -0.07778206,
+              0.038636208,
+              0.008998632,
+              0.009699391,
+              -0.02798574,
+              -0.024878206,
+              -0.0017547129,
+              0.025541965,
+              0.034623418,
+              -8.975541e-06,
+              0.0034556785,
+              -0.04525613,
+              0.03461154,
+              -0.025307115,
+              -0.02981576,
+              -0.019071916,
+              -0.023184983,
+              0.049324982,
+              -0.061433185,
+              0.00038017757,
+              0.0028894164,
+              0.027610173,
+              0.0069347974,
+              -0.020659719,
+              0.060771395,
+              0.015200205,
+              0.038918514,
+              -0.025353896,
+              -0.0017897633,
+              -0.019378036,
+              -0.0056970986,
+              -0.017806012,
+              0.038060427,
+              0.0320353,
+              0.03998783,
+              -0.09612384,
+              0.0006942505,
+              -0.018478483,
+              -0.06866618,
+              -0.0077035497,
+              -0.083554305,
+              0.10223985,
+              0.05141575,
+              -0.033018276,
+              -0.05033401,
+              0.043923385,
+              0.017748218,
+              -0.006601344,
+              -0.018691983,
+              0.012763011,
+              0.016694913,
+              -0.095070764,
+              -0.023533016,
+              0.006879241,
+              -0.07225332,
+              -0.0029991802,
+              -0.06930797,
+              -0.027289826,
+              -0.0672911,
+              -0.006683099,
+              -0.06801406,
+              0.04452207,
+              -0.09788058,
+              0.050909285,
+              0.010051549,
+              -0.04617998,
+              -0.067622505,
+              0.04447288,
+              2.5643933e-33,
+              0.014783131,
+              0.071710624,
+              -0.05237768,
+              0.011041238,
+              -0.013921518,
+              0.07072471,
+              0.091977395,
+              -0.01916791,
+              -0.015780058,
+              0.14812021,
+              0.031904023,
+              0.022344623,
+              0.07071857,
+              -0.037060503,
+              0.08806883,
+              -0.018145561,
+              -0.013254877,
+              -0.041782882,
+              -0.052317847,
+              -0.00279131,
+              -0.024807084,
+              0.13974102,
+              0.074973755,
+              0.056424167,
+              -0.029412953,
+              0.017093861,
+              0.03373144,
+              0.06874087,
+              0.020454561,
+              -0.018965451,
+              0.081238694,
+              0.06527906,
+              -0.09342225,
+              0.0037720343,
+              0.06347132,
+              -0.08775714,
+              0.09286548,
+              -0.024266576,
+              0.029101077,
+              0.0034162905,
+              0.05528427,
+              0.102037616,
+              -0.023588225,
+              0.065829135,
+              0.01520327,
+              0.034344077,
+              0.10559419,
+              0.011605323,
+              0.0409873,
+              -0.056635953,
+              0.037730522,
+              -0.04976337,
+              0.047961522,
+              0.0042118295,
+              -0.014172872,
+              0.07564937,
+              -0.009671058,
+              0.05520304,
+              -0.031121492,
+              0.019924358,
+              -0.024975697,
+              0.031822197,
+              -0.019536836,
+              -0.009870229,
+              -0.020225972,
+              -0.03319855,
+              -0.026266782,
+              0.038882248,
+              0.012940086,
+              -0.041266225,
+              0.012833021,
+              0.028703777,
+              -0.054075323,
+              -0.07628176,
+              0.021953572,
+              -0.023357453,
+              -0.026714878,
+              -0.029401133,
+              0.005280363,
+              0.012325193,
+              0.05232579,
+              0.0054451786,
+              -0.0063759633,
+              0.04604998,
+              0.042399842,
+              -0.018433316,
+              0.01260558,
+              0.09300185,
+              -0.005949781,
+              -0.015193224,
+              -0.011673769,
+              0.048114438,
+              0.02588804,
+              0.050943956,
+              0.005536351,
+              -1.5059804e-08,
+              -0.03100338,
+              -0.07003323,
+              -0.032613333,
+              -0.008732137,
+              -0.0045523546,
+              0.0759239,
+              -0.032725554,
+              -0.08790561,
+              -0.032228027,
+              -0.02459868,
+              0.051224917,
+              -0.034561895,
+              -0.08266327,
+              0.013319846,
+              -0.020541467,
+              -0.056271035,
+              -0.009450659,
+              -0.015903467,
+              -0.036625408,
+              0.010096497,
+              -0.03440534,
+              0.0315293,
+              -0.00013937108,
+              0.010463861,
+              0.017065981,
+              0.015492903,
+              0.074808784,
+              0.07079003,
+              -0.050000764,
+              -0.047017526,
+              0.01375958,
+              0.060757488,
+              -0.009361379,
+              -0.01570009,
+              -0.01836736,
+              0.12301148,
+              0.1185397,
+              0.12366319,
+              0.022782512,
+              -0.020027133,
+              -0.07401259,
+              -0.0047104736,
+              -0.024872223,
+              0.006070436,
+              -0.06660639,
+              -0.08130306,
+              -0.0873992,
+              -0.0634906,
+              -0.039198957,
+              -0.11274462,
+              -0.030654918,
+              0.026607778,
+              -0.063220546,
+              0.042023618,
+              -0.039010853,
+              -0.009214424,
+              0.005044682,
+              0.0015641748,
+              -0.058640927,
+              0.043107104,
+              0.06682025,
+              0.062172387,
+              0.021147223,
+              -0.041068073
             ],
             "index": 0,
             "object": "embedding"
diff --git a/tests/integration/recordings/responses/c9cba6f3ee38.json b/tests/integration/recordings/responses/c9cba6f3ee38.json
index 488ac6563..02363c70e 100644
--- a/tests/integration/recordings/responses/c9cba6f3ee38.json
+++ b/tests/integration/recordings/responses/c9cba6f3ee38.json
@@ -20,15 +20,15 @@
       "__type__": "ollama._types.GenerateResponse",
       "__data__": {
         "model": "llama-guard3:1b",
-        "created_at": "2025-08-01T23:14:21.909783Z",
+        "created_at": "2025-09-03T17:38:03.002753Z",
         "done": true,
         "done_reason": "stop",
-        "total_duration": 311036333,
-        "load_duration": 37569542,
+        "total_duration": 334941166,
+        "load_duration": 149512166,
         "prompt_eval_count": 219,
-        "prompt_eval_duration": 259000000,
+        "prompt_eval_duration": 173843500,
         "eval_count": 2,
-        "eval_duration": 12000000,
+        "eval_duration": 11119166,
         "response": "safe",
         "thinking": null,
         "context": null
diff --git a/tests/integration/recordings/responses/cb3df2a1dc22.json b/tests/integration/recordings/responses/cb3df2a1dc22.json
index d65945ac1..41db65a5e 100644
--- a/tests/integration/recordings/responses/cb3df2a1dc22.json
+++ b/tests/integration/recordings/responses/cb3df2a1dc22.json
@@ -1,7 +1,7 @@
 {
   "request": {
     "method": "POST",
-    "url": "http://localhost:11434/v1/v1/chat/completions",
+    "url": "http://0.0.0.0:11434/v1/v1/chat/completions",
     "headers": {},
     "body": {
       "model": "llama3.2:3b-instruct-fp16",
@@ -20,14 +20,14 @@
     "body": {
       "__type__": "openai.types.chat.chat_completion.ChatCompletion",
       "__data__": {
-        "id": "chatcmpl-877",
+        "id": "chatcmpl-271",
         "choices": [
           {
             "finish_reason": "stop",
             "index": 0,
             "logprobs": null,
             "message": {
-              "content": "I'm not capable of directly testing the functionality of external systems like Telemetry. However, I can provide you with some general information about creating telemetry data and offer suggestions on how to set up a basic telemetry system.\r\n\r\nTelemetry is the automatic measurement, reporting, and transmission of data from sensors or other devices. In the context of OpenAI, telemetry refers to the collection and analysis of data related to the company's products and services.\r\n\r\nTo create telemetry creation using the OpenAI APIs you would need to follow these steps:\r\n\r\n1. Register for an OpenAI account and get an access token.\r\n2. Choose the OpenAI API that you want to use (e.g., GPT-3).\r\n3. Create a new file or project in your preferred programming language or framework.\r\n4. Import the necessary libraries and modules to interact with the OpenAI API.\r\n5. Use the OpenAI API to create and send telemetry data.\r\n\r\nHere is an example of how you might create a basic telemetry system using Python and the OpenAI GPT-3 API:\r\n\r\n```python\r\nimport os\r\nimport json\r\n\r\n# Set your OpenAI access token\r\naccess_token = \"YOUR_OPENAI_ACCESS_TOKEN\"\r\n\r\n# Define the telemetry data\r\ntelemetry_data = {\r\n    \"name\": \"example-telemetry\",\r\n    \"description\": \"Example telemetry data.\r\n\r\n    # Define the telemetry metrics\r\n    \"metrics\": [\r\n        {\"key\": \"users\", \"value\": 100},\r\n        {\"key\": \" engagement\", \"value\": 20}\r\n    ]\r\n}\r\n\r\n# Convert the telemetry data to JSON\r\ntelemetry_json = json.dumps(telemetry_data)\r\n\r\n# Set the OpenAI API endpoint and headers\r\napi_endpoint = \"https://api.openai.com/v1/telemetry\"\r\nheaders = {\r\n    \"Authorization\": f\"Bearer {access_token}\",\r\n    \"Content-Type\": \"application/json\"\r\n}\r\n\r\n# Send the telemetry data to the OpenAI API\r\nimport requests\r\n\r\nresponse = requests.post(api_endpoint, headers=headers, data=telemetry_json)\r\n\r\n# Check if the request was successful\r\nif response.status_code == 200:\r\n    print(\"Telemetry data sent successfully\")\r\nelse:\r\n    print(\"Error sending telemetry data\")\r\n```\n\nPlease note that this is a basic example and you should adjust it according to your needs. Also, the specific implementation details may vary depending on the OpenAI API you're using and the programming language or framework you're working with.\r\n\r\nI hope this helps! Let me know if you have any further questions.",
+              "content": "# OpenAI Telemetry Creation Testing\n\nThis guide provides a test environment for creating and analyzing telemetries using the OpenAI API.\n\n## Prerequisites\n\n-   Python 3.8 or higher\n-   `requests` library\n-   An OpenAI API key (create an account on the [OpenAI website](https://openai.com/))\n\n## Step 1: Install Required Libraries\n\nFirst, install the required libraries by running the following command in your terminal:\n\n```bash\npip install requests\n```\n\n## Step 2: Create a Telemetry Object\n\nCreate a new Python file (e.g., `telemetry.py`) and import the required library. Define a telemetry object with the relevant data:\n\n```python\n# Import the requests library\nimport requests\n\nclass Telemetry:\n    def __init__(self, api_key):\n        \"\"\"\n        Initialize the telemetry object.\n\n        Args:\n            api_key (str): The OpenAI API key.\n        \"\"\"\n\n        self.api_key = api_key\n\n    def create_telemetry(self, id, data):\n        \"\"\"\n        Create a new telemetry entry using the OpenAI API.\n\n        Args:\n            id (str): The ID of the model or dataset.\n            data (dict): The telemetry data to be created.\n\n        Returns:\n            dict: The response from the OpenAI API.\n\n        Raises:\n            ValueError: If the request fails.\n        \"\"\"\n\n        url = f\"https://api.openai.com/v1/models/{id}/telemetry\"\n\n        headers = {\n            \"Authorization\": self.api_key,\n            \"Content-Type\": \"application/json\",\n        }\n\n        telemetry_data = {\"events\": data}\n\n        response = requests.post(url, json=telemetry_data, headers=headers)\n\n        if not response.ok:\n            raise ValueError(\"Failed to create telemetry\")\n\n        return response.json()\n```\n\n## Step 3: Usage Example\n\nHere's an example usage of the `Telemetry` class:\n\n```python\n# Create a new Telemetry object with your OpenAI API key\ntelemetry = Telemetry(\n    \"YOUR_OPENAI_API_KEY_HERE\"\n)\n\n# Define the telemetry data\ndata = {\"event\": \"example_event\"}\n\n# Create a new telemetry entry\nid = \"my_model_id\"  # Replace with your model or dataset ID\n\ntry:\n    result = telemetry.create_telemetry(id, data)\n    print(result)\nexcept ValueError as e:\n    print(e)\n```\n\nThis code creates a new `Telemetry` object, defines some sample telemetry data, and uses the `create_telemetry` method to create a new telemetry entry. The response from the OpenAI API is printed out.\n\nNote: Replace `\"YOUR_OPENAI_API_KEY_HERE\"` with your actual OpenAI API key.\n\n## Conclusion\n\nThis guide provides a basic example of how to create telemetries using the OpenAI API. You can modify the code and implement additional features as needed for your project.\n\nStay updated on our latest tutorials and guides:\n\n*   [Check out our Discord channel](link): https://discord.gg/openai-exists\n\nHappy coding!",
               "refusal": null,
               "role": "assistant",
               "annotations": null,
@@ -37,15 +37,15 @@
             }
           }
         ],
-        "created": 1754510083,
+        "created": 1756921299,
         "model": "llama3.2:3b-instruct-fp16",
         "object": "chat.completion",
         "service_tier": null,
         "system_fingerprint": "fp_ollama",
         "usage": {
-          "completion_tokens": 505,
+          "completion_tokens": 633,
           "prompt_tokens": 30,
-          "total_tokens": 535,
+          "total_tokens": 663,
           "completion_tokens_details": null,
           "prompt_tokens_details": null
         }
diff --git a/tests/integration/recordings/responses/cd094caaf1c0.json b/tests/integration/recordings/responses/cd094caaf1c0.json
index c0b3873d3..70a3d334d 100644
--- a/tests/integration/recordings/responses/cd094caaf1c0.json
+++ b/tests/integration/recordings/responses/cd094caaf1c0.json
@@ -21,7 +21,7 @@
         "__type__": "ollama._types.GenerateResponse",
         "__data__": {
           "model": "llama3.2:3b-instruct-fp16",
-          "created_at": "2025-08-04T22:55:14.822116Z",
+          "created_at": "2025-09-03T17:36:21.138019Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -39,7 +39,7 @@
         "__type__": "ollama._types.GenerateResponse",
         "__data__": {
           "model": "llama3.2:3b-instruct-fp16",
-          "created_at": "2025-08-04T22:55:14.874482Z",
+          "created_at": "2025-09-03T17:36:21.179853Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -57,7 +57,7 @@
         "__type__": "ollama._types.GenerateResponse",
         "__data__": {
           "model": "llama3.2:3b-instruct-fp16",
-          "created_at": "2025-08-04T22:55:14.926533Z",
+          "created_at": "2025-09-03T17:36:21.220635Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -75,7 +75,7 @@
         "__type__": "ollama._types.GenerateResponse",
         "__data__": {
           "model": "llama3.2:3b-instruct-fp16",
-          "created_at": "2025-08-04T22:55:14.980659Z",
+          "created_at": "2025-09-03T17:36:21.261418Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -93,7 +93,7 @@
         "__type__": "ollama._types.GenerateResponse",
         "__data__": {
           "model": "llama3.2:3b-instruct-fp16",
-          "created_at": "2025-08-04T22:55:15.036126Z",
+          "created_at": "2025-09-03T17:36:21.301991Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -111,7 +111,7 @@
         "__type__": "ollama._types.GenerateResponse",
         "__data__": {
           "model": "llama3.2:3b-instruct-fp16",
-          "created_at": "2025-08-04T22:55:15.087015Z",
+          "created_at": "2025-09-03T17:36:21.3425Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -129,7 +129,7 @@
         "__type__": "ollama._types.GenerateResponse",
         "__data__": {
           "model": "llama3.2:3b-instruct-fp16",
-          "created_at": "2025-08-04T22:55:15.137306Z",
+          "created_at": "2025-09-03T17:36:21.38302Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -147,7 +147,7 @@
         "__type__": "ollama._types.GenerateResponse",
         "__data__": {
           "model": "llama3.2:3b-instruct-fp16",
-          "created_at": "2025-08-04T22:55:15.189129Z",
+          "created_at": "2025-09-03T17:36:21.423862Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -165,7 +165,7 @@
         "__type__": "ollama._types.GenerateResponse",
         "__data__": {
           "model": "llama3.2:3b-instruct-fp16",
-          "created_at": "2025-08-04T22:55:15.240264Z",
+          "created_at": "2025-09-03T17:36:21.464611Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -183,7 +183,7 @@
         "__type__": "ollama._types.GenerateResponse",
         "__data__": {
           "model": "llama3.2:3b-instruct-fp16",
-          "created_at": "2025-08-04T22:55:15.291201Z",
+          "created_at": "2025-09-03T17:36:21.505714Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -201,7 +201,7 @@
         "__type__": "ollama._types.GenerateResponse",
         "__data__": {
           "model": "llama3.2:3b-instruct-fp16",
-          "created_at": "2025-08-04T22:55:15.341476Z",
+          "created_at": "2025-09-03T17:36:21.547075Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -219,7 +219,7 @@
         "__type__": "ollama._types.GenerateResponse",
         "__data__": {
           "model": "llama3.2:3b-instruct-fp16",
-          "created_at": "2025-08-04T22:55:15.39284Z",
+          "created_at": "2025-09-03T17:36:21.588896Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -237,7 +237,7 @@
         "__type__": "ollama._types.GenerateResponse",
         "__data__": {
           "model": "llama3.2:3b-instruct-fp16",
-          "created_at": "2025-08-04T22:55:15.44438Z",
+          "created_at": "2025-09-03T17:36:21.629146Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -255,7 +255,7 @@
         "__type__": "ollama._types.GenerateResponse",
         "__data__": {
           "model": "llama3.2:3b-instruct-fp16",
-          "created_at": "2025-08-04T22:55:15.497561Z",
+          "created_at": "2025-09-03T17:36:21.669722Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -273,7 +273,7 @@
         "__type__": "ollama._types.GenerateResponse",
         "__data__": {
           "model": "llama3.2:3b-instruct-fp16",
-          "created_at": "2025-08-04T22:55:15.550461Z",
+          "created_at": "2025-09-03T17:36:21.710707Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -291,7 +291,7 @@
         "__type__": "ollama._types.GenerateResponse",
         "__data__": {
           "model": "llama3.2:3b-instruct-fp16",
-          "created_at": "2025-08-04T22:55:15.599866Z",
+          "created_at": "2025-09-03T17:36:21.751267Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -309,7 +309,7 @@
         "__type__": "ollama._types.GenerateResponse",
         "__data__": {
           "model": "llama3.2:3b-instruct-fp16",
-          "created_at": "2025-08-04T22:55:15.651899Z",
+          "created_at": "2025-09-03T17:36:21.791565Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -327,7 +327,7 @@
         "__type__": "ollama._types.GenerateResponse",
         "__data__": {
           "model": "llama3.2:3b-instruct-fp16",
-          "created_at": "2025-08-04T22:55:15.702896Z",
+          "created_at": "2025-09-03T17:36:21.83176Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -345,7 +345,7 @@
         "__type__": "ollama._types.GenerateResponse",
         "__data__": {
           "model": "llama3.2:3b-instruct-fp16",
-          "created_at": "2025-08-04T22:55:15.75492Z",
+          "created_at": "2025-09-03T17:36:21.872029Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -363,7 +363,7 @@
         "__type__": "ollama._types.GenerateResponse",
         "__data__": {
           "model": "llama3.2:3b-instruct-fp16",
-          "created_at": "2025-08-04T22:55:15.805824Z",
+          "created_at": "2025-09-03T17:36:21.914066Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -381,7 +381,7 @@
         "__type__": "ollama._types.GenerateResponse",
         "__data__": {
           "model": "llama3.2:3b-instruct-fp16",
-          "created_at": "2025-08-04T22:55:15.8564Z",
+          "created_at": "2025-09-03T17:36:21.955317Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -399,7 +399,7 @@
         "__type__": "ollama._types.GenerateResponse",
         "__data__": {
           "model": "llama3.2:3b-instruct-fp16",
-          "created_at": "2025-08-04T22:55:15.907374Z",
+          "created_at": "2025-09-03T17:36:21.995588Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -417,7 +417,7 @@
         "__type__": "ollama._types.GenerateResponse",
         "__data__": {
           "model": "llama3.2:3b-instruct-fp16",
-          "created_at": "2025-08-04T22:55:15.959599Z",
+          "created_at": "2025-09-03T17:36:22.03605Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -435,7 +435,7 @@
         "__type__": "ollama._types.GenerateResponse",
         "__data__": {
           "model": "llama3.2:3b-instruct-fp16",
-          "created_at": "2025-08-04T22:55:16.012545Z",
+          "created_at": "2025-09-03T17:36:22.076924Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -453,7 +453,7 @@
         "__type__": "ollama._types.GenerateResponse",
         "__data__": {
           "model": "llama3.2:3b-instruct-fp16",
-          "created_at": "2025-08-04T22:55:16.065508Z",
+          "created_at": "2025-09-03T17:36:22.117922Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -471,7 +471,7 @@
         "__type__": "ollama._types.GenerateResponse",
         "__data__": {
           "model": "llama3.2:3b-instruct-fp16",
-          "created_at": "2025-08-04T22:55:16.122471Z",
+          "created_at": "2025-09-03T17:36:22.158925Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -489,7 +489,7 @@
         "__type__": "ollama._types.GenerateResponse",
         "__data__": {
           "model": "llama3.2:3b-instruct-fp16",
-          "created_at": "2025-08-04T22:55:16.175606Z",
+          "created_at": "2025-09-03T17:36:22.199113Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -507,7 +507,7 @@
         "__type__": "ollama._types.GenerateResponse",
         "__data__": {
           "model": "llama3.2:3b-instruct-fp16",
-          "created_at": "2025-08-04T22:55:16.227171Z",
+          "created_at": "2025-09-03T17:36:22.239797Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -525,7 +525,7 @@
         "__type__": "ollama._types.GenerateResponse",
         "__data__": {
           "model": "llama3.2:3b-instruct-fp16",
-          "created_at": "2025-08-04T22:55:16.278522Z",
+          "created_at": "2025-09-03T17:36:22.280592Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -543,7 +543,7 @@
         "__type__": "ollama._types.GenerateResponse",
         "__data__": {
           "model": "llama3.2:3b-instruct-fp16",
-          "created_at": "2025-08-04T22:55:16.329492Z",
+          "created_at": "2025-09-03T17:36:22.321607Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -561,7 +561,7 @@
         "__type__": "ollama._types.GenerateResponse",
         "__data__": {
           "model": "llama3.2:3b-instruct-fp16",
-          "created_at": "2025-08-04T22:55:16.381232Z",
+          "created_at": "2025-09-03T17:36:22.36237Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -579,7 +579,7 @@
         "__type__": "ollama._types.GenerateResponse",
         "__data__": {
           "model": "llama3.2:3b-instruct-fp16",
-          "created_at": "2025-08-04T22:55:16.43463Z",
+          "created_at": "2025-09-03T17:36:22.402735Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -597,7 +597,7 @@
         "__type__": "ollama._types.GenerateResponse",
         "__data__": {
           "model": "llama3.2:3b-instruct-fp16",
-          "created_at": "2025-08-04T22:55:16.483135Z",
+          "created_at": "2025-09-03T17:36:22.44328Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -615,7 +615,7 @@
         "__type__": "ollama._types.GenerateResponse",
         "__data__": {
           "model": "llama3.2:3b-instruct-fp16",
-          "created_at": "2025-08-04T22:55:16.544729Z",
+          "created_at": "2025-09-03T17:36:22.48369Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -633,7 +633,7 @@
         "__type__": "ollama._types.GenerateResponse",
         "__data__": {
           "model": "llama3.2:3b-instruct-fp16",
-          "created_at": "2025-08-04T22:55:16.605218Z",
+          "created_at": "2025-09-03T17:36:22.524383Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -651,7 +651,7 @@
         "__type__": "ollama._types.GenerateResponse",
         "__data__": {
           "model": "llama3.2:3b-instruct-fp16",
-          "created_at": "2025-08-04T22:55:16.660652Z",
+          "created_at": "2025-09-03T17:36:22.564975Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -669,7 +669,7 @@
         "__type__": "ollama._types.GenerateResponse",
         "__data__": {
           "model": "llama3.2:3b-instruct-fp16",
-          "created_at": "2025-08-04T22:55:16.718606Z",
+          "created_at": "2025-09-03T17:36:22.605886Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -687,7 +687,7 @@
         "__type__": "ollama._types.GenerateResponse",
         "__data__": {
           "model": "llama3.2:3b-instruct-fp16",
-          "created_at": "2025-08-04T22:55:16.772786Z",
+          "created_at": "2025-09-03T17:36:22.646199Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -705,7 +705,7 @@
         "__type__": "ollama._types.GenerateResponse",
         "__data__": {
           "model": "llama3.2:3b-instruct-fp16",
-          "created_at": "2025-08-04T22:55:16.826904Z",
+          "created_at": "2025-09-03T17:36:22.686594Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -723,7 +723,7 @@
         "__type__": "ollama._types.GenerateResponse",
         "__data__": {
           "model": "llama3.2:3b-instruct-fp16",
-          "created_at": "2025-08-04T22:55:16.878735Z",
+          "created_at": "2025-09-03T17:36:22.726941Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -741,7 +741,7 @@
         "__type__": "ollama._types.GenerateResponse",
         "__data__": {
           "model": "llama3.2:3b-instruct-fp16",
-          "created_at": "2025-08-04T22:55:16.931262Z",
+          "created_at": "2025-09-03T17:36:22.767696Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -759,7 +759,7 @@
         "__type__": "ollama._types.GenerateResponse",
         "__data__": {
           "model": "llama3.2:3b-instruct-fp16",
-          "created_at": "2025-08-04T22:55:16.984266Z",
+          "created_at": "2025-09-03T17:36:22.810962Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -777,7 +777,7 @@
         "__type__": "ollama._types.GenerateResponse",
         "__data__": {
           "model": "llama3.2:3b-instruct-fp16",
-          "created_at": "2025-08-04T22:55:17.035518Z",
+          "created_at": "2025-09-03T17:36:22.851903Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -795,7 +795,7 @@
         "__type__": "ollama._types.GenerateResponse",
         "__data__": {
           "model": "llama3.2:3b-instruct-fp16",
-          "created_at": "2025-08-04T22:55:17.084669Z",
+          "created_at": "2025-09-03T17:36:22.892412Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -813,7 +813,7 @@
         "__type__": "ollama._types.GenerateResponse",
         "__data__": {
           "model": "llama3.2:3b-instruct-fp16",
-          "created_at": "2025-08-04T22:55:17.138856Z",
+          "created_at": "2025-09-03T17:36:22.932877Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -831,7 +831,7 @@
         "__type__": "ollama._types.GenerateResponse",
         "__data__": {
           "model": "llama3.2:3b-instruct-fp16",
-          "created_at": "2025-08-04T22:55:17.19578Z",
+          "created_at": "2025-09-03T17:36:22.973247Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -849,7 +849,7 @@
         "__type__": "ollama._types.GenerateResponse",
         "__data__": {
           "model": "llama3.2:3b-instruct-fp16",
-          "created_at": "2025-08-04T22:55:17.254009Z",
+          "created_at": "2025-09-03T17:36:23.013989Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -867,7 +867,7 @@
         "__type__": "ollama._types.GenerateResponse",
         "__data__": {
           "model": "llama3.2:3b-instruct-fp16",
-          "created_at": "2025-08-04T22:55:17.307391Z",
+          "created_at": "2025-09-03T17:36:23.054251Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -885,7 +885,7 @@
         "__type__": "ollama._types.GenerateResponse",
         "__data__": {
           "model": "llama3.2:3b-instruct-fp16",
-          "created_at": "2025-08-04T22:55:17.363223Z",
+          "created_at": "2025-09-03T17:36:23.094676Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -903,7 +903,7 @@
         "__type__": "ollama._types.GenerateResponse",
         "__data__": {
           "model": "llama3.2:3b-instruct-fp16",
-          "created_at": "2025-08-04T22:55:17.420075Z",
+          "created_at": "2025-09-03T17:36:23.135452Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -921,7 +921,7 @@
         "__type__": "ollama._types.GenerateResponse",
         "__data__": {
           "model": "llama3.2:3b-instruct-fp16",
-          "created_at": "2025-08-04T22:55:17.475276Z",
+          "created_at": "2025-09-03T17:36:23.176336Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -939,7 +939,7 @@
         "__type__": "ollama._types.GenerateResponse",
         "__data__": {
           "model": "llama3.2:3b-instruct-fp16",
-          "created_at": "2025-08-04T22:55:17.529886Z",
+          "created_at": "2025-09-03T17:36:23.216888Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -957,7 +957,7 @@
         "__type__": "ollama._types.GenerateResponse",
         "__data__": {
           "model": "llama3.2:3b-instruct-fp16",
-          "created_at": "2025-08-04T22:55:17.587218Z",
+          "created_at": "2025-09-03T17:36:23.257355Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -975,7 +975,7 @@
         "__type__": "ollama._types.GenerateResponse",
         "__data__": {
           "model": "llama3.2:3b-instruct-fp16",
-          "created_at": "2025-08-04T22:55:17.640408Z",
+          "created_at": "2025-09-03T17:36:23.297487Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -993,7 +993,7 @@
         "__type__": "ollama._types.GenerateResponse",
         "__data__": {
           "model": "llama3.2:3b-instruct-fp16",
-          "created_at": "2025-08-04T22:55:17.692792Z",
+          "created_at": "2025-09-03T17:36:23.337777Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -1011,7 +1011,7 @@
         "__type__": "ollama._types.GenerateResponse",
         "__data__": {
           "model": "llama3.2:3b-instruct-fp16",
-          "created_at": "2025-08-04T22:55:17.746336Z",
+          "created_at": "2025-09-03T17:36:23.37817Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -1029,7 +1029,7 @@
         "__type__": "ollama._types.GenerateResponse",
         "__data__": {
           "model": "llama3.2:3b-instruct-fp16",
-          "created_at": "2025-08-04T22:55:17.801383Z",
+          "created_at": "2025-09-03T17:36:23.418119Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -1047,7 +1047,7 @@
         "__type__": "ollama._types.GenerateResponse",
         "__data__": {
           "model": "llama3.2:3b-instruct-fp16",
-          "created_at": "2025-08-04T22:55:17.854621Z",
+          "created_at": "2025-09-03T17:36:23.458074Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -1065,7 +1065,7 @@
         "__type__": "ollama._types.GenerateResponse",
         "__data__": {
           "model": "llama3.2:3b-instruct-fp16",
-          "created_at": "2025-08-04T22:55:17.911212Z",
+          "created_at": "2025-09-03T17:36:23.498828Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -1083,7 +1083,7 @@
         "__type__": "ollama._types.GenerateResponse",
         "__data__": {
           "model": "llama3.2:3b-instruct-fp16",
-          "created_at": "2025-08-04T22:55:17.970851Z",
+          "created_at": "2025-09-03T17:36:23.539337Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -1101,7 +1101,7 @@
         "__type__": "ollama._types.GenerateResponse",
         "__data__": {
           "model": "llama3.2:3b-instruct-fp16",
-          "created_at": "2025-08-04T22:55:18.025592Z",
+          "created_at": "2025-09-03T17:36:23.579947Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -1119,7 +1119,7 @@
         "__type__": "ollama._types.GenerateResponse",
         "__data__": {
           "model": "llama3.2:3b-instruct-fp16",
-          "created_at": "2025-08-04T22:55:18.084169Z",
+          "created_at": "2025-09-03T17:36:23.620572Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -1137,7 +1137,7 @@
         "__type__": "ollama._types.GenerateResponse",
         "__data__": {
           "model": "llama3.2:3b-instruct-fp16",
-          "created_at": "2025-08-04T22:55:18.142748Z",
+          "created_at": "2025-09-03T17:36:23.661884Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -1155,7 +1155,7 @@
         "__type__": "ollama._types.GenerateResponse",
         "__data__": {
           "model": "llama3.2:3b-instruct-fp16",
-          "created_at": "2025-08-04T22:55:18.198201Z",
+          "created_at": "2025-09-03T17:36:23.703234Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -1173,7 +1173,7 @@
         "__type__": "ollama._types.GenerateResponse",
         "__data__": {
           "model": "llama3.2:3b-instruct-fp16",
-          "created_at": "2025-08-04T22:55:18.247029Z",
+          "created_at": "2025-09-03T17:36:23.743994Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -1191,7 +1191,7 @@
         "__type__": "ollama._types.GenerateResponse",
         "__data__": {
           "model": "llama3.2:3b-instruct-fp16",
-          "created_at": "2025-08-04T22:55:18.298673Z",
+          "created_at": "2025-09-03T17:36:23.784238Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -1209,7 +1209,7 @@
         "__type__": "ollama._types.GenerateResponse",
         "__data__": {
           "model": "llama3.2:3b-instruct-fp16",
-          "created_at": "2025-08-04T22:55:18.346985Z",
+          "created_at": "2025-09-03T17:36:23.824425Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -1227,7 +1227,7 @@
         "__type__": "ollama._types.GenerateResponse",
         "__data__": {
           "model": "llama3.2:3b-instruct-fp16",
-          "created_at": "2025-08-04T22:55:18.396338Z",
+          "created_at": "2025-09-03T17:36:23.864711Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -1245,7 +1245,7 @@
         "__type__": "ollama._types.GenerateResponse",
         "__data__": {
           "model": "llama3.2:3b-instruct-fp16",
-          "created_at": "2025-08-04T22:55:18.44707Z",
+          "created_at": "2025-09-03T17:36:23.904729Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -1263,7 +1263,7 @@
         "__type__": "ollama._types.GenerateResponse",
         "__data__": {
           "model": "llama3.2:3b-instruct-fp16",
-          "created_at": "2025-08-04T22:55:18.500596Z",
+          "created_at": "2025-09-03T17:36:23.944762Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -1281,7 +1281,7 @@
         "__type__": "ollama._types.GenerateResponse",
         "__data__": {
           "model": "llama3.2:3b-instruct-fp16",
-          "created_at": "2025-08-04T22:55:18.552919Z",
+          "created_at": "2025-09-03T17:36:23.985199Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -1299,7 +1299,7 @@
         "__type__": "ollama._types.GenerateResponse",
         "__data__": {
           "model": "llama3.2:3b-instruct-fp16",
-          "created_at": "2025-08-04T22:55:18.605569Z",
+          "created_at": "2025-09-03T17:36:24.025821Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -1317,7 +1317,7 @@
         "__type__": "ollama._types.GenerateResponse",
         "__data__": {
           "model": "llama3.2:3b-instruct-fp16",
-          "created_at": "2025-08-04T22:55:18.657753Z",
+          "created_at": "2025-09-03T17:36:24.066639Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -1335,7 +1335,7 @@
         "__type__": "ollama._types.GenerateResponse",
         "__data__": {
           "model": "llama3.2:3b-instruct-fp16",
-          "created_at": "2025-08-04T22:55:18.712933Z",
+          "created_at": "2025-09-03T17:36:24.109215Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -1353,7 +1353,7 @@
         "__type__": "ollama._types.GenerateResponse",
         "__data__": {
           "model": "llama3.2:3b-instruct-fp16",
-          "created_at": "2025-08-04T22:55:18.765708Z",
+          "created_at": "2025-09-03T17:36:24.15123Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -1371,7 +1371,7 @@
         "__type__": "ollama._types.GenerateResponse",
         "__data__": {
           "model": "llama3.2:3b-instruct-fp16",
-          "created_at": "2025-08-04T22:55:18.81852Z",
+          "created_at": "2025-09-03T17:36:24.192856Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -1389,7 +1389,7 @@
         "__type__": "ollama._types.GenerateResponse",
         "__data__": {
           "model": "llama3.2:3b-instruct-fp16",
-          "created_at": "2025-08-04T22:55:18.870752Z",
+          "created_at": "2025-09-03T17:36:24.23433Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -1407,7 +1407,7 @@
         "__type__": "ollama._types.GenerateResponse",
         "__data__": {
           "model": "llama3.2:3b-instruct-fp16",
-          "created_at": "2025-08-04T22:55:18.922652Z",
+          "created_at": "2025-09-03T17:36:24.275212Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -1425,7 +1425,7 @@
         "__type__": "ollama._types.GenerateResponse",
         "__data__": {
           "model": "llama3.2:3b-instruct-fp16",
-          "created_at": "2025-08-04T22:55:18.974032Z",
+          "created_at": "2025-09-03T17:36:24.315722Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -1443,7 +1443,7 @@
         "__type__": "ollama._types.GenerateResponse",
         "__data__": {
           "model": "llama3.2:3b-instruct-fp16",
-          "created_at": "2025-08-04T22:55:19.025272Z",
+          "created_at": "2025-09-03T17:36:24.355996Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -1461,7 +1461,7 @@
         "__type__": "ollama._types.GenerateResponse",
         "__data__": {
           "model": "llama3.2:3b-instruct-fp16",
-          "created_at": "2025-08-04T22:55:19.076061Z",
+          "created_at": "2025-09-03T17:36:24.396181Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -1479,7 +1479,7 @@
         "__type__": "ollama._types.GenerateResponse",
         "__data__": {
           "model": "llama3.2:3b-instruct-fp16",
-          "created_at": "2025-08-04T22:55:19.126893Z",
+          "created_at": "2025-09-03T17:36:24.43716Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -1497,7 +1497,7 @@
         "__type__": "ollama._types.GenerateResponse",
         "__data__": {
           "model": "llama3.2:3b-instruct-fp16",
-          "created_at": "2025-08-04T22:55:19.179123Z",
+          "created_at": "2025-09-03T17:36:24.478009Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -1515,7 +1515,7 @@
         "__type__": "ollama._types.GenerateResponse",
         "__data__": {
           "model": "llama3.2:3b-instruct-fp16",
-          "created_at": "2025-08-04T22:55:19.230189Z",
+          "created_at": "2025-09-03T17:36:24.519697Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -1533,7 +1533,7 @@
         "__type__": "ollama._types.GenerateResponse",
         "__data__": {
           "model": "llama3.2:3b-instruct-fp16",
-          "created_at": "2025-08-04T22:55:19.280582Z",
+          "created_at": "2025-09-03T17:36:24.562228Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -1551,7 +1551,7 @@
         "__type__": "ollama._types.GenerateResponse",
         "__data__": {
           "model": "llama3.2:3b-instruct-fp16",
-          "created_at": "2025-08-04T22:55:19.330127Z",
+          "created_at": "2025-09-03T17:36:24.604366Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -1569,7 +1569,7 @@
         "__type__": "ollama._types.GenerateResponse",
         "__data__": {
           "model": "llama3.2:3b-instruct-fp16",
-          "created_at": "2025-08-04T22:55:19.379656Z",
+          "created_at": "2025-09-03T17:36:24.645258Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -1587,7 +1587,7 @@
         "__type__": "ollama._types.GenerateResponse",
         "__data__": {
           "model": "llama3.2:3b-instruct-fp16",
-          "created_at": "2025-08-04T22:55:19.430197Z",
+          "created_at": "2025-09-03T17:36:24.686966Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -1605,7 +1605,7 @@
         "__type__": "ollama._types.GenerateResponse",
         "__data__": {
           "model": "llama3.2:3b-instruct-fp16",
-          "created_at": "2025-08-04T22:55:19.48034Z",
+          "created_at": "2025-09-03T17:36:24.726702Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -1623,7 +1623,7 @@
         "__type__": "ollama._types.GenerateResponse",
         "__data__": {
           "model": "llama3.2:3b-instruct-fp16",
-          "created_at": "2025-08-04T22:55:19.530546Z",
+          "created_at": "2025-09-03T17:36:24.766742Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -1641,7 +1641,7 @@
         "__type__": "ollama._types.GenerateResponse",
         "__data__": {
           "model": "llama3.2:3b-instruct-fp16",
-          "created_at": "2025-08-04T22:55:19.583294Z",
+          "created_at": "2025-09-03T17:36:24.806841Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -1659,7 +1659,7 @@
         "__type__": "ollama._types.GenerateResponse",
         "__data__": {
           "model": "llama3.2:3b-instruct-fp16",
-          "created_at": "2025-08-04T22:55:19.630956Z",
+          "created_at": "2025-09-03T17:36:24.846655Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -1677,7 +1677,7 @@
         "__type__": "ollama._types.GenerateResponse",
         "__data__": {
           "model": "llama3.2:3b-instruct-fp16",
-          "created_at": "2025-08-04T22:55:19.682434Z",
+          "created_at": "2025-09-03T17:36:24.886602Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -1695,7 +1695,7 @@
         "__type__": "ollama._types.GenerateResponse",
         "__data__": {
           "model": "llama3.2:3b-instruct-fp16",
-          "created_at": "2025-08-04T22:55:19.731714Z",
+          "created_at": "2025-09-03T17:36:24.926582Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -1713,7 +1713,7 @@
         "__type__": "ollama._types.GenerateResponse",
         "__data__": {
           "model": "llama3.2:3b-instruct-fp16",
-          "created_at": "2025-08-04T22:55:19.780871Z",
+          "created_at": "2025-09-03T17:36:24.966301Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -1731,7 +1731,7 @@
         "__type__": "ollama._types.GenerateResponse",
         "__data__": {
           "model": "llama3.2:3b-instruct-fp16",
-          "created_at": "2025-08-04T22:55:19.829955Z",
+          "created_at": "2025-09-03T17:36:25.006614Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -1749,7 +1749,7 @@
         "__type__": "ollama._types.GenerateResponse",
         "__data__": {
           "model": "llama3.2:3b-instruct-fp16",
-          "created_at": "2025-08-04T22:55:19.880971Z",
+          "created_at": "2025-09-03T17:36:25.046631Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -1767,7 +1767,7 @@
         "__type__": "ollama._types.GenerateResponse",
         "__data__": {
           "model": "llama3.2:3b-instruct-fp16",
-          "created_at": "2025-08-04T22:55:19.931241Z",
+          "created_at": "2025-09-03T17:36:25.086885Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -1785,7 +1785,7 @@
         "__type__": "ollama._types.GenerateResponse",
         "__data__": {
           "model": "llama3.2:3b-instruct-fp16",
-          "created_at": "2025-08-04T22:55:19.980096Z",
+          "created_at": "2025-09-03T17:36:25.127555Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -1803,7 +1803,7 @@
         "__type__": "ollama._types.GenerateResponse",
         "__data__": {
           "model": "llama3.2:3b-instruct-fp16",
-          "created_at": "2025-08-04T22:55:20.03407Z",
+          "created_at": "2025-09-03T17:36:25.168437Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -1821,7 +1821,7 @@
         "__type__": "ollama._types.GenerateResponse",
         "__data__": {
           "model": "llama3.2:3b-instruct-fp16",
-          "created_at": "2025-08-04T22:55:20.090735Z",
+          "created_at": "2025-09-03T17:36:25.20913Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -1839,7 +1839,7 @@
         "__type__": "ollama._types.GenerateResponse",
         "__data__": {
           "model": "llama3.2:3b-instruct-fp16",
-          "created_at": "2025-08-04T22:55:20.153924Z",
+          "created_at": "2025-09-03T17:36:25.249991Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -1857,7 +1857,7 @@
         "__type__": "ollama._types.GenerateResponse",
         "__data__": {
           "model": "llama3.2:3b-instruct-fp16",
-          "created_at": "2025-08-04T22:55:20.220305Z",
+          "created_at": "2025-09-03T17:36:25.29007Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -1875,7 +1875,7 @@
         "__type__": "ollama._types.GenerateResponse",
         "__data__": {
           "model": "llama3.2:3b-instruct-fp16",
-          "created_at": "2025-08-04T22:55:20.304523Z",
+          "created_at": "2025-09-03T17:36:25.331038Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -1893,7 +1893,7 @@
         "__type__": "ollama._types.GenerateResponse",
         "__data__": {
           "model": "llama3.2:3b-instruct-fp16",
-          "created_at": "2025-08-04T22:55:20.4249Z",
+          "created_at": "2025-09-03T17:36:25.37155Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -1911,7 +1911,7 @@
         "__type__": "ollama._types.GenerateResponse",
         "__data__": {
           "model": "llama3.2:3b-instruct-fp16",
-          "created_at": "2025-08-04T22:55:20.483091Z",
+          "created_at": "2025-09-03T17:36:25.413816Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -1929,7 +1929,7 @@
         "__type__": "ollama._types.GenerateResponse",
         "__data__": {
           "model": "llama3.2:3b-instruct-fp16",
-          "created_at": "2025-08-04T22:55:20.552198Z",
+          "created_at": "2025-09-03T17:36:25.457114Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -1947,7 +1947,7 @@
         "__type__": "ollama._types.GenerateResponse",
         "__data__": {
           "model": "llama3.2:3b-instruct-fp16",
-          "created_at": "2025-08-04T22:55:20.651684Z",
+          "created_at": "2025-09-03T17:36:25.49976Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -1965,7 +1965,7 @@
         "__type__": "ollama._types.GenerateResponse",
         "__data__": {
           "model": "llama3.2:3b-instruct-fp16",
-          "created_at": "2025-08-04T22:55:20.767844Z",
+          "created_at": "2025-09-03T17:36:25.540794Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -1983,7 +1983,7 @@
         "__type__": "ollama._types.GenerateResponse",
         "__data__": {
           "model": "llama3.2:3b-instruct-fp16",
-          "created_at": "2025-08-04T22:55:20.836273Z",
+          "created_at": "2025-09-03T17:36:25.581085Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -2001,7 +2001,7 @@
         "__type__": "ollama._types.GenerateResponse",
         "__data__": {
           "model": "llama3.2:3b-instruct-fp16",
-          "created_at": "2025-08-04T22:55:20.919729Z",
+          "created_at": "2025-09-03T17:36:25.62194Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -2019,7 +2019,7 @@
         "__type__": "ollama._types.GenerateResponse",
         "__data__": {
           "model": "llama3.2:3b-instruct-fp16",
-          "created_at": "2025-08-04T22:55:20.987772Z",
+          "created_at": "2025-09-03T17:36:25.66242Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -2037,7 +2037,7 @@
         "__type__": "ollama._types.GenerateResponse",
         "__data__": {
           "model": "llama3.2:3b-instruct-fp16",
-          "created_at": "2025-08-04T22:55:21.0516Z",
+          "created_at": "2025-09-03T17:36:25.702827Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -2055,7 +2055,7 @@
         "__type__": "ollama._types.GenerateResponse",
         "__data__": {
           "model": "llama3.2:3b-instruct-fp16",
-          "created_at": "2025-08-04T22:55:21.118611Z",
+          "created_at": "2025-09-03T17:36:25.743383Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -2073,7 +2073,7 @@
         "__type__": "ollama._types.GenerateResponse",
         "__data__": {
           "model": "llama3.2:3b-instruct-fp16",
-          "created_at": "2025-08-04T22:55:21.182092Z",
+          "created_at": "2025-09-03T17:36:25.785523Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -2091,7 +2091,7 @@
         "__type__": "ollama._types.GenerateResponse",
         "__data__": {
           "model": "llama3.2:3b-instruct-fp16",
-          "created_at": "2025-08-04T22:55:21.241399Z",
+          "created_at": "2025-09-03T17:36:25.828276Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -2109,7 +2109,7 @@
         "__type__": "ollama._types.GenerateResponse",
         "__data__": {
           "model": "llama3.2:3b-instruct-fp16",
-          "created_at": "2025-08-04T22:55:21.296699Z",
+          "created_at": "2025-09-03T17:36:25.871231Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -2127,7 +2127,7 @@
         "__type__": "ollama._types.GenerateResponse",
         "__data__": {
           "model": "llama3.2:3b-instruct-fp16",
-          "created_at": "2025-08-04T22:55:21.355772Z",
+          "created_at": "2025-09-03T17:36:25.913246Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -2145,7 +2145,7 @@
         "__type__": "ollama._types.GenerateResponse",
         "__data__": {
           "model": "llama3.2:3b-instruct-fp16",
-          "created_at": "2025-08-04T22:55:21.410821Z",
+          "created_at": "2025-09-03T17:36:25.955162Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -2163,7 +2163,7 @@
         "__type__": "ollama._types.GenerateResponse",
         "__data__": {
           "model": "llama3.2:3b-instruct-fp16",
-          "created_at": "2025-08-04T22:55:21.46582Z",
+          "created_at": "2025-09-03T17:36:25.997821Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -2181,7 +2181,7 @@
         "__type__": "ollama._types.GenerateResponse",
         "__data__": {
           "model": "llama3.2:3b-instruct-fp16",
-          "created_at": "2025-08-04T22:55:21.520896Z",
+          "created_at": "2025-09-03T17:36:26.03971Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -2199,7 +2199,7 @@
         "__type__": "ollama._types.GenerateResponse",
         "__data__": {
           "model": "llama3.2:3b-instruct-fp16",
-          "created_at": "2025-08-04T22:55:21.58943Z",
+          "created_at": "2025-09-03T17:36:26.082988Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -2217,7 +2217,7 @@
         "__type__": "ollama._types.GenerateResponse",
         "__data__": {
           "model": "llama3.2:3b-instruct-fp16",
-          "created_at": "2025-08-04T22:55:21.700526Z",
+          "created_at": "2025-09-03T17:36:26.126136Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -2235,7 +2235,7 @@
         "__type__": "ollama._types.GenerateResponse",
         "__data__": {
           "model": "llama3.2:3b-instruct-fp16",
-          "created_at": "2025-08-04T22:55:21.772492Z",
+          "created_at": "2025-09-03T17:36:26.168484Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -2253,7 +2253,7 @@
         "__type__": "ollama._types.GenerateResponse",
         "__data__": {
           "model": "llama3.2:3b-instruct-fp16",
-          "created_at": "2025-08-04T22:55:21.839261Z",
+          "created_at": "2025-09-03T17:36:26.210934Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -2271,7 +2271,7 @@
         "__type__": "ollama._types.GenerateResponse",
         "__data__": {
           "model": "llama3.2:3b-instruct-fp16",
-          "created_at": "2025-08-04T22:55:21.90185Z",
+          "created_at": "2025-09-03T17:36:26.25385Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -2289,7 +2289,7 @@
         "__type__": "ollama._types.GenerateResponse",
         "__data__": {
           "model": "llama3.2:3b-instruct-fp16",
-          "created_at": "2025-08-04T22:55:21.96248Z",
+          "created_at": "2025-09-03T17:36:26.295017Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -2307,7 +2307,7 @@
         "__type__": "ollama._types.GenerateResponse",
         "__data__": {
           "model": "llama3.2:3b-instruct-fp16",
-          "created_at": "2025-08-04T22:55:22.024705Z",
+          "created_at": "2025-09-03T17:36:26.335776Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -2325,7 +2325,7 @@
         "__type__": "ollama._types.GenerateResponse",
         "__data__": {
           "model": "llama3.2:3b-instruct-fp16",
-          "created_at": "2025-08-04T22:55:22.079411Z",
+          "created_at": "2025-09-03T17:36:26.377421Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -2343,7 +2343,7 @@
         "__type__": "ollama._types.GenerateResponse",
         "__data__": {
           "model": "llama3.2:3b-instruct-fp16",
-          "created_at": "2025-08-04T22:55:22.132835Z",
+          "created_at": "2025-09-03T17:36:26.419324Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -2361,7 +2361,7 @@
         "__type__": "ollama._types.GenerateResponse",
         "__data__": {
           "model": "llama3.2:3b-instruct-fp16",
-          "created_at": "2025-08-04T22:55:22.189848Z",
+          "created_at": "2025-09-03T17:36:26.460598Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -2379,7 +2379,7 @@
         "__type__": "ollama._types.GenerateResponse",
         "__data__": {
           "model": "llama3.2:3b-instruct-fp16",
-          "created_at": "2025-08-04T22:55:22.252016Z",
+          "created_at": "2025-09-03T17:36:26.502926Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -2397,7 +2397,7 @@
         "__type__": "ollama._types.GenerateResponse",
         "__data__": {
           "model": "llama3.2:3b-instruct-fp16",
-          "created_at": "2025-08-04T22:55:22.316246Z",
+          "created_at": "2025-09-03T17:36:26.545467Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -2415,7 +2415,7 @@
         "__type__": "ollama._types.GenerateResponse",
         "__data__": {
           "model": "llama3.2:3b-instruct-fp16",
-          "created_at": "2025-08-04T22:55:22.384612Z",
+          "created_at": "2025-09-03T17:36:26.587384Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -2433,7 +2433,7 @@
         "__type__": "ollama._types.GenerateResponse",
         "__data__": {
           "model": "llama3.2:3b-instruct-fp16",
-          "created_at": "2025-08-04T22:55:22.444066Z",
+          "created_at": "2025-09-03T17:36:26.628641Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -2451,7 +2451,7 @@
         "__type__": "ollama._types.GenerateResponse",
         "__data__": {
           "model": "llama3.2:3b-instruct-fp16",
-          "created_at": "2025-08-04T22:55:22.50686Z",
+          "created_at": "2025-09-03T17:36:26.669783Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -2469,7 +2469,7 @@
         "__type__": "ollama._types.GenerateResponse",
         "__data__": {
           "model": "llama3.2:3b-instruct-fp16",
-          "created_at": "2025-08-04T22:55:22.562225Z",
+          "created_at": "2025-09-03T17:36:26.710862Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -2487,7 +2487,7 @@
         "__type__": "ollama._types.GenerateResponse",
         "__data__": {
           "model": "llama3.2:3b-instruct-fp16",
-          "created_at": "2025-08-04T22:55:22.621013Z",
+          "created_at": "2025-09-03T17:36:26.751949Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -2505,7 +2505,7 @@
         "__type__": "ollama._types.GenerateResponse",
         "__data__": {
           "model": "llama3.2:3b-instruct-fp16",
-          "created_at": "2025-08-04T22:55:22.682489Z",
+          "created_at": "2025-09-03T17:36:26.793375Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -2523,7 +2523,7 @@
         "__type__": "ollama._types.GenerateResponse",
         "__data__": {
           "model": "llama3.2:3b-instruct-fp16",
-          "created_at": "2025-08-04T22:55:22.754211Z",
+          "created_at": "2025-09-03T17:36:26.835697Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -2541,7 +2541,7 @@
         "__type__": "ollama._types.GenerateResponse",
         "__data__": {
           "model": "llama3.2:3b-instruct-fp16",
-          "created_at": "2025-08-04T22:55:22.813395Z",
+          "created_at": "2025-09-03T17:36:26.876139Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -2559,7 +2559,7 @@
         "__type__": "ollama._types.GenerateResponse",
         "__data__": {
           "model": "llama3.2:3b-instruct-fp16",
-          "created_at": "2025-08-04T22:55:22.872143Z",
+          "created_at": "2025-09-03T17:36:26.917322Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -2577,7 +2577,7 @@
         "__type__": "ollama._types.GenerateResponse",
         "__data__": {
           "model": "llama3.2:3b-instruct-fp16",
-          "created_at": "2025-08-04T22:55:22.930176Z",
+          "created_at": "2025-09-03T17:36:26.958405Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -2595,7 +2595,7 @@
         "__type__": "ollama._types.GenerateResponse",
         "__data__": {
           "model": "llama3.2:3b-instruct-fp16",
-          "created_at": "2025-08-04T22:55:22.989936Z",
+          "created_at": "2025-09-03T17:36:26.999602Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -2613,7 +2613,7 @@
         "__type__": "ollama._types.GenerateResponse",
         "__data__": {
           "model": "llama3.2:3b-instruct-fp16",
-          "created_at": "2025-08-04T22:55:23.052675Z",
+          "created_at": "2025-09-03T17:36:27.041369Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -2631,7 +2631,7 @@
         "__type__": "ollama._types.GenerateResponse",
         "__data__": {
           "model": "llama3.2:3b-instruct-fp16",
-          "created_at": "2025-08-04T22:55:23.116141Z",
+          "created_at": "2025-09-03T17:36:27.082117Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -2649,7 +2649,7 @@
         "__type__": "ollama._types.GenerateResponse",
         "__data__": {
           "model": "llama3.2:3b-instruct-fp16",
-          "created_at": "2025-08-04T22:55:23.171904Z",
+          "created_at": "2025-09-03T17:36:27.124286Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -2667,7 +2667,7 @@
         "__type__": "ollama._types.GenerateResponse",
         "__data__": {
           "model": "llama3.2:3b-instruct-fp16",
-          "created_at": "2025-08-04T22:55:23.226341Z",
+          "created_at": "2025-09-03T17:36:27.165354Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -2685,7 +2685,7 @@
         "__type__": "ollama._types.GenerateResponse",
         "__data__": {
           "model": "llama3.2:3b-instruct-fp16",
-          "created_at": "2025-08-04T22:55:23.279164Z",
+          "created_at": "2025-09-03T17:36:27.206517Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -2703,7 +2703,7 @@
         "__type__": "ollama._types.GenerateResponse",
         "__data__": {
           "model": "llama3.2:3b-instruct-fp16",
-          "created_at": "2025-08-04T22:55:23.331167Z",
+          "created_at": "2025-09-03T17:36:27.247418Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -2721,7 +2721,7 @@
         "__type__": "ollama._types.GenerateResponse",
         "__data__": {
           "model": "llama3.2:3b-instruct-fp16",
-          "created_at": "2025-08-04T22:55:23.3852Z",
+          "created_at": "2025-09-03T17:36:27.288727Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -2739,7 +2739,7 @@
         "__type__": "ollama._types.GenerateResponse",
         "__data__": {
           "model": "llama3.2:3b-instruct-fp16",
-          "created_at": "2025-08-04T22:55:23.441499Z",
+          "created_at": "2025-09-03T17:36:27.32952Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -2757,7 +2757,7 @@
         "__type__": "ollama._types.GenerateResponse",
         "__data__": {
           "model": "llama3.2:3b-instruct-fp16",
-          "created_at": "2025-08-04T22:55:23.495317Z",
+          "created_at": "2025-09-03T17:36:27.37057Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -2775,7 +2775,7 @@
         "__type__": "ollama._types.GenerateResponse",
         "__data__": {
           "model": "llama3.2:3b-instruct-fp16",
-          "created_at": "2025-08-04T22:55:23.55017Z",
+          "created_at": "2025-09-03T17:36:27.413166Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -2793,7 +2793,7 @@
         "__type__": "ollama._types.GenerateResponse",
         "__data__": {
           "model": "llama3.2:3b-instruct-fp16",
-          "created_at": "2025-08-04T22:55:23.600579Z",
+          "created_at": "2025-09-03T17:36:27.453878Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -2811,7 +2811,7 @@
         "__type__": "ollama._types.GenerateResponse",
         "__data__": {
           "model": "llama3.2:3b-instruct-fp16",
-          "created_at": "2025-08-04T22:55:23.654506Z",
+          "created_at": "2025-09-03T17:36:27.495693Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -2829,7 +2829,7 @@
         "__type__": "ollama._types.GenerateResponse",
         "__data__": {
           "model": "llama3.2:3b-instruct-fp16",
-          "created_at": "2025-08-04T22:55:23.709135Z",
+          "created_at": "2025-09-03T17:36:27.536879Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -2847,7 +2847,7 @@
         "__type__": "ollama._types.GenerateResponse",
         "__data__": {
           "model": "llama3.2:3b-instruct-fp16",
-          "created_at": "2025-08-04T22:55:23.760466Z",
+          "created_at": "2025-09-03T17:36:27.578071Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -2865,7 +2865,7 @@
         "__type__": "ollama._types.GenerateResponse",
         "__data__": {
           "model": "llama3.2:3b-instruct-fp16",
-          "created_at": "2025-08-04T22:55:23.813218Z",
+          "created_at": "2025-09-03T17:36:27.619459Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -2883,7 +2883,7 @@
         "__type__": "ollama._types.GenerateResponse",
         "__data__": {
           "model": "llama3.2:3b-instruct-fp16",
-          "created_at": "2025-08-04T22:55:23.865353Z",
+          "created_at": "2025-09-03T17:36:27.660329Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -2901,7 +2901,7 @@
         "__type__": "ollama._types.GenerateResponse",
         "__data__": {
           "model": "llama3.2:3b-instruct-fp16",
-          "created_at": "2025-08-04T22:55:23.922629Z",
+          "created_at": "2025-09-03T17:36:27.701195Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -2919,7 +2919,7 @@
         "__type__": "ollama._types.GenerateResponse",
         "__data__": {
           "model": "llama3.2:3b-instruct-fp16",
-          "created_at": "2025-08-04T22:55:23.975942Z",
+          "created_at": "2025-09-03T17:36:27.74184Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -2937,7 +2937,7 @@
         "__type__": "ollama._types.GenerateResponse",
         "__data__": {
           "model": "llama3.2:3b-instruct-fp16",
-          "created_at": "2025-08-04T22:55:24.028952Z",
+          "created_at": "2025-09-03T17:36:27.782435Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -2955,7 +2955,7 @@
         "__type__": "ollama._types.GenerateResponse",
         "__data__": {
           "model": "llama3.2:3b-instruct-fp16",
-          "created_at": "2025-08-04T22:55:24.086171Z",
+          "created_at": "2025-09-03T17:36:27.822698Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -2973,7 +2973,7 @@
         "__type__": "ollama._types.GenerateResponse",
         "__data__": {
           "model": "llama3.2:3b-instruct-fp16",
-          "created_at": "2025-08-04T22:55:24.145184Z",
+          "created_at": "2025-09-03T17:36:27.863482Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -2991,7 +2991,7 @@
         "__type__": "ollama._types.GenerateResponse",
         "__data__": {
           "model": "llama3.2:3b-instruct-fp16",
-          "created_at": "2025-08-04T22:55:24.201279Z",
+          "created_at": "2025-09-03T17:36:27.904189Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -3009,7 +3009,7 @@
         "__type__": "ollama._types.GenerateResponse",
         "__data__": {
           "model": "llama3.2:3b-instruct-fp16",
-          "created_at": "2025-08-04T22:55:24.255619Z",
+          "created_at": "2025-09-03T17:36:27.944927Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -3027,7 +3027,7 @@
         "__type__": "ollama._types.GenerateResponse",
         "__data__": {
           "model": "llama3.2:3b-instruct-fp16",
-          "created_at": "2025-08-04T22:55:24.311758Z",
+          "created_at": "2025-09-03T17:36:27.985583Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -3045,7 +3045,7 @@
         "__type__": "ollama._types.GenerateResponse",
         "__data__": {
           "model": "llama3.2:3b-instruct-fp16",
-          "created_at": "2025-08-04T22:55:24.369104Z",
+          "created_at": "2025-09-03T17:36:28.026811Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -3063,7 +3063,7 @@
         "__type__": "ollama._types.GenerateResponse",
         "__data__": {
           "model": "llama3.2:3b-instruct-fp16",
-          "created_at": "2025-08-04T22:55:24.423674Z",
+          "created_at": "2025-09-03T17:36:28.067929Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -3081,7 +3081,7 @@
         "__type__": "ollama._types.GenerateResponse",
         "__data__": {
           "model": "llama3.2:3b-instruct-fp16",
-          "created_at": "2025-08-04T22:55:24.47792Z",
+          "created_at": "2025-09-03T17:36:28.108844Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -3099,7 +3099,7 @@
         "__type__": "ollama._types.GenerateResponse",
         "__data__": {
           "model": "llama3.2:3b-instruct-fp16",
-          "created_at": "2025-08-04T22:55:24.531093Z",
+          "created_at": "2025-09-03T17:36:28.149655Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -3117,7 +3117,7 @@
         "__type__": "ollama._types.GenerateResponse",
         "__data__": {
           "model": "llama3.2:3b-instruct-fp16",
-          "created_at": "2025-08-04T22:55:24.582555Z",
+          "created_at": "2025-09-03T17:36:28.190377Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -3135,7 +3135,7 @@
         "__type__": "ollama._types.GenerateResponse",
         "__data__": {
           "model": "llama3.2:3b-instruct-fp16",
-          "created_at": "2025-08-04T22:55:24.63568Z",
+          "created_at": "2025-09-03T17:36:28.230919Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -3153,7 +3153,7 @@
         "__type__": "ollama._types.GenerateResponse",
         "__data__": {
           "model": "llama3.2:3b-instruct-fp16",
-          "created_at": "2025-08-04T22:55:24.689009Z",
+          "created_at": "2025-09-03T17:36:28.271506Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -3171,7 +3171,7 @@
         "__type__": "ollama._types.GenerateResponse",
         "__data__": {
           "model": "llama3.2:3b-instruct-fp16",
-          "created_at": "2025-08-04T22:55:24.742834Z",
+          "created_at": "2025-09-03T17:36:28.313533Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -3189,7 +3189,7 @@
         "__type__": "ollama._types.GenerateResponse",
         "__data__": {
           "model": "llama3.2:3b-instruct-fp16",
-          "created_at": "2025-08-04T22:55:24.79443Z",
+          "created_at": "2025-09-03T17:36:28.356508Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -3207,7 +3207,7 @@
         "__type__": "ollama._types.GenerateResponse",
         "__data__": {
           "model": "llama3.2:3b-instruct-fp16",
-          "created_at": "2025-08-04T22:55:24.845937Z",
+          "created_at": "2025-09-03T17:36:28.397379Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -3225,7 +3225,7 @@
         "__type__": "ollama._types.GenerateResponse",
         "__data__": {
           "model": "llama3.2:3b-instruct-fp16",
-          "created_at": "2025-08-04T22:55:24.896501Z",
+          "created_at": "2025-09-03T17:36:28.438016Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -3243,7 +3243,7 @@
         "__type__": "ollama._types.GenerateResponse",
         "__data__": {
           "model": "llama3.2:3b-instruct-fp16",
-          "created_at": "2025-08-04T22:55:24.952958Z",
+          "created_at": "2025-09-03T17:36:28.47858Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -3261,7 +3261,7 @@
         "__type__": "ollama._types.GenerateResponse",
         "__data__": {
           "model": "llama3.2:3b-instruct-fp16",
-          "created_at": "2025-08-04T22:55:25.009085Z",
+          "created_at": "2025-09-03T17:36:28.519407Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -3279,7 +3279,7 @@
         "__type__": "ollama._types.GenerateResponse",
         "__data__": {
           "model": "llama3.2:3b-instruct-fp16",
-          "created_at": "2025-08-04T22:55:25.067495Z",
+          "created_at": "2025-09-03T17:36:28.560412Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -3297,7 +3297,7 @@
         "__type__": "ollama._types.GenerateResponse",
         "__data__": {
           "model": "llama3.2:3b-instruct-fp16",
-          "created_at": "2025-08-04T22:55:25.121739Z",
+          "created_at": "2025-09-03T17:36:28.601727Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -3315,7 +3315,7 @@
         "__type__": "ollama._types.GenerateResponse",
         "__data__": {
           "model": "llama3.2:3b-instruct-fp16",
-          "created_at": "2025-08-04T22:55:25.172013Z",
+          "created_at": "2025-09-03T17:36:28.64332Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -3333,7 +3333,7 @@
         "__type__": "ollama._types.GenerateResponse",
         "__data__": {
           "model": "llama3.2:3b-instruct-fp16",
-          "created_at": "2025-08-04T22:55:25.222982Z",
+          "created_at": "2025-09-03T17:36:28.683692Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -3351,7 +3351,7 @@
         "__type__": "ollama._types.GenerateResponse",
         "__data__": {
           "model": "llama3.2:3b-instruct-fp16",
-          "created_at": "2025-08-04T22:55:25.274019Z",
+          "created_at": "2025-09-03T17:36:28.724325Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -3369,7 +3369,7 @@
         "__type__": "ollama._types.GenerateResponse",
         "__data__": {
           "model": "llama3.2:3b-instruct-fp16",
-          "created_at": "2025-08-04T22:55:25.324668Z",
+          "created_at": "2025-09-03T17:36:28.764731Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -3387,7 +3387,7 @@
         "__type__": "ollama._types.GenerateResponse",
         "__data__": {
           "model": "llama3.2:3b-instruct-fp16",
-          "created_at": "2025-08-04T22:55:25.377987Z",
+          "created_at": "2025-09-03T17:36:28.805214Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -3405,7 +3405,7 @@
         "__type__": "ollama._types.GenerateResponse",
         "__data__": {
           "model": "llama3.2:3b-instruct-fp16",
-          "created_at": "2025-08-04T22:55:25.429358Z",
+          "created_at": "2025-09-03T17:36:28.845962Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -3423,7 +3423,7 @@
         "__type__": "ollama._types.GenerateResponse",
         "__data__": {
           "model": "llama3.2:3b-instruct-fp16",
-          "created_at": "2025-08-04T22:55:25.481004Z",
+          "created_at": "2025-09-03T17:36:28.886874Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -3441,7 +3441,7 @@
         "__type__": "ollama._types.GenerateResponse",
         "__data__": {
           "model": "llama3.2:3b-instruct-fp16",
-          "created_at": "2025-08-04T22:55:25.534764Z",
+          "created_at": "2025-09-03T17:36:28.927442Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -3459,7 +3459,7 @@
         "__type__": "ollama._types.GenerateResponse",
         "__data__": {
           "model": "llama3.2:3b-instruct-fp16",
-          "created_at": "2025-08-04T22:55:25.587324Z",
+          "created_at": "2025-09-03T17:36:28.967837Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -3477,7 +3477,7 @@
         "__type__": "ollama._types.GenerateResponse",
         "__data__": {
           "model": "llama3.2:3b-instruct-fp16",
-          "created_at": "2025-08-04T22:55:25.639379Z",
+          "created_at": "2025-09-03T17:36:29.008786Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -3495,7 +3495,7 @@
         "__type__": "ollama._types.GenerateResponse",
         "__data__": {
           "model": "llama3.2:3b-instruct-fp16",
-          "created_at": "2025-08-04T22:55:25.692618Z",
+          "created_at": "2025-09-03T17:36:29.049817Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -3513,7 +3513,7 @@
         "__type__": "ollama._types.GenerateResponse",
         "__data__": {
           "model": "llama3.2:3b-instruct-fp16",
-          "created_at": "2025-08-04T22:55:25.74473Z",
+          "created_at": "2025-09-03T17:36:29.090455Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -3531,7 +3531,7 @@
         "__type__": "ollama._types.GenerateResponse",
         "__data__": {
           "model": "llama3.2:3b-instruct-fp16",
-          "created_at": "2025-08-04T22:55:25.803002Z",
+          "created_at": "2025-09-03T17:36:29.131723Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -3549,7 +3549,7 @@
         "__type__": "ollama._types.GenerateResponse",
         "__data__": {
           "model": "llama3.2:3b-instruct-fp16",
-          "created_at": "2025-08-04T22:55:25.858781Z",
+          "created_at": "2025-09-03T17:36:29.172582Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -3567,7 +3567,7 @@
         "__type__": "ollama._types.GenerateResponse",
         "__data__": {
           "model": "llama3.2:3b-instruct-fp16",
-          "created_at": "2025-08-04T22:55:25.916114Z",
+          "created_at": "2025-09-03T17:36:29.214861Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -3585,7 +3585,7 @@
         "__type__": "ollama._types.GenerateResponse",
         "__data__": {
           "model": "llama3.2:3b-instruct-fp16",
-          "created_at": "2025-08-04T22:55:25.968791Z",
+          "created_at": "2025-09-03T17:36:29.256056Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -3603,7 +3603,7 @@
         "__type__": "ollama._types.GenerateResponse",
         "__data__": {
           "model": "llama3.2:3b-instruct-fp16",
-          "created_at": "2025-08-04T22:55:26.023195Z",
+          "created_at": "2025-09-03T17:36:29.296825Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -3621,7 +3621,7 @@
         "__type__": "ollama._types.GenerateResponse",
         "__data__": {
           "model": "llama3.2:3b-instruct-fp16",
-          "created_at": "2025-08-04T22:55:26.076958Z",
+          "created_at": "2025-09-03T17:36:29.337822Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -3639,7 +3639,7 @@
         "__type__": "ollama._types.GenerateResponse",
         "__data__": {
           "model": "llama3.2:3b-instruct-fp16",
-          "created_at": "2025-08-04T22:55:26.128711Z",
+          "created_at": "2025-09-03T17:36:29.378894Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -3657,7 +3657,7 @@
         "__type__": "ollama._types.GenerateResponse",
         "__data__": {
           "model": "llama3.2:3b-instruct-fp16",
-          "created_at": "2025-08-04T22:55:26.187987Z",
+          "created_at": "2025-09-03T17:36:29.419586Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -3675,7 +3675,7 @@
         "__type__": "ollama._types.GenerateResponse",
         "__data__": {
           "model": "llama3.2:3b-instruct-fp16",
-          "created_at": "2025-08-04T22:55:26.241555Z",
+          "created_at": "2025-09-03T17:36:29.459743Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -3693,7 +3693,7 @@
         "__type__": "ollama._types.GenerateResponse",
         "__data__": {
           "model": "llama3.2:3b-instruct-fp16",
-          "created_at": "2025-08-04T22:55:26.292588Z",
+          "created_at": "2025-09-03T17:36:29.500928Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -3711,7 +3711,7 @@
         "__type__": "ollama._types.GenerateResponse",
         "__data__": {
           "model": "llama3.2:3b-instruct-fp16",
-          "created_at": "2025-08-04T22:55:26.345649Z",
+          "created_at": "2025-09-03T17:36:29.541823Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -3729,7 +3729,7 @@
         "__type__": "ollama._types.GenerateResponse",
         "__data__": {
           "model": "llama3.2:3b-instruct-fp16",
-          "created_at": "2025-08-04T22:55:26.39865Z",
+          "created_at": "2025-09-03T17:36:29.583225Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -3747,7 +3747,7 @@
         "__type__": "ollama._types.GenerateResponse",
         "__data__": {
           "model": "llama3.2:3b-instruct-fp16",
-          "created_at": "2025-08-04T22:55:26.44719Z",
+          "created_at": "2025-09-03T17:36:29.62471Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -3765,7 +3765,7 @@
         "__type__": "ollama._types.GenerateResponse",
         "__data__": {
           "model": "llama3.2:3b-instruct-fp16",
-          "created_at": "2025-08-04T22:55:26.499784Z",
+          "created_at": "2025-09-03T17:36:29.665624Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -3783,7 +3783,7 @@
         "__type__": "ollama._types.GenerateResponse",
         "__data__": {
           "model": "llama3.2:3b-instruct-fp16",
-          "created_at": "2025-08-04T22:55:26.552673Z",
+          "created_at": "2025-09-03T17:36:29.706601Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -3801,7 +3801,7 @@
         "__type__": "ollama._types.GenerateResponse",
         "__data__": {
           "model": "llama3.2:3b-instruct-fp16",
-          "created_at": "2025-08-04T22:55:26.60472Z",
+          "created_at": "2025-09-03T17:36:29.747221Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -3819,7 +3819,7 @@
         "__type__": "ollama._types.GenerateResponse",
         "__data__": {
           "model": "llama3.2:3b-instruct-fp16",
-          "created_at": "2025-08-04T22:55:26.656364Z",
+          "created_at": "2025-09-03T17:36:29.787753Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -3837,7 +3837,7 @@
         "__type__": "ollama._types.GenerateResponse",
         "__data__": {
           "model": "llama3.2:3b-instruct-fp16",
-          "created_at": "2025-08-04T22:55:26.710318Z",
+          "created_at": "2025-09-03T17:36:29.828297Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -3855,7 +3855,7 @@
         "__type__": "ollama._types.GenerateResponse",
         "__data__": {
           "model": "llama3.2:3b-instruct-fp16",
-          "created_at": "2025-08-04T22:55:26.763384Z",
+          "created_at": "2025-09-03T17:36:29.86906Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -3873,7 +3873,7 @@
         "__type__": "ollama._types.GenerateResponse",
         "__data__": {
           "model": "llama3.2:3b-instruct-fp16",
-          "created_at": "2025-08-04T22:55:26.813607Z",
+          "created_at": "2025-09-03T17:36:29.909608Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -3891,7 +3891,7 @@
         "__type__": "ollama._types.GenerateResponse",
         "__data__": {
           "model": "llama3.2:3b-instruct-fp16",
-          "created_at": "2025-08-04T22:55:26.866943Z",
+          "created_at": "2025-09-03T17:36:29.950119Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -3909,7 +3909,7 @@
         "__type__": "ollama._types.GenerateResponse",
         "__data__": {
           "model": "llama3.2:3b-instruct-fp16",
-          "created_at": "2025-08-04T22:55:26.918563Z",
+          "created_at": "2025-09-03T17:36:29.990856Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -3927,7 +3927,7 @@
         "__type__": "ollama._types.GenerateResponse",
         "__data__": {
           "model": "llama3.2:3b-instruct-fp16",
-          "created_at": "2025-08-04T22:55:26.969428Z",
+          "created_at": "2025-09-03T17:36:30.031737Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -3945,7 +3945,7 @@
         "__type__": "ollama._types.GenerateResponse",
         "__data__": {
           "model": "llama3.2:3b-instruct-fp16",
-          "created_at": "2025-08-04T22:55:27.023314Z",
+          "created_at": "2025-09-03T17:36:30.072804Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -3963,7 +3963,7 @@
         "__type__": "ollama._types.GenerateResponse",
         "__data__": {
           "model": "llama3.2:3b-instruct-fp16",
-          "created_at": "2025-08-04T22:55:27.075325Z",
+          "created_at": "2025-09-03T17:36:30.115879Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -3981,7 +3981,7 @@
         "__type__": "ollama._types.GenerateResponse",
         "__data__": {
           "model": "llama3.2:3b-instruct-fp16",
-          "created_at": "2025-08-04T22:55:27.128289Z",
+          "created_at": "2025-09-03T17:36:30.157268Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -3999,7 +3999,7 @@
         "__type__": "ollama._types.GenerateResponse",
         "__data__": {
           "model": "llama3.2:3b-instruct-fp16",
-          "created_at": "2025-08-04T22:55:27.190218Z",
+          "created_at": "2025-09-03T17:36:30.198026Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -4017,7 +4017,7 @@
         "__type__": "ollama._types.GenerateResponse",
         "__data__": {
           "model": "llama3.2:3b-instruct-fp16",
-          "created_at": "2025-08-04T22:55:27.246086Z",
+          "created_at": "2025-09-03T17:36:30.238729Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -4035,7 +4035,7 @@
         "__type__": "ollama._types.GenerateResponse",
         "__data__": {
           "model": "llama3.2:3b-instruct-fp16",
-          "created_at": "2025-08-04T22:55:27.306117Z",
+          "created_at": "2025-09-03T17:36:30.279348Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -4053,7 +4053,7 @@
         "__type__": "ollama._types.GenerateResponse",
         "__data__": {
           "model": "llama3.2:3b-instruct-fp16",
-          "created_at": "2025-08-04T22:55:27.359915Z",
+          "created_at": "2025-09-03T17:36:30.31988Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -4071,7 +4071,7 @@
         "__type__": "ollama._types.GenerateResponse",
         "__data__": {
           "model": "llama3.2:3b-instruct-fp16",
-          "created_at": "2025-08-04T22:55:27.419018Z",
+          "created_at": "2025-09-03T17:36:30.360471Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -4089,7 +4089,7 @@
         "__type__": "ollama._types.GenerateResponse",
         "__data__": {
           "model": "llama3.2:3b-instruct-fp16",
-          "created_at": "2025-08-04T22:55:27.476634Z",
+          "created_at": "2025-09-03T17:36:30.401158Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -4107,7 +4107,7 @@
         "__type__": "ollama._types.GenerateResponse",
         "__data__": {
           "model": "llama3.2:3b-instruct-fp16",
-          "created_at": "2025-08-04T22:55:27.535904Z",
+          "created_at": "2025-09-03T17:36:30.441986Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -4125,7 +4125,7 @@
         "__type__": "ollama._types.GenerateResponse",
         "__data__": {
           "model": "llama3.2:3b-instruct-fp16",
-          "created_at": "2025-08-04T22:55:27.588323Z",
+          "created_at": "2025-09-03T17:36:30.482303Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -4143,7 +4143,7 @@
         "__type__": "ollama._types.GenerateResponse",
         "__data__": {
           "model": "llama3.2:3b-instruct-fp16",
-          "created_at": "2025-08-04T22:55:27.641718Z",
+          "created_at": "2025-09-03T17:36:30.523844Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -4161,7 +4161,7 @@
         "__type__": "ollama._types.GenerateResponse",
         "__data__": {
           "model": "llama3.2:3b-instruct-fp16",
-          "created_at": "2025-08-04T22:55:27.699892Z",
+          "created_at": "2025-09-03T17:36:30.564853Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -4179,7 +4179,7 @@
         "__type__": "ollama._types.GenerateResponse",
         "__data__": {
           "model": "llama3.2:3b-instruct-fp16",
-          "created_at": "2025-08-04T22:55:27.754283Z",
+          "created_at": "2025-09-03T17:36:30.605812Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -4197,7 +4197,7 @@
         "__type__": "ollama._types.GenerateResponse",
         "__data__": {
           "model": "llama3.2:3b-instruct-fp16",
-          "created_at": "2025-08-04T22:55:27.806748Z",
+          "created_at": "2025-09-03T17:36:30.646752Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -4215,7 +4215,7 @@
         "__type__": "ollama._types.GenerateResponse",
         "__data__": {
           "model": "llama3.2:3b-instruct-fp16",
-          "created_at": "2025-08-04T22:55:27.859134Z",
+          "created_at": "2025-09-03T17:36:30.68766Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -4233,7 +4233,7 @@
         "__type__": "ollama._types.GenerateResponse",
         "__data__": {
           "model": "llama3.2:3b-instruct-fp16",
-          "created_at": "2025-08-04T22:55:27.911671Z",
+          "created_at": "2025-09-03T17:36:30.728603Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -4251,7 +4251,7 @@
         "__type__": "ollama._types.GenerateResponse",
         "__data__": {
           "model": "llama3.2:3b-instruct-fp16",
-          "created_at": "2025-08-04T22:55:27.964185Z",
+          "created_at": "2025-09-03T17:36:30.769336Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -4269,7 +4269,7 @@
         "__type__": "ollama._types.GenerateResponse",
         "__data__": {
           "model": "llama3.2:3b-instruct-fp16",
-          "created_at": "2025-08-04T22:55:28.021644Z",
+          "created_at": "2025-09-03T17:36:30.80994Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -4287,7 +4287,7 @@
         "__type__": "ollama._types.GenerateResponse",
         "__data__": {
           "model": "llama3.2:3b-instruct-fp16",
-          "created_at": "2025-08-04T22:55:28.082519Z",
+          "created_at": "2025-09-03T17:36:30.850918Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -4305,7 +4305,7 @@
         "__type__": "ollama._types.GenerateResponse",
         "__data__": {
           "model": "llama3.2:3b-instruct-fp16",
-          "created_at": "2025-08-04T22:55:28.14397Z",
+          "created_at": "2025-09-03T17:36:30.89149Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -4323,7 +4323,7 @@
         "__type__": "ollama._types.GenerateResponse",
         "__data__": {
           "model": "llama3.2:3b-instruct-fp16",
-          "created_at": "2025-08-04T22:55:28.205905Z",
+          "created_at": "2025-09-03T17:36:30.932133Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -4341,7 +4341,7 @@
         "__type__": "ollama._types.GenerateResponse",
         "__data__": {
           "model": "llama3.2:3b-instruct-fp16",
-          "created_at": "2025-08-04T22:55:28.263955Z",
+          "created_at": "2025-09-03T17:36:30.97327Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -4359,7 +4359,7 @@
         "__type__": "ollama._types.GenerateResponse",
         "__data__": {
           "model": "llama3.2:3b-instruct-fp16",
-          "created_at": "2025-08-04T22:55:28.320542Z",
+          "created_at": "2025-09-03T17:36:31.016238Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -4377,7 +4377,7 @@
         "__type__": "ollama._types.GenerateResponse",
         "__data__": {
           "model": "llama3.2:3b-instruct-fp16",
-          "created_at": "2025-08-04T22:55:28.374084Z",
+          "created_at": "2025-09-03T17:36:31.057488Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -4395,7 +4395,7 @@
         "__type__": "ollama._types.GenerateResponse",
         "__data__": {
           "model": "llama3.2:3b-instruct-fp16",
-          "created_at": "2025-08-04T22:55:28.427518Z",
+          "created_at": "2025-09-03T17:36:31.097989Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -4413,7 +4413,7 @@
         "__type__": "ollama._types.GenerateResponse",
         "__data__": {
           "model": "llama3.2:3b-instruct-fp16",
-          "created_at": "2025-08-04T22:55:28.479545Z",
+          "created_at": "2025-09-03T17:36:31.13892Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -4431,7 +4431,7 @@
         "__type__": "ollama._types.GenerateResponse",
         "__data__": {
           "model": "llama3.2:3b-instruct-fp16",
-          "created_at": "2025-08-04T22:55:28.531416Z",
+          "created_at": "2025-09-03T17:36:31.179559Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -4449,7 +4449,7 @@
         "__type__": "ollama._types.GenerateResponse",
         "__data__": {
           "model": "llama3.2:3b-instruct-fp16",
-          "created_at": "2025-08-04T22:55:28.58181Z",
+          "created_at": "2025-09-03T17:36:31.220282Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -4467,7 +4467,7 @@
         "__type__": "ollama._types.GenerateResponse",
         "__data__": {
           "model": "llama3.2:3b-instruct-fp16",
-          "created_at": "2025-08-04T22:55:28.632489Z",
+          "created_at": "2025-09-03T17:36:31.260847Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -4485,7 +4485,7 @@
         "__type__": "ollama._types.GenerateResponse",
         "__data__": {
           "model": "llama3.2:3b-instruct-fp16",
-          "created_at": "2025-08-04T22:55:28.684096Z",
+          "created_at": "2025-09-03T17:36:31.301689Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -4503,7 +4503,7 @@
         "__type__": "ollama._types.GenerateResponse",
         "__data__": {
           "model": "llama3.2:3b-instruct-fp16",
-          "created_at": "2025-08-04T22:55:28.737131Z",
+          "created_at": "2025-09-03T17:36:31.342413Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -4521,7 +4521,7 @@
         "__type__": "ollama._types.GenerateResponse",
         "__data__": {
           "model": "llama3.2:3b-instruct-fp16",
-          "created_at": "2025-08-04T22:55:28.789945Z",
+          "created_at": "2025-09-03T17:36:31.383094Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -4539,7 +4539,7 @@
         "__type__": "ollama._types.GenerateResponse",
         "__data__": {
           "model": "llama3.2:3b-instruct-fp16",
-          "created_at": "2025-08-04T22:55:28.842126Z",
+          "created_at": "2025-09-03T17:36:31.424087Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -4557,7 +4557,7 @@
         "__type__": "ollama._types.GenerateResponse",
         "__data__": {
           "model": "llama3.2:3b-instruct-fp16",
-          "created_at": "2025-08-04T22:55:28.895142Z",
+          "created_at": "2025-09-03T17:36:31.465298Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -4575,7 +4575,7 @@
         "__type__": "ollama._types.GenerateResponse",
         "__data__": {
           "model": "llama3.2:3b-instruct-fp16",
-          "created_at": "2025-08-04T22:55:28.947434Z",
+          "created_at": "2025-09-03T17:36:31.506962Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -4593,7 +4593,7 @@
         "__type__": "ollama._types.GenerateResponse",
         "__data__": {
           "model": "llama3.2:3b-instruct-fp16",
-          "created_at": "2025-08-04T22:55:29.003682Z",
+          "created_at": "2025-09-03T17:36:31.548213Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -4611,7 +4611,7 @@
         "__type__": "ollama._types.GenerateResponse",
         "__data__": {
           "model": "llama3.2:3b-instruct-fp16",
-          "created_at": "2025-08-04T22:55:29.056399Z",
+          "created_at": "2025-09-03T17:36:31.589913Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -4629,7 +4629,7 @@
         "__type__": "ollama._types.GenerateResponse",
         "__data__": {
           "model": "llama3.2:3b-instruct-fp16",
-          "created_at": "2025-08-04T22:55:29.109724Z",
+          "created_at": "2025-09-03T17:36:31.630948Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -4647,7 +4647,7 @@
         "__type__": "ollama._types.GenerateResponse",
         "__data__": {
           "model": "llama3.2:3b-instruct-fp16",
-          "created_at": "2025-08-04T22:55:29.163194Z",
+          "created_at": "2025-09-03T17:36:31.672087Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -4665,7 +4665,7 @@
         "__type__": "ollama._types.GenerateResponse",
         "__data__": {
           "model": "llama3.2:3b-instruct-fp16",
-          "created_at": "2025-08-04T22:55:29.217213Z",
+          "created_at": "2025-09-03T17:36:31.713337Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -4683,7 +4683,7 @@
         "__type__": "ollama._types.GenerateResponse",
         "__data__": {
           "model": "llama3.2:3b-instruct-fp16",
-          "created_at": "2025-08-04T22:55:29.269168Z",
+          "created_at": "2025-09-03T17:36:31.754423Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -4701,7 +4701,7 @@
         "__type__": "ollama._types.GenerateResponse",
         "__data__": {
           "model": "llama3.2:3b-instruct-fp16",
-          "created_at": "2025-08-04T22:55:29.321308Z",
+          "created_at": "2025-09-03T17:36:31.795742Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -4719,7 +4719,7 @@
         "__type__": "ollama._types.GenerateResponse",
         "__data__": {
           "model": "llama3.2:3b-instruct-fp16",
-          "created_at": "2025-08-04T22:55:29.374321Z",
+          "created_at": "2025-09-03T17:36:31.836637Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -4737,7 +4737,7 @@
         "__type__": "ollama._types.GenerateResponse",
         "__data__": {
           "model": "llama3.2:3b-instruct-fp16",
-          "created_at": "2025-08-04T22:55:29.427106Z",
+          "created_at": "2025-09-03T17:36:31.878115Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -4755,7 +4755,7 @@
         "__type__": "ollama._types.GenerateResponse",
         "__data__": {
           "model": "llama3.2:3b-instruct-fp16",
-          "created_at": "2025-08-04T22:55:29.479022Z",
+          "created_at": "2025-09-03T17:36:31.919569Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -4773,7 +4773,7 @@
         "__type__": "ollama._types.GenerateResponse",
         "__data__": {
           "model": "llama3.2:3b-instruct-fp16",
-          "created_at": "2025-08-04T22:55:29.536933Z",
+          "created_at": "2025-09-03T17:36:31.960615Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -4791,7 +4791,7 @@
         "__type__": "ollama._types.GenerateResponse",
         "__data__": {
           "model": "llama3.2:3b-instruct-fp16",
-          "created_at": "2025-08-04T22:55:29.589411Z",
+          "created_at": "2025-09-03T17:36:32.001695Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -4809,7 +4809,7 @@
         "__type__": "ollama._types.GenerateResponse",
         "__data__": {
           "model": "llama3.2:3b-instruct-fp16",
-          "created_at": "2025-08-04T22:55:29.641976Z",
+          "created_at": "2025-09-03T17:36:32.042291Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -4827,7 +4827,7 @@
         "__type__": "ollama._types.GenerateResponse",
         "__data__": {
           "model": "llama3.2:3b-instruct-fp16",
-          "created_at": "2025-08-04T22:55:29.693984Z",
+          "created_at": "2025-09-03T17:36:32.082564Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -4845,7 +4845,7 @@
         "__type__": "ollama._types.GenerateResponse",
         "__data__": {
           "model": "llama3.2:3b-instruct-fp16",
-          "created_at": "2025-08-04T22:55:29.746091Z",
+          "created_at": "2025-09-03T17:36:32.123962Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -4863,7 +4863,7 @@
         "__type__": "ollama._types.GenerateResponse",
         "__data__": {
           "model": "llama3.2:3b-instruct-fp16",
-          "created_at": "2025-08-04T22:55:29.79699Z",
+          "created_at": "2025-09-03T17:36:32.164847Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -4881,7 +4881,7 @@
         "__type__": "ollama._types.GenerateResponse",
         "__data__": {
           "model": "llama3.2:3b-instruct-fp16",
-          "created_at": "2025-08-04T22:55:29.849326Z",
+          "created_at": "2025-09-03T17:36:32.205607Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -4899,7 +4899,7 @@
         "__type__": "ollama._types.GenerateResponse",
         "__data__": {
           "model": "llama3.2:3b-instruct-fp16",
-          "created_at": "2025-08-04T22:55:29.90127Z",
+          "created_at": "2025-09-03T17:36:32.246372Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -4917,7 +4917,7 @@
         "__type__": "ollama._types.GenerateResponse",
         "__data__": {
           "model": "llama3.2:3b-instruct-fp16",
-          "created_at": "2025-08-04T22:55:29.953331Z",
+          "created_at": "2025-09-03T17:36:32.287091Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -4935,7 +4935,7 @@
         "__type__": "ollama._types.GenerateResponse",
         "__data__": {
           "model": "llama3.2:3b-instruct-fp16",
-          "created_at": "2025-08-04T22:55:30.006229Z",
+          "created_at": "2025-09-03T17:36:32.32769Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -4953,7 +4953,7 @@
         "__type__": "ollama._types.GenerateResponse",
         "__data__": {
           "model": "llama3.2:3b-instruct-fp16",
-          "created_at": "2025-08-04T22:55:30.057576Z",
+          "created_at": "2025-09-03T17:36:32.368571Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -4971,7 +4971,7 @@
         "__type__": "ollama._types.GenerateResponse",
         "__data__": {
           "model": "llama3.2:3b-instruct-fp16",
-          "created_at": "2025-08-04T22:55:30.108201Z",
+          "created_at": "2025-09-03T17:36:32.409389Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -4989,7 +4989,7 @@
         "__type__": "ollama._types.GenerateResponse",
         "__data__": {
           "model": "llama3.2:3b-instruct-fp16",
-          "created_at": "2025-08-04T22:55:30.159044Z",
+          "created_at": "2025-09-03T17:36:32.450109Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -5007,7 +5007,7 @@
         "__type__": "ollama._types.GenerateResponse",
         "__data__": {
           "model": "llama3.2:3b-instruct-fp16",
-          "created_at": "2025-08-04T22:55:30.211179Z",
+          "created_at": "2025-09-03T17:36:32.491077Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -5025,7 +5025,7 @@
         "__type__": "ollama._types.GenerateResponse",
         "__data__": {
           "model": "llama3.2:3b-instruct-fp16",
-          "created_at": "2025-08-04T22:55:30.26223Z",
+          "created_at": "2025-09-03T17:36:32.532737Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -5043,7 +5043,7 @@
         "__type__": "ollama._types.GenerateResponse",
         "__data__": {
           "model": "llama3.2:3b-instruct-fp16",
-          "created_at": "2025-08-04T22:55:30.314187Z",
+          "created_at": "2025-09-03T17:36:32.572701Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -5061,7 +5061,7 @@
         "__type__": "ollama._types.GenerateResponse",
         "__data__": {
           "model": "llama3.2:3b-instruct-fp16",
-          "created_at": "2025-08-04T22:55:30.368683Z",
+          "created_at": "2025-09-03T17:36:32.614093Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -5079,7 +5079,7 @@
         "__type__": "ollama._types.GenerateResponse",
         "__data__": {
           "model": "llama3.2:3b-instruct-fp16",
-          "created_at": "2025-08-04T22:55:30.423991Z",
+          "created_at": "2025-09-03T17:36:32.655113Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -5097,7 +5097,7 @@
         "__type__": "ollama._types.GenerateResponse",
         "__data__": {
           "model": "llama3.2:3b-instruct-fp16",
-          "created_at": "2025-08-04T22:55:30.475926Z",
+          "created_at": "2025-09-03T17:36:32.696438Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -5115,7 +5115,7 @@
         "__type__": "ollama._types.GenerateResponse",
         "__data__": {
           "model": "llama3.2:3b-instruct-fp16",
-          "created_at": "2025-08-04T22:55:30.535785Z",
+          "created_at": "2025-09-03T17:36:32.73788Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -5133,7 +5133,7 @@
         "__type__": "ollama._types.GenerateResponse",
         "__data__": {
           "model": "llama3.2:3b-instruct-fp16",
-          "created_at": "2025-08-04T22:55:30.591719Z",
+          "created_at": "2025-09-03T17:36:32.780775Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -5151,7 +5151,7 @@
         "__type__": "ollama._types.GenerateResponse",
         "__data__": {
           "model": "llama3.2:3b-instruct-fp16",
-          "created_at": "2025-08-04T22:55:30.645659Z",
+          "created_at": "2025-09-03T17:36:32.823196Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -5169,7 +5169,7 @@
         "__type__": "ollama._types.GenerateResponse",
         "__data__": {
           "model": "llama3.2:3b-instruct-fp16",
-          "created_at": "2025-08-04T22:55:30.698314Z",
+          "created_at": "2025-09-03T17:36:32.86428Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -5187,7 +5187,7 @@
         "__type__": "ollama._types.GenerateResponse",
         "__data__": {
           "model": "llama3.2:3b-instruct-fp16",
-          "created_at": "2025-08-04T22:55:30.747479Z",
+          "created_at": "2025-09-03T17:36:32.905305Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -5205,7 +5205,7 @@
         "__type__": "ollama._types.GenerateResponse",
         "__data__": {
           "model": "llama3.2:3b-instruct-fp16",
-          "created_at": "2025-08-04T22:55:30.799751Z",
+          "created_at": "2025-09-03T17:36:32.946086Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -5223,7 +5223,7 @@
         "__type__": "ollama._types.GenerateResponse",
         "__data__": {
           "model": "llama3.2:3b-instruct-fp16",
-          "created_at": "2025-08-04T22:55:30.854603Z",
+          "created_at": "2025-09-03T17:36:32.986849Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -5241,7 +5241,7 @@
         "__type__": "ollama._types.GenerateResponse",
         "__data__": {
           "model": "llama3.2:3b-instruct-fp16",
-          "created_at": "2025-08-04T22:55:30.907564Z",
+          "created_at": "2025-09-03T17:36:33.028251Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -5259,7 +5259,7 @@
         "__type__": "ollama._types.GenerateResponse",
         "__data__": {
           "model": "llama3.2:3b-instruct-fp16",
-          "created_at": "2025-08-04T22:55:30.961713Z",
+          "created_at": "2025-09-03T17:36:33.069225Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -5277,7 +5277,7 @@
         "__type__": "ollama._types.GenerateResponse",
         "__data__": {
           "model": "llama3.2:3b-instruct-fp16",
-          "created_at": "2025-08-04T22:55:31.016244Z",
+          "created_at": "2025-09-03T17:36:33.110717Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -5295,7 +5295,7 @@
         "__type__": "ollama._types.GenerateResponse",
         "__data__": {
           "model": "llama3.2:3b-instruct-fp16",
-          "created_at": "2025-08-04T22:55:31.069635Z",
+          "created_at": "2025-09-03T17:36:33.151703Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -5313,7 +5313,7 @@
         "__type__": "ollama._types.GenerateResponse",
         "__data__": {
           "model": "llama3.2:3b-instruct-fp16",
-          "created_at": "2025-08-04T22:55:31.1225Z",
+          "created_at": "2025-09-03T17:36:33.192643Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -5331,7 +5331,7 @@
         "__type__": "ollama._types.GenerateResponse",
         "__data__": {
           "model": "llama3.2:3b-instruct-fp16",
-          "created_at": "2025-08-04T22:55:31.17487Z",
+          "created_at": "2025-09-03T17:36:33.233604Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -5349,7 +5349,7 @@
         "__type__": "ollama._types.GenerateResponse",
         "__data__": {
           "model": "llama3.2:3b-instruct-fp16",
-          "created_at": "2025-08-04T22:55:31.226231Z",
+          "created_at": "2025-09-03T17:36:33.274665Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -5367,7 +5367,7 @@
         "__type__": "ollama._types.GenerateResponse",
         "__data__": {
           "model": "llama3.2:3b-instruct-fp16",
-          "created_at": "2025-08-04T22:55:31.28044Z",
+          "created_at": "2025-09-03T17:36:33.315311Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -5385,7 +5385,7 @@
         "__type__": "ollama._types.GenerateResponse",
         "__data__": {
           "model": "llama3.2:3b-instruct-fp16",
-          "created_at": "2025-08-04T22:55:31.338834Z",
+          "created_at": "2025-09-03T17:36:33.356272Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -5403,7 +5403,7 @@
         "__type__": "ollama._types.GenerateResponse",
         "__data__": {
           "model": "llama3.2:3b-instruct-fp16",
-          "created_at": "2025-08-04T22:55:31.39313Z",
+          "created_at": "2025-09-03T17:36:33.397164Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -5421,7 +5421,7 @@
         "__type__": "ollama._types.GenerateResponse",
         "__data__": {
           "model": "llama3.2:3b-instruct-fp16",
-          "created_at": "2025-08-04T22:55:31.443815Z",
+          "created_at": "2025-09-03T17:36:33.438163Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -5439,7 +5439,7 @@
         "__type__": "ollama._types.GenerateResponse",
         "__data__": {
           "model": "llama3.2:3b-instruct-fp16",
-          "created_at": "2025-08-04T22:55:31.496638Z",
+          "created_at": "2025-09-03T17:36:33.478995Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -5457,7 +5457,7 @@
         "__type__": "ollama._types.GenerateResponse",
         "__data__": {
           "model": "llama3.2:3b-instruct-fp16",
-          "created_at": "2025-08-04T22:55:31.549024Z",
+          "created_at": "2025-09-03T17:36:33.520178Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -5475,7 +5475,7 @@
         "__type__": "ollama._types.GenerateResponse",
         "__data__": {
           "model": "llama3.2:3b-instruct-fp16",
-          "created_at": "2025-08-04T22:55:31.604983Z",
+          "created_at": "2025-09-03T17:36:33.561169Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -5493,7 +5493,7 @@
         "__type__": "ollama._types.GenerateResponse",
         "__data__": {
           "model": "llama3.2:3b-instruct-fp16",
-          "created_at": "2025-08-04T22:55:31.657366Z",
+          "created_at": "2025-09-03T17:36:33.602614Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -5511,7 +5511,7 @@
         "__type__": "ollama._types.GenerateResponse",
         "__data__": {
           "model": "llama3.2:3b-instruct-fp16",
-          "created_at": "2025-08-04T22:55:31.710345Z",
+          "created_at": "2025-09-03T17:36:33.643517Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -5529,7 +5529,7 @@
         "__type__": "ollama._types.GenerateResponse",
         "__data__": {
           "model": "llama3.2:3b-instruct-fp16",
-          "created_at": "2025-08-04T22:55:31.761482Z",
+          "created_at": "2025-09-03T17:36:33.69501Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -5547,7 +5547,7 @@
         "__type__": "ollama._types.GenerateResponse",
         "__data__": {
           "model": "llama3.2:3b-instruct-fp16",
-          "created_at": "2025-08-04T22:55:31.812505Z",
+          "created_at": "2025-09-03T17:36:33.744642Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -5565,7 +5565,7 @@
         "__type__": "ollama._types.GenerateResponse",
         "__data__": {
           "model": "llama3.2:3b-instruct-fp16",
-          "created_at": "2025-08-04T22:55:31.864427Z",
+          "created_at": "2025-09-03T17:36:33.788023Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -5583,7 +5583,7 @@
         "__type__": "ollama._types.GenerateResponse",
         "__data__": {
           "model": "llama3.2:3b-instruct-fp16",
-          "created_at": "2025-08-04T22:55:31.915242Z",
+          "created_at": "2025-09-03T17:36:33.830123Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -5601,7 +5601,7 @@
         "__type__": "ollama._types.GenerateResponse",
         "__data__": {
           "model": "llama3.2:3b-instruct-fp16",
-          "created_at": "2025-08-04T22:55:31.967322Z",
+          "created_at": "2025-09-03T17:36:33.873234Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -5619,7 +5619,7 @@
         "__type__": "ollama._types.GenerateResponse",
         "__data__": {
           "model": "llama3.2:3b-instruct-fp16",
-          "created_at": "2025-08-04T22:55:32.018589Z",
+          "created_at": "2025-09-03T17:36:33.91574Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -5637,7 +5637,7 @@
         "__type__": "ollama._types.GenerateResponse",
         "__data__": {
           "model": "llama3.2:3b-instruct-fp16",
-          "created_at": "2025-08-04T22:55:32.070624Z",
+          "created_at": "2025-09-03T17:36:33.958165Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -5655,7 +5655,7 @@
         "__type__": "ollama._types.GenerateResponse",
         "__data__": {
           "model": "llama3.2:3b-instruct-fp16",
-          "created_at": "2025-08-04T22:55:32.121703Z",
+          "created_at": "2025-09-03T17:36:34.000544Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -5673,7 +5673,7 @@
         "__type__": "ollama._types.GenerateResponse",
         "__data__": {
           "model": "llama3.2:3b-instruct-fp16",
-          "created_at": "2025-08-04T22:55:32.174718Z",
+          "created_at": "2025-09-03T17:36:34.043824Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -5691,7 +5691,7 @@
         "__type__": "ollama._types.GenerateResponse",
         "__data__": {
           "model": "llama3.2:3b-instruct-fp16",
-          "created_at": "2025-08-04T22:55:32.23641Z",
+          "created_at": "2025-09-03T17:36:34.086339Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -5709,7 +5709,7 @@
         "__type__": "ollama._types.GenerateResponse",
         "__data__": {
           "model": "llama3.2:3b-instruct-fp16",
-          "created_at": "2025-08-04T22:55:32.294487Z",
+          "created_at": "2025-09-03T17:36:34.128863Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -5727,7 +5727,7 @@
         "__type__": "ollama._types.GenerateResponse",
         "__data__": {
           "model": "llama3.2:3b-instruct-fp16",
-          "created_at": "2025-08-04T22:55:32.354809Z",
+          "created_at": "2025-09-03T17:36:34.171675Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -5745,7 +5745,7 @@
         "__type__": "ollama._types.GenerateResponse",
         "__data__": {
           "model": "llama3.2:3b-instruct-fp16",
-          "created_at": "2025-08-04T22:55:32.409827Z",
+          "created_at": "2025-09-03T17:36:34.214025Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -5763,7 +5763,7 @@
         "__type__": "ollama._types.GenerateResponse",
         "__data__": {
           "model": "llama3.2:3b-instruct-fp16",
-          "created_at": "2025-08-04T22:55:32.467898Z",
+          "created_at": "2025-09-03T17:36:34.256135Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -5781,7 +5781,7 @@
         "__type__": "ollama._types.GenerateResponse",
         "__data__": {
           "model": "llama3.2:3b-instruct-fp16",
-          "created_at": "2025-08-04T22:55:32.525406Z",
+          "created_at": "2025-09-03T17:36:34.298571Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -5799,7 +5799,7 @@
         "__type__": "ollama._types.GenerateResponse",
         "__data__": {
           "model": "llama3.2:3b-instruct-fp16",
-          "created_at": "2025-08-04T22:55:32.580356Z",
+          "created_at": "2025-09-03T17:36:34.340742Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -5817,7 +5817,7 @@
         "__type__": "ollama._types.GenerateResponse",
         "__data__": {
           "model": "llama3.2:3b-instruct-fp16",
-          "created_at": "2025-08-04T22:55:32.637738Z",
+          "created_at": "2025-09-03T17:36:34.38192Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -5835,7 +5835,7 @@
         "__type__": "ollama._types.GenerateResponse",
         "__data__": {
           "model": "llama3.2:3b-instruct-fp16",
-          "created_at": "2025-08-04T22:55:32.691339Z",
+          "created_at": "2025-09-03T17:36:34.423807Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -5853,7 +5853,7 @@
         "__type__": "ollama._types.GenerateResponse",
         "__data__": {
           "model": "llama3.2:3b-instruct-fp16",
-          "created_at": "2025-08-04T22:55:32.75193Z",
+          "created_at": "2025-09-03T17:36:34.465059Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -5871,7 +5871,7 @@
         "__type__": "ollama._types.GenerateResponse",
         "__data__": {
           "model": "llama3.2:3b-instruct-fp16",
-          "created_at": "2025-08-04T22:55:32.809022Z",
+          "created_at": "2025-09-03T17:36:34.506527Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -5889,7 +5889,7 @@
         "__type__": "ollama._types.GenerateResponse",
         "__data__": {
           "model": "llama3.2:3b-instruct-fp16",
-          "created_at": "2025-08-04T22:55:32.868509Z",
+          "created_at": "2025-09-03T17:36:34.547797Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -5907,7 +5907,7 @@
         "__type__": "ollama._types.GenerateResponse",
         "__data__": {
           "model": "llama3.2:3b-instruct-fp16",
-          "created_at": "2025-08-04T22:55:32.927239Z",
+          "created_at": "2025-09-03T17:36:34.589189Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -5925,7 +5925,7 @@
         "__type__": "ollama._types.GenerateResponse",
         "__data__": {
           "model": "llama3.2:3b-instruct-fp16",
-          "created_at": "2025-08-04T22:55:32.985536Z",
+          "created_at": "2025-09-03T17:36:34.632479Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -5943,7 +5943,7 @@
         "__type__": "ollama._types.GenerateResponse",
         "__data__": {
           "model": "llama3.2:3b-instruct-fp16",
-          "created_at": "2025-08-04T22:55:33.040875Z",
+          "created_at": "2025-09-03T17:36:34.673914Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -5961,7 +5961,7 @@
         "__type__": "ollama._types.GenerateResponse",
         "__data__": {
           "model": "llama3.2:3b-instruct-fp16",
-          "created_at": "2025-08-04T22:55:33.099492Z",
+          "created_at": "2025-09-03T17:36:34.714561Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -5979,7 +5979,7 @@
         "__type__": "ollama._types.GenerateResponse",
         "__data__": {
           "model": "llama3.2:3b-instruct-fp16",
-          "created_at": "2025-08-04T22:55:33.151102Z",
+          "created_at": "2025-09-03T17:36:34.755794Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -5997,7 +5997,7 @@
         "__type__": "ollama._types.GenerateResponse",
         "__data__": {
           "model": "llama3.2:3b-instruct-fp16",
-          "created_at": "2025-08-04T22:55:33.2036Z",
+          "created_at": "2025-09-03T17:36:34.797365Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -6015,7 +6015,7 @@
         "__type__": "ollama._types.GenerateResponse",
         "__data__": {
           "model": "llama3.2:3b-instruct-fp16",
-          "created_at": "2025-08-04T22:55:33.255217Z",
+          "created_at": "2025-09-03T17:36:34.839305Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -6033,7 +6033,7 @@
         "__type__": "ollama._types.GenerateResponse",
         "__data__": {
           "model": "llama3.2:3b-instruct-fp16",
-          "created_at": "2025-08-04T22:55:33.306726Z",
+          "created_at": "2025-09-03T17:36:34.881479Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -6051,7 +6051,7 @@
         "__type__": "ollama._types.GenerateResponse",
         "__data__": {
           "model": "llama3.2:3b-instruct-fp16",
-          "created_at": "2025-08-04T22:55:33.357871Z",
+          "created_at": "2025-09-03T17:36:34.923518Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -6069,7 +6069,7 @@
         "__type__": "ollama._types.GenerateResponse",
         "__data__": {
           "model": "llama3.2:3b-instruct-fp16",
-          "created_at": "2025-08-04T22:55:33.410678Z",
+          "created_at": "2025-09-03T17:36:34.964593Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -6087,7 +6087,7 @@
         "__type__": "ollama._types.GenerateResponse",
         "__data__": {
           "model": "llama3.2:3b-instruct-fp16",
-          "created_at": "2025-08-04T22:55:33.473848Z",
+          "created_at": "2025-09-03T17:36:35.005594Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -6105,7 +6105,7 @@
         "__type__": "ollama._types.GenerateResponse",
         "__data__": {
           "model": "llama3.2:3b-instruct-fp16",
-          "created_at": "2025-08-04T22:55:33.530364Z",
+          "created_at": "2025-09-03T17:36:35.047897Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -6123,7 +6123,7 @@
         "__type__": "ollama._types.GenerateResponse",
         "__data__": {
           "model": "llama3.2:3b-instruct-fp16",
-          "created_at": "2025-08-04T22:55:33.588387Z",
+          "created_at": "2025-09-03T17:36:35.088945Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -6141,7 +6141,7 @@
         "__type__": "ollama._types.GenerateResponse",
         "__data__": {
           "model": "llama3.2:3b-instruct-fp16",
-          "created_at": "2025-08-04T22:55:33.644848Z",
+          "created_at": "2025-09-03T17:36:35.130496Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -6159,7 +6159,7 @@
         "__type__": "ollama._types.GenerateResponse",
         "__data__": {
           "model": "llama3.2:3b-instruct-fp16",
-          "created_at": "2025-08-04T22:55:33.702142Z",
+          "created_at": "2025-09-03T17:36:35.171697Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -6177,7 +6177,7 @@
         "__type__": "ollama._types.GenerateResponse",
         "__data__": {
           "model": "llama3.2:3b-instruct-fp16",
-          "created_at": "2025-08-04T22:55:33.757078Z",
+          "created_at": "2025-09-03T17:36:35.212785Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -6195,7 +6195,7 @@
         "__type__": "ollama._types.GenerateResponse",
         "__data__": {
           "model": "llama3.2:3b-instruct-fp16",
-          "created_at": "2025-08-04T22:55:33.809287Z",
+          "created_at": "2025-09-03T17:36:35.254Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -6213,7 +6213,7 @@
         "__type__": "ollama._types.GenerateResponse",
         "__data__": {
           "model": "llama3.2:3b-instruct-fp16",
-          "created_at": "2025-08-04T22:55:33.863545Z",
+          "created_at": "2025-09-03T17:36:35.294945Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -6231,7 +6231,7 @@
         "__type__": "ollama._types.GenerateResponse",
         "__data__": {
           "model": "llama3.2:3b-instruct-fp16",
-          "created_at": "2025-08-04T22:55:33.921183Z",
+          "created_at": "2025-09-03T17:36:35.335904Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -6249,7 +6249,7 @@
         "__type__": "ollama._types.GenerateResponse",
         "__data__": {
           "model": "llama3.2:3b-instruct-fp16",
-          "created_at": "2025-08-04T22:55:33.972308Z",
+          "created_at": "2025-09-03T17:36:35.376911Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -6267,7 +6267,7 @@
         "__type__": "ollama._types.GenerateResponse",
         "__data__": {
           "model": "llama3.2:3b-instruct-fp16",
-          "created_at": "2025-08-04T22:55:34.024699Z",
+          "created_at": "2025-09-03T17:36:35.417931Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -6285,7 +6285,7 @@
         "__type__": "ollama._types.GenerateResponse",
         "__data__": {
           "model": "llama3.2:3b-instruct-fp16",
-          "created_at": "2025-08-04T22:55:34.078626Z",
+          "created_at": "2025-09-03T17:36:35.45891Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -6303,7 +6303,7 @@
         "__type__": "ollama._types.GenerateResponse",
         "__data__": {
           "model": "llama3.2:3b-instruct-fp16",
-          "created_at": "2025-08-04T22:55:34.132072Z",
+          "created_at": "2025-09-03T17:36:35.501211Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -6321,7 +6321,7 @@
         "__type__": "ollama._types.GenerateResponse",
         "__data__": {
           "model": "llama3.2:3b-instruct-fp16",
-          "created_at": "2025-08-04T22:55:34.185534Z",
+          "created_at": "2025-09-03T17:36:35.543696Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -6339,7 +6339,7 @@
         "__type__": "ollama._types.GenerateResponse",
         "__data__": {
           "model": "llama3.2:3b-instruct-fp16",
-          "created_at": "2025-08-04T22:55:34.237811Z",
+          "created_at": "2025-09-03T17:36:35.584233Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -6357,7 +6357,7 @@
         "__type__": "ollama._types.GenerateResponse",
         "__data__": {
           "model": "llama3.2:3b-instruct-fp16",
-          "created_at": "2025-08-04T22:55:34.289202Z",
+          "created_at": "2025-09-03T17:36:35.626596Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -6375,7 +6375,7 @@
         "__type__": "ollama._types.GenerateResponse",
         "__data__": {
           "model": "llama3.2:3b-instruct-fp16",
-          "created_at": "2025-08-04T22:55:34.341588Z",
+          "created_at": "2025-09-03T17:36:35.667752Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -6393,7 +6393,7 @@
         "__type__": "ollama._types.GenerateResponse",
         "__data__": {
           "model": "llama3.2:3b-instruct-fp16",
-          "created_at": "2025-08-04T22:55:34.393213Z",
+          "created_at": "2025-09-03T17:36:35.70907Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -6411,7 +6411,7 @@
         "__type__": "ollama._types.GenerateResponse",
         "__data__": {
           "model": "llama3.2:3b-instruct-fp16",
-          "created_at": "2025-08-04T22:55:34.444819Z",
+          "created_at": "2025-09-03T17:36:35.749741Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -6429,7 +6429,7 @@
         "__type__": "ollama._types.GenerateResponse",
         "__data__": {
           "model": "llama3.2:3b-instruct-fp16",
-          "created_at": "2025-08-04T22:55:34.497564Z",
+          "created_at": "2025-09-03T17:36:35.79089Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -6447,7 +6447,7 @@
         "__type__": "ollama._types.GenerateResponse",
         "__data__": {
           "model": "llama3.2:3b-instruct-fp16",
-          "created_at": "2025-08-04T22:55:34.552231Z",
+          "created_at": "2025-09-03T17:36:35.832516Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -6465,7 +6465,7 @@
         "__type__": "ollama._types.GenerateResponse",
         "__data__": {
           "model": "llama3.2:3b-instruct-fp16",
-          "created_at": "2025-08-04T22:55:34.608902Z",
+          "created_at": "2025-09-03T17:36:35.874088Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -6483,7 +6483,7 @@
         "__type__": "ollama._types.GenerateResponse",
         "__data__": {
           "model": "llama3.2:3b-instruct-fp16",
-          "created_at": "2025-08-04T22:55:34.66848Z",
+          "created_at": "2025-09-03T17:36:35.915661Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -6501,7 +6501,7 @@
         "__type__": "ollama._types.GenerateResponse",
         "__data__": {
           "model": "llama3.2:3b-instruct-fp16",
-          "created_at": "2025-08-04T22:55:34.721915Z",
+          "created_at": "2025-09-03T17:36:35.95745Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -6519,7 +6519,7 @@
         "__type__": "ollama._types.GenerateResponse",
         "__data__": {
           "model": "llama3.2:3b-instruct-fp16",
-          "created_at": "2025-08-04T22:55:34.776127Z",
+          "created_at": "2025-09-03T17:36:35.998856Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -6537,7 +6537,7 @@
         "__type__": "ollama._types.GenerateResponse",
         "__data__": {
           "model": "llama3.2:3b-instruct-fp16",
-          "created_at": "2025-08-04T22:55:34.833308Z",
+          "created_at": "2025-09-03T17:36:36.040666Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -6555,7 +6555,7 @@
         "__type__": "ollama._types.GenerateResponse",
         "__data__": {
           "model": "llama3.2:3b-instruct-fp16",
-          "created_at": "2025-08-04T22:55:34.889407Z",
+          "created_at": "2025-09-03T17:36:36.082075Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -6573,7 +6573,7 @@
         "__type__": "ollama._types.GenerateResponse",
         "__data__": {
           "model": "llama3.2:3b-instruct-fp16",
-          "created_at": "2025-08-04T22:55:34.942394Z",
+          "created_at": "2025-09-03T17:36:36.123665Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -6591,7 +6591,7 @@
         "__type__": "ollama._types.GenerateResponse",
         "__data__": {
           "model": "llama3.2:3b-instruct-fp16",
-          "created_at": "2025-08-04T22:55:34.997254Z",
+          "created_at": "2025-09-03T17:36:36.164998Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -6609,7 +6609,7 @@
         "__type__": "ollama._types.GenerateResponse",
         "__data__": {
           "model": "llama3.2:3b-instruct-fp16",
-          "created_at": "2025-08-04T22:55:35.049568Z",
+          "created_at": "2025-09-03T17:36:36.206212Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -6627,7 +6627,7 @@
         "__type__": "ollama._types.GenerateResponse",
         "__data__": {
           "model": "llama3.2:3b-instruct-fp16",
-          "created_at": "2025-08-04T22:55:35.101649Z",
+          "created_at": "2025-09-03T17:36:36.24761Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -6645,7 +6645,7 @@
         "__type__": "ollama._types.GenerateResponse",
         "__data__": {
           "model": "llama3.2:3b-instruct-fp16",
-          "created_at": "2025-08-04T22:55:35.151407Z",
+          "created_at": "2025-09-03T17:36:36.288872Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -6663,7 +6663,7 @@
         "__type__": "ollama._types.GenerateResponse",
         "__data__": {
           "model": "llama3.2:3b-instruct-fp16",
-          "created_at": "2025-08-04T22:55:35.20241Z",
+          "created_at": "2025-09-03T17:36:36.330688Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -6681,7 +6681,7 @@
         "__type__": "ollama._types.GenerateResponse",
         "__data__": {
           "model": "llama3.2:3b-instruct-fp16",
-          "created_at": "2025-08-04T22:55:35.254715Z",
+          "created_at": "2025-09-03T17:36:36.372212Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -6699,7 +6699,7 @@
         "__type__": "ollama._types.GenerateResponse",
         "__data__": {
           "model": "llama3.2:3b-instruct-fp16",
-          "created_at": "2025-08-04T22:55:35.305634Z",
+          "created_at": "2025-09-03T17:36:36.415315Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -6717,7 +6717,7 @@
         "__type__": "ollama._types.GenerateResponse",
         "__data__": {
           "model": "llama3.2:3b-instruct-fp16",
-          "created_at": "2025-08-04T22:55:35.357517Z",
+          "created_at": "2025-09-03T17:36:36.458461Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -6735,7 +6735,7 @@
         "__type__": "ollama._types.GenerateResponse",
         "__data__": {
           "model": "llama3.2:3b-instruct-fp16",
-          "created_at": "2025-08-04T22:55:35.410715Z",
+          "created_at": "2025-09-03T17:36:36.501868Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -6753,7 +6753,7 @@
         "__type__": "ollama._types.GenerateResponse",
         "__data__": {
           "model": "llama3.2:3b-instruct-fp16",
-          "created_at": "2025-08-04T22:55:35.464886Z",
+          "created_at": "2025-09-03T17:36:36.544291Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -6771,7 +6771,7 @@
         "__type__": "ollama._types.GenerateResponse",
         "__data__": {
           "model": "llama3.2:3b-instruct-fp16",
-          "created_at": "2025-08-04T22:55:35.515495Z",
+          "created_at": "2025-09-03T17:36:36.58593Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -6789,7 +6789,7 @@
         "__type__": "ollama._types.GenerateResponse",
         "__data__": {
           "model": "llama3.2:3b-instruct-fp16",
-          "created_at": "2025-08-04T22:55:35.566584Z",
+          "created_at": "2025-09-03T17:36:36.627055Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -6807,7 +6807,7 @@
         "__type__": "ollama._types.GenerateResponse",
         "__data__": {
           "model": "llama3.2:3b-instruct-fp16",
-          "created_at": "2025-08-04T22:55:35.616019Z",
+          "created_at": "2025-09-03T17:36:36.668404Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -6825,7 +6825,7 @@
         "__type__": "ollama._types.GenerateResponse",
         "__data__": {
           "model": "llama3.2:3b-instruct-fp16",
-          "created_at": "2025-08-04T22:55:35.669824Z",
+          "created_at": "2025-09-03T17:36:36.709546Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -6843,7 +6843,7 @@
         "__type__": "ollama._types.GenerateResponse",
         "__data__": {
           "model": "llama3.2:3b-instruct-fp16",
-          "created_at": "2025-08-04T22:55:35.724262Z",
+          "created_at": "2025-09-03T17:36:36.750533Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -6861,7 +6861,7 @@
         "__type__": "ollama._types.GenerateResponse",
         "__data__": {
           "model": "llama3.2:3b-instruct-fp16",
-          "created_at": "2025-08-04T22:55:35.779373Z",
+          "created_at": "2025-09-03T17:36:36.792039Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -6879,7 +6879,7 @@
         "__type__": "ollama._types.GenerateResponse",
         "__data__": {
           "model": "llama3.2:3b-instruct-fp16",
-          "created_at": "2025-08-04T22:55:35.834386Z",
+          "created_at": "2025-09-03T17:36:36.833512Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -6897,7 +6897,7 @@
         "__type__": "ollama._types.GenerateResponse",
         "__data__": {
           "model": "llama3.2:3b-instruct-fp16",
-          "created_at": "2025-08-04T22:55:35.887658Z",
+          "created_at": "2025-09-03T17:36:36.875114Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -6915,7 +6915,7 @@
         "__type__": "ollama._types.GenerateResponse",
         "__data__": {
           "model": "llama3.2:3b-instruct-fp16",
-          "created_at": "2025-08-04T22:55:35.940042Z",
+          "created_at": "2025-09-03T17:36:36.916425Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -6933,7 +6933,7 @@
         "__type__": "ollama._types.GenerateResponse",
         "__data__": {
           "model": "llama3.2:3b-instruct-fp16",
-          "created_at": "2025-08-04T22:55:35.996154Z",
+          "created_at": "2025-09-03T17:36:36.959229Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -6951,7 +6951,7 @@
         "__type__": "ollama._types.GenerateResponse",
         "__data__": {
           "model": "llama3.2:3b-instruct-fp16",
-          "created_at": "2025-08-04T22:55:36.054767Z",
+          "created_at": "2025-09-03T17:36:37.000732Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -6969,7 +6969,7 @@
         "__type__": "ollama._types.GenerateResponse",
         "__data__": {
           "model": "llama3.2:3b-instruct-fp16",
-          "created_at": "2025-08-04T22:55:36.110188Z",
+          "created_at": "2025-09-03T17:36:37.042352Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -6987,7 +6987,7 @@
         "__type__": "ollama._types.GenerateResponse",
         "__data__": {
           "model": "llama3.2:3b-instruct-fp16",
-          "created_at": "2025-08-04T22:55:36.172356Z",
+          "created_at": "2025-09-03T17:36:37.083572Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -7005,7 +7005,7 @@
         "__type__": "ollama._types.GenerateResponse",
         "__data__": {
           "model": "llama3.2:3b-instruct-fp16",
-          "created_at": "2025-08-04T22:55:36.229749Z",
+          "created_at": "2025-09-03T17:36:37.125478Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -7023,7 +7023,7 @@
         "__type__": "ollama._types.GenerateResponse",
         "__data__": {
           "model": "llama3.2:3b-instruct-fp16",
-          "created_at": "2025-08-04T22:55:36.287566Z",
+          "created_at": "2025-09-03T17:36:37.166749Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -7041,7 +7041,7 @@
         "__type__": "ollama._types.GenerateResponse",
         "__data__": {
           "model": "llama3.2:3b-instruct-fp16",
-          "created_at": "2025-08-04T22:55:36.343992Z",
+          "created_at": "2025-09-03T17:36:37.207713Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -7059,7 +7059,7 @@
         "__type__": "ollama._types.GenerateResponse",
         "__data__": {
           "model": "llama3.2:3b-instruct-fp16",
-          "created_at": "2025-08-04T22:55:36.402701Z",
+          "created_at": "2025-09-03T17:36:37.249261Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -7077,7 +7077,7 @@
         "__type__": "ollama._types.GenerateResponse",
         "__data__": {
           "model": "llama3.2:3b-instruct-fp16",
-          "created_at": "2025-08-04T22:55:36.455985Z",
+          "created_at": "2025-09-03T17:36:37.291638Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -7095,15 +7095,15 @@
         "__type__": "ollama._types.GenerateResponse",
         "__data__": {
           "model": "llama3.2:3b-instruct-fp16",
-          "created_at": "2025-08-04T22:55:36.508093Z",
+          "created_at": "2025-09-03T17:36:37.333479Z",
           "done": true,
           "done_reason": "stop",
-          "total_duration": 21827314917,
-          "load_duration": 60502000,
+          "total_duration": 16422193500,
+          "load_duration": 146702667,
           "prompt_eval_count": 36,
-          "prompt_eval_duration": 75000000,
+          "prompt_eval_duration": 78361500,
           "eval_count": 394,
-          "eval_duration": 21690000000,
+          "eval_duration": 16196482750,
           "response": "",
           "thinking": null,
           "context": null
diff --git a/tests/integration/recordings/responses/d0ac68cbde69.json b/tests/integration/recordings/responses/d0ac68cbde69.json
index 5c19e7c5a..750c5c69b 100644
--- a/tests/integration/recordings/responses/d0ac68cbde69.json
+++ b/tests/integration/recordings/responses/d0ac68cbde69.json
@@ -13,21 +13,21 @@
       "__data__": {
         "models": [
           {
-            "model": "llama3.2:3b-instruct-fp16",
-            "name": "llama3.2:3b-instruct-fp16",
-            "digest": "195a8c01d91ec3cb1e0aad4624a51f2602c51fa7d96110f8ab5a20c84081804d",
-            "expires_at": "2025-08-18T13:47:44.262256-07:00",
-            "size": 7919570944,
-            "size_vram": 7919570944,
+            "model": "llama3.2-vision:11b",
+            "name": "llama3.2-vision:11b",
+            "digest": "6f2f9757ae97e8a3f8ea33d6adb2b11d93d9a35bef277cd2c0b1b5af8e8d0b1e",
+            "expires_at": "2025-09-03T11:51:35.966409-07:00",
+            "size": 12401209008,
+            "size_vram": 12401209008,
             "details": {
               "parent_model": "",
               "format": "gguf",
-              "family": "llama",
+              "family": "mllama",
               "families": [
-                "llama"
+                "mllama"
               ],
-              "parameter_size": "3.2B",
-              "quantization_level": "F16"
+              "parameter_size": "10.7B",
+              "quantization_level": "Q4_K_M"
             }
           }
         ]
diff --git a/tests/integration/recordings/responses/d4c86ac355fb.json b/tests/integration/recordings/responses/d4c86ac355fb.json
index 399c99e96..5dd3c7cc2 100644
--- a/tests/integration/recordings/responses/d4c86ac355fb.json
+++ b/tests/integration/recordings/responses/d4c86ac355fb.json
@@ -20,15 +20,15 @@
       "__type__": "ollama._types.GenerateResponse",
       "__data__": {
         "model": "llama-guard3:1b",
-        "created_at": "2025-08-01T23:12:54.357928Z",
+        "created_at": "2025-09-03T17:37:35.824092Z",
         "done": true,
         "done_reason": "stop",
-        "total_duration": 227148458,
-        "load_duration": 113314916,
+        "total_duration": 270017875,
+        "load_duration": 183186083,
         "prompt_eval_count": 220,
-        "prompt_eval_duration": 83000000,
+        "prompt_eval_duration": 74457250,
         "eval_count": 2,
-        "eval_duration": 27000000,
+        "eval_duration": 11684125,
         "response": "safe",
         "thinking": null,
         "context": null
diff --git a/tests/integration/recordings/responses/d86d4fc1eaca.json b/tests/integration/recordings/responses/d86d4fc1eaca.json
index 165e65093..b22354c20 100644
--- a/tests/integration/recordings/responses/d86d4fc1eaca.json
+++ b/tests/integration/recordings/responses/d86d4fc1eaca.json
@@ -20,390 +20,390 @@
         "data": [
           {
             "embedding": [
-              -0.043112263,
-              0.008686894,
-              0.06879597,
-              0.018093547,
-              0.04600579,
-              0.0026370327,
-              -0.0032194739,
-              -0.04128641,
-              -0.090751864,
-              -0.03311354,
-              -0.026625047,
-              0.007723082,
-              0.02020638,
-              -0.032501053,
-              -0.03582959,
-              0.031117352,
-              -0.03921459,
-              -0.011261255,
-              -0.10972644,
-              -0.12942035,
-              0.0180839,
-              0.011446483,
-              -0.07227963,
-              -0.013646516,
-              0.035441313,
-              0.024786202,
-              0.033887945,
-              0.072541736,
-              -0.012643559,
-              -0.058576923,
-              0.05788946,
-              -0.08161914,
-              0.064951725,
-              0.0013679718,
-              -0.067565694,
-              0.03500105,
-              -0.04499739,
-              -0.004745917,
-              0.04001028,
-              -0.010447466,
-              0.01971203,
-              -0.09853681,
-              -0.012831109,
-              0.018893523,
-              0.09566803,
-              0.11574249,
-              -0.040688448,
-              -0.026871145,
-              -0.046950754,
-              0.022665758,
-              -0.088503055,
-              -0.02349465,
-              -0.022964876,
-              -0.031086901,
-              -0.052040946,
-              0.042409953,
-              0.011587446,
-              0.06698339,
-              0.027131157,
-              -0.0021599897,
-              0.04676616,
-              -0.08205926,
-              -0.038376193,
-              0.052162487,
-              0.097754784,
-              -0.0006300649,
-              -0.051922448,
-              0.09102494,
-              -0.016122114,
-              -0.068757266,
-              0.007674277,
-              0.07676188,
-              -0.0017702047,
-              0.014375106,
-              0.038056612,
-              -0.0044639558,
-              0.01128439,
-              0.0006278256,
-              0.08837875,
-              -0.059357397,
-              -0.042713538,
-              -0.048170365,
-              -0.053083148,
-              0.03308664,
-              0.008073919,
-              -0.042588204,
-              -0.038085114,
-              -0.0071590515,
-              0.010923276,
-              -0.05467666,
-              0.039005354,
-              -0.06774879,
-              -0.023520455,
-              -0.038865313,
-              0.03465567,
-              0.015331597,
-              0.0073779793,
-              -0.123536974,
-              0.03618996,
-              0.13191763,
-              -0.06441666,
-              0.03345934,
-              -0.014335858,
-              0.0014165065,
-              0.031064518,
-              -0.039842315,
-              0.02367409,
-              -0.0028713108,
-              0.09695666,
-              -0.13332556,
-              -0.054217666,
-              0.019605756,
-              0.069848165,
-              -0.05345,
-              0.0018457369,
-              0.021261381,
-              0.019834742,
-              0.0364726,
-              0.008800545,
-              0.01899199,
-              -0.07162491,
-              -0.018764688,
-              0.030988883,
-              0.09103274,
-              0.016486289,
-              -0.08622413,
-              -0.083044365,
-              -1.3872017e-34,
-              -0.07202043,
-              -0.04547031,
-              -0.02789685,
-              0.058260243,
-              -0.010473749,
-              -0.06121573,
-              0.026039537,
-              -0.06574506,
-              0.029187253,
-              0.012286592,
-              -0.0634218,
-              0.040592846,
-              0.036436044,
-              0.019791061,
-              0.087508686,
-              0.02819681,
-              0.044173952,
-              0.076273374,
-              0.029475076,
-              -0.0022728525,
-              0.043047428,
-              0.025950495,
-              5.87631e-06,
-              -0.038482204,
-              -0.016193746,
-              0.03337992,
-              0.021100886,
-              -0.023393923,
-              0.009839609,
-              0.033582654,
-              0.030119505,
-              0.060411848,
-              -0.06525265,
-              -0.016019775,
-              0.01918547,
-              -0.0026020391,
-              -0.046634916,
-              0.02794535,
-              0.02097679,
-              0.007491536,
-              -0.048716933,
-              -0.007056093,
-              0.019862399,
-              0.01642084,
-              -0.06380952,
-              0.0312326,
-              0.09198801,
-              -0.031442497,
-              0.022264522,
-              -0.015000218,
-              0.002577486,
-              -0.031360134,
-              -0.015259252,
-              -0.025491642,
-              0.082340494,
-              0.14332701,
-              -0.02549817,
-              -0.005105692,
-              -0.023140578,
-              -0.031175751,
-              0.069945835,
-              0.030767307,
-              0.048112787,
-              0.03713218,
-              0.006838781,
-              0.0676382,
-              0.049743734,
-              0.008490252,
-              0.0717143,
-              0.007724331,
-              -0.0051555126,
-              -0.0031412526,
-              0.024659572,
-              -0.06878996,
-              0.052448474,
-              -0.009324618,
-              0.10184338,
-              -0.01364986,
-              -0.022692662,
-              0.0214144,
-              -0.09594176,
-              0.024049604,
-              -0.07207682,
-              -0.044615954,
-              0.03346317,
-              -0.03939876,
-              0.020151427,
-              -0.07493882,
-              -0.008306699,
-              0.013818277,
-              -0.098477356,
-              0.03363548,
-              0.08237572,
-              -0.0034042797,
-              -0.05002446,
-              -2.0284525e-33,
-              -0.1366396,
-              0.06461703,
-              0.05217467,
-              0.10100113,
-              0.01633431,
-              -0.012683015,
-              -0.09023996,
-              -0.023585103,
-              0.005757103,
-              0.102958955,
-              -0.025938109,
-              -0.04024086,
-              0.03442524,
-              0.019281812,
-              -0.05693542,
-              0.019865949,
-              0.01892263,
-              -0.03937148,
-              0.011244816,
-              0.05603835,
-              -0.015989995,
-              0.058931332,
-              -0.03825127,
-              -0.030448802,
-              -0.021279855,
-              0.031412993,
-              -0.021256046,
-              -0.013973024,
-              -0.051028315,
-              0.048959594,
-              0.018415732,
-              -0.015543872,
-              -0.050339997,
-              0.053825643,
-              -0.05102614,
-              0.016936453,
-              -0.03276066,
-              -0.025018891,
-              0.00083950633,
-              0.10212479,
-              0.047226448,
-              0.01013783,
-              -0.11656542,
-              0.012194899,
-              -0.029693797,
-              -0.099592775,
-              -0.05208683,
-              0.068527095,
-              0.05462999,
-              -0.06600112,
-              0.025495205,
-              0.013553149,
-              0.008376301,
-              -0.10753366,
-              -0.08184969,
-              0.07179369,
-              0.008020084,
-              -0.013001388,
-              0.02034551,
-              0.07830072,
-              -0.073259205,
-              -0.11530623,
-              0.040887818,
-              0.04355819,
-              -0.001209231,
-              0.045809098,
-              -0.00439629,
-              0.07479018,
-              -0.017603617,
-              -0.046038117,
-              0.022736022,
-              0.057742845,
-              -0.015455795,
-              0.0078048306,
-              -0.043795776,
-              -0.05287881,
-              -0.08780934,
-              0.016208123,
-              -0.018338274,
-              -0.05680242,
-              0.036081936,
-              -0.040417098,
-              0.039246004,
-              0.083620116,
-              -0.019201642,
-              0.055849098,
-              0.047579776,
-              -0.07378654,
-              0.033696014,
-              -0.08679882,
-              -0.0106773665,
-              0.052387673,
-              0.009724484,
-              0.023857431,
-              -0.08621698,
-              -1.7164837e-08,
-              0.021028662,
-              -0.05131077,
-              0.11875527,
-              -0.04681493,
-              0.06569432,
-              0.05875326,
-              -0.050507378,
-              0.05572548,
-              -0.040579688,
-              0.05569073,
-              0.025022164,
-              -0.001695402,
-              -0.03103065,
-              0.022217639,
-              0.02812072,
-              0.031644266,
-              -0.025532138,
-              0.020890266,
-              -0.023071108,
-              0.013451792,
-              0.07502988,
-              0.022283832,
-              0.028922528,
-              -0.014248503,
-              0.025503293,
-              -0.051433153,
-              -0.0144749675,
-              0.014626067,
-              -0.028012041,
-              0.08404862,
-              -0.07754722,
-              0.03867142,
-              -0.004333606,
-              0.025680339,
-              0.12575574,
-              0.07000303,
-              0.0059297155,
-              -0.104100324,
-              -0.041432552,
-              0.016101085,
-              -0.040745873,
-              0.017750472,
-              -0.09112738,
-              -0.026067602,
-              0.055624463,
-              0.016697235,
-              0.016438706,
-              -0.11938217,
-              0.027880691,
-              0.015196545,
-              0.042352572,
-              0.06814026,
-              0.057811365,
-              0.063263096,
-              0.067467265,
-              0.059775982,
-              0.06467763,
-              -0.067497864,
-              -0.035580758,
-              0.06402302,
-              0.008630453,
-              0.0031874685,
-              0.009377425,
-              -0.08392178
+              -0.04308226,
+              0.008707138,
+              0.06876158,
+              0.018115537,
+              0.04603657,
+              0.0026118131,
+              -0.0032358477,
+              -0.041284926,
+              -0.09074888,
+              -0.033087812,
+              -0.026611822,
+              0.0077352105,
+              0.020191023,
+              -0.03254043,
+              -0.035847843,
+              0.031108031,
+              -0.039247137,
+              -0.011286401,
+              -0.109710276,
+              -0.12942196,
+              0.018077252,
+              0.011446383,
+              -0.07231236,
+              -0.013655743,
+              0.035438832,
+              0.024783252,
+              0.03387316,
+              0.0726014,
+              -0.012643238,
+              -0.058606703,
+              0.057943814,
+              -0.08163548,
+              0.064962864,
+              0.0013675748,
+              -0.06751009,
+              0.03504323,
+              -0.044962864,
+              -0.004789603,
+              0.039971247,
+              -0.010461211,
+              0.019703588,
+              -0.09856083,
+              -0.01284534,
+              0.018876119,
+              0.09569305,
+              0.11571406,
+              -0.040684983,
+              -0.026837468,
+              -0.046950106,
+              0.022655226,
+              -0.0884734,
+              -0.023497678,
+              -0.022986038,
+              -0.031128721,
+              -0.052087843,
+              0.04241795,
+              0.011578454,
+              0.06702011,
+              0.027121129,
+              -0.0021518404,
+              0.04675332,
+              -0.082024105,
+              -0.038331598,
+              0.05215799,
+              0.097757615,
+              -0.0006708623,
+              -0.051935766,
+              0.09100271,
+              -0.016111707,
+              -0.06877312,
+              0.00767068,
+              0.076737314,
+              -0.0017499238,
+              0.014369293,
+              0.038031887,
+              -0.0044654603,
+              0.011287075,
+              0.0006178959,
+              0.08834809,
+              -0.05933476,
+              -0.042706404,
+              -0.048178285,
+              -0.053068914,
+              0.033110976,
+              0.008051986,
+              -0.042581946,
+              -0.038104057,
+              -0.007202849,
+              0.010891519,
+              -0.05466173,
+              0.03903238,
+              -0.06774145,
+              -0.02356764,
+              -0.03883483,
+              0.03464186,
+              0.015297014,
+              0.0073803077,
+              -0.12351391,
+              0.036168184,
+              0.13193323,
+              -0.06441449,
+              0.033508655,
+              -0.01435515,
+              0.0014314495,
+              0.031048443,
+              -0.03981852,
+              0.0236718,
+              -0.0028333638,
+              0.096959464,
+              -0.13331193,
+              -0.054209094,
+              0.019610135,
+              0.06984815,
+              -0.05347757,
+              0.0018131314,
+              0.02127606,
+              0.01981612,
+              0.036502477,
+              0.008825069,
+              0.018954003,
+              -0.07161326,
+              -0.018733062,
+              0.031044634,
+              0.09102944,
+              0.016508427,
+              -0.08625295,
+              -0.08300717,
+              -1.4044197e-34,
+              -0.072007515,
+              -0.045496386,
+              -0.027986562,
+              0.05823018,
+              -0.010462877,
+              -0.06121516,
+              0.026053715,
+              -0.06574638,
+              0.029178392,
+              0.012307141,
+              -0.06338016,
+              0.040593755,
+              0.03648161,
+              0.01977942,
+              0.08755496,
+              0.028216325,
+              0.044194777,
+              0.076237544,
+              0.02949726,
+              -0.0022650051,
+              0.04304541,
+              0.025918182,
+              1.2261046e-05,
+              -0.038463842,
+              -0.0161955,
+              0.03338553,
+              0.02112944,
+              -0.023382189,
+              0.009846733,
+              0.033575017,
+              0.030112585,
+              0.060389582,
+              -0.06522927,
+              -0.016030189,
+              0.019156763,
+              -0.002600835,
+              -0.04663393,
+              0.02794595,
+              0.021004112,
+              0.0074595963,
+              -0.048745092,
+              -0.0070450655,
+              0.019834043,
+              0.016411202,
+              -0.06381404,
+              0.031237993,
+              0.091976196,
+              -0.0313931,
+              0.022238847,
+              -0.015018542,
+              0.0025784613,
+              -0.031382624,
+              -0.0152902305,
+              -0.025491757,
+              0.08233924,
+              0.14333151,
+              -0.0255008,
+              -0.005104579,
+              -0.02309693,
+              -0.03117742,
+              0.06995927,
+              0.030787794,
+              0.04810884,
+              0.037135385,
+              0.0068392092,
+              0.06759879,
+              0.049763102,
+              0.008472162,
+              0.07170584,
+              0.0076969583,
+              -0.005139827,
+              -0.0031728086,
+              0.024646448,
+              -0.06879641,
+              0.05249289,
+              -0.009404918,
+              0.10184627,
+              -0.013639711,
+              -0.022681188,
+              0.021382388,
+              -0.09593746,
+              0.024071718,
+              -0.072101034,
+              -0.04462981,
+              0.033456877,
+              -0.03942254,
+              0.020099705,
+              -0.07495305,
+              -0.008311987,
+              0.013811793,
+              -0.09847922,
+              0.0336409,
+              0.08235891,
+              -0.0034134828,
+              -0.05005179,
+              -2.0283256e-33,
+              -0.13664234,
+              0.06463093,
+              0.05221015,
+              0.10102781,
+              0.016344123,
+              -0.01269384,
+              -0.09024102,
+              -0.023596523,
+              0.0057664234,
+              0.10294541,
+              -0.025930807,
+              -0.040247634,
+              0.034446176,
+              0.019228913,
+              -0.056902077,
+              0.019905953,
+              0.018969242,
+              -0.039362065,
+              0.011287794,
+              0.056024995,
+              -0.016000811,
+              0.058928564,
+              -0.038211577,
+              -0.030445429,
+              -0.02130076,
+              0.031401403,
+              -0.021228284,
+              -0.01400283,
+              -0.051042903,
+              0.048970606,
+              0.018451849,
+              -0.015488385,
+              -0.05033241,
+              0.053844187,
+              -0.050984643,
+              0.016940817,
+              -0.032773405,
+              -0.02502497,
+              0.000826887,
+              0.10213942,
+              0.04724571,
+              0.010156266,
+              -0.11653258,
+              0.012165439,
+              -0.029735534,
+              -0.09959623,
+              -0.052066926,
+              0.06851813,
+              0.054645896,
+              -0.066007115,
+              0.025503889,
+              0.013539478,
+              0.008429433,
+              -0.10756056,
+              -0.08184448,
+              0.07179834,
+              0.007978949,
+              -0.013011469,
+              0.020322459,
+              0.07827889,
+              -0.07320297,
+              -0.1153648,
+              0.04087073,
+              0.04355079,
+              -0.0012279376,
+              0.045840748,
+              -0.004366462,
+              0.074786335,
+              -0.017625354,
+              -0.046014115,
+              0.022716347,
+              0.057738,
+              -0.015408269,
+              0.007771719,
+              -0.04381374,
+              -0.05289107,
+              -0.08783473,
+              0.016243288,
+              -0.018398289,
+              -0.05679973,
+              0.036058675,
+              -0.040418148,
+              0.039242174,
+              0.083593465,
+              -0.019223504,
+              0.05582025,
+              0.04756948,
+              -0.07378718,
+              0.03371102,
+              -0.08680738,
+              -0.010659349,
+              0.0524085,
+              0.009771544,
+              0.023841262,
+              -0.086208895,
+              -1.7164519e-08,
+              0.021028979,
+              -0.051292755,
+              0.11877283,
+              -0.04687027,
+              0.06566496,
+              0.058750976,
+              -0.050496,
+              0.055720143,
+              -0.040577173,
+              0.055665523,
+              0.025019526,
+              -0.001681203,
+              -0.031047702,
+              0.022228474,
+              0.028109053,
+              0.03163934,
+              -0.025502652,
+              0.020898303,
+              -0.023064507,
+              0.013436037,
+              0.07504084,
+              0.022279648,
+              0.028908938,
+              -0.014271217,
+              0.025474275,
+              -0.051414162,
+              -0.014502164,
+              0.014646399,
+              -0.028023712,
+              0.08406334,
+              -0.07755092,
+              0.038713943,
+              -0.0043370826,
+              0.025676368,
+              0.12571524,
+              0.06996381,
+              0.0059321956,
+              -0.10410214,
+              -0.041439336,
+              0.016119901,
+              -0.040744506,
+              0.017772397,
+              -0.09114363,
+              -0.026066387,
+              0.055598073,
+              0.016705057,
+              0.016444646,
+              -0.11935461,
+              0.02789905,
+              0.0151745565,
+              0.042357437,
+              0.06817164,
+              0.05782822,
+              0.063278705,
+              0.06748475,
+              0.059781626,
+              0.06468886,
+              -0.06749451,
+              -0.035589237,
+              0.0640055,
+              0.008595763,
+              0.003157698,
+              0.009343837,
+              -0.08392565
             ],
             "index": 0,
             "object": "embedding"
diff --git a/tests/integration/recordings/responses/dac7a32e5db9.json b/tests/integration/recordings/responses/dac7a32e5db9.json
index a28144442..97d1fccfc 100644
--- a/tests/integration/recordings/responses/dac7a32e5db9.json
+++ b/tests/integration/recordings/responses/dac7a32e5db9.json
@@ -20,15 +20,15 @@
       "__type__": "ollama._types.GenerateResponse",
       "__data__": {
         "model": "llama3.2:3b-instruct-fp16",
-        "created_at": "2025-07-31T17:50:00.921192644Z",
+        "created_at": "2025-09-03T17:39:36.919474Z",
         "done": true,
         "done_reason": "stop",
-        "total_duration": 2073152067,
-        "load_duration": 42902450,
+        "total_duration": 470635833,
+        "load_duration": 113755958,
         "prompt_eval_count": 23,
-        "prompt_eval_duration": 795517987,
+        "prompt_eval_duration": 67480542,
         "eval_count": 8,
-        "eval_duration": 1234259942,
+        "eval_duration": 288746541,
         "response": "The capital of France is Paris.",
         "thinking": null,
         "context": null
diff --git a/tests/integration/recordings/responses/dd226d71f844.json b/tests/integration/recordings/responses/dd226d71f844.json
index 2b8b52a63..ba2810bc9 100644
--- a/tests/integration/recordings/responses/dd226d71f844.json
+++ b/tests/integration/recordings/responses/dd226d71f844.json
@@ -22,7 +22,7 @@
         "__type__": "ollama._types.GenerateResponse",
         "__data__": {
           "model": "llama3.2:3b-instruct-fp16",
-          "created_at": "2025-08-01T23:14:25.381208Z",
+          "created_at": "2025-09-03T17:38:05.682744Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -40,7 +40,7 @@
         "__type__": "ollama._types.GenerateResponse",
         "__data__": {
           "model": "llama3.2:3b-instruct-fp16",
-          "created_at": "2025-08-01T23:14:25.441511Z",
+          "created_at": "2025-09-03T17:38:05.72605Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -58,7 +58,7 @@
         "__type__": "ollama._types.GenerateResponse",
         "__data__": {
           "model": "llama3.2:3b-instruct-fp16",
-          "created_at": "2025-08-01T23:14:25.499052Z",
+          "created_at": "2025-09-03T17:38:05.770654Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -76,7 +76,7 @@
         "__type__": "ollama._types.GenerateResponse",
         "__data__": {
           "model": "llama3.2:3b-instruct-fp16",
-          "created_at": "2025-08-01T23:14:25.577259Z",
+          "created_at": "2025-09-03T17:38:05.819087Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -94,7 +94,7 @@
         "__type__": "ollama._types.GenerateResponse",
         "__data__": {
           "model": "llama3.2:3b-instruct-fp16",
-          "created_at": "2025-08-01T23:14:25.635016Z",
+          "created_at": "2025-09-03T17:38:05.862915Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -112,7 +112,7 @@
         "__type__": "ollama._types.GenerateResponse",
         "__data__": {
           "model": "llama3.2:3b-instruct-fp16",
-          "created_at": "2025-08-01T23:14:25.68944Z",
+          "created_at": "2025-09-03T17:38:05.913209Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -130,7 +130,7 @@
         "__type__": "ollama._types.GenerateResponse",
         "__data__": {
           "model": "llama3.2:3b-instruct-fp16",
-          "created_at": "2025-08-01T23:14:25.742314Z",
+          "created_at": "2025-09-03T17:38:05.951646Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -148,7 +148,7 @@
         "__type__": "ollama._types.GenerateResponse",
         "__data__": {
           "model": "llama3.2:3b-instruct-fp16",
-          "created_at": "2025-08-01T23:14:25.795086Z",
+          "created_at": "2025-09-03T17:38:05.996738Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -166,7 +166,7 @@
         "__type__": "ollama._types.GenerateResponse",
         "__data__": {
           "model": "llama3.2:3b-instruct-fp16",
-          "created_at": "2025-08-01T23:14:25.847905Z",
+          "created_at": "2025-09-03T17:38:06.046726Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -184,7 +184,7 @@
         "__type__": "ollama._types.GenerateResponse",
         "__data__": {
           "model": "llama3.2:3b-instruct-fp16",
-          "created_at": "2025-08-01T23:14:25.898666Z",
+          "created_at": "2025-09-03T17:38:06.08508Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -202,7 +202,7 @@
         "__type__": "ollama._types.GenerateResponse",
         "__data__": {
           "model": "llama3.2:3b-instruct-fp16",
-          "created_at": "2025-08-01T23:14:25.952292Z",
+          "created_at": "2025-09-03T17:38:06.128566Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -220,7 +220,7 @@
         "__type__": "ollama._types.GenerateResponse",
         "__data__": {
           "model": "llama3.2:3b-instruct-fp16",
-          "created_at": "2025-08-01T23:14:26.001903Z",
+          "created_at": "2025-09-03T17:38:06.173309Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -238,15 +238,15 @@
         "__type__": "ollama._types.GenerateResponse",
         "__data__": {
           "model": "llama3.2:3b-instruct-fp16",
-          "created_at": "2025-08-01T23:14:26.053764Z",
+          "created_at": "2025-09-03T17:38:06.218818Z",
           "done": true,
           "done_reason": "stop",
-          "total_duration": 880684833,
-          "load_duration": 101945250,
+          "total_duration": 755252250,
+          "load_duration": 141479625,
           "prompt_eval_count": 402,
-          "prompt_eval_duration": 100000000,
+          "prompt_eval_duration": 76304166,
           "eval_count": 13,
-          "eval_duration": 677000000,
+          "eval_duration": 536202125,
           "response": "",
           "thinking": null,
           "context": null
diff --git a/tests/integration/recordings/responses/dd9e7d5913e9.json b/tests/integration/recordings/responses/dd9e7d5913e9.json
index 8f4b0ef30..e3d8b41f5 100644
--- a/tests/integration/recordings/responses/dd9e7d5913e9.json
+++ b/tests/integration/recordings/responses/dd9e7d5913e9.json
@@ -21,7 +21,7 @@
         "__type__": "ollama._types.GenerateResponse",
         "__data__": {
           "model": "llama3.2:3b-instruct-fp16",
-          "created_at": "2025-08-04T22:55:41.559883Z",
+          "created_at": "2025-09-03T17:36:40.972565Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -39,15 +39,15 @@
         "__type__": "ollama._types.GenerateResponse",
         "__data__": {
           "model": "llama3.2:3b-instruct-fp16",
-          "created_at": "2025-08-04T22:55:41.619829Z",
+          "created_at": "2025-09-03T17:36:41.014682Z",
           "done": true,
           "done_reason": "stop",
-          "total_duration": 915493834,
-          "load_duration": 167838417,
+          "total_duration": 693115125,
+          "load_duration": 114019375,
           "prompt_eval_count": 386,
-          "prompt_eval_duration": 683000000,
+          "prompt_eval_duration": 535931209,
           "eval_count": 2,
-          "eval_duration": 63000000,
+          "eval_duration": 42505166,
           "response": "",
           "thinking": null,
           "context": null
diff --git a/tests/integration/recordings/responses/decfd950646c.json b/tests/integration/recordings/responses/decfd950646c.json
index f62340c27..c46fa8686 100644
--- a/tests/integration/recordings/responses/decfd950646c.json
+++ b/tests/integration/recordings/responses/decfd950646c.json
@@ -1,7 +1,7 @@
 {
   "request": {
     "method": "POST",
-    "url": "http://localhost:11434/v1/v1/chat/completions",
+    "url": "http://0.0.0.0:11434/v1/v1/chat/completions",
     "headers": {},
     "body": {
       "model": "llama3.2:3b-instruct-fp16",
@@ -44,32 +44,22 @@
       {
         "__type__": "openai.types.chat.chat_completion_chunk.ChatCompletionChunk",
         "__data__": {
-          "id": "chatcmpl-620",
+          "id": "chatcmpl-202",
           "choices": [
             {
               "delta": {
-                "content": "",
+                "content": "{\"name\":\"get_weather\",\"parameters{\"key\"]=\"Tokyo\"}}",
                 "function_call": null,
                 "refusal": null,
                 "role": "assistant",
-                "tool_calls": [
-                  {
-                    "index": 0,
-                    "id": "call_490d5ur7",
-                    "function": {
-                      "arguments": "{\"city\":\"Tokyo\"}",
-                      "name": "get_weather"
-                    },
-                    "type": "function"
-                  }
-                ]
+                "tool_calls": null
               },
               "finish_reason": null,
               "index": 0,
               "logprobs": null
             }
           ],
-          "created": 1755228972,
+          "created": 1756921363,
           "model": "llama3.2:3b-instruct-fp16",
           "object": "chat.completion.chunk",
           "service_tier": null,
@@ -80,7 +70,7 @@
       {
         "__type__": "openai.types.chat.chat_completion_chunk.ChatCompletionChunk",
         "__data__": {
-          "id": "chatcmpl-620",
+          "id": "chatcmpl-202",
           "choices": [
             {
               "delta": {
@@ -90,12 +80,12 @@
                 "role": "assistant",
                 "tool_calls": null
               },
-              "finish_reason": "tool_calls",
+              "finish_reason": "stop",
               "index": 0,
               "logprobs": null
             }
           ],
-          "created": 1755228972,
+          "created": 1756921363,
           "model": "llama3.2:3b-instruct-fp16",
           "object": "chat.completion.chunk",
           "service_tier": null,
diff --git a/tests/integration/recordings/responses/e0a6dce1d94b.json b/tests/integration/recordings/responses/e0a6dce1d94b.json
index 08fd4df2c..4a285b30b 100644
--- a/tests/integration/recordings/responses/e0a6dce1d94b.json
+++ b/tests/integration/recordings/responses/e0a6dce1d94b.json
@@ -20,390 +20,390 @@
         "data": [
           {
             "embedding": [
-              -0.028391164,
-              0.08177924,
-              -0.078595236,
-              0.02794012,
-              0.0501054,
-              -0.03523528,
-              -0.0040212795,
-              0.029318463,
-              -0.057719484,
-              0.013758128,
-              0.14608414,
-              -0.012030242,
-              -0.0244042,
-              -0.05507163,
-              -0.026622117,
-              -0.0132702645,
-              -0.109127365,
-              -0.037243392,
-              -0.003585629,
-              0.047631495,
-              0.062134072,
-              0.0070668682,
-              -0.015537441,
-              -0.0080097895,
-              0.03766712,
-              0.015882641,
-              -0.041853406,
-              0.09733282,
-              -0.025634848,
-              -0.11367206,
-              0.035507742,
-              0.07039588,
-              0.016794816,
-              0.022213018,
-              0.12344487,
-              0.007708932,
-              0.12549855,
-              0.00806089,
-              -0.02614805,
-              0.0028652712,
-              0.018172521,
-              -0.046700634,
-              0.04102468,
-              0.001336475,
-              0.0019230411,
-              0.008665353,
-              0.016688382,
-              0.022002129,
-              0.0020729597,
-              -0.03286714,
-              -0.08643458,
-              0.008018572,
-              -0.07433228,
-              -0.01628817,
-              0.060542718,
-              0.005992304,
-              0.016035207,
-              0.021369386,
-              0.009568174,
-              0.03177933,
-              0.023040457,
-              0.03435853,
-              -0.042258766,
-              0.024753148,
-              0.11620828,
-              -0.02494626,
-              -0.03897831,
-              -0.024997817,
-              -0.020839883,
-              -0.08836877,
-              -0.15072803,
-              0.020933837,
-              -0.022511186,
-              0.0023899842,
-              0.0057860566,
-              -0.001578469,
-              -0.11986527,
-              -0.003025397,
-              0.055101633,
-              -0.11829019,
-              -0.05885812,
-              -0.1504569,
-              0.01861341,
-              -0.009307191,
-              -0.028901236,
-              0.08401475,
-              0.043742407,
-              -0.0006705526,
-              -0.052525397,
-              0.00025590818,
-              0.040425412,
-              0.0066513056,
-              0.026082706,
-              0.051888794,
-              0.01259031,
-              0.061460704,
-              0.013889724,
-              0.03844097,
-              0.048208673,
-              0.10407735,
-              -0.02645537,
-              -0.021476867,
-              -0.020856835,
-              0.050631326,
-              -0.05169685,
-              -0.07577173,
-              0.05749261,
-              -0.0499922,
-              0.06527451,
-              -0.02872225,
-              0.03874818,
-              -0.062776215,
-              -0.014480463,
-              -0.06345894,
-              0.06641256,
-              -0.014838074,
-              -0.03524914,
-              0.07739568,
-              -0.039939843,
-              0.032204024,
-              0.10169046,
-              -0.022527538,
-              -0.05930125,
-              0.00039771595,
-              -0.057792112,
-              -0.070337616,
-              0.06377354,
-              -4.088526e-33,
-              -0.021773575,
-              -0.079873994,
-              -0.013886454,
-              0.14922747,
-              0.025207443,
-              -0.042269774,
-              -0.0067705857,
-              0.054603398,
-              -0.092237934,
-              0.008083855,
-              -0.03861146,
-              -0.11771469,
-              0.012989592,
-              0.034553546,
-              -0.017051153,
-              0.011906159,
-              0.012945488,
-              0.042745717,
-              -0.01759736,
-              -0.018408326,
-              0.06513165,
-              0.0405268,
-              -0.022535695,
-              -0.06094611,
-              -0.018629104,
-              0.011654488,
-              0.014083773,
-              -0.067636594,
-              0.08541857,
-              0.030126775,
-              0.010824449,
-              -0.054840527,
-              -0.024132056,
-              0.048314847,
-              0.007516418,
-              0.013355685,
-              0.024563083,
-              -0.005942082,
-              -0.045623902,
-              -0.004832818,
-              0.004424451,
-              -0.0023969507,
-              0.013589571,
-              -0.0168692,
-              0.06961138,
-              -0.07734751,
-              0.020551285,
-              0.0048098145,
-              0.055662792,
-              0.013124815,
-              -0.011720894,
-              0.04093993,
-              0.007497743,
-              0.042012148,
-              0.010350773,
-              0.019379916,
-              0.01108285,
-              0.017257342,
-              0.018258827,
-              0.0773061,
-              0.01962173,
-              0.052673563,
-              -0.05859421,
-              0.039764106,
-              -0.05021828,
-              -0.04896494,
-              -0.05262346,
-              -0.09227966,
-              0.07557037,
-              0.08099812,
-              -0.02225778,
-              -0.04215297,
-              0.056577113,
-              0.02356105,
-              0.0015294012,
-              -0.049797468,
-              0.0023656262,
-              0.028645845,
-              -0.06897522,
-              -0.0477758,
-              -0.04864175,
-              -0.0766266,
-              -0.032856915,
-              -0.046002492,
-              -0.057314955,
-              -0.08091142,
-              -0.008058203,
-              -0.09362831,
-              0.0512433,
-              -0.05832409,
-              -0.00059281266,
-              0.022221608,
-              -0.046930317,
-              -0.08964614,
-              0.11954097,
-              2.044738e-33,
-              0.01219642,
-              0.08643133,
-              -0.023233324,
-              0.002765521,
-              -0.0010344109,
-              0.034877002,
-              0.07328553,
-              -0.04988436,
-              -0.04193409,
-              0.13485521,
-              -0.006909938,
-              0.0062319604,
-              0.059107542,
-              -0.028918913,
-              0.09142895,
-              -0.018481337,
-              0.00771716,
-              -0.04420843,
-              -0.025174472,
-              -0.0150115965,
-              -0.03543459,
-              0.124125846,
-              0.13119355,
-              0.08100271,
-              -0.033272874,
-              0.0039677722,
-              0.02646281,
-              0.026607113,
-              0.017331243,
-              -0.0036059914,
-              0.03546072,
-              0.059571866,
-              -0.12454768,
-              0.021932347,
-              0.02564387,
-              -0.11062035,
-              0.09607079,
-              -0.06733944,
-              -0.01182028,
-              0.0423393,
-              0.0378881,
-              0.1058394,
-              0.00734931,
-              0.066321366,
-              0.022943782,
-              0.049426265,
-              0.14638706,
-              -0.0067357672,
-              0.0043576923,
-              -0.029188734,
-              -0.009015755,
-              -0.08637437,
-              0.035848346,
-              0.0030120711,
-              -0.029328048,
-              0.070184804,
-              0.014865788,
-              0.028357765,
-              -0.040338036,
-              0.019171577,
-              0.015582609,
-              0.028644681,
-              -0.019528968,
-              -0.018315561,
-              -0.0054145255,
-              -0.09313447,
-              -0.061137658,
-              0.03881072,
-              0.02792733,
-              0.034151476,
-              -0.027465515,
-              0.010710185,
-              -0.055215303,
-              -0.073805,
-              0.021541798,
-              -0.015463418,
-              -0.024991987,
-              -0.004779671,
-              0.030454708,
-              -0.02407339,
-              0.034101877,
-              -0.010341885,
-              -0.012655972,
-              0.036309235,
-              -0.0044550677,
-              -0.014974223,
-              0.027874243,
-              0.09782822,
-              -0.026438858,
-              -0.005190334,
-              -0.019119462,
-              0.06202614,
-              0.052122016,
-              0.037861902,
-              0.012597777,
-              -1.7054827e-08,
-              -0.04997221,
-              -0.08913875,
-              -0.0035288178,
-              -0.015788937,
-              -0.021885982,
-              0.07185057,
-              -0.050171196,
-              -0.010661625,
-              -0.03058095,
-              -0.015772644,
-              0.01322944,
-              -0.0025733304,
-              -0.04212318,
-              0.009266956,
-              -0.041135434,
-              -0.029588273,
-              0.0021936113,
-              -0.033001017,
-              -0.050396364,
-              -0.02149836,
-              -0.0068135546,
-              0.008485492,
-              0.03569217,
-              0.025194813,
-              -0.016510937,
-              0.04917863,
-              0.018346637,
-              0.04907251,
-              -0.0582019,
-              -0.015061549,
-              0.04578192,
-              0.049921762,
-              0.02044503,
-              -0.052017137,
-              -0.033587772,
-              0.06185581,
-              0.11143413,
-              0.07770764,
-              0.02244692,
-              0.0025846648,
-              -0.04391288,
-              0.008592464,
-              -0.036181543,
-              0.0296719,
-              -0.017300868,
-              -0.094585225,
-              -0.05786905,
-              -0.065796606,
-              -0.061245505,
-              -0.104576424,
-              -0.029241998,
-              0.0013673713,
-              0.0060772314,
-              0.04078779,
-              -0.036728922,
-              0.016783627,
-              0.005292796,
-              0.030990785,
-              -0.054467708,
-              0.0048806495,
-              0.07091143,
-              0.06684519,
-              0.01770421,
-              -0.029248381
+              -0.028407024,
+              0.08176727,
+              -0.07856116,
+              0.027924549,
+              0.05008439,
+              -0.035268802,
+              -0.0040619136,
+              0.029315198,
+              -0.05775003,
+              0.013769637,
+              0.14610882,
+              -0.012019041,
+              -0.024392882,
+              -0.05509032,
+              -0.02661779,
+              -0.013253934,
+              -0.109151706,
+              -0.037233494,
+              -0.0036058167,
+              0.04766495,
+              0.06212885,
+              0.0070259646,
+              -0.015513743,
+              -0.008010851,
+              0.037648663,
+              0.01587603,
+              -0.041856695,
+              0.09732178,
+              -0.025641596,
+              -0.11368298,
+              0.03550726,
+              0.07043342,
+              0.016779423,
+              0.02220752,
+              0.123395406,
+              0.0077137193,
+              0.12550895,
+              0.008077936,
+              -0.026158499,
+              0.0028612812,
+              0.018155744,
+              -0.04666325,
+              0.041025575,
+              0.0013476727,
+              0.0019516364,
+              0.008663665,
+              0.016689047,
+              0.02200178,
+              0.0020768014,
+              -0.032861207,
+              -0.086455174,
+              0.008047145,
+              -0.07434091,
+              -0.016292974,
+              0.06051878,
+              0.005966867,
+              0.0160179,
+              0.021412006,
+              0.009540338,
+              0.03177335,
+              0.023032434,
+              0.03437097,
+              -0.04224765,
+              0.024748176,
+              0.116213955,
+              -0.024936162,
+              -0.03895259,
+              -0.024991278,
+              -0.020854436,
+              -0.08835937,
+              -0.15073228,
+              0.020921277,
+              -0.022518696,
+              0.0023868105,
+              0.0057663955,
+              -0.0015790414,
+              -0.11985628,
+              -0.0029912454,
+              0.0550998,
+              -0.11830636,
+              -0.058846988,
+              -0.15046737,
+              0.018624697,
+              -0.0093440395,
+              -0.028901154,
+              0.08400474,
+              0.0437436,
+              -0.0006745939,
+              -0.052540295,
+              0.00024754918,
+              0.040431518,
+              0.0066545215,
+              0.02609114,
+              0.051891107,
+              0.012606882,
+              0.061448827,
+              0.013889043,
+              0.038454182,
+              0.048222367,
+              0.104106456,
+              -0.026478294,
+              -0.021488149,
+              -0.020865437,
+              0.05061779,
+              -0.05171592,
+              -0.07573864,
+              0.057483904,
+              -0.049993664,
+              0.06528295,
+              -0.02875688,
+              0.038766492,
+              -0.062760465,
+              -0.0144796055,
+              -0.063462086,
+              0.06642258,
+              -0.014848135,
+              -0.03523116,
+              0.0774014,
+              -0.039893247,
+              0.032182425,
+              0.10171478,
+              -0.022525396,
+              -0.059299074,
+              0.00038746602,
+              -0.05779858,
+              -0.07034273,
+              0.06375495,
+              -4.088634e-33,
+              -0.021801252,
+              -0.07985834,
+              -0.013881648,
+              0.14923096,
+              0.02520313,
+              -0.042283125,
+              -0.0067697223,
+              0.054634638,
+              -0.09223034,
+              0.0081036305,
+              -0.03861765,
+              -0.117698364,
+              0.012977803,
+              0.034548674,
+              -0.01703291,
+              0.011910173,
+              0.012945288,
+              0.04277919,
+              -0.017591223,
+              -0.0184066,
+              0.06513148,
+              0.04050013,
+              -0.02252127,
+              -0.060939074,
+              -0.018603502,
+              0.011679816,
+              0.01410369,
+              -0.06763908,
+              0.08543174,
+              0.030138582,
+              0.010859261,
+              -0.054844614,
+              -0.024129191,
+              0.048327282,
+              0.00750549,
+              0.013356204,
+              0.024558878,
+              -0.005942624,
+              -0.045620095,
+              -0.00484637,
+              0.004418298,
+              -0.0023806267,
+              0.013590539,
+              -0.016870445,
+              0.06959721,
+              -0.07736302,
+              0.02058481,
+              0.0048155314,
+              0.055696823,
+              0.0131223425,
+              -0.011748222,
+              0.040935397,
+              0.007458848,
+              0.042072233,
+              0.010358565,
+              0.019406458,
+              0.011092792,
+              0.017259602,
+              0.018278012,
+              0.077335365,
+              0.019612921,
+              0.05268688,
+              -0.05863009,
+              0.039751627,
+              -0.050250556,
+              -0.048913844,
+              -0.05265637,
+              -0.09227304,
+              0.0755598,
+              0.08097828,
+              -0.022257954,
+              -0.042141132,
+              0.056546185,
+              0.023585746,
+              0.0015263582,
+              -0.049815144,
+              0.002336895,
+              0.028626408,
+              -0.06897293,
+              -0.04780049,
+              -0.048637427,
+              -0.076585636,
+              -0.03285766,
+              -0.046012525,
+              -0.0573021,
+              -0.080889866,
+              -0.008056378,
+              -0.0936112,
+              0.051229417,
+              -0.058302302,
+              -0.0005942833,
+              0.02222621,
+              -0.046907477,
+              -0.08964737,
+              0.1195762,
+              2.0452953e-33,
+              0.012159685,
+              0.086426094,
+              -0.023217503,
+              0.002771192,
+              -0.0010614472,
+              0.03487195,
+              0.07328719,
+              -0.049876485,
+              -0.041938163,
+              0.13486409,
+              -0.00690217,
+              0.006254477,
+              0.059122436,
+              -0.028893106,
+              0.09141587,
+              -0.018487127,
+              0.0077112317,
+              -0.044207573,
+              -0.0251735,
+              -0.014999972,
+              -0.035417248,
+              0.12413253,
+              0.13118097,
+              0.081015825,
+              -0.03327241,
+              0.003976432,
+              0.026454262,
+              0.026598025,
+              0.017349144,
+              -0.0036153824,
+              0.035460044,
+              0.05956128,
+              -0.124593176,
+              0.021954069,
+              0.025635097,
+              -0.11063109,
+              0.096061416,
+              -0.06731725,
+              -0.011819293,
+              0.042329434,
+              0.03790837,
+              0.10582649,
+              0.0073426333,
+              0.06629678,
+              0.022922922,
+              0.0494007,
+              0.14639522,
+              -0.0067070075,
+              0.004380622,
+              -0.029196544,
+              -0.009010303,
+              -0.08637028,
+              0.03588363,
+              0.0029887543,
+              -0.029351206,
+              0.07019312,
+              0.014898416,
+              0.028345235,
+              -0.040354595,
+              0.01916304,
+              0.015590835,
+              0.028637327,
+              -0.019529723,
+              -0.018309733,
+              -0.0054176697,
+              -0.093132764,
+              -0.06116049,
+              0.038816936,
+              0.02793884,
+              0.034137025,
+              -0.027511358,
+              0.010699668,
+              -0.05521562,
+              -0.07380209,
+              0.021521263,
+              -0.015450832,
+              -0.024988633,
+              -0.004755674,
+              0.030465573,
+              -0.024057997,
+              0.0341225,
+              -0.0103128245,
+              -0.012666524,
+              0.03628323,
+              -0.0044518244,
+              -0.014977736,
+              0.02790076,
+              0.0978009,
+              -0.026436698,
+              -0.005187212,
+              -0.019124882,
+              0.06205225,
+              0.052137945,
+              0.037870288,
+              0.012578256,
+              -1.705626e-08,
+              -0.05000592,
+              -0.08913878,
+              -0.0035273295,
+              -0.01577607,
+              -0.021846429,
+              0.07184407,
+              -0.050185654,
+              -0.010643527,
+              -0.030602882,
+              -0.01577121,
+              0.013220822,
+              -0.0025653532,
+              -0.04210823,
+              0.009286525,
+              -0.041129403,
+              -0.029615805,
+              0.002200794,
+              -0.032989334,
+              -0.05041253,
+              -0.021504797,
+              -0.0068345494,
+              0.0084738685,
+              0.03568697,
+              0.0252117,
+              -0.016504692,
+              0.04915123,
+              0.018349955,
+              0.049084183,
+              -0.058165494,
+              -0.015055481,
+              0.045743454,
+              0.049920842,
+              0.020444298,
+              -0.052004594,
+              -0.033592116,
+              0.061816722,
+              0.111411005,
+              0.07770497,
+              0.022457859,
+              0.0025742552,
+              -0.043929543,
+              0.008576763,
+              -0.036182683,
+              0.029673496,
+              -0.017278075,
+              -0.09458994,
+              -0.057882637,
+              -0.06579892,
+              -0.06124832,
+              -0.10455079,
+              -0.02925637,
+              0.0013624659,
+              0.0060532107,
+              0.04077331,
+              -0.036694046,
+              0.016800206,
+              0.005279432,
+              0.030968234,
+              -0.05446385,
+              0.0048696757,
+              0.070877954,
+              0.06684445,
+              0.017715273,
+              -0.029237686
             ],
             "index": 0,
             "object": "embedding"
diff --git a/tests/integration/recordings/responses/e2c9b07709fe.json b/tests/integration/recordings/responses/e2c9b07709fe.json
index 47fa23233..0bab360ba 100644
--- a/tests/integration/recordings/responses/e2c9b07709fe.json
+++ b/tests/integration/recordings/responses/e2c9b07709fe.json
@@ -1,7 +1,7 @@
 {
   "request": {
     "method": "POST",
-    "url": "http://localhost:11434/v1/v1/chat/completions",
+    "url": "http://0.0.0.0:11434/v1/v1/chat/completions",
     "headers": {},
     "body": {
       "model": "llama3.2:3b-instruct-fp16",
@@ -22,14 +22,14 @@
     "body": {
       "__type__": "openai.types.chat.chat_completion.ChatCompletion",
       "__data__": {
-        "id": "chatcmpl-494",
+        "id": "chatcmpl-662",
         "choices": [
           {
             "finish_reason": "length",
             "index": 0,
             "logprobs": null,
             "message": {
-              "content": "To test the OpenAI API with a temperature of 1, you can use the following Python code:\n\n```python\nimport requests\n\ndef generate_text(model_name, prompt, temperature=1):\n    # Set the API endpoint and parameters\n    url = \"https://api.openai.com/v1/models/\" + model_name + \"/generate\"\n    params = {\n        \"prompt\": prompt,\n        \"temperature\": temperature\n    }\n\n    # Send a GET request to the API\n    response =",
+              "content": "To test the prompt understanding of OpenAI's text generation capabilities, I'll simulate a conversation. \n\nYou mentioned testing the model with a temperature setting of 1. The temperature parameter in OpenAI's text models controls the diversity and coherence of generated text.\n\nA temperature of 1 is considered \"colder\" than usual, meaning the model will generate more coherent but potentially less diverse text compared to higher temperatures (e.g., 0.5 or 0.7).\n\nPlease provide a prompt for",
               "refusal": null,
               "role": "assistant",
               "annotations": null,
@@ -39,7 +39,7 @@
             }
           }
         ],
-        "created": 1754510067,
+        "created": 1756921259,
         "model": "llama3.2:3b-instruct-fp16",
         "object": "chat.completion",
         "service_tier": null,
diff --git a/tests/integration/recordings/responses/e96152610712.json b/tests/integration/recordings/responses/e96152610712.json
index b55e02825..aa758da0d 100644
--- a/tests/integration/recordings/responses/e96152610712.json
+++ b/tests/integration/recordings/responses/e96152610712.json
@@ -20,15 +20,15 @@
       "__type__": "ollama._types.GenerateResponse",
       "__data__": {
         "model": "llama-guard3:1b",
-        "created_at": "2025-08-01T23:12:51.421145Z",
+        "created_at": "2025-09-03T17:37:33.16899Z",
         "done": true,
         "done_reason": "stop",
-        "total_duration": 201670125,
-        "load_duration": 70275459,
+        "total_duration": 300698625,
+        "load_duration": 179823875,
         "prompt_eval_count": 207,
-        "prompt_eval_duration": 71000000,
+        "prompt_eval_duration": 65083666,
         "eval_count": 5,
-        "eval_duration": 58000000,
+        "eval_duration": 55216084,
         "response": "unsafe\nS2",
         "thinking": null,
         "context": null
diff --git a/tests/integration/recordings/responses/e9c8a0e4f0e0.json b/tests/integration/recordings/responses/e9c8a0e4f0e0.json
index 85adb5734..87a208405 100644
--- a/tests/integration/recordings/responses/e9c8a0e4f0e0.json
+++ b/tests/integration/recordings/responses/e9c8a0e4f0e0.json
@@ -1,7 +1,7 @@
 {
   "request": {
     "method": "POST",
-    "url": "http://localhost:11434/v1/v1/chat/completions",
+    "url": "http://0.0.0.0:11434/v1/v1/chat/completions",
     "headers": {},
     "body": {
       "model": "llama3.2:3b-instruct-fp16",
@@ -20,14 +20,14 @@
     "body": {
       "__type__": "openai.types.chat.chat_completion.ChatCompletion",
       "__data__": {
-        "id": "chatcmpl-57",
+        "id": "chatcmpl-957",
         "choices": [
           {
             "finish_reason": "stop",
             "index": 0,
             "logprobs": null,
             "message": {
-              "content": "Humans live on Earth. It is the third planet from the Sun and is the only known planet in the universe that currently supports human life.",
+              "content": "Humans live on Earth. It's a terrestrial planet in the Solar System, located in the outer reaches of the Sun's gravitational pull.",
               "refusal": null,
               "role": "assistant",
               "annotations": null,
@@ -37,15 +37,15 @@
             }
           }
         ],
-        "created": 1754081845,
+        "created": 1756921355,
         "model": "llama3.2:3b-instruct-fp16",
         "object": "chat.completion",
         "service_tier": null,
         "system_fingerprint": "fp_ollama",
         "usage": {
-          "completion_tokens": 29,
+          "completion_tokens": 28,
           "prompt_tokens": 32,
-          "total_tokens": 61,
+          "total_tokens": 60,
           "completion_tokens_details": null,
           "prompt_tokens_details": null
         }
diff --git a/tests/integration/recordings/responses/ed9e9b34008d.json b/tests/integration/recordings/responses/ed9e9b34008d.json
index ae46f481a..d0591dbc1 100644
--- a/tests/integration/recordings/responses/ed9e9b34008d.json
+++ b/tests/integration/recordings/responses/ed9e9b34008d.json
@@ -20,15 +20,15 @@
       "__type__": "ollama._types.GenerateResponse",
       "__data__": {
         "model": "llama3.2:3b-instruct-fp16",
-        "created_at": "2025-07-31T17:50:48.719062652Z",
+        "created_at": "2025-09-03T17:39:48.030217Z",
         "done": true,
         "done_reason": "stop",
-        "total_duration": 42572007410,
-        "load_duration": 42791399,
+        "total_duration": 9760536750,
+        "load_duration": 242188583,
         "prompt_eval_count": 26,
-        "prompt_eval_duration": 1301967184,
+        "prompt_eval_duration": 83819333,
         "eval_count": 232,
-        "eval_duration": 41226696354,
+        "eval_duration": 9434009042,
         "response": "The largest planet in our solar system is Jupiter. It is a gas giant, meaning it is primarily composed of hydrogen and helium gases. Jupiter has a diameter of approximately 142,984 kilometers (88,846 miles), which is more than 11 times the diameter of Earth.\n\nJupiter is not only the largest planet in terms of size, but also the most massive planet in our solar system, with a mass that is more than 318 times that of Earth. It has a thick atmosphere and a strong magnetic field, and is known for its distinctive banded appearance, which is caused by strong winds in the upper atmosphere.\n\nJupiter's massive size and gravitational pull have a significant impact on the surrounding space, including the orbits of nearby planets and asteroids. Its moons are also notable, with four large ones: Io, Europa, Ganymede, and Callisto, which are known as the Galilean moons due to their discovery by Galileo Galilei in 1610.\n\nJupiter is a fascinating planet that continues to be studied by astronomers and space agencies around the world, offering insights into the formation and evolution of our solar system.",
         "thinking": null,
         "context": null
diff --git a/tests/integration/recordings/responses/eee47930e3ae.json b/tests/integration/recordings/responses/eee47930e3ae.json
index 20ec83476..283416a09 100644
--- a/tests/integration/recordings/responses/eee47930e3ae.json
+++ b/tests/integration/recordings/responses/eee47930e3ae.json
@@ -22,7 +22,7 @@
         "__type__": "ollama._types.GenerateResponse",
         "__data__": {
           "model": "llama3.2:3b-instruct-fp16",
-          "created_at": "2025-08-01T23:14:23.842191Z",
+          "created_at": "2025-09-03T17:38:04.631107Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -40,7 +40,7 @@
         "__type__": "ollama._types.GenerateResponse",
         "__data__": {
           "model": "llama3.2:3b-instruct-fp16",
-          "created_at": "2025-08-01T23:14:23.903756Z",
+          "created_at": "2025-09-03T17:38:04.673105Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -58,7 +58,7 @@
         "__type__": "ollama._types.GenerateResponse",
         "__data__": {
           "model": "llama3.2:3b-instruct-fp16",
-          "created_at": "2025-08-01T23:14:23.962295Z",
+          "created_at": "2025-09-03T17:38:04.714459Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -76,7 +76,7 @@
         "__type__": "ollama._types.GenerateResponse",
         "__data__": {
           "model": "llama3.2:3b-instruct-fp16",
-          "created_at": "2025-08-01T23:14:24.019479Z",
+          "created_at": "2025-09-03T17:38:04.755882Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -94,7 +94,7 @@
         "__type__": "ollama._types.GenerateResponse",
         "__data__": {
           "model": "llama3.2:3b-instruct-fp16",
-          "created_at": "2025-08-01T23:14:24.076158Z",
+          "created_at": "2025-09-03T17:38:04.797494Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -112,7 +112,7 @@
         "__type__": "ollama._types.GenerateResponse",
         "__data__": {
           "model": "llama3.2:3b-instruct-fp16",
-          "created_at": "2025-08-01T23:14:24.142903Z",
+          "created_at": "2025-09-03T17:38:04.839382Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -130,7 +130,7 @@
         "__type__": "ollama._types.GenerateResponse",
         "__data__": {
           "model": "llama3.2:3b-instruct-fp16",
-          "created_at": "2025-08-01T23:14:24.202616Z",
+          "created_at": "2025-09-03T17:38:04.881062Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -148,7 +148,7 @@
         "__type__": "ollama._types.GenerateResponse",
         "__data__": {
           "model": "llama3.2:3b-instruct-fp16",
-          "created_at": "2025-08-01T23:14:24.25501Z",
+          "created_at": "2025-09-03T17:38:04.921976Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -166,7 +166,7 @@
         "__type__": "ollama._types.GenerateResponse",
         "__data__": {
           "model": "llama3.2:3b-instruct-fp16",
-          "created_at": "2025-08-01T23:14:24.308017Z",
+          "created_at": "2025-09-03T17:38:04.962922Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -184,7 +184,7 @@
         "__type__": "ollama._types.GenerateResponse",
         "__data__": {
           "model": "llama3.2:3b-instruct-fp16",
-          "created_at": "2025-08-01T23:14:24.360014Z",
+          "created_at": "2025-09-03T17:38:05.00411Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -202,7 +202,7 @@
         "__type__": "ollama._types.GenerateResponse",
         "__data__": {
           "model": "llama3.2:3b-instruct-fp16",
-          "created_at": "2025-08-01T23:14:24.413785Z",
+          "created_at": "2025-09-03T17:38:05.04532Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -220,7 +220,7 @@
         "__type__": "ollama._types.GenerateResponse",
         "__data__": {
           "model": "llama3.2:3b-instruct-fp16",
-          "created_at": "2025-08-01T23:14:24.466618Z",
+          "created_at": "2025-09-03T17:38:05.086979Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -238,7 +238,7 @@
         "__type__": "ollama._types.GenerateResponse",
         "__data__": {
           "model": "llama3.2:3b-instruct-fp16",
-          "created_at": "2025-08-01T23:14:24.519141Z",
+          "created_at": "2025-09-03T17:38:05.128195Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -256,7 +256,7 @@
         "__type__": "ollama._types.GenerateResponse",
         "__data__": {
           "model": "llama3.2:3b-instruct-fp16",
-          "created_at": "2025-08-01T23:14:24.572343Z",
+          "created_at": "2025-09-03T17:38:05.169221Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -274,7 +274,7 @@
         "__type__": "ollama._types.GenerateResponse",
         "__data__": {
           "model": "llama3.2:3b-instruct-fp16",
-          "created_at": "2025-08-01T23:14:24.626495Z",
+          "created_at": "2025-09-03T17:38:05.210938Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -292,7 +292,7 @@
         "__type__": "ollama._types.GenerateResponse",
         "__data__": {
           "model": "llama3.2:3b-instruct-fp16",
-          "created_at": "2025-08-01T23:14:24.683554Z",
+          "created_at": "2025-09-03T17:38:05.252232Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -310,7 +310,7 @@
         "__type__": "ollama._types.GenerateResponse",
         "__data__": {
           "model": "llama3.2:3b-instruct-fp16",
-          "created_at": "2025-08-01T23:14:24.736715Z",
+          "created_at": "2025-09-03T17:38:05.293529Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -328,7 +328,7 @@
         "__type__": "ollama._types.GenerateResponse",
         "__data__": {
           "model": "llama3.2:3b-instruct-fp16",
-          "created_at": "2025-08-01T23:14:24.789545Z",
+          "created_at": "2025-09-03T17:38:05.334965Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -346,15 +346,15 @@
         "__type__": "ollama._types.GenerateResponse",
         "__data__": {
           "model": "llama3.2:3b-instruct-fp16",
-          "created_at": "2025-08-01T23:14:24.842095Z",
+          "created_at": "2025-09-03T17:38:05.376741Z",
           "done": true,
           "done_reason": "stop",
-          "total_duration": 1141228125,
-          "load_duration": 38375333,
+          "total_duration": 936717042,
+          "load_duration": 109245542,
           "prompt_eval_count": 371,
-          "prompt_eval_duration": 99000000,
+          "prompt_eval_duration": 80430583,
           "eval_count": 19,
-          "eval_duration": 1002000000,
+          "eval_duration": 746422917,
           "response": "",
           "thinking": null,
           "context": null
diff --git a/tests/integration/recordings/responses/ef59cbff54d0.json b/tests/integration/recordings/responses/ef59cbff54d0.json
index e16cf605c..559930873 100644
--- a/tests/integration/recordings/responses/ef59cbff54d0.json
+++ b/tests/integration/recordings/responses/ef59cbff54d0.json
@@ -20,15 +20,15 @@
       "__type__": "ollama._types.GenerateResponse",
       "__data__": {
         "model": "llama-guard3:1b",
-        "created_at": "2025-08-01T23:12:54.110896Z",
+        "created_at": "2025-09-03T17:37:35.524155Z",
         "done": true,
         "done_reason": "stop",
-        "total_duration": 219323916,
-        "load_duration": 109411750,
+        "total_duration": 251173708,
+        "load_duration": 165988125,
         "prompt_eval_count": 213,
-        "prompt_eval_duration": 86000000,
+        "prompt_eval_duration": 73363375,
         "eval_count": 2,
-        "eval_duration": 22000000,
+        "eval_duration": 11249792,
         "response": "safe",
         "thinking": null,
         "context": null
diff --git a/tests/integration/recordings/responses/ef757a75ed08.json b/tests/integration/recordings/responses/ef757a75ed08.json
index b2d68f4d6..05860c4bb 100644
--- a/tests/integration/recordings/responses/ef757a75ed08.json
+++ b/tests/integration/recordings/responses/ef757a75ed08.json
@@ -21,7 +21,7 @@
         "__type__": "ollama._types.GenerateResponse",
         "__data__": {
           "model": "llama3.2:3b-instruct-fp16",
-          "created_at": "2025-07-29T23:46:35.212563Z",
+          "created_at": "2025-09-03T17:34:22.272912Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -39,7 +39,7 @@
         "__type__": "ollama._types.GenerateResponse",
         "__data__": {
           "model": "llama3.2:3b-instruct-fp16",
-          "created_at": "2025-07-29T23:46:35.254896Z",
+          "created_at": "2025-09-03T17:34:22.31501Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -57,7 +57,7 @@
         "__type__": "ollama._types.GenerateResponse",
         "__data__": {
           "model": "llama3.2:3b-instruct-fp16",
-          "created_at": "2025-07-29T23:46:35.297152Z",
+          "created_at": "2025-09-03T17:34:22.356888Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -75,7 +75,7 @@
         "__type__": "ollama._types.GenerateResponse",
         "__data__": {
           "model": "llama3.2:3b-instruct-fp16",
-          "created_at": "2025-07-29T23:46:35.339477Z",
+          "created_at": "2025-09-03T17:34:22.398576Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -93,7 +93,7 @@
         "__type__": "ollama._types.GenerateResponse",
         "__data__": {
           "model": "llama3.2:3b-instruct-fp16",
-          "created_at": "2025-07-29T23:46:35.382245Z",
+          "created_at": "2025-09-03T17:34:22.440412Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -111,7 +111,7 @@
         "__type__": "ollama._types.GenerateResponse",
         "__data__": {
           "model": "llama3.2:3b-instruct-fp16",
-          "created_at": "2025-07-29T23:46:35.423387Z",
+          "created_at": "2025-09-03T17:34:22.482165Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -129,7 +129,7 @@
         "__type__": "ollama._types.GenerateResponse",
         "__data__": {
           "model": "llama3.2:3b-instruct-fp16",
-          "created_at": "2025-07-29T23:46:35.465286Z",
+          "created_at": "2025-09-03T17:34:22.523773Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -147,7 +147,7 @@
         "__type__": "ollama._types.GenerateResponse",
         "__data__": {
           "model": "llama3.2:3b-instruct-fp16",
-          "created_at": "2025-07-29T23:46:35.507249Z",
+          "created_at": "2025-09-03T17:34:22.565072Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -165,15 +165,15 @@
         "__type__": "ollama._types.GenerateResponse",
         "__data__": {
           "model": "llama3.2:3b-instruct-fp16",
-          "created_at": "2025-07-29T23:46:35.549072Z",
+          "created_at": "2025-09-03T17:34:22.607117Z",
           "done": true,
           "done_reason": "stop",
-          "total_duration": 5519843458,
-          "load_duration": 4110366375,
+          "total_duration": 1386049708,
+          "load_duration": 96970583,
           "prompt_eval_count": 456,
-          "prompt_eval_duration": 1070783708,
+          "prompt_eval_duration": 952471625,
           "eval_count": 9,
-          "eval_duration": 337120750,
+          "eval_duration": 335924459,
           "response": "",
           "thinking": null,
           "context": null
diff --git a/tests/integration/recordings/vision/responses/f1592dee71e5.json b/tests/integration/recordings/responses/f1592dee71e5.json
similarity index 99%
rename from tests/integration/recordings/vision/responses/f1592dee71e5.json
rename to tests/integration/recordings/responses/f1592dee71e5.json
index a30aa460b..d95497ee2 100644
--- a/tests/integration/recordings/vision/responses/f1592dee71e5.json
+++ b/tests/integration/recordings/responses/f1592dee71e5.json
@@ -30,18 +30,18 @@
       "__type__": "ollama._types.ChatResponse",
       "__data__": {
         "model": "llama3.2-vision:11b",
-        "created_at": "2025-08-01T00:06:12.068973125Z",
+        "created_at": "2025-09-03T17:54:32.086616Z",
         "done": true,
         "done_reason": "stop",
-        "total_duration": 44793549354,
-        "load_duration": 51960915,
+        "total_duration": 3537246333,
+        "load_duration": 130547125,
         "prompt_eval_count": 18,
-        "prompt_eval_duration": 579363429,
-        "eval_count": 110,
-        "eval_duration": 44156162976,
+        "prompt_eval_duration": 140216250,
+        "eval_count": 56,
+        "eval_duration": 3262609875,
         "message": {
           "role": "assistant",
-          "content": "The image features a close-up of a golden retriever puppy, with its mouth open and tongue out, as if it is smiling or panting. The puppy's fur is a light golden color, and its ears are floppy and hanging down on either side of its head. The background of the image is blurred, but it appears to be a natural setting, possibly a field or a park, with a greenish-yellow color. The overall atmosphere of the image is one of happiness and playfulness, as the puppy seems to be enjoying itself.",
+          "content": "The image is of a golden retriever puppy. The puppy is looking directly at the camera with its mouth open and tongue out. The puppy is white with golden ears and a black nose. The background is out of focus, but it appears to be a grassy field.",
           "thinking": null,
           "images": null,
           "tool_calls": null
diff --git a/tests/integration/recordings/responses/f477c2fe1332.json b/tests/integration/recordings/responses/f477c2fe1332.json
index 2e29690ee..d3c8e7176 100644
--- a/tests/integration/recordings/responses/f477c2fe1332.json
+++ b/tests/integration/recordings/responses/f477c2fe1332.json
@@ -22,7 +22,7 @@
         "__type__": "ollama._types.GenerateResponse",
         "__data__": {
           "model": "llama3.2:3b-instruct-fp16",
-          "created_at": "2025-08-01T23:14:37.046199Z",
+          "created_at": "2025-09-03T17:42:31.583665Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -40,7 +40,7 @@
         "__type__": "ollama._types.GenerateResponse",
         "__data__": {
           "model": "llama3.2:3b-instruct-fp16",
-          "created_at": "2025-08-01T23:14:37.097228Z",
+          "created_at": "2025-09-03T17:42:31.625653Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -58,7 +58,7 @@
         "__type__": "ollama._types.GenerateResponse",
         "__data__": {
           "model": "llama3.2:3b-instruct-fp16",
-          "created_at": "2025-08-01T23:14:37.147575Z",
+          "created_at": "2025-09-03T17:42:31.667189Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -76,7 +76,7 @@
         "__type__": "ollama._types.GenerateResponse",
         "__data__": {
           "model": "llama3.2:3b-instruct-fp16",
-          "created_at": "2025-08-01T23:14:37.199038Z",
+          "created_at": "2025-09-03T17:42:31.708905Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -94,7 +94,7 @@
         "__type__": "ollama._types.GenerateResponse",
         "__data__": {
           "model": "llama3.2:3b-instruct-fp16",
-          "created_at": "2025-08-01T23:14:37.25106Z",
+          "created_at": "2025-09-03T17:42:31.751003Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -112,7 +112,7 @@
         "__type__": "ollama._types.GenerateResponse",
         "__data__": {
           "model": "llama3.2:3b-instruct-fp16",
-          "created_at": "2025-08-01T23:14:37.302712Z",
+          "created_at": "2025-09-03T17:42:31.792516Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -130,7 +130,7 @@
         "__type__": "ollama._types.GenerateResponse",
         "__data__": {
           "model": "llama3.2:3b-instruct-fp16",
-          "created_at": "2025-08-01T23:14:37.355658Z",
+          "created_at": "2025-09-03T17:42:31.834194Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -148,7 +148,7 @@
         "__type__": "ollama._types.GenerateResponse",
         "__data__": {
           "model": "llama3.2:3b-instruct-fp16",
-          "created_at": "2025-08-01T23:14:37.407436Z",
+          "created_at": "2025-09-03T17:42:31.878321Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -166,7 +166,7 @@
         "__type__": "ollama._types.GenerateResponse",
         "__data__": {
           "model": "llama3.2:3b-instruct-fp16",
-          "created_at": "2025-08-01T23:14:37.459062Z",
+          "created_at": "2025-09-03T17:42:31.921552Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -184,7 +184,7 @@
         "__type__": "ollama._types.GenerateResponse",
         "__data__": {
           "model": "llama3.2:3b-instruct-fp16",
-          "created_at": "2025-08-01T23:14:37.511804Z",
+          "created_at": "2025-09-03T17:42:31.963105Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -202,7 +202,7 @@
         "__type__": "ollama._types.GenerateResponse",
         "__data__": {
           "model": "llama3.2:3b-instruct-fp16",
-          "created_at": "2025-08-01T23:14:37.562406Z",
+          "created_at": "2025-09-03T17:42:32.005494Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -220,7 +220,7 @@
         "__type__": "ollama._types.GenerateResponse",
         "__data__": {
           "model": "llama3.2:3b-instruct-fp16",
-          "created_at": "2025-08-01T23:14:37.614648Z",
+          "created_at": "2025-09-03T17:42:32.047231Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -238,7 +238,7 @@
         "__type__": "ollama._types.GenerateResponse",
         "__data__": {
           "model": "llama3.2:3b-instruct-fp16",
-          "created_at": "2025-08-01T23:14:37.665414Z",
+          "created_at": "2025-09-03T17:42:32.089031Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -256,7 +256,7 @@
         "__type__": "ollama._types.GenerateResponse",
         "__data__": {
           "model": "llama3.2:3b-instruct-fp16",
-          "created_at": "2025-08-01T23:14:37.71826Z",
+          "created_at": "2025-09-03T17:42:32.130704Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -274,7 +274,7 @@
         "__type__": "ollama._types.GenerateResponse",
         "__data__": {
           "model": "llama3.2:3b-instruct-fp16",
-          "created_at": "2025-08-01T23:14:37.769822Z",
+          "created_at": "2025-09-03T17:42:32.172183Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -292,7 +292,7 @@
         "__type__": "ollama._types.GenerateResponse",
         "__data__": {
           "model": "llama3.2:3b-instruct-fp16",
-          "created_at": "2025-08-01T23:14:37.821049Z",
+          "created_at": "2025-09-03T17:42:32.21392Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -310,7 +310,7 @@
         "__type__": "ollama._types.GenerateResponse",
         "__data__": {
           "model": "llama3.2:3b-instruct-fp16",
-          "created_at": "2025-08-01T23:14:37.872903Z",
+          "created_at": "2025-09-03T17:42:32.255392Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -328,7 +328,7 @@
         "__type__": "ollama._types.GenerateResponse",
         "__data__": {
           "model": "llama3.2:3b-instruct-fp16",
-          "created_at": "2025-08-01T23:14:37.924976Z",
+          "created_at": "2025-09-03T17:42:32.297249Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -346,7 +346,7 @@
         "__type__": "ollama._types.GenerateResponse",
         "__data__": {
           "model": "llama3.2:3b-instruct-fp16",
-          "created_at": "2025-08-01T23:14:37.976776Z",
+          "created_at": "2025-09-03T17:42:32.341358Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -364,7 +364,7 @@
         "__type__": "ollama._types.GenerateResponse",
         "__data__": {
           "model": "llama3.2:3b-instruct-fp16",
-          "created_at": "2025-08-01T23:14:38.029285Z",
+          "created_at": "2025-09-03T17:42:32.384155Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -382,15 +382,15 @@
         "__type__": "ollama._types.GenerateResponse",
         "__data__": {
           "model": "llama3.2:3b-instruct-fp16",
-          "created_at": "2025-08-01T23:14:38.084154Z",
+          "created_at": "2025-09-03T17:42:32.426441Z",
           "done": true,
           "done_reason": "stop",
-          "total_duration": 1782717042,
-          "load_duration": 78612834,
+          "total_duration": 1659557917,
+          "load_duration": 75341875,
           "prompt_eval_count": 375,
-          "prompt_eval_duration": 658000000,
+          "prompt_eval_duration": 740178250,
           "eval_count": 21,
-          "eval_duration": 1044000000,
+          "eval_duration": 843394541,
           "response": "",
           "thinking": null,
           "context": null
diff --git a/tests/integration/recordings/responses/f6d655e91ac3.json b/tests/integration/recordings/responses/f6d655e91ac3.json
index 1dd1010b1..185fff181 100644
--- a/tests/integration/recordings/responses/f6d655e91ac3.json
+++ b/tests/integration/recordings/responses/f6d655e91ac3.json
@@ -20,390 +20,390 @@
         "data": [
           {
             "embedding": [
-              -0.034272887,
-              0.0900405,
-              -0.114585444,
-              0.0021513691,
-              0.059019327,
-              -0.02748151,
-              -0.020571338,
-              0.03373777,
-              -0.03872984,
-              0.026010917,
-              0.1147871,
-              0.027154561,
-              -0.015938662,
-              -0.02185328,
-              -0.046722047,
-              -0.04638079,
-              -0.07416656,
-              -0.052859545,
-              -0.028124748,
-              0.06325527,
-              0.029144203,
-              0.047097813,
-              -0.05268828,
-              -0.0053592497,
-              0.030669667,
-              0.01769888,
-              -0.01687185,
-              0.08683223,
-              -0.014155632,
-              -0.08387485,
-              0.019995376,
-              0.07114902,
-              0.08367812,
-              0.030923046,
-              0.11826658,
-              0.028755534,
-              0.06955482,
-              -0.017287154,
-              -0.005806163,
-              0.005812646,
-              0.0011825147,
-              -0.06533827,
-              0.037360404,
-              0.018541763,
-              -0.0034888012,
-              -0.0011040586,
-              -0.029778237,
-              -0.021269588,
-              0.005844319,
-              -0.035600223,
-              -0.037232384,
-              0.012353592,
-              -0.06692711,
-              -0.023162046,
-              0.05686014,
-              0.0014791423,
-              0.01440185,
-              -0.017189784,
-              0.009246685,
-              0.06083274,
-              0.024673132,
-              0.036989614,
-              -0.050630055,
-              0.051760096,
-              0.10160539,
-              0.008477512,
-              -0.048004184,
-              -0.013003718,
-              0.031101642,
-              -0.1659611,
-              -0.14100891,
-              0.009773047,
-              -0.025983926,
-              0.05229989,
-              -0.007893064,
-              0.0078570945,
-              -0.08468617,
-              -0.044539623,
-              0.054151334,
-              -0.07042244,
-              -0.05768138,
-              -0.10078619,
-              0.021822996,
-              0.022160508,
-              0.0072028935,
-              0.13064505,
-              0.08020654,
-              -0.0044225734,
-              -0.018743401,
-              0.0075993463,
-              -0.031649683,
-              0.031955328,
-              -0.022171712,
-              0.030735254,
-              -0.023809722,
-              0.0695489,
-              0.016647533,
-              0.0095261615,
-              0.027464647,
-              0.10212388,
-              0.02145324,
-              -0.021429047,
-              0.015128828,
-              0.039440226,
-              -0.09434037,
-              -0.11546961,
-              0.09468322,
-              -0.011139115,
-              0.072680146,
-              -0.03602365,
-              -0.011743472,
-              -0.066524595,
-              -0.034747,
-              -0.10301544,
-              0.030228501,
-              -0.06316883,
-              -0.090848505,
-              0.041170754,
-              -0.03368485,
-              0.045751248,
-              0.07133673,
-              -0.031778056,
-              -0.05968261,
-              -0.017208954,
-              -0.032287136,
-              -0.058584064,
-              0.0673487,
-              -5.023248e-33,
-              -0.005809502,
-              -0.071970925,
-              -0.00930889,
-              0.09656616,
-              0.037086118,
-              -0.034771495,
-              -0.00472216,
-              0.016682126,
-              -0.098648354,
-              0.005475455,
-              -0.014123589,
-              -0.08407786,
-              0.0027178645,
-              0.04443311,
-              -0.01269345,
-              0.034540884,
-              -0.0005944164,
-              0.06320702,
-              -0.026761396,
-              -0.013525239,
-              0.024135783,
-              0.015422592,
-              -0.04138039,
-              -0.05520989,
-              -0.06454275,
-              0.031492148,
-              -0.0072836457,
-              -0.039476894,
-              0.059850004,
-              0.026700241,
-              0.013972591,
-              -0.038822647,
-              -0.04851447,
-              0.017551823,
-              0.020952301,
-              0.03522171,
-              0.011540296,
-              -0.00842795,
-              -0.044636253,
-              0.014627958,
-              3.2639466e-05,
-              -0.046966836,
-              0.027031295,
-              0.006612757,
-              0.06439624,
-              -0.044763926,
-              -0.02612974,
-              -0.016271371,
-              0.055233188,
-              0.014105759,
-              -0.008459233,
-              0.04205111,
-              0.050489996,
-              0.021618336,
-              0.011294852,
-              0.0485963,
-              0.017674806,
-              -0.004992791,
-              0.00193088,
-              0.063277334,
-              0.035901506,
-              0.03502828,
-              -0.06643911,
-              0.008779193,
-              -0.027297689,
-              -0.059879173,
-              -0.027194038,
-              -0.087292045,
-              0.11242319,
-              0.05879699,
-              -0.041721053,
-              -0.069260724,
-              0.064383894,
-              0.015849635,
-              -0.027780458,
-              -0.03755858,
-              -0.011723025,
-              0.06948493,
-              -0.07109373,
-              -0.039075296,
-              -0.043134894,
-              -0.1120962,
-              -0.030726664,
-              -0.06376309,
-              -0.03524182,
-              -0.061186828,
-              -0.015275632,
-              -0.100939795,
-              0.047502656,
-              -0.08317205,
-              -0.0029857687,
-              0.013144553,
-              -0.056699008,
-              -0.05796209,
-              0.06137419,
-              2.7670645e-33,
-              0.003669078,
-              0.06695531,
-              -0.055944078,
-              0.025168538,
-              0.0147572905,
-              0.033805534,
-              0.0934766,
-              -0.010511114,
-              -0.046672594,
-              0.14254896,
-              -0.015461952,
-              0.0067206374,
-              0.07682516,
-              -0.045769565,
-              0.07989758,
-              0.0036198904,
-              0.023618277,
-              -0.06530977,
-              -0.04256109,
-              -0.025923597,
-              -0.07477869,
-              0.1001957,
-              0.1257842,
-              0.064083636,
-              -0.01666794,
-              0.014075608,
-              0.025267936,
-              0.0017376567,
-              -0.013351121,
-              0.0117214825,
-              0.037724674,
-              0.040572807,
-              -0.12054958,
-              0.024336847,
-              0.034385506,
-              -0.10165844,
-              0.11865242,
-              -0.035707537,
-              -0.012689929,
-              0.022641081,
-              0.039234713,
-              0.10621312,
-              0.010647405,
-              0.07653686,
-              0.020896297,
-              0.06464065,
-              0.08582743,
-              -0.03212417,
-              0.043577865,
-              0.01106648,
-              0.023217985,
-              -0.06711702,
-              0.05536062,
-              -0.008119422,
-              -0.0268995,
-              0.077022836,
-              -0.011600607,
-              0.04498788,
-              -0.024568135,
-              0.020904513,
-              -0.0016571331,
-              0.029054169,
-              -0.038968027,
-              -0.013624052,
-              -0.019825684,
-              -0.057037495,
-              -0.014532248,
-              0.010170884,
-              0.016871484,
-              0.012004644,
-              0.019911213,
-              0.019217802,
-              -0.06554125,
-              -0.050251007,
-              0.05082798,
-              -0.07560525,
-              -0.018781837,
-              -0.0122035425,
-              0.0019368301,
-              -0.00351373,
-              0.07000184,
-              -0.029289605,
-              -0.008412919,
-              0.04744267,
-              -0.00043944066,
-              -0.014024816,
-              -0.0035281784,
-              0.0844005,
-              -0.0015739133,
-              0.0016869568,
-              -0.023196274,
-              0.059908636,
-              0.019615034,
-              0.054351386,
-              0.012312578,
-              -1.5289404e-08,
-              -0.038118448,
-              -0.084228516,
-              -0.013602922,
-              -0.032792244,
-              -0.020994218,
-              0.08923806,
-              0.005445469,
-              -0.07045531,
-              -0.03966009,
-              -0.018226359,
-              0.05718637,
-              -0.026399894,
-              -0.098825626,
-              0.017524764,
-              -0.019498266,
-              -0.062369697,
-              -0.019561017,
-              -0.011198561,
-              -0.03005754,
-              0.010641676,
-              -0.005561297,
-              0.053242564,
-              0.04418294,
-              0.025771322,
-              0.005914542,
-              0.059626196,
-              0.06883921,
-              0.08894957,
-              -0.062240407,
-              -0.038899083,
-              0.028789395,
-              0.087763906,
-              0.017739464,
-              -0.050055157,
-              -0.0009801601,
-              0.1297665,
-              0.08312503,
-              0.08157199,
-              0.0117320195,
-              0.006869762,
-              -0.072692566,
-              -0.0019829427,
-              -0.018348025,
-              0.0088948505,
-              -0.038234424,
-              -0.09056964,
-              -0.06433111,
-              -0.042595394,
-              -0.030844258,
-              -0.09312696,
-              -0.043474108,
-              0.012029141,
-              -6.677036e-05,
-              0.040267132,
-              -0.049134284,
-              0.014589591,
-              0.017469455,
-              -0.005167336,
-              -0.03331327,
-              0.0075517776,
-              0.07486923,
-              0.0646153,
-              0.04480708,
-              -0.02847676
+              -0.03427073,
+              0.090051405,
+              -0.11458989,
+              0.0021456745,
+              0.059038658,
+              -0.027524853,
+              -0.020602634,
+              0.03373726,
+              -0.038729247,
+              0.026002944,
+              0.11481002,
+              0.027119067,
+              -0.015927644,
+              -0.021832926,
+              -0.046713773,
+              -0.0463825,
+              -0.074167565,
+              -0.0528447,
+              -0.028117927,
+              0.06325688,
+              0.029135453,
+              0.047131006,
+              -0.052675154,
+              -0.005349263,
+              0.030659368,
+              0.017706472,
+              -0.01687267,
+              0.08681507,
+              -0.014155131,
+              -0.0838676,
+              0.020020565,
+              0.07115838,
+              0.08365558,
+              0.030919788,
+              0.11829893,
+              0.028751066,
+              0.069536895,
+              -0.017295403,
+              -0.005784813,
+              0.005809313,
+              0.0012009157,
+              -0.0653044,
+              0.0373506,
+              0.018565746,
+              -0.0034945607,
+              -0.0011305016,
+              -0.029752811,
+              -0.021266408,
+              0.0058016903,
+              -0.035597492,
+              -0.03722647,
+              0.012373253,
+              -0.066935256,
+              -0.023148224,
+              0.056864377,
+              0.0014741909,
+              0.014408296,
+              -0.017165763,
+              0.009236472,
+              0.06087921,
+              0.024628488,
+              0.03699286,
+              -0.050610077,
+              0.05173448,
+              0.10159555,
+              0.008507267,
+              -0.04803921,
+              -0.013024803,
+              0.03110457,
+              -0.16593884,
+              -0.1410075,
+              0.009813814,
+              -0.025974236,
+              0.05233053,
+              -0.0078903325,
+              0.00788491,
+              -0.08471812,
+              -0.044507448,
+              0.054161046,
+              -0.0704361,
+              -0.05769206,
+              -0.100796975,
+              0.02182441,
+              0.022125391,
+              0.0071617346,
+              0.13063926,
+              0.080232956,
+              -0.004421626,
+              -0.018768508,
+              0.0076132733,
+              -0.03163366,
+              0.031986494,
+              -0.022168567,
+              0.03073627,
+              -0.023798423,
+              0.06954045,
+              0.016659362,
+              0.009536805,
+              0.027459558,
+              0.102133445,
+              0.021457382,
+              -0.021377807,
+              0.015131543,
+              0.039423607,
+              -0.09434147,
+              -0.11544392,
+              0.09468138,
+              -0.011155598,
+              0.07266597,
+              -0.03601087,
+              -0.011743829,
+              -0.06654009,
+              -0.03470551,
+              -0.10300434,
+              0.03020924,
+              -0.06319472,
+              -0.0908424,
+              0.04116676,
+              -0.033686537,
+              0.045706224,
+              0.07134009,
+              -0.031778418,
+              -0.059655976,
+              -0.017215038,
+              -0.03229557,
+              -0.058579948,
+              0.06733934,
+              -5.023814e-33,
+              -0.0058283503,
+              -0.0719842,
+              -0.009296622,
+              0.09659216,
+              0.03709538,
+              -0.03478395,
+              -0.004713233,
+              0.016686605,
+              -0.09859812,
+              0.00547005,
+              -0.014113569,
+              -0.0840751,
+              0.0027168505,
+              0.04445616,
+              -0.012728728,
+              0.034566686,
+              -0.0006014651,
+              0.06319148,
+              -0.026799418,
+              -0.013500979,
+              0.024169419,
+              0.015417236,
+              -0.04135526,
+              -0.055208974,
+              -0.06455241,
+              0.03148543,
+              -0.0073052812,
+              -0.03945437,
+              0.059831504,
+              0.026674163,
+              0.01396753,
+              -0.038841277,
+              -0.048514687,
+              0.01756627,
+              0.020964677,
+              0.035239976,
+              0.0115498835,
+              -0.00846713,
+              -0.044673763,
+              0.014640657,
+              5.2045852e-05,
+              -0.04694704,
+              0.02703366,
+              0.006635295,
+              0.064396136,
+              -0.044757996,
+              -0.026173549,
+              -0.016282372,
+              0.05521396,
+              0.014104745,
+              -0.008479494,
+              0.04204778,
+              0.05049772,
+              0.021629427,
+              0.011260506,
+              0.04858872,
+              0.017662494,
+              -0.005005865,
+              0.0019118759,
+              0.06333162,
+              0.035875723,
+              0.03504778,
+              -0.06642375,
+              0.008791644,
+              -0.027326671,
+              -0.05987137,
+              -0.0272001,
+              -0.08728625,
+              0.112434424,
+              0.05879801,
+              -0.041698616,
+              -0.06924583,
+              0.06434144,
+              0.01583225,
+              -0.027750073,
+              -0.037574448,
+              -0.011715211,
+              0.0694801,
+              -0.07104981,
+              -0.039085716,
+              -0.043068763,
+              -0.11208956,
+              -0.030723054,
+              -0.063793585,
+              -0.03527373,
+              -0.06119042,
+              -0.01526633,
+              -0.10094421,
+              0.047486804,
+              -0.08320468,
+              -0.0029513796,
+              0.0131224785,
+              -0.056690685,
+              -0.057956036,
+              0.06140136,
+              2.7669969e-33,
+              0.0036719525,
+              0.06695694,
+              -0.05591421,
+              0.025166295,
+              0.014735592,
+              0.03381445,
+              0.09345791,
+              -0.01053347,
+              -0.046693947,
+              0.14254177,
+              -0.015430197,
+              0.0066938214,
+              0.07679359,
+              -0.045779705,
+              0.07989786,
+              0.0036165903,
+              0.023604553,
+              -0.06533708,
+              -0.04253485,
+              -0.025912313,
+              -0.0748119,
+              0.10020777,
+              0.12578633,
+              0.06409652,
+              -0.016682886,
+              0.01406972,
+              0.025274348,
+              0.0017218525,
+              -0.013340701,
+              0.01172295,
+              0.03772902,
+              0.040607873,
+              -0.120578945,
+              0.024344057,
+              0.03439985,
+              -0.10167353,
+              0.11863072,
+              -0.03571693,
+              -0.0126576,
+              0.022622129,
+              0.039235484,
+              0.10625315,
+              0.0106492825,
+              0.076503076,
+              0.02088746,
+              0.06468519,
+              0.08582322,
+              -0.032148413,
+              0.04359905,
+              0.011070053,
+              0.023209164,
+              -0.06709916,
+              0.055355705,
+              -0.008128262,
+              -0.026921155,
+              0.076995976,
+              -0.011614669,
+              0.044967294,
+              -0.02459807,
+              0.020910041,
+              -0.0016746842,
+              0.02905443,
+              -0.03898753,
+              -0.01360213,
+              -0.019878393,
+              -0.057056017,
+              -0.014543598,
+              0.010161744,
+              0.016893594,
+              0.011981163,
+              0.019902436,
+              0.019194229,
+              -0.06551642,
+              -0.050247267,
+              0.050837662,
+              -0.075614415,
+              -0.018767305,
+              -0.012229684,
+              0.0019464786,
+              -0.0035209567,
+              0.0699799,
+              -0.02925182,
+              -0.008455151,
+              0.04742619,
+              -0.0004527954,
+              -0.014011262,
+              -0.0035493495,
+              0.08439228,
+              -0.001586065,
+              0.0016962147,
+              -0.023180604,
+              0.059889086,
+              0.019616995,
+              0.05435093,
+              0.012301163,
+              -1.5289881e-08,
+              -0.038103975,
+              -0.084179275,
+              -0.013605872,
+              -0.03277629,
+              -0.020995136,
+              0.08924277,
+              0.005438667,
+              -0.07047066,
+              -0.03966912,
+              -0.018226335,
+              0.05716885,
+              -0.026391266,
+              -0.09881308,
+              0.017511,
+              -0.01952465,
+              -0.06237397,
+              -0.019553065,
+              -0.0112019945,
+              -0.030052405,
+              0.010624359,
+              -0.005598304,
+              0.05326868,
+              0.044162616,
+              0.025812192,
+              0.0059228353,
+              0.059632093,
+              0.06885661,
+              0.08894283,
+              -0.06225795,
+              -0.038893122,
+              0.028817136,
+              0.08772772,
+              0.017759481,
+              -0.050048865,
+              -0.0009810333,
+              0.1297453,
+              0.083138496,
+              0.08161095,
+              0.011747931,
+              0.006871316,
+              -0.07277484,
+              -0.0020051182,
+              -0.018357608,
+              0.008882652,
+              -0.03823878,
+              -0.09057624,
+              -0.06433315,
+              -0.04256367,
+              -0.030856675,
+              -0.09314087,
+              -0.043470908,
+              0.012043298,
+              -9.8401986e-05,
+              0.040246293,
+              -0.04912119,
+              0.014575804,
+              0.017479645,
+              -0.00515073,
+              -0.033331197,
+              0.0075505474,
+              0.07488009,
+              0.06460031,
+              0.044803377,
+              -0.028485151
             ],
             "index": 0,
             "object": "embedding"
diff --git a/tests/integration/recordings/responses/f70f30f54211.json b/tests/integration/recordings/responses/f70f30f54211.json
index e0ea9c016..c4dd90e68 100644
--- a/tests/integration/recordings/responses/f70f30f54211.json
+++ b/tests/integration/recordings/responses/f70f30f54211.json
@@ -1,7 +1,7 @@
 {
   "request": {
     "method": "POST",
-    "url": "http://localhost:11434/v1/v1/chat/completions",
+    "url": "http://0.0.0.0:11434/v1/v1/chat/completions",
     "headers": {},
     "body": {
       "model": "llama3.2:3b-instruct-fp16",
@@ -38,7 +38,7 @@
     "body": {
       "__type__": "openai.types.chat.chat_completion.ChatCompletion",
       "__data__": {
-        "id": "chatcmpl-549",
+        "id": "chatcmpl-10",
         "choices": [
           {
             "finish_reason": "tool_calls",
@@ -53,7 +53,7 @@
               "function_call": null,
               "tool_calls": [
                 {
-                  "id": "call_ybj7t2qt",
+                  "id": "call_7cm57k1b",
                   "function": {
                     "arguments": "{\"city\":\"Tokyo\"}",
                     "name": "get_weather"
@@ -65,7 +65,7 @@
             }
           }
         ],
-        "created": 1754081857,
+        "created": 1756921368,
         "model": "llama3.2:3b-instruct-fp16",
         "object": "chat.completion",
         "service_tier": null,
diff --git a/tests/integration/recordings/responses/fcdef245da95.json b/tests/integration/recordings/responses/fcdef245da95.json
index 04606b914..d2801b9c6 100644
--- a/tests/integration/recordings/responses/fcdef245da95.json
+++ b/tests/integration/recordings/responses/fcdef245da95.json
@@ -20,15 +20,15 @@
       "__type__": "ollama._types.GenerateResponse",
       "__data__": {
         "model": "llama-guard3:1b",
-        "created_at": "2025-08-01T23:13:55.309172Z",
+        "created_at": "2025-09-03T17:37:44.986629Z",
         "done": true,
         "done_reason": "stop",
-        "total_duration": 2252068541,
-        "load_duration": 240932958,
+        "total_duration": 285693167,
+        "load_duration": 110888542,
         "prompt_eval_count": 212,
-        "prompt_eval_duration": 1979000000,
+        "prompt_eval_duration": 163158250,
         "eval_count": 2,
-        "eval_duration": 25000000,
+        "eval_duration": 11080125,
         "response": "safe",
         "thinking": null,
         "context": null
diff --git a/tests/integration/recordings/vision/responses/ff7db0102b28.json b/tests/integration/recordings/responses/ff7db0102b28.json
similarity index 98%
rename from tests/integration/recordings/vision/responses/ff7db0102b28.json
rename to tests/integration/recordings/responses/ff7db0102b28.json
index 160e0a607..f1866d1f4 100644
--- a/tests/integration/recordings/vision/responses/ff7db0102b28.json
+++ b/tests/integration/recordings/responses/ff7db0102b28.json
@@ -31,7 +31,7 @@
         "__type__": "ollama._types.ChatResponse",
         "__data__": {
           "model": "llama3.2-vision:11b",
-          "created_at": "2025-08-01T00:04:49.339347876Z",
+          "created_at": "2025-09-03T17:54:22.358461Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -53,7 +53,7 @@
         "__type__": "ollama._types.ChatResponse",
         "__data__": {
           "model": "llama3.2-vision:11b",
-          "created_at": "2025-08-01T00:04:49.747466769Z",
+          "created_at": "2025-09-03T17:54:22.416981Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -75,7 +75,7 @@
         "__type__": "ollama._types.ChatResponse",
         "__data__": {
           "model": "llama3.2-vision:11b",
-          "created_at": "2025-08-01T00:04:50.156146804Z",
+          "created_at": "2025-09-03T17:54:22.477481Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -97,7 +97,7 @@
         "__type__": "ollama._types.ChatResponse",
         "__data__": {
           "model": "llama3.2-vision:11b",
-          "created_at": "2025-08-01T00:04:50.566195243Z",
+          "created_at": "2025-09-03T17:54:22.53807Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -119,7 +119,7 @@
         "__type__": "ollama._types.ChatResponse",
         "__data__": {
           "model": "llama3.2-vision:11b",
-          "created_at": "2025-08-01T00:04:50.975121211Z",
+          "created_at": "2025-09-03T17:54:22.59701Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -141,7 +141,7 @@
         "__type__": "ollama._types.ChatResponse",
         "__data__": {
           "model": "llama3.2-vision:11b",
-          "created_at": "2025-08-01T00:04:51.388779549Z",
+          "created_at": "2025-09-03T17:54:22.655848Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -163,7 +163,7 @@
         "__type__": "ollama._types.ChatResponse",
         "__data__": {
           "model": "llama3.2-vision:11b",
-          "created_at": "2025-08-01T00:04:51.79897453Z",
+          "created_at": "2025-09-03T17:54:22.715363Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -185,7 +185,7 @@
         "__type__": "ollama._types.ChatResponse",
         "__data__": {
           "model": "llama3.2-vision:11b",
-          "created_at": "2025-08-01T00:04:52.209608504Z",
+          "created_at": "2025-09-03T17:54:22.773865Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -207,7 +207,7 @@
         "__type__": "ollama._types.ChatResponse",
         "__data__": {
           "model": "llama3.2-vision:11b",
-          "created_at": "2025-08-01T00:04:52.619045995Z",
+          "created_at": "2025-09-03T17:54:22.832338Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -229,7 +229,7 @@
         "__type__": "ollama._types.ChatResponse",
         "__data__": {
           "model": "llama3.2-vision:11b",
-          "created_at": "2025-08-01T00:04:53.026501007Z",
+          "created_at": "2025-09-03T17:54:22.890824Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -251,7 +251,7 @@
         "__type__": "ollama._types.ChatResponse",
         "__data__": {
           "model": "llama3.2-vision:11b",
-          "created_at": "2025-08-01T00:04:53.436015071Z",
+          "created_at": "2025-09-03T17:54:22.949237Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -273,7 +273,7 @@
         "__type__": "ollama._types.ChatResponse",
         "__data__": {
           "model": "llama3.2-vision:11b",
-          "created_at": "2025-08-01T00:04:53.843369446Z",
+          "created_at": "2025-09-03T17:54:23.008374Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -295,7 +295,7 @@
         "__type__": "ollama._types.ChatResponse",
         "__data__": {
           "model": "llama3.2-vision:11b",
-          "created_at": "2025-08-01T00:04:54.255794451Z",
+          "created_at": "2025-09-03T17:54:23.066921Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -317,7 +317,7 @@
         "__type__": "ollama._types.ChatResponse",
         "__data__": {
           "model": "llama3.2-vision:11b",
-          "created_at": "2025-08-01T00:04:54.663263793Z",
+          "created_at": "2025-09-03T17:54:23.125544Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -339,7 +339,7 @@
         "__type__": "ollama._types.ChatResponse",
         "__data__": {
           "model": "llama3.2-vision:11b",
-          "created_at": "2025-08-01T00:04:55.073162133Z",
+          "created_at": "2025-09-03T17:54:23.184923Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -361,7 +361,7 @@
         "__type__": "ollama._types.ChatResponse",
         "__data__": {
           "model": "llama3.2-vision:11b",
-          "created_at": "2025-08-01T00:04:55.48667439Z",
+          "created_at": "2025-09-03T17:54:23.244278Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -383,7 +383,7 @@
         "__type__": "ollama._types.ChatResponse",
         "__data__": {
           "model": "llama3.2-vision:11b",
-          "created_at": "2025-08-01T00:04:55.897947147Z",
+          "created_at": "2025-09-03T17:54:23.303383Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -405,7 +405,7 @@
         "__type__": "ollama._types.ChatResponse",
         "__data__": {
           "model": "llama3.2-vision:11b",
-          "created_at": "2025-08-01T00:04:56.31639321Z",
+          "created_at": "2025-09-03T17:54:23.36246Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -427,7 +427,7 @@
         "__type__": "ollama._types.ChatResponse",
         "__data__": {
           "model": "llama3.2-vision:11b",
-          "created_at": "2025-08-01T00:04:56.729288843Z",
+          "created_at": "2025-09-03T17:54:23.421703Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -449,7 +449,7 @@
         "__type__": "ollama._types.ChatResponse",
         "__data__": {
           "model": "llama3.2-vision:11b",
-          "created_at": "2025-08-01T00:04:57.142647132Z",
+          "created_at": "2025-09-03T17:54:23.481027Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -471,7 +471,7 @@
         "__type__": "ollama._types.ChatResponse",
         "__data__": {
           "model": "llama3.2-vision:11b",
-          "created_at": "2025-08-01T00:04:57.55091814Z",
+          "created_at": "2025-09-03T17:54:23.540282Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -493,7 +493,7 @@
         "__type__": "ollama._types.ChatResponse",
         "__data__": {
           "model": "llama3.2-vision:11b",
-          "created_at": "2025-08-01T00:04:57.959494633Z",
+          "created_at": "2025-09-03T17:54:23.59938Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -515,7 +515,7 @@
         "__type__": "ollama._types.ChatResponse",
         "__data__": {
           "model": "llama3.2-vision:11b",
-          "created_at": "2025-08-01T00:04:58.367117419Z",
+          "created_at": "2025-09-03T17:54:23.658742Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -537,7 +537,7 @@
         "__type__": "ollama._types.ChatResponse",
         "__data__": {
           "model": "llama3.2-vision:11b",
-          "created_at": "2025-08-01T00:04:58.77560425Z",
+          "created_at": "2025-09-03T17:54:23.718569Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -559,7 +559,7 @@
         "__type__": "ollama._types.ChatResponse",
         "__data__": {
           "model": "llama3.2-vision:11b",
-          "created_at": "2025-08-01T00:04:59.183890868Z",
+          "created_at": "2025-09-03T17:54:23.777758Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -581,51 +581,7 @@
         "__type__": "ollama._types.ChatResponse",
         "__data__": {
           "model": "llama3.2-vision:11b",
-          "created_at": "2025-08-01T00:04:59.596163097Z",
-          "done": false,
-          "done_reason": null,
-          "total_duration": null,
-          "load_duration": null,
-          "prompt_eval_count": null,
-          "prompt_eval_duration": null,
-          "eval_count": null,
-          "eval_duration": null,
-          "message": {
-            "role": "assistant",
-            "content": " smiling",
-            "thinking": null,
-            "images": null,
-            "tool_calls": null
-          }
-        }
-      },
-      {
-        "__type__": "ollama._types.ChatResponse",
-        "__data__": {
-          "model": "llama3.2-vision:11b",
-          "created_at": "2025-08-01T00:05:00.004002773Z",
-          "done": false,
-          "done_reason": null,
-          "total_duration": null,
-          "load_duration": null,
-          "prompt_eval_count": null,
-          "prompt_eval_duration": null,
-          "eval_count": null,
-          "eval_duration": null,
-          "message": {
-            "role": "assistant",
-            "content": " or",
-            "thinking": null,
-            "images": null,
-            "tool_calls": null
-          }
-        }
-      },
-      {
-        "__type__": "ollama._types.ChatResponse",
-        "__data__": {
-          "model": "llama3.2-vision:11b",
-          "created_at": "2025-08-01T00:05:00.410717383Z",
+          "created_at": "2025-09-03T17:54:23.836924Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -647,7 +603,7 @@
         "__type__": "ollama._types.ChatResponse",
         "__data__": {
           "model": "llama3.2-vision:11b",
-          "created_at": "2025-08-01T00:05:00.817783323Z",
+          "created_at": "2025-09-03T17:54:23.896332Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -669,7 +625,73 @@
         "__type__": "ollama._types.ChatResponse",
         "__data__": {
           "model": "llama3.2-vision:11b",
-          "created_at": "2025-08-01T00:05:01.223523865Z",
+          "created_at": "2025-09-03T17:54:23.955491Z",
+          "done": false,
+          "done_reason": null,
+          "total_duration": null,
+          "load_duration": null,
+          "prompt_eval_count": null,
+          "prompt_eval_duration": null,
+          "eval_count": null,
+          "eval_duration": null,
+          "message": {
+            "role": "assistant",
+            "content": " or",
+            "thinking": null,
+            "images": null,
+            "tool_calls": null
+          }
+        }
+      },
+      {
+        "__type__": "ollama._types.ChatResponse",
+        "__data__": {
+          "model": "llama3.2-vision:11b",
+          "created_at": "2025-09-03T17:54:24.014861Z",
+          "done": false,
+          "done_reason": null,
+          "total_duration": null,
+          "load_duration": null,
+          "prompt_eval_count": null,
+          "prompt_eval_duration": null,
+          "eval_count": null,
+          "eval_duration": null,
+          "message": {
+            "role": "assistant",
+            "content": " b",
+            "thinking": null,
+            "images": null,
+            "tool_calls": null
+          }
+        }
+      },
+      {
+        "__type__": "ollama._types.ChatResponse",
+        "__data__": {
+          "model": "llama3.2-vision:11b",
+          "created_at": "2025-09-03T17:54:24.074933Z",
+          "done": false,
+          "done_reason": null,
+          "total_duration": null,
+          "load_duration": null,
+          "prompt_eval_count": null,
+          "prompt_eval_duration": null,
+          "eval_count": null,
+          "eval_duration": null,
+          "message": {
+            "role": "assistant",
+            "content": "arking",
+            "thinking": null,
+            "images": null,
+            "tool_calls": null
+          }
+        }
+      },
+      {
+        "__type__": "ollama._types.ChatResponse",
+        "__data__": {
+          "model": "llama3.2-vision:11b",
+          "created_at": "2025-09-03T17:54:24.133301Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -691,7 +713,7 @@
         "__type__": "ollama._types.ChatResponse",
         "__data__": {
           "model": "llama3.2-vision:11b",
-          "created_at": "2025-08-01T00:05:01.63351174Z",
+          "created_at": "2025-09-03T17:54:24.192664Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -713,7 +735,7 @@
         "__type__": "ollama._types.ChatResponse",
         "__data__": {
           "model": "llama3.2-vision:11b",
-          "created_at": "2025-08-01T00:05:02.032702205Z",
+          "created_at": "2025-09-03T17:54:24.251448Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -735,7 +757,7 @@
         "__type__": "ollama._types.ChatResponse",
         "__data__": {
           "model": "llama3.2-vision:11b",
-          "created_at": "2025-08-01T00:05:02.424431407Z",
+          "created_at": "2025-09-03T17:54:24.310083Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -757,7 +779,7 @@
         "__type__": "ollama._types.ChatResponse",
         "__data__": {
           "model": "llama3.2-vision:11b",
-          "created_at": "2025-08-01T00:05:02.81524835Z",
+          "created_at": "2025-09-03T17:54:24.369218Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -779,7 +801,7 @@
         "__type__": "ollama._types.ChatResponse",
         "__data__": {
           "model": "llama3.2-vision:11b",
-          "created_at": "2025-08-01T00:05:03.207597567Z",
+          "created_at": "2025-09-03T17:54:24.42843Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -801,7 +823,7 @@
         "__type__": "ollama._types.ChatResponse",
         "__data__": {
           "model": "llama3.2-vision:11b",
-          "created_at": "2025-08-01T00:05:03.614094549Z",
+          "created_at": "2025-09-03T17:54:24.487403Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -823,7 +845,7 @@
         "__type__": "ollama._types.ChatResponse",
         "__data__": {
           "model": "llama3.2-vision:11b",
-          "created_at": "2025-08-01T00:05:04.008232462Z",
+          "created_at": "2025-09-03T17:54:24.547118Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -845,7 +867,7 @@
         "__type__": "ollama._types.ChatResponse",
         "__data__": {
           "model": "llama3.2-vision:11b",
-          "created_at": "2025-08-01T00:05:04.411085956Z",
+          "created_at": "2025-09-03T17:54:24.606557Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -867,7 +889,7 @@
         "__type__": "ollama._types.ChatResponse",
         "__data__": {
           "model": "llama3.2-vision:11b",
-          "created_at": "2025-08-01T00:05:04.80616608Z",
+          "created_at": "2025-09-03T17:54:24.665594Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -889,7 +911,7 @@
         "__type__": "ollama._types.ChatResponse",
         "__data__": {
           "model": "llama3.2-vision:11b",
-          "created_at": "2025-08-01T00:05:05.212911563Z",
+          "created_at": "2025-09-03T17:54:24.725305Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -911,7 +933,7 @@
         "__type__": "ollama._types.ChatResponse",
         "__data__": {
           "model": "llama3.2-vision:11b",
-          "created_at": "2025-08-01T00:05:05.599645826Z",
+          "created_at": "2025-09-03T17:54:24.784482Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -933,7 +955,7 @@
         "__type__": "ollama._types.ChatResponse",
         "__data__": {
           "model": "llama3.2-vision:11b",
-          "created_at": "2025-08-01T00:05:05.998590959Z",
+          "created_at": "2025-09-03T17:54:24.843771Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -955,7 +977,7 @@
         "__type__": "ollama._types.ChatResponse",
         "__data__": {
           "model": "llama3.2-vision:11b",
-          "created_at": "2025-08-01T00:05:06.398745325Z",
+          "created_at": "2025-09-03T17:54:24.903031Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -966,7 +988,7 @@
           "eval_duration": null,
           "message": {
             "role": "assistant",
-            "content": " ears",
+            "content": " eyes",
             "thinking": null,
             "images": null,
             "tool_calls": null
@@ -977,7 +999,7 @@
         "__type__": "ollama._types.ChatResponse",
         "__data__": {
           "model": "llama3.2-vision:11b",
-          "created_at": "2025-08-01T00:05:06.790505624Z",
+          "created_at": "2025-09-03T17:54:24.962328Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -999,7 +1021,7 @@
         "__type__": "ollama._types.ChatResponse",
         "__data__": {
           "model": "llama3.2-vision:11b",
-          "created_at": "2025-08-01T00:05:07.199713609Z",
+          "created_at": "2025-09-03T17:54:25.022265Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -1010,7 +1032,7 @@
           "eval_duration": null,
           "message": {
             "role": "assistant",
-            "content": " long",
+            "content": " dark",
             "thinking": null,
             "images": null,
             "tool_calls": null
@@ -1021,7 +1043,7 @@
         "__type__": "ollama._types.ChatResponse",
         "__data__": {
           "model": "llama3.2-vision:11b",
-          "created_at": "2025-08-01T00:05:07.596500603Z",
+          "created_at": "2025-09-03T17:54:25.081666Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -1032,7 +1054,7 @@
           "eval_duration": null,
           "message": {
             "role": "assistant",
-            "content": " and",
+            "content": " brown",
             "thinking": null,
             "images": null,
             "tool_calls": null
@@ -1043,29 +1065,7 @@
         "__type__": "ollama._types.ChatResponse",
         "__data__": {
           "model": "llama3.2-vision:11b",
-          "created_at": "2025-08-01T00:05:07.997793386Z",
-          "done": false,
-          "done_reason": null,
-          "total_duration": null,
-          "load_duration": null,
-          "prompt_eval_count": null,
-          "prompt_eval_duration": null,
-          "eval_count": null,
-          "eval_duration": null,
-          "message": {
-            "role": "assistant",
-            "content": " floppy",
-            "thinking": null,
-            "images": null,
-            "tool_calls": null
-          }
-        }
-      },
-      {
-        "__type__": "ollama._types.ChatResponse",
-        "__data__": {
-          "model": "llama3.2-vision:11b",
-          "created_at": "2025-08-01T00:05:08.381509773Z",
+          "created_at": "2025-09-03T17:54:25.140962Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -1087,7 +1087,7 @@
         "__type__": "ollama._types.ChatResponse",
         "__data__": {
           "model": "llama3.2-vision:11b",
-          "created_at": "2025-08-01T00:05:08.76579698Z",
+          "created_at": "2025-09-03T17:54:25.200015Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -1109,7 +1109,7 @@
         "__type__": "ollama._types.ChatResponse",
         "__data__": {
           "model": "llama3.2-vision:11b",
-          "created_at": "2025-08-01T00:05:09.159673897Z",
+          "created_at": "2025-09-03T17:54:25.259212Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -1131,7 +1131,7 @@
         "__type__": "ollama._types.ChatResponse",
         "__data__": {
           "model": "llama3.2-vision:11b",
-          "created_at": "2025-08-01T00:05:09.557596611Z",
+          "created_at": "2025-09-03T17:54:25.318509Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -1153,7 +1153,7 @@
         "__type__": "ollama._types.ChatResponse",
         "__data__": {
           "model": "llama3.2-vision:11b",
-          "created_at": "2025-08-01T00:05:09.950543555Z",
+          "created_at": "2025-09-03T17:54:25.377923Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -1175,7 +1175,7 @@
         "__type__": "ollama._types.ChatResponse",
         "__data__": {
           "model": "llama3.2-vision:11b",
-          "created_at": "2025-08-01T00:05:10.351722165Z",
+          "created_at": "2025-09-03T17:54:25.436963Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -1197,7 +1197,7 @@
         "__type__": "ollama._types.ChatResponse",
         "__data__": {
           "model": "llama3.2-vision:11b",
-          "created_at": "2025-08-01T00:05:10.752622361Z",
+          "created_at": "2025-09-03T17:54:25.4958Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -1219,7 +1219,7 @@
         "__type__": "ollama._types.ChatResponse",
         "__data__": {
           "model": "llama3.2-vision:11b",
-          "created_at": "2025-08-01T00:05:11.15541961Z",
+          "created_at": "2025-09-03T17:54:25.554502Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -1241,7 +1241,7 @@
         "__type__": "ollama._types.ChatResponse",
         "__data__": {
           "model": "llama3.2-vision:11b",
-          "created_at": "2025-08-01T00:05:11.549741697Z",
+          "created_at": "2025-09-03T17:54:25.613841Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -1263,7 +1263,7 @@
         "__type__": "ollama._types.ChatResponse",
         "__data__": {
           "model": "llama3.2-vision:11b",
-          "created_at": "2025-08-01T00:05:11.935619908Z",
+          "created_at": "2025-09-03T17:54:25.673643Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -1285,7 +1285,7 @@
         "__type__": "ollama._types.ChatResponse",
         "__data__": {
           "model": "llama3.2-vision:11b",
-          "created_at": "2025-08-01T00:05:12.343367145Z",
+          "created_at": "2025-09-03T17:54:25.733099Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -1307,7 +1307,7 @@
         "__type__": "ollama._types.ChatResponse",
         "__data__": {
           "model": "llama3.2-vision:11b",
-          "created_at": "2025-08-01T00:05:12.745897023Z",
+          "created_at": "2025-09-03T17:54:25.792667Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -1329,7 +1329,7 @@
         "__type__": "ollama._types.ChatResponse",
         "__data__": {
           "model": "llama3.2-vision:11b",
-          "created_at": "2025-08-01T00:05:13.148396264Z",
+          "created_at": "2025-09-03T17:54:25.853133Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -1351,7 +1351,7 @@
         "__type__": "ollama._types.ChatResponse",
         "__data__": {
           "model": "llama3.2-vision:11b",
-          "created_at": "2025-08-01T00:05:13.549096782Z",
+          "created_at": "2025-09-03T17:54:25.912402Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -1373,7 +1373,7 @@
         "__type__": "ollama._types.ChatResponse",
         "__data__": {
           "model": "llama3.2-vision:11b",
-          "created_at": "2025-08-01T00:05:13.945126876Z",
+          "created_at": "2025-09-03T17:54:25.971501Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -1395,7 +1395,7 @@
         "__type__": "ollama._types.ChatResponse",
         "__data__": {
           "model": "llama3.2-vision:11b",
-          "created_at": "2025-08-01T00:05:14.351732762Z",
+          "created_at": "2025-09-03T17:54:26.031043Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -1417,7 +1417,7 @@
         "__type__": "ollama._types.ChatResponse",
         "__data__": {
           "model": "llama3.2-vision:11b",
-          "created_at": "2025-08-01T00:05:14.754792448Z",
+          "created_at": "2025-09-03T17:54:26.090781Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -1439,7 +1439,7 @@
         "__type__": "ollama._types.ChatResponse",
         "__data__": {
           "model": "llama3.2-vision:11b",
-          "created_at": "2025-08-01T00:05:15.157906888Z",
+          "created_at": "2025-09-03T17:54:26.150238Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -1461,7 +1461,7 @@
         "__type__": "ollama._types.ChatResponse",
         "__data__": {
           "model": "llama3.2-vision:11b",
-          "created_at": "2025-08-01T00:05:15.567665265Z",
+          "created_at": "2025-09-03T17:54:26.209744Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -1483,7 +1483,7 @@
         "__type__": "ollama._types.ChatResponse",
         "__data__": {
           "model": "llama3.2-vision:11b",
-          "created_at": "2025-08-01T00:05:15.981925795Z",
+          "created_at": "2025-09-03T17:54:26.269231Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -1494,7 +1494,7 @@
           "eval_duration": null,
           "message": {
             "role": "assistant",
-            "content": " outdoors",
+            "content": " a",
             "thinking": null,
             "images": null,
             "tool_calls": null
@@ -1505,7 +1505,95 @@
         "__type__": "ollama._types.ChatResponse",
         "__data__": {
           "model": "llama3.2-vision:11b",
-          "created_at": "2025-08-01T00:05:16.388785931Z",
+          "created_at": "2025-09-03T17:54:26.328953Z",
+          "done": false,
+          "done_reason": null,
+          "total_duration": null,
+          "load_duration": null,
+          "prompt_eval_count": null,
+          "prompt_eval_duration": null,
+          "eval_count": null,
+          "eval_duration": null,
+          "message": {
+            "role": "assistant",
+            "content": " park",
+            "thinking": null,
+            "images": null,
+            "tool_calls": null
+          }
+        }
+      },
+      {
+        "__type__": "ollama._types.ChatResponse",
+        "__data__": {
+          "model": "llama3.2-vision:11b",
+          "created_at": "2025-09-03T17:54:26.38859Z",
+          "done": false,
+          "done_reason": null,
+          "total_duration": null,
+          "load_duration": null,
+          "prompt_eval_count": null,
+          "prompt_eval_duration": null,
+          "eval_count": null,
+          "eval_duration": null,
+          "message": {
+            "role": "assistant",
+            "content": " or",
+            "thinking": null,
+            "images": null,
+            "tool_calls": null
+          }
+        }
+      },
+      {
+        "__type__": "ollama._types.ChatResponse",
+        "__data__": {
+          "model": "llama3.2-vision:11b",
+          "created_at": "2025-09-03T17:54:26.44816Z",
+          "done": false,
+          "done_reason": null,
+          "total_duration": null,
+          "load_duration": null,
+          "prompt_eval_count": null,
+          "prompt_eval_duration": null,
+          "eval_count": null,
+          "eval_duration": null,
+          "message": {
+            "role": "assistant",
+            "content": " a",
+            "thinking": null,
+            "images": null,
+            "tool_calls": null
+          }
+        }
+      },
+      {
+        "__type__": "ollama._types.ChatResponse",
+        "__data__": {
+          "model": "llama3.2-vision:11b",
+          "created_at": "2025-09-03T17:54:26.507848Z",
+          "done": false,
+          "done_reason": null,
+          "total_duration": null,
+          "load_duration": null,
+          "prompt_eval_count": null,
+          "prompt_eval_duration": null,
+          "eval_count": null,
+          "eval_duration": null,
+          "message": {
+            "role": "assistant",
+            "content": " field",
+            "thinking": null,
+            "images": null,
+            "tool_calls": null
+          }
+        }
+      },
+      {
+        "__type__": "ollama._types.ChatResponse",
+        "__data__": {
+          "model": "llama3.2-vision:11b",
+          "created_at": "2025-09-03T17:54:26.567611Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -1527,7 +1615,7 @@
         "__type__": "ollama._types.ChatResponse",
         "__data__": {
           "model": "llama3.2-vision:11b",
-          "created_at": "2025-08-01T00:05:16.795150512Z",
+          "created_at": "2025-09-03T17:54:26.627394Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -1549,7 +1637,7 @@
         "__type__": "ollama._types.ChatResponse",
         "__data__": {
           "model": "llama3.2-vision:11b",
-          "created_at": "2025-08-01T00:05:17.204509535Z",
+          "created_at": "2025-09-03T17:54:26.688384Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -1571,7 +1659,7 @@
         "__type__": "ollama._types.ChatResponse",
         "__data__": {
           "model": "llama3.2-vision:11b",
-          "created_at": "2025-08-01T00:05:17.613690212Z",
+          "created_at": "2025-09-03T17:54:26.750165Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -1593,7 +1681,7 @@
         "__type__": "ollama._types.ChatResponse",
         "__data__": {
           "model": "llama3.2-vision:11b",
-          "created_at": "2025-08-01T00:05:18.020711094Z",
+          "created_at": "2025-09-03T17:54:26.809389Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -1615,7 +1703,7 @@
         "__type__": "ollama._types.ChatResponse",
         "__data__": {
           "model": "llama3.2-vision:11b",
-          "created_at": "2025-08-01T00:05:18.428597263Z",
+          "created_at": "2025-09-03T17:54:26.868745Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -1637,7 +1725,7 @@
         "__type__": "ollama._types.ChatResponse",
         "__data__": {
           "model": "llama3.2-vision:11b",
-          "created_at": "2025-08-01T00:05:18.836863657Z",
+          "created_at": "2025-09-03T17:54:26.928602Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -1659,7 +1747,7 @@
         "__type__": "ollama._types.ChatResponse",
         "__data__": {
           "model": "llama3.2-vision:11b",
-          "created_at": "2025-08-01T00:05:19.248527489Z",
+          "created_at": "2025-09-03T17:54:26.988568Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -1681,7 +1769,7 @@
         "__type__": "ollama._types.ChatResponse",
         "__data__": {
           "model": "llama3.2-vision:11b",
-          "created_at": "2025-08-01T00:05:19.662063245Z",
+          "created_at": "2025-09-03T17:54:27.04809Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -1703,7 +1791,7 @@
         "__type__": "ollama._types.ChatResponse",
         "__data__": {
           "model": "llama3.2-vision:11b",
-          "created_at": "2025-08-01T00:05:20.074553793Z",
+          "created_at": "2025-09-03T17:54:27.107359Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -1725,51 +1813,7 @@
         "__type__": "ollama._types.ChatResponse",
         "__data__": {
           "model": "llama3.2-vision:11b",
-          "created_at": "2025-08-01T00:05:20.494386446Z",
-          "done": false,
-          "done_reason": null,
-          "total_duration": null,
-          "load_duration": null,
-          "prompt_eval_count": null,
-          "prompt_eval_duration": null,
-          "eval_count": null,
-          "eval_duration": null,
-          "message": {
-            "role": "assistant",
-            "content": " happiness",
-            "thinking": null,
-            "images": null,
-            "tool_calls": null
-          }
-        }
-      },
-      {
-        "__type__": "ollama._types.ChatResponse",
-        "__data__": {
-          "model": "llama3.2-vision:11b",
-          "created_at": "2025-08-01T00:05:20.905809772Z",
-          "done": false,
-          "done_reason": null,
-          "total_duration": null,
-          "load_duration": null,
-          "prompt_eval_count": null,
-          "prompt_eval_duration": null,
-          "eval_count": null,
-          "eval_duration": null,
-          "message": {
-            "role": "assistant",
-            "content": " and",
-            "thinking": null,
-            "images": null,
-            "tool_calls": null
-          }
-        }
-      },
-      {
-        "__type__": "ollama._types.ChatResponse",
-        "__data__": {
-          "model": "llama3.2-vision:11b",
-          "created_at": "2025-08-01T00:05:21.32374153Z",
+          "created_at": "2025-09-03T17:54:27.16686Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -1791,7 +1835,7 @@
         "__type__": "ollama._types.ChatResponse",
         "__data__": {
           "model": "llama3.2-vision:11b",
-          "created_at": "2025-08-01T00:05:21.732533121Z",
+          "created_at": "2025-09-03T17:54:27.226135Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -1813,7 +1857,51 @@
         "__type__": "ollama._types.ChatResponse",
         "__data__": {
           "model": "llama3.2-vision:11b",
-          "created_at": "2025-08-01T00:05:22.140888939Z",
+          "created_at": "2025-09-03T17:54:27.285472Z",
+          "done": false,
+          "done_reason": null,
+          "total_duration": null,
+          "load_duration": null,
+          "prompt_eval_count": null,
+          "prompt_eval_duration": null,
+          "eval_count": null,
+          "eval_duration": null,
+          "message": {
+            "role": "assistant",
+            "content": " and",
+            "thinking": null,
+            "images": null,
+            "tool_calls": null
+          }
+        }
+      },
+      {
+        "__type__": "ollama._types.ChatResponse",
+        "__data__": {
+          "model": "llama3.2-vision:11b",
+          "created_at": "2025-09-03T17:54:27.344933Z",
+          "done": false,
+          "done_reason": null,
+          "total_duration": null,
+          "load_duration": null,
+          "prompt_eval_count": null,
+          "prompt_eval_duration": null,
+          "eval_count": null,
+          "eval_duration": null,
+          "message": {
+            "role": "assistant",
+            "content": " energy",
+            "thinking": null,
+            "images": null,
+            "tool_calls": null
+          }
+        }
+      },
+      {
+        "__type__": "ollama._types.ChatResponse",
+        "__data__": {
+          "model": "llama3.2-vision:11b",
+          "created_at": "2025-09-03T17:54:27.404492Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -1835,7 +1923,7 @@
         "__type__": "ollama._types.ChatResponse",
         "__data__": {
           "model": "llama3.2-vision:11b",
-          "created_at": "2025-08-01T00:05:22.552257821Z",
+          "created_at": "2025-09-03T17:54:27.463561Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -1857,7 +1945,7 @@
         "__type__": "ollama._types.ChatResponse",
         "__data__": {
           "model": "llama3.2-vision:11b",
-          "created_at": "2025-08-01T00:05:22.970740344Z",
+          "created_at": "2025-09-03T17:54:27.523445Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -1879,7 +1967,7 @@
         "__type__": "ollama._types.ChatResponse",
         "__data__": {
           "model": "llama3.2-vision:11b",
-          "created_at": "2025-08-01T00:05:23.380926627Z",
+          "created_at": "2025-09-03T17:54:27.582168Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -1901,7 +1989,7 @@
         "__type__": "ollama._types.ChatResponse",
         "__data__": {
           "model": "llama3.2-vision:11b",
-          "created_at": "2025-08-01T00:05:23.790553354Z",
+          "created_at": "2025-09-03T17:54:27.641388Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -1923,7 +2011,7 @@
         "__type__": "ollama._types.ChatResponse",
         "__data__": {
           "model": "llama3.2-vision:11b",
-          "created_at": "2025-08-01T00:05:24.202112923Z",
+          "created_at": "2025-09-03T17:54:27.70213Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -1945,7 +2033,7 @@
         "__type__": "ollama._types.ChatResponse",
         "__data__": {
           "model": "llama3.2-vision:11b",
-          "created_at": "2025-08-01T00:05:24.612103888Z",
+          "created_at": "2025-09-03T17:54:27.761774Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -1967,7 +2055,7 @@
         "__type__": "ollama._types.ChatResponse",
         "__data__": {
           "model": "llama3.2-vision:11b",
-          "created_at": "2025-08-01T00:05:25.019727418Z",
+          "created_at": "2025-09-03T17:54:27.821071Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -1978,7 +2066,7 @@
           "eval_duration": null,
           "message": {
             "role": "assistant",
-            "content": " enjoying",
+            "content": " in",
             "thinking": null,
             "images": null,
             "tool_calls": null
@@ -1989,7 +2077,7 @@
         "__type__": "ollama._types.ChatResponse",
         "__data__": {
           "model": "llama3.2-vision:11b",
-          "created_at": "2025-08-01T00:05:25.422980466Z",
+          "created_at": "2025-09-03T17:54:27.880307Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -2000,7 +2088,7 @@
           "eval_duration": null,
           "message": {
             "role": "assistant",
-            "content": " itself",
+            "content": " the",
             "thinking": null,
             "images": null,
             "tool_calls": null
@@ -2011,7 +2099,161 @@
         "__type__": "ollama._types.ChatResponse",
         "__data__": {
           "model": "llama3.2-vision:11b",
-          "created_at": "2025-08-01T00:05:25.815598412Z",
+          "created_at": "2025-09-03T17:54:27.939228Z",
+          "done": false,
+          "done_reason": null,
+          "total_duration": null,
+          "load_duration": null,
+          "prompt_eval_count": null,
+          "prompt_eval_duration": null,
+          "eval_count": null,
+          "eval_duration": null,
+          "message": {
+            "role": "assistant",
+            "content": " midst",
+            "thinking": null,
+            "images": null,
+            "tool_calls": null
+          }
+        }
+      },
+      {
+        "__type__": "ollama._types.ChatResponse",
+        "__data__": {
+          "model": "llama3.2-vision:11b",
+          "created_at": "2025-09-03T17:54:27.998568Z",
+          "done": false,
+          "done_reason": null,
+          "total_duration": null,
+          "load_duration": null,
+          "prompt_eval_count": null,
+          "prompt_eval_duration": null,
+          "eval_count": null,
+          "eval_duration": null,
+          "message": {
+            "role": "assistant",
+            "content": " of",
+            "thinking": null,
+            "images": null,
+            "tool_calls": null
+          }
+        }
+      },
+      {
+        "__type__": "ollama._types.ChatResponse",
+        "__data__": {
+          "model": "llama3.2-vision:11b",
+          "created_at": "2025-09-03T17:54:28.057651Z",
+          "done": false,
+          "done_reason": null,
+          "total_duration": null,
+          "load_duration": null,
+          "prompt_eval_count": null,
+          "prompt_eval_duration": null,
+          "eval_count": null,
+          "eval_duration": null,
+          "message": {
+            "role": "assistant",
+            "content": " an",
+            "thinking": null,
+            "images": null,
+            "tool_calls": null
+          }
+        }
+      },
+      {
+        "__type__": "ollama._types.ChatResponse",
+        "__data__": {
+          "model": "llama3.2-vision:11b",
+          "created_at": "2025-09-03T17:54:28.117008Z",
+          "done": false,
+          "done_reason": null,
+          "total_duration": null,
+          "load_duration": null,
+          "prompt_eval_count": null,
+          "prompt_eval_duration": null,
+          "eval_count": null,
+          "eval_duration": null,
+          "message": {
+            "role": "assistant",
+            "content": " activity",
+            "thinking": null,
+            "images": null,
+            "tool_calls": null
+          }
+        }
+      },
+      {
+        "__type__": "ollama._types.ChatResponse",
+        "__data__": {
+          "model": "llama3.2-vision:11b",
+          "created_at": "2025-09-03T17:54:28.176556Z",
+          "done": false,
+          "done_reason": null,
+          "total_duration": null,
+          "load_duration": null,
+          "prompt_eval_count": null,
+          "prompt_eval_duration": null,
+          "eval_count": null,
+          "eval_duration": null,
+          "message": {
+            "role": "assistant",
+            "content": " or",
+            "thinking": null,
+            "images": null,
+            "tool_calls": null
+          }
+        }
+      },
+      {
+        "__type__": "ollama._types.ChatResponse",
+        "__data__": {
+          "model": "llama3.2-vision:11b",
+          "created_at": "2025-09-03T17:54:28.235557Z",
+          "done": false,
+          "done_reason": null,
+          "total_duration": null,
+          "load_duration": null,
+          "prompt_eval_count": null,
+          "prompt_eval_duration": null,
+          "eval_count": null,
+          "eval_duration": null,
+          "message": {
+            "role": "assistant",
+            "content": " play",
+            "thinking": null,
+            "images": null,
+            "tool_calls": null
+          }
+        }
+      },
+      {
+        "__type__": "ollama._types.ChatResponse",
+        "__data__": {
+          "model": "llama3.2-vision:11b",
+          "created_at": "2025-09-03T17:54:28.295066Z",
+          "done": false,
+          "done_reason": null,
+          "total_duration": null,
+          "load_duration": null,
+          "prompt_eval_count": null,
+          "prompt_eval_duration": null,
+          "eval_count": null,
+          "eval_duration": null,
+          "message": {
+            "role": "assistant",
+            "content": " session",
+            "thinking": null,
+            "images": null,
+            "tool_calls": null
+          }
+        }
+      },
+      {
+        "__type__": "ollama._types.ChatResponse",
+        "__data__": {
+          "model": "llama3.2-vision:11b",
+          "created_at": "2025-09-03T17:54:28.354418Z",
           "done": false,
           "done_reason": null,
           "total_duration": null,
@@ -2033,15 +2275,15 @@
         "__type__": "ollama._types.ChatResponse",
         "__data__": {
           "model": "llama3.2-vision:11b",
-          "created_at": "2025-08-01T00:05:26.224081261Z",
+          "created_at": "2025-09-03T17:54:28.413798Z",
           "done": true,
           "done_reason": "stop",
-          "total_duration": 37514337521,
-          "load_duration": 60023634,
+          "total_duration": 6299752375,
+          "load_duration": 103264083,
           "prompt_eval_count": 18,
-          "prompt_eval_duration": 561160541,
-          "eval_count": 92,
-          "eval_duration": 36885221241,
+          "prompt_eval_duration": 135920375,
+          "eval_count": 103,
+          "eval_duration": 6055836667,
           "message": {
             "role": "assistant",
             "content": "",
diff --git a/tests/integration/recordings/responses/models-4a3a4447b16b-3057338f.json b/tests/integration/recordings/responses/models-4a3a4447b16b-3057338f.json
new file mode 100644
index 000000000..b2d991bc5
--- /dev/null
+++ b/tests/integration/recordings/responses/models-4a3a4447b16b-3057338f.json
@@ -0,0 +1,164 @@
+{
+  "request": {
+    "method": "POST",
+    "url": "http://localhost:11434/api/tags",
+    "headers": {},
+    "body": {},
+    "endpoint": "/api/tags",
+    "model": ""
+  },
+  "response": {
+    "body": {
+      "__type__": "ollama._types.ListResponse",
+      "__data__": {
+        "models": [
+          {
+            "model": "nomic-embed-text:latest",
+            "modified_at": "2025-09-03T10:54:06.607913-07:00",
+            "digest": "0a109f422b47e3a30ba2b10eca18548e944e8a23073ee3f3e947efcf3c45e59f",
+            "size": 274302450,
+            "details": {
+              "parent_model": "",
+              "format": "gguf",
+              "family": "nomic-bert",
+              "families": [
+                "nomic-bert"
+              ],
+              "parameter_size": "137M",
+              "quantization_level": "F16"
+            }
+          },
+          {
+            "model": "all-minilm:l6-v2",
+            "modified_at": "2025-09-03T10:19:06.719933-07:00",
+            "digest": "1b226e2802dbb772b5fc32a58f103ca1804ef7501331012de126ab22f67475ef",
+            "size": 45960996,
+            "details": {
+              "parent_model": "",
+              "format": "gguf",
+              "family": "bert",
+              "families": [
+                "bert"
+              ],
+              "parameter_size": "23M",
+              "quantization_level": "F16"
+            }
+          },
+          {
+            "model": "llama3.2-vision:11b",
+            "modified_at": "2025-07-30T18:45:02.517873-07:00",
+            "digest": "6f2f9757ae97e8a3f8ea33d6adb2b11d93d9a35bef277cd2c0b1b5af8e8d0b1e",
+            "size": 7816589186,
+            "details": {
+              "parent_model": "",
+              "format": "gguf",
+              "family": "mllama",
+              "families": [
+                "mllama"
+              ],
+              "parameter_size": "10.7B",
+              "quantization_level": "Q4_K_M"
+            }
+          },
+          {
+            "model": "llama3.2-vision:latest",
+            "modified_at": "2025-07-29T20:18:47.920468-07:00",
+            "digest": "6f2f9757ae97e8a3f8ea33d6adb2b11d93d9a35bef277cd2c0b1b5af8e8d0b1e",
+            "size": 7816589186,
+            "details": {
+              "parent_model": "",
+              "format": "gguf",
+              "family": "mllama",
+              "families": [
+                "mllama"
+              ],
+              "parameter_size": "10.7B",
+              "quantization_level": "Q4_K_M"
+            }
+          },
+          {
+            "model": "llama-guard3:1b",
+            "modified_at": "2025-07-25T14:39:44.978630-07:00",
+            "digest": "494147e06bf99e10dbe67b63a07ac81c162f18ef3341aa3390007ac828571b3b",
+            "size": 1600181919,
+            "details": {
+              "parent_model": "",
+              "format": "gguf",
+              "family": "llama",
+              "families": [
+                "llama"
+              ],
+              "parameter_size": "1.5B",
+              "quantization_level": "Q8_0"
+            }
+          },
+          {
+            "model": "llama3.2:1b",
+            "modified_at": "2025-07-17T22:02:24.953208-07:00",
+            "digest": "baf6a787fdffd633537aa2eb51cfd54cb93ff08e28040095462bb63daf552878",
+            "size": 1321098329,
+            "details": {
+              "parent_model": "",
+              "format": "gguf",
+              "family": "llama",
+              "families": [
+                "llama"
+              ],
+              "parameter_size": "1.2B",
+              "quantization_level": "Q8_0"
+            }
+          },
+          {
+            "model": "all-minilm:latest",
+            "modified_at": "2025-06-03T16:50:10.946583-07:00",
+            "digest": "1b226e2802dbb772b5fc32a58f103ca1804ef7501331012de126ab22f67475ef",
+            "size": 45960996,
+            "details": {
+              "parent_model": "",
+              "format": "gguf",
+              "family": "bert",
+              "families": [
+                "bert"
+              ],
+              "parameter_size": "23M",
+              "quantization_level": "F16"
+            }
+          },
+          {
+            "model": "llama3.2:3b",
+            "modified_at": "2025-05-01T11:15:23.797447-07:00",
+            "digest": "a80c4f17acd55265feec403c7aef86be0c25983ab279d83f3bcd3abbcb5b8b72",
+            "size": 2019393189,
+            "details": {
+              "parent_model": "",
+              "format": "gguf",
+              "family": "llama",
+              "families": [
+                "llama"
+              ],
+              "parameter_size": "3.2B",
+              "quantization_level": "Q4_K_M"
+            }
+          },
+          {
+            "model": "llama3.2:3b-instruct-fp16",
+            "modified_at": "2025-04-30T15:33:48.939665-07:00",
+            "digest": "195a8c01d91ec3cb1e0aad4624a51f2602c51fa7d96110f8ab5a20c84081804d",
+            "size": 6433703586,
+            "details": {
+              "parent_model": "",
+              "format": "gguf",
+              "family": "llama",
+              "families": [
+                "llama"
+              ],
+              "parameter_size": "3.2B",
+              "quantization_level": "F16"
+            }
+          }
+        ]
+      }
+    },
+    "is_streaming": false
+  }
+}
diff --git a/tests/integration/recordings/vision/index.sqlite b/tests/integration/recordings/vision/index.sqlite
deleted file mode 100644
index 6ff587c4321e7260f5a0b22893014468fe04a0ae..0000000000000000000000000000000000000000
GIT binary patch
literal 0
HcmV?d00001

literal 12288
zcmeI$PiqrF6aer|wHk#aB0_1Uc6(E>?fjpeoJ=K%SpU@?^b}@xX6#D-ncWnx6`>SA
zgBL%BSHFxO!K0IC$%3`TiU{%smdx(XoA>f#FY}%~-O36V`@yKEi<m}NqDm#Y6UR{$
zt%U1bxQ<38OwJ$Ogx|^iX=5c?-#e@|zD9HP!>E4P_<ULbyaxdg009sH0T2KI5C8!X
z009vA&jsGf%Eg7%)yg|nXw!8gmkvfY>%Yurv$?z5?bc2^-f3-awd2|I_~zyKm@#s%
z$1X2AyE@;EciPW);wRhpAGWq%#1GmpZvP@A9}fDt>-enerZLB_bA3A;Wc}iVCB1=l
z-4osySuYf)d&3jfWO*kqMo#yFL%jL;@m9O_=%>1G(YXr?_f{)W*0=6W{<<5^^Bp}d
zLVe-BGh^!D*?e-YuTH+GTDazG2T}b)<67f=?Vx^j@)QOLfB*=900@8p2!H?xfB*=9
zz+V#BuP#^jYa1(+Uh-aAgD@h7B$y}OCyYp{ji5*nL^L;CC7fWZh2(@<Vi=QHVec&y
zsYT`Z^;h|zzoCcOM!KtuZddm-T_<aMS)L90O^i+0kguU+4dED}CgM#Z_NzC3lv4GW
zD`K6K*l}(oQQV}2D~mmrOd_teMoburolGUB#0qOH_0kJU5>3-`{O^_`nwX3irj^ua
zl_pZUu%Af<aW+wi5HGOPR!c$?r3Aw%#>j=rjOSKqVH`_ED32mVye-GiDjANu-R}Z&
zjpCTlCg)9t#*0U3nWmZrUW0{6nBr0yFA#QEBgBPLl5rm_6jwUoDV72olUQyU=SVq8
z%JH+bg?^bIlQv(Pq`e;gtwlN&NouSU${J#cCMaQ!c}tK&DN{u9lv9HefxJVOvNR<3
zh?>+8>5_8%EbZ`^r1Wz5py%r!qejvA)L5^72~!v#00JNY0w4eaAOHd&00JNY0wC}Y
z1ls5KYn5_S<19^)<?p-vVL#)>beHn!`YfmOrRgr^j>K6y8Vl21$_<9IG$<Co0bglz
A5C8xG

diff --git a/tests/integration/recordings/vision/responses/3877ecf1bc62.json b/tests/integration/recordings/vision/responses/3877ecf1bc62.json
deleted file mode 100644
index 819ec31c0..000000000
--- a/tests/integration/recordings/vision/responses/3877ecf1bc62.json
+++ /dev/null
@@ -1,22 +0,0 @@
-{
-  "request": {
-    "method": "POST",
-    "url": "http://localhost:11434/api/pull",
-    "headers": {},
-    "body": {},
-    "endpoint": "/api/pull",
-    "model": ""
-  },
-  "response": {
-    "body": {
-      "__type__": "ollama._types.ProgressResponse",
-      "__data__": {
-        "status": "success",
-        "completed": null,
-        "total": null,
-        "digest": null
-      }
-    },
-    "is_streaming": false
-  }
-}
diff --git a/tests/integration/recordings/vision/responses/4096743baf8e.json b/tests/integration/recordings/vision/responses/4096743baf8e.json
deleted file mode 100644
index 880f1b597..000000000
--- a/tests/integration/recordings/vision/responses/4096743baf8e.json
+++ /dev/null
@@ -1,56 +0,0 @@
-{
-  "request": {
-    "method": "POST",
-    "url": "http://localhost:11434/v1/v1/completions",
-    "headers": {},
-    "body": {
-      "model": "llama3.2:3b-instruct-fp16",
-      "messages": [
-        {
-          "role": "user",
-          "content": "Test trace openai 0"
-        }
-      ],
-      "stream": false
-    },
-    "endpoint": "/v1/completions",
-    "model": "llama3.2:3b-instruct-fp16"
-  },
-  "response": {
-    "body": {
-      "__type__": "openai.types.chat.chat_completion.ChatCompletion",
-      "__data__": {
-        "id": "chatcmpl-971",
-        "choices": [
-          {
-            "finish_reason": "stop",
-            "index": 0,
-            "logprobs": null,
-            "message": {
-              "content": "I'm happy to help you with testing the test API for OpenAI's Model 0, but I need to clarify a few things.\n\nOpenAI's Model 0 is an early version of their AI model, and it's not publicly available. However, I can simulate some interactions with a hypothetical API that might be similar to what they provide.\n\nHere's an example test:\n```\nPOST /test HTTP/1.1\nHost: 0 api.openai.com\n\nContent-Type: application/json\n\n{\n  \"text\": \"This is a prompt for testing the Model 0 API\"\n}\n```\n\nPlease note that this is not an official API, and you should not try to interact with it directly. However, I can simulate a response for you:\n\n```\nHTTP/1.1 200 OK\nContent-Type: application/json\n\n{\n  \"complete\": false,\n  \"error\": null\n}\n```\n\nIn a real-world scenario, the Model 0 API would likely respond with much more complex and accurate results. For example:\n\n```\nHTTP/1.1 200 OK\nContent-Type: application/json\n\n{\n  \"id\": \"<MODEL_ID>\",\n  \"text\": {\n    \"parent_id\": \"<PARENT_ID>\",\n    \"text\": \"I can generate text similar to human writing.\"\n  }\n}\n```",
-              "refusal": null,
-              "role": "assistant",
-              "annotations": null,
-              "audio": null,
-              "function_call": null,
-              "tool_calls": null
-            }
-          }
-        ],
-        "created": 1754003706,
-        "model": "llama3.2:3b-instruct-fp16",
-        "object": "chat.completion",
-        "service_tier": null,
-        "system_fingerprint": "fp_ollama",
-        "usage": {
-          "completion_tokens": 272,
-          "prompt_tokens": 31,
-          "total_tokens": 303,
-          "completion_tokens_details": null,
-          "prompt_tokens_details": null
-        }
-      }
-    },
-    "is_streaming": false
-  }
-}
diff --git a/tests/integration/recordings/vision/responses/4a3a4447b16b.json b/tests/integration/recordings/vision/responses/4a3a4447b16b.json
deleted file mode 100644
index a99e1fcc3..000000000
--- a/tests/integration/recordings/vision/responses/4a3a4447b16b.json
+++ /dev/null
@@ -1,68 +0,0 @@
-{
-  "request": {
-    "method": "POST",
-    "url": "http://localhost:11434/api/tags",
-    "headers": {},
-    "body": {},
-    "endpoint": "/api/tags",
-    "model": ""
-  },
-  "response": {
-    "body": {
-      "__type__": "ollama._types.ListResponse",
-      "__data__": {
-        "models": [
-          {
-            "model": "nomic-embed-text:latest",
-            "modified_at": "2025-07-31T23:55:40.635067Z",
-            "digest": "0a109f422b47e3a30ba2b10eca18548e944e8a23073ee3f3e947efcf3c45e59f",
-            "size": 274302450,
-            "details": {
-              "parent_model": "",
-              "format": "gguf",
-              "family": "nomic-bert",
-              "families": [
-                "nomic-bert"
-              ],
-              "parameter_size": "137M",
-              "quantization_level": "F16"
-            }
-          },
-          {
-            "model": "all-minilm:l6-v2",
-            "modified_at": "2025-07-30T17:18:31Z",
-            "digest": "1b226e2802dbb772b5fc32a58f103ca1804ef7501331012de126ab22f67475ef",
-            "size": 45960996,
-            "details": {
-              "parent_model": "",
-              "format": "gguf",
-              "family": "bert",
-              "families": [
-                "bert"
-              ],
-              "parameter_size": "23M",
-              "quantization_level": "F16"
-            }
-          },
-          {
-            "model": "llama3.2-vision:11b",
-            "modified_at": "2025-07-30T17:18:21Z",
-            "digest": "6f2f9757ae97e8a3f8ea33d6adb2b11d93d9a35bef277cd2c0b1b5af8e8d0b1e",
-            "size": 7816589186,
-            "details": {
-              "parent_model": "",
-              "format": "gguf",
-              "family": "mllama",
-              "families": [
-                "mllama"
-              ],
-              "parameter_size": "10.7B",
-              "quantization_level": "Q4_K_M"
-            }
-          }
-        ]
-      }
-    },
-    "is_streaming": false
-  }
-}
diff --git a/tests/integration/recordings/vision/responses/67198cbad48f.json b/tests/integration/recordings/vision/responses/67198cbad48f.json
deleted file mode 100644
index 8326d5329..000000000
--- a/tests/integration/recordings/vision/responses/67198cbad48f.json
+++ /dev/null
@@ -1,56 +0,0 @@
-{
-  "request": {
-    "method": "POST",
-    "url": "http://localhost:11434/v1/v1/completions",
-    "headers": {},
-    "body": {
-      "model": "llama3.2:3b-instruct-fp16",
-      "messages": [
-        {
-          "role": "user",
-          "content": "Test OpenAI telemetry creation"
-        }
-      ],
-      "stream": false
-    },
-    "endpoint": "/v1/completions",
-    "model": "llama3.2:3b-instruct-fp16"
-  },
-  "response": {
-    "body": {
-      "__type__": "openai.types.chat.chat_completion.ChatCompletion",
-      "__data__": {
-        "id": "chatcmpl-517",
-        "choices": [
-          {
-            "finish_reason": "stop",
-            "index": 0,
-            "logprobs": null,
-            "message": {
-              "content": "I'm happy to help you test OpenAI's telemetry creation feature. However, I need to inform you that OpenAI's models are not designed for direct testing and may not support the kind of feedback you're looking for.\n\nThat being said, we can try a simulated testing process using this chat interface. Here's how we can go about it:\n\n1. **Test the chat model:** Before we dive into telemetry creation, let's test the conversation system itself.\n2. **Try out general queries and statements**: See if I can respond to various questions and prompt topics with accuracy. This will help you gauge the effectiveness of my language processing abilities within this interface.\n3. **Create a simulated telemetry request:** Based on your feedback about our chat, describe what kind of information would be needed as a telemetry point for monitoring conversations like ours.\n\nGo ahead and give me some test data or prompt topics so we can proceed with creating a simulated \"telemetry\" creation process.",
-              "refusal": null,
-              "role": "assistant",
-              "annotations": null,
-              "audio": null,
-              "function_call": null,
-              "tool_calls": null
-            }
-          }
-        ],
-        "created": 1754003724,
-        "model": "llama3.2:3b-instruct-fp16",
-        "object": "chat.completion",
-        "service_tier": null,
-        "system_fingerprint": "fp_ollama",
-        "usage": {
-          "completion_tokens": 195,
-          "prompt_tokens": 30,
-          "total_tokens": 225,
-          "completion_tokens_details": null,
-          "prompt_tokens_details": null
-        }
-      }
-    },
-    "is_streaming": false
-  }
-}
diff --git a/tests/integration/recordings/vision/responses/830a1fe14938.json b/tests/integration/recordings/vision/responses/830a1fe14938.json
deleted file mode 100644
index 2202416c9..000000000
--- a/tests/integration/recordings/vision/responses/830a1fe14938.json
+++ /dev/null
@@ -1,56 +0,0 @@
-{
-  "request": {
-    "method": "POST",
-    "url": "http://localhost:11434/v1/v1/completions",
-    "headers": {},
-    "body": {
-      "model": "llama3.2:3b-instruct-fp16",
-      "messages": [
-        {
-          "role": "user",
-          "content": "Test trace openai 1"
-        }
-      ],
-      "stream": false
-    },
-    "endpoint": "/v1/completions",
-    "model": "llama3.2:3b-instruct-fp16"
-  },
-  "response": {
-    "body": {
-      "__type__": "openai.types.chat.chat_completion.ChatCompletion",
-      "__data__": {
-        "id": "chatcmpl-434",
-        "choices": [
-          {
-            "finish_reason": "stop",
-            "index": 0,
-            "logprobs": null,
-            "message": {
-              "content": "I don't have information on testing \"OpenAI\" as a product has not been released.",
-              "refusal": null,
-              "role": "assistant",
-              "annotations": null,
-              "audio": null,
-              "function_call": null,
-              "tool_calls": null
-            }
-          }
-        ],
-        "created": 1754003706,
-        "model": "llama3.2:3b-instruct-fp16",
-        "object": "chat.completion",
-        "service_tier": null,
-        "system_fingerprint": "fp_ollama",
-        "usage": {
-          "completion_tokens": 20,
-          "prompt_tokens": 31,
-          "total_tokens": 51,
-          "completion_tokens_details": null,
-          "prompt_tokens_details": null
-        }
-      }
-    },
-    "is_streaming": false
-  }
-}
diff --git a/tests/integration/recordings/vision/responses/9c007f300365.json b/tests/integration/recordings/vision/responses/9c007f300365.json
deleted file mode 100644
index f776e16a0..000000000
--- a/tests/integration/recordings/vision/responses/9c007f300365.json
+++ /dev/null
@@ -1,58 +0,0 @@
-{
-  "request": {
-    "method": "POST",
-    "url": "http://localhost:11434/v1/v1/completions",
-    "headers": {},
-    "body": {
-      "model": "llama3.2:3b-instruct-fp16",
-      "messages": [
-        {
-          "role": "user",
-          "content": "Test trace openai with temperature 0"
-        }
-      ],
-      "max_tokens": 100,
-      "stream": false,
-      "temperature": 0.7
-    },
-    "endpoint": "/v1/completions",
-    "model": "llama3.2:3b-instruct-fp16"
-  },
-  "response": {
-    "body": {
-      "__type__": "openai.types.chat.chat_completion.ChatCompletion",
-      "__data__": {
-        "id": "chatcmpl-413",
-        "choices": [
-          {
-            "finish_reason": "stop",
-            "index": 0,
-            "logprobs": null,
-            "message": {
-              "content": "I can't provide information or guidance on illegal or harmful activities, including testing the OpenAI model at a temperature of 0. Is there anything else I can help you with?",
-              "refusal": null,
-              "role": "assistant",
-              "annotations": null,
-              "audio": null,
-              "function_call": null,
-              "tool_calls": null
-            }
-          }
-        ],
-        "created": 1754003714,
-        "model": "llama3.2:3b-instruct-fp16",
-        "object": "chat.completion",
-        "service_tier": null,
-        "system_fingerprint": "fp_ollama",
-        "usage": {
-          "completion_tokens": 37,
-          "prompt_tokens": 33,
-          "total_tokens": 70,
-          "completion_tokens_details": null,
-          "prompt_tokens_details": null
-        }
-      }
-    },
-    "is_streaming": false
-  }
-}
diff --git a/tests/integration/recordings/vision/responses/c9667519ad7c.json b/tests/integration/recordings/vision/responses/c9667519ad7c.json
deleted file mode 100644
index ce0322da9..000000000
--- a/tests/integration/recordings/vision/responses/c9667519ad7c.json
+++ /dev/null
@@ -1,58 +0,0 @@
-{
-  "request": {
-    "method": "POST",
-    "url": "http://localhost:11434/v1/v1/completions",
-    "headers": {},
-    "body": {
-      "model": "llama3.2:3b-instruct-fp16",
-      "messages": [
-        {
-          "role": "user",
-          "content": "Test trace openai with temperature 1"
-        }
-      ],
-      "max_tokens": 100,
-      "stream": false,
-      "temperature": 0.7
-    },
-    "endpoint": "/v1/completions",
-    "model": "llama3.2:3b-instruct-fp16"
-  },
-  "response": {
-    "body": {
-      "__type__": "openai.types.chat.chat_completion.ChatCompletion",
-      "__data__": {
-        "id": "chatcmpl-82",
-        "choices": [
-          {
-            "finish_reason": "length",
-            "index": 0,
-            "logprobs": null,
-            "message": {
-              "content": "To test the trace functionality of OpenAI's API with a temperature of 1, you can use the following Python code:\n```\nimport torch\nfrom transformers import AutoModelForCausalLM, AutoTokenizer\n\n# Load pre-trained model and tokenizer\nmodel_name = \"CompVis/transformers-base-tiny\"\nmodel = AutoModelForCausalLM.from_pretrained(model_name)\ntokenizer = AutoTokenizer.from_pretrained(model_name)\n\n# Set temperature to 1\ntemperature = 1.",
-              "refusal": null,
-              "role": "assistant",
-              "annotations": null,
-              "audio": null,
-              "function_call": null,
-              "tool_calls": null
-            }
-          }
-        ],
-        "created": 1754003715,
-        "model": "llama3.2:3b-instruct-fp16",
-        "object": "chat.completion",
-        "service_tier": null,
-        "system_fingerprint": "fp_ollama",
-        "usage": {
-          "completion_tokens": 100,
-          "prompt_tokens": 33,
-          "total_tokens": 133,
-          "completion_tokens_details": null,
-          "prompt_tokens_details": null
-        }
-      }
-    },
-    "is_streaming": false
-  }
-}
diff --git a/tests/integration/recordings/vision/responses/d0ac68cbde69.json b/tests/integration/recordings/vision/responses/d0ac68cbde69.json
deleted file mode 100644
index b37962fb6..000000000
--- a/tests/integration/recordings/vision/responses/d0ac68cbde69.json
+++ /dev/null
@@ -1,19 +0,0 @@
-{
-  "request": {
-    "method": "POST",
-    "url": "http://localhost:11434/api/ps",
-    "headers": {},
-    "body": {},
-    "endpoint": "/api/ps",
-    "model": ""
-  },
-  "response": {
-    "body": {
-      "__type__": "ollama._types.ProcessResponse",
-      "__data__": {
-        "models": []
-      }
-    },
-    "is_streaming": false
-  }
-}
diff --git a/tests/integration/recordings/vision/responses/d4f56d7d1996.json b/tests/integration/recordings/vision/responses/d4f56d7d1996.json
deleted file mode 100644
index 47468b71e..000000000
--- a/tests/integration/recordings/vision/responses/d4f56d7d1996.json
+++ /dev/null
@@ -1,56 +0,0 @@
-{
-  "request": {
-    "method": "POST",
-    "url": "http://localhost:11434/v1/v1/completions",
-    "headers": {},
-    "body": {
-      "model": "llama3.2:3b-instruct-fp16",
-      "messages": [
-        {
-          "role": "user",
-          "content": "Test trace openai 2"
-        }
-      ],
-      "stream": false
-    },
-    "endpoint": "/v1/completions",
-    "model": "llama3.2:3b-instruct-fp16"
-  },
-  "response": {
-    "body": {
-      "__type__": "openai.types.chat.chat_completion.ChatCompletion",
-      "__data__": {
-        "id": "chatcmpl-661",
-        "choices": [
-          {
-            "finish_reason": "stop",
-            "index": 0,
-            "logprobs": null,
-            "message": {
-              "content": "You want to test the text-to-image capabilities of the OpenAI 2 model. To do this, we can use a simple interface in Python to prompt the model and see if it generates an image.\n\nHere's an example code snippet that shows how you can test the model:\n```\nimport numpy as np\nfrom PIL import Image\nfrom io import BytesIO\n\n# Load the OpenAI 2 model weights\nmodel_weights = \"path/to/openai2/model_weights.json\"\n\n# Load the model\nmodel = torch.hub.load(\"openai\", \"image-model\", pretrain_model_path=model_weights)\n\n# Set up a prompt for the model\nprompt = \"A picture of a futuristic cityscape at sunset\"\n\n# Use the model to generate an image\nwith torch.no_grad():\n    image = model(prompt, return_tensor=True).numpy()\n\n# Save the generated image to a file\nimg = Image.fromarray(np.uint8(image))\nimg.save(\"generated_image.png\")\n\nprint(\"Generated image saved to 'generated_image.png'\")\n```\nPlease note that:\n\n1. You need to have PyTorch installed (`pip install torch torchvision`) and downloaded the OpenAI 2 model weights from their repository.\n2. The `image-model` library is used for text-to-image synthesis, which can be installed with `pip install image-model`.\n3. You may need to adjust the prompt and the output settings according to your specific use case.\n\nAlso note that, the openai2 model requires pre-trained on CelebA and FFHQ datasets and its text-to-image capabilities might not work as well as trained specifically for this type of task.\n\nYou can find more information about how to use the `image-model` library at their official documentation: https://github.com/karpathy/vis-dlg\n\nAlso, you can try other text-to-image models like DALL-E or Stable Diffusion using Python libraries like Hugging Face Transformers and PyTorch.",
-              "refusal": null,
-              "role": "assistant",
-              "annotations": null,
-              "audio": null,
-              "function_call": null,
-              "tool_calls": null
-            }
-          }
-        ],
-        "created": 1754003713,
-        "model": "llama3.2:3b-instruct-fp16",
-        "object": "chat.completion",
-        "service_tier": null,
-        "system_fingerprint": "fp_ollama",
-        "usage": {
-          "completion_tokens": 395,
-          "prompt_tokens": 31,
-          "total_tokens": 426,
-          "completion_tokens_details": null,
-          "prompt_tokens_details": null
-        }
-      }
-    },
-    "is_streaming": false
-  }
-}
diff --git a/tests/unit/distribution/test_inference_recordings.py b/tests/unit/distribution/test_inference_recordings.py
index dd80b0caf..c69cf319b 100644
--- a/tests/unit/distribution/test_inference_recordings.py
+++ b/tests/unit/distribution/test_inference_recordings.py
@@ -266,7 +266,7 @@ class TestInferenceRecording:
             return real_openai_chat_response
 
         with patch("openai.resources.chat.completions.AsyncCompletions.create", side_effect=mock_create):
-            with inference_recording(mode=InferenceMode.LIVE):
+            with inference_recording(mode=InferenceMode.LIVE, storage_dir="foo"):
                 client = AsyncOpenAI(base_url="http://localhost:11434/v1", api_key="test")
 
                 response = await client.chat.completions.create(

From 02f6e0f53122e9dff575e4b85cfcad83de88eef3 Mon Sep 17 00:00:00 2001
From: Ashwin Bharambe <ashwin.bharambe@gmail.com>
Date: Wed, 3 Sep 2025 15:57:17 -0700
Subject: [PATCH 06/76] fix(tests): set inference mode to be replay by default
 (#3326)

`construct_stack()` relies on the environment variable to know when to
setup the patching infrastructure.


https://github.com/llamastack/llama-stack/blob/c3d3a0b83333a720886c4a846e41ed3ad2766e00/llama_stack/core/stack.py#L314
---
 tests/integration/conftest.py | 2 ++
 1 file changed, 2 insertions(+)

diff --git a/tests/integration/conftest.py b/tests/integration/conftest.py
index 234d762ce..fd9a54d04 100644
--- a/tests/integration/conftest.py
+++ b/tests/integration/conftest.py
@@ -30,6 +30,8 @@ def pytest_runtest_makereport(item, call):
 def pytest_sessionstart(session):
     # stop macOS from complaining about duplicate OpenMP libraries
     os.environ["KMP_DUPLICATE_LIB_OK"] = "TRUE"
+    if "LLAMA_STACK_TEST_INFERENCE_MODE" not in os.environ:
+        os.environ["LLAMA_STACK_TEST_INFERENCE_MODE"] = "replay"
 
 
 def pytest_runtest_teardown(item):

From 5d52e0d2c5c4550eceeabed5115cf552295819db Mon Sep 17 00:00:00 2001
From: ehhuang <ehhuang@users.noreply.github.com>
Date: Thu, 4 Sep 2025 04:23:18 -0700
Subject: [PATCH 07/76] chore: handle missing finish_reason (#3328)

# What does this PR do?
Sometimes the stream don't have chunks with finish_reason, e.g. canceled
stream, which throws a pydantic error as OpenAIChoice.finish_reason: str

## Test Plan
observe no more such error when benchmarking
---
 llama_stack/core/routers/inference.py | 2 +-
 1 file changed, 1 insertion(+), 1 deletion(-)

diff --git a/llama_stack/core/routers/inference.py b/llama_stack/core/routers/inference.py
index 4b66601bb..8dcad85e3 100644
--- a/llama_stack/core/routers/inference.py
+++ b/llama_stack/core/routers/inference.py
@@ -755,7 +755,7 @@ class InferenceRouter(Inference):
                             choices_data[idx] = {
                                 "content_parts": [],
                                 "tool_calls_builder": {},
-                                "finish_reason": None,
+                                "finish_reason": "stop",
                                 "logprobs_content_parts": [],
                             }
                         current_choice_data = choices_data[idx]

From 64d2306dd5481be3fdfaa11c415efe3f2788358e Mon Sep 17 00:00:00 2001
From: Derek Higgins <derekh@redhat.com>
Date: Thu, 4 Sep 2025 16:56:32 +0100
Subject: [PATCH 08/76] fix: distro-codegen pre-commit hook file pattern
 (#3337)

Update the file pattern from 'llama_stack/templates' to
'llama_stack/distributions' to properly trigger the Distribution
Template Codegen hook when distribution files change.

Signed-off-by: Derek Higgins <derekh@redhat.com>
---
 .pre-commit-config.yaml | 2 +-
 1 file changed, 1 insertion(+), 1 deletion(-)

diff --git a/.pre-commit-config.yaml b/.pre-commit-config.yaml
index 514fe6d2e..b7880a9fc 100644
--- a/.pre-commit-config.yaml
+++ b/.pre-commit-config.yaml
@@ -86,7 +86,7 @@ repos:
         language: python
         pass_filenames: false
         require_serial: true
-        files: ^llama_stack/templates/.*$|^llama_stack/providers/.*/inference/.*/models\.py$
+        files: ^llama_stack/distributions/.*$|^llama_stack/providers/.*/inference/.*/models\.py$
       - id: provider-codegen
         name: Provider Codegen
         additional_dependencies:

From 85f33762d7cb7495b9aa5946284e4b6c85f5ad96 Mon Sep 17 00:00:00 2001
From: IAN MILLER <75687988+r3v5@users.noreply.github.com>
Date: Thu, 4 Sep 2025 17:15:13 +0100
Subject: [PATCH 09/76] refactor(server): remove hardcoded 409 and 404 status
 codes in server.py using httpx constants (#3333)

# What does this PR do?
<!-- Provide a short summary of what this PR does and why. Link to
relevant issues if applicable. -->
This PR is eliminating hardcoded status codes: `409` CONFLICT and `404`
NOT_FOUND in `server.py` using `httpx` built-in constants. This
implementation will follow the existing structure to improve
readability, extensibility and developer experience. This is already was
implemented in #3131

<!-- If resolving an issue, uncomment and update the line below -->
<!-- Closes #[issue-number] -->

## Test Plan
<!-- Describe the tests you ran to verify your changes with result
summaries. *Provide clear instructions so the plan can be easily
re-executed.* -->
`./scripts/unit-tests.sh`
---
 llama_stack/core/server/server.py | 4 ++--
 1 file changed, 2 insertions(+), 2 deletions(-)

diff --git a/llama_stack/core/server/server.py b/llama_stack/core/server/server.py
index d6dfc3435..b247a610d 100644
--- a/llama_stack/core/server/server.py
+++ b/llama_stack/core/server/server.py
@@ -132,9 +132,9 @@ def translate_exception(exc: Exception) -> HTTPException | RequestValidationErro
             },
         )
     elif isinstance(exc, ConflictError):
-        return HTTPException(status_code=409, detail=str(exc))
+        return HTTPException(status_code=httpx.codes.CONFLICT, detail=str(exc))
     elif isinstance(exc, ResourceNotFoundError):
-        return HTTPException(status_code=404, detail=str(exc))
+        return HTTPException(status_code=httpx.codes.NOT_FOUND, detail=str(exc))
     elif isinstance(exc, ValueError):
         return HTTPException(status_code=httpx.codes.BAD_REQUEST, detail=f"Invalid value: {str(exc)}")
     elif isinstance(exc, BadRequestError):

From 5bbca56cfc24cd1a1d4d5aff6a9c1c4ad12a741a Mon Sep 17 00:00:00 2001
From: Derek Higgins <derekh@redhat.com>
Date: Thu, 4 Sep 2025 18:58:41 +0100
Subject: [PATCH 10/76] fix: Make SentenceTransformer embedding operations
 non-blocking (#3335)

- Wrap model loading with asyncio.to_thread() to prevent blocking during
model download/initialization
- Wrap encoding operations with asyncio.to_thread() to run in background
thread
- Convert _load_sentence_transformer_model() to async method

This ensures the async event loop remains responsive during embedding
operations.

Closes: #3332

Signed-off-by: Derek Higgins <derekh@redhat.com>
Co-authored-by: Francisco Arceo <arceofrancisco@gmail.com>
---
 .../utils/inference/embedding_mixin.py        | 23 ++++++++++++-------
 1 file changed, 15 insertions(+), 8 deletions(-)

diff --git a/llama_stack/providers/utils/inference/embedding_mixin.py b/llama_stack/providers/utils/inference/embedding_mixin.py
index 65ba2854b..9bd0aa8ce 100644
--- a/llama_stack/providers/utils/inference/embedding_mixin.py
+++ b/llama_stack/providers/utils/inference/embedding_mixin.py
@@ -4,6 +4,7 @@
 # This source code is licensed under the terms described in the LICENSE file in
 # the root directory of this source tree.
 
+import asyncio
 import base64
 import struct
 from typing import TYPE_CHECKING
@@ -43,9 +44,11 @@ class SentenceTransformerEmbeddingMixin:
         task_type: EmbeddingTaskType | None = None,
     ) -> EmbeddingsResponse:
         model = await self.model_store.get_model(model_id)
-        embedding_model = self._load_sentence_transformer_model(model.provider_resource_id)
-        embeddings = embedding_model.encode(
-            [interleaved_content_as_str(content) for content in contents], show_progress_bar=False
+        embedding_model = await self._load_sentence_transformer_model(model.provider_resource_id)
+        embeddings = await asyncio.to_thread(
+            embedding_model.encode,
+            [interleaved_content_as_str(content) for content in contents],
+            show_progress_bar=False,
         )
         return EmbeddingsResponse(embeddings=embeddings)
 
@@ -64,8 +67,8 @@ class SentenceTransformerEmbeddingMixin:
 
         # Get the model and generate embeddings
         model_obj = await self.model_store.get_model(model)
-        embedding_model = self._load_sentence_transformer_model(model_obj.provider_resource_id)
-        embeddings = embedding_model.encode(input_list, show_progress_bar=False)
+        embedding_model = await self._load_sentence_transformer_model(model_obj.provider_resource_id)
+        embeddings = await asyncio.to_thread(embedding_model.encode, input_list, show_progress_bar=False)
 
         # Convert embeddings to the requested format
         data = []
@@ -93,7 +96,7 @@ class SentenceTransformerEmbeddingMixin:
             usage=usage,
         )
 
-    def _load_sentence_transformer_model(self, model: str) -> "SentenceTransformer":
+    async def _load_sentence_transformer_model(self, model: str) -> "SentenceTransformer":
         global EMBEDDING_MODELS
 
         loaded_model = EMBEDDING_MODELS.get(model)
@@ -101,8 +104,12 @@ class SentenceTransformerEmbeddingMixin:
             return loaded_model
 
         log.info(f"Loading sentence transformer for {model}...")
-        from sentence_transformers import SentenceTransformer
 
-        loaded_model = SentenceTransformer(model)
+        def _load_model():
+            from sentence_transformers import SentenceTransformer
+
+            return SentenceTransformer(model)
+
+        loaded_model = await asyncio.to_thread(_load_model)
         EMBEDDING_MODELS[model] = loaded_model
         return loaded_model

From bcc7f2c7d0a24a4671e98134e6c28f74e6acff26 Mon Sep 17 00:00:00 2001
From: ehhuang <ehhuang@users.noreply.github.com>
Date: Thu, 4 Sep 2025 11:37:46 -0700
Subject: [PATCH 11/76] chore: async inference store write (#3318)

# What does this PR do?


## Test Plan
```
cd /docs/source/distributions/k8s-benchmark
# start mock server
python openai-mock-server.py --port 8000
# start stack server
uv run --with llama-stack python -m llama_stack.core.server.server docs/source/distributions/k8s-benchmark/stack_run_config.yaml
# run benchmark script
uv run python3 benchmark.py --duration 30 --concurrent 50 --base-url=http://localhost:8321/v1/openai/v1 --model=vllm-inference/meta-llama/Llama-3.2-3B-Instruct
```
Before:

============================================================
BENCHMARK RESULTS
============================================================
Total time: 30.00s
Concurrent users: 50
Total requests: 1267
Successful requests: 1267
Failed requests: 0
Success rate: 100.0%
Requests per second: 42.23


After:

============================================================
BENCHMARK RESULTS
============================================================
Total time: 30.00s
Concurrent users: 50
Total requests: 1449
Successful requests: 1449
Failed requests: 0
Success rate: 100.0%
Requests per second: 48.30
---
 .../distributions/k8s-benchmark/stack_run_config.yaml     | 8 ++++++++
 llama_stack/core/routers/inference.py                     | 4 ++--
 2 files changed, 10 insertions(+), 2 deletions(-)

diff --git a/docs/source/distributions/k8s-benchmark/stack_run_config.yaml b/docs/source/distributions/k8s-benchmark/stack_run_config.yaml
index ceb1ba2d9..5a810639e 100644
--- a/docs/source/distributions/k8s-benchmark/stack_run_config.yaml
+++ b/docs/source/distributions/k8s-benchmark/stack_run_config.yaml
@@ -3,6 +3,7 @@ image_name: kubernetes-benchmark-demo
 apis:
 - agents
 - inference
+- safety
 - telemetry
 - tool_runtime
 - vector_io
@@ -30,6 +31,11 @@ providers:
         db: ${env.POSTGRES_DB:=llamastack}
         user: ${env.POSTGRES_USER:=llamastack}
         password: ${env.POSTGRES_PASSWORD:=llamastack}
+  safety:
+  - provider_id: llama-guard
+    provider_type: inline::llama-guard
+    config:
+      excluded_categories: []
   agents:
   - provider_id: meta-reference
     provider_type: inline::meta-reference
@@ -95,6 +101,8 @@ models:
 - model_id: ${env.INFERENCE_MODEL}
   provider_id: vllm-inference
   model_type: llm
+shields:
+- shield_id: ${env.SAFETY_MODEL:=meta-llama/Llama-Guard-3-1B}
 vector_dbs: []
 datasets: []
 scoring_fns: []
diff --git a/llama_stack/core/routers/inference.py b/llama_stack/core/routers/inference.py
index 8dcad85e3..045093fe0 100644
--- a/llama_stack/core/routers/inference.py
+++ b/llama_stack/core/routers/inference.py
@@ -527,7 +527,7 @@ class InferenceRouter(Inference):
 
         # Store the response with the ID that will be returned to the client
         if self.store:
-            await self.store.store_chat_completion(response, messages)
+            asyncio.create_task(self.store.store_chat_completion(response, messages))
 
         if self.telemetry:
             metrics = self._construct_metrics(
@@ -855,4 +855,4 @@ class InferenceRouter(Inference):
                     object="chat.completion",
                 )
                 logger.debug(f"InferenceRouter.completion_response: {final_response}")
-                await self.store.store_chat_completion(final_response, messages)
+                asyncio.create_task(self.store.store_chat_completion(final_response, messages))

From 561d2fc6b8226f167bb9782e6619d86a092af8e8 Mon Sep 17 00:00:00 2001
From: slekkala1 <swapna942@meta.com>
Date: Thu, 4 Sep 2025 11:47:46 -0700
Subject: [PATCH 12/76] fix: Move to older version for docker container failure
 [fireworks-ai] (#3338)

# What does this PR do?
Noticed the test
https://github.com/llamastack/llama-stack-ops/actions/workflows/test-maybe-cut.yaml
are still failing randomly.

Earlier fixed this with 0.18.0 of fireworks here
https://github.com/llamastack/llama-stack/pull/3267, the local testing
may have inadvertently picked a lower version with `<=` which I assumed
picks latest version.
Now tested with `==` to find the version where it broke and pinning to
version(`<=`) where it was passing.


## Test Plan
Tested locally with the following commands to start a container

Build container
`llama stack build --distro starter --image-type container`
start container `docker run -d -p 8321:8321 --name llama-stack-test
distribution-starter:0.2.20`
check health `http://localhost:8321/v1/health`
Above steps fails without the fix

Tested with `==` to ensure the same version is picked in local testing
instead of anything lower.

Following here for the fix from `fireworks-ai`
https://discord.com/channels/1137072072808472616/1410674695597981778/1410674695597981778

https://github.com/llamastack/llama-stack/issues/3273
---
 llama_stack/providers/registry/inference.py | 2 +-
 1 file changed, 1 insertion(+), 1 deletion(-)

diff --git a/llama_stack/providers/registry/inference.py b/llama_stack/providers/registry/inference.py
index fb841afdf..50956f58c 100644
--- a/llama_stack/providers/registry/inference.py
+++ b/llama_stack/providers/registry/inference.py
@@ -116,7 +116,7 @@ def available_providers() -> list[ProviderSpec]:
             adapter=AdapterSpec(
                 adapter_type="fireworks",
                 pip_packages=[
-                    "fireworks-ai<=0.18.0",
+                    "fireworks-ai<=0.17.16",
                 ],
                 module="llama_stack.providers.remote.inference.fireworks",
                 config_class="llama_stack.providers.remote.inference.fireworks.FireworksImplConfig",

From 55a8c5f439b710cfbb1256e3d6c41a6d82601970 Mon Sep 17 00:00:00 2001
From: Sumanth Kamenani <skamenan@redhat.com>
Date: Thu, 4 Sep 2025 16:25:02 -0400
Subject: [PATCH 13/76] fix: show descriptive MCP server connection errors
 instead of generic 500s (#3256)
MIME-Version: 1.0
Content-Type: text/plain; charset=UTF-8
Content-Transfer-Encoding: 8bit

What does this PR do?

Fixes error handling when MCP server connections fail. Instead of
returning generic 500 errors, now provides
   descriptive error messages with proper HTTP status codes.

  Closes #3107

  Test Plan

  Before fix:
curl -X GET
"http://localhost:8321/v1/tool-runtime/list-tools?tool_group_id=bad-mcp-server"
Returns: {"detail": "Internal server error: An unexpected error
occurred."} (500)

  After fix:
curl -X GET
"http://localhost:8321/v1/tool-runtime/list-tools?tool_group_id=bad-mcp-server"
Returns: {"error": {"detail": "Failed to connect to MCP server at
http://localhost:9999/sse: Connection
  refused"}} (502)

  Tests:
  - Added unit test for ConnectionError → 502 translation
  - Manually tested with unreachable MCP servers (connection refused)
---
 llama_stack/core/server/server.py        |  2 ++
 llama_stack/providers/utils/tools/mcp.py | 32 ++++++++++++++++++++++++
 tests/unit/server/test_server.py         |  9 +++++++
 3 files changed, 43 insertions(+)

diff --git a/llama_stack/core/server/server.py b/llama_stack/core/server/server.py
index b247a610d..288bf46e1 100644
--- a/llama_stack/core/server/server.py
+++ b/llama_stack/core/server/server.py
@@ -141,6 +141,8 @@ def translate_exception(exc: Exception) -> HTTPException | RequestValidationErro
         return HTTPException(status_code=httpx.codes.BAD_REQUEST, detail=str(exc))
     elif isinstance(exc, PermissionError | AccessDeniedError):
         return HTTPException(status_code=httpx.codes.FORBIDDEN, detail=f"Permission denied: {str(exc)}")
+    elif isinstance(exc, ConnectionError | httpx.ConnectError):
+        return HTTPException(status_code=httpx.codes.BAD_GATEWAY, detail=str(exc))
     elif isinstance(exc, asyncio.TimeoutError | TimeoutError):
         return HTTPException(status_code=httpx.codes.GATEWAY_TIMEOUT, detail=f"Operation timed out: {str(exc)}")
     elif isinstance(exc, NotImplementedError):
diff --git a/llama_stack/providers/utils/tools/mcp.py b/llama_stack/providers/utils/tools/mcp.py
index 02f7aaf8a..fc8e2f377 100644
--- a/llama_stack/providers/utils/tools/mcp.py
+++ b/llama_stack/providers/utils/tools/mcp.py
@@ -67,6 +67,38 @@ async def client_wrapper(endpoint: str, headers: dict[str, str]) -> AsyncGenerat
                     raise AuthenticationRequiredError(exc) from exc
             if i == len(connection_strategies) - 1:
                 raise
+        except* httpx.ConnectError as eg:
+            # Connection refused, server down, network unreachable
+            if i == len(connection_strategies) - 1:
+                error_msg = f"Failed to connect to MCP server at {endpoint}: Connection refused"
+                logger.error(f"MCP connection error: {error_msg}")
+                raise ConnectionError(error_msg) from eg
+            else:
+                logger.warning(
+                    f"failed to connect to MCP server at {endpoint} via {strategy.name}, falling back to {connection_strategies[i + 1].name}"
+                )
+        except* httpx.TimeoutException as eg:
+            # Request timeout, server too slow
+            if i == len(connection_strategies) - 1:
+                error_msg = f"MCP server at {endpoint} timed out"
+                logger.error(f"MCP timeout error: {error_msg}")
+                raise TimeoutError(error_msg) from eg
+            else:
+                logger.warning(
+                    f"MCP server at {endpoint} timed out via {strategy.name}, falling back to {connection_strategies[i + 1].name}"
+                )
+        except* httpx.RequestError as eg:
+            # DNS resolution failures, network errors, invalid URLs
+            if i == len(connection_strategies) - 1:
+                # Get the first exception's message for the error string
+                exc_msg = str(eg.exceptions[0]) if eg.exceptions else "Unknown error"
+                error_msg = f"Network error connecting to MCP server at {endpoint}: {exc_msg}"
+                logger.error(f"MCP network error: {error_msg}")
+                raise ConnectionError(error_msg) from eg
+            else:
+                logger.warning(
+                    f"network error connecting to MCP server at {endpoint} via {strategy.name}, falling back to {connection_strategies[i + 1].name}"
+                )
         except* McpError:
             if i < len(connection_strategies) - 1:
                 logger.warning(
diff --git a/tests/unit/server/test_server.py b/tests/unit/server/test_server.py
index 803111fc7..f21bbdd67 100644
--- a/tests/unit/server/test_server.py
+++ b/tests/unit/server/test_server.py
@@ -113,6 +113,15 @@ class TestTranslateException:
         assert result.status_code == 504
         assert result.detail == "Operation timed out: "
 
+    def test_translate_connection_error(self):
+        """Test that ConnectionError is translated to 502 HTTP status."""
+        exc = ConnectionError("Failed to connect to MCP server at http://localhost:9999/sse: Connection refused")
+        result = translate_exception(exc)
+
+        assert isinstance(result, HTTPException)
+        assert result.status_code == 502
+        assert result.detail == "Failed to connect to MCP server at http://localhost:9999/sse: Connection refused"
+
     def test_translate_not_implemented_error(self):
         """Test that NotImplementedError is translated to 501 HTTP status."""
         exc = NotImplementedError("Not implemented")

From 3a7ac4227d4a2c0a74e3a7e5eda459ae19761c03 Mon Sep 17 00:00:00 2001
From: ehhuang <ehhuang@users.noreply.github.com>
Date: Thu, 4 Sep 2025 15:13:31 -0700
Subject: [PATCH 14/76] chore: unbreak inference store test (#3340)
MIME-Version: 1.0
Content-Type: text/plain; charset=UTF-8
Content-Transfer-Encoding: 8bit

# What does this PR do?
The inference store writes were moved to asyncio.create_task and not
await anymore

## Test Plan

❯ OLLAMA_URL=http://localhost:11434 LLAMA_STACK_CONFIG=server:starter uv
run --with pytest-repeat pytest tests/integration/inference
--text-model="ollama/llama3.2:3b-instruct-fp16" -vvs -k
"test_inference_store_tool_calls and 3b-instruct-fp16-True" --count=10
Uninstalled 2 packages in 102ms
Installed 2 packages in 138ms
INFO 2025-09-04 14:10:17,775 tests.integration.conftest:66 tests:
Setting DISABLE_CODE_SANDBOX=1 for macOS

==========================================================================================================
test session starts
===========================================================================================================
platform darwin -- Python 3.12.3, pytest-8.4.1, pluggy-1.6.0 --
/Users/erichuang/.cache/uv/builds-v0/.tmpSGMlgt/bin/python
cachedir: .pytest_cache
metadata: {'Python': '3.12.3', 'Platform':
'macOS-15.6.1-arm64-arm-64bit', 'Packages': {'pytest': '8.4.1',
'pluggy': '1.6.0'}, 'Plugins': {'repeat': '0.9.4', 'anyio': '4.9.0',
'html': '4.1.1', 'socket': '0.7.0', 'asyncio': '1.1.0', 'json-report':
'1.5.0', 'timeout': '2.4.0', 'metadata': '3.1.1', 'cov': '6.2.1',
'nbval': '0.11.0'}}
rootdir: /Users/erichuang/projects/llama-stack-git
configfile: pyproject.toml
plugins: repeat-0.9.4, anyio-4.9.0, html-4.1.1, socket-0.7.0,
asyncio-1.1.0, json-report-1.5.0, timeout-2.4.0, metadata-3.1.1,
cov-6.2.1, nbval-0.11.0
asyncio: mode=Mode.AUTO, asyncio_default_fixture_loop_scope=None,
asyncio_default_test_loop_scope=function
collected 970 items / 950 deselected / 20 selected


tests/integration/inference/test_openai_completion.py::test_inference_store_tool_calls[openai_client-txt=ollama/llama3.2:3b-instruct-fp16-True-1-10]
instantiating llama_stack_client
Starting llama stack server with config 'starter' on port 8321...
Waiting for server at http://localhost:8321... (0.0s elapsed)
Waiting for server at http://localhost:8321... (0.5s elapsed)
Waiting for server at http://localhost:8321... (5.1s elapsed)
Waiting for server at http://localhost:8321... (5.6s elapsed)
Waiting for server at http://localhost:8321... (10.1s elapsed)
Waiting for server at http://localhost:8321... (10.6s elapsed)
Waiting for server at http://localhost:8321... (15.2s elapsed)
Waiting for server at http://localhost:8321... (15.7s elapsed)
Server is ready at http://localhost:8321
llama_stack_client instantiated in 20.583s
PASSED

tests/integration/inference/test_openai_completion.py::test_inference_store_tool_calls[openai_client-txt=ollama/llama3.2:3b-instruct-fp16-True-2-10]
PASSED

tests/integration/inference/test_openai_completion.py::test_inference_store_tool_calls[openai_client-txt=ollama/llama3.2:3b-instruct-fp16-True-3-10]
PASSED

tests/integration/inference/test_openai_completion.py::test_inference_store_tool_calls[openai_client-txt=ollama/llama3.2:3b-instruct-fp16-True-4-10]
PASSED

tests/integration/inference/test_openai_completion.py::test_inference_store_tool_calls[openai_client-txt=ollama/llama3.2:3b-instruct-fp16-True-5-10]
PASSED

tests/integration/inference/test_openai_completion.py::test_inference_store_tool_calls[openai_client-txt=ollama/llama3.2:3b-instruct-fp16-True-6-10]
PASSED

tests/integration/inference/test_openai_completion.py::test_inference_store_tool_calls[openai_client-txt=ollama/llama3.2:3b-instruct-fp16-True-7-10]
PASSED

tests/integration/inference/test_openai_completion.py::test_inference_store_tool_calls[openai_client-txt=ollama/llama3.2:3b-instruct-fp16-True-8-10]
PASSED

tests/integration/inference/test_openai_completion.py::test_inference_store_tool_calls[openai_client-txt=ollama/llama3.2:3b-instruct-fp16-True-9-10]
PASSED

tests/integration/inference/test_openai_completion.py::test_inference_store_tool_calls[openai_client-txt=ollama/llama3.2:3b-instruct-fp16-True-10-10]
PASSED

tests/integration/inference/test_openai_completion.py::test_inference_store_tool_calls[client_with_models-txt=ollama/llama3.2:3b-instruct-fp16-True-1-10]
PASSED

tests/integration/inference/test_openai_completion.py::test_inference_store_tool_calls[client_with_models-txt=ollama/llama3.2:3b-instruct-fp16-True-2-10]
PASSED

tests/integration/inference/test_openai_completion.py::test_inference_store_tool_calls[client_with_models-txt=ollama/llama3.2:3b-instruct-fp16-True-3-10]
PASSED

tests/integration/inference/test_openai_completion.py::test_inference_store_tool_calls[client_with_models-txt=ollama/llama3.2:3b-instruct-fp16-True-4-10]
PASSED

tests/integration/inference/test_openai_completion.py::test_inference_store_tool_calls[client_with_models-txt=ollama/llama3.2:3b-instruct-fp16-True-5-10]
PASSED

tests/integration/inference/test_openai_completion.py::test_inference_store_tool_calls[client_with_models-txt=ollama/llama3.2:3b-instruct-fp16-True-6-10]
PASSED

tests/integration/inference/test_openai_completion.py::test_inference_store_tool_calls[client_with_models-txt=ollama/llama3.2:3b-instruct-fp16-True-7-10]
PASSED

tests/integration/inference/test_openai_completion.py::test_inference_store_tool_calls[client_with_models-txt=ollama/llama3.2:3b-instruct-fp16-True-8-10]
PASSED

tests/integration/inference/test_openai_completion.py::test_inference_store_tool_calls[client_with_models-txt=ollama/llama3.2:3b-instruct-fp16-True-9-10]
PASSED

tests/integration/inference/test_openai_completion.py::test_inference_store_tool_calls[client_with_models-txt=ollama/llama3.2:3b-instruct-fp16-True-10-10]
PASSEDTerminating llama stack server process...
Terminating process 53307 and its group...
Server process and children terminated gracefully
---
 .../inference/test_openai_completion.py       | 25 +++++++++++++++++--
 1 file changed, 23 insertions(+), 2 deletions(-)

diff --git a/tests/integration/inference/test_openai_completion.py b/tests/integration/inference/test_openai_completion.py
index 72137662d..62185e470 100644
--- a/tests/integration/inference/test_openai_completion.py
+++ b/tests/integration/inference/test_openai_completion.py
@@ -5,6 +5,8 @@
 # the root directory of this source tree.
 
 
+import time
+
 import pytest
 
 from ..test_cases.test_case import TestCase
@@ -323,8 +325,15 @@ def test_inference_store(compat_client, client_with_models, text_model_id, strea
         response_id = response.id
         content = response.choices[0].message.content
 
-    responses = client.chat.completions.list(limit=1000)
-    assert response_id in [r.id for r in responses.data]
+    tries = 0
+    while tries < 10:
+        responses = client.chat.completions.list(limit=1000)
+        if response_id in [r.id for r in responses.data]:
+            break
+        else:
+            tries += 1
+            time.sleep(0.1)
+    assert tries < 10, f"Response {response_id} not found after 1 second"
 
     retrieved_response = client.chat.completions.retrieve(response_id)
     assert retrieved_response.id == response_id
@@ -388,6 +397,18 @@ def test_inference_store_tool_calls(compat_client, client_with_models, text_mode
         response_id = response.id
         content = response.choices[0].message.content
 
+    # wait for the response to be stored
+    tries = 0
+    while tries < 10:
+        responses = client.chat.completions.list(limit=1000)
+        if response_id in [r.id for r in responses.data]:
+            break
+        else:
+            tries += 1
+            time.sleep(0.1)
+
+    assert tries < 10, f"Response {response_id} not found after 1 second"
+
     responses = client.chat.completions.list(limit=1000)
     assert response_id in [r.id for r in responses.data]
 

From 0b00c68d59d28ea4a502ccb54708bd384c4dea73 Mon Sep 17 00:00:00 2001
From: Sumanth Kamenani <skamenan@redhat.com>
Date: Fri, 5 Sep 2025 04:45:11 -0400
Subject: [PATCH 15/76] fix: use lambda pattern for bedrock config env vars
 (#3307)

# What does this PR do?

Improved bedrock provider config to read from environment variables like
AWS_ACCESS_KEY_ID. Updated all
fields to use default_factory with lambda patterns like the nvidia
provider does.

  Now the environment variables work as documented.

  Closes #3305

  ## Test Plan

  Ran the new bedrock config tests:
  ```bash
python -m pytest tests/unit/providers/inference/bedrock/test_config.py
-v

Verified existing provider tests still work:
  python -m pytest tests/unit/providers/test_configs.py -v
---
 .../providers/inference/remote_bedrock.md     |  4 +-
 .../source/providers/safety/remote_bedrock.md |  4 +-
 llama_stack/providers/utils/bedrock/config.py | 22 ++++---
 .../inference/bedrock/test_config.py          | 63 +++++++++++++++++++
 4 files changed, 79 insertions(+), 14 deletions(-)
 create mode 100644 tests/unit/providers/inference/bedrock/test_config.py

diff --git a/docs/source/providers/inference/remote_bedrock.md b/docs/source/providers/inference/remote_bedrock.md
index 1454c54c2..216dd4adb 100644
--- a/docs/source/providers/inference/remote_bedrock.md
+++ b/docs/source/providers/inference/remote_bedrock.md
@@ -15,8 +15,8 @@ AWS Bedrock inference provider for accessing various AI models through AWS's man
 | `profile_name` | `str \| None` | No |  | The profile name that contains credentials to use.Default use environment variable: AWS_PROFILE |
 | `total_max_attempts` | `int \| None` | No |  | An integer representing the maximum number of attempts that will be made for a single request, including the initial attempt. Default use environment variable: AWS_MAX_ATTEMPTS |
 | `retry_mode` | `str \| None` | No |  | A string representing the type of retries Boto3 will perform.Default use environment variable: AWS_RETRY_MODE |
-| `connect_timeout` | `float \| None` | No | 60 | The time in seconds till a timeout exception is thrown when attempting to make a connection. The default is 60 seconds. |
-| `read_timeout` | `float \| None` | No | 60 | The time in seconds till a timeout exception is thrown when attempting to read from a connection.The default is 60 seconds. |
+| `connect_timeout` | `float \| None` | No | 60.0 | The time in seconds till a timeout exception is thrown when attempting to make a connection. The default is 60 seconds. |
+| `read_timeout` | `float \| None` | No | 60.0 | The time in seconds till a timeout exception is thrown when attempting to read from a connection.The default is 60 seconds. |
 | `session_ttl` | `int \| None` | No | 3600 | The time in seconds till a session expires. The default is 3600 seconds (1 hour). |
 
 ## Sample Configuration
diff --git a/docs/source/providers/safety/remote_bedrock.md b/docs/source/providers/safety/remote_bedrock.md
index 3c1d6bcb0..99d77dd72 100644
--- a/docs/source/providers/safety/remote_bedrock.md
+++ b/docs/source/providers/safety/remote_bedrock.md
@@ -15,8 +15,8 @@ AWS Bedrock safety provider for content moderation using AWS's safety services.
 | `profile_name` | `str \| None` | No |  | The profile name that contains credentials to use.Default use environment variable: AWS_PROFILE |
 | `total_max_attempts` | `int \| None` | No |  | An integer representing the maximum number of attempts that will be made for a single request, including the initial attempt. Default use environment variable: AWS_MAX_ATTEMPTS |
 | `retry_mode` | `str \| None` | No |  | A string representing the type of retries Boto3 will perform.Default use environment variable: AWS_RETRY_MODE |
-| `connect_timeout` | `float \| None` | No | 60 | The time in seconds till a timeout exception is thrown when attempting to make a connection. The default is 60 seconds. |
-| `read_timeout` | `float \| None` | No | 60 | The time in seconds till a timeout exception is thrown when attempting to read from a connection.The default is 60 seconds. |
+| `connect_timeout` | `float \| None` | No | 60.0 | The time in seconds till a timeout exception is thrown when attempting to make a connection. The default is 60 seconds. |
+| `read_timeout` | `float \| None` | No | 60.0 | The time in seconds till a timeout exception is thrown when attempting to read from a connection.The default is 60 seconds. |
 | `session_ttl` | `int \| None` | No | 3600 | The time in seconds till a session expires. The default is 3600 seconds (1 hour). |
 
 ## Sample Configuration
diff --git a/llama_stack/providers/utils/bedrock/config.py b/llama_stack/providers/utils/bedrock/config.py
index b25617d76..2745c88cb 100644
--- a/llama_stack/providers/utils/bedrock/config.py
+++ b/llama_stack/providers/utils/bedrock/config.py
@@ -4,53 +4,55 @@
 # This source code is licensed under the terms described in the LICENSE file in
 # the root directory of this source tree.
 
+import os
+
 from pydantic import BaseModel, Field
 
 
 class BedrockBaseConfig(BaseModel):
     aws_access_key_id: str | None = Field(
-        default=None,
+        default_factory=lambda: os.getenv("AWS_ACCESS_KEY_ID"),
         description="The AWS access key to use. Default use environment variable: AWS_ACCESS_KEY_ID",
     )
     aws_secret_access_key: str | None = Field(
-        default=None,
+        default_factory=lambda: os.getenv("AWS_SECRET_ACCESS_KEY"),
         description="The AWS secret access key to use. Default use environment variable: AWS_SECRET_ACCESS_KEY",
     )
     aws_session_token: str | None = Field(
-        default=None,
+        default_factory=lambda: os.getenv("AWS_SESSION_TOKEN"),
         description="The AWS session token to use. Default use environment variable: AWS_SESSION_TOKEN",
     )
     region_name: str | None = Field(
-        default=None,
+        default_factory=lambda: os.getenv("AWS_DEFAULT_REGION"),
         description="The default AWS Region to use, for example, us-west-1 or us-west-2."
         "Default use environment variable: AWS_DEFAULT_REGION",
     )
     profile_name: str | None = Field(
-        default=None,
+        default_factory=lambda: os.getenv("AWS_PROFILE"),
         description="The profile name that contains credentials to use.Default use environment variable: AWS_PROFILE",
     )
     total_max_attempts: int | None = Field(
-        default=None,
+        default_factory=lambda: int(val) if (val := os.getenv("AWS_MAX_ATTEMPTS")) else None,
         description="An integer representing the maximum number of attempts that will be made for a single request, "
         "including the initial attempt. Default use environment variable: AWS_MAX_ATTEMPTS",
     )
     retry_mode: str | None = Field(
-        default=None,
+        default_factory=lambda: os.getenv("AWS_RETRY_MODE"),
         description="A string representing the type of retries Boto3 will perform."
         "Default use environment variable: AWS_RETRY_MODE",
     )
     connect_timeout: float | None = Field(
-        default=60,
+        default_factory=lambda: float(os.getenv("AWS_CONNECT_TIMEOUT", "60")),
         description="The time in seconds till a timeout exception is thrown when attempting to make a connection. "
         "The default is 60 seconds.",
     )
     read_timeout: float | None = Field(
-        default=60,
+        default_factory=lambda: float(os.getenv("AWS_READ_TIMEOUT", "60")),
         description="The time in seconds till a timeout exception is thrown when attempting to read from a connection."
         "The default is 60 seconds.",
     )
     session_ttl: int | None = Field(
-        default=3600,
+        default_factory=lambda: int(os.getenv("AWS_SESSION_TTL", "3600")),
         description="The time in seconds till a session expires. The default is 3600 seconds (1 hour).",
     )
 
diff --git a/tests/unit/providers/inference/bedrock/test_config.py b/tests/unit/providers/inference/bedrock/test_config.py
new file mode 100644
index 000000000..1b8639f2e
--- /dev/null
+++ b/tests/unit/providers/inference/bedrock/test_config.py
@@ -0,0 +1,63 @@
+# Copyright (c) Meta Platforms, Inc. and affiliates.
+# All rights reserved.
+#
+# This source code is licensed under the terms described in the LICENSE file in
+# the root directory of this source tree.
+
+import os
+from unittest.mock import patch
+
+from llama_stack.providers.utils.bedrock.config import BedrockBaseConfig
+
+
+class TestBedrockBaseConfig:
+    def test_defaults_work_without_env_vars(self):
+        with patch.dict(os.environ, {}, clear=True):
+            config = BedrockBaseConfig()
+
+            # Basic creds should be None
+            assert config.aws_access_key_id is None
+            assert config.aws_secret_access_key is None
+            assert config.region_name is None
+
+            # Timeouts get defaults
+            assert config.connect_timeout == 60.0
+            assert config.read_timeout == 60.0
+            assert config.session_ttl == 3600
+
+    def test_env_vars_get_picked_up(self):
+        env_vars = {
+            "AWS_ACCESS_KEY_ID": "AKIATEST123",
+            "AWS_SECRET_ACCESS_KEY": "secret123",
+            "AWS_DEFAULT_REGION": "us-west-2",
+            "AWS_MAX_ATTEMPTS": "5",
+            "AWS_RETRY_MODE": "adaptive",
+            "AWS_CONNECT_TIMEOUT": "30",
+        }
+
+        with patch.dict(os.environ, env_vars, clear=True):
+            config = BedrockBaseConfig()
+
+            assert config.aws_access_key_id == "AKIATEST123"
+            assert config.aws_secret_access_key == "secret123"
+            assert config.region_name == "us-west-2"
+            assert config.total_max_attempts == 5
+            assert config.retry_mode == "adaptive"
+            assert config.connect_timeout == 30.0
+
+    def test_partial_env_setup(self):
+        # Just setting one timeout var
+        with patch.dict(os.environ, {"AWS_CONNECT_TIMEOUT": "120"}, clear=True):
+            config = BedrockBaseConfig()
+
+            assert config.connect_timeout == 120.0
+            assert config.read_timeout == 60.0  # still default
+            assert config.aws_access_key_id is None
+
+    def test_bad_max_attempts_breaks(self):
+        with patch.dict(os.environ, {"AWS_MAX_ATTEMPTS": "not_a_number"}, clear=True):
+            try:
+                BedrockBaseConfig()
+                raise AssertionError("Should have failed on bad int conversion")
+            except ValueError:
+                pass  # expected

From 64b297716247317a0e0714b61fc7ee77bbfb9e52 Mon Sep 17 00:00:00 2001
From: Derek Higgins <derekh@redhat.com>
Date: Fri, 5 Sep 2025 13:09:36 +0100
Subject: [PATCH 16/76] fix: Fix locations of distrubution runtime directories
 (#3336)

The defaults were mixed up

Signed-off-by: Derek Higgins <derekh@redhat.com>
---
 llama_stack/distributions/ci-tests/ci_tests.py |  4 +---
 llama_stack/distributions/ci-tests/run.yaml    | 18 +++++++++---------
 llama_stack/distributions/starter-gpu/run.yaml | 18 +++++++++---------
 .../distributions/starter-gpu/starter_gpu.py   |  4 +---
 llama_stack/distributions/starter/starter.py   |  3 +--
 5 files changed, 21 insertions(+), 26 deletions(-)

diff --git a/llama_stack/distributions/ci-tests/ci_tests.py b/llama_stack/distributions/ci-tests/ci_tests.py
index 8fb61faca..ab102f5f3 100644
--- a/llama_stack/distributions/ci-tests/ci_tests.py
+++ b/llama_stack/distributions/ci-tests/ci_tests.py
@@ -11,9 +11,7 @@ from ..starter.starter import get_distribution_template as get_starter_distribut
 
 
 def get_distribution_template() -> DistributionTemplate:
-    template = get_starter_distribution_template()
-    name = "ci-tests"
-    template.name = name
+    template = get_starter_distribution_template(name="ci-tests")
     template.description = "CI tests for Llama Stack"
 
     return template
diff --git a/llama_stack/distributions/ci-tests/run.yaml b/llama_stack/distributions/ci-tests/run.yaml
index 7523df581..26a677c7a 100644
--- a/llama_stack/distributions/ci-tests/run.yaml
+++ b/llama_stack/distributions/ci-tests/run.yaml
@@ -89,28 +89,28 @@ providers:
     config:
       kvstore:
         type: sqlite
-        db_path: ${env.SQLITE_STORE_DIR:=~/.llama/distributions/starter}/faiss_store.db
+        db_path: ${env.SQLITE_STORE_DIR:=~/.llama/distributions/ci-tests}/faiss_store.db
   - provider_id: sqlite-vec
     provider_type: inline::sqlite-vec
     config:
-      db_path: ${env.SQLITE_STORE_DIR:=~/.llama/distributions/starter}/sqlite_vec.db
+      db_path: ${env.SQLITE_STORE_DIR:=~/.llama/distributions/ci-tests}/sqlite_vec.db
       kvstore:
         type: sqlite
-        db_path: ${env.SQLITE_STORE_DIR:=~/.llama/distributions/starter}/sqlite_vec_registry.db
+        db_path: ${env.SQLITE_STORE_DIR:=~/.llama/distributions/ci-tests}/sqlite_vec_registry.db
   - provider_id: ${env.MILVUS_URL:+milvus}
     provider_type: inline::milvus
     config:
-      db_path: ${env.MILVUS_DB_PATH:=~/.llama/distributions/starter}/milvus.db
+      db_path: ${env.MILVUS_DB_PATH:=~/.llama/distributions/ci-tests}/milvus.db
       kvstore:
         type: sqlite
-        db_path: ${env.SQLITE_STORE_DIR:=~/.llama/distributions/starter}/milvus_registry.db
+        db_path: ${env.SQLITE_STORE_DIR:=~/.llama/distributions/ci-tests}/milvus_registry.db
   - provider_id: ${env.CHROMADB_URL:+chromadb}
     provider_type: remote::chromadb
     config:
       url: ${env.CHROMADB_URL:=}
       kvstore:
         type: sqlite
-        db_path: ${env.SQLITE_STORE_DIR:=~/.llama/distributions/starter/}/chroma_remote_registry.db
+        db_path: ${env.SQLITE_STORE_DIR:=~/.llama/distributions/ci-tests/}/chroma_remote_registry.db
   - provider_id: ${env.PGVECTOR_DB:+pgvector}
     provider_type: remote::pgvector
     config:
@@ -121,15 +121,15 @@ providers:
       password: ${env.PGVECTOR_PASSWORD:=}
       kvstore:
         type: sqlite
-        db_path: ${env.SQLITE_STORE_DIR:=~/.llama/distributions/starter}/pgvector_registry.db
+        db_path: ${env.SQLITE_STORE_DIR:=~/.llama/distributions/ci-tests}/pgvector_registry.db
   files:
   - provider_id: meta-reference-files
     provider_type: inline::localfs
     config:
-      storage_dir: ${env.FILES_STORAGE_DIR:=~/.llama/distributions/starter/files}
+      storage_dir: ${env.FILES_STORAGE_DIR:=~/.llama/distributions/ci-tests/files}
       metadata_store:
         type: sqlite
-        db_path: ${env.SQLITE_STORE_DIR:=~/.llama/distributions/starter}/files_metadata.db
+        db_path: ${env.SQLITE_STORE_DIR:=~/.llama/distributions/ci-tests}/files_metadata.db
   safety:
   - provider_id: llama-guard
     provider_type: inline::llama-guard
diff --git a/llama_stack/distributions/starter-gpu/run.yaml b/llama_stack/distributions/starter-gpu/run.yaml
index 8aed61519..5d9dfcb27 100644
--- a/llama_stack/distributions/starter-gpu/run.yaml
+++ b/llama_stack/distributions/starter-gpu/run.yaml
@@ -89,28 +89,28 @@ providers:
     config:
       kvstore:
         type: sqlite
-        db_path: ${env.SQLITE_STORE_DIR:=~/.llama/distributions/starter}/faiss_store.db
+        db_path: ${env.SQLITE_STORE_DIR:=~/.llama/distributions/starter-gpu}/faiss_store.db
   - provider_id: sqlite-vec
     provider_type: inline::sqlite-vec
     config:
-      db_path: ${env.SQLITE_STORE_DIR:=~/.llama/distributions/starter}/sqlite_vec.db
+      db_path: ${env.SQLITE_STORE_DIR:=~/.llama/distributions/starter-gpu}/sqlite_vec.db
       kvstore:
         type: sqlite
-        db_path: ${env.SQLITE_STORE_DIR:=~/.llama/distributions/starter}/sqlite_vec_registry.db
+        db_path: ${env.SQLITE_STORE_DIR:=~/.llama/distributions/starter-gpu}/sqlite_vec_registry.db
   - provider_id: ${env.MILVUS_URL:+milvus}
     provider_type: inline::milvus
     config:
-      db_path: ${env.MILVUS_DB_PATH:=~/.llama/distributions/starter}/milvus.db
+      db_path: ${env.MILVUS_DB_PATH:=~/.llama/distributions/starter-gpu}/milvus.db
       kvstore:
         type: sqlite
-        db_path: ${env.SQLITE_STORE_DIR:=~/.llama/distributions/starter}/milvus_registry.db
+        db_path: ${env.SQLITE_STORE_DIR:=~/.llama/distributions/starter-gpu}/milvus_registry.db
   - provider_id: ${env.CHROMADB_URL:+chromadb}
     provider_type: remote::chromadb
     config:
       url: ${env.CHROMADB_URL:=}
       kvstore:
         type: sqlite
-        db_path: ${env.SQLITE_STORE_DIR:=~/.llama/distributions/starter/}/chroma_remote_registry.db
+        db_path: ${env.SQLITE_STORE_DIR:=~/.llama/distributions/starter-gpu/}/chroma_remote_registry.db
   - provider_id: ${env.PGVECTOR_DB:+pgvector}
     provider_type: remote::pgvector
     config:
@@ -121,15 +121,15 @@ providers:
       password: ${env.PGVECTOR_PASSWORD:=}
       kvstore:
         type: sqlite
-        db_path: ${env.SQLITE_STORE_DIR:=~/.llama/distributions/starter}/pgvector_registry.db
+        db_path: ${env.SQLITE_STORE_DIR:=~/.llama/distributions/starter-gpu}/pgvector_registry.db
   files:
   - provider_id: meta-reference-files
     provider_type: inline::localfs
     config:
-      storage_dir: ${env.FILES_STORAGE_DIR:=~/.llama/distributions/starter/files}
+      storage_dir: ${env.FILES_STORAGE_DIR:=~/.llama/distributions/starter-gpu/files}
       metadata_store:
         type: sqlite
-        db_path: ${env.SQLITE_STORE_DIR:=~/.llama/distributions/starter}/files_metadata.db
+        db_path: ${env.SQLITE_STORE_DIR:=~/.llama/distributions/starter-gpu}/files_metadata.db
   safety:
   - provider_id: llama-guard
     provider_type: inline::llama-guard
diff --git a/llama_stack/distributions/starter-gpu/starter_gpu.py b/llama_stack/distributions/starter-gpu/starter_gpu.py
index 245334749..e7efcb283 100644
--- a/llama_stack/distributions/starter-gpu/starter_gpu.py
+++ b/llama_stack/distributions/starter-gpu/starter_gpu.py
@@ -11,9 +11,7 @@ from ..starter.starter import get_distribution_template as get_starter_distribut
 
 
 def get_distribution_template() -> DistributionTemplate:
-    template = get_starter_distribution_template()
-    name = "starter-gpu"
-    template.name = name
+    template = get_starter_distribution_template(name="starter-gpu")
     template.description = "Quick start template for running Llama Stack with several popular providers. This distribution is intended for GPU-enabled environments."
 
     template.providers["post_training"] = [
diff --git a/llama_stack/distributions/starter/starter.py b/llama_stack/distributions/starter/starter.py
index a4bbc6371..2fca52700 100644
--- a/llama_stack/distributions/starter/starter.py
+++ b/llama_stack/distributions/starter/starter.py
@@ -99,9 +99,8 @@ def get_remote_inference_providers() -> list[Provider]:
     return inference_providers
 
 
-def get_distribution_template() -> DistributionTemplate:
+def get_distribution_template(name: str = "starter") -> DistributionTemplate:
     remote_inference_providers = get_remote_inference_providers()
-    name = "starter"
 
     providers = {
         "inference": [BuildProvider(provider_type=p.provider_type, module=p.module) for p in remote_inference_providers]

From e2fe39aee108c1796ddc1be1e44acd25c800082e Mon Sep 17 00:00:00 2001
From: Francisco Arceo <arceofrancisco@gmail.com>
Date: Fri, 5 Sep 2025 07:40:34 -0600
Subject: [PATCH 17/76] feat!: Migrate Vector DB IDs to Vector Store IDs
 (breaking change) (#3253)
MIME-Version: 1.0
Content-Type: text/plain; charset=UTF-8
Content-Transfer-Encoding: 8bit

# What does this PR do?
This change migrates the VectorDB id generation to Vector Stores.

This is a breaking change for **_some users_** that may have application
code using the `vector_db_id` parameter in the request of the VectorDB
protocol instead of the `VectorDB.identifier` in the response.

By default we will now create a Vector Store every time we register a
VectorDB. The caveat with this approach is that this maps the
`vector_db_id` → `vector_store.name`. This is a reasonable tradeoff to
transition users towards OpenAI Vector Stores.

As an added benefit, registering VectorDBs will result in them appearing
in the VectorStores admin UI.

### Why?
This PR makes the `POST` API call to `/v1/vector-dbs` swap the
`vector_db_id` parameter in the **request body** into the VectorStore's
name field and sets the `vector_db_id` to the generated vector store id
(e.g., `vs_038247dd-4bbb-4dbb-a6be-d5ecfd46cfdb`).

That means that users would have to do something like follows in their
application code:

```python
res = client.vector_dbs.register(
    vector_db_id='my-vector-db-id',
    embedding_model='ollama/all-minilm:l6-v2',
    embedding_dimension=384,
)
vector_db_id = res.identifier
```

And then the rest of their code would behave, including `VectorIO`'s
insert protocol using `vector_db_id` in the request.

An alternative implementation would be to just delete the `vector_db_id`
parameter in `VectorDB` but the end result would still require users
having to write `vector_db_id = res.identifier` since
`VectorStores.create()` generates the ID for you.

So this approach felt the easiest way to migrate users towards
VectorStores (subsequent PRs will be added to trigger `files.create()`
and `vector_stores.files.create()`).

## Test Plan
Unit tests and integration tests have been added.

Signed-off-by: Francisco Javier Arceo <farceo@redhat.com>
---
 llama_stack/core/routing_tables/vector_dbs.py |  26 +++-
 tests/integration/vector_io/test_vector_io.py |  75 +++++++----
 .../routers/test_routing_tables.py            |  30 ++++-
 .../routing_tables/test_vector_dbs.py         | 127 ++++++++++++++++--
 4 files changed, 209 insertions(+), 49 deletions(-)

diff --git a/llama_stack/core/routing_tables/vector_dbs.py b/llama_stack/core/routing_tables/vector_dbs.py
index 00f71b4fe..497894064 100644
--- a/llama_stack/core/routing_tables/vector_dbs.py
+++ b/llama_stack/core/routing_tables/vector_dbs.py
@@ -52,7 +52,6 @@ class VectorDBsRoutingTable(CommonRoutingTableImpl, VectorDBs):
         provider_vector_db_id: str | None = None,
         vector_db_name: str | None = None,
     ) -> VectorDB:
-        provider_vector_db_id = provider_vector_db_id or vector_db_id
         if provider_id is None:
             if len(self.impls_by_provider_id) > 0:
                 provider_id = list(self.impls_by_provider_id.keys())[0]
@@ -69,14 +68,33 @@ class VectorDBsRoutingTable(CommonRoutingTableImpl, VectorDBs):
             raise ModelTypeError(embedding_model, model.model_type, ModelType.embedding)
         if "embedding_dimension" not in model.metadata:
             raise ValueError(f"Model {embedding_model} does not have an embedding dimension")
+
+        provider = self.impls_by_provider_id[provider_id]
+        logger.warning(
+            "VectorDB is being deprecated in future releases in favor of VectorStore. Please migrate your usage accordingly."
+        )
+        vector_store = await provider.openai_create_vector_store(
+            name=vector_db_name or vector_db_id,
+            embedding_model=embedding_model,
+            embedding_dimension=model.metadata["embedding_dimension"],
+            provider_id=provider_id,
+            provider_vector_db_id=provider_vector_db_id,
+        )
+
+        vector_store_id = vector_store.id
+        actual_provider_vector_db_id = provider_vector_db_id or vector_store_id
+        logger.warning(
+            f"Ignoring vector_db_id {vector_db_id} and using vector_store_id {vector_store_id} instead. Setting VectorDB {vector_db_id} to VectorDB.vector_db_name"
+        )
+
         vector_db_data = {
-            "identifier": vector_db_id,
+            "identifier": vector_store_id,
             "type": ResourceType.vector_db.value,
             "provider_id": provider_id,
-            "provider_resource_id": provider_vector_db_id,
+            "provider_resource_id": actual_provider_vector_db_id,
             "embedding_model": embedding_model,
             "embedding_dimension": model.metadata["embedding_dimension"],
-            "vector_db_name": vector_db_name,
+            "vector_db_name": vector_store.name,
         }
         vector_db = TypeAdapter(VectorDBWithOwner).validate_python(vector_db_data)
         await self.register_object(vector_db)
diff --git a/tests/integration/vector_io/test_vector_io.py b/tests/integration/vector_io/test_vector_io.py
index 07faa0db1..979eff6bb 100644
--- a/tests/integration/vector_io/test_vector_io.py
+++ b/tests/integration/vector_io/test_vector_io.py
@@ -47,34 +47,45 @@ def client_with_empty_registry(client_with_models):
 
 
 def test_vector_db_retrieve(client_with_empty_registry, embedding_model_id, embedding_dimension):
-    # Register a memory bank first
-    vector_db_id = "test_vector_db"
-    client_with_empty_registry.vector_dbs.register(
-        vector_db_id=vector_db_id,
+    vector_db_name = "test_vector_db"
+    register_response = client_with_empty_registry.vector_dbs.register(
+        vector_db_id=vector_db_name,
         embedding_model=embedding_model_id,
         embedding_dimension=embedding_dimension,
     )
 
+    actual_vector_db_id = register_response.identifier
+
     # Retrieve the memory bank and validate its properties
-    response = client_with_empty_registry.vector_dbs.retrieve(vector_db_id=vector_db_id)
+    response = client_with_empty_registry.vector_dbs.retrieve(vector_db_id=actual_vector_db_id)
     assert response is not None
-    assert response.identifier == vector_db_id
+    assert response.identifier == actual_vector_db_id
     assert response.embedding_model == embedding_model_id
-    assert response.provider_resource_id == vector_db_id
+    assert response.identifier.startswith("vs_")
 
 
 def test_vector_db_register(client_with_empty_registry, embedding_model_id, embedding_dimension):
-    vector_db_id = "test_vector_db"
-    client_with_empty_registry.vector_dbs.register(
-        vector_db_id=vector_db_id,
+    vector_db_name = "test_vector_db"
+    response = client_with_empty_registry.vector_dbs.register(
+        vector_db_id=vector_db_name,
         embedding_model=embedding_model_id,
         embedding_dimension=embedding_dimension,
     )
 
-    vector_dbs_after_register = [vector_db.identifier for vector_db in client_with_empty_registry.vector_dbs.list()]
-    assert vector_dbs_after_register == [vector_db_id]
+    actual_vector_db_id = response.identifier
+    assert actual_vector_db_id.startswith("vs_")
+    assert actual_vector_db_id != vector_db_name
 
-    client_with_empty_registry.vector_dbs.unregister(vector_db_id=vector_db_id)
+    vector_dbs_after_register = [vector_db.identifier for vector_db in client_with_empty_registry.vector_dbs.list()]
+    assert vector_dbs_after_register == [actual_vector_db_id]
+
+    vector_stores = client_with_empty_registry.vector_stores.list()
+    assert len(vector_stores.data) == 1
+    vector_store = vector_stores.data[0]
+    assert vector_store.id == actual_vector_db_id
+    assert vector_store.name == vector_db_name
+
+    client_with_empty_registry.vector_dbs.unregister(vector_db_id=actual_vector_db_id)
 
     vector_dbs = [vector_db.identifier for vector_db in client_with_empty_registry.vector_dbs.list()]
     assert len(vector_dbs) == 0
@@ -91,20 +102,22 @@ def test_vector_db_register(client_with_empty_registry, embedding_model_id, embe
     ],
 )
 def test_insert_chunks(client_with_empty_registry, embedding_model_id, embedding_dimension, sample_chunks, test_case):
-    vector_db_id = "test_vector_db"
-    client_with_empty_registry.vector_dbs.register(
-        vector_db_id=vector_db_id,
+    vector_db_name = "test_vector_db"
+    register_response = client_with_empty_registry.vector_dbs.register(
+        vector_db_id=vector_db_name,
         embedding_model=embedding_model_id,
         embedding_dimension=embedding_dimension,
     )
 
+    actual_vector_db_id = register_response.identifier
+
     client_with_empty_registry.vector_io.insert(
-        vector_db_id=vector_db_id,
+        vector_db_id=actual_vector_db_id,
         chunks=sample_chunks,
     )
 
     response = client_with_empty_registry.vector_io.query(
-        vector_db_id=vector_db_id,
+        vector_db_id=actual_vector_db_id,
         query="What is the capital of France?",
     )
     assert response is not None
@@ -113,7 +126,7 @@ def test_insert_chunks(client_with_empty_registry, embedding_model_id, embedding
 
     query, expected_doc_id = test_case
     response = client_with_empty_registry.vector_io.query(
-        vector_db_id=vector_db_id,
+        vector_db_id=actual_vector_db_id,
         query=query,
     )
     assert response is not None
@@ -128,13 +141,15 @@ def test_insert_chunks_with_precomputed_embeddings(client_with_empty_registry, e
         "remote::qdrant": {"score_threshold": -1.0},
         "inline::qdrant": {"score_threshold": -1.0},
     }
-    vector_db_id = "test_precomputed_embeddings_db"
-    client_with_empty_registry.vector_dbs.register(
-        vector_db_id=vector_db_id,
+    vector_db_name = "test_precomputed_embeddings_db"
+    register_response = client_with_empty_registry.vector_dbs.register(
+        vector_db_id=vector_db_name,
         embedding_model=embedding_model_id,
         embedding_dimension=embedding_dimension,
     )
 
+    actual_vector_db_id = register_response.identifier
+
     chunks_with_embeddings = [
         Chunk(
             content="This is a test chunk with precomputed embedding.",
@@ -144,13 +159,13 @@ def test_insert_chunks_with_precomputed_embeddings(client_with_empty_registry, e
     ]
 
     client_with_empty_registry.vector_io.insert(
-        vector_db_id=vector_db_id,
+        vector_db_id=actual_vector_db_id,
         chunks=chunks_with_embeddings,
     )
 
     provider = [p.provider_id for p in client_with_empty_registry.providers.list() if p.api == "vector_io"][0]
     response = client_with_empty_registry.vector_io.query(
-        vector_db_id=vector_db_id,
+        vector_db_id=actual_vector_db_id,
         query="precomputed embedding test",
         params=vector_io_provider_params_dict.get(provider, None),
     )
@@ -173,13 +188,15 @@ def test_query_returns_valid_object_when_identical_to_embedding_in_vdb(
         "remote::qdrant": {"score_threshold": 0.0},
         "inline::qdrant": {"score_threshold": 0.0},
     }
-    vector_db_id = "test_precomputed_embeddings_db"
-    client_with_empty_registry.vector_dbs.register(
-        vector_db_id=vector_db_id,
+    vector_db_name = "test_precomputed_embeddings_db"
+    register_response = client_with_empty_registry.vector_dbs.register(
+        vector_db_id=vector_db_name,
         embedding_model=embedding_model_id,
         embedding_dimension=embedding_dimension,
     )
 
+    actual_vector_db_id = register_response.identifier
+
     chunks_with_embeddings = [
         Chunk(
             content="duplicate",
@@ -189,13 +206,13 @@ def test_query_returns_valid_object_when_identical_to_embedding_in_vdb(
     ]
 
     client_with_empty_registry.vector_io.insert(
-        vector_db_id=vector_db_id,
+        vector_db_id=actual_vector_db_id,
         chunks=chunks_with_embeddings,
     )
 
     provider = [p.provider_id for p in client_with_empty_registry.providers.list() if p.api == "vector_io"][0]
     response = client_with_empty_registry.vector_io.query(
-        vector_db_id=vector_db_id,
+        vector_db_id=actual_vector_db_id,
         query="duplicate",
         params=vector_io_provider_params_dict.get(provider, None),
     )
diff --git a/tests/unit/distribution/routers/test_routing_tables.py b/tests/unit/distribution/routers/test_routing_tables.py
index 2652f5c8d..1ceee81c6 100644
--- a/tests/unit/distribution/routers/test_routing_tables.py
+++ b/tests/unit/distribution/routers/test_routing_tables.py
@@ -146,6 +146,20 @@ class VectorDBImpl(Impl):
     async def unregister_vector_db(self, vector_db_id: str):
         return vector_db_id
 
+    async def openai_create_vector_store(self, **kwargs):
+        import time
+        import uuid
+
+        from llama_stack.apis.vector_io.vector_io import VectorStoreFileCounts, VectorStoreObject
+
+        vector_store_id = kwargs.get("provider_vector_db_id") or f"vs_{uuid.uuid4()}"
+        return VectorStoreObject(
+            id=vector_store_id,
+            name=kwargs.get("name", vector_store_id),
+            created_at=int(time.time()),
+            file_counts=VectorStoreFileCounts(completed=0, cancelled=0, failed=0, in_progress=0, total=0),
+        )
+
 
 async def test_models_routing_table(cached_disk_dist_registry):
     table = ModelsRoutingTable({"test_provider": InferenceImpl()}, cached_disk_dist_registry, {})
@@ -247,17 +261,21 @@ async def test_vectordbs_routing_table(cached_disk_dist_registry):
     )
 
     # Register multiple vector databases and verify listing
-    await table.register_vector_db(vector_db_id="test-vectordb", embedding_model="test_provider/test-model")
-    await table.register_vector_db(vector_db_id="test-vectordb-2", embedding_model="test_provider/test-model")
+    vdb1 = await table.register_vector_db(vector_db_id="test-vectordb", embedding_model="test_provider/test-model")
+    vdb2 = await table.register_vector_db(vector_db_id="test-vectordb-2", embedding_model="test_provider/test-model")
     vector_dbs = await table.list_vector_dbs()
 
     assert len(vector_dbs.data) == 2
     vector_db_ids = {v.identifier for v in vector_dbs.data}
-    assert "test-vectordb" in vector_db_ids
-    assert "test-vectordb-2" in vector_db_ids
+    assert vdb1.identifier in vector_db_ids
+    assert vdb2.identifier in vector_db_ids
 
-    await table.unregister_vector_db(vector_db_id="test-vectordb")
-    await table.unregister_vector_db(vector_db_id="test-vectordb-2")
+    # Verify they have UUID-based identifiers
+    assert vdb1.identifier.startswith("vs_")
+    assert vdb2.identifier.startswith("vs_")
+
+    await table.unregister_vector_db(vector_db_id=vdb1.identifier)
+    await table.unregister_vector_db(vector_db_id=vdb2.identifier)
 
     vector_dbs = await table.list_vector_dbs()
     assert len(vector_dbs.data) == 0
diff --git a/tests/unit/distribution/routing_tables/test_vector_dbs.py b/tests/unit/distribution/routing_tables/test_vector_dbs.py
index 789eda433..3444f64c2 100644
--- a/tests/unit/distribution/routing_tables/test_vector_dbs.py
+++ b/tests/unit/distribution/routing_tables/test_vector_dbs.py
@@ -7,6 +7,7 @@
 # Unit tests for the routing tables vector_dbs
 
 import time
+import uuid
 from unittest.mock import AsyncMock
 
 import pytest
@@ -34,6 +35,7 @@ from tests.unit.distribution.routers.test_routing_tables import Impl, InferenceI
 class VectorDBImpl(Impl):
     def __init__(self):
         super().__init__(Api.vector_io)
+        self.vector_stores = {}
 
     async def register_vector_db(self, vector_db: VectorDB):
         return vector_db
@@ -114,8 +116,35 @@ class VectorDBImpl(Impl):
     async def openai_delete_vector_store_file(self, vector_store_id, file_id):
         return VectorStoreFileDeleteResponse(id=file_id, deleted=True)
 
+    async def openai_create_vector_store(
+        self,
+        name=None,
+        embedding_model=None,
+        embedding_dimension=None,
+        provider_id=None,
+        provider_vector_db_id=None,
+        **kwargs,
+    ):
+        vector_store_id = provider_vector_db_id or f"vs_{uuid.uuid4()}"
+        vector_store = VectorStoreObject(
+            id=vector_store_id,
+            name=name or vector_store_id,
+            created_at=int(time.time()),
+            file_counts=VectorStoreFileCounts(completed=0, cancelled=0, failed=0, in_progress=0, total=0),
+        )
+        self.vector_stores[vector_store_id] = vector_store
+        return vector_store
+
+    async def openai_list_vector_stores(self, **kwargs):
+        from llama_stack.apis.vector_io.vector_io import VectorStoreListResponse
+
+        return VectorStoreListResponse(
+            data=list(self.vector_stores.values()), has_more=False, first_id=None, last_id=None
+        )
+
 
 async def test_vectordbs_routing_table(cached_disk_dist_registry):
+    n = 10
     table = VectorDBsRoutingTable({"test_provider": VectorDBImpl()}, cached_disk_dist_registry, {})
     await table.initialize()
 
@@ -129,22 +158,98 @@ async def test_vectordbs_routing_table(cached_disk_dist_registry):
     )
 
     # Register multiple vector databases and verify listing
-    await table.register_vector_db(vector_db_id="test-vectordb", embedding_model="test-model")
-    await table.register_vector_db(vector_db_id="test-vectordb-2", embedding_model="test-model")
+    vdb_dict = {}
+    for i in range(n):
+        vdb_dict[i] = await table.register_vector_db(vector_db_id=f"test-vectordb-{i}", embedding_model="test-model")
+
     vector_dbs = await table.list_vector_dbs()
 
-    assert len(vector_dbs.data) == 2
+    assert len(vector_dbs.data) == len(vdb_dict)
     vector_db_ids = {v.identifier for v in vector_dbs.data}
-    assert "test-vectordb" in vector_db_ids
-    assert "test-vectordb-2" in vector_db_ids
-
-    await table.unregister_vector_db(vector_db_id="test-vectordb")
-    await table.unregister_vector_db(vector_db_id="test-vectordb-2")
+    for k in vdb_dict:
+        assert vdb_dict[k].identifier in vector_db_ids
+    for k in vdb_dict:
+        await table.unregister_vector_db(vector_db_id=vdb_dict[k].identifier)
 
     vector_dbs = await table.list_vector_dbs()
     assert len(vector_dbs.data) == 0
 
 
+async def test_vector_db_and_vector_store_id_mapping(cached_disk_dist_registry):
+    n = 10
+    impl = VectorDBImpl()
+    table = VectorDBsRoutingTable({"test_provider": impl}, cached_disk_dist_registry, {})
+    await table.initialize()
+
+    m_table = ModelsRoutingTable({"test_provider": InferenceImpl()}, cached_disk_dist_registry, {})
+    await m_table.initialize()
+    await m_table.register_model(
+        model_id="test-model",
+        provider_id="test_provider",
+        metadata={"embedding_dimension": 128},
+        model_type=ModelType.embedding,
+    )
+
+    vdb_dict = {}
+    for i in range(n):
+        vdb_dict[i] = await table.register_vector_db(vector_db_id=f"test-vectordb-{i}", embedding_model="test-model")
+
+    vector_dbs = await table.list_vector_dbs()
+    vector_db_ids = {v.identifier for v in vector_dbs.data}
+
+    vector_stores = await impl.openai_list_vector_stores()
+    vector_store_ids = {v.id for v in vector_stores.data}
+
+    assert vector_db_ids == vector_store_ids, (
+        f"Vector DB IDs {vector_db_ids} don't match vector store IDs {vector_store_ids}"
+    )
+
+    for vector_store in vector_stores.data:
+        vector_db = await table.get_vector_db(vector_store.id)
+        assert vector_store.name == vector_db.vector_db_name, (
+            f"Vector store name {vector_store.name} doesn't match vector store ID {vector_store.id}"
+        )
+
+    for vector_db_id in vector_db_ids:
+        await table.unregister_vector_db(vector_db_id)
+
+    assert len((await table.list_vector_dbs()).data) == 0
+
+
+async def test_vector_db_id_becomes_vector_store_name(cached_disk_dist_registry):
+    impl = VectorDBImpl()
+    table = VectorDBsRoutingTable({"test_provider": impl}, cached_disk_dist_registry, {})
+    await table.initialize()
+
+    m_table = ModelsRoutingTable({"test_provider": InferenceImpl()}, cached_disk_dist_registry, {})
+    await m_table.initialize()
+    await m_table.register_model(
+        model_id="test-model",
+        provider_id="test_provider",
+        metadata={"embedding_dimension": 128},
+        model_type=ModelType.embedding,
+    )
+
+    user_provided_id = "my-custom-vector-db"
+    await table.register_vector_db(vector_db_id=user_provided_id, embedding_model="test-model")
+
+    vector_stores = await impl.openai_list_vector_stores()
+    assert len(vector_stores.data) == 1
+
+    vector_store = vector_stores.data[0]
+
+    assert vector_store.name == user_provided_id
+
+    assert vector_store.id.startswith("vs_")
+    assert vector_store.id != user_provided_id
+
+    vector_dbs = await table.list_vector_dbs()
+    assert len(vector_dbs.data) == 1
+    assert vector_dbs.data[0].identifier == vector_store.id
+
+    await table.unregister_vector_db(vector_store.id)
+
+
 async def test_openai_vector_stores_routing_table_roles(cached_disk_dist_registry):
     impl = VectorDBImpl()
     impl.openai_retrieve_vector_store = AsyncMock(return_value="OK")
@@ -164,7 +269,8 @@ async def test_openai_vector_stores_routing_table_roles(cached_disk_dist_registr
 
     authorized_user = User(principal="alice", attributes={"roles": [authorized_team]})
     with request_provider_data_context({}, authorized_user):
-        _ = await table.register_vector_db(vector_db_id="vs1", embedding_model="test-model")
+        registered_vdb = await table.register_vector_db(vector_db_id="vs1", embedding_model="test-model")
+        authorized_table = registered_vdb.identifier  # Use the actual generated ID
 
     # Authorized reader
     with request_provider_data_context({}, authorized_user):
@@ -227,7 +333,8 @@ async def test_openai_vector_stores_routing_table_actions(cached_disk_dist_regis
     )
 
     with request_provider_data_context({}, admin_user):
-        await table.register_vector_db(vector_db_id=vector_db_id, embedding_model="test-model")
+        registered_vdb = await table.register_vector_db(vector_db_id=vector_db_id, embedding_model="test-model")
+        vector_db_id = registered_vdb.identifier  # Use the actual generated ID
 
     read_methods = [
         (table.openai_retrieve_vector_store, (vector_db_id,), {}),

From df1526991f6d5cfca05d3c4f1077b67f4832d93e Mon Sep 17 00:00:00 2001
From: Matthew Farrellee <matt@cs.wisc.edu>
Date: Fri, 5 Sep 2025 14:59:57 -0400
Subject: [PATCH 18/76] feat(batches, completions): add /v1/completions support
 to /v1/batches (#3309)

# What does this PR do?

add support for /v1/completions to the /v1/batches api


## Test Plan

ci
---
 .../inline/batches/reference/batches.py       | 69 +++++++++++++------
 tests/integration/batches/test_batches.py     | 55 +++++++++++++++
 .../recordings/responses/41e27b9b5d09.json    | 42 +++++++++++
 .../unit/providers/batches/test_reference.py  | 65 +++++++++++++++--
 4 files changed, 205 insertions(+), 26 deletions(-)
 create mode 100644 tests/integration/recordings/responses/41e27b9b5d09.json

diff --git a/llama_stack/providers/inline/batches/reference/batches.py b/llama_stack/providers/inline/batches/reference/batches.py
index 26f0ad15a..e049518a4 100644
--- a/llama_stack/providers/inline/batches/reference/batches.py
+++ b/llama_stack/providers/inline/batches/reference/batches.py
@@ -178,9 +178,9 @@ class ReferenceBatchesImpl(Batches):
 
         # TODO: set expiration time for garbage collection
 
-        if endpoint not in ["/v1/chat/completions"]:
+        if endpoint not in ["/v1/chat/completions", "/v1/completions"]:
             raise ValueError(
-                f"Invalid endpoint: {endpoint}. Supported values: /v1/chat/completions. Code: invalid_value. Param: endpoint",
+                f"Invalid endpoint: {endpoint}. Supported values: /v1/chat/completions, /v1/completions. Code: invalid_value. Param: endpoint",
             )
 
         if completion_window != "24h":
@@ -424,13 +424,21 @@ class ReferenceBatchesImpl(Batches):
                             )
                             valid = False
 
-                        for param, expected_type, type_string in [
-                            ("model", str, "a string"),
-                            # messages is specific to /v1/chat/completions
-                            # we could skip validating messages here and let inference fail. however,
-                            # that would be a very expensive way to find out messages is wrong.
-                            ("messages", list, "an array"),  # TODO: allow messages to be a string?
-                        ]:
+                        if batch.endpoint == "/v1/chat/completions":
+                            required_params = [
+                                ("model", str, "a string"),
+                                # messages is specific to /v1/chat/completions
+                                # we could skip validating messages here and let inference fail. however,
+                                # that would be a very expensive way to find out messages is wrong.
+                                ("messages", list, "an array"),  # TODO: allow messages to be a string?
+                            ]
+                        else:  # /v1/completions
+                            required_params = [
+                                ("model", str, "a string"),
+                                ("prompt", str, "a string"),  # TODO: allow prompt to be a list of strings??
+                            ]
+
+                        for param, expected_type, type_string in required_params:
                             if param not in body:
                                 errors.append(
                                     BatchError(
@@ -591,20 +599,37 @@ class ReferenceBatchesImpl(Batches):
 
         try:
             # TODO(SECURITY): review body for security issues
-            request.body["messages"] = [convert_to_openai_message_param(msg) for msg in request.body["messages"]]
-            chat_response = await self.inference_api.openai_chat_completion(**request.body)
+            if request.url == "/v1/chat/completions":
+                request.body["messages"] = [convert_to_openai_message_param(msg) for msg in request.body["messages"]]
+                chat_response = await self.inference_api.openai_chat_completion(**request.body)
 
-            # this is for mypy, we don't allow streaming so we'll get the right type
-            assert hasattr(chat_response, "model_dump_json"), "Chat response must have model_dump_json method"
-            return {
-                "id": request_id,
-                "custom_id": request.custom_id,
-                "response": {
-                    "status_code": 200,
-                    "request_id": request_id,  # TODO: should this be different?
-                    "body": chat_response.model_dump_json(),
-                },
-            }
+                # this is for mypy, we don't allow streaming so we'll get the right type
+                assert hasattr(chat_response, "model_dump_json"), "Chat response must have model_dump_json method"
+                return {
+                    "id": request_id,
+                    "custom_id": request.custom_id,
+                    "response": {
+                        "status_code": 200,
+                        "request_id": request_id,  # TODO: should this be different?
+                        "body": chat_response.model_dump_json(),
+                    },
+                }
+            else:  # /v1/completions
+                completion_response = await self.inference_api.openai_completion(**request.body)
+
+                # this is for mypy, we don't allow streaming so we'll get the right type
+                assert hasattr(completion_response, "model_dump_json"), (
+                    "Completion response must have model_dump_json method"
+                )
+                return {
+                    "id": request_id,
+                    "custom_id": request.custom_id,
+                    "response": {
+                        "status_code": 200,
+                        "request_id": request_id,
+                        "body": completion_response.model_dump_json(),
+                    },
+                }
         except Exception as e:
             logger.info(f"Error processing request {request.custom_id} in batch {batch_id}: {e}")
             return {
diff --git a/tests/integration/batches/test_batches.py b/tests/integration/batches/test_batches.py
index 59811b7a4..d55a68bd3 100644
--- a/tests/integration/batches/test_batches.py
+++ b/tests/integration/batches/test_batches.py
@@ -268,3 +268,58 @@ class TestBatchesIntegration:
 
         deleted_error_file = openai_client.files.delete(final_batch.error_file_id)
         assert deleted_error_file.deleted, f"Error file {final_batch.error_file_id} was not deleted successfully"
+
+    def test_batch_e2e_completions(self, openai_client, batch_helper, text_model_id):
+        """Run an end-to-end batch with a single successful text completion request."""
+        request_body = {"model": text_model_id, "prompt": "Say completions", "max_tokens": 20}
+
+        batch_requests = [
+            {
+                "custom_id": "success-1",
+                "method": "POST",
+                "url": "/v1/completions",
+                "body": request_body,
+            }
+        ]
+
+        with batch_helper.create_file(batch_requests) as uploaded_file:
+            batch = openai_client.batches.create(
+                input_file_id=uploaded_file.id,
+                endpoint="/v1/completions",
+                completion_window="24h",
+                metadata={"test": "e2e_completions_success"},
+            )
+
+            final_batch = batch_helper.wait_for(
+                batch.id,
+                max_wait_time=3 * 60,
+                expected_statuses={"completed"},
+                timeout_action="skip",
+            )
+
+        assert final_batch.status == "completed"
+        assert final_batch.request_counts is not None
+        assert final_batch.request_counts.total == 1
+        assert final_batch.request_counts.completed == 1
+        assert final_batch.output_file_id is not None
+
+        output_content = openai_client.files.content(final_batch.output_file_id)
+        if isinstance(output_content, str):
+            output_text = output_content
+        else:
+            output_text = output_content.content.decode("utf-8")
+
+        output_lines = output_text.strip().split("\n")
+        assert len(output_lines) == 1
+
+        result = json.loads(output_lines[0])
+        assert result["custom_id"] == "success-1"
+        assert "response" in result
+        assert result["response"]["status_code"] == 200
+
+        deleted_output_file = openai_client.files.delete(final_batch.output_file_id)
+        assert deleted_output_file.deleted
+
+        if final_batch.error_file_id is not None:
+            deleted_error_file = openai_client.files.delete(final_batch.error_file_id)
+            assert deleted_error_file.deleted
diff --git a/tests/integration/recordings/responses/41e27b9b5d09.json b/tests/integration/recordings/responses/41e27b9b5d09.json
new file mode 100644
index 000000000..45d140843
--- /dev/null
+++ b/tests/integration/recordings/responses/41e27b9b5d09.json
@@ -0,0 +1,42 @@
+{
+  "request": {
+    "method": "POST",
+    "url": "http://0.0.0.0:11434/v1/v1/completions",
+    "headers": {},
+    "body": {
+      "model": "llama3.2:3b-instruct-fp16",
+      "prompt": "Say completions",
+      "max_tokens": 20
+    },
+    "endpoint": "/v1/completions",
+    "model": "llama3.2:3b-instruct-fp16"
+  },
+  "response": {
+    "body": {
+      "__type__": "openai.types.completion.Completion",
+      "__data__": {
+        "id": "cmpl-271",
+        "choices": [
+          {
+            "finish_reason": "length",
+            "index": 0,
+            "logprobs": null,
+            "text": "You want me to respond with a completion, but you didn't specify what I should complete. Could"
+          }
+        ],
+        "created": 1756846620,
+        "model": "llama3.2:3b-instruct-fp16",
+        "object": "text_completion",
+        "system_fingerprint": "fp_ollama",
+        "usage": {
+          "completion_tokens": 20,
+          "prompt_tokens": 28,
+          "total_tokens": 48,
+          "completion_tokens_details": null,
+          "prompt_tokens_details": null
+        }
+      }
+    },
+    "is_streaming": false
+  }
+}
diff --git a/tests/unit/providers/batches/test_reference.py b/tests/unit/providers/batches/test_reference.py
index 0ca866f7b..dfef5e040 100644
--- a/tests/unit/providers/batches/test_reference.py
+++ b/tests/unit/providers/batches/test_reference.py
@@ -46,7 +46,8 @@ The tests are categorized and outlined below, keep this updated:
   * test_validate_input_url_mismatch (negative)
   * test_validate_input_multiple_errors_per_request (negative)
   * test_validate_input_invalid_request_format (negative)
-  * test_validate_input_missing_parameters (parametrized negative - custom_id, method, url, body, model, messages missing validation)
+  * test_validate_input_missing_parameters_chat_completions (parametrized negative - custom_id, method, url, body, model, messages missing validation for chat/completions)
+  * test_validate_input_missing_parameters_completions (parametrized negative - custom_id, method, url, body, model, prompt missing validation for completions)
   * test_validate_input_invalid_parameter_types (parametrized negative - custom_id, url, method, body, model, messages type validation)
 
 The tests use temporary SQLite databases for isolation and mock external
@@ -213,7 +214,6 @@ class TestReferenceBatchesImpl:
         "endpoint",
         [
             "/v1/embeddings",
-            "/v1/completions",
             "/v1/invalid/endpoint",
             "",
         ],
@@ -499,8 +499,10 @@ class TestReferenceBatchesImpl:
             ("messages", "body.messages", "invalid_request", "Messages parameter is required"),
         ],
     )
-    async def test_validate_input_missing_parameters(self, provider, param_name, param_path, error_code, error_message):
-        """Test _validate_input when file contains request with missing required parameters."""
+    async def test_validate_input_missing_parameters_chat_completions(
+        self, provider, param_name, param_path, error_code, error_message
+    ):
+        """Test _validate_input when file contains request with missing required parameters for chat completions."""
         provider.files_api.openai_retrieve_file = AsyncMock()
         mock_response = MagicMock()
 
@@ -541,6 +543,61 @@ class TestReferenceBatchesImpl:
         assert errors[0].message == error_message
         assert errors[0].param == param_path
 
+    @pytest.mark.parametrize(
+        "param_name,param_path,error_code,error_message",
+        [
+            ("custom_id", "custom_id", "missing_required_parameter", "Missing required parameter: custom_id"),
+            ("method", "method", "missing_required_parameter", "Missing required parameter: method"),
+            ("url", "url", "missing_required_parameter", "Missing required parameter: url"),
+            ("body", "body", "missing_required_parameter", "Missing required parameter: body"),
+            ("model", "body.model", "invalid_request", "Model parameter is required"),
+            ("prompt", "body.prompt", "invalid_request", "Prompt parameter is required"),
+        ],
+    )
+    async def test_validate_input_missing_parameters_completions(
+        self, provider, param_name, param_path, error_code, error_message
+    ):
+        """Test _validate_input when file contains request with missing required parameters for text completions."""
+        provider.files_api.openai_retrieve_file = AsyncMock()
+        mock_response = MagicMock()
+
+        base_request = {
+            "custom_id": "req-1",
+            "method": "POST",
+            "url": "/v1/completions",
+            "body": {"model": "test-model", "prompt": "Hello"},
+        }
+
+        # Remove the specific parameter being tested
+        if "." in param_path:
+            top_level, nested_param = param_path.split(".", 1)
+            del base_request[top_level][nested_param]
+        else:
+            del base_request[param_name]
+
+        mock_response.body = json.dumps(base_request).encode()
+        provider.files_api.openai_retrieve_file_content = AsyncMock(return_value=mock_response)
+
+        batch = BatchObject(
+            id="batch_test",
+            object="batch",
+            endpoint="/v1/completions",
+            input_file_id=f"missing_{param_name}_file",
+            completion_window="24h",
+            status="validating",
+            created_at=1234567890,
+        )
+
+        errors, requests = await provider._validate_input(batch)
+
+        assert len(errors) == 1
+        assert len(requests) == 0
+
+        assert errors[0].code == error_code
+        assert errors[0].line == 1
+        assert errors[0].message == error_message
+        assert errors[0].param == param_path
+
     async def test_validate_input_url_mismatch(self, provider):
         """Test _validate_input when file contains request with URL that doesn't match batch endpoint."""
         provider.files_api.openai_retrieve_file = AsyncMock()

From 0c2757a05b504bafef1bc589376712b9ac9a1c52 Mon Sep 17 00:00:00 2001
From: Matthew Farrellee <matt@cs.wisc.edu>
Date: Fri, 5 Sep 2025 15:00:09 -0400
Subject: [PATCH 19/76] chore(sambanova test): skip with_n tests for sambanova,
 it is not implemented server-side (#3342)

# What does this PR do?

skip a test that cannot pass for sambanova

see
https://docs-legacy.sambanova.ai/sambastudio/latest/open-ai-api.html\#_example_requests_using_openai_client

## Test Plan

ci
---
 .../inference/test_openai_completion.py            | 14 ++++++++++----
 1 file changed, 10 insertions(+), 4 deletions(-)

diff --git a/tests/integration/inference/test_openai_completion.py b/tests/integration/inference/test_openai_completion.py
index 62185e470..bb447b3c1 100644
--- a/tests/integration/inference/test_openai_completion.py
+++ b/tests/integration/inference/test_openai_completion.py
@@ -58,6 +58,15 @@ def skip_if_model_doesnt_support_suffix(client_with_models, model_id):
         pytest.skip(f"Provider {provider.provider_type} doesn't support suffix.")
 
 
+def skip_if_doesnt_support_n(client_with_models, model_id):
+    provider = provider_from_model(client_with_models, model_id)
+    if provider.provider_type in (
+        "remote::sambanova",
+        "remote::ollama",
+    ):
+        pytest.skip(f"Model {model_id} hosted by {provider.provider_type} doesn't support n param.")
+
+
 def skip_if_model_doesnt_support_openai_chat_completion(client_with_models, model_id):
     provider = provider_from_model(client_with_models, model_id)
     if provider.provider_type in (
@@ -262,10 +271,7 @@ def test_openai_chat_completion_streaming(compat_client, client_with_models, tex
 )
 def test_openai_chat_completion_streaming_with_n(compat_client, client_with_models, text_model_id, test_case):
     skip_if_model_doesnt_support_openai_chat_completion(client_with_models, text_model_id)
-
-    provider = provider_from_model(client_with_models, text_model_id)
-    if provider.provider_type == "remote::ollama":
-        pytest.skip(f"Model {text_model_id} hosted by {provider.provider_type} doesn't support n > 1.")
+    skip_if_doesnt_support_n(client_with_models, text_model_id)
 
     tc = TestCase(test_case)
     question = tc["question"]

From 47b640370e275dd178c0bb9fcf822467e032120d Mon Sep 17 00:00:00 2001
From: Ashwin Bharambe <ashwin.bharambe@gmail.com>
Date: Fri, 5 Sep 2025 13:58:49 -0700
Subject: [PATCH 20/76] feat(tests): introduce a test "suite" concept to
 encompass dirs, options (#3339)

Our integration tests need to be 'grouped' because each group often
needs a specific set of models it works with. We separated vision tests
due to this, and we have a separate set of tests which test "Responses"
API.

This PR makes this system a bit more official so it is very easy to
target these groups and apply all testing infrastructure towards all the
groups (for example, record-replay) uniformly.

There are three suites declared:
- base
- vision
- responses

Note that our CI currently runs the "base" and "vision" suites.

You can use the `--suite` option when running pytest (or any of the
testing scripts or workflows.) For example:
```
OLLAMA_URL=http://localhost:11434 \
  pytest -s -v tests/integration/ --stack-config starter --suite vision
```
---
 .../actions/run-and-record-tests/action.yml   |  30 ++--
 .github/actions/setup-ollama/action.yml       |   8 +-
 .../actions/setup-test-environment/action.yml |   8 +-
 .github/workflows/README.md                   |   2 +-
 .github/workflows/integration-tests.yml       |  20 +--
 .../workflows/record-integration-tests.yml    |  32 ++---
 scripts/github/schedule-record-workflow.sh    |  32 +++--
 scripts/integration-tests.sh                  | 133 +++++++-----------
 tests/README.md                               |   2 +-
 tests/integration/README.md                   |  21 +++
 tests/integration/conftest.py                 |  75 ++++++++--
 .../{non_ci => }/responses/__init__.py        |   0
 .../responses/fixtures/__init__.py            |   0
 .../responses/fixtures/fixtures.py            |   0
 .../fixtures/images/vision_test_1.jpg         | Bin
 .../fixtures/images/vision_test_2.jpg         | Bin
 .../fixtures/images/vision_test_3.jpg         | Bin
 .../fixtures/pdfs/llama_stack_and_models.pdf  | Bin
 .../responses/fixtures/test_cases.py          |   0
 .../{non_ci => }/responses/helpers.py         |   0
 .../responses/streaming_assertions.py         |   0
 .../responses/test_basic_responses.py         |   0
 .../responses/test_file_search.py             |   0
 .../responses/test_tool_responses.py          |   0
 tests/integration/suites.py                   |  53 +++++++
 25 files changed, 255 insertions(+), 161 deletions(-)
 rename tests/integration/{non_ci => }/responses/__init__.py (100%)
 rename tests/integration/{non_ci => }/responses/fixtures/__init__.py (100%)
 rename tests/integration/{non_ci => }/responses/fixtures/fixtures.py (100%)
 rename tests/integration/{non_ci => }/responses/fixtures/images/vision_test_1.jpg (100%)
 rename tests/integration/{non_ci => }/responses/fixtures/images/vision_test_2.jpg (100%)
 rename tests/integration/{non_ci => }/responses/fixtures/images/vision_test_3.jpg (100%)
 rename tests/integration/{non_ci => }/responses/fixtures/pdfs/llama_stack_and_models.pdf (100%)
 rename tests/integration/{non_ci => }/responses/fixtures/test_cases.py (100%)
 rename tests/integration/{non_ci => }/responses/helpers.py (100%)
 rename tests/integration/{non_ci => }/responses/streaming_assertions.py (100%)
 rename tests/integration/{non_ci => }/responses/test_basic_responses.py (100%)
 rename tests/integration/{non_ci => }/responses/test_file_search.py (100%)
 rename tests/integration/{non_ci => }/responses/test_tool_responses.py (100%)
 create mode 100644 tests/integration/suites.py

diff --git a/.github/actions/run-and-record-tests/action.yml b/.github/actions/run-and-record-tests/action.yml
index 60550cfdc..7f028b104 100644
--- a/.github/actions/run-and-record-tests/action.yml
+++ b/.github/actions/run-and-record-tests/action.yml
@@ -2,13 +2,6 @@ name: 'Run and Record Tests'
 description: 'Run integration tests and handle recording/artifact upload'
 
 inputs:
-  test-subdirs:
-    description: 'Comma-separated list of test subdirectories to run'
-    required: true
-  test-pattern:
-    description: 'Regex pattern to pass to pytest -k'
-    required: false
-    default: ''
   stack-config:
     description: 'Stack configuration to use'
     required: true
@@ -18,10 +11,18 @@ inputs:
   inference-mode:
     description: 'Inference mode (record or replay)'
     required: true
-  run-vision-tests:
-    description: 'Whether to run vision tests'
+  test-suite:
+    description: 'Test suite to use: base, responses, vision, etc.'
     required: false
-    default: 'false'
+    default: ''
+  test-subdirs:
+    description: 'Comma-separated list of test subdirectories to run; overrides test-suite'
+    required: false
+    default: ''
+  test-pattern:
+    description: 'Regex pattern to pass to pytest -k'
+    required: false
+    default: ''
 
 runs:
   using: 'composite'
@@ -42,7 +43,7 @@ runs:
           --test-subdirs '${{ inputs.test-subdirs }}' \
           --test-pattern '${{ inputs.test-pattern }}' \
           --inference-mode '${{ inputs.inference-mode }}' \
-          ${{ inputs.run-vision-tests == 'true' && '--run-vision-tests' || '' }} \
+          --test-suite '${{ inputs.test-suite }}' \
           | tee pytest-${{ inputs.inference-mode }}.log
 
 
@@ -57,12 +58,7 @@ runs:
           echo "New recordings detected, committing and pushing"
           git add tests/integration/recordings/
 
-          if [ "${{ inputs.run-vision-tests }}" == "true" ]; then
-            git commit -m "Recordings update from CI (vision)"
-          else
-            git commit -m "Recordings update from CI"
-          fi
-
+          git commit -m "Recordings update from CI (test-suite: ${{ inputs.test-suite }})"
           git fetch origin ${{ github.ref_name }}
           git rebase origin/${{ github.ref_name }}
           echo "Rebased successfully"
diff --git a/.github/actions/setup-ollama/action.yml b/.github/actions/setup-ollama/action.yml
index e57876cb0..dc2f87e8c 100644
--- a/.github/actions/setup-ollama/action.yml
+++ b/.github/actions/setup-ollama/action.yml
@@ -1,17 +1,17 @@
 name: Setup Ollama
 description: Start Ollama
 inputs:
-  run-vision-tests:
-    description: 'Run vision tests: "true" or "false"'
+  test-suite:
+    description: 'Test suite to use: base, responses, vision, etc.'
     required: false
-    default: 'false'
+    default: ''
 runs:
   using: "composite"
   steps:
     - name: Start Ollama
       shell: bash
       run: |
-        if [ "${{ inputs.run-vision-tests }}" == "true" ]; then
+        if [ "${{ inputs.test-suite }}" == "vision" ]; then
           image="ollama-with-vision-model"
         else
           image="ollama-with-models"
diff --git a/.github/actions/setup-test-environment/action.yml b/.github/actions/setup-test-environment/action.yml
index d830e3d13..3be76f009 100644
--- a/.github/actions/setup-test-environment/action.yml
+++ b/.github/actions/setup-test-environment/action.yml
@@ -12,10 +12,10 @@ inputs:
     description: 'Provider to setup (ollama or vllm)'
     required: true
     default: 'ollama'
-  run-vision-tests:
-    description: 'Whether to setup provider for vision tests'
+  test-suite:
+    description: 'Test suite to use: base, responses, vision, etc.'
     required: false
-    default: 'false'
+    default: ''
   inference-mode:
     description: 'Inference mode (record or replay)'
     required: true
@@ -33,7 +33,7 @@ runs:
       if: ${{ inputs.provider == 'ollama' && inputs.inference-mode == 'record' }}
       uses: ./.github/actions/setup-ollama
       with:
-        run-vision-tests: ${{ inputs.run-vision-tests }}
+        test-suite: ${{ inputs.test-suite }}
 
     - name: Setup vllm
       if: ${{ inputs.provider == 'vllm' && inputs.inference-mode == 'record' }}
diff --git a/.github/workflows/README.md b/.github/workflows/README.md
index 8344d12a4..2e0df58b8 100644
--- a/.github/workflows/README.md
+++ b/.github/workflows/README.md
@@ -8,7 +8,7 @@ Llama Stack uses GitHub Actions for Continuous Integration (CI). Below is a tabl
 | Installer CI | [install-script-ci.yml](install-script-ci.yml) | Test the installation script |
 | Integration Auth Tests | [integration-auth-tests.yml](integration-auth-tests.yml) | Run the integration test suite with Kubernetes authentication |
 | SqlStore Integration Tests | [integration-sql-store-tests.yml](integration-sql-store-tests.yml) | Run the integration test suite with SqlStore |
-| Integration Tests (Replay) | [integration-tests.yml](integration-tests.yml) | Run the integration test suite from tests/integration in replay mode |
+| Integration Tests (Replay) | [integration-tests.yml](integration-tests.yml) | Run the integration test suites from tests/integration in replay mode |
 | Vector IO Integration Tests | [integration-vector-io-tests.yml](integration-vector-io-tests.yml) | Run the integration test suite with various VectorIO providers |
 | Pre-commit | [pre-commit.yml](pre-commit.yml) | Run pre-commit checks |
 | Test Llama Stack Build | [providers-build.yml](providers-build.yml) | Test llama stack build |
diff --git a/.github/workflows/integration-tests.yml b/.github/workflows/integration-tests.yml
index 57e582b20..bb53eea2f 100644
--- a/.github/workflows/integration-tests.yml
+++ b/.github/workflows/integration-tests.yml
@@ -1,6 +1,6 @@
 name: Integration Tests (Replay)
 
-run-name: Run the integration test suite from tests/integration in replay mode
+run-name: Run the integration test suites from tests/integration in replay mode
 
 on:
   push:
@@ -32,14 +32,6 @@ on:
         description: 'Test against a specific provider'
         type: string
         default: 'ollama'
-      test-subdirs:
-        description: 'Comma-separated list of test subdirectories to run'
-        type: string
-        default: ''
-      test-pattern:
-        description: 'Regex pattern to pass to pytest -k'
-        type: string
-        default: ''
 
 concurrency:
   # Skip concurrency for pushes to main - each commit should be tested independently
@@ -50,7 +42,7 @@ jobs:
 
   run-replay-mode-tests:
     runs-on: ubuntu-latest
-    name: ${{ format('Integration Tests ({0}, {1}, {2}, client={3}, vision={4})', matrix.client-type, matrix.provider, matrix.python-version, matrix.client-version, matrix.run-vision-tests) }}
+    name: ${{ format('Integration Tests ({0}, {1}, {2}, client={3}, {4})', matrix.client-type, matrix.provider, matrix.python-version, matrix.client-version, matrix.test-suite) }}
 
     strategy:
       fail-fast: false
@@ -61,7 +53,7 @@ jobs:
         # Use Python 3.13 only on nightly schedule (daily latest client test), otherwise use 3.12
         python-version: ${{ github.event.schedule == '0 0 * * *' && fromJSON('["3.12", "3.13"]') || fromJSON('["3.12"]') }}
         client-version: ${{ (github.event.schedule == '0 0 * * *' || github.event.inputs.test-all-client-versions == 'true') && fromJSON('["published", "latest"]') || fromJSON('["latest"]') }}
-        run-vision-tests: [true, false]
+        test-suite: [base, vision]
 
     steps:
       - name: Checkout repository
@@ -73,15 +65,13 @@ jobs:
           python-version: ${{ matrix.python-version }}
           client-version: ${{ matrix.client-version }}
           provider: ${{ matrix.provider }}
-          run-vision-tests: ${{ matrix.run-vision-tests }}
+          test-suite: ${{ matrix.test-suite }}
           inference-mode: 'replay'
 
       - name: Run tests
         uses: ./.github/actions/run-and-record-tests
         with:
-          test-subdirs: ${{ inputs.test-subdirs }}
-          test-pattern: ${{ inputs.test-pattern }}
           stack-config: ${{ matrix.client-type == 'library' && 'ci-tests' || 'server:ci-tests' }}
           provider: ${{ matrix.provider }}
           inference-mode: 'replay'
-          run-vision-tests: ${{ matrix.run-vision-tests }}
+          test-suite: ${{ matrix.test-suite }}
diff --git a/.github/workflows/record-integration-tests.yml b/.github/workflows/record-integration-tests.yml
index d4f5586e2..01797a54b 100644
--- a/.github/workflows/record-integration-tests.yml
+++ b/.github/workflows/record-integration-tests.yml
@@ -10,18 +10,18 @@ run-name: Run the integration test suite from tests/integration
 on:
   workflow_dispatch:
     inputs:
-      test-subdirs:
-        description: 'Comma-separated list of test subdirectories to run'
-        type: string
-        default: ''
       test-provider:
         description: 'Test against a specific provider'
         type: string
         default: 'ollama'
-      run-vision-tests:
-        description: 'Whether to run vision tests'
-        type: boolean
-        default: false
+      test-suite:
+        description: 'Test suite to use: base, responses, vision, etc.'
+        type: string
+        default: ''
+      test-subdirs:
+        description: 'Comma-separated list of test subdirectories to run; overrides test-suite'
+        type: string
+        default: ''
       test-pattern:
         description: 'Regex pattern to pass to pytest -k'
         type: string
@@ -38,11 +38,11 @@ jobs:
       - name: Echo workflow inputs
         run: |
           echo "::group::Workflow Inputs"
-          echo "test-subdirs: ${{ inputs.test-subdirs }}"
-          echo "test-provider: ${{ inputs.test-provider }}"
-          echo "run-vision-tests: ${{ inputs.run-vision-tests }}"
-          echo "test-pattern: ${{ inputs.test-pattern }}"
           echo "branch: ${{ github.ref_name }}"
+          echo "test-provider: ${{ inputs.test-provider }}"
+          echo "test-suite: ${{ inputs.test-suite }}"
+          echo "test-subdirs: ${{ inputs.test-subdirs }}"
+          echo "test-pattern: ${{ inputs.test-pattern }}"
           echo "::endgroup::"
 
       - name: Checkout repository
@@ -56,15 +56,15 @@ jobs:
           python-version: "3.12"  # Use single Python version for recording
           client-version: "latest"
           provider: ${{ inputs.test-provider || 'ollama' }}
-          run-vision-tests: ${{ inputs.run-vision-tests }}
+          test-suite: ${{ inputs.test-suite }}
           inference-mode: 'record'
 
       - name: Run and record tests
         uses: ./.github/actions/run-and-record-tests
         with:
-          test-pattern: ${{ inputs.test-pattern }}
-          test-subdirs: ${{ inputs.test-subdirs }}
           stack-config: 'server:ci-tests'  # recording must be done with server since more tests are run
           provider: ${{ inputs.test-provider || 'ollama' }}
           inference-mode: 'record'
-          run-vision-tests: ${{ inputs.run-vision-tests }}
+          test-suite: ${{ inputs.test-suite }}
+          test-subdirs: ${{ inputs.test-subdirs }}
+          test-pattern: ${{ inputs.test-pattern }}
diff --git a/scripts/github/schedule-record-workflow.sh b/scripts/github/schedule-record-workflow.sh
index e381b60b6..09e055611 100755
--- a/scripts/github/schedule-record-workflow.sh
+++ b/scripts/github/schedule-record-workflow.sh
@@ -15,7 +15,7 @@ set -euo pipefail
 BRANCH=""
 TEST_SUBDIRS=""
 TEST_PROVIDER="ollama"
-RUN_VISION_TESTS=false
+TEST_SUITE="base"
 TEST_PATTERN=""
 
 # Help function
@@ -27,9 +27,9 @@ Trigger the integration test recording workflow remotely. This way you do not ne
 
 OPTIONS:
     -b, --branch BRANCH         Branch to run the workflow on (defaults to current branch)
-    -s, --test-subdirs DIRS     Comma-separated list of test subdirectories to run (REQUIRED)
     -p, --test-provider PROVIDER Test provider to use: vllm or ollama (default: ollama)
-    -v, --run-vision-tests      Include vision tests in the recording
+    -t, --test-suite SUITE      Test suite to use: base, responses, vision, etc. (default: base)
+    -s, --test-subdirs DIRS     Comma-separated list of test subdirectories to run (overrides suite)
     -k, --test-pattern PATTERN  Regex pattern to pass to pytest -k
     -h, --help                  Show this help message
 
@@ -38,7 +38,7 @@ EXAMPLES:
     $0 --test-subdirs "agents"
 
     # Record tests for specific branch with vision tests
-    $0 -b my-feature-branch --test-subdirs "inference" --run-vision-tests
+    $0 -b my-feature-branch --test-suite vision
 
     # Record multiple test subdirectories with specific provider
     $0 --test-subdirs "agents,inference" --test-provider vllm
@@ -71,9 +71,9 @@ while [[ $# -gt 0 ]]; do
             TEST_PROVIDER="$2"
             shift 2
             ;;
-        -v|--run-vision-tests)
-            RUN_VISION_TESTS=true
-            shift
+        -t|--test-suite)
+            TEST_SUITE="$2"
+            shift 2
             ;;
         -k|--test-pattern)
             TEST_PATTERN="$2"
@@ -92,11 +92,11 @@ while [[ $# -gt 0 ]]; do
 done
 
 # Validate required parameters
-if [[ -z "$TEST_SUBDIRS" ]]; then
-    echo "Error: --test-subdirs is required"
-    echo "Please specify which test subdirectories to run, e.g.:"
+if [[ -z "$TEST_SUBDIRS" && -z "$TEST_SUITE" ]]; then
+    echo "Error: --test-subdirs or --test-suite is required"
+    echo "Please specify which test subdirectories to run or test suite to use, e.g.:"
     echo "  $0 --test-subdirs \"agents,inference\""
-    echo "  $0 --test-subdirs \"inference\" --run-vision-tests"
+    echo "  $0 --test-suite vision"
     echo ""
     exit 1
 fi
@@ -239,17 +239,19 @@ echo "Triggering integration test recording workflow..."
 echo "Branch: $BRANCH"
 echo "Test provider: $TEST_PROVIDER"
 echo "Test subdirs: $TEST_SUBDIRS"
-echo "Run vision tests: $RUN_VISION_TESTS"
+echo "Test suite: $TEST_SUITE"
 echo "Test pattern: ${TEST_PATTERN:-"(none)"}"
 echo ""
 
 # Prepare inputs for gh workflow run
-INPUTS="-f test-subdirs='$TEST_SUBDIRS'"
+if [[ -n "$TEST_SUBDIRS" ]]; then
+    INPUTS="-f test-subdirs='$TEST_SUBDIRS'"
+fi
 if [[ -n "$TEST_PROVIDER" ]]; then
     INPUTS="$INPUTS -f test-provider='$TEST_PROVIDER'"
 fi
-if [[ "$RUN_VISION_TESTS" == "true" ]]; then
-    INPUTS="$INPUTS -f run-vision-tests=true"
+if [[ -n "$TEST_SUITE" ]]; then
+    INPUTS="$INPUTS -f test-suite='$TEST_SUITE'"
 fi
 if [[ -n "$TEST_PATTERN" ]]; then
     INPUTS="$INPUTS -f test-pattern='$TEST_PATTERN'"
diff --git a/scripts/integration-tests.sh b/scripts/integration-tests.sh
index 104ba5cf3..ab7e37579 100755
--- a/scripts/integration-tests.sh
+++ b/scripts/integration-tests.sh
@@ -16,7 +16,7 @@ STACK_CONFIG=""
 PROVIDER=""
 TEST_SUBDIRS=""
 TEST_PATTERN=""
-RUN_VISION_TESTS="false"
+TEST_SUITE="base"
 INFERENCE_MODE="replay"
 EXTRA_PARAMS=""
 
@@ -28,12 +28,16 @@ Usage: $0 [OPTIONS]
 Options:
     --stack-config STRING    Stack configuration to use (required)
     --provider STRING        Provider to use (ollama, vllm, etc.) (required)
-    --test-subdirs STRING    Comma-separated list of test subdirectories to run (default: 'inference')
-    --run-vision-tests       Run vision tests instead of regular tests
+    --test-suite STRING      Comma-separated list of test suites to run (default: 'base')
     --inference-mode STRING  Inference mode: record or replay (default: replay)
+    --test-subdirs STRING    Comma-separated list of test subdirectories to run (overrides suite)
     --test-pattern STRING    Regex pattern to pass to pytest -k
     --help                   Show this help message
 
+Suites are defined in tests/integration/suites.py. They are used to narrow the collection of tests and provide default model options.
+
+You can also specify subdirectories (of tests/integration) to select tests from, which will override the suite.
+
 Examples:
     # Basic inference tests with ollama
     $0 --stack-config server:ci-tests --provider ollama
@@ -42,7 +46,7 @@ Examples:
     $0 --stack-config server:ci-tests --provider vllm --test-subdirs 'inference,agents'
 
     # Vision tests with ollama
-    $0 --stack-config server:ci-tests --provider ollama --run-vision-tests
+    $0 --stack-config server:ci-tests --provider ollama --test-suite vision
 
     # Record mode for updating test recordings
     $0 --stack-config server:ci-tests --provider ollama --inference-mode record
@@ -64,9 +68,9 @@ while [[ $# -gt 0 ]]; do
             TEST_SUBDIRS="$2"
             shift 2
             ;;
-        --run-vision-tests)
-            RUN_VISION_TESTS="true"
-            shift
+        --test-suite)
+            TEST_SUITE="$2"
+            shift 2
             ;;
         --inference-mode)
             INFERENCE_MODE="$2"
@@ -92,22 +96,25 @@ done
 # Validate required parameters
 if [[ -z "$STACK_CONFIG" ]]; then
     echo "Error: --stack-config is required"
-    usage
     exit 1
 fi
 
 if [[ -z "$PROVIDER" ]]; then
     echo "Error: --provider is required"
-    usage
+    exit 1
+fi
+
+if [[ -z "$TEST_SUITE" && -z "$TEST_SUBDIRS" ]]; then
+    echo "Error: --test-suite or --test-subdirs is required"
     exit 1
 fi
 
 echo "=== Llama Stack Integration Test Runner ==="
 echo "Stack Config: $STACK_CONFIG"
 echo "Provider: $PROVIDER"
-echo "Test Subdirs: $TEST_SUBDIRS"
-echo "Vision Tests: $RUN_VISION_TESTS"
 echo "Inference Mode: $INFERENCE_MODE"
+echo "Test Suite: $TEST_SUITE"
+echo "Test Subdirs: $TEST_SUBDIRS"
 echo "Test Pattern: $TEST_PATTERN"
 echo ""
 
@@ -194,84 +201,46 @@ if [[ -n "$TEST_PATTERN" ]]; then
     PYTEST_PATTERN="${PYTEST_PATTERN} and $TEST_PATTERN"
 fi
 
-# Run vision tests if specified
-if [[ "$RUN_VISION_TESTS" == "true" ]]; then
-    echo "Running vision tests..."
-    set +e
-    pytest -s -v tests/integration/inference/test_vision_inference.py \
-        --stack-config="$STACK_CONFIG" \
-        -k "$PYTEST_PATTERN" \
-        --vision-model=ollama/llama3.2-vision:11b \
-        --embedding-model=sentence-transformers/all-MiniLM-L6-v2 \
-        --color=yes $EXTRA_PARAMS \
-        --capture=tee-sys
-    exit_code=$?
-    set -e
-
-    if [ $exit_code -eq 0 ]; then
-        echo "✅ Vision tests completed successfully"
-    elif [ $exit_code -eq 5 ]; then
-        echo "⚠️ No vision tests collected (pattern matched no tests)"
-    else
-        echo "❌ Vision tests failed"
-        exit 1
-    fi
-    exit 0
-fi
-
-# Run regular tests
-if [[ -z "$TEST_SUBDIRS" ]]; then
-   TEST_SUBDIRS=$(find tests/integration -maxdepth 1 -mindepth 1 -type d |
-            sed 's|tests/integration/||' |
-            grep -Ev "^(__pycache__|fixtures|test_cases|recordings|non_ci|post_training)$" |
-            sort)
-fi
 echo "Test subdirs to run: $TEST_SUBDIRS"
 
-# Collect all test files for the specified test types
-TEST_FILES=""
-for test_subdir in $(echo "$TEST_SUBDIRS" | tr ',' '\n'); do
-    # Skip certain test types for vllm provider
-    if [[ "$PROVIDER" == "vllm" ]]; then
-        if [[ "$test_subdir" == "safety" ]] || [[ "$test_subdir" == "post_training" ]] || [[ "$test_subdir" == "tool_runtime" ]]; then
-            echo "Skipping $test_subdir for vllm provider"
-            continue
+if [[ -n "$TEST_SUBDIRS" ]]; then
+    # Collect all test files for the specified test types
+    TEST_FILES=""
+    for test_subdir in $(echo "$TEST_SUBDIRS" | tr ',' '\n'); do
+        if [[ -d "tests/integration/$test_subdir" ]]; then
+            # Find all Python test files in this directory
+            test_files=$(find tests/integration/$test_subdir -name "test_*.py" -o -name "*_test.py")
+            if [[ -n "$test_files" ]]; then
+                TEST_FILES="$TEST_FILES $test_files"
+                echo "Added test files from $test_subdir: $(echo $test_files | wc -w) files"
+            fi
+        else
+            echo "Warning: Directory tests/integration/$test_subdir does not exist"
         fi
+    done
+
+    if [[ -z "$TEST_FILES" ]]; then
+        echo "No test files found for the specified test types"
+        exit 1
     fi
 
-    if [[ "$STACK_CONFIG" != *"server:"* ]] && [[ "$test_subdir" == "batches" ]]; then
-        echo "Skipping $test_subdir for library client until types are supported"
-        continue
-    fi
+    echo ""
+    echo "=== Running all collected tests in a single pytest command ==="
+    echo "Total test files: $(echo $TEST_FILES | wc -w)"
 
-    if [[ -d "tests/integration/$test_subdir" ]]; then
-        # Find all Python test files in this directory
-        test_files=$(find tests/integration/$test_subdir -name "test_*.py" -o -name "*_test.py")
-        if [[ -n "$test_files" ]]; then
-            TEST_FILES="$TEST_FILES $test_files"
-            echo "Added test files from $test_subdir: $(echo $test_files | wc -w) files"
-        fi
-    else
-        echo "Warning: Directory tests/integration/$test_subdir does not exist"
-    fi
-done
-
-if [[ -z "$TEST_FILES" ]]; then
-    echo "No test files found for the specified test types"
-    exit 1
+    PYTEST_TARGET="$TEST_FILES"
+    EXTRA_PARAMS="$EXTRA_PARAMS --text-model=$TEXT_MODEL --embedding-model=sentence-transformers/all-MiniLM-L6-v2"
+else
+    PYTEST_TARGET="tests/integration/"
+    EXTRA_PARAMS="$EXTRA_PARAMS --suite=$TEST_SUITE"
 fi
 
-echo ""
-echo "=== Running all collected tests in a single pytest command ==="
-echo "Total test files: $(echo $TEST_FILES | wc -w)"
-
 set +e
-pytest -s -v $TEST_FILES \
+pytest -s -v $PYTEST_TARGET \
     --stack-config="$STACK_CONFIG" \
     -k "$PYTEST_PATTERN" \
-    --text-model="$TEXT_MODEL" \
-    --embedding-model=sentence-transformers/all-MiniLM-L6-v2 \
-    --color=yes $EXTRA_PARAMS \
+    $EXTRA_PARAMS \
+    --color=yes \
     --capture=tee-sys
 exit_code=$?
 set -e
@@ -294,7 +263,13 @@ df -h
 # stop server
 if [[ "$STACK_CONFIG" == *"server:"* ]]; then
     echo "Stopping Llama Stack Server..."
-    kill $(lsof -i :8321 | awk 'NR>1 {print $2}')
+    pids=$(lsof -i :8321 | awk 'NR>1 {print $2}')
+    if [[ -n "$pids" ]]; then
+        echo "Killing Llama Stack Server processes: $pids"
+        kill -9 $pids
+    else
+        echo "No Llama Stack Server processes found ?!"
+    fi
     echo "Llama Stack Server stopped"
 fi
 
diff --git a/tests/README.md b/tests/README.md
index 81f025f86..c00829d3e 100644
--- a/tests/README.md
+++ b/tests/README.md
@@ -77,7 +77,7 @@ You must be careful when re-recording. CI workflows assume a specific setup for
 ./scripts/github/schedule-record-workflow.sh --test-subdirs "agents,inference"
 
 # Record with vision tests enabled
-./scripts/github/schedule-record-workflow.sh --test-subdirs "inference" --run-vision-tests
+./scripts/github/schedule-record-workflow.sh --test-suite vision
 
 # Record with specific provider
 ./scripts/github/schedule-record-workflow.sh --test-subdirs "agents" --test-provider vllm
diff --git a/tests/integration/README.md b/tests/integration/README.md
index d177cbebf..b05beeb98 100644
--- a/tests/integration/README.md
+++ b/tests/integration/README.md
@@ -42,6 +42,27 @@ Model parameters can be influenced by the following options:
 Each of these are comma-separated lists and can be used to generate multiple parameter combinations. Note that tests will be skipped
 if no model is specified.
 
+### Suites (fast selection + sane defaults)
+
+- `--suite`: comma-separated list of named suites that both narrow which tests are collected and prefill common model options (unless you pass them explicitly).
+- Available suites:
+  - `responses`: collects tests under `tests/integration/responses`; this is a separate suite because it needs a strong tool-calling model.
+  - `vision`: collects only `tests/integration/inference/test_vision_inference.py`; defaults `--vision-model=ollama/llama3.2-vision:11b`, `--embedding-model=sentence-transformers/all-MiniLM-L6-v2`.
+- Explicit flags always win. For example, `--suite=responses --text-model=<X>` overrides the suite’s text model.
+
+Examples:
+
+```bash
+# Fast responses run with defaults
+pytest -s -v tests/integration --stack-config=server:starter --suite=responses
+
+# Fast single-file vision run with defaults
+pytest -s -v tests/integration --stack-config=server:starter --suite=vision
+
+# Combine suites and override a default
+pytest -s -v tests/integration --stack-config=server:starter --suite=responses,vision --embedding-model=text-embedding-3-small
+```
+
 ## Examples
 
 ### Testing against a Server
diff --git a/tests/integration/conftest.py b/tests/integration/conftest.py
index fd9a54d04..96260fdb7 100644
--- a/tests/integration/conftest.py
+++ b/tests/integration/conftest.py
@@ -6,15 +6,17 @@
 import inspect
 import itertools
 import os
-import platform
 import textwrap
 import time
+from pathlib import Path
 
 import pytest
 from dotenv import load_dotenv
 
 from llama_stack.log import get_logger
 
+from .suites import SUITE_DEFINITIONS
+
 logger = get_logger(__name__, category="tests")
 
 
@@ -61,9 +63,22 @@ def pytest_configure(config):
         key, value = env_var.split("=", 1)
         os.environ[key] = value
 
-    if platform.system() == "Darwin":  # Darwin is the system name for macOS
-        os.environ["DISABLE_CODE_SANDBOX"] = "1"
-        logger.info("Setting DISABLE_CODE_SANDBOX=1 for macOS")
+    suites_raw = config.getoption("--suite")
+    suites: list[str] = []
+    if suites_raw:
+        suites = [p.strip() for p in str(suites_raw).split(",") if p.strip()]
+        unknown = [p for p in suites if p not in SUITE_DEFINITIONS]
+        if unknown:
+            raise pytest.UsageError(
+                f"Unknown suite(s): {', '.join(unknown)}. Available: {', '.join(sorted(SUITE_DEFINITIONS.keys()))}"
+            )
+    for suite in suites:
+        suite_def = SUITE_DEFINITIONS.get(suite, {})
+        defaults: dict = suite_def.get("defaults", {})
+        for dest, value in defaults.items():
+            current = getattr(config.option, dest, None)
+            if not current:
+                setattr(config.option, dest, value)
 
 
 def pytest_addoption(parser):
@@ -105,16 +120,21 @@ def pytest_addoption(parser):
         default=384,
         help="Output dimensionality of the embedding model to use for testing. Default: 384",
     )
-    parser.addoption(
-        "--record-responses",
-        action="store_true",
-        help="Record new API responses instead of using cached ones.",
-    )
     parser.addoption(
         "--report",
         help="Path where the test report should be written, e.g. --report=/path/to/report.md",
     )
 
+    available_suites = ", ".join(sorted(SUITE_DEFINITIONS.keys()))
+    suite_help = (
+        "Comma-separated integration test suites to narrow collection and prefill defaults. "
+        "Available: "
+        f"{available_suites}. "
+        "Explicit CLI flags (e.g., --text-model) override suite defaults. "
+        "Examples: --suite=responses or --suite=responses,vision."
+    )
+    parser.addoption("--suite", help=suite_help)
+
 
 MODEL_SHORT_IDS = {
     "meta-llama/Llama-3.2-3B-Instruct": "3B",
@@ -197,3 +217,40 @@ def pytest_generate_tests(metafunc):
 
 
 pytest_plugins = ["tests.integration.fixtures.common"]
+
+
+def pytest_ignore_collect(path: str, config: pytest.Config) -> bool:
+    """Skip collecting paths outside the selected suite roots for speed."""
+    suites_raw = config.getoption("--suite")
+    if not suites_raw:
+        return False
+
+    names = [p.strip() for p in str(suites_raw).split(",") if p.strip()]
+    roots: list[str] = []
+    for name in names:
+        suite_def = SUITE_DEFINITIONS.get(name)
+        if suite_def:
+            roots.extend(suite_def.get("roots", []))
+    if not roots:
+        return False
+
+    p = Path(str(path)).resolve()
+
+    # Only constrain within tests/integration to avoid ignoring unrelated tests
+    integration_root = (Path(str(config.rootpath)) / "tests" / "integration").resolve()
+    if not p.is_relative_to(integration_root):
+        return False
+
+    for r in roots:
+        rp = (Path(str(config.rootpath)) / r).resolve()
+        if rp.is_file():
+            # Allow the exact file and any ancestor directories so pytest can walk into it.
+            if p == rp:
+                return False
+            if p.is_dir() and rp.is_relative_to(p):
+                return False
+        else:
+            # Allow anything inside an allowed directory
+            if p.is_relative_to(rp):
+                return False
+    return True
diff --git a/tests/integration/non_ci/responses/__init__.py b/tests/integration/responses/__init__.py
similarity index 100%
rename from tests/integration/non_ci/responses/__init__.py
rename to tests/integration/responses/__init__.py
diff --git a/tests/integration/non_ci/responses/fixtures/__init__.py b/tests/integration/responses/fixtures/__init__.py
similarity index 100%
rename from tests/integration/non_ci/responses/fixtures/__init__.py
rename to tests/integration/responses/fixtures/__init__.py
diff --git a/tests/integration/non_ci/responses/fixtures/fixtures.py b/tests/integration/responses/fixtures/fixtures.py
similarity index 100%
rename from tests/integration/non_ci/responses/fixtures/fixtures.py
rename to tests/integration/responses/fixtures/fixtures.py
diff --git a/tests/integration/non_ci/responses/fixtures/images/vision_test_1.jpg b/tests/integration/responses/fixtures/images/vision_test_1.jpg
similarity index 100%
rename from tests/integration/non_ci/responses/fixtures/images/vision_test_1.jpg
rename to tests/integration/responses/fixtures/images/vision_test_1.jpg
diff --git a/tests/integration/non_ci/responses/fixtures/images/vision_test_2.jpg b/tests/integration/responses/fixtures/images/vision_test_2.jpg
similarity index 100%
rename from tests/integration/non_ci/responses/fixtures/images/vision_test_2.jpg
rename to tests/integration/responses/fixtures/images/vision_test_2.jpg
diff --git a/tests/integration/non_ci/responses/fixtures/images/vision_test_3.jpg b/tests/integration/responses/fixtures/images/vision_test_3.jpg
similarity index 100%
rename from tests/integration/non_ci/responses/fixtures/images/vision_test_3.jpg
rename to tests/integration/responses/fixtures/images/vision_test_3.jpg
diff --git a/tests/integration/non_ci/responses/fixtures/pdfs/llama_stack_and_models.pdf b/tests/integration/responses/fixtures/pdfs/llama_stack_and_models.pdf
similarity index 100%
rename from tests/integration/non_ci/responses/fixtures/pdfs/llama_stack_and_models.pdf
rename to tests/integration/responses/fixtures/pdfs/llama_stack_and_models.pdf
diff --git a/tests/integration/non_ci/responses/fixtures/test_cases.py b/tests/integration/responses/fixtures/test_cases.py
similarity index 100%
rename from tests/integration/non_ci/responses/fixtures/test_cases.py
rename to tests/integration/responses/fixtures/test_cases.py
diff --git a/tests/integration/non_ci/responses/helpers.py b/tests/integration/responses/helpers.py
similarity index 100%
rename from tests/integration/non_ci/responses/helpers.py
rename to tests/integration/responses/helpers.py
diff --git a/tests/integration/non_ci/responses/streaming_assertions.py b/tests/integration/responses/streaming_assertions.py
similarity index 100%
rename from tests/integration/non_ci/responses/streaming_assertions.py
rename to tests/integration/responses/streaming_assertions.py
diff --git a/tests/integration/non_ci/responses/test_basic_responses.py b/tests/integration/responses/test_basic_responses.py
similarity index 100%
rename from tests/integration/non_ci/responses/test_basic_responses.py
rename to tests/integration/responses/test_basic_responses.py
diff --git a/tests/integration/non_ci/responses/test_file_search.py b/tests/integration/responses/test_file_search.py
similarity index 100%
rename from tests/integration/non_ci/responses/test_file_search.py
rename to tests/integration/responses/test_file_search.py
diff --git a/tests/integration/non_ci/responses/test_tool_responses.py b/tests/integration/responses/test_tool_responses.py
similarity index 100%
rename from tests/integration/non_ci/responses/test_tool_responses.py
rename to tests/integration/responses/test_tool_responses.py
diff --git a/tests/integration/suites.py b/tests/integration/suites.py
new file mode 100644
index 000000000..602855055
--- /dev/null
+++ b/tests/integration/suites.py
@@ -0,0 +1,53 @@
+# Copyright (c) Meta Platforms, Inc. and affiliates.
+# All rights reserved.
+#
+# This source code is licensed under the terms described in the LICENSE file in
+# the root directory of this source tree.
+
+# Central definition of integration test suites. You can use these suites by passing --suite=name to pytest.
+# For example:
+#
+# ```bash
+# pytest tests/integration/ --suite=vision
+# ```
+#
+# Each suite can:
+# - restrict collection to specific roots (dirs or files)
+# - provide default CLI option values (e.g. text_model, embedding_model, etc.)
+
+from pathlib import Path
+
+this_dir = Path(__file__).parent
+default_roots = [
+    str(p)
+    for p in this_dir.glob("*")
+    if p.is_dir()
+    and p.name not in ("__pycache__", "fixtures", "test_cases", "recordings", "responses", "post_training")
+]
+
+SUITE_DEFINITIONS: dict[str, dict] = {
+    "base": {
+        "description": "Base suite that includes most tests but runs them with a text Ollama model",
+        "roots": default_roots,
+        "defaults": {
+            "text_model": "ollama/llama3.2:3b-instruct-fp16",
+            "embedding_model": "sentence-transformers/all-MiniLM-L6-v2",
+        },
+    },
+    "responses": {
+        "description": "Suite that includes only the OpenAI Responses tests; needs a strong tool-calling model",
+        "roots": ["tests/integration/responses"],
+        "defaults": {
+            "text_model": "openai/gpt-4o",
+            "embedding_model": "sentence-transformers/all-MiniLM-L6-v2",
+        },
+    },
+    "vision": {
+        "description": "Suite that includes only the vision tests",
+        "roots": ["tests/integration/inference/test_vision_inference.py"],
+        "defaults": {
+            "vision_model": "ollama/llama3.2-vision:11b",
+            "embedding_model": "sentence-transformers/all-MiniLM-L6-v2",
+        },
+    },
+}

From 7cd1c2c238969cb41ddb3d87b7dcfe5331350be1 Mon Sep 17 00:00:00 2001
From: Francisco Arceo <arceofrancisco@gmail.com>
Date: Sat, 6 Sep 2025 07:26:34 -0600
Subject: [PATCH 21/76] feat: Updating Rag Tool to use Files API and Vector
 Stores API (#3344)

---
 docs/source/getting_started/demo_script.py    |  5 +-
 .../inline/tool_runtime/rag/__init__.py       |  2 +-
 .../inline/tool_runtime/rag/memory.py         | 74 ++++++++++++++-----
 .../providers/registry/tool_runtime.py        |  2 +-
 .../integration/tool_runtime/test_rag_tool.py | 41 ++++++----
 tests/unit/rag/test_rag_query.py              |  8 +-
 6 files changed, 93 insertions(+), 39 deletions(-)

diff --git a/docs/source/getting_started/demo_script.py b/docs/source/getting_started/demo_script.py
index 777fc78c2..2ea67739f 100644
--- a/docs/source/getting_started/demo_script.py
+++ b/docs/source/getting_started/demo_script.py
@@ -18,12 +18,13 @@ embedding_model_id = (
 ).identifier
 embedding_dimension = em.metadata["embedding_dimension"]
 
-_ = client.vector_dbs.register(
+vector_db = client.vector_dbs.register(
     vector_db_id=vector_db_id,
     embedding_model=embedding_model_id,
     embedding_dimension=embedding_dimension,
     provider_id="faiss",
 )
+vector_db_id = vector_db.identifier
 source = "https://www.paulgraham.com/greatwork.html"
 print("rag_tool> Ingesting document:", source)
 document = RAGDocument(
@@ -35,7 +36,7 @@ document = RAGDocument(
 client.tool_runtime.rag_tool.insert(
     documents=[document],
     vector_db_id=vector_db_id,
-    chunk_size_in_tokens=50,
+    chunk_size_in_tokens=100,
 )
 agent = Agent(
     client,
diff --git a/llama_stack/providers/inline/tool_runtime/rag/__init__.py b/llama_stack/providers/inline/tool_runtime/rag/__init__.py
index f9a6e5c55..f9a7e7b89 100644
--- a/llama_stack/providers/inline/tool_runtime/rag/__init__.py
+++ b/llama_stack/providers/inline/tool_runtime/rag/__init__.py
@@ -14,6 +14,6 @@ from .config import RagToolRuntimeConfig
 async def get_provider_impl(config: RagToolRuntimeConfig, deps: dict[Api, Any]):
     from .memory import MemoryToolRuntimeImpl
 
-    impl = MemoryToolRuntimeImpl(config, deps[Api.vector_io], deps[Api.inference])
+    impl = MemoryToolRuntimeImpl(config, deps[Api.vector_io], deps[Api.inference], deps[Api.files])
     await impl.initialize()
     return impl
diff --git a/llama_stack/providers/inline/tool_runtime/rag/memory.py b/llama_stack/providers/inline/tool_runtime/rag/memory.py
index a1543457b..cb526e8ee 100644
--- a/llama_stack/providers/inline/tool_runtime/rag/memory.py
+++ b/llama_stack/providers/inline/tool_runtime/rag/memory.py
@@ -5,10 +5,15 @@
 # the root directory of this source tree.
 
 import asyncio
+import base64
+import io
+import mimetypes
 import secrets
 import string
 from typing import Any
 
+import httpx
+from fastapi import UploadFile
 from pydantic import TypeAdapter
 
 from llama_stack.apis.common.content_types import (
@@ -17,6 +22,7 @@ from llama_stack.apis.common.content_types import (
     InterleavedContentItem,
     TextContentItem,
 )
+from llama_stack.apis.files import Files, OpenAIFilePurpose
 from llama_stack.apis.inference import Inference
 from llama_stack.apis.tools import (
     ListToolDefsResponse,
@@ -30,13 +36,18 @@ from llama_stack.apis.tools import (
     ToolParameter,
     ToolRuntime,
 )
-from llama_stack.apis.vector_io import QueryChunksResponse, VectorIO
+from llama_stack.apis.vector_io import (
+    QueryChunksResponse,
+    VectorIO,
+    VectorStoreChunkingStrategyStatic,
+    VectorStoreChunkingStrategyStaticConfig,
+)
 from llama_stack.log import get_logger
 from llama_stack.providers.datatypes import ToolGroupsProtocolPrivate
 from llama_stack.providers.utils.inference.prompt_adapter import interleaved_content_as_str
 from llama_stack.providers.utils.memory.vector_store import (
     content_from_doc,
-    make_overlapped_chunks,
+    parse_data_url,
 )
 
 from .config import RagToolRuntimeConfig
@@ -55,10 +66,12 @@ class MemoryToolRuntimeImpl(ToolGroupsProtocolPrivate, ToolRuntime, RAGToolRunti
         config: RagToolRuntimeConfig,
         vector_io_api: VectorIO,
         inference_api: Inference,
+        files_api: Files,
     ):
         self.config = config
         self.vector_io_api = vector_io_api
         self.inference_api = inference_api
+        self.files_api = files_api
 
     async def initialize(self):
         pass
@@ -78,27 +91,50 @@ class MemoryToolRuntimeImpl(ToolGroupsProtocolPrivate, ToolRuntime, RAGToolRunti
         vector_db_id: str,
         chunk_size_in_tokens: int = 512,
     ) -> None:
-        chunks = []
+        if not documents:
+            return
+
         for doc in documents:
-            content = await content_from_doc(doc)
-            # TODO: we should add enrichment here as URLs won't be added to the metadata by default
-            chunks.extend(
-                make_overlapped_chunks(
-                    doc.document_id,
-                    content,
-                    chunk_size_in_tokens,
-                    chunk_size_in_tokens // 4,
-                    doc.metadata,
+            if isinstance(doc.content, URL):
+                if doc.content.uri.startswith("data:"):
+                    parts = parse_data_url(doc.content.uri)
+                    file_data = base64.b64decode(parts["data"]) if parts["is_base64"] else parts["data"].encode()
+                    mime_type = parts["mimetype"]
+                else:
+                    async with httpx.AsyncClient() as client:
+                        response = await client.get(doc.content.uri)
+                        file_data = response.content
+                        mime_type = doc.mime_type or response.headers.get("content-type", "application/octet-stream")
+            else:
+                content_str = await content_from_doc(doc)
+                file_data = content_str.encode("utf-8")
+                mime_type = doc.mime_type or "text/plain"
+
+            file_extension = mimetypes.guess_extension(mime_type) or ".txt"
+            filename = doc.metadata.get("filename", f"{doc.document_id}{file_extension}")
+
+            file_obj = io.BytesIO(file_data)
+            file_obj.name = filename
+
+            upload_file = UploadFile(file=file_obj, filename=filename)
+
+            created_file = await self.files_api.openai_upload_file(
+                file=upload_file, purpose=OpenAIFilePurpose.ASSISTANTS
+            )
+
+            chunking_strategy = VectorStoreChunkingStrategyStatic(
+                static=VectorStoreChunkingStrategyStaticConfig(
+                    max_chunk_size_tokens=chunk_size_in_tokens,
+                    chunk_overlap_tokens=chunk_size_in_tokens // 4,
                 )
             )
 
-        if not chunks:
-            return
-
-        await self.vector_io_api.insert_chunks(
-            chunks=chunks,
-            vector_db_id=vector_db_id,
-        )
+            await self.vector_io_api.openai_attach_file_to_vector_store(
+                vector_store_id=vector_db_id,
+                file_id=created_file.id,
+                attributes=doc.metadata,
+                chunking_strategy=chunking_strategy,
+            )
 
     async def query(
         self,
diff --git a/llama_stack/providers/registry/tool_runtime.py b/llama_stack/providers/registry/tool_runtime.py
index 661851443..5a58fa7af 100644
--- a/llama_stack/providers/registry/tool_runtime.py
+++ b/llama_stack/providers/registry/tool_runtime.py
@@ -32,7 +32,7 @@ def available_providers() -> list[ProviderSpec]:
             ],
             module="llama_stack.providers.inline.tool_runtime.rag",
             config_class="llama_stack.providers.inline.tool_runtime.rag.config.RagToolRuntimeConfig",
-            api_dependencies=[Api.vector_io, Api.inference],
+            api_dependencies=[Api.vector_io, Api.inference, Api.files],
             description="RAG (Retrieval-Augmented Generation) tool runtime for document ingestion, chunking, and semantic search.",
         ),
         remote_provider_spec(
diff --git a/tests/integration/tool_runtime/test_rag_tool.py b/tests/integration/tool_runtime/test_rag_tool.py
index 2affe2a2d..b208500d8 100644
--- a/tests/integration/tool_runtime/test_rag_tool.py
+++ b/tests/integration/tool_runtime/test_rag_tool.py
@@ -17,10 +17,14 @@ def client_with_empty_registry(client_with_models):
             client_with_models.vector_dbs.unregister(vector_db_id=vector_db_id)
 
     clear_registry()
+
+    try:
+        client_with_models.toolgroups.register(toolgroup_id="builtin::rag", provider_id="rag-runtime")
+    except Exception:
+        pass
+
     yield client_with_models
 
-    # you must clean after the last test if you were running tests against
-    # a stateful server instance
     clear_registry()
 
 
@@ -66,12 +70,13 @@ def assert_valid_text_response(response):
 def test_vector_db_insert_inline_and_query(
     client_with_empty_registry, sample_documents, embedding_model_id, embedding_dimension
 ):
-    vector_db_id = "test_vector_db"
-    client_with_empty_registry.vector_dbs.register(
-        vector_db_id=vector_db_id,
+    vector_db_name = "test_vector_db"
+    vector_db = client_with_empty_registry.vector_dbs.register(
+        vector_db_id=vector_db_name,
         embedding_model=embedding_model_id,
         embedding_dimension=embedding_dimension,
     )
+    vector_db_id = vector_db.identifier
 
     client_with_empty_registry.tool_runtime.rag_tool.insert(
         documents=sample_documents,
@@ -134,7 +139,11 @@ def test_vector_db_insert_from_url_and_query(
 
     # list to check memory bank is successfully registered
     available_vector_dbs = [vector_db.identifier for vector_db in client_with_empty_registry.vector_dbs.list()]
-    assert vector_db_id in available_vector_dbs
+    # VectorDB is being migrated to VectorStore, so the ID will be different
+    # Just check that at least one vector DB was registered
+    assert len(available_vector_dbs) > 0
+    # Use the actual registered vector_db_id for subsequent operations
+    actual_vector_db_id = available_vector_dbs[0]
 
     urls = [
         "memory_optimizations.rst",
@@ -153,13 +162,13 @@ def test_vector_db_insert_from_url_and_query(
 
     client_with_empty_registry.tool_runtime.rag_tool.insert(
         documents=documents,
-        vector_db_id=vector_db_id,
+        vector_db_id=actual_vector_db_id,
         chunk_size_in_tokens=512,
     )
 
     # Query for the name of method
     response1 = client_with_empty_registry.vector_io.query(
-        vector_db_id=vector_db_id,
+        vector_db_id=actual_vector_db_id,
         query="What's the name of the fine-tunning method used?",
     )
     assert_valid_chunk_response(response1)
@@ -167,7 +176,7 @@ def test_vector_db_insert_from_url_and_query(
 
     # Query for the name of model
     response2 = client_with_empty_registry.vector_io.query(
-        vector_db_id=vector_db_id,
+        vector_db_id=actual_vector_db_id,
         query="Which Llama model is mentioned?",
     )
     assert_valid_chunk_response(response2)
@@ -187,7 +196,11 @@ def test_rag_tool_insert_and_query(client_with_empty_registry, embedding_model_i
     )
 
     available_vector_dbs = [vector_db.identifier for vector_db in client_with_empty_registry.vector_dbs.list()]
-    assert vector_db_id in available_vector_dbs
+    # VectorDB is being migrated to VectorStore, so the ID will be different
+    # Just check that at least one vector DB was registered
+    assert len(available_vector_dbs) > 0
+    # Use the actual registered vector_db_id for subsequent operations
+    actual_vector_db_id = available_vector_dbs[0]
 
     urls = [
         "memory_optimizations.rst",
@@ -206,19 +219,19 @@ def test_rag_tool_insert_and_query(client_with_empty_registry, embedding_model_i
 
     client_with_empty_registry.tool_runtime.rag_tool.insert(
         documents=documents,
-        vector_db_id=vector_db_id,
+        vector_db_id=actual_vector_db_id,
         chunk_size_in_tokens=512,
     )
 
     response_with_metadata = client_with_empty_registry.tool_runtime.rag_tool.query(
-        vector_db_ids=[vector_db_id],
+        vector_db_ids=[actual_vector_db_id],
         content="What is the name of the method used for fine-tuning?",
     )
     assert_valid_text_response(response_with_metadata)
     assert any("metadata:" in chunk.text.lower() for chunk in response_with_metadata.content)
 
     response_without_metadata = client_with_empty_registry.tool_runtime.rag_tool.query(
-        vector_db_ids=[vector_db_id],
+        vector_db_ids=[actual_vector_db_id],
         content="What is the name of the method used for fine-tuning?",
         query_config={
             "include_metadata_in_content": True,
@@ -230,7 +243,7 @@ def test_rag_tool_insert_and_query(client_with_empty_registry, embedding_model_i
 
     with pytest.raises((ValueError, BadRequestError)):
         client_with_empty_registry.tool_runtime.rag_tool.query(
-            vector_db_ids=[vector_db_id],
+            vector_db_ids=[actual_vector_db_id],
             content="What is the name of the method used for fine-tuning?",
             query_config={
                 "chunk_template": "This should raise a ValueError because it is missing the proper template variables",
diff --git a/tests/unit/rag/test_rag_query.py b/tests/unit/rag/test_rag_query.py
index 05ccecb99..d18d90716 100644
--- a/tests/unit/rag/test_rag_query.py
+++ b/tests/unit/rag/test_rag_query.py
@@ -19,12 +19,16 @@ from llama_stack.providers.inline.tool_runtime.rag.memory import MemoryToolRunti
 
 class TestRagQuery:
     async def test_query_raises_on_empty_vector_db_ids(self):
-        rag_tool = MemoryToolRuntimeImpl(config=MagicMock(), vector_io_api=MagicMock(), inference_api=MagicMock())
+        rag_tool = MemoryToolRuntimeImpl(
+            config=MagicMock(), vector_io_api=MagicMock(), inference_api=MagicMock(), files_api=MagicMock()
+        )
         with pytest.raises(ValueError):
             await rag_tool.query(content=MagicMock(), vector_db_ids=[])
 
     async def test_query_chunk_metadata_handling(self):
-        rag_tool = MemoryToolRuntimeImpl(config=MagicMock(), vector_io_api=MagicMock(), inference_api=MagicMock())
+        rag_tool = MemoryToolRuntimeImpl(
+            config=MagicMock(), vector_io_api=MagicMock(), inference_api=MagicMock(), files_api=MagicMock()
+        )
         content = "test query content"
         vector_db_ids = ["db1"]
 

From d6c3b363904eedd9c5323594603dc4f2d5b581eb Mon Sep 17 00:00:00 2001
From: Matthew Farrellee <matt@cs.wisc.edu>
Date: Sat, 6 Sep 2025 15:22:20 -0400
Subject: [PATCH 22/76] chore: update the gemini inference impl to use
 openai-python for openai-compat functions (#3351)

# What does this PR do?

update the Gemini inference provider to use openai-python for the
openai-compat endpoints

partially addresses #3349, does not address /inference/completion or
/inference/chat-completion

## Test Plan

ci
---
 llama_stack/providers/registry/inference.py             | 2 +-
 llama_stack/providers/remote/inference/gemini/gemini.py | 8 +++++++-
 2 files changed, 8 insertions(+), 2 deletions(-)

diff --git a/llama_stack/providers/registry/inference.py b/llama_stack/providers/registry/inference.py
index 50956f58c..1bb3c3147 100644
--- a/llama_stack/providers/registry/inference.py
+++ b/llama_stack/providers/registry/inference.py
@@ -207,7 +207,7 @@ def available_providers() -> list[ProviderSpec]:
             api=Api.inference,
             adapter=AdapterSpec(
                 adapter_type="gemini",
-                pip_packages=["litellm"],
+                pip_packages=["litellm", "openai"],
                 module="llama_stack.providers.remote.inference.gemini",
                 config_class="llama_stack.providers.remote.inference.gemini.GeminiConfig",
                 provider_data_validator="llama_stack.providers.remote.inference.gemini.config.GeminiProviderDataValidator",
diff --git a/llama_stack/providers/remote/inference/gemini/gemini.py b/llama_stack/providers/remote/inference/gemini/gemini.py
index b6048eff7..569227fdd 100644
--- a/llama_stack/providers/remote/inference/gemini/gemini.py
+++ b/llama_stack/providers/remote/inference/gemini/gemini.py
@@ -5,12 +5,13 @@
 # the root directory of this source tree.
 
 from llama_stack.providers.utils.inference.litellm_openai_mixin import LiteLLMOpenAIMixin
+from llama_stack.providers.utils.inference.openai_mixin import OpenAIMixin
 
 from .config import GeminiConfig
 from .models import MODEL_ENTRIES
 
 
-class GeminiInferenceAdapter(LiteLLMOpenAIMixin):
+class GeminiInferenceAdapter(OpenAIMixin, LiteLLMOpenAIMixin):
     def __init__(self, config: GeminiConfig) -> None:
         LiteLLMOpenAIMixin.__init__(
             self,
@@ -21,6 +22,11 @@ class GeminiInferenceAdapter(LiteLLMOpenAIMixin):
         )
         self.config = config
 
+    get_api_key = LiteLLMOpenAIMixin.get_api_key
+
+    def get_base_url(self):
+        return "https://generativelanguage.googleapis.com/v1beta/openai/"
+
     async def initialize(self) -> None:
         await super().initialize()
 

From 4c28544c04ab96c5c4d188dda3a53dc2eab0415d Mon Sep 17 00:00:00 2001
From: Matthew Farrellee <matt@cs.wisc.edu>
Date: Sat, 6 Sep 2025 15:22:44 -0400
Subject: [PATCH 23/76] chore(gemini, tests): add skips for n and completions,
 gemini api does not support them (#3350)

# What does this PR do?

the gemini api endpoints do not support the n param or completions


## Test Plan

ci
---
 tests/integration/inference/test_openai_completion.py | 4 ++++
 1 file changed, 4 insertions(+)

diff --git a/tests/integration/inference/test_openai_completion.py b/tests/integration/inference/test_openai_completion.py
index bb447b3c1..099032578 100644
--- a/tests/integration/inference/test_openai_completion.py
+++ b/tests/integration/inference/test_openai_completion.py
@@ -37,6 +37,7 @@ def skip_if_model_doesnt_support_openai_completion(client_with_models, model_id)
         "remote::sambanova",
         "remote::tgi",
         "remote::vertexai",
+        "remote::gemini",  # https://generativelanguage.googleapis.com/v1beta/openai/completions -> 404
     ):
         pytest.skip(f"Model {model_id} hosted by {provider.provider_type} doesn't support OpenAI completions.")
 
@@ -63,6 +64,9 @@ def skip_if_doesnt_support_n(client_with_models, model_id):
     if provider.provider_type in (
         "remote::sambanova",
         "remote::ollama",
+        # Error code: 400 - [{'error': {'code': 400, 'message': 'Only one candidate can be specified in the
+        # current model', 'status': 'INVALID_ARGUMENT'}}]
+        "remote::gemini",
     ):
         pytest.skip(f"Model {model_id} hosted by {provider.provider_type} doesn't support n param.")
 

From bf02cd846fdc39db80291746e06ca547e5afdbdb Mon Sep 17 00:00:00 2001
From: Matthew Farrellee <matt@cs.wisc.edu>
Date: Sat, 6 Sep 2025 15:25:13 -0400
Subject: [PATCH 24/76] chore: update the sambanova inference impl to use
 openai-python for openai-compat functions (#3345)

# What does this PR do?

update SambaNova inference provider to use OpenAIMixin for openai-compat
endpoints

## Test Plan

```
$ SAMBANOVA_API_KEY=... uv run llama stack build --image-type venv --providers inference=remote::sambanova --run
...
$ LLAMA_STACK_CONFIG=http://localhost:8321 uv run --group test pytest -v -ra --text-model sambanova/Meta-Llama-3.3-70B-Instruct tests/integration/inference -k 'not store'
...
FAILED tests/integration/inference/test_text_inference.py::test_text_chat_completion_tool_calling_tools_not_in_request[txt=sambanova/Meta-Llama-3.3-70B-Instruct-inference:chat_completion:tool_calling_tools_absent-True] - AttributeError: 'NoneType' object has no attribute 'delta'
FAILED tests/integration/inference/test_text_inference.py::test_text_chat_completion_tool_calling_tools_not_in_request[txt=sambanova/Meta-Llama-3.3-70B-Instruct-inference:chat_completion:tool_calling_tools_absent-False] - llama_stack_client.InternalServerError: Error code: 500 - {'detail': 'Internal server error: An une...
=========== 2 failed, 16 passed, 68 skipped, 8 deselected, 3 xfailed, 13 warnings in 15.85s ============
```

the two failures also exist before this change. they are part of the
deprecated inference.chat_completion tests that flow through litellm.
they can be resolved later.
---
 llama_stack/providers/registry/inference.py   |  2 +-
 .../remote/inference/sambanova/sambanova.py   | 26 ++++++++++++++++++-
 2 files changed, 26 insertions(+), 2 deletions(-)

diff --git a/llama_stack/providers/registry/inference.py b/llama_stack/providers/registry/inference.py
index 1bb3c3147..7a95fd089 100644
--- a/llama_stack/providers/registry/inference.py
+++ b/llama_stack/providers/registry/inference.py
@@ -270,7 +270,7 @@ Available Models:
             api=Api.inference,
             adapter=AdapterSpec(
                 adapter_type="sambanova",
-                pip_packages=["litellm"],
+                pip_packages=["litellm", "openai"],
                 module="llama_stack.providers.remote.inference.sambanova",
                 config_class="llama_stack.providers.remote.inference.sambanova.SambaNovaImplConfig",
                 provider_data_validator="llama_stack.providers.remote.inference.sambanova.config.SambaNovaProviderDataValidator",
diff --git a/llama_stack/providers/remote/inference/sambanova/sambanova.py b/llama_stack/providers/remote/inference/sambanova/sambanova.py
index 96469acac..ee3b0f648 100644
--- a/llama_stack/providers/remote/inference/sambanova/sambanova.py
+++ b/llama_stack/providers/remote/inference/sambanova/sambanova.py
@@ -4,13 +4,26 @@
 # This source code is licensed under the terms described in the LICENSE file in
 # the root directory of this source tree.
 
+
 from llama_stack.providers.utils.inference.litellm_openai_mixin import LiteLLMOpenAIMixin
+from llama_stack.providers.utils.inference.openai_mixin import OpenAIMixin
 
 from .config import SambaNovaImplConfig
 from .models import MODEL_ENTRIES
 
 
-class SambaNovaInferenceAdapter(LiteLLMOpenAIMixin):
+class SambaNovaInferenceAdapter(OpenAIMixin, LiteLLMOpenAIMixin):
+    """
+    SambaNova Inference Adapter for Llama Stack.
+
+    Note: The inheritance order is important here. OpenAIMixin must come before
+    LiteLLMOpenAIMixin to ensure that OpenAIMixin.check_model_availability()
+    is used instead of LiteLLMOpenAIMixin.check_model_availability().
+
+    - OpenAIMixin.check_model_availability() queries the /v1/models to check if a model exists
+    - LiteLLMOpenAIMixin.check_model_availability() checks the static registry within LiteLLM
+    """
+
     def __init__(self, config: SambaNovaImplConfig):
         self.config = config
         self.environment_available_models = []
@@ -24,3 +37,14 @@ class SambaNovaInferenceAdapter(LiteLLMOpenAIMixin):
             download_images=True,  # SambaNova requires base64 image encoding
             json_schema_strict=False,  # SambaNova doesn't support strict=True yet
         )
+
+    # Delegate the client data handling get_api_key method to LiteLLMOpenAIMixin
+    get_api_key = LiteLLMOpenAIMixin.get_api_key
+
+    def get_base_url(self) -> str:
+        """
+        Get the base URL for OpenAI mixin.
+
+        :return: The SambaNova base URL
+        """
+        return self.config.url

From 9252d9fc018487ef7bd6ac400ed329cd5db1e8c4 Mon Sep 17 00:00:00 2001
From: Matthew Farrellee <matt@cs.wisc.edu>
Date: Sat, 6 Sep 2025 15:35:30 -0400
Subject: [PATCH 25/76] chore(groq test): skip with_n tests for groq, it is not
 supported server-side (#3346)

# What does this PR do?

skip the with_n test for groq, because it isn't supported by the
provider's service

see
https://console.groq.com/docs/openai#currently-unsupported-openai-features

Co-authored-by: raghotham <rsm@meta.com>
---
 tests/integration/inference/test_openai_completion.py | 3 +++
 1 file changed, 3 insertions(+)

diff --git a/tests/integration/inference/test_openai_completion.py b/tests/integration/inference/test_openai_completion.py
index 099032578..2043f6aeb 100644
--- a/tests/integration/inference/test_openai_completion.py
+++ b/tests/integration/inference/test_openai_completion.py
@@ -64,6 +64,9 @@ def skip_if_doesnt_support_n(client_with_models, model_id):
     if provider.provider_type in (
         "remote::sambanova",
         "remote::ollama",
+        # https://console.groq.com/docs/openai#currently-unsupported-openai-features
+        # -> Error code: 400 - {'error': {'message': "'n' : number must be at most 1", 'type': 'invalid_request_error'}}
+        "remote::groq",
         # Error code: 400 - [{'error': {'code': 400, 'message': 'Only one candidate can be specified in the
         # current model', 'status': 'INVALID_ARGUMENT'}}]
         "remote::gemini",

From ecd9d8dc1a70ea70ea06253869392afac3abdb40 Mon Sep 17 00:00:00 2001
From: Charlie Doern <cdoern@redhat.com>
Date: Sat, 6 Sep 2025 15:40:33 -0400
Subject: [PATCH 26/76] test: introduce api conformance test (#3257)

# What does this PR do?

this test runs on each PR and uses a new conformance workflow to compare
the base (main) branch openapi spec to the one on this PR if one of our
"stable" APIs change, the test will fail.

this workflow uses `oasdiff` to identify breaking changes for paths we
want to ensure comptability for.

specifically this is using `oasdiff breaking` with `--match-path` which
only checks breaking changes for the specified paths.

As a follow up to this, we can add an optional way to make it so that it
is OK to make these change if properly documented or in a changelog or
something. or by using a label on the PR to override the failing test.

related to #3237


## Test Plan

conformance test should pass given there are no changes

Signed-off-by: Charlie Doern <cdoern@redhat.com>
---
 .github/workflows/README.md       |  1 +
 .github/workflows/conformance.yml | 57 +++++++++++++++++++++++++++++++
 2 files changed, 58 insertions(+)
 create mode 100644 .github/workflows/conformance.yml

diff --git a/.github/workflows/README.md b/.github/workflows/README.md
index 2e0df58b8..059bb873f 100644
--- a/.github/workflows/README.md
+++ b/.github/workflows/README.md
@@ -5,6 +5,7 @@ Llama Stack uses GitHub Actions for Continuous Integration (CI). Below is a tabl
 | Name | File | Purpose |
 | ---- | ---- | ------- |
 | Update Changelog | [changelog.yml](changelog.yml) | Creates PR for updating the CHANGELOG.md |
+| API Conformance Tests | [conformance.yml](conformance.yml) | Run the API Conformance test suite on the changes. |
 | Installer CI | [install-script-ci.yml](install-script-ci.yml) | Test the installation script |
 | Integration Auth Tests | [integration-auth-tests.yml](integration-auth-tests.yml) | Run the integration test suite with Kubernetes authentication |
 | SqlStore Integration Tests | [integration-sql-store-tests.yml](integration-sql-store-tests.yml) | Run the integration test suite with SqlStore |
diff --git a/.github/workflows/conformance.yml b/.github/workflows/conformance.yml
new file mode 100644
index 000000000..2433b0203
--- /dev/null
+++ b/.github/workflows/conformance.yml
@@ -0,0 +1,57 @@
+# API Conformance Tests
+# This workflow ensures that API changes maintain backward compatibility and don't break existing integrations
+# It runs schema validation and OpenAPI diff checks to catch breaking changes early
+
+name: API Conformance Tests
+
+run-name: Run the API Conformance test suite on the changes.
+
+on:
+  push:
+    branches: [ main ]
+  pull_request:
+    branches: [ main ]
+    types: [opened, synchronize, reopened]
+    paths:
+      - 'llama_stack/**'
+      - '!llama_stack/ui/**'
+      - 'tests/**'
+      - 'uv.lock'
+      - 'pyproject.toml'
+      - '.github/workflows/conformance.yml' # This workflow itself
+
+concurrency:
+  group: ${{ github.workflow }}-${{ github.ref == 'refs/heads/main' && github.run_id || github.ref }}
+  # Cancel in-progress runs when new commits are pushed to avoid wasting CI resources
+  cancel-in-progress: true
+
+jobs:
+  # Job to check if API schema changes maintain backward compatibility
+  check-schema-compatibility:
+    runs-on: ubuntu-latest
+    steps:
+      # Using specific version 4.1.7 because 5.0.0 fails when trying to run this locally using `act`
+      # This ensures consistent behavior between local testing and CI
+      - name: Checkout PR Code
+        uses: actions/checkout@692973e3d937129bcbf40652eb9f2f61becf3332 # v4.1.7
+
+      # Checkout the base branch to compare against (usually main)
+      # This allows us to diff the current changes against the previous state
+      - name: Checkout Base Branch
+        uses: actions/checkout@692973e3d937129bcbf40652eb9f2f61becf3332 # v4.1.7
+        with:
+          ref: ${{ github.event.pull_request.base.ref }}
+          path: 'base'
+
+      # Install oasdiff: https://github.com/oasdiff/oasdiff, a tool for detecting breaking changes in OpenAPI specs.
+      - name: Install oasdiff
+        run: |
+          curl -fsSL https://raw.githubusercontent.com/oasdiff/oasdiff/main/install.sh | sh
+
+      # Run oasdiff to detect breaking changes in the API specification
+      # This step will fail if incompatible changes are detected, preventing breaking changes from being merged
+      - name: Run OpenAPI Breaking Change Diff
+        run: |
+          oasdiff breaking --fail-on ERR base/docs/_static/llama-stack-spec.yaml docs/_static/llama-stack-spec.yaml --match-path '^/v1/openai/v1' \
+          --match-path '^/v1/vector-io' \
+          --match-path '^/v1/vector-dbs'

From d23607483fc8ca63ea15db5a95f672aec249d2e1 Mon Sep 17 00:00:00 2001
From: Matthew Farrellee <matt@cs.wisc.edu>
Date: Sat, 6 Sep 2025 18:36:27 -0400
Subject: [PATCH 27/76] chore: update the groq inference impl to use
 openai-python for openai-compat functions (#3348)

# What does this PR do?

update Groq inference provider to use OpenAIMixin for openai-compat
endpoints

changes on api.groq.com -
- json_schema is now supported for specific models, see
https://console.groq.com/docs/structured-outputs#supported-models
- response_format with streaming is now supported for models that
support response_format
- groq no longer returns a 400 error if tools are provided and
tool_choice is not "required"


## Test Plan

```
$ GROQ_API_KEY=... uv run llama stack build --image-type venv --providers inference=remote::groq --run
...
$ LLAMA_STACK_CONFIG=http://localhost:8321 uv run --group test pytest -v -ra --text-model groq/llama-3.3-70b-versatile tests/integration/inference/test_openai_completion.py -k 'not store'
...
SKIPPED [3] tests/integration/inference/test_openai_completion.py:44: Model groq/llama-3.3-70b-versatile hosted by remote::groq doesn't support OpenAI completions.
SKIPPED [3] tests/integration/inference/test_openai_completion.py:94: Model groq/llama-3.3-70b-versatile hosted by remote::groq doesn't support vllm extra_body parameters.
SKIPPED [4] tests/integration/inference/test_openai_completion.py:73: Model groq/llama-3.3-70b-versatile hosted by remote::groq doesn't support n param.
SKIPPED [1] tests/integration/inference/test_openai_completion.py:100: Model groq/llama-3.3-70b-versatile hosted by remote::groq doesn't support chat completion calls with base64 encoded files.
======================= 8 passed, 11 skipped, 8 deselected, 2 warnings in 5.13s ========================
```

---------

Co-authored-by: raghotham <rsm@meta.com>
---
 llama_stack/providers/registry/inference.py   |   2 +-
 .../providers/remote/inference/groq/groq.py   | 139 +-----------------
 .../test_inference_client_caching.py          |   3 +-
 3 files changed, 10 insertions(+), 134 deletions(-)

diff --git a/llama_stack/providers/registry/inference.py b/llama_stack/providers/registry/inference.py
index 7a95fd089..4176f85a6 100644
--- a/llama_stack/providers/registry/inference.py
+++ b/llama_stack/providers/registry/inference.py
@@ -248,7 +248,7 @@ Available Models:
             api=Api.inference,
             adapter=AdapterSpec(
                 adapter_type="groq",
-                pip_packages=["litellm"],
+                pip_packages=["litellm", "openai"],
                 module="llama_stack.providers.remote.inference.groq",
                 config_class="llama_stack.providers.remote.inference.groq.GroqConfig",
                 provider_data_validator="llama_stack.providers.remote.inference.groq.config.GroqProviderDataValidator",
diff --git a/llama_stack/providers/remote/inference/groq/groq.py b/llama_stack/providers/remote/inference/groq/groq.py
index fd7212de4..888953af0 100644
--- a/llama_stack/providers/remote/inference/groq/groq.py
+++ b/llama_stack/providers/remote/inference/groq/groq.py
@@ -4,30 +4,15 @@
 # This source code is licensed under the terms described in the LICENSE file in
 # the root directory of this source tree.
 
-from collections.abc import AsyncIterator
-from typing import Any
 
-from openai import AsyncOpenAI
-
-from llama_stack.apis.inference import (
-    OpenAIChatCompletion,
-    OpenAIChatCompletionChunk,
-    OpenAIChoiceDelta,
-    OpenAIChunkChoice,
-    OpenAIMessageParam,
-    OpenAIResponseFormatParam,
-    OpenAISystemMessageParam,
-)
 from llama_stack.providers.remote.inference.groq.config import GroqConfig
 from llama_stack.providers.utils.inference.litellm_openai_mixin import LiteLLMOpenAIMixin
-from llama_stack.providers.utils.inference.openai_compat import (
-    prepare_openai_completion_params,
-)
+from llama_stack.providers.utils.inference.openai_mixin import OpenAIMixin
 
 from .models import MODEL_ENTRIES
 
 
-class GroqInferenceAdapter(LiteLLMOpenAIMixin):
+class GroqInferenceAdapter(OpenAIMixin, LiteLLMOpenAIMixin):
     _config: GroqConfig
 
     def __init__(self, config: GroqConfig):
@@ -40,122 +25,14 @@ class GroqInferenceAdapter(LiteLLMOpenAIMixin):
         )
         self.config = config
 
+    # Delegate the client data handling get_api_key method to LiteLLMOpenAIMixin
+    get_api_key = LiteLLMOpenAIMixin.get_api_key
+
+    def get_base_url(self) -> str:
+        return f"{self.config.url}/openai/v1"
+
     async def initialize(self):
         await super().initialize()
 
     async def shutdown(self):
         await super().shutdown()
-
-    def _get_openai_client(self) -> AsyncOpenAI:
-        return AsyncOpenAI(
-            base_url=f"{self.config.url}/openai/v1",
-            api_key=self.get_api_key(),
-        )
-
-    async def openai_chat_completion(
-        self,
-        model: str,
-        messages: list[OpenAIMessageParam],
-        frequency_penalty: float | None = None,
-        function_call: str | dict[str, Any] | None = None,
-        functions: list[dict[str, Any]] | None = None,
-        logit_bias: dict[str, float] | None = None,
-        logprobs: bool | None = None,
-        max_completion_tokens: int | None = None,
-        max_tokens: int | None = None,
-        n: int | None = None,
-        parallel_tool_calls: bool | None = None,
-        presence_penalty: float | None = None,
-        response_format: OpenAIResponseFormatParam | None = None,
-        seed: int | None = None,
-        stop: str | list[str] | None = None,
-        stream: bool | None = None,
-        stream_options: dict[str, Any] | None = None,
-        temperature: float | None = None,
-        tool_choice: str | dict[str, Any] | None = None,
-        tools: list[dict[str, Any]] | None = None,
-        top_logprobs: int | None = None,
-        top_p: float | None = None,
-        user: str | None = None,
-    ) -> OpenAIChatCompletion | AsyncIterator[OpenAIChatCompletionChunk]:
-        model_obj = await self.model_store.get_model(model)
-
-        # Groq does not support json_schema response format, so we need to convert it to json_object
-        if response_format and response_format.type == "json_schema":
-            response_format.type = "json_object"
-            schema = response_format.json_schema.get("schema", {})
-            response_format.json_schema = None
-            json_instructions = f"\nYour response should be a JSON object that matches the following schema: {schema}"
-            if messages and messages[0].role == "system":
-                messages[0].content = messages[0].content + json_instructions
-            else:
-                messages.insert(0, OpenAISystemMessageParam(content=json_instructions))
-
-        # Groq returns a 400 error if tools are provided but none are called
-        # So, set tool_choice to "required" to attempt to force a call
-        if tools and (not tool_choice or tool_choice == "auto"):
-            tool_choice = "required"
-
-        params = await prepare_openai_completion_params(
-            model=model_obj.provider_resource_id,
-            messages=messages,
-            frequency_penalty=frequency_penalty,
-            function_call=function_call,
-            functions=functions,
-            logit_bias=logit_bias,
-            logprobs=logprobs,
-            max_completion_tokens=max_completion_tokens,
-            max_tokens=max_tokens,
-            n=n,
-            parallel_tool_calls=parallel_tool_calls,
-            presence_penalty=presence_penalty,
-            response_format=response_format,
-            seed=seed,
-            stop=stop,
-            stream=stream,
-            stream_options=stream_options,
-            temperature=temperature,
-            tool_choice=tool_choice,
-            tools=tools,
-            top_logprobs=top_logprobs,
-            top_p=top_p,
-            user=user,
-        )
-
-        # Groq does not support streaming requests that set response_format
-        fake_stream = False
-        if stream and response_format:
-            params["stream"] = False
-            fake_stream = True
-
-        response = await self._get_openai_client().chat.completions.create(**params)
-
-        if fake_stream:
-            chunk_choices = []
-            for choice in response.choices:
-                delta = OpenAIChoiceDelta(
-                    content=choice.message.content,
-                    role=choice.message.role,
-                    tool_calls=choice.message.tool_calls,
-                )
-                chunk_choice = OpenAIChunkChoice(
-                    delta=delta,
-                    finish_reason=choice.finish_reason,
-                    index=choice.index,
-                    logprobs=None,
-                )
-                chunk_choices.append(chunk_choice)
-            chunk = OpenAIChatCompletionChunk(
-                id=response.id,
-                choices=chunk_choices,
-                object="chat.completion.chunk",
-                created=response.created,
-                model=response.model,
-            )
-
-            async def _fake_stream_generator():
-                yield chunk
-
-            return _fake_stream_generator()
-        else:
-            return response
diff --git a/tests/unit/providers/inference/test_inference_client_caching.py b/tests/unit/providers/inference/test_inference_client_caching.py
index b371cf907..f4b3201e9 100644
--- a/tests/unit/providers/inference/test_inference_client_caching.py
+++ b/tests/unit/providers/inference/test_inference_client_caching.py
@@ -33,8 +33,7 @@ def test_groq_provider_openai_client_caching():
         with request_provider_data_context(
             {"x-llamastack-provider-data": json.dumps({inference_adapter.provider_data_api_key_field: api_key})}
         ):
-            openai_client = inference_adapter._get_openai_client()
-            assert openai_client.api_key == api_key
+            assert inference_adapter.client.api_key == api_key
 
 
 def test_openai_provider_openai_client_caching():

From 78cab5331a78d27b084a04c0d8e302a51d5d2c4d Mon Sep 17 00:00:00 2001
From: Matthew Farrellee <matt@cs.wisc.edu>
Date: Sat, 6 Sep 2025 19:21:55 -0400
Subject: [PATCH 28/76] chore(groq test): skip completions tests for groq, api
 is not supported server-side (#3347)

# What does this PR do?

skip /v1/completions tests on groq, endpoint is not supported

Co-authored-by: raghotham <rsm@meta.com>
---
 tests/integration/inference/test_openai_completion.py | 3 +++
 1 file changed, 3 insertions(+)

diff --git a/tests/integration/inference/test_openai_completion.py b/tests/integration/inference/test_openai_completion.py
index 2043f6aeb..aee75b21d 100644
--- a/tests/integration/inference/test_openai_completion.py
+++ b/tests/integration/inference/test_openai_completion.py
@@ -37,6 +37,9 @@ def skip_if_model_doesnt_support_openai_completion(client_with_models, model_id)
         "remote::sambanova",
         "remote::tgi",
         "remote::vertexai",
+        # {"error":{"message":"Unknown request URL: GET /openai/v1/completions. Please check the URL for typos,
+        # or see the docs at https://console.groq.com/docs/","type":"invalid_request_error","code":"unknown_url"}}
+        "remote::groq",
         "remote::gemini",  # https://generativelanguage.googleapis.com/v1beta/openai/completions -> 404
     ):
         pytest.skip(f"Model {model_id} hosted by {provider.provider_type} doesn't support OpenAI completions.")

From 6a35bd7bb6186d2ee60bbc3de0e2a349b12796f0 Mon Sep 17 00:00:00 2001
From: Matthew Farrellee <matt@cs.wisc.edu>
Date: Sun, 7 Sep 2025 17:00:42 -0400
Subject: [PATCH 29/76] chore: update the anthropic inference impl to use
 openai-python for openai-compat functions (#3366)

# What does this PR do?

update the Anthropic inference provider to use openai-python for the
openai-compat endpoints

## Test Plan

ci

Co-authored-by: raghotham <rsm@meta.com>
---
 .../providers/remote/inference/anthropic/anthropic.py     | 8 +++++++-
 tests/integration/inference/test_openai_completion.py     | 3 +++
 2 files changed, 10 insertions(+), 1 deletion(-)

diff --git a/llama_stack/providers/remote/inference/anthropic/anthropic.py b/llama_stack/providers/remote/inference/anthropic/anthropic.py
index 31626082b..0f247218d 100644
--- a/llama_stack/providers/remote/inference/anthropic/anthropic.py
+++ b/llama_stack/providers/remote/inference/anthropic/anthropic.py
@@ -5,12 +5,13 @@
 # the root directory of this source tree.
 
 from llama_stack.providers.utils.inference.litellm_openai_mixin import LiteLLMOpenAIMixin
+from llama_stack.providers.utils.inference.openai_mixin import OpenAIMixin
 
 from .config import AnthropicConfig
 from .models import MODEL_ENTRIES
 
 
-class AnthropicInferenceAdapter(LiteLLMOpenAIMixin):
+class AnthropicInferenceAdapter(OpenAIMixin, LiteLLMOpenAIMixin):
     def __init__(self, config: AnthropicConfig) -> None:
         LiteLLMOpenAIMixin.__init__(
             self,
@@ -26,3 +27,8 @@ class AnthropicInferenceAdapter(LiteLLMOpenAIMixin):
 
     async def shutdown(self) -> None:
         await super().shutdown()
+
+    get_api_key = LiteLLMOpenAIMixin.get_api_key
+
+    def get_base_url(self):
+        return "https://api.anthropic.com/v1"
diff --git a/tests/integration/inference/test_openai_completion.py b/tests/integration/inference/test_openai_completion.py
index aee75b21d..df1184f1c 100644
--- a/tests/integration/inference/test_openai_completion.py
+++ b/tests/integration/inference/test_openai_completion.py
@@ -41,6 +41,7 @@ def skip_if_model_doesnt_support_openai_completion(client_with_models, model_id)
         # or see the docs at https://console.groq.com/docs/","type":"invalid_request_error","code":"unknown_url"}}
         "remote::groq",
         "remote::gemini",  # https://generativelanguage.googleapis.com/v1beta/openai/completions -> 404
+        "remote::anthropic",  # at least claude-3-{5,7}-{haiku,sonnet}-* / claude-{sonnet,opus}-4-* are not supported
     ):
         pytest.skip(f"Model {model_id} hosted by {provider.provider_type} doesn't support OpenAI completions.")
 
@@ -73,6 +74,8 @@ def skip_if_doesnt_support_n(client_with_models, model_id):
         # Error code: 400 - [{'error': {'code': 400, 'message': 'Only one candidate can be specified in the
         # current model', 'status': 'INVALID_ARGUMENT'}}]
         "remote::gemini",
+        # https://docs.anthropic.com/en/api/openai-sdk#simple-fields
+        "remote::anthropic",
     ):
         pytest.skip(f"Model {model_id} hosted by {provider.provider_type} doesn't support n param.")
 

From fe134d90e5488725da179d5283f126787d61a89b Mon Sep 17 00:00:00 2001
From: "dependabot[bot]" <49699333+dependabot[bot]@users.noreply.github.com>
Date: Mon, 8 Sep 2025 09:58:45 +0200
Subject: [PATCH 30/76] chore(ui-deps): bump react-dom and @types/react-dom in
 /llama_stack/ui (#3360)
MIME-Version: 1.0
Content-Type: text/plain; charset=UTF-8
Content-Transfer-Encoding: 8bit

Bumps
[react-dom](https://github.com/facebook/react/tree/HEAD/packages/react-dom)
and
[@types/react-dom](https://github.com/DefinitelyTyped/DefinitelyTyped/tree/HEAD/types/react-dom).
These dependencies needed to be updated together.
Updates `react-dom` from 19.1.0 to 19.1.1
<details>
<summary>Release notes</summary>
<p><em>Sourced from <a
href="https://github.com/facebook/react/releases">react-dom's
releases</a>.</em></p>
<blockquote>
<h2>19.1.1 (July 28, 2025)</h2>
<h3>React</h3>
<ul>
<li>Fixed Owner Stacks to work with ES2015 function.name semantics (<a
href="https://redirect.github.com/facebook/react/pull/33680">#33680</a>
by <a href="https://github.com/hoxyq"><code>@​hoxyq</code></a>)</li>
</ul>
</blockquote>
</details>
<details>
<summary>Changelog</summary>
<p><em>Sourced from <a
href="https://github.com/facebook/react/blob/main/CHANGELOG.md">react-dom's
changelog</a>.</em></p>
<blockquote>
<h2>19.1.1 (July 28, 2025)</h2>
<h3>React</h3>
<ul>
<li>Fixed Owner Stacks to work with ES2015 function.name semantics (<a
href="https://redirect.github.com/facebook/react/pull/33680">#33680</a>
by <a href="https://github.com/hoxyq"><code>@​hoxyq</code></a>)</li>
</ul>
</blockquote>
</details>
<details>
<summary>Commits</summary>
<ul>
<li><a
href="https://github.com/facebook/react/commit/87e33ca2b7c4479342091ae642f01266af7ebec9"><code>87e33ca</code></a>
Set release versions to 19.1.1</li>
<li><a
href="https://github.com/facebook/react/commit/b793948e15ff714fadea026dcaef9385dce14a19"><code>b793948</code></a>
Bump next prerelease version numbers (<a
href="https://github.com/facebook/react/tree/HEAD/packages/react-dom/issues/32782">#32782</a>)</li>
<li>See full diff in <a
href="https://github.com/facebook/react/commits/v19.1.1/packages/react-dom">compare
view</a></li>
</ul>
</details>
<br />

Updates `@types/react-dom` from 19.1.5 to 19.1.9
<details>
<summary>Commits</summary>
<ul>
<li>See full diff in <a
href="https://github.com/DefinitelyTyped/DefinitelyTyped/commits/HEAD/types/react-dom">compare
view</a></li>
</ul>
</details>
<br />


Dependabot will resolve any conflicts with this PR as long as you don't
alter it yourself. You can also trigger a rebase manually by commenting
`@dependabot rebase`.

[//]: # (dependabot-automerge-start)
[//]: # (dependabot-automerge-end)

---

<details>
<summary>Dependabot commands and options</summary>
<br />

You can trigger Dependabot actions by commenting on this PR:
- `@dependabot rebase` will rebase this PR
- `@dependabot recreate` will recreate this PR, overwriting any edits
that have been made to it
- `@dependabot merge` will merge this PR after your CI passes on it
- `@dependabot squash and merge` will squash and merge this PR after
your CI passes on it
- `@dependabot cancel merge` will cancel a previously requested merge
and block automerging
- `@dependabot reopen` will reopen this PR if it is closed
- `@dependabot close` will close this PR and stop Dependabot recreating
it. You can achieve the same result by closing it manually
- `@dependabot show <dependency name> ignore conditions` will show all
of the ignore conditions of the specified dependency
- `@dependabot ignore this major version` will close this PR and stop
Dependabot creating any more for this major version (unless you reopen
the PR or upgrade to it yourself)
- `@dependabot ignore this minor version` will close this PR and stop
Dependabot creating any more for this minor version (unless you reopen
the PR or upgrade to it yourself)
- `@dependabot ignore this dependency` will close this PR and stop
Dependabot creating any more for this dependency (unless you reopen the
PR or upgrade to it yourself)


</details>

Signed-off-by: dependabot[bot] <support@github.com>
Co-authored-by: dependabot[bot] <49699333+dependabot[bot]@users.noreply.github.com>
---
 llama_stack/ui/package-lock.json | 22 +++++++++++-----------
 llama_stack/ui/package.json      |  2 +-
 2 files changed, 12 insertions(+), 12 deletions(-)

diff --git a/llama_stack/ui/package-lock.json b/llama_stack/ui/package-lock.json
index 7873cdfd5..05ccdb708 100644
--- a/llama_stack/ui/package-lock.json
+++ b/llama_stack/ui/package-lock.json
@@ -24,7 +24,7 @@
         "next-auth": "^4.24.11",
         "next-themes": "^0.4.6",
         "react": "^19.0.0",
-        "react-dom": "^19.0.0",
+        "react-dom": "^19.1.1",
         "react-markdown": "^10.1.0",
         "remark-gfm": "^4.0.1",
         "remeda": "^2.30.0",
@@ -4079,9 +4079,9 @@
       }
     },
     "node_modules/@types/react-dom": {
-      "version": "19.1.5",
-      "resolved": "https://registry.npmjs.org/@types/react-dom/-/react-dom-19.1.5.tgz",
-      "integrity": "sha512-CMCjrWucUBZvohgZxkjd6S9h0nZxXjzus6yDfUb+xLxYM7VvjKNH1tQrE9GWLql1XoOP4/Ds3bwFqShHUYraGg==",
+      "version": "19.1.9",
+      "resolved": "https://registry.npmjs.org/@types/react-dom/-/react-dom-19.1.9.tgz",
+      "integrity": "sha512-qXRuZaOsAdXKFyOhRBg6Lqqc0yay13vN7KrIg4L7N4aaHN68ma9OK3NE1BoDFgFOTfM7zg+3/8+2n8rLUH3OKQ==",
       "devOptional": true,
       "license": "MIT",
       "peerDependencies": {
@@ -12448,24 +12448,24 @@
       }
     },
     "node_modules/react": {
-      "version": "19.1.0",
-      "resolved": "https://registry.npmjs.org/react/-/react-19.1.0.tgz",
-      "integrity": "sha512-FS+XFBNvn3GTAWq26joslQgWNoFu08F4kl0J4CgdNKADkdSGXQyTCnKteIAJy96Br6YbpEU1LSzV5dYtjMkMDg==",
+      "version": "19.1.1",
+      "resolved": "https://registry.npmjs.org/react/-/react-19.1.1.tgz",
+      "integrity": "sha512-w8nqGImo45dmMIfljjMwOGtbmC/mk4CMYhWIicdSflH91J9TyCyczcPFXJzrZ/ZXcgGRFeP6BU0BEJTw6tZdfQ==",
       "license": "MIT",
       "engines": {
         "node": ">=0.10.0"
       }
     },
     "node_modules/react-dom": {
-      "version": "19.1.0",
-      "resolved": "https://registry.npmjs.org/react-dom/-/react-dom-19.1.0.tgz",
-      "integrity": "sha512-Xs1hdnE+DyKgeHJeJznQmYMIBG3TKIHJJT95Q58nHLSrElKlGQqDTR2HQ9fx5CN/Gk6Vh/kupBTDLU11/nDk/g==",
+      "version": "19.1.1",
+      "resolved": "https://registry.npmjs.org/react-dom/-/react-dom-19.1.1.tgz",
+      "integrity": "sha512-Dlq/5LAZgF0Gaz6yiqZCf6VCcZs1ghAJyrsu84Q/GT0gV+mCxbfmKNoGRKBYMJ8IEdGPqu49YWXD02GCknEDkw==",
       "license": "MIT",
       "dependencies": {
         "scheduler": "^0.26.0"
       },
       "peerDependencies": {
-        "react": "^19.1.0"
+        "react": "^19.1.1"
       }
     },
     "node_modules/react-is": {
diff --git a/llama_stack/ui/package.json b/llama_stack/ui/package.json
index b37ff233f..558a9fe2f 100644
--- a/llama_stack/ui/package.json
+++ b/llama_stack/ui/package.json
@@ -29,7 +29,7 @@
     "next-auth": "^4.24.11",
     "next-themes": "^0.4.6",
     "react": "^19.0.0",
-    "react-dom": "^19.0.0",
+    "react-dom": "^19.1.1",
     "react-markdown": "^10.1.0",
     "remark-gfm": "^4.0.1",
     "remeda": "^2.30.0",

From 91c7c4570e3abc3f9571795a8fd6ae520a0d9853 Mon Sep 17 00:00:00 2001
From: "dependabot[bot]" <49699333+dependabot[bot]@users.noreply.github.com>
Date: Mon, 8 Sep 2025 09:59:02 +0200
Subject: [PATCH 31/76] chore(ui-deps): bump sonner from 2.0.6 to 2.0.7 in
 /llama_stack/ui (#3364)
MIME-Version: 1.0
Content-Type: text/plain; charset=UTF-8
Content-Transfer-Encoding: 8bit

Bumps [sonner](https://github.com/emilkowalski/sonner) from 2.0.6 to
2.0.7.
<details>
<summary>Release notes</summary>
<p><em>Sourced from <a
href="https://github.com/emilkowalski/sonner/releases">sonner's
releases</a>.</em></p>
<blockquote>
<h2>v2.0.7</h2>
<p>Sonner now supports multiple <code>&lt;Toaster /&gt;</code>
components, see more <a
href="https://sonner.emilkowal.ski/toaster#multiple-toasters">here</a>.</p>
<h2>What's Changed</h2>
<ul>
<li>feat: add testId prop for individual toast components by <a
href="https://github.com/b-like-bahar"><code>@​b-like-bahar</code></a>
in <a
href="https://redirect.github.com/emilkowalski/sonner/pull/660">emilkowalski/sonner#660</a></li>
<li>feat(toaster): add support for multiple toasters with unique
identifiers by <a
href="https://github.com/taroj1205"><code>@​taroj1205</code></a> in <a
href="https://redirect.github.com/emilkowalski/sonner/pull/665">emilkowalski/sonner#665</a></li>
<li>fix: tests by <a
href="https://github.com/emilkowalski"><code>@​emilkowalski</code></a>
in <a
href="https://redirect.github.com/emilkowalski/sonner/pull/677">emilkowalski/sonner#677</a></li>
</ul>
<h2>New Contributors</h2>
<ul>
<li><a
href="https://github.com/b-like-bahar"><code>@​b-like-bahar</code></a>
made their first contribution in <a
href="https://redirect.github.com/emilkowalski/sonner/pull/660">emilkowalski/sonner#660</a></li>
<li><a href="https://github.com/taroj1205"><code>@​taroj1205</code></a>
made their first contribution in <a
href="https://redirect.github.com/emilkowalski/sonner/pull/665">emilkowalski/sonner#665</a></li>
</ul>
<p><strong>Full Changelog</strong>: <a
href="https://github.com/emilkowalski/sonner/compare/v2.0.6...v2.0.7">https://github.com/emilkowalski/sonner/compare/v2.0.6...v2.0.7</a></p>
</blockquote>
</details>
<details>
<summary>Commits</summary>
<ul>
<li><a
href="https://github.com/emilkowalski/sonner/commit/3ba7aa17ab7e8101b9cf4893936f873b0d4769b3"><code>3ba7aa1</code></a>
v2.0.7</li>
<li><a
href="https://github.com/emilkowalski/sonner/commit/06048270633a4f0cb954688d571e7bed2bc597f4"><code>0604827</code></a>
fix: tests (<a
href="https://redirect.github.com/emilkowalski/sonner/issues/677">#677</a>)</li>
<li><a
href="https://github.com/emilkowalski/sonner/commit/c50fe92dfb5bc42163ab418a274c86e47ba8dd5e"><code>c50fe92</code></a>
fix tests</li>
<li><a
href="https://github.com/emilkowalski/sonner/commit/0600a5cb4040e38ac7972f6bcd0895b150e51949"><code>0600a5c</code></a>
feat(toaster): add support for multiple toasters with unique identifiers
(<a
href="https://redirect.github.com/emilkowalski/sonner/issues/665">#665</a>)</li>
<li><a
href="https://github.com/emilkowalski/sonner/commit/c14bf44a0363105c4d2232d426412ba28c7edca6"><code>c14bf44</code></a>
feat: add testId prop for individual toast components (<a
href="https://redirect.github.com/emilkowalski/sonner/issues/660">#660</a>)</li>
<li>See full diff in <a
href="https://github.com/emilkowalski/sonner/compare/v2.0.6...v2.0.7">compare
view</a></li>
</ul>
</details>
<br />


[![Dependabot compatibility
score](https://dependabot-badges.githubapp.com/badges/compatibility_score?dependency-name=sonner&package-manager=npm_and_yarn&previous-version=2.0.6&new-version=2.0.7)](https://docs.github.com/en/github/managing-security-vulnerabilities/about-dependabot-security-updates#about-compatibility-scores)

Dependabot will resolve any conflicts with this PR as long as you don't
alter it yourself. You can also trigger a rebase manually by commenting
`@dependabot rebase`.

[//]: # (dependabot-automerge-start)
[//]: # (dependabot-automerge-end)

---

<details>
<summary>Dependabot commands and options</summary>
<br />

You can trigger Dependabot actions by commenting on this PR:
- `@dependabot rebase` will rebase this PR
- `@dependabot recreate` will recreate this PR, overwriting any edits
that have been made to it
- `@dependabot merge` will merge this PR after your CI passes on it
- `@dependabot squash and merge` will squash and merge this PR after
your CI passes on it
- `@dependabot cancel merge` will cancel a previously requested merge
and block automerging
- `@dependabot reopen` will reopen this PR if it is closed
- `@dependabot close` will close this PR and stop Dependabot recreating
it. You can achieve the same result by closing it manually
- `@dependabot show <dependency name> ignore conditions` will show all
of the ignore conditions of the specified dependency
- `@dependabot ignore this major version` will close this PR and stop
Dependabot creating any more for this major version (unless you reopen
the PR or upgrade to it yourself)
- `@dependabot ignore this minor version` will close this PR and stop
Dependabot creating any more for this minor version (unless you reopen
the PR or upgrade to it yourself)
- `@dependabot ignore this dependency` will close this PR and stop
Dependabot creating any more for this dependency (unless you reopen the
PR or upgrade to it yourself)


</details>

Signed-off-by: dependabot[bot] <support@github.com>
Co-authored-by: dependabot[bot] <49699333+dependabot[bot]@users.noreply.github.com>
---
 llama_stack/ui/package-lock.json | 8 ++++----
 llama_stack/ui/package.json      | 2 +-
 2 files changed, 5 insertions(+), 5 deletions(-)

diff --git a/llama_stack/ui/package-lock.json b/llama_stack/ui/package-lock.json
index 05ccdb708..f0ca72e92 100644
--- a/llama_stack/ui/package-lock.json
+++ b/llama_stack/ui/package-lock.json
@@ -29,7 +29,7 @@
         "remark-gfm": "^4.0.1",
         "remeda": "^2.30.0",
         "shiki": "^1.29.2",
-        "sonner": "^2.0.6",
+        "sonner": "^2.0.7",
         "tailwind-merge": "^3.3.1"
       },
       "devDependencies": {
@@ -13285,9 +13285,9 @@
       }
     },
     "node_modules/sonner": {
-      "version": "2.0.6",
-      "resolved": "https://registry.npmjs.org/sonner/-/sonner-2.0.6.tgz",
-      "integrity": "sha512-yHFhk8T/DK3YxjFQXIrcHT1rGEeTLliVzWbO0xN8GberVun2RiBnxAjXAYpZrqwEVHBG9asI/Li8TAAhN9m59Q==",
+      "version": "2.0.7",
+      "resolved": "https://registry.npmjs.org/sonner/-/sonner-2.0.7.tgz",
+      "integrity": "sha512-W6ZN4p58k8aDKA4XPcx2hpIQXBRAgyiWVkYhT7CvK6D3iAu7xjvVyhQHg2/iaKJZ1XVJ4r7XuwGL+WGEK37i9w==",
       "license": "MIT",
       "peerDependencies": {
         "react": "^18.0.0 || ^19.0.0 || ^19.0.0-rc",
diff --git a/llama_stack/ui/package.json b/llama_stack/ui/package.json
index 558a9fe2f..6f35fc83f 100644
--- a/llama_stack/ui/package.json
+++ b/llama_stack/ui/package.json
@@ -34,7 +34,7 @@
     "remark-gfm": "^4.0.1",
     "remeda": "^2.30.0",
     "shiki": "^1.29.2",
-    "sonner": "^2.0.6",
+    "sonner": "^2.0.7",
     "tailwind-merge": "^3.3.1"
   },
   "devDependencies": {

From e508aef320f209d8ed9bb37c64a1fc5be35c05db Mon Sep 17 00:00:00 2001
From: "dependabot[bot]" <49699333+dependabot[bot]@users.noreply.github.com>
Date: Mon, 8 Sep 2025 09:59:24 +0200
Subject: [PATCH 32/76] chore(ui-deps): bump lucide-react from 0.510.0 to
 0.542.0 in /llama_stack/ui (#3363)
MIME-Version: 1.0
Content-Type: text/plain; charset=UTF-8
Content-Transfer-Encoding: 8bit

Bumps
[lucide-react](https://github.com/lucide-icons/lucide/tree/HEAD/packages/lucide-react)
from 0.510.0 to 0.542.0.
<details>
<summary>Release notes</summary>
<p><em>Sourced from <a
href="https://github.com/lucide-icons/lucide/releases">lucide-react's
releases</a>.</em></p>
<blockquote>
<h2>Version 0.542.0</h2>
<h2>What's Changed</h2>
<ul>
<li>feat(docs): add MDN Web Docs &amp; Nuxt to showcase by <a
href="https://github.com/karsa-mistmere"><code>@​karsa-mistmere</code></a>
in <a
href="https://redirect.github.com/lucide-icons/lucide/pull/3590">lucide-icons/lucide#3590</a></li>
<li>feat(icons): added <code>list-chevrons-down-up</code> icon by <a
href="https://github.com/juliankellydesign"><code>@​juliankellydesign</code></a>
in <a
href="https://redirect.github.com/lucide-icons/lucide/pull/3492">lucide-icons/lucide#3492</a></li>
</ul>
<h2>New Contributors</h2>
<ul>
<li><a
href="https://github.com/juliankellydesign"><code>@​juliankellydesign</code></a>
made their first contribution in <a
href="https://redirect.github.com/lucide-icons/lucide/pull/3492">lucide-icons/lucide#3492</a></li>
</ul>
<p><strong>Full Changelog</strong>: <a
href="https://github.com/lucide-icons/lucide/compare/0.541.0...0.542.0">https://github.com/lucide-icons/lucide/compare/0.541.0...0.542.0</a></p>
<h2>Version 0.541.0</h2>
<h2>What's Changed</h2>
<ul>
<li>feat(packages/lucide): added support for providing a custom root
element by <a
href="https://github.com/karsa-mistmere"><code>@​karsa-mistmere</code></a>
in <a
href="https://redirect.github.com/lucide-icons/lucide/pull/3543">lucide-icons/lucide#3543</a></li>
<li>fix(icons): optimized <code>chrome</code> icon &amp; renamed to
<code>chromium</code> by <a
href="https://github.com/jguddas"><code>@​jguddas</code></a> in <a
href="https://redirect.github.com/lucide-icons/lucide/pull/3572">lucide-icons/lucide#3572</a></li>
<li>fix(icons): changed <code>wallpaper</code> icon by <a
href="https://github.com/jguddas"><code>@​jguddas</code></a> in <a
href="https://redirect.github.com/lucide-icons/lucide/pull/3566">lucide-icons/lucide#3566</a></li>
<li>fix(icons): optimized <code>cog</code> icon by <a
href="https://github.com/jguddas"><code>@​jguddas</code></a> in <a
href="https://redirect.github.com/lucide-icons/lucide/pull/3548">lucide-icons/lucide#3548</a></li>
<li>fix(icons): changed <code>building</code> icon by <a
href="https://github.com/karsa-mistmere"><code>@​karsa-mistmere</code></a>
in <a
href="https://redirect.github.com/lucide-icons/lucide/pull/3510">lucide-icons/lucide#3510</a></li>
<li>feat(dpi-preview): add previous version for easier comparison by <a
href="https://github.com/jguddas"><code>@​jguddas</code></a> in <a
href="https://redirect.github.com/lucide-icons/lucide/pull/3532">lucide-icons/lucide#3532</a></li>
<li>feat(icons): added 'panel-dashed' variants + update tags on existing
icons by <a
href="https://github.com/irvineacosta"><code>@​irvineacosta</code></a>
in <a
href="https://redirect.github.com/lucide-icons/lucide/pull/3500">lucide-icons/lucide#3500</a></li>
</ul>
<p><strong>Full Changelog</strong>: <a
href="https://github.com/lucide-icons/lucide/compare/0.540.0...0.541.0">https://github.com/lucide-icons/lucide/compare/0.540.0...0.541.0</a></p>
<h2>Version 0.540.0</h2>
<h2>What's Changed</h2>
<ul>
<li>fix(license): add full text of Feather license by <a
href="https://github.com/jguddas"><code>@​jguddas</code></a> in <a
href="https://redirect.github.com/lucide-icons/lucide/pull/3530">lucide-icons/lucide#3530</a></li>
<li>fix(icons): changed <code>umbrella</code> icon by <a
href="https://github.com/karsa-mistmere"><code>@​karsa-mistmere</code></a>
in <a
href="https://redirect.github.com/lucide-icons/lucide/pull/3490">lucide-icons/lucide#3490</a></li>
<li>docs(site): added official statement on brand logos in Lucide by <a
href="https://github.com/karsa-mistmere"><code>@​karsa-mistmere</code></a>
in <a
href="https://redirect.github.com/lucide-icons/lucide/pull/3541">lucide-icons/lucide#3541</a></li>
<li>fix(icons): changed <code>camera</code> icon by <a
href="https://github.com/karsa-mistmere"><code>@​karsa-mistmere</code></a>
in <a
href="https://redirect.github.com/lucide-icons/lucide/pull/3539">lucide-icons/lucide#3539</a></li>
<li>feat(icons): added <code>rose</code> icon by <a
href="https://github.com/jguddas"><code>@​jguddas</code></a> in <a
href="https://redirect.github.com/lucide-icons/lucide/pull/1972">lucide-icons/lucide#1972</a></li>
</ul>
<p><strong>Full Changelog</strong>: <a
href="https://github.com/lucide-icons/lucide/compare/0.539.0...0.540.0">https://github.com/lucide-icons/lucide/compare/0.539.0...0.540.0</a></p>
<h2>Version 0.539.0</h2>
<h2>What's Changed</h2>
<ul>
<li>feat(icons): added <code>brick-wall-shield</code> icon by <a
href="https://github.com/karsa-mistmere"><code>@​karsa-mistmere</code></a>
in <a
href="https://redirect.github.com/lucide-icons/lucide/pull/3476">lucide-icons/lucide#3476</a></li>
</ul>
<p><strong>Full Changelog</strong>: <a
href="https://github.com/lucide-icons/lucide/compare/0.538.0...0.539.0">https://github.com/lucide-icons/lucide/compare/0.538.0...0.539.0</a></p>
<h2>Version 0.538.0</h2>
<h2>What's Changed</h2>
<ul>
<li>fix(icons): changed <code>apple</code> icon by <a
href="https://github.com/karsa-mistmere"><code>@​karsa-mistmere</code></a>
in <a
href="https://redirect.github.com/lucide-icons/lucide/pull/3505">lucide-icons/lucide#3505</a></li>
<li>fix(icons): changed <code>store</code> icon by <a
href="https://github.com/karsa-mistmere"><code>@​karsa-mistmere</code></a>
in <a
href="https://redirect.github.com/lucide-icons/lucide/pull/3501">lucide-icons/lucide#3501</a></li>
<li>fix(icons): changed <code>mic-off</code> icon by <a
href="https://github.com/lieonlion"><code>@​lieonlion</code></a> in <a
href="https://redirect.github.com/lucide-icons/lucide/pull/2823">lucide-icons/lucide#2823</a></li>
<li>chore(deps): bump astro from 5.5.2 to 5.12.8 by <a
href="https://github.com/dependabot"><code>@​dependabot</code></a>[bot]
in <a
href="https://redirect.github.com/lucide-icons/lucide/pull/3523">lucide-icons/lucide#3523</a></li>
<li>fix(icons): deprecate rail-symbol by <a
href="https://github.com/jguddas"><code>@​jguddas</code></a> in <a
href="https://redirect.github.com/lucide-icons/lucide/pull/2862">lucide-icons/lucide#2862</a></li>
<li>feat(icons): added <code>kayak</code> icon by <a
href="https://github.com/jpjacobpadilla"><code>@​jpjacobpadilla</code></a>
in <a
href="https://redirect.github.com/lucide-icons/lucide/pull/3054">lucide-icons/lucide#3054</a></li>
</ul>
<!-- raw HTML omitted -->
</blockquote>
<p>... (truncated)</p>
</details>
<details>
<summary>Commits</summary>
<ul>
<li><a
href="https://github.com/lucide-icons/lucide/commit/e71198d9b3e3db42c02e9006a61289a7766520f6"><code>e71198d</code></a>
chore: icon alias improvements (<a
href="https://github.com/lucide-icons/lucide/tree/HEAD/packages/lucide-react/issues/2861">#2861</a>)</li>
<li><a
href="https://github.com/lucide-icons/lucide/commit/3e644fda2d8763207165d1dc64fdcdc37d40dc71"><code>3e644fd</code></a>
chore(scripts): Refactor scripts to typescript (<a
href="https://github.com/lucide-icons/lucide/tree/HEAD/packages/lucide-react/issues/3316">#3316</a>)</li>
<li><a
href="https://github.com/lucide-icons/lucide/commit/19fa01b5fca2fc4a9cd0a77e4e9a0122b949813b"><code>19fa01b</code></a>
build(deps-dev): bump vite from 6.3.2 to 6.3.4 (<a
href="https://github.com/lucide-icons/lucide/tree/HEAD/packages/lucide-react/issues/3181">#3181</a>)</li>
<li>See full diff in <a
href="https://github.com/lucide-icons/lucide/commits/0.542.0/packages/lucide-react">compare
view</a></li>
</ul>
</details>
<br />


[![Dependabot compatibility
score](https://dependabot-badges.githubapp.com/badges/compatibility_score?dependency-name=lucide-react&package-manager=npm_and_yarn&previous-version=0.510.0&new-version=0.542.0)](https://docs.github.com/en/github/managing-security-vulnerabilities/about-dependabot-security-updates#about-compatibility-scores)

Dependabot will resolve any conflicts with this PR as long as you don't
alter it yourself. You can also trigger a rebase manually by commenting
`@dependabot rebase`.

[//]: # (dependabot-automerge-start)
[//]: # (dependabot-automerge-end)

---

<details>
<summary>Dependabot commands and options</summary>
<br />

You can trigger Dependabot actions by commenting on this PR:
- `@dependabot rebase` will rebase this PR
- `@dependabot recreate` will recreate this PR, overwriting any edits
that have been made to it
- `@dependabot merge` will merge this PR after your CI passes on it
- `@dependabot squash and merge` will squash and merge this PR after
your CI passes on it
- `@dependabot cancel merge` will cancel a previously requested merge
and block automerging
- `@dependabot reopen` will reopen this PR if it is closed
- `@dependabot close` will close this PR and stop Dependabot recreating
it. You can achieve the same result by closing it manually
- `@dependabot show <dependency name> ignore conditions` will show all
of the ignore conditions of the specified dependency
- `@dependabot ignore this major version` will close this PR and stop
Dependabot creating any more for this major version (unless you reopen
the PR or upgrade to it yourself)
- `@dependabot ignore this minor version` will close this PR and stop
Dependabot creating any more for this minor version (unless you reopen
the PR or upgrade to it yourself)
- `@dependabot ignore this dependency` will close this PR and stop
Dependabot creating any more for this dependency (unless you reopen the
PR or upgrade to it yourself)


</details>

Signed-off-by: dependabot[bot] <support@github.com>
Co-authored-by: dependabot[bot] <49699333+dependabot[bot]@users.noreply.github.com>
---
 llama_stack/ui/package-lock.json | 8 ++++----
 llama_stack/ui/package.json      | 2 +-
 2 files changed, 5 insertions(+), 5 deletions(-)

diff --git a/llama_stack/ui/package-lock.json b/llama_stack/ui/package-lock.json
index f0ca72e92..198b98fdf 100644
--- a/llama_stack/ui/package-lock.json
+++ b/llama_stack/ui/package-lock.json
@@ -19,7 +19,7 @@
         "clsx": "^2.1.1",
         "framer-motion": "^12.23.12",
         "llama-stack-client": "^0.2.20",
-        "lucide-react": "^0.510.0",
+        "lucide-react": "^0.542.0",
         "next": "15.3.3",
         "next-auth": "^4.24.11",
         "next-themes": "^0.4.6",
@@ -10240,9 +10240,9 @@
       "license": "ISC"
     },
     "node_modules/lucide-react": {
-      "version": "0.510.0",
-      "resolved": "https://registry.npmjs.org/lucide-react/-/lucide-react-0.510.0.tgz",
-      "integrity": "sha512-p8SQRAMVh7NhsAIETokSqDrc5CHnDLbV29mMnzaXx+Vc/hnqQzwI2r0FMWCcoTXnbw2KEjy48xwpGdEL+ck06Q==",
+      "version": "0.542.0",
+      "resolved": "https://registry.npmjs.org/lucide-react/-/lucide-react-0.542.0.tgz",
+      "integrity": "sha512-w3hD8/SQB7+lzU2r4VdFyzzOzKnUjTZIF/MQJGSSvni7Llewni4vuViRppfRAa2guOsY5k4jZyxw/i9DQHv+dw==",
       "license": "ISC",
       "peerDependencies": {
         "react": "^16.5.1 || ^17.0.0 || ^18.0.0 || ^19.0.0"
diff --git a/llama_stack/ui/package.json b/llama_stack/ui/package.json
index 6f35fc83f..f892f4f9b 100644
--- a/llama_stack/ui/package.json
+++ b/llama_stack/ui/package.json
@@ -24,7 +24,7 @@
     "clsx": "^2.1.1",
     "framer-motion": "^12.23.12",
     "llama-stack-client": "^0.2.20",
-    "lucide-react": "^0.510.0",
+    "lucide-react": "^0.542.0",
     "next": "15.3.3",
     "next-auth": "^4.24.11",
     "next-themes": "^0.4.6",

From e1b81ce1fc4820480a95471bbe0f504a952110b6 Mon Sep 17 00:00:00 2001
From: "dependabot[bot]" <49699333+dependabot[bot]@users.noreply.github.com>
Date: Mon, 8 Sep 2025 09:59:44 +0200
Subject: [PATCH 33/76] chore(ui-deps): bump @radix-ui/react-dropdown-menu from
 2.1.14 to 2.1.16 in /llama_stack/ui (#3361)

Bumps
[@radix-ui/react-dropdown-menu](https://github.com/radix-ui/primitives)
from 2.1.14 to 2.1.16.
<details>
<summary>Commits</summary>
<ul>
<li>See full diff in <a
href="https://github.com/radix-ui/primitives/commits">compare
view</a></li>
</ul>
</details>
<br />


[![Dependabot compatibility
score](https://dependabot-badges.githubapp.com/badges/compatibility_score?dependency-name=@radix-ui/react-dropdown-menu&package-manager=npm_and_yarn&previous-version=2.1.14&new-version=2.1.16)](https://docs.github.com/en/github/managing-security-vulnerabilities/about-dependabot-security-updates#about-compatibility-scores)

Dependabot will resolve any conflicts with this PR as long as you don't
alter it yourself. You can also trigger a rebase manually by commenting
`@dependabot rebase`.

[//]: # (dependabot-automerge-start)
[//]: # (dependabot-automerge-end)

---

<details>
<summary>Dependabot commands and options</summary>
<br />

You can trigger Dependabot actions by commenting on this PR:
- `@dependabot rebase` will rebase this PR
- `@dependabot recreate` will recreate this PR, overwriting any edits
that have been made to it
- `@dependabot merge` will merge this PR after your CI passes on it
- `@dependabot squash and merge` will squash and merge this PR after
your CI passes on it
- `@dependabot cancel merge` will cancel a previously requested merge
and block automerging
- `@dependabot reopen` will reopen this PR if it is closed
- `@dependabot close` will close this PR and stop Dependabot recreating
it. You can achieve the same result by closing it manually
- `@dependabot show <dependency name> ignore conditions` will show all
of the ignore conditions of the specified dependency
- `@dependabot ignore this major version` will close this PR and stop
Dependabot creating any more for this major version (unless you reopen
the PR or upgrade to it yourself)
- `@dependabot ignore this minor version` will close this PR and stop
Dependabot creating any more for this minor version (unless you reopen
the PR or upgrade to it yourself)
- `@dependabot ignore this dependency` will close this PR and stop
Dependabot creating any more for this dependency (unless you reopen the
PR or upgrade to it yourself)


</details>

Signed-off-by: dependabot[bot] <support@github.com>
Co-authored-by: dependabot[bot] <49699333+dependabot[bot]@users.noreply.github.com>
---
 llama_stack/ui/package-lock.json | 443 ++++++++++++++++++++-----------
 llama_stack/ui/package.json      |   2 +-
 2 files changed, 288 insertions(+), 157 deletions(-)

diff --git a/llama_stack/ui/package-lock.json b/llama_stack/ui/package-lock.json
index 198b98fdf..cbe8e5557 100644
--- a/llama_stack/ui/package-lock.json
+++ b/llama_stack/ui/package-lock.json
@@ -10,7 +10,7 @@
       "dependencies": {
         "@radix-ui/react-collapsible": "^1.1.12",
         "@radix-ui/react-dialog": "^1.1.13",
-        "@radix-ui/react-dropdown-menu": "^2.1.14",
+        "@radix-ui/react-dropdown-menu": "^2.1.16",
         "@radix-ui/react-select": "^2.2.5",
         "@radix-ui/react-separator": "^1.1.7",
         "@radix-ui/react-slot": "^1.2.3",
@@ -2066,12 +2066,35 @@
       "license": "MIT"
     },
     "node_modules/@radix-ui/react-arrow": {
-      "version": "1.1.6",
-      "resolved": "https://registry.npmjs.org/@radix-ui/react-arrow/-/react-arrow-1.1.6.tgz",
-      "integrity": "sha512-2JMfHJf/eVnwq+2dewT3C0acmCWD3XiVA1Da+jTDqo342UlU13WvXtqHhG+yJw5JeQmu4ue2eMy6gcEArLBlcw==",
+      "version": "1.1.7",
+      "resolved": "https://registry.npmjs.org/@radix-ui/react-arrow/-/react-arrow-1.1.7.tgz",
+      "integrity": "sha512-F+M1tLhO+mlQaOWspE8Wstg+z6PwxwRd8oQ8IXceWz92kfAmalTRf0EjrouQeo7QssEPfCn05B4Ihs1K9WQ/7w==",
       "license": "MIT",
       "dependencies": {
-        "@radix-ui/react-primitive": "2.1.2"
+        "@radix-ui/react-primitive": "2.1.3"
+      },
+      "peerDependencies": {
+        "@types/react": "*",
+        "@types/react-dom": "*",
+        "react": "^16.8 || ^17.0 || ^18.0 || ^19.0 || ^19.0.0-rc",
+        "react-dom": "^16.8 || ^17.0 || ^18.0 || ^19.0 || ^19.0.0-rc"
+      },
+      "peerDependenciesMeta": {
+        "@types/react": {
+          "optional": true
+        },
+        "@types/react-dom": {
+          "optional": true
+        }
+      }
+    },
+    "node_modules/@radix-ui/react-arrow/node_modules/@radix-ui/react-primitive": {
+      "version": "2.1.3",
+      "resolved": "https://registry.npmjs.org/@radix-ui/react-primitive/-/react-primitive-2.1.3.tgz",
+      "integrity": "sha512-m9gTwRkhy2lvCPe6QJp4d3G1TYEUHn/FzJUtq9MjH46an1wJU+GdoGC5VLof8RX8Ft/DlpshApkhswDLZzHIcQ==",
+      "license": "MIT",
+      "dependencies": {
+        "@radix-ui/react-slot": "1.2.3"
       },
       "peerDependencies": {
         "@types/react": "*",
@@ -2172,15 +2195,15 @@
       }
     },
     "node_modules/@radix-ui/react-collection": {
-      "version": "1.1.6",
-      "resolved": "https://registry.npmjs.org/@radix-ui/react-collection/-/react-collection-1.1.6.tgz",
-      "integrity": "sha512-PbhRFK4lIEw9ADonj48tiYWzkllz81TM7KVYyyMMw2cwHO7D5h4XKEblL8NlaRisTK3QTe6tBEhDccFUryxHBQ==",
+      "version": "1.1.7",
+      "resolved": "https://registry.npmjs.org/@radix-ui/react-collection/-/react-collection-1.1.7.tgz",
+      "integrity": "sha512-Fh9rGN0MoI4ZFUNyfFVNU4y9LUz93u9/0K+yLgA2bwRojxM8JU1DyvvMBabnZPBgMWREAJvU2jjVzq+LrFUglw==",
       "license": "MIT",
       "dependencies": {
         "@radix-ui/react-compose-refs": "1.1.2",
         "@radix-ui/react-context": "1.1.2",
-        "@radix-ui/react-primitive": "2.1.2",
-        "@radix-ui/react-slot": "1.2.2"
+        "@radix-ui/react-primitive": "2.1.3",
+        "@radix-ui/react-slot": "1.2.3"
       },
       "peerDependencies": {
         "@types/react": "*",
@@ -2197,21 +2220,26 @@
         }
       }
     },
-    "node_modules/@radix-ui/react-collection/node_modules/@radix-ui/react-slot": {
-      "version": "1.2.2",
-      "resolved": "https://registry.npmjs.org/@radix-ui/react-slot/-/react-slot-1.2.2.tgz",
-      "integrity": "sha512-y7TBO4xN4Y94FvcWIOIh18fM4R1A8S4q1jhoz4PNzOoHsFcN8pogcFmZrTYAm4F9VRUrWP/Mw7xSKybIeRI+CQ==",
+    "node_modules/@radix-ui/react-collection/node_modules/@radix-ui/react-primitive": {
+      "version": "2.1.3",
+      "resolved": "https://registry.npmjs.org/@radix-ui/react-primitive/-/react-primitive-2.1.3.tgz",
+      "integrity": "sha512-m9gTwRkhy2lvCPe6QJp4d3G1TYEUHn/FzJUtq9MjH46an1wJU+GdoGC5VLof8RX8Ft/DlpshApkhswDLZzHIcQ==",
       "license": "MIT",
       "dependencies": {
-        "@radix-ui/react-compose-refs": "1.1.2"
+        "@radix-ui/react-slot": "1.2.3"
       },
       "peerDependencies": {
         "@types/react": "*",
-        "react": "^16.8 || ^17.0 || ^18.0 || ^19.0 || ^19.0.0-rc"
+        "@types/react-dom": "*",
+        "react": "^16.8 || ^17.0 || ^18.0 || ^19.0 || ^19.0.0-rc",
+        "react-dom": "^16.8 || ^17.0 || ^18.0 || ^19.0 || ^19.0.0-rc"
       },
       "peerDependenciesMeta": {
         "@types/react": {
           "optional": true
+        },
+        "@types/react-dom": {
+          "optional": true
         }
       }
     },
@@ -2342,17 +2370,17 @@
       }
     },
     "node_modules/@radix-ui/react-dropdown-menu": {
-      "version": "2.1.14",
-      "resolved": "https://registry.npmjs.org/@radix-ui/react-dropdown-menu/-/react-dropdown-menu-2.1.14.tgz",
-      "integrity": "sha512-lzuyNjoWOoaMFE/VC5FnAAYM16JmQA8ZmucOXtlhm2kKR5TSU95YLAueQ4JYuRmUJmBvSqXaVFGIfuukybwZJQ==",
+      "version": "2.1.16",
+      "resolved": "https://registry.npmjs.org/@radix-ui/react-dropdown-menu/-/react-dropdown-menu-2.1.16.tgz",
+      "integrity": "sha512-1PLGQEynI/3OX/ftV54COn+3Sud/Mn8vALg2rWnBLnRaGtJDduNW/22XjlGgPdpcIbiQxjKtb7BkcjP00nqfJw==",
       "license": "MIT",
       "dependencies": {
-        "@radix-ui/primitive": "1.1.2",
+        "@radix-ui/primitive": "1.1.3",
         "@radix-ui/react-compose-refs": "1.1.2",
         "@radix-ui/react-context": "1.1.2",
         "@radix-ui/react-id": "1.1.1",
-        "@radix-ui/react-menu": "2.1.14",
-        "@radix-ui/react-primitive": "2.1.2",
+        "@radix-ui/react-menu": "2.1.16",
+        "@radix-ui/react-primitive": "2.1.3",
         "@radix-ui/react-use-controllable-state": "1.2.2"
       },
       "peerDependencies": {
@@ -2370,6 +2398,35 @@
         }
       }
     },
+    "node_modules/@radix-ui/react-dropdown-menu/node_modules/@radix-ui/primitive": {
+      "version": "1.1.3",
+      "resolved": "https://registry.npmjs.org/@radix-ui/primitive/-/primitive-1.1.3.tgz",
+      "integrity": "sha512-JTF99U/6XIjCBo0wqkU5sK10glYe27MRRsfwoiq5zzOEZLHU3A3KCMa5X/azekYRCJ0HlwI0crAXS/5dEHTzDg==",
+      "license": "MIT"
+    },
+    "node_modules/@radix-ui/react-dropdown-menu/node_modules/@radix-ui/react-primitive": {
+      "version": "2.1.3",
+      "resolved": "https://registry.npmjs.org/@radix-ui/react-primitive/-/react-primitive-2.1.3.tgz",
+      "integrity": "sha512-m9gTwRkhy2lvCPe6QJp4d3G1TYEUHn/FzJUtq9MjH46an1wJU+GdoGC5VLof8RX8Ft/DlpshApkhswDLZzHIcQ==",
+      "license": "MIT",
+      "dependencies": {
+        "@radix-ui/react-slot": "1.2.3"
+      },
+      "peerDependencies": {
+        "@types/react": "*",
+        "@types/react-dom": "*",
+        "react": "^16.8 || ^17.0 || ^18.0 || ^19.0 || ^19.0.0-rc",
+        "react-dom": "^16.8 || ^17.0 || ^18.0 || ^19.0 || ^19.0.0-rc"
+      },
+      "peerDependenciesMeta": {
+        "@types/react": {
+          "optional": true
+        },
+        "@types/react-dom": {
+          "optional": true
+        }
+      }
+    },
     "node_modules/@radix-ui/react-focus-guards": {
       "version": "1.1.2",
       "resolved": "https://registry.npmjs.org/@radix-ui/react-focus-guards/-/react-focus-guards-1.1.2.tgz",
@@ -2429,26 +2486,26 @@
       }
     },
     "node_modules/@radix-ui/react-menu": {
-      "version": "2.1.14",
-      "resolved": "https://registry.npmjs.org/@radix-ui/react-menu/-/react-menu-2.1.14.tgz",
-      "integrity": "sha512-0zSiBAIFq9GSKoSH5PdEaQeRB3RnEGxC+H2P0egtnKoKKLNBH8VBHyVO6/jskhjAezhOIplyRUj7U2lds9A+Yg==",
+      "version": "2.1.16",
+      "resolved": "https://registry.npmjs.org/@radix-ui/react-menu/-/react-menu-2.1.16.tgz",
+      "integrity": "sha512-72F2T+PLlphrqLcAotYPp0uJMr5SjP5SL01wfEspJbru5Zs5vQaSHb4VB3ZMJPimgHHCHG7gMOeOB9H3Hdmtxg==",
       "license": "MIT",
       "dependencies": {
-        "@radix-ui/primitive": "1.1.2",
-        "@radix-ui/react-collection": "1.1.6",
+        "@radix-ui/primitive": "1.1.3",
+        "@radix-ui/react-collection": "1.1.7",
         "@radix-ui/react-compose-refs": "1.1.2",
         "@radix-ui/react-context": "1.1.2",
         "@radix-ui/react-direction": "1.1.1",
-        "@radix-ui/react-dismissable-layer": "1.1.9",
-        "@radix-ui/react-focus-guards": "1.1.2",
-        "@radix-ui/react-focus-scope": "1.1.6",
+        "@radix-ui/react-dismissable-layer": "1.1.11",
+        "@radix-ui/react-focus-guards": "1.1.3",
+        "@radix-ui/react-focus-scope": "1.1.7",
         "@radix-ui/react-id": "1.1.1",
-        "@radix-ui/react-popper": "1.2.6",
-        "@radix-ui/react-portal": "1.1.8",
-        "@radix-ui/react-presence": "1.1.4",
-        "@radix-ui/react-primitive": "2.1.2",
-        "@radix-ui/react-roving-focus": "1.1.9",
-        "@radix-ui/react-slot": "1.2.2",
+        "@radix-ui/react-popper": "1.2.8",
+        "@radix-ui/react-portal": "1.1.9",
+        "@radix-ui/react-presence": "1.1.5",
+        "@radix-ui/react-primitive": "2.1.3",
+        "@radix-ui/react-roving-focus": "1.1.11",
+        "@radix-ui/react-slot": "1.2.3",
         "@radix-ui/react-use-callback-ref": "1.1.1",
         "aria-hidden": "^1.2.4",
         "react-remove-scroll": "^2.6.3"
@@ -2468,14 +2525,44 @@
         }
       }
     },
-    "node_modules/@radix-ui/react-menu/node_modules/@radix-ui/react-slot": {
-      "version": "1.2.2",
-      "resolved": "https://registry.npmjs.org/@radix-ui/react-slot/-/react-slot-1.2.2.tgz",
-      "integrity": "sha512-y7TBO4xN4Y94FvcWIOIh18fM4R1A8S4q1jhoz4PNzOoHsFcN8pogcFmZrTYAm4F9VRUrWP/Mw7xSKybIeRI+CQ==",
+    "node_modules/@radix-ui/react-menu/node_modules/@radix-ui/primitive": {
+      "version": "1.1.3",
+      "resolved": "https://registry.npmjs.org/@radix-ui/primitive/-/primitive-1.1.3.tgz",
+      "integrity": "sha512-JTF99U/6XIjCBo0wqkU5sK10glYe27MRRsfwoiq5zzOEZLHU3A3KCMa5X/azekYRCJ0HlwI0crAXS/5dEHTzDg==",
+      "license": "MIT"
+    },
+    "node_modules/@radix-ui/react-menu/node_modules/@radix-ui/react-dismissable-layer": {
+      "version": "1.1.11",
+      "resolved": "https://registry.npmjs.org/@radix-ui/react-dismissable-layer/-/react-dismissable-layer-1.1.11.tgz",
+      "integrity": "sha512-Nqcp+t5cTB8BinFkZgXiMJniQH0PsUt2k51FUhbdfeKvc4ACcG2uQniY/8+h1Yv6Kza4Q7lD7PQV0z0oicE0Mg==",
       "license": "MIT",
       "dependencies": {
-        "@radix-ui/react-compose-refs": "1.1.2"
+        "@radix-ui/primitive": "1.1.3",
+        "@radix-ui/react-compose-refs": "1.1.2",
+        "@radix-ui/react-primitive": "2.1.3",
+        "@radix-ui/react-use-callback-ref": "1.1.1",
+        "@radix-ui/react-use-escape-keydown": "1.1.1"
       },
+      "peerDependencies": {
+        "@types/react": "*",
+        "@types/react-dom": "*",
+        "react": "^16.8 || ^17.0 || ^18.0 || ^19.0 || ^19.0.0-rc",
+        "react-dom": "^16.8 || ^17.0 || ^18.0 || ^19.0 || ^19.0.0-rc"
+      },
+      "peerDependenciesMeta": {
+        "@types/react": {
+          "optional": true
+        },
+        "@types/react-dom": {
+          "optional": true
+        }
+      }
+    },
+    "node_modules/@radix-ui/react-menu/node_modules/@radix-ui/react-focus-guards": {
+      "version": "1.1.3",
+      "resolved": "https://registry.npmjs.org/@radix-ui/react-focus-guards/-/react-focus-guards-1.1.3.tgz",
+      "integrity": "sha512-0rFg/Rj2Q62NCm62jZw0QX7a3sz6QCQU0LpZdNrJX8byRGaGVTqbrW9jAoIAHyMQqsNpeZ81YgSizOt5WXq0Pw==",
+      "license": "MIT",
       "peerDependencies": {
         "@types/react": "*",
         "react": "^16.8 || ^17.0 || ^18.0 || ^19.0 || ^19.0.0-rc"
@@ -2486,17 +2573,113 @@
         }
       }
     },
+    "node_modules/@radix-ui/react-menu/node_modules/@radix-ui/react-focus-scope": {
+      "version": "1.1.7",
+      "resolved": "https://registry.npmjs.org/@radix-ui/react-focus-scope/-/react-focus-scope-1.1.7.tgz",
+      "integrity": "sha512-t2ODlkXBQyn7jkl6TNaw/MtVEVvIGelJDCG41Okq/KwUsJBwQ4XVZsHAVUkK4mBv3ewiAS3PGuUWuY2BoK4ZUw==",
+      "license": "MIT",
+      "dependencies": {
+        "@radix-ui/react-compose-refs": "1.1.2",
+        "@radix-ui/react-primitive": "2.1.3",
+        "@radix-ui/react-use-callback-ref": "1.1.1"
+      },
+      "peerDependencies": {
+        "@types/react": "*",
+        "@types/react-dom": "*",
+        "react": "^16.8 || ^17.0 || ^18.0 || ^19.0 || ^19.0.0-rc",
+        "react-dom": "^16.8 || ^17.0 || ^18.0 || ^19.0 || ^19.0.0-rc"
+      },
+      "peerDependenciesMeta": {
+        "@types/react": {
+          "optional": true
+        },
+        "@types/react-dom": {
+          "optional": true
+        }
+      }
+    },
+    "node_modules/@radix-ui/react-menu/node_modules/@radix-ui/react-portal": {
+      "version": "1.1.9",
+      "resolved": "https://registry.npmjs.org/@radix-ui/react-portal/-/react-portal-1.1.9.tgz",
+      "integrity": "sha512-bpIxvq03if6UNwXZ+HTK71JLh4APvnXntDc6XOX8UVq4XQOVl7lwok0AvIl+b8zgCw3fSaVTZMpAPPagXbKmHQ==",
+      "license": "MIT",
+      "dependencies": {
+        "@radix-ui/react-primitive": "2.1.3",
+        "@radix-ui/react-use-layout-effect": "1.1.1"
+      },
+      "peerDependencies": {
+        "@types/react": "*",
+        "@types/react-dom": "*",
+        "react": "^16.8 || ^17.0 || ^18.0 || ^19.0 || ^19.0.0-rc",
+        "react-dom": "^16.8 || ^17.0 || ^18.0 || ^19.0 || ^19.0.0-rc"
+      },
+      "peerDependenciesMeta": {
+        "@types/react": {
+          "optional": true
+        },
+        "@types/react-dom": {
+          "optional": true
+        }
+      }
+    },
+    "node_modules/@radix-ui/react-menu/node_modules/@radix-ui/react-presence": {
+      "version": "1.1.5",
+      "resolved": "https://registry.npmjs.org/@radix-ui/react-presence/-/react-presence-1.1.5.tgz",
+      "integrity": "sha512-/jfEwNDdQVBCNvjkGit4h6pMOzq8bHkopq458dPt2lMjx+eBQUohZNG9A7DtO/O5ukSbxuaNGXMjHicgwy6rQQ==",
+      "license": "MIT",
+      "dependencies": {
+        "@radix-ui/react-compose-refs": "1.1.2",
+        "@radix-ui/react-use-layout-effect": "1.1.1"
+      },
+      "peerDependencies": {
+        "@types/react": "*",
+        "@types/react-dom": "*",
+        "react": "^16.8 || ^17.0 || ^18.0 || ^19.0 || ^19.0.0-rc",
+        "react-dom": "^16.8 || ^17.0 || ^18.0 || ^19.0 || ^19.0.0-rc"
+      },
+      "peerDependenciesMeta": {
+        "@types/react": {
+          "optional": true
+        },
+        "@types/react-dom": {
+          "optional": true
+        }
+      }
+    },
+    "node_modules/@radix-ui/react-menu/node_modules/@radix-ui/react-primitive": {
+      "version": "2.1.3",
+      "resolved": "https://registry.npmjs.org/@radix-ui/react-primitive/-/react-primitive-2.1.3.tgz",
+      "integrity": "sha512-m9gTwRkhy2lvCPe6QJp4d3G1TYEUHn/FzJUtq9MjH46an1wJU+GdoGC5VLof8RX8Ft/DlpshApkhswDLZzHIcQ==",
+      "license": "MIT",
+      "dependencies": {
+        "@radix-ui/react-slot": "1.2.3"
+      },
+      "peerDependencies": {
+        "@types/react": "*",
+        "@types/react-dom": "*",
+        "react": "^16.8 || ^17.0 || ^18.0 || ^19.0 || ^19.0.0-rc",
+        "react-dom": "^16.8 || ^17.0 || ^18.0 || ^19.0 || ^19.0.0-rc"
+      },
+      "peerDependenciesMeta": {
+        "@types/react": {
+          "optional": true
+        },
+        "@types/react-dom": {
+          "optional": true
+        }
+      }
+    },
     "node_modules/@radix-ui/react-popper": {
-      "version": "1.2.6",
-      "resolved": "https://registry.npmjs.org/@radix-ui/react-popper/-/react-popper-1.2.6.tgz",
-      "integrity": "sha512-7iqXaOWIjDBfIG7aq8CUEeCSsQMLFdn7VEE8TaFz704DtEzpPHR7w/uuzRflvKgltqSAImgcmxQ7fFX3X7wasg==",
+      "version": "1.2.8",
+      "resolved": "https://registry.npmjs.org/@radix-ui/react-popper/-/react-popper-1.2.8.tgz",
+      "integrity": "sha512-0NJQ4LFFUuWkE7Oxf0htBKS6zLkkjBH+hM1uk7Ng705ReR8m/uelduy1DBo0PyBXPKVnBA6YBlU94MBGXrSBCw==",
       "license": "MIT",
       "dependencies": {
         "@floating-ui/react-dom": "^2.0.0",
-        "@radix-ui/react-arrow": "1.1.6",
+        "@radix-ui/react-arrow": "1.1.7",
         "@radix-ui/react-compose-refs": "1.1.2",
         "@radix-ui/react-context": "1.1.2",
-        "@radix-ui/react-primitive": "2.1.2",
+        "@radix-ui/react-primitive": "2.1.3",
         "@radix-ui/react-use-callback-ref": "1.1.1",
         "@radix-ui/react-use-layout-effect": "1.1.1",
         "@radix-ui/react-use-rect": "1.1.1",
@@ -2518,6 +2701,29 @@
         }
       }
     },
+    "node_modules/@radix-ui/react-popper/node_modules/@radix-ui/react-primitive": {
+      "version": "2.1.3",
+      "resolved": "https://registry.npmjs.org/@radix-ui/react-primitive/-/react-primitive-2.1.3.tgz",
+      "integrity": "sha512-m9gTwRkhy2lvCPe6QJp4d3G1TYEUHn/FzJUtq9MjH46an1wJU+GdoGC5VLof8RX8Ft/DlpshApkhswDLZzHIcQ==",
+      "license": "MIT",
+      "dependencies": {
+        "@radix-ui/react-slot": "1.2.3"
+      },
+      "peerDependencies": {
+        "@types/react": "*",
+        "@types/react-dom": "*",
+        "react": "^16.8 || ^17.0 || ^18.0 || ^19.0 || ^19.0.0-rc",
+        "react-dom": "^16.8 || ^17.0 || ^18.0 || ^19.0 || ^19.0.0-rc"
+      },
+      "peerDependenciesMeta": {
+        "@types/react": {
+          "optional": true
+        },
+        "@types/react-dom": {
+          "optional": true
+        }
+      }
+    },
     "node_modules/@radix-ui/react-portal": {
       "version": "1.1.8",
       "resolved": "https://registry.npmjs.org/@radix-ui/react-portal/-/react-portal-1.1.8.tgz",
@@ -2608,18 +2814,18 @@
       }
     },
     "node_modules/@radix-ui/react-roving-focus": {
-      "version": "1.1.9",
-      "resolved": "https://registry.npmjs.org/@radix-ui/react-roving-focus/-/react-roving-focus-1.1.9.tgz",
-      "integrity": "sha512-ZzrIFnMYHHCNqSNCsuN6l7wlewBEq0O0BCSBkabJMFXVO51LRUTq71gLP1UxFvmrXElqmPjA5VX7IqC9VpazAQ==",
+      "version": "1.1.11",
+      "resolved": "https://registry.npmjs.org/@radix-ui/react-roving-focus/-/react-roving-focus-1.1.11.tgz",
+      "integrity": "sha512-7A6S9jSgm/S+7MdtNDSb+IU859vQqJ/QAtcYQcfFC6W8RS4IxIZDldLR0xqCFZ6DCyrQLjLPsxtTNch5jVA4lA==",
       "license": "MIT",
       "dependencies": {
-        "@radix-ui/primitive": "1.1.2",
-        "@radix-ui/react-collection": "1.1.6",
+        "@radix-ui/primitive": "1.1.3",
+        "@radix-ui/react-collection": "1.1.7",
         "@radix-ui/react-compose-refs": "1.1.2",
         "@radix-ui/react-context": "1.1.2",
         "@radix-ui/react-direction": "1.1.1",
         "@radix-ui/react-id": "1.1.1",
-        "@radix-ui/react-primitive": "2.1.2",
+        "@radix-ui/react-primitive": "2.1.3",
         "@radix-ui/react-use-callback-ref": "1.1.1",
         "@radix-ui/react-use-controllable-state": "1.2.2"
       },
@@ -2638,6 +2844,35 @@
         }
       }
     },
+    "node_modules/@radix-ui/react-roving-focus/node_modules/@radix-ui/primitive": {
+      "version": "1.1.3",
+      "resolved": "https://registry.npmjs.org/@radix-ui/primitive/-/primitive-1.1.3.tgz",
+      "integrity": "sha512-JTF99U/6XIjCBo0wqkU5sK10glYe27MRRsfwoiq5zzOEZLHU3A3KCMa5X/azekYRCJ0HlwI0crAXS/5dEHTzDg==",
+      "license": "MIT"
+    },
+    "node_modules/@radix-ui/react-roving-focus/node_modules/@radix-ui/react-primitive": {
+      "version": "2.1.3",
+      "resolved": "https://registry.npmjs.org/@radix-ui/react-primitive/-/react-primitive-2.1.3.tgz",
+      "integrity": "sha512-m9gTwRkhy2lvCPe6QJp4d3G1TYEUHn/FzJUtq9MjH46an1wJU+GdoGC5VLof8RX8Ft/DlpshApkhswDLZzHIcQ==",
+      "license": "MIT",
+      "dependencies": {
+        "@radix-ui/react-slot": "1.2.3"
+      },
+      "peerDependencies": {
+        "@types/react": "*",
+        "@types/react-dom": "*",
+        "react": "^16.8 || ^17.0 || ^18.0 || ^19.0 || ^19.0.0-rc",
+        "react-dom": "^16.8 || ^17.0 || ^18.0 || ^19.0 || ^19.0.0-rc"
+      },
+      "peerDependenciesMeta": {
+        "@types/react": {
+          "optional": true
+        },
+        "@types/react-dom": {
+          "optional": true
+        }
+      }
+    },
     "node_modules/@radix-ui/react-select": {
       "version": "2.2.5",
       "resolved": "https://registry.npmjs.org/@radix-ui/react-select/-/react-select-2.2.5.tgz",
@@ -2681,55 +2916,6 @@
         }
       }
     },
-    "node_modules/@radix-ui/react-select/node_modules/@radix-ui/react-arrow": {
-      "version": "1.1.7",
-      "resolved": "https://registry.npmjs.org/@radix-ui/react-arrow/-/react-arrow-1.1.7.tgz",
-      "integrity": "sha512-F+M1tLhO+mlQaOWspE8Wstg+z6PwxwRd8oQ8IXceWz92kfAmalTRf0EjrouQeo7QssEPfCn05B4Ihs1K9WQ/7w==",
-      "license": "MIT",
-      "dependencies": {
-        "@radix-ui/react-primitive": "2.1.3"
-      },
-      "peerDependencies": {
-        "@types/react": "*",
-        "@types/react-dom": "*",
-        "react": "^16.8 || ^17.0 || ^18.0 || ^19.0 || ^19.0.0-rc",
-        "react-dom": "^16.8 || ^17.0 || ^18.0 || ^19.0 || ^19.0.0-rc"
-      },
-      "peerDependenciesMeta": {
-        "@types/react": {
-          "optional": true
-        },
-        "@types/react-dom": {
-          "optional": true
-        }
-      }
-    },
-    "node_modules/@radix-ui/react-select/node_modules/@radix-ui/react-collection": {
-      "version": "1.1.7",
-      "resolved": "https://registry.npmjs.org/@radix-ui/react-collection/-/react-collection-1.1.7.tgz",
-      "integrity": "sha512-Fh9rGN0MoI4ZFUNyfFVNU4y9LUz93u9/0K+yLgA2bwRojxM8JU1DyvvMBabnZPBgMWREAJvU2jjVzq+LrFUglw==",
-      "license": "MIT",
-      "dependencies": {
-        "@radix-ui/react-compose-refs": "1.1.2",
-        "@radix-ui/react-context": "1.1.2",
-        "@radix-ui/react-primitive": "2.1.3",
-        "@radix-ui/react-slot": "1.2.3"
-      },
-      "peerDependencies": {
-        "@types/react": "*",
-        "@types/react-dom": "*",
-        "react": "^16.8 || ^17.0 || ^18.0 || ^19.0 || ^19.0.0-rc",
-        "react-dom": "^16.8 || ^17.0 || ^18.0 || ^19.0 || ^19.0.0-rc"
-      },
-      "peerDependenciesMeta": {
-        "@types/react": {
-          "optional": true
-        },
-        "@types/react-dom": {
-          "optional": true
-        }
-      }
-    },
     "node_modules/@radix-ui/react-select/node_modules/@radix-ui/react-dismissable-layer": {
       "version": "1.1.10",
       "resolved": "https://registry.npmjs.org/@radix-ui/react-dismissable-layer/-/react-dismissable-layer-1.1.10.tgz",
@@ -2965,29 +3151,6 @@
       "integrity": "sha512-JTF99U/6XIjCBo0wqkU5sK10glYe27MRRsfwoiq5zzOEZLHU3A3KCMa5X/azekYRCJ0HlwI0crAXS/5dEHTzDg==",
       "license": "MIT"
     },
-    "node_modules/@radix-ui/react-tooltip/node_modules/@radix-ui/react-arrow": {
-      "version": "1.1.7",
-      "resolved": "https://registry.npmjs.org/@radix-ui/react-arrow/-/react-arrow-1.1.7.tgz",
-      "integrity": "sha512-F+M1tLhO+mlQaOWspE8Wstg+z6PwxwRd8oQ8IXceWz92kfAmalTRf0EjrouQeo7QssEPfCn05B4Ihs1K9WQ/7w==",
-      "license": "MIT",
-      "dependencies": {
-        "@radix-ui/react-primitive": "2.1.3"
-      },
-      "peerDependencies": {
-        "@types/react": "*",
-        "@types/react-dom": "*",
-        "react": "^16.8 || ^17.0 || ^18.0 || ^19.0 || ^19.0.0-rc",
-        "react-dom": "^16.8 || ^17.0 || ^18.0 || ^19.0 || ^19.0.0-rc"
-      },
-      "peerDependenciesMeta": {
-        "@types/react": {
-          "optional": true
-        },
-        "@types/react-dom": {
-          "optional": true
-        }
-      }
-    },
     "node_modules/@radix-ui/react-tooltip/node_modules/@radix-ui/react-dismissable-layer": {
       "version": "1.1.11",
       "resolved": "https://registry.npmjs.org/@radix-ui/react-dismissable-layer/-/react-dismissable-layer-1.1.11.tgz",
@@ -3015,38 +3178,6 @@
         }
       }
     },
-    "node_modules/@radix-ui/react-tooltip/node_modules/@radix-ui/react-popper": {
-      "version": "1.2.8",
-      "resolved": "https://registry.npmjs.org/@radix-ui/react-popper/-/react-popper-1.2.8.tgz",
-      "integrity": "sha512-0NJQ4LFFUuWkE7Oxf0htBKS6zLkkjBH+hM1uk7Ng705ReR8m/uelduy1DBo0PyBXPKVnBA6YBlU94MBGXrSBCw==",
-      "license": "MIT",
-      "dependencies": {
-        "@floating-ui/react-dom": "^2.0.0",
-        "@radix-ui/react-arrow": "1.1.7",
-        "@radix-ui/react-compose-refs": "1.1.2",
-        "@radix-ui/react-context": "1.1.2",
-        "@radix-ui/react-primitive": "2.1.3",
-        "@radix-ui/react-use-callback-ref": "1.1.1",
-        "@radix-ui/react-use-layout-effect": "1.1.1",
-        "@radix-ui/react-use-rect": "1.1.1",
-        "@radix-ui/react-use-size": "1.1.1",
-        "@radix-ui/rect": "1.1.1"
-      },
-      "peerDependencies": {
-        "@types/react": "*",
-        "@types/react-dom": "*",
-        "react": "^16.8 || ^17.0 || ^18.0 || ^19.0 || ^19.0.0-rc",
-        "react-dom": "^16.8 || ^17.0 || ^18.0 || ^19.0 || ^19.0.0-rc"
-      },
-      "peerDependenciesMeta": {
-        "@types/react": {
-          "optional": true
-        },
-        "@types/react-dom": {
-          "optional": true
-        }
-      }
-    },
     "node_modules/@radix-ui/react-tooltip/node_modules/@radix-ui/react-portal": {
       "version": "1.1.9",
       "resolved": "https://registry.npmjs.org/@radix-ui/react-portal/-/react-portal-1.1.9.tgz",
diff --git a/llama_stack/ui/package.json b/llama_stack/ui/package.json
index f892f4f9b..e817e9ae3 100644
--- a/llama_stack/ui/package.json
+++ b/llama_stack/ui/package.json
@@ -15,7 +15,7 @@
   "dependencies": {
     "@radix-ui/react-collapsible": "^1.1.12",
     "@radix-ui/react-dialog": "^1.1.13",
-    "@radix-ui/react-dropdown-menu": "^2.1.14",
+    "@radix-ui/react-dropdown-menu": "^2.1.16",
     "@radix-ui/react-select": "^2.2.5",
     "@radix-ui/react-separator": "^1.1.7",
     "@radix-ui/react-slot": "^1.2.3",

From 51012a82a38e6b8aa2b31907487cacbfd1d8b645 Mon Sep 17 00:00:00 2001
From: "dependabot[bot]" <49699333+dependabot[bot]@users.noreply.github.com>
Date: Mon, 8 Sep 2025 10:00:41 +0200
Subject: [PATCH 34/76] chore(github-deps): bump astral-sh/setup-uv from 6.6.0
 to 6.6.1 (#3355)
MIME-Version: 1.0
Content-Type: text/plain; charset=UTF-8
Content-Transfer-Encoding: 8bit

Bumps [astral-sh/setup-uv](https://github.com/astral-sh/setup-uv) from
6.6.0 to 6.6.1.
<details>
<summary>Release notes</summary>
<p><em>Sourced from <a
href="https://github.com/astral-sh/setup-uv/releases">astral-sh/setup-uv's
releases</a>.</em></p>
<blockquote>
<h2>v6.6.1 🌈 Fix exclusions in cache-dependency-glob</h2>
<h2>Changes</h2>
<p>Exclusions with a leading <code>!</code> in the <a
href="https://github.com/astral-sh/setup-uv?tab=readme-ov-file#cache-dependency-glob">cache-dependency-glob</a>
did not work and got fixed with this release. Thank you <a
href="https://github.com/KnisterPeter"><code>@​KnisterPeter</code></a>
for raising this!</p>
<h2>🐛 Bug fixes</h2>
<ul>
<li>Fix exclusions in cache-dependency-glob <a
href="https://github.com/eifinger"><code>@​eifinger</code></a> (<a
href="https://redirect.github.com/astral-sh/setup-uv/issues/546">#546</a>)</li>
</ul>
<h2>🧰 Maintenance</h2>
<ul>
<li>Bump dependencies <a
href="https://github.com/eifinger"><code>@​eifinger</code></a> (<a
href="https://redirect.github.com/astral-sh/setup-uv/issues/547">#547</a>)</li>
<li>chore: update known versions for 0.8.14 @<a
href="https://github.com/apps/github-actions">github-actions[bot]</a>
(<a
href="https://redirect.github.com/astral-sh/setup-uv/issues/543">#543</a>)</li>
<li>chore: update known versions for 0.8.13 @<a
href="https://github.com/apps/github-actions">github-actions[bot]</a>
(<a
href="https://redirect.github.com/astral-sh/setup-uv/issues/536">#536</a>)</li>
</ul>
</blockquote>
</details>
<details>
<summary>Commits</summary>
<ul>
<li><a
href="https://github.com/astral-sh/setup-uv/commit/557e51de59eb14aaaba2ed9621916900a91d50c6"><code>557e51d</code></a>
Bump dependencies (<a
href="https://redirect.github.com/astral-sh/setup-uv/issues/547">#547</a>)</li>
<li><a
href="https://github.com/astral-sh/setup-uv/commit/1b46e13ec88163c255691015b7e7afec7535b06a"><code>1b46e13</code></a>
Fix exclusions in cache-dependency-glob (<a
href="https://redirect.github.com/astral-sh/setup-uv/issues/546">#546</a>)</li>
<li><a
href="https://github.com/astral-sh/setup-uv/commit/26cf676705ba2848bf75ebd447bb297a435baee3"><code>26cf676</code></a>
chore: update known versions for 0.8.14 (<a
href="https://redirect.github.com/astral-sh/setup-uv/issues/543">#543</a>)</li>
<li><a
href="https://github.com/astral-sh/setup-uv/commit/4e1e303f7dafb1a3ec7770a507052543f593ad96"><code>4e1e303</code></a>
chore: update known versions for 0.8.13 (<a
href="https://redirect.github.com/astral-sh/setup-uv/issues/536">#536</a>)</li>
<li>See full diff in <a
href="https://github.com/astral-sh/setup-uv/compare/4959332f0f014c5280e7eac8b70c90cb574c9f9b...557e51de59eb14aaaba2ed9621916900a91d50c6">compare
view</a></li>
</ul>
</details>
<br />


[![Dependabot compatibility
score](https://dependabot-badges.githubapp.com/badges/compatibility_score?dependency-name=astral-sh/setup-uv&package-manager=github_actions&previous-version=6.6.0&new-version=6.6.1)](https://docs.github.com/en/github/managing-security-vulnerabilities/about-dependabot-security-updates#about-compatibility-scores)

Dependabot will resolve any conflicts with this PR as long as you don't
alter it yourself. You can also trigger a rebase manually by commenting
`@dependabot rebase`.

[//]: # (dependabot-automerge-start)
[//]: # (dependabot-automerge-end)

---

<details>
<summary>Dependabot commands and options</summary>
<br />

You can trigger Dependabot actions by commenting on this PR:
- `@dependabot rebase` will rebase this PR
- `@dependabot recreate` will recreate this PR, overwriting any edits
that have been made to it
- `@dependabot merge` will merge this PR after your CI passes on it
- `@dependabot squash and merge` will squash and merge this PR after
your CI passes on it
- `@dependabot cancel merge` will cancel a previously requested merge
and block automerging
- `@dependabot reopen` will reopen this PR if it is closed
- `@dependabot close` will close this PR and stop Dependabot recreating
it. You can achieve the same result by closing it manually
- `@dependabot show <dependency name> ignore conditions` will show all
of the ignore conditions of the specified dependency
- `@dependabot ignore this major version` will close this PR and stop
Dependabot creating any more for this major version (unless you reopen
the PR or upgrade to it yourself)
- `@dependabot ignore this minor version` will close this PR and stop
Dependabot creating any more for this minor version (unless you reopen
the PR or upgrade to it yourself)
- `@dependabot ignore this dependency` will close this PR and stop
Dependabot creating any more for this dependency (unless you reopen the
PR or upgrade to it yourself)


</details>

Signed-off-by: dependabot[bot] <support@github.com>
Co-authored-by: dependabot[bot] <49699333+dependabot[bot]@users.noreply.github.com>
---
 .github/workflows/python-build-test.yml | 2 +-
 1 file changed, 1 insertion(+), 1 deletion(-)

diff --git a/.github/workflows/python-build-test.yml b/.github/workflows/python-build-test.yml
index bf9a3e057..00f0950c7 100644
--- a/.github/workflows/python-build-test.yml
+++ b/.github/workflows/python-build-test.yml
@@ -24,7 +24,7 @@ jobs:
       uses: actions/checkout@08c6903cd8c0fde910a37f88322edcfb5dd907a8 # v5.0.0
 
     - name: Install uv
-      uses: astral-sh/setup-uv@4959332f0f014c5280e7eac8b70c90cb574c9f9b # v6.6.0
+      uses: astral-sh/setup-uv@557e51de59eb14aaaba2ed9621916900a91d50c6 # v6.6.1
       with:
         python-version: ${{ matrix.python-version }}
         activate-environment: true

From 2f91344c1faf8fdb10b31d74cba07d46de694382 Mon Sep 17 00:00:00 2001
From: Yuan Tang <terrytangyuan@gmail.com>
Date: Mon, 8 Sep 2025 04:01:41 -0400
Subject: [PATCH 35/76] docs: Update changelog (#3343)

This updates the changelog doc to include the latest updates.

Signed-off-by: Yuan Tang <terrytangyuan@gmail.com>
---
 CHANGELOG.md | 98 ++++++++++++++++++++++++++++++++++++++++++++++++++++
 1 file changed, 98 insertions(+)

diff --git a/CHANGELOG.md b/CHANGELOG.md
index 2f47c3ae3..c51a1b2aa 100644
--- a/CHANGELOG.md
+++ b/CHANGELOG.md
@@ -1,5 +1,103 @@
 # Changelog
 
+# v0.2.20
+Published on: 2025-08-29T22:25:32Z
+
+Here are some key changes that are coming as part of this release.
+
+### Build and Environment
+
+- Environment improvements: fixed env var replacement to preserve types.
+- Docker stability: fixed container startup failures for Fireworks AI provider.
+- Removed absolute paths in build for better portability.
+
+### Features
+
+- UI Enhancements: Implemented file upload and VectorDB creation/configuration directly in UI.
+- Vector Store Improvements: Added keyword, vector, and hybrid search inside vector store.
+- Added S3 authorization support for file providers.
+- SQL Store: Added inequality support to where clause.
+
+### Documentation
+
+- Fixed post-training docs.
+- Added Contributor Guidelines for creating Internal vs. External providers.
+
+### Fixes
+
+- Removed unsupported bfcl scoring function.
+- Multiple reliability and configuration fixes for providers and environment handling.
+
+### Engineering / Chores
+
+- Cleaner internal development setup with consistent paths.
+- Incremental improvements to provider integration and vector store behavior.
+
+
+### New Contributors
+- @omertuc made their first contribution in #3270
+- @r3v5 made their first contribution in vector store hybrid search
+
+---
+
+# v0.2.19
+Published on: 2025-08-26T22:06:55Z
+
+## Highlights
+* feat: Add CORS configuration support for server by @skamenan7 in https://github.com/llamastack/llama-stack/pull/3201
+* feat(api): introduce /rerank by @ehhuang in https://github.com/llamastack/llama-stack/pull/2940
+* feat: Add S3 Files Provider by @mattf in https://github.com/llamastack/llama-stack/pull/3202
+
+
+---
+
+# v0.2.18
+Published on: 2025-08-20T01:09:27Z
+
+## Highlights
+* Add moderations create API
+* Hybrid search in Milvus
+* Numerous Responses API improvements
+* Documentation updates
+
+
+---
+
+# v0.2.17
+Published on: 2025-08-05T01:51:14Z
+
+## Highlights
+
+* feat(tests): introduce inference record/replay to increase test reliability by @ashwinb in https://github.com/meta-llama/llama-stack/pull/2941
+* fix(library_client): improve initialization error handling and prevent AttributeError by @mattf in https://github.com/meta-llama/llama-stack/pull/2944
+* fix: use OLLAMA_URL to activate Ollama provider in starter by @ashwinb in https://github.com/meta-llama/llama-stack/pull/2963
+* feat(UI): adding MVP playground UI by @franciscojavierarceo in https://github.com/meta-llama/llama-stack/pull/2828
+* Standardization of errors (@nathan-weinberg)
+* feat: Enable DPO training with HuggingFace inline provider by @Nehanth in https://github.com/meta-llama/llama-stack/pull/2825
+* chore: rename templates to distributions by @ashwinb in https://github.com/meta-llama/llama-stack/pull/3035
+
+
+---
+
+# v0.2.16
+Published on: 2025-07-28T23:35:23Z
+
+## Highlights
+
+* Automatic model registration for self-hosted providers (ollama and vllm currently). No need for `INFERENCE_MODEL` environment variables which need to be updated, etc.
+* Much simplified starter distribution. Most `ENABLE_` env variables are now gone. When you set `VLLM_URL`, the `vllm` provider is auto-enabled. Similar for `MILVUS_URL`, `PGVECTOR_DB`, etc. Check the [run.yaml](https://github.com/meta-llama/llama-stack/blob/main/llama_stack/templates/starter/run.yaml) for more details.
+* All tests migrated to pytest now (thanks @Elbehery)
+* DPO implementation in the post-training provider (thanks @Nehanth)
+* (Huge!) Support for external APIs and providers thereof (thanks @leseb, @cdoern and others). This is a really big deal -- you can now add more APIs completely out of tree and experiment with them before (optionally) wanting to contribute back.
+* `inline::vllm` provider is gone thank you very much
+* several improvements to OpenAI inference implementations and LiteLLM backend (thanks @mattf)
+* Chroma now supports Vector Store API (thanks @franciscojavierarceo).
+* Authorization improvements: Vector Store/File APIs now supports access control (thanks @franciscojavierarceo); Telemetry read APIs are gated according to logged-in user's roles.
+
+
+
+---
+
 # v0.2.15
 Published on: 2025-07-16T03:30:01Z
 

From 58c61d85c86029bf0935b6f21d1750117ef861ac Mon Sep 17 00:00:00 2001
From: "dependabot[bot]" <49699333+dependabot[bot]@users.noreply.github.com>
Date: Mon, 8 Sep 2025 10:04:41 +0200
Subject: [PATCH 36/76] chore(github-deps): bump actions/stale from 9.1.0 to
 10.0.0 (#3352)
MIME-Version: 1.0
Content-Type: text/plain; charset=UTF-8
Content-Transfer-Encoding: 8bit

Bumps [actions/stale](https://github.com/actions/stale) from 9.1.0 to
10.0.0.
<details>
<summary>Release notes</summary>
<p><em>Sourced from <a
href="https://github.com/actions/stale/releases">actions/stale's
releases</a>.</em></p>
<blockquote>
<h2>v10.0.0</h2>
<h2>What's Changed</h2>
<h3>Breaking Changes</h3>
<ul>
<li>Upgrade to node 24 by <a
href="https://github.com/salmanmkc"><code>@​salmanmkc</code></a> in <a
href="https://redirect.github.com/actions/stale/pull/1279">actions/stale#1279</a>
Make sure your runner is on version v2.327.1 or later to ensure
compatibility with this release. <a
href="https://github.com/actions/runner/releases/tag/v2.327.1">Release
Notes</a></li>
</ul>
<h3>Enhancement</h3>
<ul>
<li>Introducing sort-by option by <a
href="https://github.com/suyashgaonkar"><code>@​suyashgaonkar</code></a>
in <a
href="https://redirect.github.com/actions/stale/pull/1254">actions/stale#1254</a></li>
</ul>
<h3>Dependency Upgrades</h3>
<ul>
<li>Upgrade actions/publish-immutable-action from 0.0.3 to 0.0.4 by <a
href="https://github.com/dependabot"><code>@​dependabot</code></a>[bot]
in <a
href="https://redirect.github.com/actions/stale/pull/1186">actions/stale#1186</a></li>
<li>Upgrade undici from 5.28.4 to 5.28.5 by <a
href="https://github.com/dependabot"><code>@​dependabot</code></a>[bot]
in <a
href="https://redirect.github.com/actions/stale/pull/1201">actions/stale#1201</a></li>
<li>Upgrade <code>@​action/cache</code> from 4.0.0 to 4.0.2 by <a
href="https://github.com/aparnajyothi-y"><code>@​aparnajyothi-y</code></a>
in <a
href="https://redirect.github.com/actions/stale/pull/1226">actions/stale#1226</a></li>
<li>Upgrade <code>@​action/cache</code> from 4.0.2 to 4.0.3 by <a
href="https://github.com/suyashgaonkar"><code>@​suyashgaonkar</code></a>
in <a
href="https://redirect.github.com/actions/stale/pull/1233">actions/stale#1233</a></li>
<li>Upgrade undici from 5.28.5 to 5.29.0 by <a
href="https://github.com/dependabot"><code>@​dependabot</code></a>[bot]
in <a
href="https://redirect.github.com/actions/stale/pull/1251">actions/stale#1251</a></li>
<li>Upgrade form-data to bring in fix for critical vulnerability by <a
href="https://github.com/gowridurgad"><code>@​gowridurgad</code></a> in
<a
href="https://redirect.github.com/actions/stale/pull/1277">actions/stale#1277</a></li>
</ul>
<h3>Documentation changes</h3>
<ul>
<li>Changelog update for recent releases by <a
href="https://github.com/suyashgaonkar"><code>@​suyashgaonkar</code></a>
in <a
href="https://redirect.github.com/actions/stale/pull/1224">actions/stale#1224</a></li>
<li>Permissions update in Readme by <a
href="https://github.com/ghadimir"><code>@​ghadimir</code></a> in <a
href="https://redirect.github.com/actions/stale/pull/1248">actions/stale#1248</a></li>
</ul>
<h2>New Contributors</h2>
<ul>
<li><a
href="https://github.com/suyashgaonkar"><code>@​suyashgaonkar</code></a>
made their first contribution in <a
href="https://redirect.github.com/actions/stale/pull/1224">actions/stale#1224</a></li>
<li><a href="https://github.com/GhadimiR"><code>@​GhadimiR</code></a>
made their first contribution in <a
href="https://redirect.github.com/actions/stale/pull/1248">actions/stale#1248</a></li>
<li><a
href="https://github.com/gowridurgad"><code>@​gowridurgad</code></a>
made their first contribution in <a
href="https://redirect.github.com/actions/stale/pull/1277">actions/stale#1277</a></li>
<li><a href="https://github.com/salmanmkc"><code>@​salmanmkc</code></a>
made their first contribution in <a
href="https://redirect.github.com/actions/stale/pull/1279">actions/stale#1279</a></li>
</ul>
<p><strong>Full Changelog</strong>: <a
href="https://github.com/actions/stale/compare/v9...v10.0.0">https://github.com/actions/stale/compare/v9...v10.0.0</a></p>
</blockquote>
</details>
<details>
<summary>Commits</summary>
<ul>
<li><a
href="https://github.com/actions/stale/commit/3a9db7e6a41a89f618792c92c0e97cc736e1b13f"><code>3a9db7e</code></a>
Upgrade to node 24 (<a
href="https://redirect.github.com/actions/stale/issues/1279">#1279</a>)</li>
<li><a
href="https://github.com/actions/stale/commit/8f717f0dfca33b78d3c933452e42558e4456c8e7"><code>8f717f0</code></a>
Bumps form-data (<a
href="https://redirect.github.com/actions/stale/issues/1277">#1277</a>)</li>
<li><a
href="https://github.com/actions/stale/commit/a92fd57ffeff1a7d5e9f90394c229c1cebb74321"><code>a92fd57</code></a>
build(deps): bump undici from 5.28.5 to 5.29.0 (<a
href="https://redirect.github.com/actions/stale/issues/1251">#1251</a>)</li>
<li><a
href="https://github.com/actions/stale/commit/128b2c81d01bedfe5b59d56fc08176aecd3fe6b9"><code>128b2c8</code></a>
Introducing sort-by option (<a
href="https://redirect.github.com/actions/stale/issues/1254">#1254</a>)</li>
<li><a
href="https://github.com/actions/stale/commit/f78de9780efb7a789cf4745957fa3374cbb94fd5"><code>f78de97</code></a>
Update README.md (<a
href="https://redirect.github.com/actions/stale/issues/1248">#1248</a>)</li>
<li><a
href="https://github.com/actions/stale/commit/816d9db1aba399a7f70277f1a2b01a4d21497fdd"><code>816d9db</code></a>
Upgrade <code>@​action/cache</code> from 4.0.2 to 4.0.3 (<a
href="https://redirect.github.com/actions/stale/issues/1233">#1233</a>)</li>
<li><a
href="https://github.com/actions/stale/commit/ba23c1cb02e5cb8f885b0994d870e6032be00186"><code>ba23c1c</code></a>
upgrade actions/cache from 4.0.0 to 4.0.2 (<a
href="https://redirect.github.com/actions/stale/issues/1226">#1226</a>)</li>
<li><a
href="https://github.com/actions/stale/commit/a65e88a9b971cb99d742d9a25b2f8614e10577e9"><code>a65e88a</code></a>
build(deps): bump undici from 5.28.4 to 5.28.5 (<a
href="https://redirect.github.com/actions/stale/issues/1201">#1201</a>)</li>
<li><a
href="https://github.com/actions/stale/commit/d4df79c5919b10352b8f29b9699b7acdc5500ebc"><code>d4df79c</code></a>
Updates to CHANGELOG.MD for recent releases (<a
href="https://redirect.github.com/actions/stale/issues/1224">#1224</a>)</li>
<li><a
href="https://github.com/actions/stale/commit/ee7ef89499a3de6e4fe1fc1acb994e67c64e0a2a"><code>ee7ef89</code></a>
build(deps): bump actions/publish-immutable-action from 0.0.3 to 0.0.4
(<a
href="https://redirect.github.com/actions/stale/issues/1186">#1186</a>)</li>
<li>See full diff in <a
href="https://github.com/actions/stale/compare/5bef64f19d7facfb25b37b414482c7164d639639...3a9db7e6a41a89f618792c92c0e97cc736e1b13f">compare
view</a></li>
</ul>
</details>
<br />


[![Dependabot compatibility
score](https://dependabot-badges.githubapp.com/badges/compatibility_score?dependency-name=actions/stale&package-manager=github_actions&previous-version=9.1.0&new-version=10.0.0)](https://docs.github.com/en/github/managing-security-vulnerabilities/about-dependabot-security-updates#about-compatibility-scores)

Dependabot will resolve any conflicts with this PR as long as you don't
alter it yourself. You can also trigger a rebase manually by commenting
`@dependabot rebase`.

[//]: # (dependabot-automerge-start)
[//]: # (dependabot-automerge-end)

---

<details>
<summary>Dependabot commands and options</summary>
<br />

You can trigger Dependabot actions by commenting on this PR:
- `@dependabot rebase` will rebase this PR
- `@dependabot recreate` will recreate this PR, overwriting any edits
that have been made to it
- `@dependabot merge` will merge this PR after your CI passes on it
- `@dependabot squash and merge` will squash and merge this PR after
your CI passes on it
- `@dependabot cancel merge` will cancel a previously requested merge
and block automerging
- `@dependabot reopen` will reopen this PR if it is closed
- `@dependabot close` will close this PR and stop Dependabot recreating
it. You can achieve the same result by closing it manually
- `@dependabot show <dependency name> ignore conditions` will show all
of the ignore conditions of the specified dependency
- `@dependabot ignore this major version` will close this PR and stop
Dependabot creating any more for this major version (unless you reopen
the PR or upgrade to it yourself)
- `@dependabot ignore this minor version` will close this PR and stop
Dependabot creating any more for this minor version (unless you reopen
the PR or upgrade to it yourself)
- `@dependabot ignore this dependency` will close this PR and stop
Dependabot creating any more for this dependency (unless you reopen the
PR or upgrade to it yourself)


</details>

Signed-off-by: dependabot[bot] <support@github.com>
Co-authored-by: dependabot[bot] <49699333+dependabot[bot]@users.noreply.github.com>
---
 .github/workflows/stale_bot.yml | 2 +-
 1 file changed, 1 insertion(+), 1 deletion(-)

diff --git a/.github/workflows/stale_bot.yml b/.github/workflows/stale_bot.yml
index 087df72d7..502a78f8e 100644
--- a/.github/workflows/stale_bot.yml
+++ b/.github/workflows/stale_bot.yml
@@ -24,7 +24,7 @@ jobs:
     runs-on: ubuntu-latest
     steps:
       - name: Stale Action
-        uses: actions/stale@5bef64f19d7facfb25b37b414482c7164d639639 # v9.1.0
+        uses: actions/stale@3a9db7e6a41a89f618792c92c0e97cc736e1b13f # v10.0.0
         with:
           stale-issue-label: 'stale'
           stale-issue-message: >

From dfa13d68f193b7f701c725d705251458c065e64a Mon Sep 17 00:00:00 2001
From: "dependabot[bot]" <49699333+dependabot[bot]@users.noreply.github.com>
Date: Mon, 8 Sep 2025 10:05:00 +0200
Subject: [PATCH 37/76] chore(github-deps): bump actions/setup-node from 4.4.0
 to 5.0.0 (#3353)
MIME-Version: 1.0
Content-Type: text/plain; charset=UTF-8
Content-Transfer-Encoding: 8bit

Bumps [actions/setup-node](https://github.com/actions/setup-node) from
4.4.0 to 5.0.0.
<details>
<summary>Release notes</summary>
<p><em>Sourced from <a
href="https://github.com/actions/setup-node/releases">actions/setup-node's
releases</a>.</em></p>
<blockquote>
<h2>v5.0.0</h2>
<h2>What's Changed</h2>
<h3>Breaking Changes</h3>
<ul>
<li>Enhance caching in setup-node with automatic package manager
detection by <a
href="https://github.com/priya-kinthali"><code>@​priya-kinthali</code></a>
in <a
href="https://redirect.github.com/actions/setup-node/pull/1348">actions/setup-node#1348</a></li>
</ul>
<p>This update, introduces automatic caching when a valid
<code>packageManager</code> field is present in your
<code>package.json</code>. This aims to improve workflow performance and
make dependency management more seamless. To disable this automatic
caching,
set <code>package-manager-cache: false</code></p>
<pre lang="yaml"><code>steps:
- uses: actions/checkout@v5
- uses: actions/setup-node@v5
  with:
    package-manager-cache: false
</code></pre>
<ul>
<li>Upgrade action to use node24 by <a
href="https://github.com/salmanmkc"><code>@​salmanmkc</code></a> in <a
href="https://redirect.github.com/actions/setup-node/pull/1325">actions/setup-node#1325</a></li>
</ul>
<p>Make sure your runner is on version v2.327.1 or later to ensure
compatibility with this release. <a
href="https://github.com/actions/runner/releases/tag/v2.327.1">See
Release Notes</a></p>
<h3>Dependency Upgrades</h3>
<ul>
<li>Upgrade <code>@​octokit/request-error</code> and
<code>@​actions/github</code> by <a
href="https://github.com/dependabot"><code>@​dependabot</code></a>[bot]
in <a
href="https://redirect.github.com/actions/setup-node/pull/1227">actions/setup-node#1227</a></li>
<li>Upgrade uuid from 9.0.1 to 11.1.0 by <a
href="https://github.com/dependabot"><code>@​dependabot</code></a>[bot]
in <a
href="https://redirect.github.com/actions/setup-node/pull/1273">actions/setup-node#1273</a></li>
<li>Upgrade undici from 5.28.5 to 5.29.0 by <a
href="https://github.com/dependabot"><code>@​dependabot</code></a>[bot]
in <a
href="https://redirect.github.com/actions/setup-node/pull/1295">actions/setup-node#1295</a></li>
<li>Upgrade form-data to bring in fix for critical vulnerability by <a
href="https://github.com/gowridurgad"><code>@​gowridurgad</code></a> in
<a
href="https://redirect.github.com/actions/setup-node/pull/1332">actions/setup-node#1332</a></li>
<li>Upgrade actions/checkout from 4 to 5 by <a
href="https://github.com/dependabot"><code>@​dependabot</code></a>[bot]
in <a
href="https://redirect.github.com/actions/setup-node/pull/1345">actions/setup-node#1345</a></li>
</ul>
<h2>New Contributors</h2>
<ul>
<li><a
href="https://github.com/priya-kinthali"><code>@​priya-kinthali</code></a>
made their first contribution in <a
href="https://redirect.github.com/actions/setup-node/pull/1348">actions/setup-node#1348</a></li>
<li><a href="https://github.com/salmanmkc"><code>@​salmanmkc</code></a>
made their first contribution in <a
href="https://redirect.github.com/actions/setup-node/pull/1325">actions/setup-node#1325</a></li>
</ul>
<p><strong>Full Changelog</strong>: <a
href="https://github.com/actions/setup-node/compare/v4...v5.0.0">https://github.com/actions/setup-node/compare/v4...v5.0.0</a></p>
</blockquote>
</details>
<details>
<summary>Commits</summary>
<ul>
<li><a
href="https://github.com/actions/setup-node/commit/a0853c24544627f65ddf259abe73b1d18a591444"><code>a0853c2</code></a>
Bump actions/checkout from 4 to 5 (<a
href="https://redirect.github.com/actions/setup-node/issues/1345">#1345</a>)</li>
<li><a
href="https://github.com/actions/setup-node/commit/b7234cc9fe124f0f4932554b4e5284543083ae7b"><code>b7234cc</code></a>
Upgrade action to use node24 (<a
href="https://redirect.github.com/actions/setup-node/issues/1325">#1325</a>)</li>
<li><a
href="https://github.com/actions/setup-node/commit/d7a11313b581b306c961b506cfc8971208bb03f6"><code>d7a1131</code></a>
Enhance caching in setup-node with automatic package manager detection
(<a
href="https://redirect.github.com/actions/setup-node/issues/1348">#1348</a>)</li>
<li><a
href="https://github.com/actions/setup-node/commit/5e2628c959b9ade56971c0afcebbe5332d44b398"><code>5e2628c</code></a>
Bumps form-data (<a
href="https://redirect.github.com/actions/setup-node/issues/1332">#1332</a>)</li>
<li><a
href="https://github.com/actions/setup-node/commit/65beceff8e91358525397bdce9103d999507ab03"><code>65becef</code></a>
Bump undici from 5.28.5 to 5.29.0 (<a
href="https://redirect.github.com/actions/setup-node/issues/1295">#1295</a>)</li>
<li><a
href="https://github.com/actions/setup-node/commit/7e24a656e1c7a0d6f3eaef8d8e84ae379a5b035b"><code>7e24a65</code></a>
Bump uuid from 9.0.1 to 11.1.0 (<a
href="https://redirect.github.com/actions/setup-node/issues/1273">#1273</a>)</li>
<li><a
href="https://github.com/actions/setup-node/commit/08f58d1471bff7f3a07d167b4ad7df25d5fcfcb6"><code>08f58d1</code></a>
Bump <code>@​octokit/request-error</code> and
<code>@​actions/github</code> (<a
href="https://redirect.github.com/actions/setup-node/issues/1227">#1227</a>)</li>
<li>See full diff in <a
href="https://github.com/actions/setup-node/compare/49933ea5288caeca8642d1e84afbd3f7d6820020...a0853c24544627f65ddf259abe73b1d18a591444">compare
view</a></li>
</ul>
</details>
<br />


[![Dependabot compatibility
score](https://dependabot-badges.githubapp.com/badges/compatibility_score?dependency-name=actions/setup-node&package-manager=github_actions&previous-version=4.4.0&new-version=5.0.0)](https://docs.github.com/en/github/managing-security-vulnerabilities/about-dependabot-security-updates#about-compatibility-scores)

Dependabot will resolve any conflicts with this PR as long as you don't
alter it yourself. You can also trigger a rebase manually by commenting
`@dependabot rebase`.

[//]: # (dependabot-automerge-start)
[//]: # (dependabot-automerge-end)

---

<details>
<summary>Dependabot commands and options</summary>
<br />

You can trigger Dependabot actions by commenting on this PR:
- `@dependabot rebase` will rebase this PR
- `@dependabot recreate` will recreate this PR, overwriting any edits
that have been made to it
- `@dependabot merge` will merge this PR after your CI passes on it
- `@dependabot squash and merge` will squash and merge this PR after
your CI passes on it
- `@dependabot cancel merge` will cancel a previously requested merge
and block automerging
- `@dependabot reopen` will reopen this PR if it is closed
- `@dependabot close` will close this PR and stop Dependabot recreating
it. You can achieve the same result by closing it manually
- `@dependabot show <dependency name> ignore conditions` will show all
of the ignore conditions of the specified dependency
- `@dependabot ignore this major version` will close this PR and stop
Dependabot creating any more for this major version (unless you reopen
the PR or upgrade to it yourself)
- `@dependabot ignore this minor version` will close this PR and stop
Dependabot creating any more for this minor version (unless you reopen
the PR or upgrade to it yourself)
- `@dependabot ignore this dependency` will close this PR and stop
Dependabot creating any more for this dependency (unless you reopen the
PR or upgrade to it yourself)


</details>

Signed-off-by: dependabot[bot] <support@github.com>
Co-authored-by: dependabot[bot] <49699333+dependabot[bot]@users.noreply.github.com>
---
 .github/workflows/pre-commit.yml    | 2 +-
 .github/workflows/ui-unit-tests.yml | 2 +-
 2 files changed, 2 insertions(+), 2 deletions(-)

diff --git a/.github/workflows/pre-commit.yml b/.github/workflows/pre-commit.yml
index 5f13620f7..27db5fbe7 100644
--- a/.github/workflows/pre-commit.yml
+++ b/.github/workflows/pre-commit.yml
@@ -37,7 +37,7 @@ jobs:
             .pre-commit-config.yaml
 
       - name: Set up Node.js
-        uses: actions/setup-node@49933ea5288caeca8642d1e84afbd3f7d6820020 # v4.4.0
+        uses: actions/setup-node@a0853c24544627f65ddf259abe73b1d18a591444 # v5.0.0
         with:
           node-version: '20'
           cache: 'npm'
diff --git a/.github/workflows/ui-unit-tests.yml b/.github/workflows/ui-unit-tests.yml
index 2afb92bee..c16f512d1 100644
--- a/.github/workflows/ui-unit-tests.yml
+++ b/.github/workflows/ui-unit-tests.yml
@@ -29,7 +29,7 @@ jobs:
         uses: actions/checkout@08c6903cd8c0fde910a37f88322edcfb5dd907a8 # v5.0.0
 
       - name: Setup Node.js
-        uses: actions/setup-node@49933ea5288caeca8642d1e84afbd3f7d6820020 # v4.4.0
+        uses: actions/setup-node@a0853c24544627f65ddf259abe73b1d18a591444 # v5.0.0
         with:
           node-version: ${{ matrix.node-version }}
           cache: 'npm'

From d458817af51a59b1f00c0860a3d8a9d9418153a0 Mon Sep 17 00:00:00 2001
From: "dependabot[bot]" <49699333+dependabot[bot]@users.noreply.github.com>
Date: Mon, 8 Sep 2025 10:05:34 +0200
Subject: [PATCH 38/76] chore(github-deps): bump actions/setup-python from
 5.6.0 to 6.0.0 (#3354)
MIME-Version: 1.0
Content-Type: text/plain; charset=UTF-8
Content-Transfer-Encoding: 8bit

Bumps [actions/setup-python](https://github.com/actions/setup-python)
from 5.6.0 to 6.0.0.
<details>
<summary>Release notes</summary>
<p><em>Sourced from <a
href="https://github.com/actions/setup-python/releases">actions/setup-python's
releases</a>.</em></p>
<blockquote>
<h2>v6.0.0</h2>
<h2>What's Changed</h2>
<h3>Breaking Changes</h3>
<ul>
<li>Upgrade to node 24 by <a
href="https://github.com/salmanmkc"><code>@​salmanmkc</code></a> in <a
href="https://redirect.github.com/actions/setup-python/pull/1164">actions/setup-python#1164</a></li>
</ul>
<p>Make sure your runner is on version v2.327.1 or later to ensure
compatibility with this release. <a
href="https://github.com/actions/runner/releases/tag/v2.327.1">See
Release Notes</a></p>
<h3>Enhancements:</h3>
<ul>
<li>Add support for <code>pip-version</code> by <a
href="https://github.com/priyagupta108"><code>@​priyagupta108</code></a>
in <a
href="https://redirect.github.com/actions/setup-python/pull/1129">actions/setup-python#1129</a></li>
<li>Enhance reading from .python-version by <a
href="https://github.com/krystof-k"><code>@​krystof-k</code></a> in <a
href="https://redirect.github.com/actions/setup-python/pull/787">actions/setup-python#787</a></li>
<li>Add version parsing from Pipfile by <a
href="https://github.com/aradkdj"><code>@​aradkdj</code></a> in <a
href="https://redirect.github.com/actions/setup-python/pull/1067">actions/setup-python#1067</a></li>
</ul>
<h3>Bug fixes:</h3>
<ul>
<li>Clarify pythonLocation behaviour for PyPy and GraalPy in environment
variables by <a
href="https://github.com/aparnajyothi-y"><code>@​aparnajyothi-y</code></a>
in <a
href="https://redirect.github.com/actions/setup-python/pull/1183">actions/setup-python#1183</a></li>
<li>Change missing cache directory error to warning by <a
href="https://github.com/aparnajyothi-y"><code>@​aparnajyothi-y</code></a>
in <a
href="https://redirect.github.com/actions/setup-python/pull/1182">actions/setup-python#1182</a></li>
<li>Add Architecture-Specific PATH Management for Python with --user
Flag on Windows by <a
href="https://github.com/aparnajyothi-y"><code>@​aparnajyothi-y</code></a>
in <a
href="https://redirect.github.com/actions/setup-python/pull/1122">actions/setup-python#1122</a></li>
<li>Include python version in PyPy python-version output by <a
href="https://github.com/cdce8p"><code>@​cdce8p</code></a> in <a
href="https://redirect.github.com/actions/setup-python/pull/1110">actions/setup-python#1110</a></li>
<li>Update docs: clarification on pip authentication with setup-python
by <a
href="https://github.com/priya-kinthali"><code>@​priya-kinthali</code></a>
in <a
href="https://redirect.github.com/actions/setup-python/pull/1156">actions/setup-python#1156</a></li>
</ul>
<h3>Dependency updates:</h3>
<ul>
<li>Upgrade idna from 2.9 to 3.7 in /<strong>tests</strong>/data by <a
href="https://github.com/dependabot"><code>@​dependabot</code></a>[bot]
in <a
href="https://redirect.github.com/actions/setup-python/pull/843">actions/setup-python#843</a></li>
<li>Upgrade form-data to fix critical vulnerabilities <a
href="https://redirect.github.com/actions/setup-python/issues/182">#182</a>
&amp; <a
href="https://redirect.github.com/actions/setup-python/issues/183">#183</a>
by <a
href="https://github.com/aparnajyothi-y"><code>@​aparnajyothi-y</code></a>
in <a
href="https://redirect.github.com/actions/setup-python/pull/1163">actions/setup-python#1163</a></li>
<li>Upgrade setuptools to 78.1.1 to fix path traversal vulnerability in
PackageIndex.download by <a
href="https://github.com/aparnajyothi-y"><code>@​aparnajyothi-y</code></a>
in <a
href="https://redirect.github.com/actions/setup-python/pull/1165">actions/setup-python#1165</a></li>
<li>Upgrade actions/checkout from 4 to 5 by <a
href="https://github.com/dependabot"><code>@​dependabot</code></a>[bot]
in <a
href="https://redirect.github.com/actions/setup-python/pull/1181">actions/setup-python#1181</a></li>
<li>Upgrade <code>@​actions/tool-cache</code> from 2.0.1 to 2.0.2 by <a
href="https://github.com/dependabot"><code>@​dependabot</code></a>[bot]
in <a
href="https://redirect.github.com/actions/setup-python/pull/1095">actions/setup-python#1095</a></li>
</ul>
<h2>New Contributors</h2>
<ul>
<li><a href="https://github.com/krystof-k"><code>@​krystof-k</code></a>
made their first contribution in <a
href="https://redirect.github.com/actions/setup-python/pull/787">actions/setup-python#787</a></li>
<li><a href="https://github.com/cdce8p"><code>@​cdce8p</code></a> made
their first contribution in <a
href="https://redirect.github.com/actions/setup-python/pull/1110">actions/setup-python#1110</a></li>
<li><a href="https://github.com/aradkdj"><code>@​aradkdj</code></a> made
their first contribution in <a
href="https://redirect.github.com/actions/setup-python/pull/1067">actions/setup-python#1067</a></li>
</ul>
<p><strong>Full Changelog</strong>: <a
href="https://github.com/actions/setup-python/compare/v5...v6.0.0">https://github.com/actions/setup-python/compare/v5...v6.0.0</a></p>
</blockquote>
</details>
<details>
<summary>Commits</summary>
<ul>
<li><a
href="https://github.com/actions/setup-python/commit/e797f83bcb11b83ae66e0230d6156d7c80228e7c"><code>e797f83</code></a>
Upgrade to node 24 (<a
href="https://redirect.github.com/actions/setup-python/issues/1164">#1164</a>)</li>
<li><a
href="https://github.com/actions/setup-python/commit/3d1e2d2ca0a067f27da6fec484fce7f5256def85"><code>3d1e2d2</code></a>
Revert &quot;Enhance cache-dependency-path handling to support files
outside the w...</li>
<li><a
href="https://github.com/actions/setup-python/commit/65b071217a8539818fdb8b54561bcbae40380a54"><code>65b0712</code></a>
Clarify pythonLocation behavior for PyPy and GraalPy in environment
variables...</li>
<li><a
href="https://github.com/actions/setup-python/commit/5b668cf7652160527499ee14ceaff4be9306cb88"><code>5b668cf</code></a>
Bump actions/checkout from 4 to 5 (<a
href="https://redirect.github.com/actions/setup-python/issues/1181">#1181</a>)</li>
<li><a
href="https://github.com/actions/setup-python/commit/f62a0e252fe7114e86949abfa6e1e89f85bb38c2"><code>f62a0e2</code></a>
Change missing cache directory error to warning (<a
href="https://redirect.github.com/actions/setup-python/issues/1182">#1182</a>)</li>
<li><a
href="https://github.com/actions/setup-python/commit/9322b3ca74000aeb2c01eb777b646334015ddd72"><code>9322b3c</code></a>
Upgrade setuptools to 78.1.1 to fix path traversal vulnerability in
PackageIn...</li>
<li><a
href="https://github.com/actions/setup-python/commit/fbeb884f69f0ac1c0257302f62aa524c2824b649"><code>fbeb884</code></a>
Bump form-data to fix critical vulnerabilities <a
href="https://redirect.github.com/actions/setup-python/issues/182">#182</a>
&amp; <a
href="https://redirect.github.com/actions/setup-python/issues/183">#183</a>
(<a
href="https://redirect.github.com/actions/setup-python/issues/1163">#1163</a>)</li>
<li><a
href="https://github.com/actions/setup-python/commit/03bb6152f4f691b9d64579a1bd791904a083c452"><code>03bb615</code></a>
Bump idna from 2.9 to 3.7 in /<strong>tests</strong>/data (<a
href="https://redirect.github.com/actions/setup-python/issues/843">#843</a>)</li>
<li><a
href="https://github.com/actions/setup-python/commit/36da51d563b70a972897150555bb025096d65565"><code>36da51d</code></a>
Add version parsing from Pipfile (<a
href="https://redirect.github.com/actions/setup-python/issues/1067">#1067</a>)</li>
<li><a
href="https://github.com/actions/setup-python/commit/3c6f142cc0036d53007e92fa1e327564a4cfb7aa"><code>3c6f142</code></a>
update documentation (<a
href="https://redirect.github.com/actions/setup-python/issues/1156">#1156</a>)</li>
<li>Additional commits viewable in <a
href="https://github.com/actions/setup-python/compare/a26af69be951a213d495a4c3e4e4022e16d87065...e797f83bcb11b83ae66e0230d6156d7c80228e7c">compare
view</a></li>
</ul>
</details>
<br />


[![Dependabot compatibility
score](https://dependabot-badges.githubapp.com/badges/compatibility_score?dependency-name=actions/setup-python&package-manager=github_actions&previous-version=5.6.0&new-version=6.0.0)](https://docs.github.com/en/github/managing-security-vulnerabilities/about-dependabot-security-updates#about-compatibility-scores)

Dependabot will resolve any conflicts with this PR as long as you don't
alter it yourself. You can also trigger a rebase manually by commenting
`@dependabot rebase`.

[//]: # (dependabot-automerge-start)
[//]: # (dependabot-automerge-end)

---

<details>
<summary>Dependabot commands and options</summary>
<br />

You can trigger Dependabot actions by commenting on this PR:
- `@dependabot rebase` will rebase this PR
- `@dependabot recreate` will recreate this PR, overwriting any edits
that have been made to it
- `@dependabot merge` will merge this PR after your CI passes on it
- `@dependabot squash and merge` will squash and merge this PR after
your CI passes on it
- `@dependabot cancel merge` will cancel a previously requested merge
and block automerging
- `@dependabot reopen` will reopen this PR if it is closed
- `@dependabot close` will close this PR and stop Dependabot recreating
it. You can achieve the same result by closing it manually
- `@dependabot show <dependency name> ignore conditions` will show all
of the ignore conditions of the specified dependency
- `@dependabot ignore this major version` will close this PR and stop
Dependabot creating any more for this major version (unless you reopen
the PR or upgrade to it yourself)
- `@dependabot ignore this minor version` will close this PR and stop
Dependabot creating any more for this minor version (unless you reopen
the PR or upgrade to it yourself)
- `@dependabot ignore this dependency` will close this PR and stop
Dependabot creating any more for this dependency (unless you reopen the
PR or upgrade to it yourself)


</details>

Signed-off-by: dependabot[bot] <support@github.com>
Co-authored-by: dependabot[bot] <49699333+dependabot[bot]@users.noreply.github.com>
---
 .github/workflows/pre-commit.yml | 2 +-
 1 file changed, 1 insertion(+), 1 deletion(-)

diff --git a/.github/workflows/pre-commit.yml b/.github/workflows/pre-commit.yml
index 27db5fbe7..792162262 100644
--- a/.github/workflows/pre-commit.yml
+++ b/.github/workflows/pre-commit.yml
@@ -28,7 +28,7 @@ jobs:
           fetch-depth: ${{ github.actor == 'dependabot[bot]' && 0 || 1 }}
 
       - name: Set up Python
-        uses: actions/setup-python@a26af69be951a213d495a4c3e4e4022e16d87065 # v5.6.0
+        uses: actions/setup-python@e797f83bcb11b83ae66e0230d6156d7c80228e7c # v6.0.0
         with:
           python-version: '3.12'
           cache: pip

From 44e1a405950f773354ae06c7062ce146f3ea8219 Mon Sep 17 00:00:00 2001
From: "dependabot[bot]" <49699333+dependabot[bot]@users.noreply.github.com>
Date: Mon, 8 Sep 2025 10:07:03 +0200
Subject: [PATCH 39/76] chore(github-deps): bump actions/checkout from 4.1.7 to
 5.0.0 (#3357)
MIME-Version: 1.0
Content-Type: text/plain; charset=UTF-8
Content-Transfer-Encoding: 8bit

[//]: # (dependabot-start)
⚠️  **Dependabot is rebasing this PR** ⚠️

Rebasing might not happen immediately, so don't worry if this takes some
time.

Note: if you make any changes to this PR yourself, they will take
precedence over the rebase.

---

[//]: # (dependabot-end)

Bumps [actions/checkout](https://github.com/actions/checkout) from 4.1.7
to 5.0.0.
<details>
<summary>Release notes</summary>
<p><em>Sourced from <a
href="https://github.com/actions/checkout/releases">actions/checkout's
releases</a>.</em></p>
<blockquote>
<h2>v5.0.0</h2>
<h2>What's Changed</h2>
<ul>
<li>Update actions checkout to use node 24 by <a
href="https://github.com/salmanmkc"><code>@​salmanmkc</code></a> in <a
href="https://redirect.github.com/actions/checkout/pull/2226">actions/checkout#2226</a></li>
<li>Prepare v5.0.0 release by <a
href="https://github.com/salmanmkc"><code>@​salmanmkc</code></a> in <a
href="https://redirect.github.com/actions/checkout/pull/2238">actions/checkout#2238</a></li>
</ul>
<h2>⚠️ Minimum Compatible Runner Version</h2>
<p><strong>v2.327.1</strong><br />
<a
href="https://github.com/actions/runner/releases/tag/v2.327.1">Release
Notes</a></p>
<p>Make sure your runner is updated to this version or newer to use this
release.</p>
<p><strong>Full Changelog</strong>: <a
href="https://github.com/actions/checkout/compare/v4...v5.0.0">https://github.com/actions/checkout/compare/v4...v5.0.0</a></p>
<h2>v4.3.0</h2>
<h2>What's Changed</h2>
<ul>
<li>docs: update README.md by <a
href="https://github.com/motss"><code>@​motss</code></a> in <a
href="https://redirect.github.com/actions/checkout/pull/1971">actions/checkout#1971</a></li>
<li>Add internal repos for checking out multiple repositories by <a
href="https://github.com/mouismail"><code>@​mouismail</code></a> in <a
href="https://redirect.github.com/actions/checkout/pull/1977">actions/checkout#1977</a></li>
<li>Documentation update - add recommended permissions to Readme by <a
href="https://github.com/benwells"><code>@​benwells</code></a> in <a
href="https://redirect.github.com/actions/checkout/pull/2043">actions/checkout#2043</a></li>
<li>Adjust positioning of user email note and permissions heading by <a
href="https://github.com/joshmgross"><code>@​joshmgross</code></a> in <a
href="https://redirect.github.com/actions/checkout/pull/2044">actions/checkout#2044</a></li>
<li>Update README.md by <a
href="https://github.com/nebuk89"><code>@​nebuk89</code></a> in <a
href="https://redirect.github.com/actions/checkout/pull/2194">actions/checkout#2194</a></li>
<li>Update CODEOWNERS for actions by <a
href="https://github.com/TingluoHuang"><code>@​TingluoHuang</code></a>
in <a
href="https://redirect.github.com/actions/checkout/pull/2224">actions/checkout#2224</a></li>
<li>Update package dependencies by <a
href="https://github.com/salmanmkc"><code>@​salmanmkc</code></a> in <a
href="https://redirect.github.com/actions/checkout/pull/2236">actions/checkout#2236</a></li>
<li>Prepare release v4.3.0 by <a
href="https://github.com/salmanmkc"><code>@​salmanmkc</code></a> in <a
href="https://redirect.github.com/actions/checkout/pull/2237">actions/checkout#2237</a></li>
</ul>
<h2>New Contributors</h2>
<ul>
<li><a href="https://github.com/motss"><code>@​motss</code></a> made
their first contribution in <a
href="https://redirect.github.com/actions/checkout/pull/1971">actions/checkout#1971</a></li>
<li><a href="https://github.com/mouismail"><code>@​mouismail</code></a>
made their first contribution in <a
href="https://redirect.github.com/actions/checkout/pull/1977">actions/checkout#1977</a></li>
<li><a href="https://github.com/benwells"><code>@​benwells</code></a>
made their first contribution in <a
href="https://redirect.github.com/actions/checkout/pull/2043">actions/checkout#2043</a></li>
<li><a href="https://github.com/nebuk89"><code>@​nebuk89</code></a> made
their first contribution in <a
href="https://redirect.github.com/actions/checkout/pull/2194">actions/checkout#2194</a></li>
<li><a href="https://github.com/salmanmkc"><code>@​salmanmkc</code></a>
made their first contribution in <a
href="https://redirect.github.com/actions/checkout/pull/2236">actions/checkout#2236</a></li>
</ul>
<p><strong>Full Changelog</strong>: <a
href="https://github.com/actions/checkout/compare/v4...v4.3.0">https://github.com/actions/checkout/compare/v4...v4.3.0</a></p>
<h2>v4.2.2</h2>
<h2>What's Changed</h2>
<ul>
<li><code>url-helper.ts</code> now leverages well-known environment
variables by <a href="https://github.com/jww3"><code>@​jww3</code></a>
in <a
href="https://redirect.github.com/actions/checkout/pull/1941">actions/checkout#1941</a></li>
<li>Expand unit test coverage for <code>isGhes</code> by <a
href="https://github.com/jww3"><code>@​jww3</code></a> in <a
href="https://redirect.github.com/actions/checkout/pull/1946">actions/checkout#1946</a></li>
</ul>
<p><strong>Full Changelog</strong>: <a
href="https://github.com/actions/checkout/compare/v4.2.1...v4.2.2">https://github.com/actions/checkout/compare/v4.2.1...v4.2.2</a></p>
<h2>v4.2.1</h2>
<h2>What's Changed</h2>
<ul>
<li>Check out other refs/* by commit if provided, fall back to ref by <a
href="https://github.com/orhantoy"><code>@​orhantoy</code></a> in <a
href="https://redirect.github.com/actions/checkout/pull/1924">actions/checkout#1924</a></li>
</ul>
<h2>New Contributors</h2>
<ul>
<li><a href="https://github.com/Jcambass"><code>@​Jcambass</code></a>
made their first contribution in <a
href="https://redirect.github.com/actions/checkout/pull/1919">actions/checkout#1919</a></li>
</ul>
<p><strong>Full Changelog</strong>: <a
href="https://github.com/actions/checkout/compare/v4.2.0...v4.2.1">https://github.com/actions/checkout/compare/v4.2.0...v4.2.1</a></p>
<!-- raw HTML omitted -->
</blockquote>
<p>... (truncated)</p>
</details>
<details>
<summary>Changelog</summary>
<p><em>Sourced from <a
href="https://github.com/actions/checkout/blob/main/CHANGELOG.md">actions/checkout's
changelog</a>.</em></p>
<blockquote>
<h1>Changelog</h1>
<h2>V5.0.0</h2>
<ul>
<li>Update actions checkout to use node 24 by <a
href="https://github.com/salmanmkc"><code>@​salmanmkc</code></a> in <a
href="https://redirect.github.com/actions/checkout/pull/2226">actions/checkout#2226</a></li>
</ul>
<h2>V4.3.0</h2>
<ul>
<li>docs: update README.md by <a
href="https://github.com/motss"><code>@​motss</code></a> in <a
href="https://redirect.github.com/actions/checkout/pull/1971">actions/checkout#1971</a></li>
<li>Add internal repos for checking out multiple repositories by <a
href="https://github.com/mouismail"><code>@​mouismail</code></a> in <a
href="https://redirect.github.com/actions/checkout/pull/1977">actions/checkout#1977</a></li>
<li>Documentation update - add recommended permissions to Readme by <a
href="https://github.com/benwells"><code>@​benwells</code></a> in <a
href="https://redirect.github.com/actions/checkout/pull/2043">actions/checkout#2043</a></li>
<li>Adjust positioning of user email note and permissions heading by <a
href="https://github.com/joshmgross"><code>@​joshmgross</code></a> in <a
href="https://redirect.github.com/actions/checkout/pull/2044">actions/checkout#2044</a></li>
<li>Update README.md by <a
href="https://github.com/nebuk89"><code>@​nebuk89</code></a> in <a
href="https://redirect.github.com/actions/checkout/pull/2194">actions/checkout#2194</a></li>
<li>Update CODEOWNERS for actions by <a
href="https://github.com/TingluoHuang"><code>@​TingluoHuang</code></a>
in <a
href="https://redirect.github.com/actions/checkout/pull/2224">actions/checkout#2224</a></li>
<li>Update package dependencies by <a
href="https://github.com/salmanmkc"><code>@​salmanmkc</code></a> in <a
href="https://redirect.github.com/actions/checkout/pull/2236">actions/checkout#2236</a></li>
</ul>
<h2>v4.2.2</h2>
<ul>
<li><code>url-helper.ts</code> now leverages well-known environment
variables by <a href="https://github.com/jww3"><code>@​jww3</code></a>
in <a
href="https://redirect.github.com/actions/checkout/pull/1941">actions/checkout#1941</a></li>
<li>Expand unit test coverage for <code>isGhes</code> by <a
href="https://github.com/jww3"><code>@​jww3</code></a> in <a
href="https://redirect.github.com/actions/checkout/pull/1946">actions/checkout#1946</a></li>
</ul>
<h2>v4.2.1</h2>
<ul>
<li>Check out other refs/* by commit if provided, fall back to ref by <a
href="https://github.com/orhantoy"><code>@​orhantoy</code></a> in <a
href="https://redirect.github.com/actions/checkout/pull/1924">actions/checkout#1924</a></li>
</ul>
<h2>v4.2.0</h2>
<ul>
<li>Add Ref and Commit outputs by <a
href="https://github.com/lucacome"><code>@​lucacome</code></a> in <a
href="https://redirect.github.com/actions/checkout/pull/1180">actions/checkout#1180</a></li>
<li>Dependency updates by <a
href="https://github.com/dependabot"><code>@​dependabot</code></a>- <a
href="https://redirect.github.com/actions/checkout/pull/1777">actions/checkout#1777</a>,
<a
href="https://redirect.github.com/actions/checkout/pull/1872">actions/checkout#1872</a></li>
</ul>
<h2>v4.1.7</h2>
<ul>
<li>Bump the minor-npm-dependencies group across 1 directory with 4
updates by <a
href="https://github.com/dependabot"><code>@​dependabot</code></a> in <a
href="https://redirect.github.com/actions/checkout/pull/1739">actions/checkout#1739</a></li>
<li>Bump actions/checkout from 3 to 4 by <a
href="https://github.com/dependabot"><code>@​dependabot</code></a> in <a
href="https://redirect.github.com/actions/checkout/pull/1697">actions/checkout#1697</a></li>
<li>Check out other refs/* by commit by <a
href="https://github.com/orhantoy"><code>@​orhantoy</code></a> in <a
href="https://redirect.github.com/actions/checkout/pull/1774">actions/checkout#1774</a></li>
<li>Pin actions/checkout's own workflows to a known, good, stable
version. by <a href="https://github.com/jww3"><code>@​jww3</code></a> in
<a
href="https://redirect.github.com/actions/checkout/pull/1776">actions/checkout#1776</a></li>
</ul>
<h2>v4.1.6</h2>
<ul>
<li>Check platform to set archive extension appropriately by <a
href="https://github.com/cory-miller"><code>@​cory-miller</code></a> in
<a
href="https://redirect.github.com/actions/checkout/pull/1732">actions/checkout#1732</a></li>
</ul>
<h2>v4.1.5</h2>
<ul>
<li>Update NPM dependencies by <a
href="https://github.com/cory-miller"><code>@​cory-miller</code></a> in
<a
href="https://redirect.github.com/actions/checkout/pull/1703">actions/checkout#1703</a></li>
<li>Bump github/codeql-action from 2 to 3 by <a
href="https://github.com/dependabot"><code>@​dependabot</code></a> in <a
href="https://redirect.github.com/actions/checkout/pull/1694">actions/checkout#1694</a></li>
<li>Bump actions/setup-node from 1 to 4 by <a
href="https://github.com/dependabot"><code>@​dependabot</code></a> in <a
href="https://redirect.github.com/actions/checkout/pull/1696">actions/checkout#1696</a></li>
<li>Bump actions/upload-artifact from 2 to 4 by <a
href="https://github.com/dependabot"><code>@​dependabot</code></a> in <a
href="https://redirect.github.com/actions/checkout/pull/1695">actions/checkout#1695</a></li>
<li>README: Suggest <code>user.email</code> to be
<code>41898282+github-actions[bot]@users.noreply.github.com</code> by <a
href="https://github.com/cory-miller"><code>@​cory-miller</code></a> in
<a
href="https://redirect.github.com/actions/checkout/pull/1707">actions/checkout#1707</a></li>
</ul>
<h2>v4.1.4</h2>
<ul>
<li>Disable <code>extensions.worktreeConfig</code> when disabling
<code>sparse-checkout</code> by <a
href="https://github.com/jww3"><code>@​jww3</code></a> in <a
href="https://redirect.github.com/actions/checkout/pull/1692">actions/checkout#1692</a></li>
<li>Add dependabot config by <a
href="https://github.com/cory-miller"><code>@​cory-miller</code></a> in
<a
href="https://redirect.github.com/actions/checkout/pull/1688">actions/checkout#1688</a></li>
<li>Bump the minor-actions-dependencies group with 2 updates by <a
href="https://github.com/dependabot"><code>@​dependabot</code></a> in <a
href="https://redirect.github.com/actions/checkout/pull/1693">actions/checkout#1693</a></li>
<li>Bump word-wrap from 1.2.3 to 1.2.5 by <a
href="https://github.com/dependabot"><code>@​dependabot</code></a> in <a
href="https://redirect.github.com/actions/checkout/pull/1643">actions/checkout#1643</a></li>
</ul>
<h2>v4.1.3</h2>
<!-- raw HTML omitted -->
</blockquote>
<p>... (truncated)</p>
</details>
<details>
<summary>Commits</summary>
<ul>
<li><a
href="https://github.com/actions/checkout/commit/08c6903cd8c0fde910a37f88322edcfb5dd907a8"><code>08c6903</code></a>
Prepare v5.0.0 release (<a
href="https://redirect.github.com/actions/checkout/issues/2238">#2238</a>)</li>
<li><a
href="https://github.com/actions/checkout/commit/9f265659d3bb64ab1440b03b12f4d47a24320917"><code>9f26565</code></a>
Update actions checkout to use node 24 (<a
href="https://redirect.github.com/actions/checkout/issues/2226">#2226</a>)</li>
<li><a
href="https://github.com/actions/checkout/commit/08eba0b27e820071cde6df949e0beb9ba4906955"><code>08eba0b</code></a>
Prepare release v4.3.0 (<a
href="https://redirect.github.com/actions/checkout/issues/2237">#2237</a>)</li>
<li><a
href="https://github.com/actions/checkout/commit/631c7dc4f80f88219c5ee78fee08c6b62fac8da1"><code>631c7dc</code></a>
Update package dependencies (<a
href="https://redirect.github.com/actions/checkout/issues/2236">#2236</a>)</li>
<li><a
href="https://github.com/actions/checkout/commit/8edcb1bdb4e267140fa742c62e395cd74f332709"><code>8edcb1b</code></a>
Update CODEOWNERS for actions (<a
href="https://redirect.github.com/actions/checkout/issues/2224">#2224</a>)</li>
<li><a
href="https://github.com/actions/checkout/commit/09d2acae674a48949e3602304ab46fd20ae0c42f"><code>09d2aca</code></a>
Update README.md (<a
href="https://redirect.github.com/actions/checkout/issues/2194">#2194</a>)</li>
<li><a
href="https://github.com/actions/checkout/commit/85e6279cec87321a52edac9c87bce653a07cf6c2"><code>85e6279</code></a>
Adjust positioning of user email note and permissions heading (<a
href="https://redirect.github.com/actions/checkout/issues/2044">#2044</a>)</li>
<li><a
href="https://github.com/actions/checkout/commit/009b9ae9e446ad8d9b8c809870b0fbcc5e03573e"><code>009b9ae</code></a>
Documentation update - add recommended permissions to Readme (<a
href="https://redirect.github.com/actions/checkout/issues/2043">#2043</a>)</li>
<li><a
href="https://github.com/actions/checkout/commit/cbb722410c2e876e24abbe8de2cc27693e501dcb"><code>cbb7224</code></a>
Update README.md (<a
href="https://redirect.github.com/actions/checkout/issues/1977">#1977</a>)</li>
<li><a
href="https://github.com/actions/checkout/commit/3b9b8c884f6b4bb4d5be2779c26374abadae0871"><code>3b9b8c8</code></a>
docs: update README.md (<a
href="https://redirect.github.com/actions/checkout/issues/1971">#1971</a>)</li>
<li>Additional commits viewable in <a
href="https://github.com/actions/checkout/compare/v4.1.7...08c6903cd8c0fde910a37f88322edcfb5dd907a8">compare
view</a></li>
</ul>
</details>
<br />


[![Dependabot compatibility
score](https://dependabot-badges.githubapp.com/badges/compatibility_score?dependency-name=actions/checkout&package-manager=github_actions&previous-version=4.1.7&new-version=5.0.0)](https://docs.github.com/en/github/managing-security-vulnerabilities/about-dependabot-security-updates#about-compatibility-scores)

Dependabot will resolve any conflicts with this PR as long as you don't
alter it yourself. You can also trigger a rebase manually by commenting
`@dependabot rebase`.

[//]: # (dependabot-automerge-start)
[//]: # (dependabot-automerge-end)

---

<details>
<summary>Dependabot commands and options</summary>
<br />

You can trigger Dependabot actions by commenting on this PR:
- `@dependabot rebase` will rebase this PR
- `@dependabot recreate` will recreate this PR, overwriting any edits
that have been made to it
- `@dependabot merge` will merge this PR after your CI passes on it
- `@dependabot squash and merge` will squash and merge this PR after
your CI passes on it
- `@dependabot cancel merge` will cancel a previously requested merge
and block automerging
- `@dependabot reopen` will reopen this PR if it is closed
- `@dependabot close` will close this PR and stop Dependabot recreating
it. You can achieve the same result by closing it manually
- `@dependabot show <dependency name> ignore conditions` will show all
of the ignore conditions of the specified dependency
- `@dependabot ignore this major version` will close this PR and stop
Dependabot creating any more for this major version (unless you reopen
the PR or upgrade to it yourself)
- `@dependabot ignore this minor version` will close this PR and stop
Dependabot creating any more for this minor version (unless you reopen
the PR or upgrade to it yourself)
- `@dependabot ignore this dependency` will close this PR and stop
Dependabot creating any more for this dependency (unless you reopen the
PR or upgrade to it yourself)


</details>

Signed-off-by: dependabot[bot] <support@github.com>
Co-authored-by: dependabot[bot] <49699333+dependabot[bot]@users.noreply.github.com>
---
 .github/workflows/conformance.yml | 4 ++--
 1 file changed, 2 insertions(+), 2 deletions(-)

diff --git a/.github/workflows/conformance.yml b/.github/workflows/conformance.yml
index 2433b0203..c0a7795a3 100644
--- a/.github/workflows/conformance.yml
+++ b/.github/workflows/conformance.yml
@@ -33,12 +33,12 @@ jobs:
       # Using specific version 4.1.7 because 5.0.0 fails when trying to run this locally using `act`
       # This ensures consistent behavior between local testing and CI
       - name: Checkout PR Code
-        uses: actions/checkout@692973e3d937129bcbf40652eb9f2f61becf3332 # v4.1.7
+        uses: actions/checkout@08c6903cd8c0fde910a37f88322edcfb5dd907a8 # v5.0.0
 
       # Checkout the base branch to compare against (usually main)
       # This allows us to diff the current changes against the previous state
       - name: Checkout Base Branch
-        uses: actions/checkout@692973e3d937129bcbf40652eb9f2f61becf3332 # v4.1.7
+        uses: actions/checkout@08c6903cd8c0fde910a37f88322edcfb5dd907a8 # v5.0.0
         with:
           ref: ${{ github.event.pull_request.base.ref }}
           path: 'base'

From 072dca0609c55205cd8a8ada5a727c631ce0cc3b Mon Sep 17 00:00:00 2001
From: Akram Ben Aissi <akram.benaissi@gmail.com>
Date: Mon, 8 Sep 2025 11:25:10 +0200
Subject: [PATCH 40/76] feat: Add Kubernetes  auth provider to use
 SelfSubjectReview and kubernetes api server (#2559)

# What does this PR do?
Add Kubernetes authentication provider support
- Add KubernetesAuthProvider class for token validation using Kubernetes
SelfSubjectReview API
- Add KubernetesAuthProviderConfig with configurable API server URL, TLS
settings, and claims mapping
- Implement authentication via POST requests to
/apis/authentication.k8s.io/v1/selfsubjectreviews endpoint
- Add support for parsing Kubernetes SelfSubjectReview response format
to extract user information
- Add KUBERNETES provider type to AuthProviderType enum
- Update create_auth_provider factory function to handle 'kubernetes'
provider type
- Add comprehensive unit tests for KubernetesAuthProvider functionality
- Add documentation with configuration examples and usage instructions

The provider validates tokens by sending SelfSubjectReview requests to
the Kubernetes API server and extracts user information from the
userInfo structure in the response.


<!-- If resolving an issue, uncomment and update the line below -->
<!-- Closes #[issue-number] -->

## Test Plan
<!-- Describe the tests you ran to verify your changes with result
summaries. *Provide clear instructions so the plan can be easily
re-executed.* -->
What This Verifies:
Authentication header validation
Token validation with Kubernetes SelfSubjectReview and kubernetes server
API endpoint
Error handling for invalid tokens and HTTP errors
Request payload structure and headers

```
python -m pytest tests/unit/server/test_auth.py -k "kubernetes" -v
```

Signed-off-by: Akram Ben Aissi <akram.benaissi@gmail.com>
---
 docs/source/distributions/configuration.md |  41 +++++++
 llama_stack/apis/common/errors.py          |   7 ++
 llama_stack/core/datatypes.py              |  41 ++++++-
 llama_stack/core/server/auth_providers.py  |  93 +++++++++++++-
 tests/unit/server/test_auth.py             | 133 +++++++++++++++++++++
 5 files changed, 311 insertions(+), 4 deletions(-)

diff --git a/docs/source/distributions/configuration.md b/docs/source/distributions/configuration.md
index c9677b3b6..452c3d95f 100644
--- a/docs/source/distributions/configuration.md
+++ b/docs/source/distributions/configuration.md
@@ -354,6 +354,47 @@ You can easily validate a request by running:
 curl -s -L -H "Authorization: Bearer $(cat llama-stack-auth-token)" http://127.0.0.1:8321/v1/providers
 ```
 
+#### Kubernetes Authentication Provider
+
+The server can be configured to use Kubernetes SelfSubjectReview API to validate tokens directly against the Kubernetes API server:
+
+```yaml
+server:
+  auth:
+    provider_config:
+      type: "kubernetes"
+      api_server_url: "https://kubernetes.default.svc"
+      claims_mapping:
+        username: "roles"
+        groups: "roles"
+        uid: "uid_attr"
+      verify_tls: true
+      tls_cafile: "/path/to/ca.crt"
+```
+
+Configuration options:
+- `api_server_url`: The Kubernetes API server URL (e.g., https://kubernetes.default.svc:6443)
+- `verify_tls`: Whether to verify TLS certificates (default: true)
+- `tls_cafile`: Path to CA certificate file for TLS verification
+- `claims_mapping`: Mapping of Kubernetes user claims to access attributes
+
+The provider validates tokens by sending a SelfSubjectReview request to the Kubernetes API server at `/apis/authentication.k8s.io/v1/selfsubjectreviews`. The provider extracts user information from the response:
+- Username from the `userInfo.username` field
+- Groups from the `userInfo.groups` field
+- UID from the `userInfo.uid` field
+
+To obtain a token for testing:
+```bash
+kubectl create namespace llama-stack
+kubectl create serviceaccount llama-stack-auth -n llama-stack
+kubectl create token llama-stack-auth -n llama-stack > llama-stack-auth-token
+```
+
+You can validate a request by running:
+```bash
+curl -s -L -H "Authorization: Bearer $(cat llama-stack-auth-token)" http://127.0.0.1:8321/v1/providers
+```
+
 #### GitHub Token Provider
 Validates GitHub personal access tokens or OAuth tokens directly:
 ```yaml
diff --git a/llama_stack/apis/common/errors.py b/llama_stack/apis/common/errors.py
index ec3d2b1ce..4c9c0a818 100644
--- a/llama_stack/apis/common/errors.py
+++ b/llama_stack/apis/common/errors.py
@@ -79,3 +79,10 @@ class ConflictError(ValueError):
 
     def __init__(self, message: str) -> None:
         super().__init__(message)
+
+
+class TokenValidationError(ValueError):
+    """raised when token validation fails during authentication"""
+
+    def __init__(self, message: str) -> None:
+        super().__init__(message)
diff --git a/llama_stack/core/datatypes.py b/llama_stack/core/datatypes.py
index c3940fcbd..0f348b067 100644
--- a/llama_stack/core/datatypes.py
+++ b/llama_stack/core/datatypes.py
@@ -7,6 +7,7 @@
 from enum import StrEnum
 from pathlib import Path
 from typing import Annotated, Any, Literal, Self
+from urllib.parse import urlparse
 
 from pydantic import BaseModel, Field, field_validator, model_validator
 
@@ -212,6 +213,7 @@ class AuthProviderType(StrEnum):
     OAUTH2_TOKEN = "oauth2_token"
     GITHUB_TOKEN = "github_token"
     CUSTOM = "custom"
+    KUBERNETES = "kubernetes"
 
 
 class OAuth2TokenAuthConfig(BaseModel):
@@ -282,8 +284,45 @@ class GitHubTokenAuthConfig(BaseModel):
     )
 
 
+class KubernetesAuthProviderConfig(BaseModel):
+    """Configuration for Kubernetes authentication provider."""
+
+    type: Literal[AuthProviderType.KUBERNETES] = AuthProviderType.KUBERNETES
+    api_server_url: str = Field(
+        default="https://kubernetes.default.svc",
+        description="Kubernetes API server URL (e.g., https://api.cluster.domain:6443)",
+    )
+    verify_tls: bool = Field(default=True, description="Whether to verify TLS certificates")
+    tls_cafile: Path | None = Field(default=None, description="Path to CA certificate file for TLS verification")
+    claims_mapping: dict[str, str] = Field(
+        default_factory=lambda: {
+            "username": "roles",
+            "groups": "roles",
+        },
+        description="Mapping of Kubernetes user claims to access attributes",
+    )
+
+    @field_validator("api_server_url")
+    @classmethod
+    def validate_api_server_url(cls, v):
+        parsed = urlparse(v)
+        if not parsed.scheme or not parsed.netloc:
+            raise ValueError(f"api_server_url must be a valid URL with scheme and host: {v}")
+        if parsed.scheme not in ["http", "https"]:
+            raise ValueError(f"api_server_url scheme must be http or https: {v}")
+        return v
+
+    @field_validator("claims_mapping")
+    @classmethod
+    def validate_claims_mapping(cls, v):
+        for key, value in v.items():
+            if not value:
+                raise ValueError(f"claims_mapping value cannot be empty: {key}")
+        return v
+
+
 AuthProviderConfig = Annotated[
-    OAuth2TokenAuthConfig | GitHubTokenAuthConfig | CustomAuthConfig,
+    OAuth2TokenAuthConfig | GitHubTokenAuthConfig | CustomAuthConfig | KubernetesAuthProviderConfig,
     Field(discriminator="type"),
 ]
 
diff --git a/llama_stack/core/server/auth_providers.py b/llama_stack/core/server/auth_providers.py
index a8af6f75a..38188c49a 100644
--- a/llama_stack/core/server/auth_providers.py
+++ b/llama_stack/core/server/auth_providers.py
@@ -8,16 +8,18 @@ import ssl
 import time
 from abc import ABC, abstractmethod
 from asyncio import Lock
-from urllib.parse import parse_qs, urlparse
+from urllib.parse import parse_qs, urljoin, urlparse
 
 import httpx
 from jose import jwt
 from pydantic import BaseModel, Field
 
+from llama_stack.apis.common.errors import TokenValidationError
 from llama_stack.core.datatypes import (
     AuthenticationConfig,
     CustomAuthConfig,
     GitHubTokenAuthConfig,
+    KubernetesAuthProviderConfig,
     OAuth2TokenAuthConfig,
     User,
 )
@@ -162,7 +164,7 @@ class OAuth2TokenAuthProvider(AuthProvider):
                     auth=auth,
                     timeout=10.0,  # Add a reasonable timeout
                 )
-                if response.status_code != 200:
+                if response.status_code != httpx.codes.OK:
                     logger.warning(f"Token introspection failed with status code: {response.status_code}")
                     raise ValueError(f"Token introspection failed: {response.status_code}")
 
@@ -272,7 +274,7 @@ class CustomAuthProvider(AuthProvider):
                     json=auth_request.model_dump(),
                     timeout=10.0,  # Add a reasonable timeout
                 )
-                if response.status_code != 200:
+                if response.status_code != httpx.codes.OK:
                     logger.warning(f"Authentication failed with status code: {response.status_code}")
                     raise ValueError(f"Authentication failed: {response.status_code}")
 
@@ -374,6 +376,89 @@ async def _get_github_user_info(access_token: str, github_api_base_url: str) ->
         }
 
 
+class KubernetesAuthProvider(AuthProvider):
+    """
+    Kubernetes authentication provider that validates tokens using the Kubernetes SelfSubjectReview API.
+    This provider integrates with Kubernetes API server by using the
+    /apis/authentication.k8s.io/v1/selfsubjectreviews endpoint to validate tokens and extract user information.
+    """
+
+    def __init__(self, config: KubernetesAuthProviderConfig):
+        self.config = config
+
+    def _httpx_verify_value(self) -> bool | str:
+        """
+        Build the value for httpx's `verify` parameter.
+        - False disables verification.
+        - Path string points to a CA bundle.
+        - True uses system defaults.
+        """
+        if not self.config.verify_tls:
+            return False
+        if self.config.tls_cafile:
+            return self.config.tls_cafile.as_posix()
+        return True
+
+    async def validate_token(self, token: str, scope: dict | None = None) -> User:
+        """Validate a token using Kubernetes SelfSubjectReview API endpoint."""
+        # Build the Kubernetes SelfSubjectReview API endpoint URL
+        review_api_url = urljoin(self.config.api_server_url, "/apis/authentication.k8s.io/v1/selfsubjectreviews")
+
+        # Create SelfSubjectReview request body
+        review_request = {"apiVersion": "authentication.k8s.io/v1", "kind": "SelfSubjectReview"}
+        verify = self._httpx_verify_value()
+
+        try:
+            async with httpx.AsyncClient(verify=verify, timeout=10.0) as client:
+                response = await client.post(
+                    review_api_url,
+                    json=review_request,
+                    headers={
+                        "Authorization": f"Bearer {token}",
+                        "Content-Type": "application/json",
+                    },
+                )
+
+                if response.status_code == httpx.codes.UNAUTHORIZED:
+                    raise TokenValidationError("Invalid token")
+                if response.status_code != httpx.codes.CREATED:
+                    logger.warning(f"Kubernetes SelfSubjectReview API failed with status code: {response.status_code}")
+                    raise TokenValidationError(f"Token validation failed: {response.status_code}")
+
+                review_response = response.json()
+                # Extract user information from SelfSubjectReview response
+                status = review_response.get("status", {})
+                if not status:
+                    raise ValueError("No status found in SelfSubjectReview response")
+
+                user_info = status.get("userInfo", {})
+                if not user_info:
+                    raise ValueError("No userInfo found in SelfSubjectReview response")
+
+                username = user_info.get("username")
+                if not username:
+                    raise ValueError("No username found in SelfSubjectReview response")
+
+                # Build user attributes from Kubernetes user info
+                user_attributes = get_attributes_from_claims(user_info, self.config.claims_mapping)
+
+                return User(
+                    principal=username,
+                    attributes=user_attributes,
+                )
+
+        except httpx.TimeoutException:
+            logger.warning("Kubernetes SelfSubjectReview API request timed out")
+            raise ValueError("Token validation timeout") from None
+        except Exception as e:
+            logger.warning(f"Error during token validation: {str(e)}")
+            raise ValueError(f"Token validation error: {str(e)}") from e
+
+    async def close(self):
+        """Close any resources."""
+        pass
+
+
 def create_auth_provider(config: AuthenticationConfig) -> AuthProvider:
     """Factory function to create the appropriate auth provider."""
     provider_config = config.provider_config
@@ -384,5 +469,7 @@ def create_auth_provider(config: AuthenticationConfig) -> AuthProvider:
         return OAuth2TokenAuthProvider(provider_config)
     elif isinstance(provider_config, GitHubTokenAuthConfig):
         return GitHubTokenAuthProvider(provider_config)
+    elif isinstance(provider_config, KubernetesAuthProviderConfig):
+        return KubernetesAuthProvider(provider_config)
     else:
         raise ValueError(f"Unknown authentication provider config type: {type(provider_config)}")
diff --git a/tests/unit/server/test_auth.py b/tests/unit/server/test_auth.py
index 37b543976..205e0ce65 100644
--- a/tests/unit/server/test_auth.py
+++ b/tests/unit/server/test_auth.py
@@ -774,3 +774,136 @@ def test_has_required_scope_function():
 
     # Test no user (auth disabled)
     assert _has_required_scope("test.read", None)
+
+
+@pytest.fixture
+def mock_kubernetes_api_server():
+    return "https://api.cluster.example.com:6443"
+
+
+@pytest.fixture
+def kubernetes_auth_app(mock_kubernetes_api_server):
+    app = FastAPI()
+    auth_config = AuthenticationConfig(
+        provider_config={
+            "type": "kubernetes",
+            "api_server_url": mock_kubernetes_api_server,
+            "verify_tls": False,
+            "claims_mapping": {
+                "username": "roles",
+                "groups": "roles",
+                "uid": "uid_attr",
+            },
+        },
+    )
+    app.add_middleware(AuthenticationMiddleware, auth_config=auth_config, impls={})
+
+    @app.get("/test")
+    def test_endpoint():
+        return {"message": "Authentication successful"}
+
+    return app
+
+
+@pytest.fixture
+def kubernetes_auth_client(kubernetes_auth_app):
+    return TestClient(kubernetes_auth_app)
+
+
+def test_missing_auth_header_kubernetes_auth(kubernetes_auth_client):
+    response = kubernetes_auth_client.get("/test")
+    assert response.status_code == 401
+    assert "Authentication required" in response.json()["error"]["message"]
+
+
+def test_invalid_auth_header_format_kubernetes_auth(kubernetes_auth_client):
+    response = kubernetes_auth_client.get("/test", headers={"Authorization": "InvalidFormat token123"})
+    assert response.status_code == 401
+    assert "Invalid Authorization header format" in response.json()["error"]["message"]
+
+
+async def mock_kubernetes_selfsubjectreview_success(*args, **kwargs):
+    return MockResponse(
+        201,
+        {
+            "apiVersion": "authentication.k8s.io/v1",
+            "kind": "SelfSubjectReview",
+            "metadata": {"creationTimestamp": "2025-07-15T13:53:56Z"},
+            "status": {
+                "userInfo": {
+                    "username": "alice",
+                    "uid": "alice-uid-123",
+                    "groups": ["system:authenticated", "developers", "admins"],
+                    "extra": {"scopes.authorization.openshift.io": ["user:full"]},
+                }
+            },
+        },
+    )
+
+
+async def mock_kubernetes_selfsubjectreview_failure(*args, **kwargs):
+    return MockResponse(401, {"message": "Unauthorized"})
+
+
+async def mock_kubernetes_selfsubjectreview_http_error(*args, **kwargs):
+    return MockResponse(500, {"message": "Internal Server Error"})
+
+
+@patch("httpx.AsyncClient.post", new=mock_kubernetes_selfsubjectreview_success)
+def test_valid_kubernetes_auth_authentication(kubernetes_auth_client, valid_token):
+    response = kubernetes_auth_client.get("/test", headers={"Authorization": f"Bearer {valid_token}"})
+    assert response.status_code == 200
+    assert response.json() == {"message": "Authentication successful"}
+
+
+@patch("httpx.AsyncClient.post", new=mock_kubernetes_selfsubjectreview_failure)
+def test_invalid_kubernetes_auth_authentication(kubernetes_auth_client, invalid_token):
+    response = kubernetes_auth_client.get("/test", headers={"Authorization": f"Bearer {invalid_token}"})
+    assert response.status_code == 401
+    assert "Invalid token" in response.json()["error"]["message"]
+
+
+@patch("httpx.AsyncClient.post", new=mock_kubernetes_selfsubjectreview_http_error)
+def test_kubernetes_auth_http_error(kubernetes_auth_client, valid_token):
+    response = kubernetes_auth_client.get("/test", headers={"Authorization": f"Bearer {valid_token}"})
+    assert response.status_code == 401
+    assert "Token validation failed" in response.json()["error"]["message"]
+
+
+def test_kubernetes_auth_request_payload(kubernetes_auth_client, valid_token, mock_kubernetes_api_server):
+    with patch("httpx.AsyncClient.post") as mock_post:
+        mock_response = MockResponse(
+            200,
+            {
+                "apiVersion": "authentication.k8s.io/v1",
+                "kind": "SelfSubjectReview",
+                "metadata": {"creationTimestamp": "2025-07-15T13:53:56Z"},
+                "status": {
+                    "userInfo": {
+                        "username": "test-user",
+                        "uid": "test-uid",
+                        "groups": ["test-group"],
+                    }
+                },
+            },
+        )
+        mock_post.return_value = mock_response
+
+        kubernetes_auth_client.get("/test", headers={"Authorization": f"Bearer {valid_token}"})
+
+        # Verify the request was made with correct parameters
+        mock_post.assert_called_once()
+        call_args = mock_post.call_args
+
+        # Check URL (passed as positional argument)
+        assert call_args[0][0] == f"{mock_kubernetes_api_server}/apis/authentication.k8s.io/v1/selfsubjectreviews"
+
+        # Check headers (passed as keyword argument)
+        headers = call_args[1]["headers"]
+        assert headers["Authorization"] == f"Bearer {valid_token}"
+        assert headers["Content-Type"] == "application/json"
+
+        # Check request body (passed as keyword argument)
+        request_body = call_args[1]["json"]
+        assert request_body["apiVersion"] == "authentication.k8s.io/v1"
+        assert request_body["kind"] == "SelfSubjectReview"

From 9618adba8990f1404f1c4de48c3ff03780622f76 Mon Sep 17 00:00:00 2001
From: Mohammad Daoud Farooqi <mohammaddaoud.farooqi@gmail.com>
Date: Mon, 8 Sep 2025 17:39:13 +0530
Subject: [PATCH 41/76] docs: add MongoDB to external provider list (#3369)

The MongoDB integration - Vector search, Full-Text search and Hybrid
search have now been added as an external provider offering for Llama
Stack: https://github.com/mongodb-partners/mongodb-llama-stack
---
 docs/source/providers/external/external-providers-list.md | 3 ++-
 1 file changed, 2 insertions(+), 1 deletion(-)

diff --git a/docs/source/providers/external/external-providers-list.md b/docs/source/providers/external/external-providers-list.md
index 49f49076b..45fcc50fb 100644
--- a/docs/source/providers/external/external-providers-list.md
+++ b/docs/source/providers/external/external-providers-list.md
@@ -7,4 +7,5 @@ Here's a list of known external providers that you can use with Llama Stack:
 | KubeFlow Training | Train models with KubeFlow | Post Training | Remote | [llama-stack-provider-kft](https://github.com/opendatahub-io/llama-stack-provider-kft) |
 | KubeFlow Pipelines | Train models with KubeFlow Pipelines | Post Training | Inline **and** Remote | [llama-stack-provider-kfp-trainer](https://github.com/opendatahub-io/llama-stack-provider-kfp-trainer) |
 | RamaLama | Inference models with RamaLama | Inference | Remote | [ramalama-stack](https://github.com/containers/ramalama-stack) |
-| TrustyAI LM-Eval | Evaluate models with TrustyAI LM-Eval | Eval | Remote | [llama-stack-provider-lmeval](https://github.com/trustyai-explainability/llama-stack-provider-lmeval) |
\ No newline at end of file
+| TrustyAI LM-Eval | Evaluate models with TrustyAI LM-Eval | Eval | Remote | [llama-stack-provider-lmeval](https://github.com/trustyai-explainability/llama-stack-provider-lmeval) |
+| MongoDB | VectorIO with MongoDB | Vector_IO | Remote | [mongodb-llama-stack](https://github.com/mongodb-partners/mongodb-llama-stack) |

From ad6ea7fb91f79023f821462286e69da2642e297c Mon Sep 17 00:00:00 2001
From: Francisco Arceo <arceofrancisco@gmail.com>
Date: Mon, 8 Sep 2025 09:05:13 -0600
Subject: [PATCH 42/76] feat: Adding OpenAI Prompts API (#3319)

# What does this PR do?
This PR adds support for OpenAI Prompts API.

Note, OpenAI does not explicitly expose the Prompts API but instead
makes it available in the Responses API and in the [Prompts
Dashboard](https://platform.openai.com/docs/guides/prompting#create-a-prompt).

I have added the following APIs:
- CREATE
- GET
- LIST
- UPDATE
- Set Default Version

The Set Default Version API is made available only in the Prompts
Dashboard and configures which prompt version is returned in the GET
(the latest version is the default).

Overall, the expected functionality in Responses will look like this:

```python
from openai import OpenAI
client = OpenAI()

response = client.responses.create(
  prompt={
    "id": "pmpt_68b0c29740048196bd3a6e6ac3c4d0e20ed9a13f0d15bf5e",
    "version": "2",
    "variables": {
        "city": "San Francisco",
        "age": 30,
    }
  }
)
```

### Resolves https://github.com/llamastack/llama-stack/issues/3276


## Test Plan
Unit tests added. Integration tests can be added after client
generation.

## Next Steps
1. Update Responses API to support Prompt API
2. I'll enhance the UI to implement the Prompt Dashboard.
3. Add cache for lower latency

---------

Signed-off-by: Francisco Javier Arceo <farceo@redhat.com>
---
 docs/_static/llama-stack-spec.html         | 457 ++++++++++++++++++++-
 docs/_static/llama-stack-spec.yaml         | 332 +++++++++++++++
 llama_stack/apis/datatypes.py              |   2 +
 llama_stack/apis/prompts/__init__.py       |   9 +
 llama_stack/apis/prompts/prompts.py        | 189 +++++++++
 llama_stack/apis/resource.py               |   1 +
 llama_stack/core/prompts/__init__.py       |   5 +
 llama_stack/core/prompts/prompts.py        | 233 +++++++++++
 llama_stack/core/resolver.py               |   2 +
 llama_stack/core/server/server.py          |   1 +
 llama_stack/core/stack.py                  |  12 +
 tests/unit/prompts/prompts/__init__.py     |   5 +
 tests/unit/prompts/prompts/conftest.py     |  30 ++
 tests/unit/prompts/prompts/test_prompts.py | 144 +++++++
 14 files changed, 1414 insertions(+), 8 deletions(-)
 create mode 100644 llama_stack/apis/prompts/__init__.py
 create mode 100644 llama_stack/apis/prompts/prompts.py
 create mode 100644 llama_stack/core/prompts/__init__.py
 create mode 100644 llama_stack/core/prompts/prompts.py
 create mode 100644 tests/unit/prompts/prompts/__init__.py
 create mode 100644 tests/unit/prompts/prompts/conftest.py
 create mode 100644 tests/unit/prompts/prompts/test_prompts.py

diff --git a/docs/_static/llama-stack-spec.html b/docs/_static/llama-stack-spec.html
index 7cb2a73f3..a036e5dc0 100644
--- a/docs/_static/llama-stack-spec.html
+++ b/docs/_static/llama-stack-spec.html
@@ -633,6 +633,80 @@
                 }
             }
         },
+        "/v1/prompts": {
+            "get": {
+                "responses": {
+                    "200": {
+                        "description": "A ListPromptsResponse containing all prompts.",
+                        "content": {
+                            "application/json": {
+                                "schema": {
+                                    "$ref": "#/components/schemas/ListPromptsResponse"
+                                }
+                            }
+                        }
+                    },
+                    "400": {
+                        "$ref": "#/components/responses/BadRequest400"
+                    },
+                    "429": {
+                        "$ref": "#/components/responses/TooManyRequests429"
+                    },
+                    "500": {
+                        "$ref": "#/components/responses/InternalServerError500"
+                    },
+                    "default": {
+                        "$ref": "#/components/responses/DefaultError"
+                    }
+                },
+                "tags": [
+                    "Prompts"
+                ],
+                "description": "List all prompts.",
+                "parameters": []
+            },
+            "post": {
+                "responses": {
+                    "200": {
+                        "description": "The created Prompt resource.",
+                        "content": {
+                            "application/json": {
+                                "schema": {
+                                    "$ref": "#/components/schemas/Prompt"
+                                }
+                            }
+                        }
+                    },
+                    "400": {
+                        "$ref": "#/components/responses/BadRequest400"
+                    },
+                    "429": {
+                        "$ref": "#/components/responses/TooManyRequests429"
+                    },
+                    "500": {
+                        "$ref": "#/components/responses/InternalServerError500"
+                    },
+                    "default": {
+                        "$ref": "#/components/responses/DefaultError"
+                    }
+                },
+                "tags": [
+                    "Prompts"
+                ],
+                "description": "Create a new prompt.",
+                "parameters": [],
+                "requestBody": {
+                    "content": {
+                        "application/json": {
+                            "schema": {
+                                "$ref": "#/components/schemas/CreatePromptRequest"
+                            }
+                        }
+                    },
+                    "required": true
+                }
+            }
+        },
         "/v1/agents/{agent_id}": {
             "get": {
                 "responses": {
@@ -901,6 +975,143 @@
                 ]
             }
         },
+        "/v1/prompts/{prompt_id}": {
+            "get": {
+                "responses": {
+                    "200": {
+                        "description": "A Prompt resource.",
+                        "content": {
+                            "application/json": {
+                                "schema": {
+                                    "$ref": "#/components/schemas/Prompt"
+                                }
+                            }
+                        }
+                    },
+                    "400": {
+                        "$ref": "#/components/responses/BadRequest400"
+                    },
+                    "429": {
+                        "$ref": "#/components/responses/TooManyRequests429"
+                    },
+                    "500": {
+                        "$ref": "#/components/responses/InternalServerError500"
+                    },
+                    "default": {
+                        "$ref": "#/components/responses/DefaultError"
+                    }
+                },
+                "tags": [
+                    "Prompts"
+                ],
+                "description": "Get a prompt by its identifier and optional version.",
+                "parameters": [
+                    {
+                        "name": "prompt_id",
+                        "in": "path",
+                        "description": "The identifier of the prompt to get.",
+                        "required": true,
+                        "schema": {
+                            "type": "string"
+                        }
+                    },
+                    {
+                        "name": "version",
+                        "in": "query",
+                        "description": "The version of the prompt to get (defaults to latest).",
+                        "required": false,
+                        "schema": {
+                            "type": "integer"
+                        }
+                    }
+                ]
+            },
+            "post": {
+                "responses": {
+                    "200": {
+                        "description": "The updated Prompt resource with incremented version.",
+                        "content": {
+                            "application/json": {
+                                "schema": {
+                                    "$ref": "#/components/schemas/Prompt"
+                                }
+                            }
+                        }
+                    },
+                    "400": {
+                        "$ref": "#/components/responses/BadRequest400"
+                    },
+                    "429": {
+                        "$ref": "#/components/responses/TooManyRequests429"
+                    },
+                    "500": {
+                        "$ref": "#/components/responses/InternalServerError500"
+                    },
+                    "default": {
+                        "$ref": "#/components/responses/DefaultError"
+                    }
+                },
+                "tags": [
+                    "Prompts"
+                ],
+                "description": "Update an existing prompt (increments version).",
+                "parameters": [
+                    {
+                        "name": "prompt_id",
+                        "in": "path",
+                        "description": "The identifier of the prompt to update.",
+                        "required": true,
+                        "schema": {
+                            "type": "string"
+                        }
+                    }
+                ],
+                "requestBody": {
+                    "content": {
+                        "application/json": {
+                            "schema": {
+                                "$ref": "#/components/schemas/UpdatePromptRequest"
+                            }
+                        }
+                    },
+                    "required": true
+                }
+            },
+            "delete": {
+                "responses": {
+                    "200": {
+                        "description": "OK"
+                    },
+                    "400": {
+                        "$ref": "#/components/responses/BadRequest400"
+                    },
+                    "429": {
+                        "$ref": "#/components/responses/TooManyRequests429"
+                    },
+                    "500": {
+                        "$ref": "#/components/responses/InternalServerError500"
+                    },
+                    "default": {
+                        "$ref": "#/components/responses/DefaultError"
+                    }
+                },
+                "tags": [
+                    "Prompts"
+                ],
+                "description": "Delete a prompt.",
+                "parameters": [
+                    {
+                        "name": "prompt_id",
+                        "in": "path",
+                        "description": "The identifier of the prompt to delete.",
+                        "required": true,
+                        "schema": {
+                            "type": "string"
+                        }
+                    }
+                ]
+            }
+        },
         "/v1/inference/embeddings": {
             "post": {
                 "responses": {
@@ -2836,6 +3047,49 @@
                 ]
             }
         },
+        "/v1/prompts/{prompt_id}/versions": {
+            "get": {
+                "responses": {
+                    "200": {
+                        "description": "A ListPromptsResponse containing all versions of the prompt.",
+                        "content": {
+                            "application/json": {
+                                "schema": {
+                                    "$ref": "#/components/schemas/ListPromptsResponse"
+                                }
+                            }
+                        }
+                    },
+                    "400": {
+                        "$ref": "#/components/responses/BadRequest400"
+                    },
+                    "429": {
+                        "$ref": "#/components/responses/TooManyRequests429"
+                    },
+                    "500": {
+                        "$ref": "#/components/responses/InternalServerError500"
+                    },
+                    "default": {
+                        "$ref": "#/components/responses/DefaultError"
+                    }
+                },
+                "tags": [
+                    "Prompts"
+                ],
+                "description": "List all versions of a specific prompt.",
+                "parameters": [
+                    {
+                        "name": "prompt_id",
+                        "in": "path",
+                        "description": "The identifier of the prompt to list versions for.",
+                        "required": true,
+                        "schema": {
+                            "type": "string"
+                        }
+                    }
+                ]
+            }
+        },
         "/v1/providers": {
             "get": {
                 "responses": {
@@ -5007,6 +5261,59 @@
                 }
             }
         },
+        "/v1/prompts/{prompt_id}/set-default-version": {
+            "post": {
+                "responses": {
+                    "200": {
+                        "description": "The prompt with the specified version now set as default.",
+                        "content": {
+                            "application/json": {
+                                "schema": {
+                                    "$ref": "#/components/schemas/Prompt"
+                                }
+                            }
+                        }
+                    },
+                    "400": {
+                        "$ref": "#/components/responses/BadRequest400"
+                    },
+                    "429": {
+                        "$ref": "#/components/responses/TooManyRequests429"
+                    },
+                    "500": {
+                        "$ref": "#/components/responses/InternalServerError500"
+                    },
+                    "default": {
+                        "$ref": "#/components/responses/DefaultError"
+                    }
+                },
+                "tags": [
+                    "Prompts"
+                ],
+                "description": "Set which version of a prompt should be the default in get_prompt (latest).",
+                "parameters": [
+                    {
+                        "name": "prompt_id",
+                        "in": "path",
+                        "description": "The identifier of the prompt.",
+                        "required": true,
+                        "schema": {
+                            "type": "string"
+                        }
+                    }
+                ],
+                "requestBody": {
+                    "content": {
+                        "application/json": {
+                            "schema": {
+                                "$ref": "#/components/schemas/SetDefaultVersionRequest"
+                            }
+                        }
+                    },
+                    "required": true
+                }
+            }
+        },
         "/v1/post-training/supervised-fine-tune": {
             "post": {
                 "responses": {
@@ -9670,6 +9977,65 @@
                 ],
                 "title": "OpenAIResponseObjectStreamResponseWebSearchCallSearching"
             },
+            "CreatePromptRequest": {
+                "type": "object",
+                "properties": {
+                    "prompt": {
+                        "type": "string",
+                        "description": "The prompt text content with variable placeholders."
+                    },
+                    "variables": {
+                        "type": "array",
+                        "items": {
+                            "type": "string"
+                        },
+                        "description": "List of variable names that can be used in the prompt template."
+                    }
+                },
+                "additionalProperties": false,
+                "required": [
+                    "prompt"
+                ],
+                "title": "CreatePromptRequest"
+            },
+            "Prompt": {
+                "type": "object",
+                "properties": {
+                    "prompt": {
+                        "type": "string",
+                        "description": "The system prompt text with variable placeholders. Variables are only supported when using the Responses API."
+                    },
+                    "version": {
+                        "type": "integer",
+                        "description": "Version (integer starting at 1, incremented on save)"
+                    },
+                    "prompt_id": {
+                        "type": "string",
+                        "description": "Unique identifier formatted as 'pmpt_<48-digit-hash>'"
+                    },
+                    "variables": {
+                        "type": "array",
+                        "items": {
+                            "type": "string"
+                        },
+                        "description": "List of prompt variable names that can be used in the prompt template"
+                    },
+                    "is_default": {
+                        "type": "boolean",
+                        "default": false,
+                        "description": "Boolean indicating whether this version is the default version for this prompt"
+                    }
+                },
+                "additionalProperties": false,
+                "required": [
+                    "version",
+                    "prompt_id",
+                    "variables",
+                    "is_default"
+                ],
+                "title": "Prompt",
+                "description": "A prompt resource representing a stored OpenAI Compatible prompt template in Llama Stack."
+            },
             "OpenAIDeleteResponseObject": {
                 "type": "object",
                 "properties": {
@@ -10296,7 +10662,8 @@
                             "scoring_function",
                             "benchmark",
                             "tool",
-                            "tool_group"
+                            "tool_group",
+                            "prompt"
                         ],
                         "const": "benchmark",
                         "default": "benchmark",
@@ -10923,7 +11290,8 @@
                             "scoring_function",
                             "benchmark",
                             "tool",
-                            "tool_group"
+                            "tool_group",
+                            "prompt"
                         ],
                         "const": "dataset",
                         "default": "dataset",
@@ -11073,7 +11441,8 @@
                             "scoring_function",
                             "benchmark",
                             "tool",
-                            "tool_group"
+                            "tool_group",
+                            "prompt"
                         ],
                         "const": "model",
                         "default": "model",
@@ -11338,7 +11707,8 @@
                             "scoring_function",
                             "benchmark",
                             "tool",
-                            "tool_group"
+                            "tool_group",
+                            "prompt"
                         ],
                         "const": "scoring_function",
                         "default": "scoring_function",
@@ -11446,7 +11816,8 @@
                             "scoring_function",
                             "benchmark",
                             "tool",
-                            "tool_group"
+                            "tool_group",
+                            "prompt"
                         ],
                         "const": "shield",
                         "default": "shield",
@@ -11691,7 +12062,8 @@
                             "scoring_function",
                             "benchmark",
                             "tool",
-                            "tool_group"
+                            "tool_group",
+                            "prompt"
                         ],
                         "const": "tool",
                         "default": "tool",
@@ -11773,7 +12145,8 @@
                             "scoring_function",
                             "benchmark",
                             "tool",
-                            "tool_group"
+                            "tool_group",
+                            "prompt"
                         ],
                         "const": "tool_group",
                         "default": "tool_group",
@@ -12067,7 +12440,8 @@
                             "scoring_function",
                             "benchmark",
                             "tool",
-                            "tool_group"
+                            "tool_group",
+                            "prompt"
                         ],
                         "const": "vector_db",
                         "default": "vector_db",
@@ -12882,6 +13256,23 @@
                 "title": "OpenAIResponseObjectWithInput",
                 "description": "OpenAI response object extended with input context information."
             },
+            "ListPromptsResponse": {
+                "type": "object",
+                "properties": {
+                    "data": {
+                        "type": "array",
+                        "items": {
+                            "$ref": "#/components/schemas/Prompt"
+                        }
+                    }
+                },
+                "additionalProperties": false,
+                "required": [
+                    "data"
+                ],
+                "title": "ListPromptsResponse",
+                "description": "Response model to list prompts."
+            },
             "ListProvidersResponse": {
                 "type": "object",
                 "properties": {
@@ -17128,6 +17519,20 @@
                 "title": "ScoreBatchResponse",
                 "description": "Response from batch scoring operations on datasets."
             },
+            "SetDefaultVersionRequest": {
+                "type": "object",
+                "properties": {
+                    "version": {
+                        "type": "integer",
+                        "description": "The version to set as default."
+                    }
+                },
+                "additionalProperties": false,
+                "required": [
+                    "version"
+                ],
+                "title": "SetDefaultVersionRequest"
+            },
             "AlgorithmConfig": {
                 "oneOf": [
                     {
@@ -17412,6 +17817,37 @@
                 "title": "SyntheticDataGenerationResponse",
                 "description": "Response from the synthetic data generation. Batch of (prompt, response, score) tuples that pass the threshold."
             },
+            "UpdatePromptRequest": {
+                "type": "object",
+                "properties": {
+                    "prompt": {
+                        "type": "string",
+                        "description": "The updated prompt text content."
+                    },
+                    "version": {
+                        "type": "integer",
+                        "description": "The current version of the prompt being updated."
+                    },
+                    "variables": {
+                        "type": "array",
+                        "items": {
+                            "type": "string"
+                        },
+                        "description": "Updated list of variable names that can be used in the prompt template."
+                    },
+                    "set_as_default": {
+                        "type": "boolean",
+                        "description": "Set the new version as the default (default=True)."
+                    }
+                },
+                "additionalProperties": false,
+                "required": [
+                    "prompt",
+                    "version",
+                    "set_as_default"
+                ],
+                "title": "UpdatePromptRequest"
+            },
             "VersionInfo": {
                 "type": "object",
                 "properties": {
@@ -17537,6 +17973,10 @@
         {
             "name": "PostTraining (Coming Soon)"
         },
+        {
+            "name": "Prompts",
+            "x-displayName": "Protocol for prompt management operations."
+        },
         {
             "name": "Providers",
             "x-displayName": "Providers API for inspecting, listing, and modifying providers and their configurations."
@@ -17587,6 +18027,7 @@
                 "Inspect",
                 "Models",
                 "PostTraining (Coming Soon)",
+                "Prompts",
                 "Providers",
                 "Safety",
                 "Scoring",
diff --git a/docs/_static/llama-stack-spec.yaml b/docs/_static/llama-stack-spec.yaml
index 25089868c..8ed04c1f8 100644
--- a/docs/_static/llama-stack-spec.yaml
+++ b/docs/_static/llama-stack-spec.yaml
@@ -427,6 +427,58 @@ paths:
             schema:
               $ref: '#/components/schemas/CreateOpenaiResponseRequest'
         required: true
+  /v1/prompts:
+    get:
+      responses:
+        '200':
+          description: >-
+            A ListPromptsResponse containing all prompts.
+          content:
+            application/json:
+              schema:
+                $ref: '#/components/schemas/ListPromptsResponse'
+        '400':
+          $ref: '#/components/responses/BadRequest400'
+        '429':
+          $ref: >-
+            #/components/responses/TooManyRequests429
+        '500':
+          $ref: >-
+            #/components/responses/InternalServerError500
+        default:
+          $ref: '#/components/responses/DefaultError'
+      tags:
+        - Prompts
+      description: List all prompts.
+      parameters: []
+    post:
+      responses:
+        '200':
+          description: The created Prompt resource.
+          content:
+            application/json:
+              schema:
+                $ref: '#/components/schemas/Prompt'
+        '400':
+          $ref: '#/components/responses/BadRequest400'
+        '429':
+          $ref: >-
+            #/components/responses/TooManyRequests429
+        '500':
+          $ref: >-
+            #/components/responses/InternalServerError500
+        default:
+          $ref: '#/components/responses/DefaultError'
+      tags:
+        - Prompts
+      description: Create a new prompt.
+      parameters: []
+      requestBody:
+        content:
+          application/json:
+            schema:
+              $ref: '#/components/schemas/CreatePromptRequest'
+        required: true
   /v1/agents/{agent_id}:
     get:
       responses:
@@ -616,6 +668,103 @@ paths:
           required: true
           schema:
             type: string
+  /v1/prompts/{prompt_id}:
+    get:
+      responses:
+        '200':
+          description: A Prompt resource.
+          content:
+            application/json:
+              schema:
+                $ref: '#/components/schemas/Prompt'
+        '400':
+          $ref: '#/components/responses/BadRequest400'
+        '429':
+          $ref: >-
+            #/components/responses/TooManyRequests429
+        '500':
+          $ref: >-
+            #/components/responses/InternalServerError500
+        default:
+          $ref: '#/components/responses/DefaultError'
+      tags:
+        - Prompts
+      description: >-
+        Get a prompt by its identifier and optional version.
+      parameters:
+        - name: prompt_id
+          in: path
+          description: The identifier of the prompt to get.
+          required: true
+          schema:
+            type: string
+        - name: version
+          in: query
+          description: >-
+            The version of the prompt to get (defaults to latest).
+          required: false
+          schema:
+            type: integer
+    post:
+      responses:
+        '200':
+          description: >-
+            The updated Prompt resource with incremented version.
+          content:
+            application/json:
+              schema:
+                $ref: '#/components/schemas/Prompt'
+        '400':
+          $ref: '#/components/responses/BadRequest400'
+        '429':
+          $ref: >-
+            #/components/responses/TooManyRequests429
+        '500':
+          $ref: >-
+            #/components/responses/InternalServerError500
+        default:
+          $ref: '#/components/responses/DefaultError'
+      tags:
+        - Prompts
+      description: >-
+        Update an existing prompt (increments version).
+      parameters:
+        - name: prompt_id
+          in: path
+          description: The identifier of the prompt to update.
+          required: true
+          schema:
+            type: string
+      requestBody:
+        content:
+          application/json:
+            schema:
+              $ref: '#/components/schemas/UpdatePromptRequest'
+        required: true
+    delete:
+      responses:
+        '200':
+          description: OK
+        '400':
+          $ref: '#/components/responses/BadRequest400'
+        '429':
+          $ref: >-
+            #/components/responses/TooManyRequests429
+        '500':
+          $ref: >-
+            #/components/responses/InternalServerError500
+        default:
+          $ref: '#/components/responses/DefaultError'
+      tags:
+        - Prompts
+      description: Delete a prompt.
+      parameters:
+        - name: prompt_id
+          in: path
+          description: The identifier of the prompt to delete.
+          required: true
+          schema:
+            type: string
   /v1/inference/embeddings:
     post:
       responses:
@@ -1983,6 +2132,37 @@ paths:
           required: false
           schema:
             $ref: '#/components/schemas/Order'
+  /v1/prompts/{prompt_id}/versions:
+    get:
+      responses:
+        '200':
+          description: >-
+            A ListPromptsResponse containing all versions of the prompt.
+          content:
+            application/json:
+              schema:
+                $ref: '#/components/schemas/ListPromptsResponse'
+        '400':
+          $ref: '#/components/responses/BadRequest400'
+        '429':
+          $ref: >-
+            #/components/responses/TooManyRequests429
+        '500':
+          $ref: >-
+            #/components/responses/InternalServerError500
+        default:
+          $ref: '#/components/responses/DefaultError'
+      tags:
+        - Prompts
+      description: List all versions of a specific prompt.
+      parameters:
+        - name: prompt_id
+          in: path
+          description: >-
+            The identifier of the prompt to list versions for.
+          required: true
+          schema:
+            type: string
   /v1/providers:
     get:
       responses:
@@ -3546,6 +3726,43 @@ paths:
             schema:
               $ref: '#/components/schemas/ScoreBatchRequest'
         required: true
+  /v1/prompts/{prompt_id}/set-default-version:
+    post:
+      responses:
+        '200':
+          description: >-
+            The prompt with the specified version now set as default.
+          content:
+            application/json:
+              schema:
+                $ref: '#/components/schemas/Prompt'
+        '400':
+          $ref: '#/components/responses/BadRequest400'
+        '429':
+          $ref: >-
+            #/components/responses/TooManyRequests429
+        '500':
+          $ref: >-
+            #/components/responses/InternalServerError500
+        default:
+          $ref: '#/components/responses/DefaultError'
+      tags:
+        - Prompts
+      description: >-
+        Set which version of a prompt should be the default in get_prompt (latest).
+      parameters:
+        - name: prompt_id
+          in: path
+          description: The identifier of the prompt.
+          required: true
+          schema:
+            type: string
+      requestBody:
+        content:
+          application/json:
+            schema:
+              $ref: '#/components/schemas/SetDefaultVersionRequest'
+        required: true
   /v1/post-training/supervised-fine-tune:
     post:
       responses:
@@ -7148,6 +7365,61 @@ components:
         - type
       title: >-
         OpenAIResponseObjectStreamResponseWebSearchCallSearching
+    CreatePromptRequest:
+      type: object
+      properties:
+        prompt:
+          type: string
+          description: >-
+            The prompt text content with variable placeholders.
+        variables:
+          type: array
+          items:
+            type: string
+          description: >-
+            List of variable names that can be used in the prompt template.
+      additionalProperties: false
+      required:
+        - prompt
+      title: CreatePromptRequest
+    Prompt:
+      type: object
+      properties:
+        prompt:
+          type: string
+          description: >-
+            The system prompt text with variable placeholders. Variables are only
+            supported when using the Responses API.
+        version:
+          type: integer
+          description: >-
+            Version (integer starting at 1, incremented on save)
+        prompt_id:
+          type: string
+          description: >-
+            Unique identifier formatted as 'pmpt_<48-digit-hash>'
+        variables:
+          type: array
+          items:
+            type: string
+          description: >-
+            List of prompt variable names that can be used in the prompt template
+        is_default:
+          type: boolean
+          default: false
+          description: >-
+            Boolean indicating whether this version is the default version for this
+            prompt
+      additionalProperties: false
+      required:
+        - version
+        - prompt_id
+        - variables
+        - is_default
+      title: Prompt
+      description: >-
+        A prompt resource representing a stored OpenAI Compatible prompt template
+        in Llama Stack.
     OpenAIDeleteResponseObject:
       type: object
       properties:
@@ -7621,6 +7893,7 @@ components:
             - benchmark
             - tool
             - tool_group
+            - prompt
           const: benchmark
           default: benchmark
           description: The resource type, always benchmark
@@ -8107,6 +8380,7 @@ components:
             - benchmark
             - tool
             - tool_group
+            - prompt
           const: dataset
           default: dataset
           description: >-
@@ -8219,6 +8493,7 @@ components:
             - benchmark
             - tool
             - tool_group
+            - prompt
           const: model
           default: model
           description: >-
@@ -8410,6 +8685,7 @@ components:
             - benchmark
             - tool
             - tool_group
+            - prompt
           const: scoring_function
           default: scoring_function
           description: >-
@@ -8486,6 +8762,7 @@ components:
             - benchmark
             - tool
             - tool_group
+            - prompt
           const: shield
           default: shield
           description: The resource type, always shield
@@ -8665,6 +8942,7 @@ components:
             - benchmark
             - tool
             - tool_group
+            - prompt
           const: tool
           default: tool
           description: Type of resource, always 'tool'
@@ -8723,6 +9001,7 @@ components:
             - benchmark
             - tool
             - tool_group
+            - prompt
           const: tool_group
           default: tool_group
           description: Type of resource, always 'tool_group'
@@ -8951,6 +9230,7 @@ components:
             - benchmark
             - tool
             - tool_group
+            - prompt
           const: vector_db
           default: vector_db
           description: >-
@@ -9577,6 +9857,18 @@ components:
       title: OpenAIResponseObjectWithInput
       description: >-
         OpenAI response object extended with input context information.
+    ListPromptsResponse:
+      type: object
+      properties:
+        data:
+          type: array
+          items:
+            $ref: '#/components/schemas/Prompt'
+      additionalProperties: false
+      required:
+        - data
+      title: ListPromptsResponse
+      description: Response model to list prompts.
     ListProvidersResponse:
       type: object
       properties:
@@ -12722,6 +13014,16 @@ components:
       title: ScoreBatchResponse
       description: >-
         Response from batch scoring operations on datasets.
+    SetDefaultVersionRequest:
+      type: object
+      properties:
+        version:
+          type: integer
+          description: The version to set as default.
+      additionalProperties: false
+      required:
+        - version
+      title: SetDefaultVersionRequest
     AlgorithmConfig:
       oneOf:
         - $ref: '#/components/schemas/LoraFinetuningConfig'
@@ -12918,6 +13220,32 @@ components:
       description: >-
         Response from the synthetic data generation. Batch of (prompt, response, score)
         tuples that pass the threshold.
+    UpdatePromptRequest:
+      type: object
+      properties:
+        prompt:
+          type: string
+          description: The updated prompt text content.
+        version:
+          type: integer
+          description: >-
+            The current version of the prompt being updated.
+        variables:
+          type: array
+          items:
+            type: string
+          description: >-
+            Updated list of variable names that can be used in the prompt template.
+        set_as_default:
+          type: boolean
+          description: >-
+            Set the new version as the default (default=True).
+      additionalProperties: false
+      required:
+        - prompt
+        - version
+        - set_as_default
+      title: UpdatePromptRequest
     VersionInfo:
       type: object
       properties:
@@ -13029,6 +13357,9 @@ tags:
   - name: Inspect
   - name: Models
   - name: PostTraining (Coming Soon)
+  - name: Prompts
+    x-displayName: >-
+      Protocol for prompt management operations.
   - name: Providers
     x-displayName: >-
       Providers API for inspecting, listing, and modifying providers and their configurations.
@@ -13056,6 +13387,7 @@ x-tagGroups:
       - Inspect
       - Models
       - PostTraining (Coming Soon)
+      - Prompts
       - Providers
       - Safety
       - Scoring
diff --git a/llama_stack/apis/datatypes.py b/llama_stack/apis/datatypes.py
index 87fc95917..8d0f2e26d 100644
--- a/llama_stack/apis/datatypes.py
+++ b/llama_stack/apis/datatypes.py
@@ -102,6 +102,7 @@ class Api(Enum, metaclass=DynamicApiMeta):
     :cvar benchmarks: Benchmark suite management
     :cvar tool_groups: Tool group organization
     :cvar files: File storage and management
+    :cvar prompts: Prompt versions and management
     :cvar inspect: Built-in system inspection and introspection
     """
 
@@ -127,6 +128,7 @@ class Api(Enum, metaclass=DynamicApiMeta):
     benchmarks = "benchmarks"
     tool_groups = "tool_groups"
     files = "files"
+    prompts = "prompts"
 
     # built-in API
     inspect = "inspect"
diff --git a/llama_stack/apis/prompts/__init__.py b/llama_stack/apis/prompts/__init__.py
new file mode 100644
index 000000000..6070f3450
--- /dev/null
+++ b/llama_stack/apis/prompts/__init__.py
@@ -0,0 +1,9 @@
+# Copyright (c) Meta Platforms, Inc. and affiliates.
+# All rights reserved.
+#
+# This source code is licensed under the terms described in the LICENSE file in
+# the root directory of this source tree.
+
+from .prompts import ListPromptsResponse, Prompt, Prompts
+
+__all__ = ["Prompt", "Prompts", "ListPromptsResponse"]
diff --git a/llama_stack/apis/prompts/prompts.py b/llama_stack/apis/prompts/prompts.py
new file mode 100644
index 000000000..e6a376c3f
--- /dev/null
+++ b/llama_stack/apis/prompts/prompts.py
@@ -0,0 +1,189 @@
+# Copyright (c) Meta Platforms, Inc. and affiliates.
+# All rights reserved.
+#
+# This source code is licensed under the terms described in the LICENSE file in
+# the root directory of this source tree.
+
+import re
+import secrets
+from typing import Protocol, runtime_checkable
+
+from pydantic import BaseModel, Field, field_validator, model_validator
+
+from llama_stack.providers.utils.telemetry.trace_protocol import trace_protocol
+from llama_stack.schema_utils import json_schema_type, webmethod
+
+
+@json_schema_type
+class Prompt(BaseModel):
+    """A prompt resource representing a stored OpenAI Compatible prompt template in Llama Stack.
+
+    :param prompt: The system prompt text with variable placeholders. Variables are only supported when using the Responses API.
+    :param version: Version (integer starting at 1, incremented on save)
+    :param prompt_id: Unique identifier formatted as 'pmpt_<48-digit-hash>'
+    :param variables: List of prompt variable names that can be used in the prompt template
+    :param is_default: Boolean indicating whether this version is the default version for this prompt
+    """
+
+    prompt: str | None = Field(default=None, description="The system prompt with variable placeholders")
+    version: int = Field(description="Version (integer starting at 1, incremented on save)", ge=1)
+    prompt_id: str = Field(description="Unique identifier in format 'pmpt_<48-digit-hash>'")
+    variables: list[str] = Field(
+        default_factory=list, description="List of variable names that can be used in the prompt template"
+    )
+    is_default: bool = Field(
+        default=False, description="Boolean indicating whether this version is the default version"
+    )
+
+    @field_validator("prompt_id")
+    @classmethod
+    def validate_prompt_id(cls, prompt_id: str) -> str:
+        if not isinstance(prompt_id, str):
+            raise TypeError("prompt_id must be a string in format 'pmpt_<48-digit-hash>'")
+
+        if not prompt_id.startswith("pmpt_"):
+            raise ValueError("prompt_id must start with 'pmpt_' prefix")
+
+        hex_part = prompt_id[5:]
+        if len(hex_part) != 48:
+            raise ValueError("prompt_id must be in format 'pmpt_<48-digit-hash>' (48 lowercase hex chars)")
+
+        for char in hex_part:
+            if char not in "0123456789abcdef":
+                raise ValueError("prompt_id hex part must contain only lowercase hex characters [0-9a-f]")
+
+        return prompt_id
+
+    @field_validator("version")
+    @classmethod
+    def validate_version(cls, prompt_version: int) -> int:
+        if prompt_version < 1:
+            raise ValueError("version must be >= 1")
+        return prompt_version
+
+    @model_validator(mode="after")
+    def validate_prompt_variables(self):
+        """Validate that all variables used in the prompt are declared in the variables list."""
+        if not self.prompt:
+            return self
+
+        prompt_variables = set(re.findall(r"{{\s*(\w+)\s*}}", self.prompt))
+        declared_variables = set(self.variables)
+
+        undeclared = prompt_variables - declared_variables
+        if undeclared:
+            raise ValueError(f"Prompt contains undeclared variables: {sorted(undeclared)}")
+
+        return self
+
+    @classmethod
+    def generate_prompt_id(cls) -> str:
+        # Generate 48 hex characters (24 bytes)
+        random_bytes = secrets.token_bytes(24)
+        hex_string = random_bytes.hex()
+        return f"pmpt_{hex_string}"
+
+
+class ListPromptsResponse(BaseModel):
+    """Response model to list prompts."""
+
+    data: list[Prompt]
+
+
+@runtime_checkable
+@trace_protocol
+class Prompts(Protocol):
+    """Protocol for prompt management operations."""
+
+    @webmethod(route="/prompts", method="GET")
+    async def list_prompts(self) -> ListPromptsResponse:
+        """List all prompts.
+
+        :returns: A ListPromptsResponse containing all prompts.
+        """
+        ...
+
+    @webmethod(route="/prompts/{prompt_id}/versions", method="GET")
+    async def list_prompt_versions(
+        self,
+        prompt_id: str,
+    ) -> ListPromptsResponse:
+        """List all versions of a specific prompt.
+
+        :param prompt_id: The identifier of the prompt to list versions for.
+        :returns: A ListPromptsResponse containing all versions of the prompt.
+        """
+        ...
+
+    @webmethod(route="/prompts/{prompt_id}", method="GET")
+    async def get_prompt(
+        self,
+        prompt_id: str,
+        version: int | None = None,
+    ) -> Prompt:
+        """Get a prompt by its identifier and optional version.
+
+        :param prompt_id: The identifier of the prompt to get.
+        :param version: The version of the prompt to get (defaults to latest).
+        :returns: A Prompt resource.
+        """
+        ...
+
+    @webmethod(route="/prompts", method="POST")
+    async def create_prompt(
+        self,
+        prompt: str,
+        variables: list[str] | None = None,
+    ) -> Prompt:
+        """Create a new prompt.
+
+        :param prompt: The prompt text content with variable placeholders.
+        :param variables: List of variable names that can be used in the prompt template.
+        :returns: The created Prompt resource.
+        """
+        ...
+
+    @webmethod(route="/prompts/{prompt_id}", method="PUT")
+    async def update_prompt(
+        self,
+        prompt_id: str,
+        prompt: str,
+        version: int,
+        variables: list[str] | None = None,
+        set_as_default: bool = True,
+    ) -> Prompt:
+        """Update an existing prompt (increments version).
+
+        :param prompt_id: The identifier of the prompt to update.
+        :param prompt: The updated prompt text content.
+        :param version: The current version of the prompt being updated.
+        :param variables: Updated list of variable names that can be used in the prompt template.
+        :param set_as_default: Set the new version as the default (default=True).
+        :returns: The updated Prompt resource with incremented version.
+        """
+        ...
+
+    @webmethod(route="/prompts/{prompt_id}", method="DELETE")
+    async def delete_prompt(
+        self,
+        prompt_id: str,
+    ) -> None:
+        """Delete a prompt.
+
+        :param prompt_id: The identifier of the prompt to delete.
+        """
+        ...
+
+    @webmethod(route="/prompts/{prompt_id}/set-default-version", method="PUT")
+    async def set_default_version(
+        self,
+        prompt_id: str,
+        version: int,
+    ) -> Prompt:
+        """Set which version of a prompt should be the default in get_prompt (latest).
+
+        :param prompt_id: The identifier of the prompt.
+        :param version: The version to set as default.
+        :returns: The prompt with the specified version now set as default.
+        """
+        ...
diff --git a/llama_stack/apis/resource.py b/llama_stack/apis/resource.py
index 3731fbf1d..7c4130f7d 100644
--- a/llama_stack/apis/resource.py
+++ b/llama_stack/apis/resource.py
@@ -19,6 +19,7 @@ class ResourceType(StrEnum):
     benchmark = "benchmark"
     tool = "tool"
     tool_group = "tool_group"
+    prompt = "prompt"
 
 
 class Resource(BaseModel):
diff --git a/llama_stack/core/prompts/__init__.py b/llama_stack/core/prompts/__init__.py
new file mode 100644
index 000000000..756f351d8
--- /dev/null
+++ b/llama_stack/core/prompts/__init__.py
@@ -0,0 +1,5 @@
+# Copyright (c) Meta Platforms, Inc. and affiliates.
+# All rights reserved.
+#
+# This source code is licensed under the terms described in the LICENSE file in
+# the root directory of this source tree.
diff --git a/llama_stack/core/prompts/prompts.py b/llama_stack/core/prompts/prompts.py
new file mode 100644
index 000000000..26e8f5cef
--- /dev/null
+++ b/llama_stack/core/prompts/prompts.py
@@ -0,0 +1,233 @@
+# Copyright (c) Meta Platforms, Inc. and affiliates.
+# All rights reserved.
+#
+# This source code is licensed under the terms described in the LICENSE file in
+# the root directory of this source tree.
+
+import json
+from typing import Any
+
+from pydantic import BaseModel
+
+from llama_stack.apis.prompts import ListPromptsResponse, Prompt, Prompts
+from llama_stack.core.datatypes import StackRunConfig
+from llama_stack.core.utils.config_dirs import DISTRIBS_BASE_DIR
+from llama_stack.providers.utils.kvstore import KVStore, kvstore_impl
+from llama_stack.providers.utils.kvstore.config import SqliteKVStoreConfig
+
+
+class PromptServiceConfig(BaseModel):
+    """Configuration for the built-in prompt service.
+
+    :param run_config: Stack run configuration containing distribution info
+    """
+
+    run_config: StackRunConfig
+
+
+async def get_provider_impl(config: PromptServiceConfig, deps: dict[Any, Any]):
+    """Get the prompt service implementation."""
+    impl = PromptServiceImpl(config, deps)
+    await impl.initialize()
+    return impl
+
+
+class PromptServiceImpl(Prompts):
+    """Built-in prompt service implementation using KVStore."""
+
+    def __init__(self, config: PromptServiceConfig, deps: dict[Any, Any]):
+        self.config = config
+        self.deps = deps
+        self.kvstore: KVStore
+
+    async def initialize(self) -> None:
+        kvstore_config = SqliteKVStoreConfig(
+            db_path=(DISTRIBS_BASE_DIR / self.config.run_config.image_name / "prompts.db").as_posix()
+        )
+        self.kvstore = await kvstore_impl(kvstore_config)
+
+    def _get_default_key(self, prompt_id: str) -> str:
+        """Get the KVStore key that stores the default version number."""
+        return f"prompts:v1:{prompt_id}:default"
+
+    async def _get_prompt_key(self, prompt_id: str, version: int | None = None) -> str:
+        """Get the KVStore key for prompt data, returning default version if applicable."""
+        if version:
+            return self._get_version_key(prompt_id, str(version))
+
+        default_key = self._get_default_key(prompt_id)
+        resolved_version = await self.kvstore.get(default_key)
+        if resolved_version is None:
+            raise ValueError(f"Prompt {prompt_id}:default not found")
+        return self._get_version_key(prompt_id, resolved_version)
+
+    def _get_version_key(self, prompt_id: str, version: str) -> str:
+        """Get the KVStore key for a specific prompt version."""
+        return f"prompts:v1:{prompt_id}:{version}"
+
+    def _get_list_key_prefix(self) -> str:
+        """Get the key prefix for listing prompts."""
+        return "prompts:v1:"
+
+    def _serialize_prompt(self, prompt: Prompt) -> str:
+        """Serialize a prompt to JSON string for storage."""
+        return json.dumps(
+            {
+                "prompt_id": prompt.prompt_id,
+                "prompt": prompt.prompt,
+                "version": prompt.version,
+                "variables": prompt.variables or [],
+                "is_default": prompt.is_default,
+            }
+        )
+
+    def _deserialize_prompt(self, data: str) -> Prompt:
+        """Deserialize a prompt from JSON string."""
+        obj = json.loads(data)
+        return Prompt(
+            prompt_id=obj["prompt_id"],
+            prompt=obj["prompt"],
+            version=obj["version"],
+            variables=obj.get("variables", []),
+            is_default=obj.get("is_default", False),
+        )
+
+    async def list_prompts(self) -> ListPromptsResponse:
+        """List all prompts (default versions only)."""
+        prefix = self._get_list_key_prefix()
+        keys = await self.kvstore.keys_in_range(prefix, prefix + "\xff")
+
+        prompts = []
+        for key in keys:
+            if key.endswith(":default"):
+                try:
+                    default_version = await self.kvstore.get(key)
+                    if default_version:
+                        prompt_id = key.replace(prefix, "").replace(":default", "")
+                        version_key = self._get_version_key(prompt_id, default_version)
+                        data = await self.kvstore.get(version_key)
+                        if data:
+                            prompt = self._deserialize_prompt(data)
+                            prompts.append(prompt)
+                except (json.JSONDecodeError, KeyError):
+                    continue
+
+        prompts.sort(key=lambda p: p.prompt_id or "", reverse=True)
+        return ListPromptsResponse(data=prompts)
+
+    async def get_prompt(self, prompt_id: str, version: int | None = None) -> Prompt:
+        """Get a prompt by its identifier and optional version."""
+        key = await self._get_prompt_key(prompt_id, version)
+        data = await self.kvstore.get(key)
+        if data is None:
+            raise ValueError(f"Prompt {prompt_id}:{version if version else 'default'} not found")
+        return self._deserialize_prompt(data)
+
+    async def create_prompt(
+        self,
+        prompt: str,
+        variables: list[str] | None = None,
+    ) -> Prompt:
+        """Create a new prompt."""
+        if variables is None:
+            variables = []
+
+        prompt_obj = Prompt(
+            prompt_id=Prompt.generate_prompt_id(),
+            prompt=prompt,
+            version=1,
+            variables=variables,
+        )
+
+        version_key = self._get_version_key(prompt_obj.prompt_id, str(prompt_obj.version))
+        data = self._serialize_prompt(prompt_obj)
+        await self.kvstore.set(version_key, data)
+
+        default_key = self._get_default_key(prompt_obj.prompt_id)
+        await self.kvstore.set(default_key, str(prompt_obj.version))
+
+        return prompt_obj
+
+    async def update_prompt(
+        self,
+        prompt_id: str,
+        prompt: str,
+        version: int,
+        variables: list[str] | None = None,
+        set_as_default: bool = True,
+    ) -> Prompt:
+        """Update an existing prompt (increments version)."""
+        if version < 1:
+            raise ValueError("Version must be >= 1")
+        if variables is None:
+            variables = []
+
+        prompt_versions = await self.list_prompt_versions(prompt_id)
+        latest_prompt = max(prompt_versions.data, key=lambda x: int(x.version))
+
+        if version and latest_prompt.version != version:
+            raise ValueError(
+                f"'{version}' is not the latest prompt version for prompt_id='{prompt_id}'. Use the latest version '{latest_prompt.version}' in request."
+            )
+
+        current_version = latest_prompt.version if version is None else version
+        new_version = current_version + 1
+
+        updated_prompt = Prompt(prompt_id=prompt_id, prompt=prompt, version=new_version, variables=variables)
+
+        version_key = self._get_version_key(prompt_id, str(new_version))
+        data = self._serialize_prompt(updated_prompt)
+        await self.kvstore.set(version_key, data)
+
+        if set_as_default:
+            await self.set_default_version(prompt_id, new_version)
+
+        return updated_prompt
+
+    async def delete_prompt(self, prompt_id: str) -> None:
+        """Delete a prompt and all its versions."""
+        await self.get_prompt(prompt_id)
+
+        prefix = f"prompts:v1:{prompt_id}:"
+        keys = await self.kvstore.keys_in_range(prefix, prefix + "\xff")
+
+        for key in keys:
+            await self.kvstore.delete(key)
+
+    async def list_prompt_versions(self, prompt_id: str) -> ListPromptsResponse:
+        """List all versions of a specific prompt."""
+        prefix = f"prompts:v1:{prompt_id}:"
+        keys = await self.kvstore.keys_in_range(prefix, prefix + "\xff")
+
+        default_version = None
+        prompts = []
+
+        for key in keys:
+            data = await self.kvstore.get(key)
+            if key.endswith(":default"):
+                default_version = data
+            else:
+                if data:
+                    prompt_obj = self._deserialize_prompt(data)
+                    prompts.append(prompt_obj)
+
+        if not prompts:
+            raise ValueError(f"Prompt {prompt_id} not found")
+
+        for prompt in prompts:
+            prompt.is_default = str(prompt.version) == default_version
+
+        prompts.sort(key=lambda x: x.version)
+        return ListPromptsResponse(data=prompts)
+
+    async def set_default_version(self, prompt_id: str, version: int) -> Prompt:
+        """Set which version of a prompt should be the default, If not set. the default is the latest."""
+        version_key = self._get_version_key(prompt_id, str(version))
+        data = await self.kvstore.get(version_key)
+        if data is None:
+            raise ValueError(f"Prompt {prompt_id} version {version} not found")
+
+        default_key = self._get_default_key(prompt_id)
+        await self.kvstore.set(default_key, str(version))
+
+        return self._deserialize_prompt(data)
diff --git a/llama_stack/core/resolver.py b/llama_stack/core/resolver.py
index a8ad03e1a..373446de6 100644
--- a/llama_stack/core/resolver.py
+++ b/llama_stack/core/resolver.py
@@ -19,6 +19,7 @@ from llama_stack.apis.inference import Inference, InferenceProvider
 from llama_stack.apis.inspect import Inspect
 from llama_stack.apis.models import Models
 from llama_stack.apis.post_training import PostTraining
+from llama_stack.apis.prompts import Prompts
 from llama_stack.apis.providers import Providers as ProvidersAPI
 from llama_stack.apis.safety import Safety
 from llama_stack.apis.scoring import Scoring
@@ -93,6 +94,7 @@ def api_protocol_map(external_apis: dict[Api, ExternalApiSpec] | None = None) ->
         Api.tool_groups: ToolGroups,
         Api.tool_runtime: ToolRuntime,
         Api.files: Files,
+        Api.prompts: Prompts,
     }
 
     if external_apis:
diff --git a/llama_stack/core/server/server.py b/llama_stack/core/server/server.py
index 288bf46e1..d3e875fec 100644
--- a/llama_stack/core/server/server.py
+++ b/llama_stack/core/server/server.py
@@ -515,6 +515,7 @@ def main(args: argparse.Namespace | None = None):
 
     apis_to_serve.add("inspect")
     apis_to_serve.add("providers")
+    apis_to_serve.add("prompts")
     for api_str in apis_to_serve:
         api = Api(api_str)
 
diff --git a/llama_stack/core/stack.py b/llama_stack/core/stack.py
index bccea48d3..7ab8d2c64 100644
--- a/llama_stack/core/stack.py
+++ b/llama_stack/core/stack.py
@@ -24,6 +24,7 @@ from llama_stack.apis.inference import Inference
 from llama_stack.apis.inspect import Inspect
 from llama_stack.apis.models import Models
 from llama_stack.apis.post_training import PostTraining
+from llama_stack.apis.prompts import Prompts
 from llama_stack.apis.providers import Providers
 from llama_stack.apis.safety import Safety
 from llama_stack.apis.scoring import Scoring
@@ -37,6 +38,7 @@ from llama_stack.apis.vector_io import VectorIO
 from llama_stack.core.datatypes import Provider, StackRunConfig
 from llama_stack.core.distribution import get_provider_registry
 from llama_stack.core.inspect import DistributionInspectConfig, DistributionInspectImpl
+from llama_stack.core.prompts.prompts import PromptServiceConfig, PromptServiceImpl
 from llama_stack.core.providers import ProviderImpl, ProviderImplConfig
 from llama_stack.core.resolver import ProviderRegistry, resolve_impls
 from llama_stack.core.routing_tables.common import CommonRoutingTableImpl
@@ -72,6 +74,7 @@ class LlamaStack(
     ToolRuntime,
     RAGToolRuntime,
     Files,
+    Prompts,
 ):
     pass
 
@@ -305,6 +308,12 @@ def add_internal_implementations(impls: dict[Api, Any], run_config: StackRunConf
     )
     impls[Api.providers] = providers_impl
 
+    prompts_impl = PromptServiceImpl(
+        PromptServiceConfig(run_config=run_config),
+        deps=impls,
+    )
+    impls[Api.prompts] = prompts_impl
+
 
 # Produces a stack of providers for the given run config. Not all APIs may be
 # asked for in the run config.
@@ -329,6 +338,9 @@ async def construct_stack(
     # Add internal implementations after all other providers are resolved
     add_internal_implementations(impls, run_config)
 
+    if Api.prompts in impls:
+        await impls[Api.prompts].initialize()
+
     await register_resources(run_config, impls)
 
     await refresh_registry_once(impls)
diff --git a/tests/unit/prompts/prompts/__init__.py b/tests/unit/prompts/prompts/__init__.py
new file mode 100644
index 000000000..756f351d8
--- /dev/null
+++ b/tests/unit/prompts/prompts/__init__.py
@@ -0,0 +1,5 @@
+# Copyright (c) Meta Platforms, Inc. and affiliates.
+# All rights reserved.
+#
+# This source code is licensed under the terms described in the LICENSE file in
+# the root directory of this source tree.
diff --git a/tests/unit/prompts/prompts/conftest.py b/tests/unit/prompts/prompts/conftest.py
new file mode 100644
index 000000000..b2c619e49
--- /dev/null
+++ b/tests/unit/prompts/prompts/conftest.py
@@ -0,0 +1,30 @@
+# Copyright (c) Meta Platforms, Inc. and affiliates.
+# All rights reserved.
+#
+# This source code is licensed under the terms described in the LICENSE file in
+# the root directory of this source tree.
+
+import random
+
+import pytest
+
+from llama_stack.core.prompts.prompts import PromptServiceConfig, PromptServiceImpl
+from llama_stack.providers.utils.kvstore.config import SqliteKVStoreConfig
+
+
+@pytest.fixture
+async def temp_prompt_store(tmp_path_factory):
+    unique_id = f"prompt_store_{random.randint(1, 1000000)}"
+    temp_dir = tmp_path_factory.getbasetemp()
+    db_path = str(temp_dir / f"{unique_id}.db")
+
+    from llama_stack.core.datatypes import StackRunConfig
+    from llama_stack.providers.utils.kvstore import kvstore_impl
+
+    mock_run_config = StackRunConfig(image_name="test-distribution", apis=[], providers={})
+    config = PromptServiceConfig(run_config=mock_run_config)
+    store = PromptServiceImpl(config, deps={})
+
+    store.kvstore = await kvstore_impl(SqliteKVStoreConfig(db_path=db_path))
+
+    yield store
diff --git a/tests/unit/prompts/prompts/test_prompts.py b/tests/unit/prompts/prompts/test_prompts.py
new file mode 100644
index 000000000..792e55530
--- /dev/null
+++ b/tests/unit/prompts/prompts/test_prompts.py
@@ -0,0 +1,144 @@
+# Copyright (c) Meta Platforms, Inc. and affiliates.
+# All rights reserved.
+#
+# This source code is licensed under the terms described in the LICENSE file in
+# the root directory of this source tree.
+
+
+import pytest
+
+
+class TestPrompts:
+    async def test_create_and_get_prompt(self, temp_prompt_store):
+        prompt = await temp_prompt_store.create_prompt("Hello world!", ["name"])
+        assert prompt.prompt == "Hello world!"
+        assert prompt.version == 1
+        assert prompt.prompt_id.startswith("pmpt_")
+        assert prompt.variables == ["name"]
+
+        retrieved = await temp_prompt_store.get_prompt(prompt.prompt_id)
+        assert retrieved.prompt_id == prompt.prompt_id
+        assert retrieved.prompt == prompt.prompt
+
+    async def test_update_prompt(self, temp_prompt_store):
+        prompt = await temp_prompt_store.create_prompt("Original")
+        updated = await temp_prompt_store.update_prompt(prompt.prompt_id, "Updated", 1, ["v"])
+        assert updated.version == 2
+        assert updated.prompt == "Updated"
+
+    async def test_update_prompt_with_version(self, temp_prompt_store):
+        version_for_update = 1
+
+        prompt = await temp_prompt_store.create_prompt("Original")
+        assert prompt.version == 1
+        prompt = await temp_prompt_store.update_prompt(prompt.prompt_id, "Updated", version_for_update, ["v"])
+        assert prompt.version == 2
+
+        with pytest.raises(ValueError):
+            # now this is a stale version
+            await temp_prompt_store.update_prompt(prompt.prompt_id, "Another Update", version_for_update, ["v"])
+
+        with pytest.raises(ValueError):
+            # this version does not exist
+            await temp_prompt_store.update_prompt(prompt.prompt_id, "Another Update", 99, ["v"])
+
+    async def test_delete_prompt(self, temp_prompt_store):
+        prompt = await temp_prompt_store.create_prompt("to be deleted")
+        await temp_prompt_store.delete_prompt(prompt.prompt_id)
+        with pytest.raises(ValueError):
+            await temp_prompt_store.get_prompt(prompt.prompt_id)
+
+    async def test_list_prompts(self, temp_prompt_store):
+        response = await temp_prompt_store.list_prompts()
+        assert response.data == []
+
+        await temp_prompt_store.create_prompt("first")
+        await temp_prompt_store.create_prompt("second")
+
+        response = await temp_prompt_store.list_prompts()
+        assert len(response.data) == 2
+
+    async def test_version(self, temp_prompt_store):
+        prompt = await temp_prompt_store.create_prompt("V1")
+        await temp_prompt_store.update_prompt(prompt.prompt_id, "V2", 1)
+
+        v1 = await temp_prompt_store.get_prompt(prompt.prompt_id, version=1)
+        assert v1.version == 1 and v1.prompt == "V1"
+
+        latest = await temp_prompt_store.get_prompt(prompt.prompt_id)
+        assert latest.version == 2 and latest.prompt == "V2"
+
+    async def test_set_default_version(self, temp_prompt_store):
+        prompt0 = await temp_prompt_store.create_prompt("V1")
+        prompt1 = await temp_prompt_store.update_prompt(prompt0.prompt_id, "V2", 1)
+
+        assert (await temp_prompt_store.get_prompt(prompt0.prompt_id)).version == 2
+        prompt_default = await temp_prompt_store.set_default_version(prompt0.prompt_id, 1)
+        assert (await temp_prompt_store.get_prompt(prompt0.prompt_id)).version == 1
+        assert prompt_default.version == 1
+
+        prompt2 = await temp_prompt_store.update_prompt(prompt0.prompt_id, "V3", prompt1.version)
+        assert prompt2.version == 3
+
+    async def test_prompt_id_generation_and_validation(self, temp_prompt_store):
+        prompt = await temp_prompt_store.create_prompt("Test")
+        assert prompt.prompt_id.startswith("pmpt_")
+        assert len(prompt.prompt_id) == 53
+
+        with pytest.raises(ValueError):
+            await temp_prompt_store.get_prompt("invalid_id")
+
+    async def test_list_shows_default_versions(self, temp_prompt_store):
+        prompt = await temp_prompt_store.create_prompt("V1")
+        await temp_prompt_store.update_prompt(prompt.prompt_id, "V2", 1)
+        await temp_prompt_store.update_prompt(prompt.prompt_id, "V3", 2)
+
+        response = await temp_prompt_store.list_prompts()
+        listed_prompt = response.data[0]
+        assert listed_prompt.version == 3 and listed_prompt.prompt == "V3"
+
+        await temp_prompt_store.set_default_version(prompt.prompt_id, 1)
+
+        response = await temp_prompt_store.list_prompts()
+        listed_prompt = response.data[0]
+        assert listed_prompt.version == 1 and listed_prompt.prompt == "V1"
+        assert not (await temp_prompt_store.get_prompt(prompt.prompt_id, 3)).is_default
+
+    async def test_get_all_prompt_versions(self, temp_prompt_store):
+        prompt = await temp_prompt_store.create_prompt("V1")
+        await temp_prompt_store.update_prompt(prompt.prompt_id, "V2", 1)
+        await temp_prompt_store.update_prompt(prompt.prompt_id, "V3", 2)
+
+        versions = (await temp_prompt_store.list_prompt_versions(prompt.prompt_id)).data
+        assert len(versions) == 3
+        assert [v.version for v in versions] == [1, 2, 3]
+        assert [v.is_default for v in versions] == [False, False, True]
+
+        await temp_prompt_store.set_default_version(prompt.prompt_id, 2)
+        versions = (await temp_prompt_store.list_prompt_versions(prompt.prompt_id)).data
+        assert [v.is_default for v in versions] == [False, True, False]
+
+        with pytest.raises(ValueError):
+            await temp_prompt_store.list_prompt_versions("nonexistent")
+
+    async def test_prompt_variable_validation(self, temp_prompt_store):
+        prompt = await temp_prompt_store.create_prompt("Hello {{ name }}, you live in {{ city }}!", ["name", "city"])
+        assert prompt.variables == ["name", "city"]
+
+        prompt_no_vars = await temp_prompt_store.create_prompt("Hello world!", [])
+        assert prompt_no_vars.variables == []
+
+        with pytest.raises(ValueError, match="undeclared variables"):
+            await temp_prompt_store.create_prompt("Hello {{ name }}, invalid {{ unknown }}!", ["name"])
+
+    async def test_update_prompt_set_as_default_behavior(self, temp_prompt_store):
+        prompt = await temp_prompt_store.create_prompt("V1")
+        assert (await temp_prompt_store.get_prompt(prompt.prompt_id)).version == 1
+
+        prompt_v2 = await temp_prompt_store.update_prompt(prompt.prompt_id, "V2", 1, [], set_as_default=True)
+        assert prompt_v2.version == 2
+        assert (await temp_prompt_store.get_prompt(prompt.prompt_id)).version == 2
+
+        prompt_v3 = await temp_prompt_store.update_prompt(prompt.prompt_id, "V3", 2, [], set_as_default=False)
+        assert prompt_v3.version == 3
+        assert (await temp_prompt_store.get_prompt(prompt.prompt_id)).version == 2

From ef02b9ea101487ca1829795f18274ad96b211ff6 Mon Sep 17 00:00:00 2001
From: Derek Higgins <derekh@redhat.com>
Date: Mon, 8 Sep 2025 16:51:38 +0100
Subject: [PATCH 43/76] fix: environment variable typo in inference recorder
 error message (#3374)

The error message was referencing LLAMA_STACK_INFERENCE_MODE instead of
the correct LLAMA_STACK_TEST_INFERENCE_MODE environment variable.
---
 llama_stack/testing/inference_recorder.py | 2 +-
 1 file changed, 1 insertion(+), 1 deletion(-)

diff --git a/llama_stack/testing/inference_recorder.py b/llama_stack/testing/inference_recorder.py
index 5b64e26d3..298758c92 100644
--- a/llama_stack/testing/inference_recorder.py
+++ b/llama_stack/testing/inference_recorder.py
@@ -292,7 +292,7 @@ async def _patched_inference_method(original_method, self, client_type, endpoint
                 f"No recorded response found for request hash: {request_hash}\n"
                 f"Request: {method} {url} {body}\n"
                 f"Model: {body.get('model', 'unknown')}\n"
-                f"To record this response, run with LLAMA_STACK_INFERENCE_MODE=record"
+                f"To record this response, run with LLAMA_STACK_TEST_INFERENCE_MODE=record"
             )
 
     elif _current_mode == InferenceMode.RECORD:

From 09141361fbec54acb25ef0d13c542d6cc41c3b5c Mon Sep 17 00:00:00 2001
From: Swapna Lekkala <swapna942@meta.com>
Date: Mon, 8 Sep 2025 13:22:43 -0700
Subject: [PATCH 44/76] fix: use dataset version 4.0.0 or above

---
 pyproject.toml | 2 +-
 1 file changed, 1 insertion(+), 1 deletion(-)

diff --git a/pyproject.toml b/pyproject.toml
index fb6d3a330..133b78dbf 100644
--- a/pyproject.toml
+++ b/pyproject.toml
@@ -114,7 +114,7 @@ test = [
     "psycopg2-binary>=2.9.0",
     "pypdf",
     "mcp",
-    "datasets",
+    "datasets>=4.0.0",
     "autoevals",
     "transformers",
     "sqlalchemy",

From c9268a7a8cf57e72e1facdb0e41e444575cc5170 Mon Sep 17 00:00:00 2001
From: slekkala1 <swapna942@meta.com>
Date: Mon, 8 Sep 2025 14:46:46 -0700
Subject: [PATCH 45/76] fix: pre-commit failing (#3381)

# What does this PR do?
Fix failing pre-commit,
https://github.com/llamastack/llama-stack/actions/workflows/pre-commit.yml


## Test Plan
CI
---
 uv.lock | 6 ++----
 1 file changed, 2 insertions(+), 4 deletions(-)

diff --git a/uv.lock b/uv.lock
index 43cc59c7a..b38177245 100644
--- a/uv.lock
+++ b/uv.lock
@@ -1,5 +1,5 @@
 version = 1
-revision = 3
+revision = 2
 requires-python = ">=3.12"
 resolution-markers = [
     "(python_full_version >= '3.13' and platform_machine != 'aarch64' and sys_platform == 'linux') or (python_full_version >= '3.13' and sys_platform != 'darwin' and sys_platform != 'linux')",
@@ -895,7 +895,6 @@ dependencies = [
     { name = "numpy" },
     { name = "packaging" },
 ]
-sdist = { url = "https://files.pythonhosted.org/packages/5c/f4/7c2136f4660ca504266cc08b38df2aa1db14fea93393b82e099ff34d7290/faiss_cpu-1.11.0.post1.tar.gz", hash = "sha256:06b1ea9ddec9e4d9a41c8ef7478d493b08d770e9a89475056e963081eed757d1", size = 70543, upload-time = "2025-07-15T09:15:02.127Z" }
 wheels = [
     { url = "https://files.pythonhosted.org/packages/30/1e/9980758efa55b4e7a5d6df1ae17c9ddbe5a636bfbf7d22d47c67f7a530f4/faiss_cpu-1.11.0.post1-cp312-cp312-macosx_13_0_x86_64.whl", hash = "sha256:68f6ce2d9c510a5765af2f5711bd76c2c37bd598af747f3300224bdccf45378c", size = 7913676, upload-time = "2025-07-15T09:14:06.077Z" },
     { url = "https://files.pythonhosted.org/packages/05/d1/bd785887085faa02916c52320527b8bb54288835b0a3138df89a0e323cc8/faiss_cpu-1.11.0.post1-cp312-cp312-macosx_14_0_arm64.whl", hash = "sha256:b940c530a8236cc0b9fd9d6e87b3d70b9c6c216bc2baf2649356c908902e52c9", size = 3313952, upload-time = "2025-07-15T09:14:07.584Z" },
@@ -1748,7 +1747,6 @@ wheels = [
     { url = "https://files.pythonhosted.org/packages/5f/e4/f1546746049c99c6b8b247e2f34485b9eae36faa9322b84e2a17262e6712/litellm-1.74.9-py3-none-any.whl", hash = "sha256:ab8f8a6e4d8689d3c7c4f9c3bbc7e46212cc3ebc74ddd0f3c0c921bb459c9874", size = 8740449, upload-time = "2025-07-28T16:42:36.8Z" },
 ]
 
-
 [[package]]
 name = "llama-stack"
 version = "0.2.20"
@@ -1958,7 +1956,7 @@ test = [
     { name = "aiosqlite" },
     { name = "autoevals" },
     { name = "chardet" },
-    { name = "datasets" },
+    { name = "datasets", specifier = ">=4.0.0" },
     { name = "mcp" },
     { name = "milvus-lite", specifier = ">=2.5.0" },
     { name = "openai", specifier = ">=1.100.0" },

From 30468d0c43277f066397cc94a6d44c3965b0409f Mon Sep 17 00:00:00 2001
From: Ashwin Bharambe <ashwin.bharambe@gmail.com>
Date: Mon, 8 Sep 2025 15:13:42 -0700
Subject: [PATCH 46/76] fix(deps): bump datasets versions for all providers
 (#3382)

Not doing so results in errors of the kind you see in:
https://github.com/llamastack/llama-stack-ops/actions/runs/17565092546/job/49890264353
---
 llama_stack/providers/registry/datasetio.py     | 4 ++--
 llama_stack/providers/registry/post_training.py | 2 +-
 2 files changed, 3 insertions(+), 3 deletions(-)

diff --git a/llama_stack/providers/registry/datasetio.py b/llama_stack/providers/registry/datasetio.py
index 43cde83fb..f641b4ce3 100644
--- a/llama_stack/providers/registry/datasetio.py
+++ b/llama_stack/providers/registry/datasetio.py
@@ -30,7 +30,7 @@ def available_providers() -> list[ProviderSpec]:
             adapter=AdapterSpec(
                 adapter_type="huggingface",
                 pip_packages=[
-                    "datasets",
+                    "datasets>=4.0.0",
                 ],
                 module="llama_stack.providers.remote.datasetio.huggingface",
                 config_class="llama_stack.providers.remote.datasetio.huggingface.HuggingfaceDatasetIOConfig",
@@ -42,7 +42,7 @@ def available_providers() -> list[ProviderSpec]:
             adapter=AdapterSpec(
                 adapter_type="nvidia",
                 pip_packages=[
-                    "datasets",
+                    "datasets>=4.0.0",
                 ],
                 module="llama_stack.providers.remote.datasetio.nvidia",
                 config_class="llama_stack.providers.remote.datasetio.nvidia.NvidiaDatasetIOConfig",
diff --git a/llama_stack/providers/registry/post_training.py b/llama_stack/providers/registry/post_training.py
index 67238e3fc..47aeb401e 100644
--- a/llama_stack/providers/registry/post_training.py
+++ b/llama_stack/providers/registry/post_training.py
@@ -48,7 +48,7 @@ def available_providers() -> list[ProviderSpec]:
         InlineProviderSpec(
             api=Api.post_training,
             provider_type="inline::huggingface-gpu",
-            pip_packages=["trl", "transformers", "peft", "datasets", "torch"],
+            pip_packages=["trl", "transformers", "peft", "datasets>=4.0.0", "torch"],
             module="llama_stack.providers.inline.post_training.huggingface",
             config_class="llama_stack.providers.inline.post_training.huggingface.HuggingFacePostTrainingConfig",
             api_dependencies=[

From 28696c3f30468677fb851b82846acae21deb3e66 Mon Sep 17 00:00:00 2001
From: "github-actions[bot]" <github-actions[bot]@users.noreply.github.com>
Date: Mon, 8 Sep 2025 22:30:03 +0000
Subject: [PATCH 47/76] build: Bump version to 0.2.21

---
 llama_stack/ui/package-lock.json |  8 ++++----
 llama_stack/ui/package.json      |  2 +-
 pyproject.toml                   |  6 +++---
 uv.lock                          | 14 +++++++-------
 4 files changed, 15 insertions(+), 15 deletions(-)

diff --git a/llama_stack/ui/package-lock.json b/llama_stack/ui/package-lock.json
index cbe8e5557..1db1c61cd 100644
--- a/llama_stack/ui/package-lock.json
+++ b/llama_stack/ui/package-lock.json
@@ -18,7 +18,7 @@
         "class-variance-authority": "^0.7.1",
         "clsx": "^2.1.1",
         "framer-motion": "^12.23.12",
-        "llama-stack-client": "^0.2.20",
+        "llama-stack-client": "^0.2.21",
         "lucide-react": "^0.542.0",
         "next": "15.3.3",
         "next-auth": "^4.24.11",
@@ -10278,9 +10278,9 @@
       "license": "MIT"
     },
     "node_modules/llama-stack-client": {
-      "version": "0.2.20",
-      "resolved": "https://registry.npmjs.org/llama-stack-client/-/llama-stack-client-0.2.20.tgz",
-      "integrity": "sha512-1vD5nizTX5JEW8TADxKgy/P1W8YZoPSpdnmfxbdYbWgpQ3BWtbvLS6jmDk7VwVA5fRC4895VfHsRDfS1liHarw==",
+      "version": "0.2.21",
+      "resolved": "https://registry.npmjs.org/llama-stack-client/-/llama-stack-client-0.2.21.tgz",
+      "integrity": "sha512-rjU2Vx5xStxDYavU8K1An/SYXiQQjroLcK98B+p0Paz/a7OgRao2S0YwvThJjPUyChY4fO03UIXP9LpmHqlXWQ==",
       "license": "MIT",
       "dependencies": {
         "@types/node": "^18.11.18",
diff --git a/llama_stack/ui/package.json b/llama_stack/ui/package.json
index e817e9ae3..e50401fa6 100644
--- a/llama_stack/ui/package.json
+++ b/llama_stack/ui/package.json
@@ -23,7 +23,7 @@
     "class-variance-authority": "^0.7.1",
     "clsx": "^2.1.1",
     "framer-motion": "^12.23.12",
-    "llama-stack-client": "^0.2.20",
+    "llama-stack-client": "^0.2.21",
     "lucide-react": "^0.542.0",
     "next": "15.3.3",
     "next-auth": "^4.24.11",
diff --git a/pyproject.toml b/pyproject.toml
index 133b78dbf..0414aafb0 100644
--- a/pyproject.toml
+++ b/pyproject.toml
@@ -7,7 +7,7 @@ required-version = ">=0.7.0"
 
 [project]
 name = "llama_stack"
-version = "0.2.20"
+version = "0.2.21"
 authors = [{ name = "Meta Llama", email = "llama-oss@meta.com" }]
 description = "Llama Stack"
 readme = "README.md"
@@ -31,7 +31,7 @@ dependencies = [
     "huggingface-hub>=0.34.0,<1.0",
     "jinja2>=3.1.6",
     "jsonschema",
-    "llama-stack-client>=0.2.20",
+    "llama-stack-client>=0.2.21",
     "openai>=1.99.6",
     "prompt-toolkit",
     "python-dotenv",
@@ -55,7 +55,7 @@ dependencies = [
 ui = [
     "streamlit",
     "pandas",
-    "llama-stack-client>=0.2.20",
+    "llama-stack-client>=0.2.21",
     "streamlit-option-menu",
 ]
 
diff --git a/uv.lock b/uv.lock
index b38177245..2788c6fef 100644
--- a/uv.lock
+++ b/uv.lock
@@ -1,5 +1,5 @@
 version = 1
-revision = 2
+revision = 3
 requires-python = ">=3.12"
 resolution-markers = [
     "(python_full_version >= '3.13' and platform_machine != 'aarch64' and sys_platform == 'linux') or (python_full_version >= '3.13' and sys_platform != 'darwin' and sys_platform != 'linux')",
@@ -1749,7 +1749,7 @@ wheels = [
 
 [[package]]
 name = "llama-stack"
-version = "0.2.20"
+version = "0.2.21"
 source = { editable = "." }
 dependencies = [
     { name = "aiohttp" },
@@ -1887,8 +1887,8 @@ requires-dist = [
     { name = "huggingface-hub", specifier = ">=0.34.0,<1.0" },
     { name = "jinja2", specifier = ">=3.1.6" },
     { name = "jsonschema" },
-    { name = "llama-stack-client", specifier = ">=0.2.20" },
-    { name = "llama-stack-client", marker = "extra == 'ui'", specifier = ">=0.2.20" },
+    { name = "llama-stack-client", specifier = ">=0.2.21" },
+    { name = "llama-stack-client", marker = "extra == 'ui'", specifier = ">=0.2.21" },
     { name = "openai", specifier = ">=1.99.6" },
     { name = "opentelemetry-exporter-otlp-proto-http", specifier = ">=1.30.0" },
     { name = "opentelemetry-sdk", specifier = ">=1.30.0" },
@@ -1997,7 +1997,7 @@ unit = [
 
 [[package]]
 name = "llama-stack-client"
-version = "0.2.20"
+version = "0.2.21"
 source = { registry = "https://pypi.org/simple" }
 dependencies = [
     { name = "anyio" },
@@ -2016,9 +2016,9 @@ dependencies = [
     { name = "tqdm" },
     { name = "typing-extensions" },
 ]
-sdist = { url = "https://files.pythonhosted.org/packages/21/91/c5e32219a5192825dd601700e68205c815c5cfee60c64c22172e46a0c83e/llama_stack_client-0.2.20.tar.gz", hash = "sha256:356257f0a4bbb64205f89e113d715925853d5e34ec744e72466da72790ba415b", size = 318311, upload-time = "2025-08-29T21:10:12.854Z" }
+sdist = { url = "https://files.pythonhosted.org/packages/f1/d3/8c50561d167f1e9b601b8fffe852b44c1ff97aaa6db6cdedd611d9e02a65/llama_stack_client-0.2.21.tar.gz", hash = "sha256:bd931fdcadedec5ccdbaa3c54d0c17761af1c227711ad6150dc0dd33d7b66ce2", size = 318319, upload-time = "2025-09-08T22:26:57.668Z" }
 wheels = [
-    { url = "https://files.pythonhosted.org/packages/b0/ba/84914c4eead2fd9251c149fd6a7da28b78acd620793e3c4506116645cb60/llama_stack_client-0.2.20-py3-none-any.whl", hash = "sha256:6e178981d2ce971da2145c79d5b2b123fa50e063ed431494975c2ba01c5b8016", size = 369899, upload-time = "2025-08-29T21:10:11.113Z" },
+    { url = "https://files.pythonhosted.org/packages/02/77/dadc682046a2c7ad68be8d2d2afac7007bf4d22efb0d3929d85ab9706ffe/llama_stack_client-0.2.21-py3-none-any.whl", hash = "sha256:adba82fdf18ab3b8ac218cedba4927bd5d26c23c2318e75c8763a44bb6b40693", size = 369902, upload-time = "2025-09-08T22:26:56.308Z" },
 ]
 
 [[package]]

From a8aa815b6a194fad76e4e5f7e73faf588b5d0e01 Mon Sep 17 00:00:00 2001
From: Ashwin Bharambe <ashwin.bharambe@gmail.com>
Date: Tue, 9 Sep 2025 15:50:56 -0700
Subject: [PATCH 48/76] feat(tests): migrate to global "setups" system for test
 configuration (#3390)

This PR refactors the integration test system to use global "setups"
which provides better separation of concerns:

**suites = what to test, setups = how to configure.**

NOTE: if you naming suggestions, please provide feedback

Changes:
- New `tests/integration/setups.py` with global, reusable configurations
(ollama, vllm, gpt, claude)
- Modified `scripts/integration-tests.sh` options to match with the
underlying pytest options
    - Updated documentation to reflect the new global setup system

The main benefit is that setups can be reused across multiple suites
(e.g., use "gpt" with any suite) even though sometimes they could
specifically tailored for a suite (vision <> ollama-vision). It is now
easier to add new configurations without modifying existing suites.

Usage examples:
    - `pytest tests/integration --suite=responses --setup=gpt`
- `pytest tests/integration --suite=vision` # auto-selects
"ollama-vision" setup
    - `pytest tests/integration --suite=base --setup=vllm`
---
 .../actions/run-and-record-tests/action.yml   |  42 +++---
 .github/actions/setup-ollama/action.yml       |   4 +-
 .../actions/setup-test-environment/action.yml |  14 +-
 .github/workflows/integration-tests.yml       |  20 +--
 .../workflows/record-integration-tests.yml    |  32 ++---
 scripts/get_setup_env.py                      |  71 ++++++++++
 scripts/github/schedule-record-workflow.sh    |  57 ++++----
 scripts/integration-tests.sh                  | 106 ++++++++-------
 tests/integration/README.md                   |  48 ++++---
 tests/integration/conftest.py                 |  71 ++++++----
 tests/integration/suites.py                   | 126 +++++++++++++-----
 11 files changed, 385 insertions(+), 206 deletions(-)
 create mode 100644 scripts/get_setup_env.py

diff --git a/.github/actions/run-and-record-tests/action.yml b/.github/actions/run-and-record-tests/action.yml
index 7f028b104..a3eb31d9f 100644
--- a/.github/actions/run-and-record-tests/action.yml
+++ b/.github/actions/run-and-record-tests/action.yml
@@ -5,21 +5,22 @@ inputs:
   stack-config:
     description: 'Stack configuration to use'
     required: true
-  provider:
-    description: 'Provider to use for tests'
-    required: true
+  setup:
+    description: 'Setup to use for tests (e.g., ollama, gpt, vllm)'
+    required: false
+    default: ''
   inference-mode:
     description: 'Inference mode (record or replay)'
     required: true
-  test-suite:
+  suite:
     description: 'Test suite to use: base, responses, vision, etc.'
     required: false
     default: ''
-  test-subdirs:
-    description: 'Comma-separated list of test subdirectories to run; overrides test-suite'
+  subdirs:
+    description: 'Comma-separated list of test subdirectories to run; overrides suite'
     required: false
     default: ''
-  test-pattern:
+  pattern:
     description: 'Regex pattern to pass to pytest -k'
     required: false
     default: ''
@@ -37,14 +38,23 @@ runs:
     - name: Run Integration Tests
       shell: bash
       run: |
-        uv run --no-sync ./scripts/integration-tests.sh \
-          --stack-config '${{ inputs.stack-config }}' \
-          --provider '${{ inputs.provider }}' \
-          --test-subdirs '${{ inputs.test-subdirs }}' \
-          --test-pattern '${{ inputs.test-pattern }}' \
-          --inference-mode '${{ inputs.inference-mode }}' \
-          --test-suite '${{ inputs.test-suite }}' \
-          | tee pytest-${{ inputs.inference-mode }}.log
+        SCRIPT_ARGS="--stack-config ${{ inputs.stack-config }} --inference-mode ${{ inputs.inference-mode }}"
+
+        # Add optional arguments only if they are provided
+        if [ -n '${{ inputs.setup }}' ]; then
+          SCRIPT_ARGS="$SCRIPT_ARGS --setup ${{ inputs.setup }}"
+        fi
+        if [ -n '${{ inputs.suite }}' ]; then
+          SCRIPT_ARGS="$SCRIPT_ARGS --suite ${{ inputs.suite }}"
+        fi
+        if [ -n '${{ inputs.subdirs }}' ]; then
+          SCRIPT_ARGS="$SCRIPT_ARGS --subdirs ${{ inputs.subdirs }}"
+        fi
+        if [ -n '${{ inputs.pattern }}' ]; then
+          SCRIPT_ARGS="$SCRIPT_ARGS --pattern ${{ inputs.pattern }}"
+        fi
+
+        uv run --no-sync ./scripts/integration-tests.sh $SCRIPT_ARGS | tee pytest-${{ inputs.inference-mode }}.log
 
 
     - name: Commit and push recordings
@@ -58,7 +68,7 @@ runs:
           echo "New recordings detected, committing and pushing"
           git add tests/integration/recordings/
 
-          git commit -m "Recordings update from CI (test-suite: ${{ inputs.test-suite }})"
+          git commit -m "Recordings update from CI (suite: ${{ inputs.suite }})"
           git fetch origin ${{ github.ref_name }}
           git rebase origin/${{ github.ref_name }}
           echo "Rebased successfully"
diff --git a/.github/actions/setup-ollama/action.yml b/.github/actions/setup-ollama/action.yml
index dc2f87e8c..5c95d131d 100644
--- a/.github/actions/setup-ollama/action.yml
+++ b/.github/actions/setup-ollama/action.yml
@@ -1,7 +1,7 @@
 name: Setup Ollama
 description: Start Ollama
 inputs:
-  test-suite:
+  suite:
     description: 'Test suite to use: base, responses, vision, etc.'
     required: false
     default: ''
@@ -11,7 +11,7 @@ runs:
     - name: Start Ollama
       shell: bash
       run: |
-        if [ "${{ inputs.test-suite }}" == "vision" ]; then
+        if [ "${{ inputs.suite }}" == "vision" ]; then
           image="ollama-with-vision-model"
         else
           image="ollama-with-models"
diff --git a/.github/actions/setup-test-environment/action.yml b/.github/actions/setup-test-environment/action.yml
index 3be76f009..478e8f598 100644
--- a/.github/actions/setup-test-environment/action.yml
+++ b/.github/actions/setup-test-environment/action.yml
@@ -8,11 +8,11 @@ inputs:
   client-version:
     description: 'Client version (latest or published)'
     required: true
-  provider:
-    description: 'Provider to setup (ollama or vllm)'
-    required: true
+  setup:
+    description: 'Setup to configure (ollama, vllm, gpt, etc.)'
+    required: false
     default: 'ollama'
-  test-suite:
+  suite:
     description: 'Test suite to use: base, responses, vision, etc.'
     required: false
     default: ''
@@ -30,13 +30,13 @@ runs:
         client-version: ${{ inputs.client-version }}
 
     - name: Setup ollama
-      if: ${{ inputs.provider == 'ollama' && inputs.inference-mode == 'record' }}
+      if: ${{ (inputs.setup == 'ollama' || inputs.setup == 'ollama-vision') && inputs.inference-mode == 'record' }}
       uses: ./.github/actions/setup-ollama
       with:
-        test-suite: ${{ inputs.test-suite }}
+        suite: ${{ inputs.suite }}
 
     - name: Setup vllm
-      if: ${{ inputs.provider == 'vllm' && inputs.inference-mode == 'record' }}
+      if: ${{ inputs.setup == 'vllm' && inputs.inference-mode == 'record' }}
       uses: ./.github/actions/setup-vllm
 
     - name: Build Llama Stack
diff --git a/.github/workflows/integration-tests.yml b/.github/workflows/integration-tests.yml
index bb53eea2f..711eccd9e 100644
--- a/.github/workflows/integration-tests.yml
+++ b/.github/workflows/integration-tests.yml
@@ -28,8 +28,8 @@ on:
         description: 'Test against both the latest and published versions'
         type: boolean
         default: false
-      test-provider:
-        description: 'Test against a specific provider'
+      test-setup:
+        description: 'Test against a specific setup'
         type: string
         default: 'ollama'
 
@@ -42,18 +42,18 @@ jobs:
 
   run-replay-mode-tests:
     runs-on: ubuntu-latest
-    name: ${{ format('Integration Tests ({0}, {1}, {2}, client={3}, {4})', matrix.client-type, matrix.provider, matrix.python-version, matrix.client-version, matrix.test-suite) }}
+    name: ${{ format('Integration Tests ({0}, {1}, {2}, client={3}, {4})', matrix.client-type, matrix.setup, matrix.python-version, matrix.client-version, matrix.suite) }}
 
     strategy:
       fail-fast: false
       matrix:
         client-type: [library, server]
-        # Use vllm on weekly schedule, otherwise use test-provider input (defaults to ollama)
-        provider: ${{ (github.event.schedule == '1 0 * * 0') && fromJSON('["vllm"]') || fromJSON(format('["{0}"]', github.event.inputs.test-provider || 'ollama')) }}
+        # Use vllm on weekly schedule, otherwise use test-setup input (defaults to ollama)
+        setup: ${{ (github.event.schedule == '1 0 * * 0') && fromJSON('["vllm"]') || fromJSON(format('["{0}"]', github.event.inputs.test-setup || 'ollama')) }}
         # Use Python 3.13 only on nightly schedule (daily latest client test), otherwise use 3.12
         python-version: ${{ github.event.schedule == '0 0 * * *' && fromJSON('["3.12", "3.13"]') || fromJSON('["3.12"]') }}
         client-version: ${{ (github.event.schedule == '0 0 * * *' || github.event.inputs.test-all-client-versions == 'true') && fromJSON('["published", "latest"]') || fromJSON('["latest"]') }}
-        test-suite: [base, vision]
+        suite: [base, vision]
 
     steps:
       - name: Checkout repository
@@ -64,14 +64,14 @@ jobs:
         with:
           python-version: ${{ matrix.python-version }}
           client-version: ${{ matrix.client-version }}
-          provider: ${{ matrix.provider }}
-          test-suite: ${{ matrix.test-suite }}
+          setup: ${{ matrix.setup }}
+          suite: ${{ matrix.suite }}
           inference-mode: 'replay'
 
       - name: Run tests
         uses: ./.github/actions/run-and-record-tests
         with:
           stack-config: ${{ matrix.client-type == 'library' && 'ci-tests' || 'server:ci-tests' }}
-          provider: ${{ matrix.provider }}
+          setup: ${{ matrix.setup }}
           inference-mode: 'replay'
-          test-suite: ${{ matrix.test-suite }}
+          suite: ${{ matrix.suite }}
diff --git a/.github/workflows/record-integration-tests.yml b/.github/workflows/record-integration-tests.yml
index 01797a54b..65a04f125 100644
--- a/.github/workflows/record-integration-tests.yml
+++ b/.github/workflows/record-integration-tests.yml
@@ -10,19 +10,19 @@ run-name: Run the integration test suite from tests/integration
 on:
   workflow_dispatch:
     inputs:
-      test-provider:
-        description: 'Test against a specific provider'
+      test-setup:
+        description: 'Test against a specific setup'
         type: string
         default: 'ollama'
-      test-suite:
+      suite:
         description: 'Test suite to use: base, responses, vision, etc.'
         type: string
         default: ''
-      test-subdirs:
-        description: 'Comma-separated list of test subdirectories to run; overrides test-suite'
+      subdirs:
+        description: 'Comma-separated list of test subdirectories to run; overrides suite'
         type: string
         default: ''
-      test-pattern:
+      pattern:
         description: 'Regex pattern to pass to pytest -k'
         type: string
         default: ''
@@ -39,10 +39,10 @@ jobs:
         run: |
           echo "::group::Workflow Inputs"
           echo "branch: ${{ github.ref_name }}"
-          echo "test-provider: ${{ inputs.test-provider }}"
-          echo "test-suite: ${{ inputs.test-suite }}"
-          echo "test-subdirs: ${{ inputs.test-subdirs }}"
-          echo "test-pattern: ${{ inputs.test-pattern }}"
+          echo "test-setup: ${{ inputs.test-setup }}"
+          echo "suite: ${{ inputs.suite }}"
+          echo "subdirs: ${{ inputs.subdirs }}"
+          echo "pattern: ${{ inputs.pattern }}"
           echo "::endgroup::"
 
       - name: Checkout repository
@@ -55,16 +55,16 @@ jobs:
         with:
           python-version: "3.12"  # Use single Python version for recording
           client-version: "latest"
-          provider: ${{ inputs.test-provider || 'ollama' }}
-          test-suite: ${{ inputs.test-suite }}
+          setup: ${{ inputs.test-setup || 'ollama' }}
+          suite: ${{ inputs.suite }}
           inference-mode: 'record'
 
       - name: Run and record tests
         uses: ./.github/actions/run-and-record-tests
         with:
           stack-config: 'server:ci-tests'  # recording must be done with server since more tests are run
-          provider: ${{ inputs.test-provider || 'ollama' }}
+          setup: ${{ inputs.test-setup || 'ollama' }}
           inference-mode: 'record'
-          test-suite: ${{ inputs.test-suite }}
-          test-subdirs: ${{ inputs.test-subdirs }}
-          test-pattern: ${{ inputs.test-pattern }}
+          suite: ${{ inputs.suite }}
+          subdirs: ${{ inputs.subdirs }}
+          pattern: ${{ inputs.pattern }}
diff --git a/scripts/get_setup_env.py b/scripts/get_setup_env.py
new file mode 100644
index 000000000..fad601e76
--- /dev/null
+++ b/scripts/get_setup_env.py
@@ -0,0 +1,71 @@
+#!/usr/bin/env python3
+# Copyright (c) Meta Platforms, Inc. and affiliates.
+# All rights reserved.
+#
+# This source code is licensed under the terms described in the LICENSE file in
+# the root directory of this source tree.
+
+"""
+Small helper script to extract environment variables from a test setup.
+Used by integration-tests.sh to set environment variables before starting the server.
+"""
+
+import argparse
+import sys
+
+from tests.integration.suites import SETUP_DEFINITIONS, SUITE_DEFINITIONS
+
+
+def get_setup_env_vars(setup_name, suite_name=None):
+    """
+    Get environment variables for a setup, with optional suite default fallback.
+
+    Args:
+        setup_name: Name of the setup (e.g., 'ollama', 'gpt')
+        suite_name: Optional suite name to get default setup if setup_name is None
+
+    Returns:
+        Dictionary of environment variables
+    """
+    # If no setup specified, try to get default from suite
+    if not setup_name and suite_name:
+        suite = SUITE_DEFINITIONS.get(suite_name)
+        if suite and suite.default_setup:
+            setup_name = suite.default_setup
+
+    if not setup_name:
+        return {}
+
+    setup = SETUP_DEFINITIONS.get(setup_name)
+    if not setup:
+        print(
+            f"Error: Unknown setup '{setup_name}'. Available: {', '.join(sorted(SETUP_DEFINITIONS.keys()))}",
+            file=sys.stderr,
+        )
+        sys.exit(1)
+
+    return setup.env
+
+
+def main():
+    parser = argparse.ArgumentParser(description="Extract environment variables from a test setup")
+    parser.add_argument("--setup", help="Setup name (e.g., ollama, gpt)")
+    parser.add_argument("--suite", help="Suite name to get default setup from if --setup not provided")
+    parser.add_argument("--format", choices=["bash", "json"], default="bash", help="Output format (default: bash)")
+
+    args = parser.parse_args()
+
+    env_vars = get_setup_env_vars(args.setup, args.suite)
+
+    if args.format == "bash":
+        # Output as bash export statements
+        for key, value in env_vars.items():
+            print(f"export {key}='{value}'")
+    elif args.format == "json":
+        import json
+
+        print(json.dumps(env_vars))
+
+
+if __name__ == "__main__":
+    main()
diff --git a/scripts/github/schedule-record-workflow.sh b/scripts/github/schedule-record-workflow.sh
index 09e055611..c292e53e6 100755
--- a/scripts/github/schedule-record-workflow.sh
+++ b/scripts/github/schedule-record-workflow.sh
@@ -14,7 +14,7 @@ set -euo pipefail
 # Default values
 BRANCH=""
 TEST_SUBDIRS=""
-TEST_PROVIDER="ollama"
+TEST_SETUP="ollama"
 TEST_SUITE="base"
 TEST_PATTERN=""
 
@@ -27,24 +27,24 @@ Trigger the integration test recording workflow remotely. This way you do not ne
 
 OPTIONS:
     -b, --branch BRANCH         Branch to run the workflow on (defaults to current branch)
-    -p, --test-provider PROVIDER Test provider to use: vllm or ollama (default: ollama)
-    -t, --test-suite SUITE      Test suite to use: base, responses, vision, etc. (default: base)
-    -s, --test-subdirs DIRS     Comma-separated list of test subdirectories to run (overrides suite)
-    -k, --test-pattern PATTERN  Regex pattern to pass to pytest -k
+    -t, --suite SUITE           Test suite to use: base, responses, vision, etc. (default: base)
+    -p, --setup SETUP           Test setup to use: vllm, ollama, gpt, etc. (default: ollama)
+    -s, --subdirs DIRS          Comma-separated list of test subdirectories to run (overrides suite)
+    -k, --pattern PATTERN       Regex pattern to pass to pytest -k
     -h, --help                  Show this help message
 
 EXAMPLES:
     # Record tests for current branch with agents subdirectory
-    $0 --test-subdirs "agents"
+    $0 --subdirs "agents"
 
     # Record tests for specific branch with vision tests
-    $0 -b my-feature-branch --test-suite vision
+    $0 -b my-feature-branch --suite vision
 
-    # Record multiple test subdirectories with specific provider
-    $0 --test-subdirs "agents,inference" --test-provider vllm
+    # Record multiple test subdirectories with specific setup
+    $0 --subdirs "agents,inference" --setup vllm
 
     # Record tests matching a specific pattern
-    $0 --test-subdirs "inference" --test-pattern "test_streaming"
+    $0 --subdirs "inference" --pattern "test_streaming"
 
 EOF
 }
@@ -63,19 +63,19 @@ while [[ $# -gt 0 ]]; do
             BRANCH="$2"
             shift 2
             ;;
-        -s|--test-subdirs)
+        -s|--subdirs)
             TEST_SUBDIRS="$2"
             shift 2
             ;;
-        -p|--test-provider)
-            TEST_PROVIDER="$2"
+        -p|--setup)
+            TEST_SETUP="$2"
             shift 2
             ;;
-        -t|--test-suite)
+        -t|--suite)
             TEST_SUITE="$2"
             shift 2
             ;;
-        -k|--test-pattern)
+        -k|--pattern)
             TEST_PATTERN="$2"
             shift 2
             ;;
@@ -93,21 +93,16 @@ done
 
 # Validate required parameters
 if [[ -z "$TEST_SUBDIRS" && -z "$TEST_SUITE" ]]; then
-    echo "Error: --test-subdirs or --test-suite is required"
+    echo "Error: --subdirs or --suite is required"
     echo "Please specify which test subdirectories to run or test suite to use, e.g.:"
-    echo "  $0 --test-subdirs \"agents,inference\""
-    echo "  $0 --test-suite vision"
+    echo "  $0 --subdirs \"agents,inference\""
+    echo "  $0 --suite vision"
     echo ""
     exit 1
 fi
 
-# Validate test provider
-if [[ "$TEST_PROVIDER" != "vllm" && "$TEST_PROVIDER" != "ollama" ]]; then
-    echo "❌ Error: Invalid test provider '$TEST_PROVIDER'"
-    echo "   Supported providers: vllm, ollama"
-    echo "   Example: $0 --test-subdirs \"agents\" --test-provider vllm"
-    exit 1
-fi
+# Validate test setup (optional - setups are validated by the workflow itself)
+# Common setups: ollama, vllm, gpt, etc.
 
 # Check if required tools are installed
 if ! command -v gh &> /dev/null; then
@@ -237,7 +232,7 @@ fi
 # Build the workflow dispatch command
 echo "Triggering integration test recording workflow..."
 echo "Branch: $BRANCH"
-echo "Test provider: $TEST_PROVIDER"
+echo "Test setup: $TEST_SETUP"
 echo "Test subdirs: $TEST_SUBDIRS"
 echo "Test suite: $TEST_SUITE"
 echo "Test pattern: ${TEST_PATTERN:-"(none)"}"
@@ -245,16 +240,16 @@ echo ""
 
 # Prepare inputs for gh workflow run
 if [[ -n "$TEST_SUBDIRS" ]]; then
-    INPUTS="-f test-subdirs='$TEST_SUBDIRS'"
+    INPUTS="-f subdirs='$TEST_SUBDIRS'"
 fi
-if [[ -n "$TEST_PROVIDER" ]]; then
-    INPUTS="$INPUTS -f test-provider='$TEST_PROVIDER'"
+if [[ -n "$TEST_SETUP" ]]; then
+    INPUTS="$INPUTS -f test-setup='$TEST_SETUP'"
 fi
 if [[ -n "$TEST_SUITE" ]]; then
-    INPUTS="$INPUTS -f test-suite='$TEST_SUITE'"
+    INPUTS="$INPUTS -f suite='$TEST_SUITE'"
 fi
 if [[ -n "$TEST_PATTERN" ]]; then
-    INPUTS="$INPUTS -f test-pattern='$TEST_PATTERN'"
+    INPUTS="$INPUTS -f pattern='$TEST_PATTERN'"
 fi
 
 # Run the workflow
diff --git a/scripts/integration-tests.sh b/scripts/integration-tests.sh
index ab7e37579..eee60951d 100755
--- a/scripts/integration-tests.sh
+++ b/scripts/integration-tests.sh
@@ -13,10 +13,10 @@ set -euo pipefail
 
 # Default values
 STACK_CONFIG=""
-PROVIDER=""
+TEST_SUITE="base"
+TEST_SETUP=""
 TEST_SUBDIRS=""
 TEST_PATTERN=""
-TEST_SUITE="base"
 INFERENCE_MODE="replay"
 EXTRA_PARAMS=""
 
@@ -27,29 +27,30 @@ Usage: $0 [OPTIONS]
 
 Options:
     --stack-config STRING    Stack configuration to use (required)
-    --provider STRING        Provider to use (ollama, vllm, etc.) (required)
-    --test-suite STRING      Comma-separated list of test suites to run (default: 'base')
+    --suite STRING           Test suite to run (default: 'base')
+    --setup STRING           Test setup (models, env) to use (e.g., 'ollama', 'ollama-vision', 'gpt', 'vllm')
     --inference-mode STRING  Inference mode: record or replay (default: replay)
-    --test-subdirs STRING    Comma-separated list of test subdirectories to run (overrides suite)
-    --test-pattern STRING    Regex pattern to pass to pytest -k
+    --subdirs STRING         Comma-separated list of test subdirectories to run (overrides suite)
+    --pattern STRING         Regex pattern to pass to pytest -k
     --help                   Show this help message
 
-Suites are defined in tests/integration/suites.py. They are used to narrow the collection of tests and provide default model options.
+Suites are defined in tests/integration/suites.py and define which tests to run.
+Setups are defined in tests/integration/setups.py and provide global configuration (models, env).
 
 You can also specify subdirectories (of tests/integration) to select tests from, which will override the suite.
 
 Examples:
     # Basic inference tests with ollama
-    $0 --stack-config server:ci-tests --provider ollama
+    $0 --stack-config server:ci-tests --suite base --setup ollama
 
     # Multiple test directories with vllm
-    $0 --stack-config server:ci-tests --provider vllm --test-subdirs 'inference,agents'
+    $0 --stack-config server:ci-tests --subdirs 'inference,agents' --setup vllm
 
     # Vision tests with ollama
-    $0 --stack-config server:ci-tests --provider ollama --test-suite vision
+    $0 --stack-config server:ci-tests --suite vision  # default setup for this suite is ollama-vision
 
     # Record mode for updating test recordings
-    $0 --stack-config server:ci-tests --provider ollama --inference-mode record
+    $0 --stack-config server:ci-tests --suite base --inference-mode record
 EOF
 }
 
@@ -60,15 +61,15 @@ while [[ $# -gt 0 ]]; do
             STACK_CONFIG="$2"
             shift 2
             ;;
-        --provider)
-            PROVIDER="$2"
+        --setup)
+            TEST_SETUP="$2"
             shift 2
             ;;
-        --test-subdirs)
+        --subdirs)
             TEST_SUBDIRS="$2"
             shift 2
             ;;
-        --test-suite)
+        --suite)
             TEST_SUITE="$2"
             shift 2
             ;;
@@ -76,7 +77,7 @@ while [[ $# -gt 0 ]]; do
             INFERENCE_MODE="$2"
             shift 2
             ;;
-        --test-pattern)
+        --pattern)
             TEST_PATTERN="$2"
             shift 2
             ;;
@@ -96,11 +97,13 @@ done
 # Validate required parameters
 if [[ -z "$STACK_CONFIG" ]]; then
     echo "Error: --stack-config is required"
+    usage
     exit 1
 fi
 
-if [[ -z "$PROVIDER" ]]; then
-    echo "Error: --provider is required"
+if [[ -z "$TEST_SETUP" && -n "$TEST_SUBDIRS" ]]; then
+    echo "Error: --test-setup is required when --test-subdirs is provided"
+    usage
     exit 1
 fi
 
@@ -111,7 +114,7 @@ fi
 
 echo "=== Llama Stack Integration Test Runner ==="
 echo "Stack Config: $STACK_CONFIG"
-echo "Provider: $PROVIDER"
+echo "Setup: $TEST_SETUP"
 echo "Inference Mode: $INFERENCE_MODE"
 echo "Test Suite: $TEST_SUITE"
 echo "Test Subdirs: $TEST_SUBDIRS"
@@ -129,21 +132,25 @@ echo ""
 
 # Set environment variables
 export LLAMA_STACK_CLIENT_TIMEOUT=300
-export LLAMA_STACK_TEST_INFERENCE_MODE="$INFERENCE_MODE"
-
-# Configure provider-specific settings
-if [[ "$PROVIDER" == "ollama" ]]; then
-    export OLLAMA_URL="http://0.0.0.0:11434"
-    export TEXT_MODEL="ollama/llama3.2:3b-instruct-fp16"
-    export SAFETY_MODEL="ollama/llama-guard3:1b"
-    EXTRA_PARAMS="--safety-shield=llama-guard"
-else
-    export VLLM_URL="http://localhost:8000/v1"
-    export TEXT_MODEL="vllm/meta-llama/Llama-3.2-1B-Instruct"
-    EXTRA_PARAMS=""
-fi
 
 THIS_DIR=$(dirname "$0")
+
+if [[ -n "$TEST_SETUP" ]]; then
+    EXTRA_PARAMS="--setup=$TEST_SETUP"
+fi
+
+# Apply setup-specific environment variables (needed for server startup and tests)
+echo "=== Applying Setup Environment Variables ==="
+
+# the server needs this
+export LLAMA_STACK_TEST_INFERENCE_MODE="$INFERENCE_MODE"
+
+SETUP_ENV=$(PYTHONPATH=$THIS_DIR/.. python "$THIS_DIR/get_setup_env.py" --suite "$TEST_SUITE" --setup "$TEST_SETUP" --format bash)
+echo "Setting up environment variables:"
+echo "$SETUP_ENV"
+eval "$SETUP_ENV"
+echo ""
+
 ROOT_DIR="$THIS_DIR/.."
 cd $ROOT_DIR
 
@@ -162,6 +169,18 @@ fi
 
 # Start Llama Stack Server if needed
 if [[ "$STACK_CONFIG" == *"server:"* ]]; then
+    stop_server() {
+        echo "Stopping Llama Stack Server..."
+        pids=$(lsof -i :8321 | awk 'NR>1 {print $2}')
+        if [[ -n "$pids" ]]; then
+            echo "Killing Llama Stack Server processes: $pids"
+            kill -9 $pids
+        else
+            echo "No Llama Stack Server processes found ?!"
+        fi
+        echo "Llama Stack Server stopped"
+    }
+
     # check if server is already running
     if curl -s http://localhost:8321/v1/health 2>/dev/null | grep -q "OK"; then
         echo "Llama Stack Server is already running, skipping start"
@@ -185,14 +204,16 @@ if [[ "$STACK_CONFIG" == *"server:"* ]]; then
         done
         echo ""
     fi
+
+    trap stop_server EXIT ERR INT TERM
 fi
 
 # Run tests
 echo "=== Running Integration Tests ==="
 EXCLUDE_TESTS="builtin_tool or safety_with_image or code_interpreter or test_rag"
 
-# Additional exclusions for vllm provider
-if [[ "$PROVIDER" == "vllm" ]]; then
+# Additional exclusions for vllm setup
+if [[ "$TEST_SETUP" == "vllm" ]]; then
     EXCLUDE_TESTS="${EXCLUDE_TESTS} or test_inference_store_tool_calls"
 fi
 
@@ -229,20 +250,22 @@ if [[ -n "$TEST_SUBDIRS" ]]; then
     echo "Total test files: $(echo $TEST_FILES | wc -w)"
 
     PYTEST_TARGET="$TEST_FILES"
-    EXTRA_PARAMS="$EXTRA_PARAMS --text-model=$TEXT_MODEL --embedding-model=sentence-transformers/all-MiniLM-L6-v2"
 else
     PYTEST_TARGET="tests/integration/"
     EXTRA_PARAMS="$EXTRA_PARAMS --suite=$TEST_SUITE"
 fi
 
 set +e
+set -x
 pytest -s -v $PYTEST_TARGET \
     --stack-config="$STACK_CONFIG" \
+    --inference-mode="$INFERENCE_MODE" \
     -k "$PYTEST_PATTERN" \
     $EXTRA_PARAMS \
     --color=yes \
     --capture=tee-sys
 exit_code=$?
+set +x
 set -e
 
 if [ $exit_code -eq 0 ]; then
@@ -260,18 +283,5 @@ echo "=== System Resources After Tests ==="
 free -h 2>/dev/null || echo "free command not available"
 df -h
 
-# stop server
-if [[ "$STACK_CONFIG" == *"server:"* ]]; then
-    echo "Stopping Llama Stack Server..."
-    pids=$(lsof -i :8321 | awk 'NR>1 {print $2}')
-    if [[ -n "$pids" ]]; then
-        echo "Killing Llama Stack Server processes: $pids"
-        kill -9 $pids
-    else
-        echo "No Llama Stack Server processes found ?!"
-    fi
-    echo "Llama Stack Server stopped"
-fi
-
 echo ""
 echo "=== Integration Tests Complete ==="
diff --git a/tests/integration/README.md b/tests/integration/README.md
index b05beeb98..467f97e02 100644
--- a/tests/integration/README.md
+++ b/tests/integration/README.md
@@ -6,9 +6,7 @@ Integration tests verify complete workflows across different providers using Lla
 
 ```bash
 # Run all integration tests with existing recordings
-LLAMA_STACK_TEST_INFERENCE_MODE=replay \
-  LLAMA_STACK_TEST_RECORDING_DIR=tests/integration/recordings \
-  uv run --group test \
+uv run --group test \
   pytest -sv tests/integration/ --stack-config=starter
 ```
 
@@ -42,25 +40,35 @@ Model parameters can be influenced by the following options:
 Each of these are comma-separated lists and can be used to generate multiple parameter combinations. Note that tests will be skipped
 if no model is specified.
 
-### Suites (fast selection + sane defaults)
+### Suites and Setups
 
-- `--suite`: comma-separated list of named suites that both narrow which tests are collected and prefill common model options (unless you pass them explicitly).
+- `--suite`: single named suite that narrows which tests are collected.
 - Available suites:
-  - `responses`: collects tests under `tests/integration/responses`; this is a separate suite because it needs a strong tool-calling model.
-  - `vision`: collects only `tests/integration/inference/test_vision_inference.py`; defaults `--vision-model=ollama/llama3.2-vision:11b`, `--embedding-model=sentence-transformers/all-MiniLM-L6-v2`.
-- Explicit flags always win. For example, `--suite=responses --text-model=<X>` overrides the suite’s text model.
+  - `base`: collects most tests (excludes responses and post_training)
+  - `responses`: collects tests under `tests/integration/responses` (needs strong tool-calling models)
+  - `vision`: collects only `tests/integration/inference/test_vision_inference.py`
+- `--setup`: global configuration that can be used with any suite. Setups prefill model/env defaults; explicit CLI flags always win.
+  - Available setups:
+    - `ollama`: Local Ollama provider with lightweight models (sets OLLAMA_URL, uses llama3.2:3b-instruct-fp16)
+    - `vllm`: VLLM provider for efficient local inference (sets VLLM_URL, uses Llama-3.2-1B-Instruct)
+    - `gpt`: OpenAI GPT models for high-quality responses (uses gpt-4o)
+    - `claude`: Anthropic Claude models for high-quality responses (uses claude-3-5-sonnet)
 
-Examples:
+Examples
 
 ```bash
-# Fast responses run with defaults
-pytest -s -v tests/integration --stack-config=server:starter --suite=responses
+# Fast responses run with a strong tool-calling model
+pytest -s -v tests/integration --stack-config=server:starter --suite=responses --setup=gpt
 
-# Fast single-file vision run with defaults
-pytest -s -v tests/integration --stack-config=server:starter --suite=vision
+# Fast single-file vision run with Ollama defaults
+pytest -s -v tests/integration --stack-config=server:starter --suite=vision --setup=ollama
 
-# Combine suites and override a default
-pytest -s -v tests/integration --stack-config=server:starter --suite=responses,vision --embedding-model=text-embedding-3-small
+# Base suite with VLLM for performance
+pytest -s -v tests/integration --stack-config=server:starter --suite=base --setup=vllm
+
+# Override a default from setup
+pytest -s -v tests/integration --stack-config=server:starter \
+  --suite=responses --setup=gpt --embedding-model=text-embedding-3-small
 ```
 
 ## Examples
@@ -127,14 +135,13 @@ pytest tests/integration/
 ### RECORD Mode
 Captures API interactions for later replay:
 ```bash
-LLAMA_STACK_TEST_INFERENCE_MODE=record \
-pytest tests/integration/inference/test_new_feature.py
+pytest tests/integration/inference/test_new_feature.py --inference-mode=record
 ```
 
 ### LIVE Mode
 Tests make real API calls (but not recorded):
 ```bash
-LLAMA_STACK_TEST_INFERENCE_MODE=live pytest tests/integration/
+pytest tests/integration/ --inference-mode=live
 ```
 
 By default, the recording directory is `tests/integration/recordings`. You can override this by setting the `LLAMA_STACK_TEST_RECORDING_DIR` environment variable.
@@ -155,15 +162,14 @@ cat recordings/responses/abc123.json | jq '.'
 #### Remote Re-recording (Recommended)
 Use the automated workflow script for easier re-recording:
 ```bash
-./scripts/github/schedule-record-workflow.sh --test-subdirs "inference,agents"
+./scripts/github/schedule-record-workflow.sh --subdirs "inference,agents"
 ```
 See the [main testing guide](../README.md#remote-re-recording-recommended) for full details.
 
 #### Local Re-recording
 ```bash
 # Re-record specific tests
-LLAMA_STACK_TEST_INFERENCE_MODE=record \
-pytest -s -v --stack-config=server:starter tests/integration/inference/test_modified.py
+pytest -s -v --stack-config=server:starter tests/integration/inference/test_modified.py --inference-mode=record
 ```
 
 Note that when re-recording tests, you must use a Stack pointing to a server (i.e., `server:starter`). This subtlety exists because the set of tests run in server are a superset of the set of tests run in the library client.
diff --git a/tests/integration/conftest.py b/tests/integration/conftest.py
index 96260fdb7..4735264c3 100644
--- a/tests/integration/conftest.py
+++ b/tests/integration/conftest.py
@@ -15,7 +15,7 @@ from dotenv import load_dotenv
 
 from llama_stack.log import get_logger
 
-from .suites import SUITE_DEFINITIONS
+from .suites import SETUP_DEFINITIONS, SUITE_DEFINITIONS
 
 logger = get_logger(__name__, category="tests")
 
@@ -63,19 +63,33 @@ def pytest_configure(config):
         key, value = env_var.split("=", 1)
         os.environ[key] = value
 
-    suites_raw = config.getoption("--suite")
-    suites: list[str] = []
-    if suites_raw:
-        suites = [p.strip() for p in str(suites_raw).split(",") if p.strip()]
-        unknown = [p for p in suites if p not in SUITE_DEFINITIONS]
-        if unknown:
+    inference_mode = config.getoption("--inference-mode")
+    os.environ["LLAMA_STACK_TEST_INFERENCE_MODE"] = inference_mode
+
+    suite = config.getoption("--suite")
+    if suite:
+        if suite not in SUITE_DEFINITIONS:
+            raise pytest.UsageError(f"Unknown suite: {suite}. Available: {', '.join(sorted(SUITE_DEFINITIONS.keys()))}")
+
+    # Apply setups (global parameterizations): env + defaults
+    setup = config.getoption("--setup")
+    if suite and not setup:
+        setup = SUITE_DEFINITIONS[suite].default_setup
+
+    if setup:
+        if setup not in SETUP_DEFINITIONS:
             raise pytest.UsageError(
-                f"Unknown suite(s): {', '.join(unknown)}. Available: {', '.join(sorted(SUITE_DEFINITIONS.keys()))}"
+                f"Unknown setup '{setup}'. Available: {', '.join(sorted(SETUP_DEFINITIONS.keys()))}"
             )
-    for suite in suites:
-        suite_def = SUITE_DEFINITIONS.get(suite, {})
-        defaults: dict = suite_def.get("defaults", {})
-        for dest, value in defaults.items():
+
+        setup_obj = SETUP_DEFINITIONS[setup]
+        logger.info(f"Applying setup '{setup}'{' for suite ' + suite if suite else ''}")
+        # Apply env first
+        for k, v in setup_obj.env.items():
+            if k not in os.environ:
+                os.environ[k] = str(v)
+        # Apply defaults if not provided explicitly
+        for dest, value in setup_obj.defaults.items():
             current = getattr(config.option, dest, None)
             if not current:
                 setattr(config.option, dest, value)
@@ -120,6 +134,13 @@ def pytest_addoption(parser):
         default=384,
         help="Output dimensionality of the embedding model to use for testing. Default: 384",
     )
+
+    parser.addoption(
+        "--inference-mode",
+        help="Inference mode: { record, replay, live } (default: replay)",
+        choices=["record", "replay", "live"],
+        default="replay",
+    )
     parser.addoption(
         "--report",
         help="Path where the test report should be written, e.g. --report=/path/to/report.md",
@@ -127,14 +148,18 @@ def pytest_addoption(parser):
 
     available_suites = ", ".join(sorted(SUITE_DEFINITIONS.keys()))
     suite_help = (
-        "Comma-separated integration test suites to narrow collection and prefill defaults. "
-        "Available: "
-        f"{available_suites}. "
-        "Explicit CLI flags (e.g., --text-model) override suite defaults. "
-        "Examples: --suite=responses or --suite=responses,vision."
+        f"Single test suite to run (narrows collection). Available: {available_suites}. Example: --suite=responses"
     )
     parser.addoption("--suite", help=suite_help)
 
+    # Global setups for any suite
+    available_setups = ", ".join(sorted(SETUP_DEFINITIONS.keys()))
+    setup_help = (
+        f"Global test setup configuration. Available: {available_setups}. "
+        "Can be used with any suite. Example: --setup=ollama"
+    )
+    parser.addoption("--setup", help=setup_help)
+
 
 MODEL_SHORT_IDS = {
     "meta-llama/Llama-3.2-3B-Instruct": "3B",
@@ -221,16 +246,12 @@ pytest_plugins = ["tests.integration.fixtures.common"]
 
 def pytest_ignore_collect(path: str, config: pytest.Config) -> bool:
     """Skip collecting paths outside the selected suite roots for speed."""
-    suites_raw = config.getoption("--suite")
-    if not suites_raw:
+    suite = config.getoption("--suite")
+    if not suite:
         return False
 
-    names = [p.strip() for p in str(suites_raw).split(",") if p.strip()]
-    roots: list[str] = []
-    for name in names:
-        suite_def = SUITE_DEFINITIONS.get(name)
-        if suite_def:
-            roots.extend(suite_def.get("roots", []))
+    sobj = SUITE_DEFINITIONS.get(suite)
+    roots: list[str] = sobj.get("roots", []) if isinstance(sobj, dict) else getattr(sobj, "roots", [])
     if not roots:
         return False
 
diff --git a/tests/integration/suites.py b/tests/integration/suites.py
index 602855055..bacd7ef52 100644
--- a/tests/integration/suites.py
+++ b/tests/integration/suites.py
@@ -8,46 +8,112 @@
 # For example:
 #
 # ```bash
-# pytest tests/integration/ --suite=vision
+# pytest tests/integration/ --suite=vision --setup=ollama
 # ```
 #
-# Each suite can:
-# - restrict collection to specific roots (dirs or files)
-# - provide default CLI option values (e.g. text_model, embedding_model, etc.)
+"""
+Each suite defines what to run (roots). Suites can be run with different global setups defined in setups.py.
+Setups provide environment variables and model defaults that can be reused across multiple suites.
+
+CLI examples:
+  pytest tests/integration --suite=responses --setup=gpt
+  pytest tests/integration --suite=vision --setup=ollama
+  pytest tests/integration --suite=base --setup=vllm
+"""
 
 from pathlib import Path
 
+from pydantic import BaseModel, Field
+
 this_dir = Path(__file__).parent
-default_roots = [
+
+
+class Suite(BaseModel):
+    name: str
+    roots: list[str]
+    default_setup: str | None = None
+
+
+class Setup(BaseModel):
+    """A reusable test configuration with environment and CLI defaults."""
+
+    name: str
+    description: str
+    defaults: dict[str, str] = Field(default_factory=dict)
+    env: dict[str, str] = Field(default_factory=dict)
+
+
+# Global setups - can be used with any suite "technically" but in reality, some setups might work
+# only for specific test suites.
+SETUP_DEFINITIONS: dict[str, Setup] = {
+    "ollama": Setup(
+        name="ollama",
+        description="Local Ollama provider with text + safety models",
+        env={
+            "OLLAMA_URL": "http://0.0.0.0:11434",
+            "SAFETY_MODEL": "ollama/llama-guard3:1b",
+        },
+        defaults={
+            "text_model": "ollama/llama3.2:3b-instruct-fp16",
+            "embedding_model": "sentence-transformers/all-MiniLM-L6-v2",
+            "safety_model": "ollama/llama-guard3:1b",
+            "safety_shield": "llama-guard",
+        },
+    ),
+    "ollama-vision": Setup(
+        name="ollama",
+        description="Local Ollama provider with a vision model",
+        env={
+            "OLLAMA_URL": "http://0.0.0.0:11434",
+        },
+        defaults={
+            "vision_model": "ollama/llama3.2-vision:11b",
+            "embedding_model": "sentence-transformers/all-MiniLM-L6-v2",
+        },
+    ),
+    "vllm": Setup(
+        name="vllm",
+        description="vLLM provider with a text model",
+        env={
+            "VLLM_URL": "http://localhost:8000/v1",
+        },
+        defaults={
+            "text_model": "vllm/meta-llama/Llama-3.2-1B-Instruct",
+            "embedding_model": "sentence-transformers/all-MiniLM-L6-v2",
+        },
+    ),
+    "gpt": Setup(
+        name="gpt",
+        description="OpenAI GPT models for high-quality responses and tool calling",
+        defaults={
+            "text_model": "openai/gpt-4o",
+            "embedding_model": "sentence-transformers/all-MiniLM-L6-v2",
+        },
+    ),
+}
+
+
+base_roots = [
     str(p)
     for p in this_dir.glob("*")
     if p.is_dir()
     and p.name not in ("__pycache__", "fixtures", "test_cases", "recordings", "responses", "post_training")
 ]
 
-SUITE_DEFINITIONS: dict[str, dict] = {
-    "base": {
-        "description": "Base suite that includes most tests but runs them with a text Ollama model",
-        "roots": default_roots,
-        "defaults": {
-            "text_model": "ollama/llama3.2:3b-instruct-fp16",
-            "embedding_model": "sentence-transformers/all-MiniLM-L6-v2",
-        },
-    },
-    "responses": {
-        "description": "Suite that includes only the OpenAI Responses tests; needs a strong tool-calling model",
-        "roots": ["tests/integration/responses"],
-        "defaults": {
-            "text_model": "openai/gpt-4o",
-            "embedding_model": "sentence-transformers/all-MiniLM-L6-v2",
-        },
-    },
-    "vision": {
-        "description": "Suite that includes only the vision tests",
-        "roots": ["tests/integration/inference/test_vision_inference.py"],
-        "defaults": {
-            "vision_model": "ollama/llama3.2-vision:11b",
-            "embedding_model": "sentence-transformers/all-MiniLM-L6-v2",
-        },
-    },
+SUITE_DEFINITIONS: dict[str, Suite] = {
+    "base": Suite(
+        name="base",
+        roots=base_roots,
+        default_setup="ollama",
+    ),
+    "responses": Suite(
+        name="responses",
+        roots=["tests/integration/responses"],
+        default_setup="gpt",
+    ),
+    "vision": Suite(
+        name="vision",
+        roots=["tests/integration/inference/test_vision_inference.py"],
+        default_setup="ollama-vision",
+    ),
 }

From 9d3a234bf3772083e148d8168a204b9cb2c200ac Mon Sep 17 00:00:00 2001
From: ehhuang <ehhuang@users.noreply.github.com>
Date: Tue, 9 Sep 2025 15:51:20 -0700
Subject: [PATCH 49/76] chore: remove unused variable (#3389)

# What does this PR do?


## Test Plan
---
 llama_stack/core/library_client.py | 2 --
 1 file changed, 2 deletions(-)

diff --git a/llama_stack/core/library_client.py b/llama_stack/core/library_client.py
index 9e7a8006c..ea5a2ac8e 100644
--- a/llama_stack/core/library_client.py
+++ b/llama_stack/core/library_client.py
@@ -10,7 +10,6 @@ import json
 import logging  # allow-direct-logging
 import os
 import sys
-from concurrent.futures import ThreadPoolExecutor
 from enum import Enum
 from io import BytesIO
 from pathlib import Path
@@ -148,7 +147,6 @@ class LlamaStackAsLibraryClient(LlamaStackClient):
         self.async_client = AsyncLlamaStackAsLibraryClient(
             config_path_or_distro_name, custom_provider_registry, provider_data, skip_logger_removal
         )
-        self.pool_executor = ThreadPoolExecutor(max_workers=4)
         self.provider_data = provider_data
 
         self.loop = asyncio.new_event_loop()

From dd1f946b3ee4232dc8e13d3836e7f19e65f5e112 Mon Sep 17 00:00:00 2001
From: Matthew Farrellee <matt@cs.wisc.edu>
Date: Tue, 9 Sep 2025 18:54:58 -0400
Subject: [PATCH 50/76] feat: include a default inference store during llama
 stack build (#3373)

# What does this PR do?

enables completions storage when using `llama stack build --providers` -
 - GET /v1/chat/completions
 - GET /v1/chat/completions/{id}

todo: llama stack build and distro codegen should use the same code
paths

## Test Plan

ci
---
 llama_stack/cli/stack/_build.py | 7 +++++++
 1 file changed, 7 insertions(+)

diff --git a/llama_stack/cli/stack/_build.py b/llama_stack/cli/stack/_build.py
index c6e204773..b14e6fe55 100644
--- a/llama_stack/cli/stack/_build.py
+++ b/llama_stack/cli/stack/_build.py
@@ -45,6 +45,7 @@ from llama_stack.core.utils.dynamic import instantiate_class_type
 from llama_stack.core.utils.exec import formulate_run_args, run_command
 from llama_stack.core.utils.image_types import LlamaStackImageType
 from llama_stack.providers.datatypes import Api
+from llama_stack.providers.utils.sqlstore.sqlstore import SqliteSqlStoreConfig
 
 DISTRIBS_PATH = Path(__file__).parent.parent.parent / "distributions"
 
@@ -294,6 +295,12 @@ def _generate_run_config(
         if build_config.external_providers_dir
         else EXTERNAL_PROVIDERS_DIR,
     )
+    if not run_config.inference_store:
+        run_config.inference_store = SqliteSqlStoreConfig(
+            **SqliteSqlStoreConfig.sample_run_config(
+                __distro_dir__=(DISTRIBS_BASE_DIR / image_name).as_posix(), db_name="inference_store.db"
+            )
+        )
     # build providers dict
     provider_registry = get_provider_registry(build_config)
     for api in apis:

From 81ad240faa48d2a2d91e5fbfc3dda21443432a6f Mon Sep 17 00:00:00 2001
From: Ashwin Bharambe <ashwin.bharambe@gmail.com>
Date: Tue, 9 Sep 2025 23:00:50 -0700
Subject: [PATCH 51/76] fix(k8s): unwedge run.yaml to add files

---
 .../k8s-benchmark/stack-configmap.yaml        |  19 +-
 .../k8s-benchmark/stack_run_config.yaml       |   9 +
 .../distributions/k8s/stack-configmap.yaml    | 182 +++++-------------
 .../distributions/k8s/stack_run_config.yaml   |   9 +
 4 files changed, 77 insertions(+), 142 deletions(-)

diff --git a/docs/source/distributions/k8s-benchmark/stack-configmap.yaml b/docs/source/distributions/k8s-benchmark/stack-configmap.yaml
index edf4ebd75..bf6109b68 100644
--- a/docs/source/distributions/k8s-benchmark/stack-configmap.yaml
+++ b/docs/source/distributions/k8s-benchmark/stack-configmap.yaml
@@ -6,6 +6,7 @@ data:
     apis:
     - agents
     - inference
+    - files
     - safety
     - telemetry
     - tool_runtime
@@ -19,13 +20,6 @@ data:
           max_tokens: ${env.VLLM_MAX_TOKENS:=4096}
           api_token: ${env.VLLM_API_TOKEN:=fake}
           tls_verify: ${env.VLLM_TLS_VERIFY:=true}
-      - provider_id: vllm-safety
-        provider_type: remote::vllm
-        config:
-          url: ${env.VLLM_SAFETY_URL:=http://localhost:8000/v1}
-          max_tokens: ${env.VLLM_MAX_TOKENS:=4096}
-          api_token: ${env.VLLM_API_TOKEN:=fake}
-          tls_verify: ${env.VLLM_TLS_VERIFY:=true}
       - provider_id: sentence-transformers
         provider_type: inline::sentence-transformers
         config: {}
@@ -41,6 +35,14 @@ data:
             db: ${env.POSTGRES_DB:=llamastack}
             user: ${env.POSTGRES_USER:=llamastack}
             password: ${env.POSTGRES_PASSWORD:=llamastack}
+      files:
+      - provider_id: meta-reference-files
+        provider_type: inline::localfs
+        config:
+          storage_dir: ${env.FILES_STORAGE_DIR:=~/.llama/distributions/starter/files}
+          metadata_store:
+            type: sqlite
+            db_path: ${env.SQLITE_STORE_DIR:=~/.llama/distributions/starter}/files_metadata.db
       safety:
       - provider_id: llama-guard
         provider_type: inline::llama-guard
@@ -111,9 +113,6 @@ data:
     - model_id: ${env.INFERENCE_MODEL}
       provider_id: vllm-inference
       model_type: llm
-    - model_id: ${env.SAFETY_MODEL}
-      provider_id: vllm-safety
-      model_type: llm
     shields:
     - shield_id: ${env.SAFETY_MODEL:=meta-llama/Llama-Guard-3-1B}
     vector_dbs: []
diff --git a/docs/source/distributions/k8s-benchmark/stack_run_config.yaml b/docs/source/distributions/k8s-benchmark/stack_run_config.yaml
index 5a810639e..f8ff7811b 100644
--- a/docs/source/distributions/k8s-benchmark/stack_run_config.yaml
+++ b/docs/source/distributions/k8s-benchmark/stack_run_config.yaml
@@ -3,6 +3,7 @@ image_name: kubernetes-benchmark-demo
 apis:
 - agents
 - inference
+- files
 - safety
 - telemetry
 - tool_runtime
@@ -31,6 +32,14 @@ providers:
         db: ${env.POSTGRES_DB:=llamastack}
         user: ${env.POSTGRES_USER:=llamastack}
         password: ${env.POSTGRES_PASSWORD:=llamastack}
+  files:
+  - provider_id: meta-reference-files
+    provider_type: inline::localfs
+    config:
+      storage_dir: ${env.FILES_STORAGE_DIR:=~/.llama/distributions/starter/files}
+      metadata_store:
+        type: sqlite
+        db_path: ${env.SQLITE_STORE_DIR:=~/.llama/distributions/starter}/files_metadata.db
   safety:
   - provider_id: llama-guard
     provider_type: inline::llama-guard
diff --git a/docs/source/distributions/k8s/stack-configmap.yaml b/docs/source/distributions/k8s/stack-configmap.yaml
index 4f95554e3..3dbb0da97 100644
--- a/docs/source/distributions/k8s/stack-configmap.yaml
+++ b/docs/source/distributions/k8s/stack-configmap.yaml
@@ -1,137 +1,55 @@
 apiVersion: v1
 data:
-  stack_run_config.yaml: |
-    version: '2'
-    image_name: kubernetes-demo
-    apis:
-    - agents
-    - inference
-    - safety
-    - telemetry
-    - tool_runtime
-    - vector_io
-    providers:
-      inference:
-      - provider_id: vllm-inference
-        provider_type: remote::vllm
-        config:
-          url: ${env.VLLM_URL:=http://localhost:8000/v1}
-          max_tokens: ${env.VLLM_MAX_TOKENS:=4096}
-          api_token: ${env.VLLM_API_TOKEN:=fake}
-          tls_verify: ${env.VLLM_TLS_VERIFY:=true}
-      - provider_id: vllm-safety
-        provider_type: remote::vllm
-        config:
-          url: ${env.VLLM_SAFETY_URL:=http://localhost:8000/v1}
-          max_tokens: ${env.VLLM_MAX_TOKENS:=4096}
-          api_token: ${env.VLLM_API_TOKEN:=fake}
-          tls_verify: ${env.VLLM_TLS_VERIFY:=true}
-      - provider_id: sentence-transformers
-        provider_type: inline::sentence-transformers
-        config: {}
-      vector_io:
-      - provider_id: ${env.ENABLE_CHROMADB:+chromadb}
-        provider_type: remote::chromadb
-        config:
-          url: ${env.CHROMADB_URL:=}
-          kvstore:
-            type: postgres
-            host: ${env.POSTGRES_HOST:=localhost}
-            port: ${env.POSTGRES_PORT:=5432}
-            db: ${env.POSTGRES_DB:=llamastack}
-            user: ${env.POSTGRES_USER:=llamastack}
-            password: ${env.POSTGRES_PASSWORD:=llamastack}
-      safety:
-      - provider_id: llama-guard
-        provider_type: inline::llama-guard
-        config:
-          excluded_categories: []
-      agents:
-      - provider_id: meta-reference
-        provider_type: inline::meta-reference
-        config:
-          persistence_store:
-            type: postgres
-            host: ${env.POSTGRES_HOST:=localhost}
-            port: ${env.POSTGRES_PORT:=5432}
-            db: ${env.POSTGRES_DB:=llamastack}
-            user: ${env.POSTGRES_USER:=llamastack}
-            password: ${env.POSTGRES_PASSWORD:=llamastack}
-          responses_store:
-            type: postgres
-            host: ${env.POSTGRES_HOST:=localhost}
-            port: ${env.POSTGRES_PORT:=5432}
-            db: ${env.POSTGRES_DB:=llamastack}
-            user: ${env.POSTGRES_USER:=llamastack}
-            password: ${env.POSTGRES_PASSWORD:=llamastack}
-      telemetry:
-      - provider_id: meta-reference
-        provider_type: inline::meta-reference
-        config:
-          service_name: "${env.OTEL_SERVICE_NAME:=\u200B}"
-          sinks: ${env.TELEMETRY_SINKS:=console}
-      tool_runtime:
-      - provider_id: brave-search
-        provider_type: remote::brave-search
-        config:
-          api_key: ${env.BRAVE_SEARCH_API_KEY:+}
-          max_results: 3
-      - provider_id: tavily-search
-        provider_type: remote::tavily-search
-        config:
-          api_key: ${env.TAVILY_SEARCH_API_KEY:+}
-          max_results: 3
-      - provider_id: rag-runtime
-        provider_type: inline::rag-runtime
-        config: {}
-      - provider_id: model-context-protocol
-        provider_type: remote::model-context-protocol
-        config: {}
-    metadata_store:
-      type: postgres
-      host: ${env.POSTGRES_HOST:=localhost}
-      port: ${env.POSTGRES_PORT:=5432}
-      db: ${env.POSTGRES_DB:=llamastack}
-      user: ${env.POSTGRES_USER:=llamastack}
-      password: ${env.POSTGRES_PASSWORD:=llamastack}
-      table_name: llamastack_kvstore
-    inference_store:
-      type: postgres
-      host: ${env.POSTGRES_HOST:=localhost}
-      port: ${env.POSTGRES_PORT:=5432}
-      db: ${env.POSTGRES_DB:=llamastack}
-      user: ${env.POSTGRES_USER:=llamastack}
-      password: ${env.POSTGRES_PASSWORD:=llamastack}
-    models:
-    - metadata:
-        embedding_dimension: 384
-      model_id: all-MiniLM-L6-v2
-      provider_id: sentence-transformers
-      model_type: embedding
-    - metadata: {}
-      model_id: ${env.INFERENCE_MODEL}
-      provider_id: vllm-inference
-      model_type: llm
-    - metadata: {}
-      model_id: ${env.SAFETY_MODEL:=meta-llama/Llama-Guard-3-1B}
-      provider_id: vllm-safety
-      model_type: llm
-    shields:
-    - shield_id: ${env.SAFETY_MODEL:=meta-llama/Llama-Guard-3-1B}
-    vector_dbs: []
-    datasets: []
-    scoring_fns: []
-    benchmarks: []
-    tool_groups:
-    - toolgroup_id: builtin::websearch
-      provider_id: tavily-search
-    - toolgroup_id: builtin::rag
-      provider_id: rag-runtime
-    server:
-      port: 8321
-      auth:
-        provider_config:
-          type: github_token
+  stack_run_config.yaml: "version: '2'\nimage_name: kubernetes-demo\napis:\n- agents\n-
+    inference\n- files\n- safety\n- telemetry\n- tool_runtime\n- vector_io\nproviders:\n
+    \ inference:\n  - provider_id: vllm-inference\n    provider_type: remote::vllm\n
+    \   config:\n      url: ${env.VLLM_URL:=http://localhost:8000/v1}\n      max_tokens:
+    ${env.VLLM_MAX_TOKENS:=4096}\n      api_token: ${env.VLLM_API_TOKEN:=fake}\n      tls_verify:
+    ${env.VLLM_TLS_VERIFY:=true}\n  - provider_id: vllm-safety\n    provider_type:
+    remote::vllm\n    config:\n      url: ${env.VLLM_SAFETY_URL:=http://localhost:8000/v1}\n
+    \     max_tokens: ${env.VLLM_MAX_TOKENS:=4096}\n      api_token: ${env.VLLM_API_TOKEN:=fake}\n
+    \     tls_verify: ${env.VLLM_TLS_VERIFY:=true}\n  - provider_id: sentence-transformers\n
+    \   provider_type: inline::sentence-transformers\n    config: {}\n  vector_io:\n
+    \ - provider_id: ${env.ENABLE_CHROMADB:+chromadb}\n    provider_type: remote::chromadb\n
+    \   config:\n      url: ${env.CHROMADB_URL:=}\n      kvstore:\n        type: postgres\n
+    \       host: ${env.POSTGRES_HOST:=localhost}\n        port: ${env.POSTGRES_PORT:=5432}\n
+    \       db: ${env.POSTGRES_DB:=llamastack}\n        user: ${env.POSTGRES_USER:=llamastack}\n
+    \       password: ${env.POSTGRES_PASSWORD:=llamastack}\n  files:\n  - provider_id:
+    meta-reference-files\n    provider_type: inline::localfs\n    config:\n      storage_dir:
+    ${env.FILES_STORAGE_DIR:=~/.llama/distributions/starter/files}\n      metadata_store:\n
+    \       type: sqlite\n        db_path: ${env.SQLITE_STORE_DIR:=~/.llama/distributions/starter}/files_metadata.db
+    \ \n  safety:\n  - provider_id: llama-guard\n    provider_type: inline::llama-guard\n
+    \   config:\n      excluded_categories: []\n  agents:\n  - provider_id: meta-reference\n
+    \   provider_type: inline::meta-reference\n    config:\n      persistence_store:\n
+    \       type: postgres\n        host: ${env.POSTGRES_HOST:=localhost}\n        port:
+    ${env.POSTGRES_PORT:=5432}\n        db: ${env.POSTGRES_DB:=llamastack}\n        user:
+    ${env.POSTGRES_USER:=llamastack}\n        password: ${env.POSTGRES_PASSWORD:=llamastack}\n
+    \     responses_store:\n        type: postgres\n        host: ${env.POSTGRES_HOST:=localhost}\n
+    \       port: ${env.POSTGRES_PORT:=5432}\n        db: ${env.POSTGRES_DB:=llamastack}\n
+    \       user: ${env.POSTGRES_USER:=llamastack}\n        password: ${env.POSTGRES_PASSWORD:=llamastack}\n
+    \ telemetry:\n  - provider_id: meta-reference\n    provider_type: inline::meta-reference\n
+    \   config:\n      service_name: \"${env.OTEL_SERVICE_NAME:=\\u200B}\"\n      sinks:
+    ${env.TELEMETRY_SINKS:=console}\n  tool_runtime:\n  - provider_id: brave-search\n
+    \   provider_type: remote::brave-search\n    config:\n      api_key: ${env.BRAVE_SEARCH_API_KEY:+}\n
+    \     max_results: 3\n  - provider_id: tavily-search\n    provider_type: remote::tavily-search\n
+    \   config:\n      api_key: ${env.TAVILY_SEARCH_API_KEY:+}\n      max_results:
+    3\n  - provider_id: rag-runtime\n    provider_type: inline::rag-runtime\n    config:
+    {}\n  - provider_id: model-context-protocol\n    provider_type: remote::model-context-protocol\n
+    \   config: {}\nmetadata_store:\n  type: postgres\n  host: ${env.POSTGRES_HOST:=localhost}\n
+    \ port: ${env.POSTGRES_PORT:=5432}\n  db: ${env.POSTGRES_DB:=llamastack}\n  user:
+    ${env.POSTGRES_USER:=llamastack}\n  password: ${env.POSTGRES_PASSWORD:=llamastack}\n
+    \ table_name: llamastack_kvstore\ninference_store:\n  type: postgres\n  host:
+    ${env.POSTGRES_HOST:=localhost}\n  port: ${env.POSTGRES_PORT:=5432}\n  db: ${env.POSTGRES_DB:=llamastack}\n
+    \ user: ${env.POSTGRES_USER:=llamastack}\n  password: ${env.POSTGRES_PASSWORD:=llamastack}\nmodels:\n-
+    metadata:\n    embedding_dimension: 384\n  model_id: all-MiniLM-L6-v2\n  provider_id:
+    sentence-transformers\n  model_type: embedding\n- metadata: {}\n  model_id: ${env.INFERENCE_MODEL}\n
+    \ provider_id: vllm-inference\n  model_type: llm\n- metadata: {}\n  model_id:
+    ${env.SAFETY_MODEL:=meta-llama/Llama-Guard-3-1B}\n  provider_id: vllm-safety\n
+    \ model_type: llm\nshields:\n- shield_id: ${env.SAFETY_MODEL:=meta-llama/Llama-Guard-3-1B}\nvector_dbs:
+    []\ndatasets: []\nscoring_fns: []\nbenchmarks: []\ntool_groups:\n- toolgroup_id:
+    builtin::websearch\n  provider_id: tavily-search\n- toolgroup_id: builtin::rag\n
+    \ provider_id: rag-runtime\nserver:\n  port: 8321\n  auth:\n    provider_config:\n
+    \     type: github_token\n"
 kind: ConfigMap
 metadata:
   creationTimestamp: null
diff --git a/docs/source/distributions/k8s/stack_run_config.yaml b/docs/source/distributions/k8s/stack_run_config.yaml
index a2d65e1a9..b841ab977 100644
--- a/docs/source/distributions/k8s/stack_run_config.yaml
+++ b/docs/source/distributions/k8s/stack_run_config.yaml
@@ -3,6 +3,7 @@ image_name: kubernetes-demo
 apis:
 - agents
 - inference
+- files
 - safety
 - telemetry
 - tool_runtime
@@ -38,6 +39,14 @@ providers:
         db: ${env.POSTGRES_DB:=llamastack}
         user: ${env.POSTGRES_USER:=llamastack}
         password: ${env.POSTGRES_PASSWORD:=llamastack}
+  files:
+  - provider_id: meta-reference-files
+    provider_type: inline::localfs
+    config:
+      storage_dir: ${env.FILES_STORAGE_DIR:=~/.llama/distributions/starter/files}
+      metadata_store:
+        type: sqlite
+        db_path: ${env.SQLITE_STORE_DIR:=~/.llama/distributions/starter}/files_metadata.db
   safety:
   - provider_id: llama-guard
     provider_type: inline::llama-guard

From 1c23aeb9372fa3e1286a7d6d8210994000efae6d Mon Sep 17 00:00:00 2001
From: Cesare Pompeiano <cesare.pompeiano@gmail.com>
Date: Wed, 10 Sep 2025 11:19:21 +0200
Subject: [PATCH 52/76] feat: Add vector_db_id to chunk metadata (#3304)
MIME-Version: 1.0
Content-Type: text/plain; charset=UTF-8
Content-Transfer-Encoding: 8bit

# What does this PR do?

When running RAG in a multi vector DB setting, it can be difficult to
trace where retrieved chunks originate from. This PR adds the
`vector_db_id` into each chunk’s metadata, making it easier to
understand which database a given chunk came from. This is helpful for
debugging and for analyzing retrieval behavior of multiple DBs.

Relevant code:

```python
for vector_db_id, result in zip(vector_db_ids, results):
    for chunk, score in zip(result.chunks, result.scores):
        if not hasattr(chunk, "metadata") or chunk.metadata is None:
            chunk.metadata = {}
        chunk.metadata["vector_db_id"] = vector_db_id

        chunks.append(chunk)
        scores.append(score)
```

## Test Plan

* Ran Llama Stack in debug mode.
* Verified that `vector_db_id` was added to each chunk’s metadata.
* Confirmed that the metadata was printed in the console when using the
RAG tool.

---------

Co-authored-by: are-ces <cpompeia@redhat.com>
Co-authored-by: Francisco Arceo <arceofrancisco@gmail.com>
---
 .../inline/tool_runtime/rag/memory.py         | 16 +++++-
 tests/unit/rag/test_rag_query.py              | 55 +++++++++++++++++++
 2 files changed, 69 insertions(+), 2 deletions(-)

diff --git a/llama_stack/providers/inline/tool_runtime/rag/memory.py b/llama_stack/providers/inline/tool_runtime/rag/memory.py
index cb526e8ee..aa629cca8 100644
--- a/llama_stack/providers/inline/tool_runtime/rag/memory.py
+++ b/llama_stack/providers/inline/tool_runtime/rag/memory.py
@@ -167,8 +167,18 @@ class MemoryToolRuntimeImpl(ToolGroupsProtocolPrivate, ToolRuntime, RAGToolRunti
             for vector_db_id in vector_db_ids
         ]
         results: list[QueryChunksResponse] = await asyncio.gather(*tasks)
-        chunks = [c for r in results for c in r.chunks]
-        scores = [s for r in results for s in r.scores]
+
+        chunks = []
+        scores = []
+
+        for vector_db_id, result in zip(vector_db_ids, results, strict=False):
+            for chunk, score in zip(result.chunks, result.scores, strict=False):
+                if not hasattr(chunk, "metadata") or chunk.metadata is None:
+                    chunk.metadata = {}
+                chunk.metadata["vector_db_id"] = vector_db_id
+
+                chunks.append(chunk)
+                scores.append(score)
 
         if not chunks:
             return RAGQueryResult(content=None)
@@ -203,6 +213,7 @@ class MemoryToolRuntimeImpl(ToolGroupsProtocolPrivate, ToolRuntime, RAGToolRunti
             metadata_keys_to_exclude_from_context = [
                 "token_count",
                 "metadata_token_count",
+                "vector_db_id",
             ]
             metadata_for_context = {}
             for k in chunk_metadata_keys_to_include_from_context:
@@ -227,6 +238,7 @@ class MemoryToolRuntimeImpl(ToolGroupsProtocolPrivate, ToolRuntime, RAGToolRunti
                 "document_ids": [c.metadata["document_id"] for c in chunks[: len(picked)]],
                 "chunks": [c.content for c in chunks[: len(picked)]],
                 "scores": scores[: len(picked)],
+                "vector_db_ids": [c.metadata["vector_db_id"] for c in chunks[: len(picked)]],
             },
         )
 
diff --git a/tests/unit/rag/test_rag_query.py b/tests/unit/rag/test_rag_query.py
index d18d90716..7b897bfe0 100644
--- a/tests/unit/rag/test_rag_query.py
+++ b/tests/unit/rag/test_rag_query.py
@@ -81,3 +81,58 @@ class TestRagQuery:
         # Test that invalid mode raises an error
         with pytest.raises(ValueError):
             RAGQueryConfig(mode="wrong_mode")
+
+    @pytest.mark.asyncio
+    async def test_query_adds_vector_db_id_to_chunk_metadata(self):
+        rag_tool = MemoryToolRuntimeImpl(
+            config=MagicMock(),
+            vector_io_api=MagicMock(),
+            inference_api=MagicMock(),
+        )
+
+        vector_db_ids = ["db1", "db2"]
+
+        # Fake chunks from each DB
+        chunk_metadata1 = ChunkMetadata(
+            document_id="doc1",
+            chunk_id="chunk1",
+            source="test_source1",
+            metadata_token_count=5,
+        )
+        chunk1 = Chunk(
+            content="chunk from db1",
+            metadata={"vector_db_id": "db1", "document_id": "doc1"},
+            stored_chunk_id="c1",
+            chunk_metadata=chunk_metadata1,
+        )
+
+        chunk_metadata2 = ChunkMetadata(
+            document_id="doc2",
+            chunk_id="chunk2",
+            source="test_source2",
+            metadata_token_count=5,
+        )
+        chunk2 = Chunk(
+            content="chunk from db2",
+            metadata={"vector_db_id": "db2", "document_id": "doc2"},
+            stored_chunk_id="c2",
+            chunk_metadata=chunk_metadata2,
+        )
+
+        rag_tool.vector_io_api.query_chunks = AsyncMock(
+            side_effect=[
+                QueryChunksResponse(chunks=[chunk1], scores=[0.9]),
+                QueryChunksResponse(chunks=[chunk2], scores=[0.8]),
+            ]
+        )
+
+        result = await rag_tool.query(content="test", vector_db_ids=vector_db_ids)
+        returned_chunks = result.metadata["chunks"]
+        returned_scores = result.metadata["scores"]
+        returned_doc_ids = result.metadata["document_ids"]
+        returned_vector_db_ids = result.metadata["vector_db_ids"]
+
+        assert returned_chunks == ["chunk from db1", "chunk from db2"]
+        assert returned_scores == (0.9, 0.8)
+        assert returned_doc_ids == ["doc1", "doc2"]
+        assert returned_vector_db_ids == ["db1", "db2"]

From 167143131053c8de6ea620a83ebdec41c0b24e50 Mon Sep 17 00:00:00 2001
From: Akram Ben Aissi <akram.benaissi@gmail.com>
Date: Wed, 10 Sep 2025 12:55:57 +0200
Subject: [PATCH 53/76] fix: Add missing files_api parameter to
 MemoryToolRuntimeImpl test (#3394)

# What does this PR do?
<!-- Provide a short summary of what this PR does and why. Link to
relevant issues if applicable. -->
The test_query_adds_vector_db_id_to_chunk_metadata test was failing
because MemoryToolRuntimeImpl.__init__() now requires a files_api
parameter.

Fixes failing unit tests for Python 3.12 and 3.13.

<!-- If resolving an issue, uncomment and update the line below -->
<!-- Closes #[issue-number] -->

## Test Plan
<!-- Describe the tests you ran to verify your changes with result
summaries. *Provide clear instructions so the plan can be easily
re-executed.* -->
---
 tests/unit/rag/test_rag_query.py | 1 +
 1 file changed, 1 insertion(+)

diff --git a/tests/unit/rag/test_rag_query.py b/tests/unit/rag/test_rag_query.py
index 7b897bfe0..183b4d049 100644
--- a/tests/unit/rag/test_rag_query.py
+++ b/tests/unit/rag/test_rag_query.py
@@ -88,6 +88,7 @@ class TestRagQuery:
             config=MagicMock(),
             vector_io_api=MagicMock(),
             inference_api=MagicMock(),
+            files_api=MagicMock(),
         )
 
         vector_db_ids = ["db1", "db2"]

From c836fa29e3b9a587734764cc025551bce68fc349 Mon Sep 17 00:00:00 2001
From: Akram Ben Aissi <akram.benaissi@gmail.com>
Date: Wed, 10 Sep 2025 15:27:35 +0200
Subject: [PATCH 54/76] fix: pre-commit issues: non executable shebang file and
 removal of @pytest.mark.asyncio decorator  (#3397)

# What does this PR do?
<!-- Provide a short summary of what this PR does and why. Link to
relevant issues if applicable. -->
Fix pre-commit issues: non executable shebang file, @pytest.mark.asyncio
decorator

<!-- If resolving an issue, uncomment and update the line below -->
<!-- Closes #[issue-number] -->

## Test Plan
<!-- Describe the tests you ran to verify your changes with result
summaries. *Provide clear instructions so the plan can be easily
re-executed.* -->
---
 scripts/get_setup_env.py         | 0
 tests/unit/rag/test_rag_query.py | 1 -
 2 files changed, 1 deletion(-)
 mode change 100644 => 100755 scripts/get_setup_env.py

diff --git a/scripts/get_setup_env.py b/scripts/get_setup_env.py
old mode 100644
new mode 100755
diff --git a/tests/unit/rag/test_rag_query.py b/tests/unit/rag/test_rag_query.py
index 183b4d049..a45b66f02 100644
--- a/tests/unit/rag/test_rag_query.py
+++ b/tests/unit/rag/test_rag_query.py
@@ -82,7 +82,6 @@ class TestRagQuery:
         with pytest.raises(ValueError):
             RAGQueryConfig(mode="wrong_mode")
 
-    @pytest.mark.asyncio
     async def test_query_adds_vector_db_id_to_chunk_metadata(self):
         rag_tool = MemoryToolRuntimeImpl(
             config=MagicMock(),

From 0e27016cf23eca51a0f025897b44109b1b609b71 Mon Sep 17 00:00:00 2001
From: Matthew Farrellee <matt@cs.wisc.edu>
Date: Wed, 10 Sep 2025 09:39:29 -0400
Subject: [PATCH 55/76] chore: update the vertexai inference impl to use
 openai-python for openai-compat functions (#3377)
MIME-Version: 1.0
Content-Type: text/plain; charset=UTF-8
Content-Transfer-Encoding: 8bit

# What does this PR do?

update VertexAI inference provider to use openai-python for
openai-compat functions

## Test Plan

```
$ VERTEX_AI_PROJECT=... uv run llama stack build --image-type venv --providers inference=remote::vertexai --run
...
$ LLAMA_STACK_CONFIG=http://localhost:8321 uv run --group test pytest -v -ra --text-model vertexai/vertex_ai/gemini-2.5-flash tests/integration/inference/test_openai_completion.py
...
```

i don't have an account to test this. `get_api_key` may also need to be
updated per
https://cloud.google.com/vertex-ai/generative-ai/docs/start/openai

---------

Signed-off-by: Sébastien Han <seb@redhat.com>
Co-authored-by: Sébastien Han <seb@redhat.com>
---
 llama_stack/providers/registry/inference.py   |  2 +-
 .../remote/inference/vertexai/vertexai.py     | 33 ++++++++++++++++---
 .../inference/test_openai_completion.py       |  3 ++
 3 files changed, 33 insertions(+), 5 deletions(-)

diff --git a/llama_stack/providers/registry/inference.py b/llama_stack/providers/registry/inference.py
index 4176f85a6..541fbb432 100644
--- a/llama_stack/providers/registry/inference.py
+++ b/llama_stack/providers/registry/inference.py
@@ -218,7 +218,7 @@ def available_providers() -> list[ProviderSpec]:
             api=Api.inference,
             adapter=AdapterSpec(
                 adapter_type="vertexai",
-                pip_packages=["litellm", "google-cloud-aiplatform"],
+                pip_packages=["litellm", "google-cloud-aiplatform", "openai"],
                 module="llama_stack.providers.remote.inference.vertexai",
                 config_class="llama_stack.providers.remote.inference.vertexai.VertexAIConfig",
                 provider_data_validator="llama_stack.providers.remote.inference.vertexai.config.VertexAIProviderDataValidator",
diff --git a/llama_stack/providers/remote/inference/vertexai/vertexai.py b/llama_stack/providers/remote/inference/vertexai/vertexai.py
index 8807fd0e6..27f953ab9 100644
--- a/llama_stack/providers/remote/inference/vertexai/vertexai.py
+++ b/llama_stack/providers/remote/inference/vertexai/vertexai.py
@@ -6,16 +6,20 @@
 
 from typing import Any
 
+import google.auth.transport.requests
+from google.auth import default
+
 from llama_stack.apis.inference import ChatCompletionRequest
 from llama_stack.providers.utils.inference.litellm_openai_mixin import (
     LiteLLMOpenAIMixin,
 )
+from llama_stack.providers.utils.inference.openai_mixin import OpenAIMixin
 
 from .config import VertexAIConfig
 from .models import MODEL_ENTRIES
 
 
-class VertexAIInferenceAdapter(LiteLLMOpenAIMixin):
+class VertexAIInferenceAdapter(OpenAIMixin, LiteLLMOpenAIMixin):
     def __init__(self, config: VertexAIConfig) -> None:
         LiteLLMOpenAIMixin.__init__(
             self,
@@ -27,9 +31,30 @@ class VertexAIInferenceAdapter(LiteLLMOpenAIMixin):
         self.config = config
 
     def get_api_key(self) -> str:
-        # Vertex AI doesn't use API keys, it uses Application Default Credentials
-        # Return empty string to let litellm handle authentication via ADC
-        return ""
+        """
+        Get an access token for Vertex AI using Application Default Credentials.
+
+        Vertex AI uses ADC instead of API keys. This method obtains an access token
+        from the default credentials and returns it for use with the OpenAI-compatible client.
+        """
+        try:
+            # Get default credentials - will read from GOOGLE_APPLICATION_CREDENTIALS
+            credentials, _ = default(scopes=["https://www.googleapis.com/auth/cloud-platform"])
+            credentials.refresh(google.auth.transport.requests.Request())
+            return credentials.token
+        except Exception:
+            # If we can't get credentials, return empty string to let LiteLLM handle it
+            # This allows the LiteLLM mixin to work with ADC directly
+            return ""
+
+    def get_base_url(self) -> str:
+        """
+        Get the Vertex AI OpenAI-compatible API base URL.
+
+        Returns the Vertex AI OpenAI-compatible endpoint URL.
+        Source: https://cloud.google.com/vertex-ai/generative-ai/docs/start/openai
+        """
+        return f"https://{self.config.location}-aiplatform.googleapis.com/v1/projects/{self.config.project}/locations/{self.config.location}/endpoints/openapi"
 
     async def _get_params(self, request: ChatCompletionRequest) -> dict[str, Any]:
         # Get base parameters from parent
diff --git a/tests/integration/inference/test_openai_completion.py b/tests/integration/inference/test_openai_completion.py
index df1184f1c..f9c837ebd 100644
--- a/tests/integration/inference/test_openai_completion.py
+++ b/tests/integration/inference/test_openai_completion.py
@@ -76,6 +76,9 @@ def skip_if_doesnt_support_n(client_with_models, model_id):
         "remote::gemini",
         # https://docs.anthropic.com/en/api/openai-sdk#simple-fields
         "remote::anthropic",
+        "remote::vertexai",
+        #  Error code: 400 - [{'error': {'code': 400, 'message': 'Unable to submit request because candidateCount must be 1 but
+        #  the entered value was 2. Update the candidateCount value and try again.', 'status': 'INVALID_ARGUMENT'}
     ):
         pytest.skip(f"Model {model_id} hosted by {provider.provider_type} doesn't support n param.")
 

From c86e45496e32164286eb8920d2e979a45be31ea3 Mon Sep 17 00:00:00 2001
From: =?UTF-8?q?S=C3=A9bastien=20Han?= <seb@redhat.com>
Date: Wed, 10 Sep 2025 16:00:46 +0200
Subject: [PATCH 56/76] ci: Re-enable pre-commit to fail (#3399)
MIME-Version: 1.0
Content-Type: text/plain; charset=UTF-8
Content-Transfer-Encoding: 8bit

If pre-commit fails, the workflow must fail.

---------

Signed-off-by: Sébastien Han <seb@redhat.com>
---
 .github/workflows/pre-commit.yml                            | 1 -
 llama_stack/providers/remote/inference/vertexai/vertexai.py | 2 +-
 2 files changed, 1 insertion(+), 2 deletions(-)

diff --git a/.github/workflows/pre-commit.yml b/.github/workflows/pre-commit.yml
index 792162262..000208043 100644
--- a/.github/workflows/pre-commit.yml
+++ b/.github/workflows/pre-commit.yml
@@ -48,7 +48,6 @@ jobs:
         working-directory: llama_stack/ui
 
       - uses: pre-commit/action@2c7b3805fd2a0fd8c1884dcaebf91fc102a13ecd # v3.0.1
-        continue-on-error: true
         env:
           SKIP: no-commit-to-branch
           RUFF_OUTPUT_FORMAT: github
diff --git a/llama_stack/providers/remote/inference/vertexai/vertexai.py b/llama_stack/providers/remote/inference/vertexai/vertexai.py
index 27f953ab9..8996543e7 100644
--- a/llama_stack/providers/remote/inference/vertexai/vertexai.py
+++ b/llama_stack/providers/remote/inference/vertexai/vertexai.py
@@ -41,7 +41,7 @@ class VertexAIInferenceAdapter(OpenAIMixin, LiteLLMOpenAIMixin):
             # Get default credentials - will read from GOOGLE_APPLICATION_CREDENTIALS
             credentials, _ = default(scopes=["https://www.googleapis.com/auth/cloud-platform"])
             credentials.refresh(google.auth.transport.requests.Request())
-            return credentials.token
+            return str(credentials.token)
         except Exception:
             # If we can't get credentials, return empty string to let LiteLLM handle it
             # This allows the LiteLLM mixin to work with ADC directly

From 935b8e28de29400a4b42d8b54169341c5244fec7 Mon Sep 17 00:00:00 2001
From: slekkala1 <swapna942@meta.com>
Date: Wed, 10 Sep 2025 08:48:01 -0700
Subject: [PATCH 57/76] fix: Fireworks chat completion broken due to telemetry
 (#3392)

# What does this PR do?
Fix fireworks chat completion broken due to telemetry expecting
response.usage
 Closes https://github.com/llamastack/llama-stack/issues/3391

## Test Plan
1. `uv run --with llama-stack llama stack build --distro starter
--image-type venv --run`
Try

```
curl -X POST http://0.0.0.0:8321/v1/openai/v1/chat/completions \
    -H "Content-Type: application/json" \
    -d '{
      "model": "fireworks/accounts/fireworks/models/llama-v3p1-8b-instruct",
      "messages": [{"role": "user", "content": "Hello!"}]
    }'
```
```
{"id":"chatcmpl-ee922a08-0df0-4974-b0d3-b322113e8bc0","choices":[{"message":{"role":"assistant","content":"Hello! How can I assist you today?","name":null,"tool_calls":null},"finish_reason":"stop","index":0,"logprobs":null}],"object":"chat.completion","created":1757456375,"model":"fireworks/accounts/fireworks/models/llama-v3p1-8b-instruct"}%
```

Without fix fails as mentioned in
https://github.com/llamastack/llama-stack/issues/3391

Co-authored-by: Francisco Arceo <arceofrancisco@gmail.com>
---
 llama_stack/core/routers/inference.py | 4 ++--
 1 file changed, 2 insertions(+), 2 deletions(-)

diff --git a/llama_stack/core/routers/inference.py b/llama_stack/core/routers/inference.py
index 045093fe0..23972deb5 100644
--- a/llama_stack/core/routers/inference.py
+++ b/llama_stack/core/routers/inference.py
@@ -423,7 +423,7 @@ class InferenceRouter(Inference):
             # response_stream = await provider.openai_completion(**params)
 
         response = await provider.openai_completion(**params)
-        if self.telemetry:
+        if self.telemetry and getattr(response, "usage", None):
             metrics = self._construct_metrics(
                 prompt_tokens=response.usage.prompt_tokens,
                 completion_tokens=response.usage.completion_tokens,
@@ -529,7 +529,7 @@ class InferenceRouter(Inference):
         if self.store:
             asyncio.create_task(self.store.store_chat_completion(response, messages))
 
-        if self.telemetry:
+        if self.telemetry and getattr(response, "usage", None):
             metrics = self._construct_metrics(
                 prompt_tokens=response.usage.prompt_tokens,
                 completion_tokens=response.usage.completion_tokens,

From f6bf36343df7c69c9f26ae5163cbfb6491ca7247 Mon Sep 17 00:00:00 2001
From: ehhuang <ehhuang@users.noreply.github.com>
Date: Wed, 10 Sep 2025 11:52:23 -0700
Subject: [PATCH 58/76] chore: logging perf improvments (#3393)

# What does this PR do?
- Use BackgroundLogger when logging metric events.
- Reuse event loop in BackgroundLogger

## Test Plan
```
cd /docs/source/distributions/k8s-benchmark
# start mock server
python openai-mock-server.py --port 8000
# start stack server
LLAMA_STACK_LOGGING="all=WARNING" uv run --with llama-stack python -m llama_stack.core.server.server docs/source/distributions/k8s-benchmark/stack_run_config.yaml
# run benchmark script
uv run python3 benchmark.py --duration 120 --concurrent 50 --base-url=http://localhost:8321/v1/openai/v1 --model=vllm-inference/meta-llama/Llama-3.2-3B-Instruct
```
### RPS from 57 -> 62
---
 llama_stack/core/routers/inference.py         | 14 ++++----
 .../providers/utils/telemetry/tracing.py      | 34 +++++++++++++------
 2 files changed, 31 insertions(+), 17 deletions(-)

diff --git a/llama_stack/core/routers/inference.py b/llama_stack/core/routers/inference.py
index 23972deb5..9593dd5b9 100644
--- a/llama_stack/core/routers/inference.py
+++ b/llama_stack/core/routers/inference.py
@@ -63,7 +63,7 @@ from llama_stack.models.llama.llama3.chat_format import ChatFormat
 from llama_stack.models.llama.llama3.tokenizer import Tokenizer
 from llama_stack.providers.datatypes import HealthResponse, HealthStatus, RoutingTable
 from llama_stack.providers.utils.inference.inference_store import InferenceStore
-from llama_stack.providers.utils.telemetry.tracing import get_current_span
+from llama_stack.providers.utils.telemetry.tracing import enqueue_event, get_current_span
 
 logger = get_logger(name=__name__, category="core::routers")
 
@@ -160,7 +160,7 @@ class InferenceRouter(Inference):
         metrics = self._construct_metrics(prompt_tokens, completion_tokens, total_tokens, model)
         if self.telemetry:
             for metric in metrics:
-                await self.telemetry.log_event(metric)
+                enqueue_event(metric)
         return [MetricInResponse(metric=metric.metric, value=metric.value) for metric in metrics]
 
     async def _count_tokens(
@@ -431,7 +431,7 @@ class InferenceRouter(Inference):
                 model=model_obj,
             )
             for metric in metrics:
-                await self.telemetry.log_event(metric)
+                enqueue_event(metric)
 
             # these metrics will show up in the client response.
             response.metrics = (
@@ -537,7 +537,7 @@ class InferenceRouter(Inference):
                 model=model_obj,
             )
             for metric in metrics:
-                await self.telemetry.log_event(metric)
+                enqueue_event(metric)
             # these metrics will show up in the client response.
             response.metrics = (
                 metrics if not hasattr(response, "metrics") or response.metrics is None else response.metrics + metrics
@@ -664,7 +664,7 @@ class InferenceRouter(Inference):
                             "completion_tokens",
                             "total_tokens",
                         ]:  # Only log completion and total tokens
-                            await self.telemetry.log_event(metric)
+                            enqueue_event(metric)
 
                         # Return metrics in response
                         async_metrics = [
@@ -710,7 +710,7 @@ class InferenceRouter(Inference):
             )
             for metric in completion_metrics:
                 if metric.metric in ["completion_tokens", "total_tokens"]:  # Only log completion and total tokens
-                    await self.telemetry.log_event(metric)
+                    enqueue_event(metric)
 
             # Return metrics in response
             return [MetricInResponse(metric=metric.metric, value=metric.value) for metric in completion_metrics]
@@ -806,7 +806,7 @@ class InferenceRouter(Inference):
                             model=model,
                         )
                         for metric in metrics:
-                            await self.telemetry.log_event(metric)
+                            enqueue_event(metric)
 
                 yield chunk
         finally:
diff --git a/llama_stack/providers/utils/telemetry/tracing.py b/llama_stack/providers/utils/telemetry/tracing.py
index 7694003b5..9969b1055 100644
--- a/llama_stack/providers/utils/telemetry/tracing.py
+++ b/llama_stack/providers/utils/telemetry/tracing.py
@@ -18,6 +18,7 @@ from functools import wraps
 from typing import Any
 
 from llama_stack.apis.telemetry import (
+    Event,
     LogSeverity,
     Span,
     SpanEndPayload,
@@ -98,7 +99,7 @@ class BackgroundLogger:
     def __init__(self, api: Telemetry, capacity: int = 100000):
         self.api = api
         self.log_queue: queue.Queue[Any] = queue.Queue(maxsize=capacity)
-        self.worker_thread = threading.Thread(target=self._process_logs, daemon=True)
+        self.worker_thread = threading.Thread(target=self._worker, daemon=True)
         self.worker_thread.start()
         self._last_queue_full_log_time: float = 0.0
         self._dropped_since_last_notice: int = 0
@@ -118,12 +119,16 @@ class BackgroundLogger:
                 self._last_queue_full_log_time = current_time
                 self._dropped_since_last_notice = 0
 
-    def _process_logs(self):
+    def _worker(self):
+        loop = asyncio.new_event_loop()
+        asyncio.set_event_loop(loop)
+        loop.run_until_complete(self._process_logs())
+
+    async def _process_logs(self):
         while True:
             try:
                 event = self.log_queue.get()
-                # figure out how to use a thread's native loop
-                asyncio.run(self.api.log_event(event))
+                await self.api.log_event(event)
             except Exception:
                 import traceback
 
@@ -136,6 +141,19 @@ class BackgroundLogger:
         self.log_queue.join()
 
 
+def enqueue_event(event: Event) -> None:
+    """Enqueue a telemetry event to the background logger if available.
+
+    This provides a non-blocking path for routers and other hot paths to
+    submit telemetry without awaiting the Telemetry API, reducing contention
+    with the main event loop.
+    """
+    global BACKGROUND_LOGGER
+    if BACKGROUND_LOGGER is None:
+        raise RuntimeError("Telemetry API not initialized")
+    BACKGROUND_LOGGER.log_event(event)
+
+
 class TraceContext:
     spans: list[Span] = []
 
@@ -256,11 +274,7 @@ class TelemetryHandler(logging.Handler):
         if record.module in ("asyncio", "selector_events"):
             return
 
-        global CURRENT_TRACE_CONTEXT, BACKGROUND_LOGGER
-
-        if BACKGROUND_LOGGER is None:
-            raise RuntimeError("Telemetry API not initialized")
-
+        global CURRENT_TRACE_CONTEXT
         context = CURRENT_TRACE_CONTEXT.get()
         if context is None:
             return
@@ -269,7 +283,7 @@ class TelemetryHandler(logging.Handler):
         if span is None:
             return
 
-        BACKGROUND_LOGGER.log_event(
+        enqueue_event(
             UnstructuredLogEvent(
                 trace_id=span.trace_id,
                 span_id=span.span_id,

From a6b1588dc612df097d4fecce317547515b281ec6 Mon Sep 17 00:00:00 2001
From: Francisco Arceo <arceofrancisco@gmail.com>
Date: Wed, 10 Sep 2025 12:53:38 -0600
Subject: [PATCH 59/76] revert: Fireworks chat completion broken due to
 telemetry (#3402)

Reverts llamastack/llama-stack#3392
---
 llama_stack/core/routers/inference.py | 4 ++--
 1 file changed, 2 insertions(+), 2 deletions(-)

diff --git a/llama_stack/core/routers/inference.py b/llama_stack/core/routers/inference.py
index 9593dd5b9..2ed2d0439 100644
--- a/llama_stack/core/routers/inference.py
+++ b/llama_stack/core/routers/inference.py
@@ -423,7 +423,7 @@ class InferenceRouter(Inference):
             # response_stream = await provider.openai_completion(**params)
 
         response = await provider.openai_completion(**params)
-        if self.telemetry and getattr(response, "usage", None):
+        if self.telemetry:
             metrics = self._construct_metrics(
                 prompt_tokens=response.usage.prompt_tokens,
                 completion_tokens=response.usage.completion_tokens,
@@ -529,7 +529,7 @@ class InferenceRouter(Inference):
         if self.store:
             asyncio.create_task(self.store.store_chat_completion(response, messages))
 
-        if self.telemetry and getattr(response, "usage", None):
+        if self.telemetry:
             metrics = self._construct_metrics(
                 prompt_tokens=response.usage.prompt_tokens,
                 completion_tokens=response.usage.completion_tokens,

From e6edc1f93425032f35f4198a197ba31b5b11d8ee Mon Sep 17 00:00:00 2001
From: Derek Higgins <derekh@redhat.com>
Date: Wed, 10 Sep 2025 19:54:10 +0100
Subject: [PATCH 60/76] fix: unbound variable error in
 schedule-record-workflow.sh (#3401)
MIME-Version: 1.0
Content-Type: text/plain; charset=UTF-8
Content-Transfer-Encoding: 8bit

- Initialize INPUTS variable to prevent 'unbound variable' error

Fixes:
./scripts/github/schedule-record-workflow.sh: line 246: INPUTS: unbound
variable │
---
 scripts/github/schedule-record-workflow.sh | 3 ++-
 1 file changed, 2 insertions(+), 1 deletion(-)

diff --git a/scripts/github/schedule-record-workflow.sh b/scripts/github/schedule-record-workflow.sh
index c292e53e6..44b0947b6 100755
--- a/scripts/github/schedule-record-workflow.sh
+++ b/scripts/github/schedule-record-workflow.sh
@@ -239,8 +239,9 @@ echo "Test pattern: ${TEST_PATTERN:-"(none)"}"
 echo ""
 
 # Prepare inputs for gh workflow run
+INPUTS=
 if [[ -n "$TEST_SUBDIRS" ]]; then
-    INPUTS="-f subdirs='$TEST_SUBDIRS'"
+    INPUTS="$INPUTS -f subdirs='$TEST_SUBDIRS'"
 fi
 if [[ -n "$TEST_SETUP" ]]; then
     INPUTS="$INPUTS -f test-setup='$TEST_SETUP'"

From e980436a2ed98dd725f76dfcec12235ed1d6cc82 Mon Sep 17 00:00:00 2001
From: ehhuang <ehhuang@users.noreply.github.com>
Date: Wed, 10 Sep 2025 11:57:42 -0700
Subject: [PATCH 61/76] chore: introduce write queue for inference_store
 (#3383)

# What does this PR do?
Adds a write worker queue for writes to inference store. This avoids
overwhelming request processing with slow inference writes.

## Test Plan

Benchmark:
```
cd /docs/source/distributions/k8s-benchmark
# start mock server
python openai-mock-server.py --port 8000
# start stack server
LLAMA_STACK_LOGGING="all=WARNING" uv run --with llama-stack python -m llama_stack.core.server.server docs/source/distributions/k8s-benchmark/stack_run_config.yaml
# run benchmark script
uv run python3 benchmark.py --duration 120 --concurrent 50 --base-url=http://localhost:8321/v1/openai/v1 --model=vllm-inference/meta-llama/Llama-3.2-3B-Instruct
```
## RPS from 21 -> 57
---
 .../distributions/k8s-benchmark/benchmark.py  | 19 ++--
 .../k8s-benchmark/stack_run_config.yaml       |  9 ++
 llama_stack/core/datatypes.py                 | 13 ++-
 llama_stack/core/routers/__init__.py          |  5 +-
 llama_stack/core/routers/inference.py         |  5 +
 .../utils/inference/inference_store.py        | 98 +++++++++++++++++--
 .../utils/inference/test_inference_store.py   | 12 +++
 7 files changed, 139 insertions(+), 22 deletions(-)

diff --git a/docs/source/distributions/k8s-benchmark/benchmark.py b/docs/source/distributions/k8s-benchmark/benchmark.py
index 3d0d18150..83ba9602a 100644
--- a/docs/source/distributions/k8s-benchmark/benchmark.py
+++ b/docs/source/distributions/k8s-benchmark/benchmark.py
@@ -58,14 +58,6 @@ class BenchmarkStats:
         
         print(f"\n{'='*60}")
         print(f"BENCHMARK RESULTS")
-        print(f"{'='*60}")
-        print(f"Total time: {total_time:.2f}s")
-        print(f"Concurrent users: {self.concurrent_users}")
-        print(f"Total requests: {self.total_requests}")
-        print(f"Successful requests: {self.success_count}")
-        print(f"Failed requests: {len(self.errors)}")
-        print(f"Success rate: {success_rate:.1f}%")
-        print(f"Requests per second: {self.success_count / total_time:.2f}")
         
         print(f"\nResponse Time Statistics:")
         print(f"  Mean: {statistics.mean(self.response_times):.3f}s")
@@ -106,6 +98,15 @@ class BenchmarkStats:
             print(f"  Mean chunks per response: {statistics.mean(self.chunks_received):.1f}")
             print(f"  Total chunks received: {sum(self.chunks_received)}")
         
+        print(f"{'='*60}")
+        print(f"Total time: {total_time:.2f}s")
+        print(f"Concurrent users: {self.concurrent_users}")
+        print(f"Total requests: {self.total_requests}")
+        print(f"Successful requests: {self.success_count}")
+        print(f"Failed requests: {len(self.errors)}")
+        print(f"Success rate: {success_rate:.1f}%")
+        print(f"Requests per second: {self.success_count / total_time:.2f}")
+        
         if self.errors:
             print(f"\nErrors (showing first 5):")
             for error in self.errors[:5]:
@@ -215,7 +216,7 @@ class LlamaStackBenchmark:
                         await asyncio.sleep(1)  # Report every second
                         if time.time() >= last_report_time + 10:  # Report every 10 seconds
                             elapsed = time.time() - stats.start_time
-                            print(f"Completed: {stats.total_requests} requests in {elapsed:.1f}s")
+                            print(f"Completed: {stats.total_requests} requests in {elapsed:.1f}s, RPS: {stats.total_requests / elapsed:.1f}")
                             last_report_time = time.time()
                     except asyncio.CancelledError:
                         break
diff --git a/docs/source/distributions/k8s-benchmark/stack_run_config.yaml b/docs/source/distributions/k8s-benchmark/stack_run_config.yaml
index f8ff7811b..5a9e2ae4f 100644
--- a/docs/source/distributions/k8s-benchmark/stack_run_config.yaml
+++ b/docs/source/distributions/k8s-benchmark/stack_run_config.yaml
@@ -2,6 +2,7 @@ version: '2'
 image_name: kubernetes-benchmark-demo
 apis:
 - agents
+- files
 - inference
 - files
 - safety
@@ -20,6 +21,14 @@ providers:
   - provider_id: sentence-transformers
     provider_type: inline::sentence-transformers
     config: {}
+  files:
+  - provider_id: meta-reference-files
+    provider_type: inline::localfs
+    config:
+      storage_dir: ${env.FILES_STORAGE_DIR:=~/.llama/distributions/starter/files}
+      metadata_store:
+        type: sqlite
+        db_path: ${env.SQLITE_STORE_DIR:=~/.llama/distributions/starter}/files_metadata.db
   vector_io:
   - provider_id: ${env.ENABLE_CHROMADB:+chromadb}
     provider_type: remote::chromadb
diff --git a/llama_stack/core/datatypes.py b/llama_stack/core/datatypes.py
index 0f348b067..faaeefd01 100644
--- a/llama_stack/core/datatypes.py
+++ b/llama_stack/core/datatypes.py
@@ -431,6 +431,12 @@ class ServerConfig(BaseModel):
     )
 
 
+class InferenceStoreConfig(BaseModel):
+    sql_store_config: SqlStoreConfig
+    max_write_queue_size: int = Field(default=10000, description="Max queued writes for inference store")
+    num_writers: int = Field(default=4, description="Number of concurrent background writers")
+
+
 class StackRunConfig(BaseModel):
     version: int = LLAMA_STACK_RUN_CONFIG_VERSION
 
@@ -464,11 +470,12 @@ Configuration for the persistence store used by the distribution registry. If no
 a default SQLite store will be used.""",
     )
 
-    inference_store: SqlStoreConfig | None = Field(
+    inference_store: InferenceStoreConfig | SqlStoreConfig | None = Field(
         default=None,
         description="""
-Configuration for the persistence store used by the inference API. If not specified,
-a default SQLite store will be used.""",
+Configuration for the persistence store used by the inference API. Can be either a
+InferenceStoreConfig (with queue tuning parameters) or a SqlStoreConfig (deprecated).
+If not specified, a default SQLite store will be used.""",
     )
 
     # registry of "resources" in the distribution
diff --git a/llama_stack/core/routers/__init__.py b/llama_stack/core/routers/__init__.py
index 1faace34a..f129f8ede 100644
--- a/llama_stack/core/routers/__init__.py
+++ b/llama_stack/core/routers/__init__.py
@@ -78,7 +78,10 @@ async def get_auto_router_impl(
 
     # TODO: move pass configs to routers instead
     if api == Api.inference and run_config.inference_store:
-        inference_store = InferenceStore(run_config.inference_store, policy)
+        inference_store = InferenceStore(
+            config=run_config.inference_store,
+            policy=policy,
+        )
         await inference_store.initialize()
         api_to_dep_impl["store"] = inference_store
 
diff --git a/llama_stack/core/routers/inference.py b/llama_stack/core/routers/inference.py
index 2ed2d0439..762d7073e 100644
--- a/llama_stack/core/routers/inference.py
+++ b/llama_stack/core/routers/inference.py
@@ -90,6 +90,11 @@ class InferenceRouter(Inference):
 
     async def shutdown(self) -> None:
         logger.debug("InferenceRouter.shutdown")
+        if self.store:
+            try:
+                await self.store.shutdown()
+            except Exception as e:
+                logger.warning(f"Error during InferenceStore shutdown: {e}")
 
     async def register_model(
         self,
diff --git a/llama_stack/providers/utils/inference/inference_store.py b/llama_stack/providers/utils/inference/inference_store.py
index 43006cfd5..8c69b1683 100644
--- a/llama_stack/providers/utils/inference/inference_store.py
+++ b/llama_stack/providers/utils/inference/inference_store.py
@@ -3,6 +3,9 @@
 #
 # This source code is licensed under the terms described in the LICENSE file in
 # the root directory of this source tree.
+import asyncio
+from typing import Any
+
 from llama_stack.apis.inference import (
     ListOpenAIChatCompletionResponse,
     OpenAIChatCompletion,
@@ -10,24 +13,43 @@ from llama_stack.apis.inference import (
     OpenAIMessageParam,
     Order,
 )
-from llama_stack.core.datatypes import AccessRule
-from llama_stack.core.utils.config_dirs import RUNTIME_BASE_DIR
+from llama_stack.core.datatypes import AccessRule, InferenceStoreConfig
+from llama_stack.log import get_logger
 
 from ..sqlstore.api import ColumnDefinition, ColumnType
 from ..sqlstore.authorized_sqlstore import AuthorizedSqlStore
-from ..sqlstore.sqlstore import SqliteSqlStoreConfig, SqlStoreConfig, sqlstore_impl
+from ..sqlstore.sqlstore import SqlStoreConfig, SqlStoreType, sqlstore_impl
+
+logger = get_logger(name=__name__, category="inference_store")
 
 
 class InferenceStore:
-    def __init__(self, sql_store_config: SqlStoreConfig, policy: list[AccessRule]):
-        if not sql_store_config:
-            sql_store_config = SqliteSqlStoreConfig(
-                db_path=(RUNTIME_BASE_DIR / "sqlstore.db").as_posix(),
+    def __init__(
+        self,
+        config: InferenceStoreConfig | SqlStoreConfig,
+        policy: list[AccessRule],
+    ):
+        # Handle backward compatibility
+        if not isinstance(config, InferenceStoreConfig):
+            # Legacy: SqlStoreConfig passed directly as config
+            config = InferenceStoreConfig(
+                sql_store_config=config,
             )
-        self.sql_store_config = sql_store_config
+
+        self.config = config
+        self.sql_store_config = config.sql_store_config
         self.sql_store = None
         self.policy = policy
 
+        # Disable write queue for SQLite to avoid concurrency issues
+        self.enable_write_queue = self.sql_store_config.type != SqlStoreType.sqlite
+
+        # Async write queue and worker control
+        self._queue: asyncio.Queue[tuple[OpenAIChatCompletion, list[OpenAIMessageParam]]] | None = None
+        self._worker_tasks: list[asyncio.Task[Any]] = []
+        self._max_write_queue_size: int = config.max_write_queue_size
+        self._num_writers: int = max(1, config.num_writers)
+
     async def initialize(self):
         """Create the necessary tables if they don't exist."""
         self.sql_store = AuthorizedSqlStore(sqlstore_impl(self.sql_store_config))
@@ -42,10 +64,68 @@ class InferenceStore:
             },
         )
 
+        if self.enable_write_queue:
+            self._queue = asyncio.Queue(maxsize=self._max_write_queue_size)
+            for _ in range(self._num_writers):
+                self._worker_tasks.append(asyncio.create_task(self._worker_loop()))
+        else:
+            logger.info("Write queue disabled for SQLite to avoid concurrency issues")
+
+    async def shutdown(self) -> None:
+        if not self._worker_tasks:
+            return
+        if self._queue is not None:
+            await self._queue.join()
+        for t in self._worker_tasks:
+            if not t.done():
+                t.cancel()
+        for t in self._worker_tasks:
+            try:
+                await t
+            except asyncio.CancelledError:
+                pass
+        self._worker_tasks.clear()
+
+    async def flush(self) -> None:
+        """Wait for all queued writes to complete. Useful for testing."""
+        if self.enable_write_queue and self._queue is not None:
+            await self._queue.join()
+
     async def store_chat_completion(
         self, chat_completion: OpenAIChatCompletion, input_messages: list[OpenAIMessageParam]
     ) -> None:
-        if not self.sql_store:
+        if self.enable_write_queue:
+            if self._queue is None:
+                raise ValueError("Inference store is not initialized")
+            try:
+                self._queue.put_nowait((chat_completion, input_messages))
+            except asyncio.QueueFull:
+                logger.warning(
+                    f"Write queue full; adding chat completion id={getattr(chat_completion, 'id', '<unknown>')}"
+                )
+                await self._queue.put((chat_completion, input_messages))
+        else:
+            await self._write_chat_completion(chat_completion, input_messages)
+
+    async def _worker_loop(self) -> None:
+        assert self._queue is not None
+        while True:
+            try:
+                item = await self._queue.get()
+            except asyncio.CancelledError:
+                break
+            chat_completion, input_messages = item
+            try:
+                await self._write_chat_completion(chat_completion, input_messages)
+            except Exception as e:  # noqa: BLE001
+                logger.error(f"Error writing chat completion: {e}")
+            finally:
+                self._queue.task_done()
+
+    async def _write_chat_completion(
+        self, chat_completion: OpenAIChatCompletion, input_messages: list[OpenAIMessageParam]
+    ) -> None:
+        if self.sql_store is None:
             raise ValueError("Inference store is not initialized")
 
         data = chat_completion.model_dump()
diff --git a/tests/unit/utils/inference/test_inference_store.py b/tests/unit/utils/inference/test_inference_store.py
index 730f54a05..f6d63490a 100644
--- a/tests/unit/utils/inference/test_inference_store.py
+++ b/tests/unit/utils/inference/test_inference_store.py
@@ -65,6 +65,9 @@ async def test_inference_store_pagination_basic():
             input_messages = [OpenAIUserMessageParam(role="user", content=f"Test message for {completion_id}")]
             await store.store_chat_completion(completion, input_messages)
 
+        # Wait for all queued writes to complete
+        await store.flush()
+
         # Test 1: First page with limit=2, descending order (default)
         result = await store.list_chat_completions(limit=2, order=Order.desc)
         assert len(result.data) == 2
@@ -108,6 +111,9 @@ async def test_inference_store_pagination_ascending():
             input_messages = [OpenAIUserMessageParam(role="user", content=f"Test message for {completion_id}")]
             await store.store_chat_completion(completion, input_messages)
 
+        # Wait for all queued writes to complete
+        await store.flush()
+
         # Test ascending order pagination
         result = await store.list_chat_completions(limit=1, order=Order.asc)
         assert len(result.data) == 1
@@ -143,6 +149,9 @@ async def test_inference_store_pagination_with_model_filter():
             input_messages = [OpenAIUserMessageParam(role="user", content=f"Test message for {completion_id}")]
             await store.store_chat_completion(completion, input_messages)
 
+        # Wait for all queued writes to complete
+        await store.flush()
+
         # Test pagination with model filter
         result = await store.list_chat_completions(limit=1, model="model-a", order=Order.desc)
         assert len(result.data) == 1
@@ -190,6 +199,9 @@ async def test_inference_store_pagination_no_limit():
             input_messages = [OpenAIUserMessageParam(role="user", content=f"Test message for {completion_id}")]
             await store.store_chat_completion(completion, input_messages)
 
+        # Wait for all queued writes to complete
+        await store.flush()
+
         # Test without limit
         result = await store.list_chat_completions(order=Order.desc)
         assert len(result.data) == 2

From 7394828c7a84de2c3af0ca37546db17d6a703507 Mon Sep 17 00:00:00 2001
From: Alexey Rybak <50731695+reluctantfuturist@users.noreply.github.com>
Date: Wed, 10 Sep 2025 12:43:36 -0700
Subject: [PATCH 62/76] docs: horizontal nav bar (#3407)

# What does this PR do?
* Adds a horizontal nav bar for easy access to the API reference and the
Llama Stack Github repo

<img width="2696" height="520" alt="image"
src="https://github.com/user-attachments/assets/82daffe1-c206-4e20-b95b-1e090011eecc"
/>

## Test Plan
* Built the docs and ran the local HTML server to verify changes
---
 docs/_static/css/my_theme.css     | 101 ++++++++++++++++++++++++++++++
 docs/_static/js/horizontal_nav.js |  44 +++++++++++++
 docs/source/conf.py               |   1 +
 3 files changed, 146 insertions(+)
 create mode 100644 docs/_static/js/horizontal_nav.js

diff --git a/docs/_static/css/my_theme.css b/docs/_static/css/my_theme.css
index d078ec057..7dcd97c9b 100644
--- a/docs/_static/css/my_theme.css
+++ b/docs/_static/css/my_theme.css
@@ -1,5 +1,106 @@
 @import url("theme.css");
 
+/* Horizontal Navigation Bar */
+.horizontal-nav {
+    background-color: #ffffff;
+    border-bottom: 1px solid #e5e5e5;
+    padding: 0;
+    position: fixed;
+    top: 0;
+    left: 0;
+    right: 0;
+    z-index: 1050;
+    height: 50px;
+    box-shadow: 0 2px 4px rgba(0,0,0,0.1);
+}
+
+[data-theme="dark"] .horizontal-nav {
+    background-color: #1a1a1a;
+    border-bottom: 1px solid #333;
+}
+
+.horizontal-nav .nav-container {
+    max-width: 1200px;
+    margin: 0 auto;
+    display: flex;
+    align-items: center;
+    justify-content: space-between;
+    padding: 0 20px;
+    height: 100%;
+}
+
+.horizontal-nav .nav-brand {
+    font-size: 18px;
+    font-weight: 600;
+    color: #333;
+    text-decoration: none;
+}
+
+[data-theme="dark"] .horizontal-nav .nav-brand {
+    color: #fff;
+}
+
+.horizontal-nav .nav-links {
+    display: flex;
+    align-items: center;
+    gap: 30px;
+    list-style: none;
+    margin: 0;
+    padding: 0;
+}
+
+.horizontal-nav .nav-links a {
+    color: #666;
+    text-decoration: none;
+    font-size: 14px;
+    font-weight: 500;
+    padding: 8px 12px;
+    border-radius: 6px;
+    transition: all 0.2s ease;
+}
+
+.horizontal-nav .nav-links a:hover,
+.horizontal-nav .nav-links a.active {
+    color: #333;
+    background-color: #f5f5f5;
+}
+
+.horizontal-nav .nav-links a.active {
+    font-weight: 600;
+}
+
+[data-theme="dark"] .horizontal-nav .nav-links a {
+    color: #ccc;
+}
+
+[data-theme="dark"] .horizontal-nav .nav-links a:hover,
+[data-theme="dark"] .horizontal-nav .nav-links a.active {
+    color: #fff;
+    background-color: #333;
+}
+
+.horizontal-nav .nav-links .github-link {
+    display: flex;
+    align-items: center;
+    gap: 6px;
+}
+
+.horizontal-nav .nav-links .github-icon {
+    width: 16px;
+    height: 16px;
+    fill: currentColor;
+}
+
+/* Adjust main content to account for fixed nav */
+.wy-nav-side {
+    top: 50px;
+    height: calc(100vh - 50px);
+}
+
+.wy-nav-content-wrap {
+    margin-top: 50px;
+}
+
 .wy-nav-content {
     max-width: 90%;
 }
diff --git a/docs/_static/js/horizontal_nav.js b/docs/_static/js/horizontal_nav.js
new file mode 100644
index 000000000..c2384f9d5
--- /dev/null
+++ b/docs/_static/js/horizontal_nav.js
@@ -0,0 +1,44 @@
+// Horizontal Navigation Bar for Llama Stack Documentation
+document.addEventListener('DOMContentLoaded', function() {
+    // Create the horizontal navigation HTML
+    const navHTML = `
+        <nav class="horizontal-nav">
+            <div class="nav-container">
+                <a href="/" class="nav-brand">Llama Stack</a>
+                <ul class="nav-links">
+                    <li><a href="/">Docs</a></li>
+                    <li><a href="/references/api_reference/">API Reference</a></li>
+                    <li><a href="https://github.com/meta-llama/llama-stack" target="_blank" class="github-link">
+                        <svg class="github-icon" viewBox="0 0 16 16" aria-hidden="true">
+                            <path d="M8 0C3.58 0 0 3.58 0 8c0 3.54 2.29 6.53 5.47 7.59.4.07.55-.17.55-.38 0-.19-.01-.82-.01-1.49-2.01.37-2.53-.49-2.69-.94-.09-.23-.48-.94-.82-1.13-.28-.15-.68-.52-.01-.53.63-.01 1.08.58 1.23.82.72 1.21 1.87.87 2.33.66.07-.52.28-.87.51-1.07-1.78-.2-3.64-.89-3.64-3.95 0-.87.31-1.59.82-2.15-.08-.2-.36-1.02.08-2.12 0 0 .67-.21 2.2.82.64-.18 1.32-.27 2-.27.68 0 1.36.09 2 .27 1.53-1.04 2.2-.82 2.2-.82.44 1.1.16 1.92.08 2.12.51.56.82 1.27.82 2.15 0 3.07-1.87 3.75-3.65 3.95.29.25.54.73.54 1.48 0 1.07-.01 1.93-.01 2.2 0 .21.15.46.55.38A8.013 8.013 0 0016 8c0-4.42-3.58-8-8-8z"/>
+                        </svg>
+                        GitHub
+                    </a></li>
+                </ul>
+            </div>
+        </nav>
+    `;
+
+    // Insert the navigation at the beginning of the body
+    document.body.insertAdjacentHTML('afterbegin', navHTML);
+
+    // Update navigation links based on current page
+    updateActiveNav();
+});
+
+function updateActiveNav() {
+    const currentPath = window.location.pathname;
+    const navLinks = document.querySelectorAll('.horizontal-nav .nav-links a');
+
+    navLinks.forEach(link => {
+        // Remove any existing active classes
+        link.classList.remove('active');
+
+        // Add active class based on current path
+        if (currentPath === '/' && link.getAttribute('href') === '/') {
+            link.classList.add('active');
+        } else if (currentPath.includes('/references/api_reference/') && link.getAttribute('href').includes('api_reference')) {
+            link.classList.add('active');
+        }
+    });
+}
diff --git a/docs/source/conf.py b/docs/source/conf.py
index 3f84d1310..0cbddef31 100644
--- a/docs/source/conf.py
+++ b/docs/source/conf.py
@@ -131,6 +131,7 @@ html_static_path = ["../_static"]
 def setup(app):
     app.add_css_file("css/my_theme.css")
     app.add_js_file("js/detect_theme.js")
+    app.add_js_file("js/horizontal_nav.js")
     app.add_js_file("js/keyboard_shortcuts.js")
 
     def dockerhub_role(name, rawtext, text, lineno, inliner, options={}, content=[]):

From a844c4f6e189395f99a6470552876d1ba6b807f1 Mon Sep 17 00:00:00 2001
From: "dependabot[bot]" <49699333+dependabot[bot]@users.noreply.github.com>
Date: Wed, 10 Sep 2025 13:17:02 -0700
Subject: [PATCH 63/76] chore(python-deps): bump pytest from 8.4.1 to 8.4.2
 (#3359)

Bumps [pytest](https://github.com/pytest-dev/pytest) from 8.4.1 to
8.4.2.
<details>
<summary>Release notes</summary>
<p><em>Sourced from <a
href="https://github.com/pytest-dev/pytest/releases">pytest's
releases</a>.</em></p>
<blockquote>
<h2>8.4.2</h2>
<h1>pytest 8.4.2 (2025-09-03)</h1>
<h2>Bug fixes</h2>
<ul>
<li>
<p><a
href="https://redirect.github.com/pytest-dev/pytest/issues/13478">#13478</a>:
Fixed a crash when using
<code>console_output_style</code>{.interpreted-text
role=&quot;confval&quot;} with <code>times</code> and a module is
skipped.</p>
</li>
<li>
<p><a
href="https://redirect.github.com/pytest-dev/pytest/issues/13530">#13530</a>:
Fixed a crash when using <code>pytest.approx</code>{.interpreted-text
role=&quot;func&quot;} and
<code>decimal.Decimal</code>{.interpreted-text role=&quot;class&quot;}
instances with the <code>decimal.FloatOperation</code>{.interpreted-text
role=&quot;class&quot;} trap set.</p>
</li>
<li>
<p><a
href="https://redirect.github.com/pytest-dev/pytest/issues/13549">#13549</a>:
No longer evaluate type annotations in Python <code>3.14</code> when
inspecting function signatures.</p>
<p>This prevents crashes during module collection when modules do not
explicitly use <code>from __future__ import annotations</code> and
import types for annotations within a <code>if TYPE_CHECKING:</code>
block.</p>
</li>
<li>
<p><a
href="https://redirect.github.com/pytest-dev/pytest/issues/13559">#13559</a>:
Added missing [int]{.title-ref} and [float]{.title-ref} variants to the
[Literal]{.title-ref} type annotation of the [type]{.title-ref}
parameter in <code>pytest.Parser.addini</code>{.interpreted-text
role=&quot;meth&quot;}.</p>
</li>
<li>
<p><a
href="https://redirect.github.com/pytest-dev/pytest/issues/13563">#13563</a>:
<code>pytest.approx</code>{.interpreted-text role=&quot;func&quot;} now
only imports <code>numpy</code> if NumPy is already in
<code>sys.modules</code>. This fixes unconditional import behavior
introduced in [8.4.0]{.title-ref}.</p>
</li>
</ul>
<h2>Improved documentation</h2>
<ul>
<li><a
href="https://redirect.github.com/pytest-dev/pytest/issues/13577">#13577</a>:
Clarify that <code>pytest_generate_tests</code> is discovered in test
modules/classes; other hooks must be in <code>conftest.py</code> or
plugins.</li>
</ul>
<h2>Contributor-facing changes</h2>
<ul>
<li><a
href="https://redirect.github.com/pytest-dev/pytest/issues/13480">#13480</a>:
Self-testing: fixed a few test failures when run with
<code>-Wdefault</code> or a similar override.</li>
<li><a
href="https://redirect.github.com/pytest-dev/pytest/issues/13547">#13547</a>:
Self-testing: corrected expected message for
<code>test_doctest_unexpected_exception</code> in Python
<code>3.14</code>.</li>
<li><a
href="https://redirect.github.com/pytest-dev/pytest/issues/13684">#13684</a>:
Make pytest's own testsuite insensitive to the presence of the
<code>CI</code> environment variable -- by
<code>ogrisel</code>{.interpreted-text role=&quot;user&quot;}.</li>
</ul>
</blockquote>
</details>
<details>
<summary>Commits</summary>
<ul>
<li><a
href="https://github.com/pytest-dev/pytest/commit/bfae4224fd554d3d7f2c277a4cc092b6ec6af3ae"><code>bfae422</code></a>
Prepare release version 8.4.2</li>
<li><a
href="https://github.com/pytest-dev/pytest/commit/89905381a163be30ae87d62e5f750e902d750c5f"><code>8990538</code></a>
Fix passenv CI in tox ini and make tests insensitive to the presence of
the C...</li>
<li><a
href="https://github.com/pytest-dev/pytest/commit/ca676bfe005aebcb12f4146d1b0f1d2772e2cd5d"><code>ca676bf</code></a>
Merge pull request <a
href="https://redirect.github.com/pytest-dev/pytest/issues/13687">#13687</a>
from pytest-dev/patchback/backports/8.4.x/e63f6e51c...</li>
<li><a
href="https://github.com/pytest-dev/pytest/commit/975a60a63ce385a44655596e254c1899feaa53e4"><code>975a60a</code></a>
Merge pull request <a
href="https://redirect.github.com/pytest-dev/pytest/issues/13686">#13686</a>
from pytest-dev/patchback/backports/8.4.x/12bde8af6...</li>
<li><a
href="https://github.com/pytest-dev/pytest/commit/7723ce84b87ab08f86ddafcb342acc28ba5ec99d"><code>7723ce8</code></a>
Merge pull request <a
href="https://redirect.github.com/pytest-dev/pytest/issues/13683">#13683</a>
from even-even/fix_Exeption_to_Exception_in_errorMe...</li>
<li><a
href="https://github.com/pytest-dev/pytest/commit/b7f05680d1301e0969b30bcb3c4b27433c9ee2b7"><code>b7f0568</code></a>
Merge pull request <a
href="https://redirect.github.com/pytest-dev/pytest/issues/13685">#13685</a>
from CoretexShadow/fix/docs-pytest-generate-tests</li>
<li><a
href="https://github.com/pytest-dev/pytest/commit/2c94c4a6948ba53440818389298157fa5d5f94cd"><code>2c94c4a</code></a>
add missing colon (<a
href="https://redirect.github.com/pytest-dev/pytest/issues/13640">#13640</a>)
(<a
href="https://redirect.github.com/pytest-dev/pytest/issues/13641">#13641</a>)</li>
<li><a
href="https://github.com/pytest-dev/pytest/commit/c3d7684bc01c8c48d05145a30c5211ca8656c68c"><code>c3d7684</code></a>
Merge pull request <a
href="https://redirect.github.com/pytest-dev/pytest/issues/13606">#13606</a>
from pytest-dev/patchback/backports/8.4.x/5f9938563...</li>
<li><a
href="https://github.com/pytest-dev/pytest/commit/dc6e3be2ddc75a149b6d102d9b7c82ee47a00cfa"><code>dc6e3be</code></a>
Merge pull request <a
href="https://redirect.github.com/pytest-dev/pytest/issues/13605">#13605</a>
from The-Compiler/training-update-2025-07</li>
<li><a
href="https://github.com/pytest-dev/pytest/commit/f87289c36c8dbe7740e3020f5546b6f8b0861ff0"><code>f87289c</code></a>
Fix crash with <code>times</code> output style and skipped module (<a
href="https://redirect.github.com/pytest-dev/pytest/issues/13573">#13573</a>)
(<a
href="https://redirect.github.com/pytest-dev/pytest/issues/13579">#13579</a>)</li>
<li>Additional commits viewable in <a
href="https://github.com/pytest-dev/pytest/compare/8.4.1...8.4.2">compare
view</a></li>
</ul>
</details>
<br />


[![Dependabot compatibility
score](https://dependabot-badges.githubapp.com/badges/compatibility_score?dependency-name=pytest&package-manager=uv&previous-version=8.4.1&new-version=8.4.2)](https://docs.github.com/en/github/managing-security-vulnerabilities/about-dependabot-security-updates#about-compatibility-scores)

Dependabot will resolve any conflicts with this PR as long as you don't
alter it yourself. You can also trigger a rebase manually by commenting
`@dependabot rebase`.

[//]: # (dependabot-automerge-start)
[//]: # (dependabot-automerge-end)

---

<details>
<summary>Dependabot commands and options</summary>
<br />

You can trigger Dependabot actions by commenting on this PR:
- `@dependabot rebase` will rebase this PR
- `@dependabot recreate` will recreate this PR, overwriting any edits
that have been made to it
- `@dependabot merge` will merge this PR after your CI passes on it
- `@dependabot squash and merge` will squash and merge this PR after
your CI passes on it
- `@dependabot cancel merge` will cancel a previously requested merge
and block automerging
- `@dependabot reopen` will reopen this PR if it is closed
- `@dependabot close` will close this PR and stop Dependabot recreating
it. You can achieve the same result by closing it manually
- `@dependabot show <dependency name> ignore conditions` will show all
of the ignore conditions of the specified dependency
- `@dependabot ignore this major version` will close this PR and stop
Dependabot creating any more for this major version (unless you reopen
the PR or upgrade to it yourself)
- `@dependabot ignore this minor version` will close this PR and stop
Dependabot creating any more for this minor version (unless you reopen
the PR or upgrade to it yourself)
- `@dependabot ignore this dependency` will close this PR and stop
Dependabot creating any more for this dependency (unless you reopen the
PR or upgrade to it yourself)


</details>

Signed-off-by: dependabot[bot] <support@github.com>
Co-authored-by: dependabot[bot] <49699333+dependabot[bot]@users.noreply.github.com>
---
 uv.lock | 6 +++---
 1 file changed, 3 insertions(+), 3 deletions(-)

diff --git a/uv.lock b/uv.lock
index 2788c6fef..6f8ba7ad6 100644
--- a/uv.lock
+++ b/uv.lock
@@ -3540,7 +3540,7 @@ wheels = [
 
 [[package]]
 name = "pytest"
-version = "8.4.1"
+version = "8.4.2"
 source = { registry = "https://pypi.org/simple" }
 dependencies = [
     { name = "colorama", marker = "sys_platform == 'win32'" },
@@ -3549,9 +3549,9 @@ dependencies = [
     { name = "pluggy" },
     { name = "pygments" },
 ]
-sdist = { url = "https://files.pythonhosted.org/packages/08/ba/45911d754e8eba3d5a841a5ce61a65a685ff1798421ac054f85aa8747dfb/pytest-8.4.1.tar.gz", hash = "sha256:7c67fd69174877359ed9371ec3af8a3d2b04741818c51e5e99cc1742251fa93c", size = 1517714, upload-time = "2025-06-18T05:48:06.109Z" }
+sdist = { url = "https://files.pythonhosted.org/packages/a3/5c/00a0e072241553e1a7496d638deababa67c5058571567b92a7eaa258397c/pytest-8.4.2.tar.gz", hash = "sha256:86c0d0b93306b961d58d62a4db4879f27fe25513d4b969df351abdddb3c30e01", size = 1519618, upload-time = "2025-09-04T14:34:22.711Z" }
 wheels = [
-    { url = "https://files.pythonhosted.org/packages/29/16/c8a903f4c4dffe7a12843191437d7cd8e32751d5de349d45d3fe69544e87/pytest-8.4.1-py3-none-any.whl", hash = "sha256:539c70ba6fcead8e78eebbf1115e8b589e7565830d7d006a8723f19ac8a0afb7", size = 365474, upload-time = "2025-06-18T05:48:03.955Z" },
+    { url = "https://files.pythonhosted.org/packages/a8/a4/20da314d277121d6534b3a980b29035dcd51e6744bd79075a6ce8fa4eb8d/pytest-8.4.2-py3-none-any.whl", hash = "sha256:872f880de3fc3a5bdc88a11b39c9710c3497a547cfa9320bc3c5e62fbf272e79", size = 365750, upload-time = "2025-09-04T14:34:20.226Z" },
 ]
 
 [[package]]

From 369083c0699270d7a3fa4d10f4975a081fcc7acd Mon Sep 17 00:00:00 2001
From: "dependabot[bot]" <49699333+dependabot[bot]@users.noreply.github.com>
Date: Wed, 10 Sep 2025 13:17:28 -0700
Subject: [PATCH 64/76] chore(python-deps): bump locust from 2.39.1 to 2.40.1
 (#3358)
MIME-Version: 1.0
Content-Type: text/plain; charset=UTF-8
Content-Transfer-Encoding: 8bit

Bumps [locust](https://github.com/locustio/locust) from 2.39.1 to
2.40.1.
<details>
<summary>Release notes</summary>
<p><em>Sourced from <a
href="https://github.com/locustio/locust/releases">locust's
releases</a>.</em></p>
<blockquote>
<h2>2.40.1</h2>
<h2>What's Changed</h2>
<ul>
<li>Pytest plugin: Delay imports to avoid monkey patching until someone
uses the fixtures by <a
href="https://github.com/cyberw"><code>@​cyberw</code></a> in <a
href="https://redirect.github.com/locustio/locust/pull/3204">locustio/locust#3204</a></li>
<li>Move pytest plugin to its own directory, to prevent accidental
import by <a href="https://github.com/cyberw"><code>@​cyberw</code></a>
in <a
href="https://redirect.github.com/locustio/locust/pull/3205">locustio/locust#3205</a></li>
</ul>
<p><strong>Full Changelog</strong>: <a
href="https://github.com/locustio/locust/compare/2.40.0...2.40.1">https://github.com/locustio/locust/compare/2.40.0...2.40.1</a></p>
<h2>2.40.0</h2>
<h2>What's Changed</h2>
<ul>
<li>Refactor FastHttpSession to be more like HttpSession by <a
href="https://github.com/cyberw"><code>@​cyberw</code></a> in <a
href="https://redirect.github.com/locustio/locust/pull/3198">locustio/locust#3198</a></li>
<li>Update Dockerfile base to Python 3.13 by <a
href="https://github.com/adaamz"><code>@​adaamz</code></a> in <a
href="https://redirect.github.com/locustio/locust/pull/3193">locustio/locust#3193</a></li>
<li>Avoid exception in HttpUser if requests has lost track of the
request it made by <a
href="https://github.com/cyberw"><code>@​cyberw</code></a> in <a
href="https://redirect.github.com/locustio/locust/pull/3201">locustio/locust#3201</a></li>
<li>Support pytests as locustfiles by <a
href="https://github.com/cyberw"><code>@​cyberw</code></a> in <a
href="https://redirect.github.com/locustio/locust/pull/3200">locustio/locust#3200</a></li>
</ul>
<h2>New Contributors</h2>
<ul>
<li><a href="https://github.com/adaamz"><code>@​adaamz</code></a> made
their first contribution in <a
href="https://redirect.github.com/locustio/locust/pull/3193">locustio/locust#3193</a></li>
</ul>
<p><strong>Full Changelog</strong>: <a
href="https://github.com/locustio/locust/compare/2.39.1...2.40.0">https://github.com/locustio/locust/compare/2.39.1...2.40.0</a></p>
</blockquote>
</details>
<details>
<summary>Changelog</summary>
<p><em>Sourced from <a
href="https://github.com/locustio/locust/blob/master/CHANGELOG.md">locust's
changelog</a>.</em></p>
<blockquote>
<h1>Detailed changelog</h1>
<p>The most important changes can also be found in <a
href="https://docs.locust.io/en/latest/changelog.html">the
documentation</a>.</p>
</blockquote>
</details>
<details>
<summary>Commits</summary>
<ul>
<li><a
href="https://github.com/locustio/locust/commit/5df19da06a0f8418d44094f3014ddee3b307bb55"><code>5df19da</code></a>
Merge pull request <a
href="https://redirect.github.com/locustio/locust/issues/3205">#3205</a>
from locustio/move-pytest-plugin-to-own-directory</li>
<li><a
href="https://github.com/locustio/locust/commit/d41141bedd3bbafd894adccaa3cf05b7cf0990fd"><code>d41141b</code></a>
Move pytest plugin to its own directory, to prevent accidental import of
locu...</li>
<li><a
href="https://github.com/locustio/locust/commit/6422848afd072032005f2eafa9ed4db11238708a"><code>6422848</code></a>
mention that only one locustfile can be distributed</li>
<li><a
href="https://github.com/locustio/locust/commit/aa3da739fe37baf4f31a99a89776e4380aabd13b"><code>aa3da73</code></a>
Merge pull request <a
href="https://redirect.github.com/locustio/locust/issues/3204">#3204</a>
from locustio/delay-imports-in-pytest-plugin-to-avoi...</li>
<li><a
href="https://github.com/locustio/locust/commit/12050dedfd5925beed067eba5a9732d2cd4865ca"><code>12050de</code></a>
Pytest plugin: Delay imports to avoid monkey patching until someone
actually ...</li>
<li><a
href="https://github.com/locustio/locust/commit/488d1f849121335ce36d502f7cfe94c82cbea499"><code>488d1f8</code></a>
docs</li>
<li><a
href="https://github.com/locustio/locust/commit/439b7ab91bc8dd00a423d111c452133bdaaae872"><code>439b7ab</code></a>
docs fix</li>
<li><a
href="https://github.com/locustio/locust/commit/fcd76a8ac341c83cd0a2a315d2942c12e43a8d9f"><code>fcd76a8</code></a>
docs: rephrase</li>
<li><a
href="https://github.com/locustio/locust/commit/70c7e9b2d8326af33b5253f163a2d2e7e9e8e6dd"><code>70c7e9b</code></a>
docs: move pytest further up</li>
<li><a
href="https://github.com/locustio/locust/commit/06dbf98013f56b22451158e0b23c9014dc9814f9"><code>06dbf98</code></a>
docs: fix link</li>
<li>Additional commits viewable in <a
href="https://github.com/locustio/locust/compare/2.39.1...2.40.1">compare
view</a></li>
</ul>
</details>
<br />


[![Dependabot compatibility
score](https://dependabot-badges.githubapp.com/badges/compatibility_score?dependency-name=locust&package-manager=uv&previous-version=2.39.1&new-version=2.40.1)](https://docs.github.com/en/github/managing-security-vulnerabilities/about-dependabot-security-updates#about-compatibility-scores)

Dependabot will resolve any conflicts with this PR as long as you don't
alter it yourself. You can also trigger a rebase manually by commenting
`@dependabot rebase`.

[//]: # (dependabot-automerge-start)
[//]: # (dependabot-automerge-end)

---

<details>
<summary>Dependabot commands and options</summary>
<br />

You can trigger Dependabot actions by commenting on this PR:
- `@dependabot rebase` will rebase this PR
- `@dependabot recreate` will recreate this PR, overwriting any edits
that have been made to it
- `@dependabot merge` will merge this PR after your CI passes on it
- `@dependabot squash and merge` will squash and merge this PR after
your CI passes on it
- `@dependabot cancel merge` will cancel a previously requested merge
and block automerging
- `@dependabot reopen` will reopen this PR if it is closed
- `@dependabot close` will close this PR and stop Dependabot recreating
it. You can achieve the same result by closing it manually
- `@dependabot show <dependency name> ignore conditions` will show all
of the ignore conditions of the specified dependency
- `@dependabot ignore this major version` will close this PR and stop
Dependabot creating any more for this major version (unless you reopen
the PR or upgrade to it yourself)
- `@dependabot ignore this minor version` will close this PR and stop
Dependabot creating any more for this minor version (unless you reopen
the PR or upgrade to it yourself)
- `@dependabot ignore this dependency` will close this PR and stop
Dependabot creating any more for this dependency (unless you reopen the
PR or upgrade to it yourself)


</details>

Signed-off-by: dependabot[bot] <support@github.com>
Co-authored-by: dependabot[bot] <49699333+dependabot[bot]@users.noreply.github.com>
---
 uv.lock | 7 ++++---
 1 file changed, 4 insertions(+), 3 deletions(-)

diff --git a/uv.lock b/uv.lock
index 6f8ba7ad6..df3a23e58 100644
--- a/uv.lock
+++ b/uv.lock
@@ -2023,7 +2023,7 @@ wheels = [
 
 [[package]]
 name = "locust"
-version = "2.39.1"
+version = "2.40.1"
 source = { registry = "https://pypi.org/simple" }
 dependencies = [
     { name = "configargparse" },
@@ -2035,6 +2035,7 @@ dependencies = [
     { name = "locust-cloud" },
     { name = "msgpack" },
     { name = "psutil" },
+    { name = "pytest" },
     { name = "python-engineio" },
     { name = "python-socketio", extra = ["client"] },
     { name = "pywin32", marker = "sys_platform == 'win32'" },
@@ -2043,9 +2044,9 @@ dependencies = [
     { name = "setuptools" },
     { name = "werkzeug" },
 ]
-sdist = { url = "https://files.pythonhosted.org/packages/95/c8/10aa5445c404eed389b56877e6714c1787190cc09dd70059ce3765979ec5/locust-2.39.1.tar.gz", hash = "sha256:6bdd19e27edf9a1c84391d6cf6e9a737dfb832be7dfbf39053191ae31b9cc498", size = 1409902, upload-time = "2025-08-29T17:41:01.544Z" }
+sdist = { url = "https://files.pythonhosted.org/packages/01/22/82f40176473a98c9479bed667d3ad21bb859d2cb67f6880a6b0b6a725e45/locust-2.40.1.tar.gz", hash = "sha256:5bde76c1cf7e412071670f926f34844e119210c93f07a4cf9fc4cb93c60a578a", size = 1411606, upload-time = "2025-09-05T15:57:35.76Z" }
 wheels = [
-    { url = "https://files.pythonhosted.org/packages/ec/b3/b2f4b2ca88b1e72eba7be2b2982533b887f8b709d222db78eb9602aa5121/locust-2.39.1-py3-none-any.whl", hash = "sha256:fd5148f2f1a4ed34aee968abc4393674e69d1b5e1b54db50a397f6eb09ce0b04", size = 1428155, upload-time = "2025-08-29T17:41:00.245Z" },
+    { url = "https://files.pythonhosted.org/packages/3b/e6/9c6335ab16becf4f8ad3da6083ab78793c56ec1ca496d6f7c74660c21c3f/locust-2.40.1-py3-none-any.whl", hash = "sha256:ef0517f9bb5ed0afa7035014faaf944802917e07da8649461aaaf5e5f3ba8a65", size = 1430154, upload-time = "2025-09-05T15:57:33.233Z" },
 ]
 
 [[package]]

From 438c037b1f16ee8123ab71b2aa39529ce32967a5 Mon Sep 17 00:00:00 2001
From: "dependabot[bot]" <49699333+dependabot[bot]@users.noreply.github.com>
Date: Wed, 10 Sep 2025 13:17:43 -0700
Subject: [PATCH 65/76] chore(python-deps): bump openai from 1.102.0 to 1.106.1
 (#3356)

Bumps [openai](https://github.com/openai/openai-python) from 1.102.0 to
1.106.1.
<details>
<summary>Release notes</summary>
<p><em>Sourced from <a
href="https://github.com/openai/openai-python/releases">openai's
releases</a>.</em></p>
<blockquote>
<h2>v1.106.1</h2>
<h2>1.106.1 (2025-09-04)</h2>
<p>Full Changelog: <a
href="https://github.com/openai/openai-python/compare/v1.106.0...v1.106.1">v1.106.0...v1.106.1</a></p>
<h3>Chores</h3>
<ul>
<li><strong>internal:</strong> move mypy configurations to
<code>pyproject.toml</code> file (<a
href="https://github.com/openai/openai-python/commit/ca413a277496c3b883b103ad1138a886e89ae15e">ca413a2</a>)</li>
</ul>
<h2>v1.106.0</h2>
<h2>1.106.0 (2025-09-04)</h2>
<p>Full Changelog: <a
href="https://github.com/openai/openai-python/compare/v1.105.0...v1.106.0">v1.105.0...v1.106.0</a></p>
<h3>Features</h3>
<ul>
<li><strong>client:</strong> support callable api_key (<a
href="https://redirect.github.com/openai/openai-python/issues/2588">#2588</a>)
(<a
href="https://github.com/openai/openai-python/commit/e1bad015b8a2b98bfee955a24bc931347a58efc1">e1bad01</a>)</li>
<li>improve future compat with pydantic v3 (<a
href="https://github.com/openai/openai-python/commit/6645d9317a240982928b92c2f4af0381db6edc09">6645d93</a>)</li>
</ul>
<h2>v1.105.0</h2>
<h2>1.105.0 (2025-09-03)</h2>
<p>Full Changelog: <a
href="https://github.com/openai/openai-python/compare/v1.104.2...v1.105.0">v1.104.2...v1.105.0</a></p>
<h3>Features</h3>
<ul>
<li><strong>api:</strong> Add gpt-realtime models (<a
href="https://github.com/openai/openai-python/commit/85020414808314df9cb42e020b11baff12f18f16">8502041</a>)</li>
</ul>
<h2>v1.104.2</h2>
<h2>1.104.2 (2025-09-02)</h2>
<p>Full Changelog: <a
href="https://github.com/openai/openai-python/compare/v1.104.1...v1.104.2">v1.104.1...v1.104.2</a></p>
<h3>Bug Fixes</h3>
<ul>
<li><strong>types:</strong> add aliases back for web search tool types
(<a
href="https://github.com/openai/openai-python/commit/2521cd8445906e418dbae783b0d7c375ad91d49d">2521cd8</a>)</li>
</ul>
<h2>v1.104.1</h2>
<h2>1.104.1 (2025-09-02)</h2>
<p>Full Changelog: <a
href="https://github.com/openai/openai-python/compare/v1.104.0...v1.104.1">v1.104.0...v1.104.1</a></p>
<h3>Chores</h3>
<ul>
<li><strong>api:</strong> manual updates for ResponseInputAudio (<a
href="https://github.com/openai/openai-python/commit/0db50619663656ba97bba30ab640bbb33683d196">0db5061</a>)</li>
</ul>
<h2>v1.104.0</h2>
<h2>1.104.0 (2025-09-02)</h2>
<p>Full Changelog: <a
href="https://github.com/openai/openai-python/compare/v1.103.0...v1.104.0">v1.103.0...v1.104.0</a></p>
<!-- raw HTML omitted -->
</blockquote>
<p>... (truncated)</p>
</details>
<details>
<summary>Changelog</summary>
<p><em>Sourced from <a
href="https://github.com/openai/openai-python/blob/main/CHANGELOG.md">openai's
changelog</a>.</em></p>
<blockquote>
<h2>1.106.1 (2025-09-04)</h2>
<p>Full Changelog: <a
href="https://github.com/openai/openai-python/compare/v1.106.0...v1.106.1">v1.106.0...v1.106.1</a></p>
<h3>Chores</h3>
<ul>
<li><strong>internal:</strong> move mypy configurations to
<code>pyproject.toml</code> file (<a
href="https://github.com/openai/openai-python/commit/ca413a277496c3b883b103ad1138a886e89ae15e">ca413a2</a>)</li>
</ul>
<h2>1.106.0 (2025-09-04)</h2>
<p>Full Changelog: <a
href="https://github.com/openai/openai-python/compare/v1.105.0...v1.106.0">v1.105.0...v1.106.0</a></p>
<h3>Features</h3>
<ul>
<li><strong>client:</strong> support callable api_key (<a
href="https://redirect.github.com/openai/openai-python/issues/2588">#2588</a>)
(<a
href="https://github.com/openai/openai-python/commit/e1bad015b8a2b98bfee955a24bc931347a58efc1">e1bad01</a>)</li>
<li>improve future compat with pydantic v3 (<a
href="https://github.com/openai/openai-python/commit/6645d9317a240982928b92c2f4af0381db6edc09">6645d93</a>)</li>
</ul>
<h2>1.105.0 (2025-09-03)</h2>
<p>Full Changelog: <a
href="https://github.com/openai/openai-python/compare/v1.104.2...v1.105.0">v1.104.2...v1.105.0</a></p>
<h3>Features</h3>
<ul>
<li><strong>api:</strong> Add gpt-realtime models (<a
href="https://github.com/openai/openai-python/commit/85020414808314df9cb42e020b11baff12f18f16">8502041</a>)</li>
</ul>
<h2>1.104.2 (2025-09-02)</h2>
<p>Full Changelog: <a
href="https://github.com/openai/openai-python/compare/v1.104.1...v1.104.2">v1.104.1...v1.104.2</a></p>
<h3>Bug Fixes</h3>
<ul>
<li><strong>types:</strong> add aliases back for web search tool types
(<a
href="https://github.com/openai/openai-python/commit/2521cd8445906e418dbae783b0d7c375ad91d49d">2521cd8</a>)</li>
</ul>
<h2>1.104.1 (2025-09-02)</h2>
<p>Full Changelog: <a
href="https://github.com/openai/openai-python/compare/v1.104.0...v1.104.1">v1.104.0...v1.104.1</a></p>
<h3>Chores</h3>
<ul>
<li><strong>api:</strong> manual updates for ResponseInputAudio (<a
href="https://github.com/openai/openai-python/commit/0db50619663656ba97bba30ab640bbb33683d196">0db5061</a>)</li>
</ul>
<h2>1.104.0 (2025-09-02)</h2>
<p>Full Changelog: <a
href="https://github.com/openai/openai-python/compare/v1.103.0...v1.104.0">v1.103.0...v1.104.0</a></p>
<h3>Features</h3>
<ul>
<li><strong>types:</strong> replace List[str] with SequenceNotStr in
params (<a
href="https://github.com/openai/openai-python/commit/bc00bda880a80089be8a1758c016266ca72dab2c">bc00bda</a>)</li>
</ul>
<!-- raw HTML omitted -->
</blockquote>
<p>... (truncated)</p>
</details>
<details>
<summary>Commits</summary>
<ul>
<li><a
href="https://github.com/openai/openai-python/commit/2adf11112988e998fcf5adb805bae38501d22318"><code>2adf111</code></a>
release: 1.106.1</li>
<li><a
href="https://github.com/openai/openai-python/commit/c4f9d0b997e18614709752e030f85d9e8281b4e0"><code>c4f9d0b</code></a>
chore(internal): move mypy configurations to <code>pyproject.toml</code>
file</li>
<li><a
href="https://github.com/openai/openai-python/commit/2de8d7cde5565ec71851d8bc3a26f021cebab32c"><code>2de8d7c</code></a>
release: 1.106.0</li>
<li><a
href="https://github.com/openai/openai-python/commit/2cf4ed5072f89103c674a61d22879b06a4c407f6"><code>2cf4ed5</code></a>
feat: improve future compat with pydantic v3</li>
<li><a
href="https://github.com/openai/openai-python/commit/25d16be18bcd11e00a853e8f4af881c76098e0d0"><code>25d16be</code></a>
feat(client): support callable api_key (<a
href="https://redirect.github.com/openai/openai-python/issues/2588">#2588</a>)</li>
<li><a
href="https://github.com/openai/openai-python/commit/8672413735889e83e74e7e133b976fe6029843a5"><code>8672413</code></a>
release: 1.105.0</li>
<li><a
href="https://github.com/openai/openai-python/commit/2c60d78b378465433b70bbe2a7d3f94c8eeaa0d5"><code>2c60d78</code></a>
feat(api): Add gpt-realtime models</li>
<li><a
href="https://github.com/openai/openai-python/commit/a52463c93215a09f9a142e25c975935523d15c10"><code>a52463c</code></a>
release: 1.104.2</li>
<li><a
href="https://github.com/openai/openai-python/commit/5a6931dafdf73d9dbfce62c3a7c585b95daaf009"><code>5a6931d</code></a>
fix(types): add aliases back for web search tool types</li>
<li><a
href="https://github.com/openai/openai-python/commit/fb152d967edb181c1a17827f31a4df10e416e255"><code>fb152d9</code></a>
release: 1.104.1</li>
<li>Additional commits viewable in <a
href="https://github.com/openai/openai-python/compare/v1.102.0...v1.106.1">compare
view</a></li>
</ul>
</details>
<br />


[![Dependabot compatibility
score](https://dependabot-badges.githubapp.com/badges/compatibility_score?dependency-name=openai&package-manager=uv&previous-version=1.102.0&new-version=1.106.1)](https://docs.github.com/en/github/managing-security-vulnerabilities/about-dependabot-security-updates#about-compatibility-scores)

Dependabot will resolve any conflicts with this PR as long as you don't
alter it yourself. You can also trigger a rebase manually by commenting
`@dependabot rebase`.

[//]: # (dependabot-automerge-start)
[//]: # (dependabot-automerge-end)

---

<details>
<summary>Dependabot commands and options</summary>
<br />

You can trigger Dependabot actions by commenting on this PR:
- `@dependabot rebase` will rebase this PR
- `@dependabot recreate` will recreate this PR, overwriting any edits
that have been made to it
- `@dependabot merge` will merge this PR after your CI passes on it
- `@dependabot squash and merge` will squash and merge this PR after
your CI passes on it
- `@dependabot cancel merge` will cancel a previously requested merge
and block automerging
- `@dependabot reopen` will reopen this PR if it is closed
- `@dependabot close` will close this PR and stop Dependabot recreating
it. You can achieve the same result by closing it manually
- `@dependabot show <dependency name> ignore conditions` will show all
of the ignore conditions of the specified dependency
- `@dependabot ignore this major version` will close this PR and stop
Dependabot creating any more for this major version (unless you reopen
the PR or upgrade to it yourself)
- `@dependabot ignore this minor version` will close this PR and stop
Dependabot creating any more for this minor version (unless you reopen
the PR or upgrade to it yourself)
- `@dependabot ignore this dependency` will close this PR and stop
Dependabot creating any more for this dependency (unless you reopen the
PR or upgrade to it yourself)


</details>

Signed-off-by: dependabot[bot] <support@github.com>
Co-authored-by: dependabot[bot] <49699333+dependabot[bot]@users.noreply.github.com>
---
 uv.lock | 6 +++---
 1 file changed, 3 insertions(+), 3 deletions(-)

diff --git a/uv.lock b/uv.lock
index df3a23e58..3d7713f54 100644
--- a/uv.lock
+++ b/uv.lock
@@ -2620,7 +2620,7 @@ wheels = [
 
 [[package]]
 name = "openai"
-version = "1.102.0"
+version = "1.107.0"
 source = { registry = "https://pypi.org/simple" }
 dependencies = [
     { name = "anyio" },
@@ -2632,9 +2632,9 @@ dependencies = [
     { name = "tqdm" },
     { name = "typing-extensions" },
 ]
-sdist = { url = "https://files.pythonhosted.org/packages/07/55/da5598ed5c6bdd9939633854049cddc5cbac0da938dfcfcb3c6b119c16c0/openai-1.102.0.tar.gz", hash = "sha256:2e0153bcd64a6523071e90211cbfca1f2bbc5ceedd0993ba932a5869f93b7fc9", size = 519027, upload-time = "2025-08-26T20:50:29.397Z" }
+sdist = { url = "https://files.pythonhosted.org/packages/88/67/d6498de300f83ff57a79cb7aa96ef3bef8d6f070c3ded0f1b5b45442a6bc/openai-1.107.0.tar.gz", hash = "sha256:43e04927584e57d0e9e640ee0077c78baf8150098be96ebd5c512539b6c4e9a4", size = 566056, upload-time = "2025-09-08T19:25:47.604Z" }
 wheels = [
-    { url = "https://files.pythonhosted.org/packages/bd/0d/c9e7016d82c53c5b5e23e2bad36daebb8921ed44f69c0a985c6529a35106/openai-1.102.0-py3-none-any.whl", hash = "sha256:d751a7e95e222b5325306362ad02a7aa96e1fab3ed05b5888ce1c7ca63451345", size = 812015, upload-time = "2025-08-26T20:50:27.219Z" },
+    { url = "https://files.pythonhosted.org/packages/91/ed/e8a4fd20390f2858b95227c288df8fe0c835f7c77625f7583609161684ba/openai-1.107.0-py3-none-any.whl", hash = "sha256:3dcfa3cbb116bd6924b27913b8da28c4a787379ff60049588547a1013e6d6438", size = 950968, upload-time = "2025-09-08T19:25:45.552Z" },
 ]
 
 [[package]]

From d4e45cd5f1e099d9f6ac2d52ad6cd3f74cc4facf Mon Sep 17 00:00:00 2001
From: "dependabot[bot]" <49699333+dependabot[bot]@users.noreply.github.com>
Date: Wed, 10 Sep 2025 13:18:14 -0700
Subject: [PATCH 66/76] chore(ui-deps): bump tailwindcss from 4.1.6 to 4.1.13
 in /llama_stack/ui (#3362)
MIME-Version: 1.0
Content-Type: text/plain; charset=UTF-8
Content-Transfer-Encoding: 8bit

Bumps
[tailwindcss](https://github.com/tailwindlabs/tailwindcss/tree/HEAD/packages/tailwindcss)
from 4.1.6 to 4.1.13.
<details>
<summary>Release notes</summary>
<p><em>Sourced from <a
href="https://github.com/tailwindlabs/tailwindcss/releases">tailwindcss's
releases</a>.</em></p>
<blockquote>
<h2>v4.1.13</h2>
<h3>Changed</h3>
<ul>
<li>Drop warning from browser build (<a
href="https://redirect.github.com/tailwindlabs/tailwindcss/issues/18731">#18731</a>)</li>
<li>Drop exact duplicate declarations when emitting CSS (<a
href="https://redirect.github.com/tailwindlabs/tailwindcss/issues/18809">#18809</a>)</li>
</ul>
<h3>Fixed</h3>
<ul>
<li>Don't transition <code>visibility</code> when using
<code>transition</code> (<a
href="https://redirect.github.com/tailwindlabs/tailwindcss/pull/18795">#18795</a>)</li>
<li>Discard matched variants with unknown named values (<a
href="https://redirect.github.com/tailwindlabs/tailwindcss/pull/18799">#18799</a>)</li>
<li>Discard matched variants with non-string values (<a
href="https://redirect.github.com/tailwindlabs/tailwindcss/pull/18799">#18799</a>)</li>
<li>Show suggestions for known <code>matchVariant</code> values (<a
href="https://redirect.github.com/tailwindlabs/tailwindcss/pull/18798">#18798</a>)</li>
<li>Replace deprecated <code>clip</code> with <code>clip-path</code> in
<code>sr-only</code> (<a
href="https://redirect.github.com/tailwindlabs/tailwindcss/pull/18769">#18769</a>)</li>
<li>Hide internal fields from completions in <code>matchUtilities</code>
(<a
href="https://redirect.github.com/tailwindlabs/tailwindcss/pull/18820">#18820</a>)</li>
<li>Ignore <code>.vercel</code> folders by default (can be overridden by
<code>@source …</code> rules) (<a
href="https://redirect.github.com/tailwindlabs/tailwindcss/pull/18855">#18855</a>)</li>
<li>Consider variants starting with <code>@-</code> to be invalid (e.g.
<code>@-2xl:flex</code>) (<a
href="https://redirect.github.com/tailwindlabs/tailwindcss/pull/18869">#18869</a>)</li>
<li>Do not allow custom variants to start or end with a <code>-</code>
or <code>_</code> (<a
href="https://redirect.github.com/tailwindlabs/tailwindcss/pull/18867">#18867</a>,
<a
href="https://redirect.github.com/tailwindlabs/tailwindcss/pull/18872">#18872</a>)</li>
<li>Upgrade: Migrate <code>aria</code> theme keys to
<code>@custom-variant</code> (<a
href="https://redirect.github.com/tailwindlabs/tailwindcss/pull/18815">#18815</a>)</li>
<li>Upgrade: Migrate <code>data</code> theme keys to
<code>@custom-variant</code> (<a
href="https://redirect.github.com/tailwindlabs/tailwindcss/pull/18816">#18816</a>)</li>
<li>Upgrade: Migrate <code>supports</code> theme keys to
<code>@custom-variant</code> (<a
href="https://redirect.github.com/tailwindlabs/tailwindcss/pull/18817">#18817</a>)</li>
</ul>
<h2>v4.1.12</h2>
<h3>Fixed</h3>
<ul>
<li>Don't consider the global important state in <code>@apply</code> (<a
href="https://redirect.github.com/tailwindlabs/tailwindcss/pull/18404">#18404</a>)</li>
<li>Add missing suggestions for <code>flex-&lt;number&gt;</code>
utilities (<a
href="https://redirect.github.com/tailwindlabs/tailwindcss/pull/18642">#18642</a>)</li>
<li>Fix trailing <code>)</code> from interfering with extraction in
Clojure keywords (<a
href="https://redirect.github.com/tailwindlabs/tailwindcss/pull/18345">#18345</a>)</li>
<li>Detect classes inside Elixir charlist, word list, and string sigils
(<a
href="https://redirect.github.com/tailwindlabs/tailwindcss/pull/18432">#18432</a>)</li>
<li>Track source locations through <code>@plugin</code> and
<code>@config</code> (<a
href="https://redirect.github.com/tailwindlabs/tailwindcss/pull/18345">#18345</a>)</li>
<li>Allow boolean values of <code>process.env.DEBUG</code> in
<code>@tailwindcss/node</code> (<a
href="https://redirect.github.com/tailwindlabs/tailwindcss/pull/18485">#18485</a>)</li>
<li>Ignore consecutive semicolons in the CSS parser (<a
href="https://redirect.github.com/tailwindlabs/tailwindcss/pull/18532">#18532</a>)</li>
<li>Center the dropdown icon added to an input with a paired datalist by
default (<a
href="https://redirect.github.com/tailwindlabs/tailwindcss/pull/18511">#18511</a>)</li>
<li>Extract candidates in Slang templates (<a
href="https://redirect.github.com/tailwindlabs/tailwindcss/pull/18565">#18565</a>)</li>
<li>Improve error messages when encountering invalid functional utility
names (<a
href="https://redirect.github.com/tailwindlabs/tailwindcss/pull/18568">#18568</a>)</li>
<li>Discard CSS AST objects with <code>false</code> or
<code>undefined</code> properties (<a
href="https://redirect.github.com/tailwindlabs/tailwindcss/pull/18571">#18571</a>)</li>
<li>Allow users to disable URL rebasing in
<code>@tailwindcss/postcss</code> via <code>transformAssetUrls:
false</code> (<a
href="https://redirect.github.com/tailwindlabs/tailwindcss/pull/18321">#18321</a>)</li>
<li>Fix false-positive migrations in <code>addEventListener</code> and
JavaScript variable names (<a
href="https://redirect.github.com/tailwindlabs/tailwindcss/pull/18718">#18718</a>)</li>
<li>Fix Standalone CLI showing default Bun help when run via symlink on
Windows (<a
href="https://redirect.github.com/tailwindlabs/tailwindcss/pull/18723">#18723</a>)</li>
<li>Read from <code>--border-color-*</code> theme keys in
<code>divide-*</code> utilities for backwards compatibility (<a
href="https://redirect.github.com/tailwindlabs/tailwindcss/pull/18704/">#18704</a>)</li>
<li>Don't scan <code>.hdr</code> and <code>.exr</code> files for classes
by default (<a
href="https://redirect.github.com/tailwindlabs/tailwindcss/pull/18734">#18734</a>)</li>
</ul>
<h2>v4.1.11</h2>
<h3>Fixed</h3>
<ul>
<li>Add heuristic to skip candidate migrations inside
<code>emit(…)</code> (<a
href="https://redirect.github.com/tailwindlabs/tailwindcss/pull/18330">#18330</a>)</li>
<li>Extract candidates with variants in Clojure/ClojureScript keywords
(<a
href="https://redirect.github.com/tailwindlabs/tailwindcss/pull/18338">#18338</a>)</li>
<li>Document <code>--watch=always</code> in the CLI's usage (<a
href="https://redirect.github.com/tailwindlabs/tailwindcss/pull/18337">#18337</a>)</li>
<li>Add support for Vite 7 to <code>@tailwindcss/vite</code> (<a
href="https://redirect.github.com/tailwindlabs/tailwindcss/pull/18384">#18384</a>)</li>
</ul>
<h2>v4.1.10</h2>
<!-- raw HTML omitted -->
</blockquote>
<p>... (truncated)</p>
</details>
<details>
<summary>Changelog</summary>
<p><em>Sourced from <a
href="https://github.com/tailwindlabs/tailwindcss/blob/main/CHANGELOG.md">tailwindcss's
changelog</a>.</em></p>
<blockquote>
<h2>[4.1.13] - 2025-09-03</h2>
<h3>Changed</h3>
<ul>
<li>Drop warning from browser build (<a
href="https://redirect.github.com/tailwindlabs/tailwindcss/issues/18731">#18731</a>)</li>
<li>Drop exact duplicate declarations when emitting CSS (<a
href="https://redirect.github.com/tailwindlabs/tailwindcss/issues/18809">#18809</a>)</li>
</ul>
<h3>Fixed</h3>
<ul>
<li>Don't transition <code>visibility</code> when using
<code>transition</code> (<a
href="https://redirect.github.com/tailwindlabs/tailwindcss/pull/18795">#18795</a>)</li>
<li>Discard matched variants with unknown named values (<a
href="https://redirect.github.com/tailwindlabs/tailwindcss/pull/18799">#18799</a>)</li>
<li>Discard matched variants with non-string values (<a
href="https://redirect.github.com/tailwindlabs/tailwindcss/pull/18799">#18799</a>)</li>
<li>Show suggestions for known <code>matchVariant</code> values (<a
href="https://redirect.github.com/tailwindlabs/tailwindcss/pull/18798">#18798</a>)</li>
<li>Replace deprecated <code>clip</code> with <code>clip-path</code> in
<code>sr-only</code> (<a
href="https://redirect.github.com/tailwindlabs/tailwindcss/pull/18769">#18769</a>)</li>
<li>Hide internal fields from completions in <code>matchUtilities</code>
(<a
href="https://redirect.github.com/tailwindlabs/tailwindcss/pull/18820">#18820</a>)</li>
<li>Ignore <code>.vercel</code> folders by default (can be overridden by
<code>@source …</code> rules) (<a
href="https://redirect.github.com/tailwindlabs/tailwindcss/pull/18855">#18855</a>)</li>
<li>Consider variants starting with <code>@-</code> to be invalid (e.g.
<code>@-2xl:flex</code>) (<a
href="https://redirect.github.com/tailwindlabs/tailwindcss/pull/18869">#18869</a>)</li>
<li>Do not allow custom variants to start or end with a <code>-</code>
or <code>_</code> (<a
href="https://redirect.github.com/tailwindlabs/tailwindcss/pull/18867">#18867</a>,
<a
href="https://redirect.github.com/tailwindlabs/tailwindcss/pull/18872">#18872</a>)</li>
<li>Upgrade: Migrate <code>aria</code> theme keys to
<code>@custom-variant</code> (<a
href="https://redirect.github.com/tailwindlabs/tailwindcss/pull/18815">#18815</a>)</li>
<li>Upgrade: Migrate <code>data</code> theme keys to
<code>@custom-variant</code> (<a
href="https://redirect.github.com/tailwindlabs/tailwindcss/pull/18816">#18816</a>)</li>
<li>Upgrade: Migrate <code>supports</code> theme keys to
<code>@custom-variant</code> (<a
href="https://redirect.github.com/tailwindlabs/tailwindcss/pull/18817">#18817</a>)</li>
</ul>
<h2>[4.1.12] - 2025-08-13</h2>
<h3>Fixed</h3>
<ul>
<li>Don't consider the global important state in <code>@apply</code> (<a
href="https://redirect.github.com/tailwindlabs/tailwindcss/pull/18404">#18404</a>)</li>
<li>Add missing suggestions for <code>flex-&lt;number&gt;</code>
utilities (<a
href="https://redirect.github.com/tailwindlabs/tailwindcss/pull/18642">#18642</a>)</li>
<li>Fix trailing <code>)</code> from interfering with extraction in
Clojure keywords (<a
href="https://redirect.github.com/tailwindlabs/tailwindcss/pull/18345">#18345</a>)</li>
<li>Detect classes inside Elixir charlist, word list, and string sigils
(<a
href="https://redirect.github.com/tailwindlabs/tailwindcss/pull/18432">#18432</a>)</li>
<li>Track source locations through <code>@plugin</code> and
<code>@config</code> (<a
href="https://redirect.github.com/tailwindlabs/tailwindcss/pull/18345">#18345</a>)</li>
<li>Allow boolean values of <code>process.env.DEBUG</code> in
<code>@tailwindcss/node</code> (<a
href="https://redirect.github.com/tailwindlabs/tailwindcss/pull/18485">#18485</a>)</li>
<li>Ignore consecutive semicolons in the CSS parser (<a
href="https://redirect.github.com/tailwindlabs/tailwindcss/pull/18532">#18532</a>)</li>
<li>Center the dropdown icon added to an input with a paired datalist by
default (<a
href="https://redirect.github.com/tailwindlabs/tailwindcss/pull/18511">#18511</a>)</li>
<li>Extract candidates in Slang templates (<a
href="https://redirect.github.com/tailwindlabs/tailwindcss/pull/18565">#18565</a>)</li>
<li>Improve error messages when encountering invalid functional utility
names (<a
href="https://redirect.github.com/tailwindlabs/tailwindcss/pull/18568">#18568</a>)</li>
<li>Discard CSS AST objects with <code>false</code> or
<code>undefined</code> properties (<a
href="https://redirect.github.com/tailwindlabs/tailwindcss/pull/18571">#18571</a>)</li>
<li>Allow users to disable URL rebasing in
<code>@tailwindcss/postcss</code> via <code>transformAssetUrls:
false</code> (<a
href="https://redirect.github.com/tailwindlabs/tailwindcss/pull/18321">#18321</a>)</li>
<li>Fix false-positive migrations in <code>addEventListener</code> and
JavaScript variable names (<a
href="https://redirect.github.com/tailwindlabs/tailwindcss/pull/18718">#18718</a>)</li>
<li>Fix Standalone CLI showing default Bun help when run via symlink on
Windows (<a
href="https://redirect.github.com/tailwindlabs/tailwindcss/pull/18723">#18723</a>)</li>
<li>Read from <code>--border-color-*</code> theme keys in
<code>divide-*</code> utilities for backwards compatibility (<a
href="https://redirect.github.com/tailwindlabs/tailwindcss/pull/18704/">#18704</a>)</li>
<li>Don't scan <code>.hdr</code> and <code>.exr</code> files for classes
by default (<a
href="https://redirect.github.com/tailwindlabs/tailwindcss/pull/18734">#18734</a>)</li>
</ul>
<h2>[4.1.11] - 2025-06-26</h2>
<h3>Fixed</h3>
<ul>
<li>Add heuristic to skip candidate migrations inside
<code>emit(…)</code> (<a
href="https://redirect.github.com/tailwindlabs/tailwindcss/pull/18330">#18330</a>)</li>
<li>Extract candidates with variants in Clojure/ClojureScript keywords
(<a
href="https://redirect.github.com/tailwindlabs/tailwindcss/pull/18338">#18338</a>)</li>
<li>Document <code>--watch=always</code> in the CLI's usage (<a
href="https://redirect.github.com/tailwindlabs/tailwindcss/pull/18337">#18337</a>)</li>
</ul>
<!-- raw HTML omitted -->
</blockquote>
<p>... (truncated)</p>
</details>
<details>
<summary>Commits</summary>
<ul>
<li><a
href="https://github.com/tailwindlabs/tailwindcss/commit/1334c99db8fd26c8ea065375dd9259800863f072"><code>1334c99</code></a>
Prepare v4.1.13 release (<a
href="https://github.com/tailwindlabs/tailwindcss/tree/HEAD/packages/tailwindcss/issues/18868">#18868</a>)</li>
<li><a
href="https://github.com/tailwindlabs/tailwindcss/commit/65dc530f0575da14f8258af7feb5bb687e170904"><code>65dc530</code></a>
Do not allow variants to end with <code>-</code> or <code>_</code> (<a
href="https://github.com/tailwindlabs/tailwindcss/tree/HEAD/packages/tailwindcss/issues/18872">#18872</a>)</li>
<li><a
href="https://github.com/tailwindlabs/tailwindcss/commit/54c3f308e912a5b4107cd70625319da4d28ac51f"><code>54c3f30</code></a>
Do not allow variants to start with <code>-</code> (<a
href="https://github.com/tailwindlabs/tailwindcss/tree/HEAD/packages/tailwindcss/issues/18867">#18867</a>)</li>
<li><a
href="https://github.com/tailwindlabs/tailwindcss/commit/494051ca087aa0dc7e877af52f75601a1308a114"><code>494051c</code></a>
Consider variants starting with <code>@-</code> to be invalid (e.g.
<code>@-2xl:flex</code>) (<a
href="https://github.com/tailwindlabs/tailwindcss/tree/HEAD/packages/tailwindcss/issues/18869">#18869</a>)</li>
<li><a
href="https://github.com/tailwindlabs/tailwindcss/commit/c318329a1ee05d62b67cb681a7d6f54ee5e1bb65"><code>c318329</code></a>
chore: remove redundant words (<a
href="https://github.com/tailwindlabs/tailwindcss/tree/HEAD/packages/tailwindcss/issues/18853">#18853</a>)</li>
<li><a
href="https://github.com/tailwindlabs/tailwindcss/commit/ddc84b079b1d543d3297f30312c9c1fe1a66987c"><code>ddc84b0</code></a>
update test after prettier change</li>
<li><a
href="https://github.com/tailwindlabs/tailwindcss/commit/f1331a857a80147f0c63393d335d034de1d4c374"><code>f1331a8</code></a>
run prettier</li>
<li><a
href="https://github.com/tailwindlabs/tailwindcss/commit/e5513b6c75c9e830ced45e939f2a2b855440ede2"><code>e5513b6</code></a>
Fix missing code block delimiters in comment blocks (<a
href="https://github.com/tailwindlabs/tailwindcss/tree/HEAD/packages/tailwindcss/issues/18837">#18837</a>)</li>
<li><a
href="https://github.com/tailwindlabs/tailwindcss/commit/5e2a160d8b1a6be12a54765a1b8ada26960d8b89"><code>5e2a160</code></a>
Drop exact duplicate declarations from output CSS within a style rule
(<a
href="https://github.com/tailwindlabs/tailwindcss/tree/HEAD/packages/tailwindcss/issues/18809">#18809</a>)</li>
<li><a
href="https://github.com/tailwindlabs/tailwindcss/commit/b1fb02a2d7c01c2b7c1b08e7d1838380a95081d7"><code>b1fb02a</code></a>
Hide internal fields from completions in <code>matchUtilities</code> (<a
href="https://github.com/tailwindlabs/tailwindcss/tree/HEAD/packages/tailwindcss/issues/18820">#18820</a>)</li>
<li>Additional commits viewable in <a
href="https://github.com/tailwindlabs/tailwindcss/commits/v4.1.13/packages/tailwindcss">compare
view</a></li>
</ul>
</details>
<br />


[![Dependabot compatibility
score](https://dependabot-badges.githubapp.com/badges/compatibility_score?dependency-name=tailwindcss&package-manager=npm_and_yarn&previous-version=4.1.6&new-version=4.1.13)](https://docs.github.com/en/github/managing-security-vulnerabilities/about-dependabot-security-updates#about-compatibility-scores)

Dependabot will resolve any conflicts with this PR as long as you don't
alter it yourself. You can also trigger a rebase manually by commenting
`@dependabot rebase`.

[//]: # (dependabot-automerge-start)
[//]: # (dependabot-automerge-end)

---

<details>
<summary>Dependabot commands and options</summary>
<br />

You can trigger Dependabot actions by commenting on this PR:
- `@dependabot rebase` will rebase this PR
- `@dependabot recreate` will recreate this PR, overwriting any edits
that have been made to it
- `@dependabot merge` will merge this PR after your CI passes on it
- `@dependabot squash and merge` will squash and merge this PR after
your CI passes on it
- `@dependabot cancel merge` will cancel a previously requested merge
and block automerging
- `@dependabot reopen` will reopen this PR if it is closed
- `@dependabot close` will close this PR and stop Dependabot recreating
it. You can achieve the same result by closing it manually
- `@dependabot show <dependency name> ignore conditions` will show all
of the ignore conditions of the specified dependency
- `@dependabot ignore this major version` will close this PR and stop
Dependabot creating any more for this major version (unless you reopen
the PR or upgrade to it yourself)
- `@dependabot ignore this minor version` will close this PR and stop
Dependabot creating any more for this minor version (unless you reopen
the PR or upgrade to it yourself)
- `@dependabot ignore this dependency` will close this PR and stop
Dependabot creating any more for this dependency (unless you reopen the
PR or upgrade to it yourself)


</details>

Signed-off-by: dependabot[bot] <support@github.com>
Co-authored-by: dependabot[bot] <49699333+dependabot[bot]@users.noreply.github.com>
---
 llama_stack/ui/package-lock.json | 20 +++++++++++++++++---
 1 file changed, 17 insertions(+), 3 deletions(-)

diff --git a/llama_stack/ui/package-lock.json b/llama_stack/ui/package-lock.json
index 1db1c61cd..e2c0815fd 100644
--- a/llama_stack/ui/package-lock.json
+++ b/llama_stack/ui/package-lock.json
@@ -3578,6 +3578,13 @@
         "tailwindcss": "4.1.6"
       }
     },
+    "node_modules/@tailwindcss/node/node_modules/tailwindcss": {
+      "version": "4.1.6",
+      "resolved": "https://registry.npmjs.org/tailwindcss/-/tailwindcss-4.1.6.tgz",
+      "integrity": "sha512-j0cGLTreM6u4OWzBeLBpycK0WIh8w7kSwcUsQZoGLHZ7xDTdM69lN64AgoIEEwFi0tnhs4wSykUa5YWxAzgFYg==",
+      "dev": true,
+      "license": "MIT"
+    },
     "node_modules/@tailwindcss/oxide": {
       "version": "4.1.6",
       "resolved": "https://registry.npmjs.org/@tailwindcss/oxide/-/oxide-4.1.6.tgz",
@@ -3838,6 +3845,13 @@
         "tailwindcss": "4.1.6"
       }
     },
+    "node_modules/@tailwindcss/postcss/node_modules/tailwindcss": {
+      "version": "4.1.6",
+      "resolved": "https://registry.npmjs.org/tailwindcss/-/tailwindcss-4.1.6.tgz",
+      "integrity": "sha512-j0cGLTreM6u4OWzBeLBpycK0WIh8w7kSwcUsQZoGLHZ7xDTdM69lN64AgoIEEwFi0tnhs4wSykUa5YWxAzgFYg==",
+      "dev": true,
+      "license": "MIT"
+    },
     "node_modules/@testing-library/dom": {
       "version": "10.4.1",
       "resolved": "https://registry.npmjs.org/@testing-library/dom/-/dom-10.4.1.tgz",
@@ -13843,9 +13857,9 @@
       }
     },
     "node_modules/tailwindcss": {
-      "version": "4.1.6",
-      "resolved": "https://registry.npmjs.org/tailwindcss/-/tailwindcss-4.1.6.tgz",
-      "integrity": "sha512-j0cGLTreM6u4OWzBeLBpycK0WIh8w7kSwcUsQZoGLHZ7xDTdM69lN64AgoIEEwFi0tnhs4wSykUa5YWxAzgFYg==",
+      "version": "4.1.13",
+      "resolved": "https://registry.npmjs.org/tailwindcss/-/tailwindcss-4.1.13.tgz",
+      "integrity": "sha512-i+zidfmTqtwquj4hMEwdjshYYgMbOrPzb9a0M3ZgNa0JMoZeFC6bxZvO8yr8ozS6ix2SDz0+mvryPeBs2TFE+w==",
       "dev": true,
       "license": "MIT"
     },

From d2f88a10fb0cf366708ec106696c812b8c85629c Mon Sep 17 00:00:00 2001
From: ehhuang <ehhuang@users.noreply.github.com>
Date: Wed, 10 Sep 2025 13:19:36 -0700
Subject: [PATCH 67/76] chore: telemetry test (#3405)

# What does this PR do?
- removed fixed-duration sleeps

## Test Plan
---
 .../telemetry/test_openai_telemetry.py          | 17 ++++++++---------
 tests/integration/telemetry/test_telemetry.py   |  5 +----
 .../telemetry/test_telemetry_metrics.py         |  5 +----
 3 files changed, 10 insertions(+), 17 deletions(-)

diff --git a/tests/integration/telemetry/test_openai_telemetry.py b/tests/integration/telemetry/test_openai_telemetry.py
index cdd9b6702..b3ffb6b09 100644
--- a/tests/integration/telemetry/test_openai_telemetry.py
+++ b/tests/integration/telemetry/test_openai_telemetry.py
@@ -49,16 +49,13 @@ def setup_openai_telemetry_data(llama_stack_client, text_model_id):
         traces = llama_stack_client.telemetry.query_traces(limit=10)
         if len(traces) >= 5:  # 5 OpenAI completion traces
             break
-        time.sleep(1)
+        time.sleep(0.1)
 
     if len(traces) < 5:
         pytest.fail(
             f"Failed to create sufficient OpenAI completion telemetry data after 30s. Got {len(traces)} traces."
         )
 
-    # Wait for 5 seconds to ensure traces has completed logging
-    time.sleep(5)
-
     yield
 
 
@@ -185,11 +182,13 @@ def test_openai_completion_creates_telemetry(llama_stack_client, text_model_id):
     assert len(response.choices) > 0, "Response should have at least one choice"
 
     # Wait for telemetry to be recorded
-    time.sleep(3)
-
-    # Check that we have more traces now
-    final_traces = llama_stack_client.telemetry.query_traces(limit=20)
-    final_count = len(final_traces)
+    start_time = time.time()
+    while time.time() - start_time < 30:
+        final_traces = llama_stack_client.telemetry.query_traces(limit=20)
+        final_count = len(final_traces)
+        if final_count > initial_count:
+            break
+        time.sleep(0.1)
 
     # Should have at least as many traces as before (might have more due to other activity)
     assert final_count >= initial_count, "Should have at least as many traces after OpenAI call"
diff --git a/tests/integration/telemetry/test_telemetry.py b/tests/integration/telemetry/test_telemetry.py
index d363edbc0..e86da954e 100644
--- a/tests/integration/telemetry/test_telemetry.py
+++ b/tests/integration/telemetry/test_telemetry.py
@@ -42,14 +42,11 @@ def setup_telemetry_data(llama_stack_client, text_model_id):
         traces = llama_stack_client.telemetry.query_traces(limit=10)
         if len(traces) >= 4:
             break
-        time.sleep(1)
+        time.sleep(0.1)
 
     if len(traces) < 4:
         pytest.fail(f"Failed to create sufficient telemetry data after 30s. Got {len(traces)} traces.")
 
-    # Wait for 5 seconds to ensure traces has completed logging
-    time.sleep(5)
-
     yield
 
 
diff --git a/tests/integration/telemetry/test_telemetry_metrics.py b/tests/integration/telemetry/test_telemetry_metrics.py
index 4ba2bd2d9..1d8312ae2 100644
--- a/tests/integration/telemetry/test_telemetry_metrics.py
+++ b/tests/integration/telemetry/test_telemetry_metrics.py
@@ -46,10 +46,7 @@ def setup_telemetry_metrics_data(openai_client, client_with_models, text_model_i
                 break
         except Exception:
             pass
-        time.sleep(1)
-
-    # Wait additional time to ensure all metrics are processed
-    time.sleep(5)
+        time.sleep(0.1)
 
     # Return the token lists for use in tests
     return {"prompt_tokens": prompt_tokens, "completion_tokens": completion_tokens, "total_tokens": total_tokens}

From c04f1c1e8c0b8c9df80ab51ce7379476cf218317 Mon Sep 17 00:00:00 2001
From: ehhuang <ehhuang@users.noreply.github.com>
Date: Wed, 10 Sep 2025 13:19:44 -0700
Subject: [PATCH 68/76] chore: move benchmarking related code (#3406)

# What does this PR do?
- moving things and some formatting changes


## Test Plan
---
 .../k8s-benchmark/README.md                   |   4 +-
 .../k8s-benchmark/apply.sh                    |   0
 .../k8s-benchmark/benchmark.py                | 129 +++++++------
 .../k8s-benchmark/openai-mock-server.py       | 170 ++++++++++--------
 .../k8s-benchmark/profile_running_server.sh   |   0
 .../k8s-benchmark/run-benchmark.sh            |   0
 .../k8s-benchmark/stack-configmap.yaml        |   0
 .../k8s-benchmark/stack-k8s.yaml.template     |   0
 .../k8s-benchmark/stack_run_config.yaml       |   0
 docs/source/contributing/index.md             |   2 +-
 10 files changed, 156 insertions(+), 149 deletions(-)
 rename {docs/source/distributions => benchmarking}/k8s-benchmark/README.md (98%)
 rename {docs/source/distributions => benchmarking}/k8s-benchmark/apply.sh (100%)
 rename {docs/source/distributions => benchmarking}/k8s-benchmark/benchmark.py (80%)
 rename {docs/source/distributions => benchmarking}/k8s-benchmark/openai-mock-server.py (60%)
 rename {docs/source/distributions => benchmarking}/k8s-benchmark/profile_running_server.sh (100%)
 rename {docs/source/distributions => benchmarking}/k8s-benchmark/run-benchmark.sh (100%)
 rename {docs/source/distributions => benchmarking}/k8s-benchmark/stack-configmap.yaml (100%)
 rename {docs/source/distributions => benchmarking}/k8s-benchmark/stack-k8s.yaml.template (100%)
 rename {docs/source/distributions => benchmarking}/k8s-benchmark/stack_run_config.yaml (100%)

diff --git a/docs/source/distributions/k8s-benchmark/README.md b/benchmarking/k8s-benchmark/README.md
similarity index 98%
rename from docs/source/distributions/k8s-benchmark/README.md
rename to benchmarking/k8s-benchmark/README.md
index 42da4d466..3b0d0c4db 100644
--- a/docs/source/distributions/k8s-benchmark/README.md
+++ b/benchmarking/k8s-benchmark/README.md
@@ -34,13 +34,12 @@ This data enables data-driven architectural decisions and performance optimizati
 
 **1. Deploy base k8s infrastructure:**
 ```bash
-cd ../k8s
+cd ../../docs/source/distributions/k8s
 ./apply.sh
 ```
 
 **2. Deploy benchmark components:**
 ```bash
-cd ../k8s-benchmark
 ./apply.sh
 ```
 
@@ -56,7 +55,6 @@ kubectl get pods
 
 **Benchmark Llama Stack (default):**
 ```bash
-cd docs/source/distributions/k8s-benchmark/
 ./run-benchmark.sh
 ```
 
diff --git a/docs/source/distributions/k8s-benchmark/apply.sh b/benchmarking/k8s-benchmark/apply.sh
similarity index 100%
rename from docs/source/distributions/k8s-benchmark/apply.sh
rename to benchmarking/k8s-benchmark/apply.sh
diff --git a/docs/source/distributions/k8s-benchmark/benchmark.py b/benchmarking/k8s-benchmark/benchmark.py
similarity index 80%
rename from docs/source/distributions/k8s-benchmark/benchmark.py
rename to benchmarking/k8s-benchmark/benchmark.py
index 83ba9602a..d5e34aa23 100644
--- a/docs/source/distributions/k8s-benchmark/benchmark.py
+++ b/benchmarking/k8s-benchmark/benchmark.py
@@ -14,7 +14,7 @@ import os
 import random
 import statistics
 import time
-from typing import Tuple
+
 import aiohttp
 
 
@@ -55,50 +55,50 @@ class BenchmarkStats:
 
         total_time = self.end_time - self.start_time
         success_rate = (self.success_count / self.total_requests) * 100
-        
-        print(f"\n{'='*60}")
-        print(f"BENCHMARK RESULTS")
-        
-        print(f"\nResponse Time Statistics:")
+
+        print(f"\n{'=' * 60}")
+        print("BENCHMARK RESULTS")
+
+        print("\nResponse Time Statistics:")
         print(f"  Mean: {statistics.mean(self.response_times):.3f}s")
         print(f"  Median: {statistics.median(self.response_times):.3f}s")
         print(f"  Min: {min(self.response_times):.3f}s")
         print(f"  Max: {max(self.response_times):.3f}s")
-        
+
         if len(self.response_times) > 1:
             print(f"  Std Dev: {statistics.stdev(self.response_times):.3f}s")
-            
+
         percentiles = [50, 90, 95, 99]
         sorted_times = sorted(self.response_times)
-        print(f"\nPercentiles:")
+        print("\nPercentiles:")
         for p in percentiles:
             idx = int(len(sorted_times) * p / 100) - 1
             idx = max(0, min(idx, len(sorted_times) - 1))
             print(f"  P{p}: {sorted_times[idx]:.3f}s")
-            
+
         if self.ttft_times:
-            print(f"\nTime to First Token (TTFT) Statistics:")
+            print("\nTime to First Token (TTFT) Statistics:")
             print(f"  Mean: {statistics.mean(self.ttft_times):.3f}s")
             print(f"  Median: {statistics.median(self.ttft_times):.3f}s")
             print(f"  Min: {min(self.ttft_times):.3f}s")
             print(f"  Max: {max(self.ttft_times):.3f}s")
-            
+
             if len(self.ttft_times) > 1:
                 print(f"  Std Dev: {statistics.stdev(self.ttft_times):.3f}s")
-                
+
             sorted_ttft = sorted(self.ttft_times)
-            print(f"\nTTFT Percentiles:")
+            print("\nTTFT Percentiles:")
             for p in percentiles:
                 idx = int(len(sorted_ttft) * p / 100) - 1
                 idx = max(0, min(idx, len(sorted_ttft) - 1))
                 print(f"  P{p}: {sorted_ttft[idx]:.3f}s")
-            
+
         if self.chunks_received:
-            print(f"\nStreaming Statistics:")
+            print("\nStreaming Statistics:")
             print(f"  Mean chunks per response: {statistics.mean(self.chunks_received):.1f}")
             print(f"  Total chunks received: {sum(self.chunks_received)}")
-        
-        print(f"{'='*60}")
+
+        print(f"{'=' * 60}")
         print(f"Total time: {total_time:.2f}s")
         print(f"Concurrent users: {self.concurrent_users}")
         print(f"Total requests: {self.total_requests}")
@@ -106,16 +106,16 @@ class BenchmarkStats:
         print(f"Failed requests: {len(self.errors)}")
         print(f"Success rate: {success_rate:.1f}%")
         print(f"Requests per second: {self.success_count / total_time:.2f}")
-        
+
         if self.errors:
-            print(f"\nErrors (showing first 5):")
+            print("\nErrors (showing first 5):")
             for error in self.errors[:5]:
                 print(f"  {error}")
 
 
 class LlamaStackBenchmark:
     def __init__(self, base_url: str, model_id: str):
-        self.base_url = base_url.rstrip('/')
+        self.base_url = base_url.rstrip("/")
         self.model_id = model_id
         self.headers = {"Content-Type": "application/json"}
         self.test_messages = [
@@ -126,74 +126,67 @@ class LlamaStackBenchmark:
             [
                 {"role": "user", "content": "What is machine learning?"},
                 {"role": "assistant", "content": "Machine learning is a subset of AI..."},
-                {"role": "user", "content": "Can you give me a practical example?"}
-            ]
+                {"role": "user", "content": "Can you give me a practical example?"},
+            ],
         ]
 
-
-    async def make_async_streaming_request(self) -> Tuple[float, int, float | None, str | None]:
+    async def make_async_streaming_request(self) -> tuple[float, int, float | None, str | None]:
         """Make a single async streaming chat completion request."""
         messages = random.choice(self.test_messages)
-        payload = {
-            "model": self.model_id,
-            "messages": messages,
-            "stream": True,
-            "max_tokens": 100
-        }
-        
+        payload = {"model": self.model_id, "messages": messages, "stream": True, "max_tokens": 100}
+
         start_time = time.time()
         chunks_received = 0
         ttft = None
         error = None
-        
+
         session = aiohttp.ClientSession()
-        
+
         try:
             async with session.post(
                 f"{self.base_url}/chat/completions",
                 headers=self.headers,
                 json=payload,
-                timeout=aiohttp.ClientTimeout(total=30)
+                timeout=aiohttp.ClientTimeout(total=30),
             ) as response:
                 if response.status == 200:
                     async for line in response.content:
                         if line:
-                            line_str = line.decode('utf-8').strip()
-                            if line_str.startswith('data: '):
+                            line_str = line.decode("utf-8").strip()
+                            if line_str.startswith("data: "):
                                 chunks_received += 1
                                 if ttft is None:
                                     ttft = time.time() - start_time
-                                if line_str == 'data: [DONE]':
+                                if line_str == "data: [DONE]":
                                     break
-                    
+
                     if chunks_received == 0:
                         error = "No streaming chunks received"
                 else:
                     text = await response.text()
                     error = f"HTTP {response.status}: {text[:100]}"
-                    
+
         except Exception as e:
             error = f"Request error: {str(e)}"
         finally:
             await session.close()
-            
+
         response_time = time.time() - start_time
         return response_time, chunks_received, ttft, error
 
-
     async def run_benchmark(self, duration: int, concurrent_users: int) -> BenchmarkStats:
         """Run benchmark using async requests for specified duration."""
         stats = BenchmarkStats()
         stats.concurrent_users = concurrent_users
         stats.start_time = time.time()
-        
+
         print(f"Starting benchmark: {duration}s duration, {concurrent_users} concurrent users")
         print(f"Target URL: {self.base_url}/chat/completions")
         print(f"Model: {self.model_id}")
-        
+
         connector = aiohttp.TCPConnector(limit=concurrent_users)
-        async with aiohttp.ClientSession(connector=connector) as session:
-            
+        async with aiohttp.ClientSession(connector=connector):
+
             async def worker(worker_id: int):
                 """Worker that sends requests sequentially until canceled."""
                 request_count = 0
@@ -202,12 +195,12 @@ class LlamaStackBenchmark:
                         response_time, chunks, ttft, error = await self.make_async_streaming_request()
                         await stats.add_result(response_time, chunks, ttft, error)
                         request_count += 1
-                        
+
                     except asyncio.CancelledError:
                         break
                     except Exception as e:
                         await stats.add_result(0, 0, None, f"Worker {worker_id} error: {str(e)}")
-            
+
             # Progress reporting task
             async def progress_reporter():
                 last_report_time = time.time()
@@ -216,48 +209,52 @@ class LlamaStackBenchmark:
                         await asyncio.sleep(1)  # Report every second
                         if time.time() >= last_report_time + 10:  # Report every 10 seconds
                             elapsed = time.time() - stats.start_time
-                            print(f"Completed: {stats.total_requests} requests in {elapsed:.1f}s, RPS: {stats.total_requests / elapsed:.1f}")
+                            print(
+                                f"Completed: {stats.total_requests} requests in {elapsed:.1f}s, RPS: {stats.total_requests / elapsed:.1f}"
+                            )
                             last_report_time = time.time()
                     except asyncio.CancelledError:
                         break
-            
+
             # Spawn concurrent workers
             tasks = [asyncio.create_task(worker(i)) for i in range(concurrent_users)]
             progress_task = asyncio.create_task(progress_reporter())
             tasks.append(progress_task)
-            
+
             # Wait for duration then cancel all tasks
             await asyncio.sleep(duration)
-            
+
             for task in tasks:
                 task.cancel()
-            
+
             # Wait for all tasks to complete
             await asyncio.gather(*tasks, return_exceptions=True)
-        
+
         stats.end_time = time.time()
         return stats
 
 
 def main():
     parser = argparse.ArgumentParser(description="Llama Stack Benchmark Tool")
-    parser.add_argument("--base-url", default=os.getenv("BENCHMARK_BASE_URL", "http://localhost:8000/v1/openai/v1"),
-                       help="Base URL for the API (default: http://localhost:8000/v1/openai/v1)")
-    parser.add_argument("--model", default=os.getenv("INFERENCE_MODEL", "test-model"),
-                       help="Model ID to use for requests")
-    parser.add_argument("--duration", type=int, default=60,
-                       help="Duration in seconds to run benchmark (default: 60)")
-    parser.add_argument("--concurrent", type=int, default=10,
-                       help="Number of concurrent users (default: 10)")
-    
+    parser.add_argument(
+        "--base-url",
+        default=os.getenv("BENCHMARK_BASE_URL", "http://localhost:8000/v1/openai/v1"),
+        help="Base URL for the API (default: http://localhost:8000/v1/openai/v1)",
+    )
+    parser.add_argument(
+        "--model", default=os.getenv("INFERENCE_MODEL", "test-model"), help="Model ID to use for requests"
+    )
+    parser.add_argument("--duration", type=int, default=60, help="Duration in seconds to run benchmark (default: 60)")
+    parser.add_argument("--concurrent", type=int, default=10, help="Number of concurrent users (default: 10)")
+
     args = parser.parse_args()
-    
+
     benchmark = LlamaStackBenchmark(args.base_url, args.model)
-    
+
     try:
         stats = asyncio.run(benchmark.run_benchmark(args.duration, args.concurrent))
         stats.print_summary()
-        
+
     except KeyboardInterrupt:
         print("\nBenchmark interrupted by user")
     except Exception as e:
diff --git a/docs/source/distributions/k8s-benchmark/openai-mock-server.py b/benchmarking/k8s-benchmark/openai-mock-server.py
similarity index 60%
rename from docs/source/distributions/k8s-benchmark/openai-mock-server.py
rename to benchmarking/k8s-benchmark/openai-mock-server.py
index de0680842..9e898af8e 100755
--- a/docs/source/distributions/k8s-benchmark/openai-mock-server.py
+++ b/benchmarking/k8s-benchmark/openai-mock-server.py
@@ -11,180 +11,192 @@ OpenAI-compatible mock server that returns:
 - Valid OpenAI-formatted chat completion responses with dynamic content
 """
 
-from flask import Flask, request, jsonify, Response
-import time
-import random
-import uuid
-import json
 import argparse
+import json
 import os
+import random
+import time
+import uuid
+
+from flask import Flask, Response, jsonify, request
 
 app = Flask(__name__)
 
+
 # Models from environment variables
 def get_models():
     models_str = os.getenv("MOCK_MODELS", "meta-llama/Llama-3.2-3B-Instruct")
     model_ids = [m.strip() for m in models_str.split(",") if m.strip()]
-    
+
     return {
         "object": "list",
         "data": [
-            {
-                "id": model_id,
-                "object": "model",
-                "created": 1234567890,
-                "owned_by": "vllm"
-            }
-            for model_id in model_ids
-        ]
+            {"id": model_id, "object": "model", "created": 1234567890, "owned_by": "vllm"} for model_id in model_ids
+        ],
     }
 
+
 def generate_random_text(length=50):
     """Generate random but coherent text for responses."""
     words = [
-        "Hello", "there", "I'm", "an", "AI", "assistant", "ready", "to", "help", "you",
-        "with", "your", "questions", "and", "tasks", "today", "Let", "me","know", "what",
-        "you'd", "like", "to", "discuss", "or", "explore", "together", "I", "can", "assist",
-        "with", "various", "topics", "including", "coding", "writing", "analysis", "and", "more"
+        "Hello",
+        "there",
+        "I'm",
+        "an",
+        "AI",
+        "assistant",
+        "ready",
+        "to",
+        "help",
+        "you",
+        "with",
+        "your",
+        "questions",
+        "and",
+        "tasks",
+        "today",
+        "Let",
+        "me",
+        "know",
+        "what",
+        "you'd",
+        "like",
+        "to",
+        "discuss",
+        "or",
+        "explore",
+        "together",
+        "I",
+        "can",
+        "assist",
+        "with",
+        "various",
+        "topics",
+        "including",
+        "coding",
+        "writing",
+        "analysis",
+        "and",
+        "more",
     ]
     return " ".join(random.choices(words, k=length))
 
-@app.route('/v1/models', methods=['GET'])
+
+@app.route("/v1/models", methods=["GET"])
 def list_models():
     models = get_models()
     print(f"[MOCK] Returning models: {[m['id'] for m in models['data']]}")
     return jsonify(models)
 
-@app.route('/v1/chat/completions', methods=['POST'])
+
+@app.route("/v1/chat/completions", methods=["POST"])
 def chat_completions():
     """Return OpenAI-formatted chat completion responses."""
     data = request.get_json()
-    default_model = get_models()['data'][0]['id']
-    model = data.get('model', default_model)
-    messages = data.get('messages', [])
-    stream = data.get('stream', False)
-     
+    default_model = get_models()["data"][0]["id"]
+    model = data.get("model", default_model)
+    messages = data.get("messages", [])
+    stream = data.get("stream", False)
+
     print(f"[MOCK] Chat completion request - model: {model}, stream: {stream}")
-    
+
     if stream:
         return handle_streaming_completion(model, messages)
     else:
         return handle_non_streaming_completion(model, messages)
 
+
 def handle_non_streaming_completion(model, messages):
     response_text = generate_random_text(random.randint(20, 80))
-    
+
     # Calculate realistic token counts
-    prompt_tokens = sum(len(str(msg.get('content', '')).split()) for msg in messages)
+    prompt_tokens = sum(len(str(msg.get("content", "")).split()) for msg in messages)
     completion_tokens = len(response_text.split())
-    
+
     response = {
         "id": f"chatcmpl-{uuid.uuid4().hex[:8]}",
         "object": "chat.completion",
         "created": int(time.time()),
         "model": model,
-        "choices": [
-            {
-                "index": 0,
-                "message": {
-                    "role": "assistant",
-                    "content": response_text
-                },
-                "finish_reason": "stop"
-            }
-        ],
+        "choices": [{"index": 0, "message": {"role": "assistant", "content": response_text}, "finish_reason": "stop"}],
         "usage": {
             "prompt_tokens": prompt_tokens,
             "completion_tokens": completion_tokens,
-            "total_tokens": prompt_tokens + completion_tokens
-        }
+            "total_tokens": prompt_tokens + completion_tokens,
+        },
     }
-    
+
     return jsonify(response)
 
+
 def handle_streaming_completion(model, messages):
     def generate_stream():
         # Generate response text
         full_response = generate_random_text(random.randint(30, 100))
         words = full_response.split()
-        
+
         # Send initial chunk
         initial_chunk = {
             "id": f"chatcmpl-{uuid.uuid4().hex[:8]}",
             "object": "chat.completion.chunk",
             "created": int(time.time()),
             "model": model,
-            "choices": [
-                {
-                    "index": 0,
-                    "delta": {"role": "assistant", "content": ""}
-                }
-            ]
+            "choices": [{"index": 0, "delta": {"role": "assistant", "content": ""}}],
         }
         yield f"data: {json.dumps(initial_chunk)}\n\n"
-        
+
         # Send word by word
         for i, word in enumerate(words):
             chunk = {
                 "id": f"chatcmpl-{uuid.uuid4().hex[:8]}",
-                "object": "chat.completion.chunk", 
+                "object": "chat.completion.chunk",
                 "created": int(time.time()),
                 "model": model,
-                "choices": [
-                    {
-                        "index": 0,
-                        "delta": {"content": f"{word} " if i < len(words) - 1 else word}
-                    }
-                ]
+                "choices": [{"index": 0, "delta": {"content": f"{word} " if i < len(words) - 1 else word}}],
             }
             yield f"data: {json.dumps(chunk)}\n\n"
             # Configurable delay to simulate realistic streaming
             stream_delay = float(os.getenv("STREAM_DELAY_SECONDS", "0.005"))
             time.sleep(stream_delay)
-        
+
         # Send final chunk
         final_chunk = {
             "id": f"chatcmpl-{uuid.uuid4().hex[:8]}",
             "object": "chat.completion.chunk",
             "created": int(time.time()),
             "model": model,
-            "choices": [
-                {
-                    "index": 0,
-                    "delta": {"content": ""},
-                    "finish_reason": "stop"
-                }
-            ]
+            "choices": [{"index": 0, "delta": {"content": ""}, "finish_reason": "stop"}],
         }
         yield f"data: {json.dumps(final_chunk)}\n\n"
         yield "data: [DONE]\n\n"
-    
+
     return Response(
         generate_stream(),
-        mimetype='text/event-stream',
+        mimetype="text/event-stream",
         headers={
-            'Cache-Control': 'no-cache',
-            'Connection': 'keep-alive',
-            'Access-Control-Allow-Origin': '*',
-        }
+            "Cache-Control": "no-cache",
+            "Connection": "keep-alive",
+            "Access-Control-Allow-Origin": "*",
+        },
     )
 
-@app.route('/health', methods=['GET'])
+
+@app.route("/health", methods=["GET"])
 def health():
     return jsonify({"status": "healthy", "type": "openai-mock"})
 
-if __name__ == '__main__':
-    parser = argparse.ArgumentParser(description='OpenAI-compatible mock server')
-    parser.add_argument('--port', type=int, default=8081, 
-                       help='Port to run the server on (default: 8081)')
+
+if __name__ == "__main__":
+    parser = argparse.ArgumentParser(description="OpenAI-compatible mock server")
+    parser.add_argument("--port", type=int, default=8081, help="Port to run the server on (default: 8081)")
     args = parser.parse_args()
-    
+
     port = args.port
-    
+
     models = get_models()
     print("Starting OpenAI-compatible mock server...")
     print(f"- /models endpoint with: {[m['id'] for m in models['data']]}")
     print("- OpenAI-formatted chat/completion responses with dynamic content")
     print("- Streaming support with valid SSE format")
     print(f"- Listening on: http://0.0.0.0:{port}")
-    app.run(host='0.0.0.0', port=port, debug=False)
+    app.run(host="0.0.0.0", port=port, debug=False)
diff --git a/docs/source/distributions/k8s-benchmark/profile_running_server.sh b/benchmarking/k8s-benchmark/profile_running_server.sh
similarity index 100%
rename from docs/source/distributions/k8s-benchmark/profile_running_server.sh
rename to benchmarking/k8s-benchmark/profile_running_server.sh
diff --git a/docs/source/distributions/k8s-benchmark/run-benchmark.sh b/benchmarking/k8s-benchmark/run-benchmark.sh
similarity index 100%
rename from docs/source/distributions/k8s-benchmark/run-benchmark.sh
rename to benchmarking/k8s-benchmark/run-benchmark.sh
diff --git a/docs/source/distributions/k8s-benchmark/stack-configmap.yaml b/benchmarking/k8s-benchmark/stack-configmap.yaml
similarity index 100%
rename from docs/source/distributions/k8s-benchmark/stack-configmap.yaml
rename to benchmarking/k8s-benchmark/stack-configmap.yaml
diff --git a/docs/source/distributions/k8s-benchmark/stack-k8s.yaml.template b/benchmarking/k8s-benchmark/stack-k8s.yaml.template
similarity index 100%
rename from docs/source/distributions/k8s-benchmark/stack-k8s.yaml.template
rename to benchmarking/k8s-benchmark/stack-k8s.yaml.template
diff --git a/docs/source/distributions/k8s-benchmark/stack_run_config.yaml b/benchmarking/k8s-benchmark/stack_run_config.yaml
similarity index 100%
rename from docs/source/distributions/k8s-benchmark/stack_run_config.yaml
rename to benchmarking/k8s-benchmark/stack_run_config.yaml
diff --git a/docs/source/contributing/index.md b/docs/source/contributing/index.md
index 1846f4d97..71c3bd5a6 100644
--- a/docs/source/contributing/index.md
+++ b/docs/source/contributing/index.md
@@ -35,5 +35,5 @@ testing/record-replay
 
 ### Benchmarking
 
-```{include} ../../../docs/source/distributions/k8s-benchmark/README.md
+```{include} ../../../benchmarking/k8s-benchmark/README.md
 ```

From 0c7f49490cdb6ff757659469d1401b515ac4402c Mon Sep 17 00:00:00 2001
From: Ashwin Bharambe <ashwin.bharambe@gmail.com>
Date: Wed, 10 Sep 2025 14:34:18 -0700
Subject: [PATCH 69/76] fix(inference_store): on duplicate chat completion IDs,
 replace (#3408)

# What does this PR do?

Duplicate chat completion IDs can be generated during tests especially
if they are replaying recorded responses across different tests. No need
to warn or error under those circumstances. In the wild, this is not
likely to happen at all (no evidence) so we aren't really hiding any
problem.
---
 .../utils/inference/inference_store.py        | 48 +++++++++++++++----
 .../utils/sqlstore/authorized_sqlstore.py     | 14 ++++++
 2 files changed, 53 insertions(+), 9 deletions(-)

diff --git a/llama_stack/providers/utils/inference/inference_store.py b/llama_stack/providers/utils/inference/inference_store.py
index 8c69b1683..17f4c6268 100644
--- a/llama_stack/providers/utils/inference/inference_store.py
+++ b/llama_stack/providers/utils/inference/inference_store.py
@@ -6,6 +6,8 @@
 import asyncio
 from typing import Any
 
+from sqlalchemy.exc import IntegrityError
+
 from llama_stack.apis.inference import (
     ListOpenAIChatCompletionResponse,
     OpenAIChatCompletion,
@@ -129,16 +131,44 @@ class InferenceStore:
             raise ValueError("Inference store is not initialized")
 
         data = chat_completion.model_dump()
+        record_data = {
+            "id": data["id"],
+            "created": data["created"],
+            "model": data["model"],
+            "choices": data["choices"],
+            "input_messages": [message.model_dump() for message in input_messages],
+        }
 
-        await self.sql_store.insert(
-            table="chat_completions",
-            data={
-                "id": data["id"],
-                "created": data["created"],
-                "model": data["model"],
-                "choices": data["choices"],
-                "input_messages": [message.model_dump() for message in input_messages],
-            },
+        try:
+            await self.sql_store.insert(
+                table="chat_completions",
+                data=record_data,
+            )
+        except IntegrityError as e:
+            # Duplicate chat completion IDs can be generated during tests especially if they are replaying
+            # recorded responses across different tests. No need to warn or error under those circumstances.
+            # In the wild, this is not likely to happen at all (no evidence) so we aren't really hiding any problem.
+
+            # Check if it's a unique constraint violation
+            error_message = str(e.orig) if e.orig else str(e)
+            if self._is_unique_constraint_error(error_message):
+                # Update the existing record instead
+                await self.sql_store.update(table="chat_completions", data=record_data, where={"id": data["id"]})
+            else:
+                # Re-raise if it's not a unique constraint error
+                raise
+
+    def _is_unique_constraint_error(self, error_message: str) -> bool:
+        """Check if the error is specifically a unique constraint violation."""
+        error_lower = error_message.lower()
+        return any(
+            indicator in error_lower
+            for indicator in [
+                "unique constraint failed",  # SQLite
+                "duplicate key",  # PostgreSQL
+                "unique violation",  # PostgreSQL alternative
+                "duplicate entry",  # MySQL
+            ]
         )
 
     async def list_chat_completions(
diff --git a/llama_stack/providers/utils/sqlstore/authorized_sqlstore.py b/llama_stack/providers/utils/sqlstore/authorized_sqlstore.py
index 867ba2f55..acb688f96 100644
--- a/llama_stack/providers/utils/sqlstore/authorized_sqlstore.py
+++ b/llama_stack/providers/utils/sqlstore/authorized_sqlstore.py
@@ -172,6 +172,20 @@ class AuthorizedSqlStore:
 
         return results.data[0] if results.data else None
 
+    async def update(self, table: str, data: Mapping[str, Any], where: Mapping[str, Any]) -> None:
+        """Update rows with automatic access control attribute capture."""
+        enhanced_data = dict(data)
+
+        current_user = get_authenticated_user()
+        if current_user:
+            enhanced_data["owner_principal"] = current_user.principal
+            enhanced_data["access_attributes"] = current_user.attributes
+        else:
+            enhanced_data["owner_principal"] = None
+            enhanced_data["access_attributes"] = None
+
+        await self.sql_store.update(table, enhanced_data, where)
+
     async def delete(self, table: str, where: Mapping[str, Any]) -> None:
         """Delete rows with automatic access control filtering."""
         await self.sql_store.delete(table, where)

From 8e05c68d159a40d54768a9473d63b68a5bfbf369 Mon Sep 17 00:00:00 2001
From: =?UTF-8?q?S=C3=A9bastien=20Han?= <seb@redhat.com>
Date: Thu, 11 Sep 2025 10:19:59 +0200
Subject: [PATCH 70/76] chore: remove openai dependency from providers (#3398)
MIME-Version: 1.0
Content-Type: text/plain; charset=UTF-8
Content-Transfer-Encoding: 8bit

# What does this PR do?

The openai package is already a dependency of the llama-stack project
itself, so let's the project dictate which openai version we need and
avoid potential breakage with unsatisfiable dependency resolution.

Signed-off-by: Sébastien Han <seb@redhat.com>
---
 llama_stack/providers/registry/batches.py   |  2 +-
 llama_stack/providers/registry/inference.py | 20 ++++++++------------
 llama_stack/providers/registry/scoring.py   |  2 +-
 pyproject.toml                              |  4 +---
 uv.lock                                     |  8 ++------
 5 files changed, 13 insertions(+), 23 deletions(-)

diff --git a/llama_stack/providers/registry/batches.py b/llama_stack/providers/registry/batches.py
index de7886efb..a07942486 100644
--- a/llama_stack/providers/registry/batches.py
+++ b/llama_stack/providers/registry/batches.py
@@ -13,7 +13,7 @@ def available_providers() -> list[ProviderSpec]:
         InlineProviderSpec(
             api=Api.batches,
             provider_type="inline::reference",
-            pip_packages=["openai"],
+            pip_packages=[],
             module="llama_stack.providers.inline.batches.reference",
             config_class="llama_stack.providers.inline.batches.reference.config.ReferenceBatchesImplConfig",
             api_dependencies=[
diff --git a/llama_stack/providers/registry/inference.py b/llama_stack/providers/registry/inference.py
index 541fbb432..8912560cb 100644
--- a/llama_stack/providers/registry/inference.py
+++ b/llama_stack/providers/registry/inference.py
@@ -75,7 +75,7 @@ def available_providers() -> list[ProviderSpec]:
             api=Api.inference,
             adapter=AdapterSpec(
                 adapter_type="vllm",
-                pip_packages=["openai"],
+                pip_packages=[],
                 module="llama_stack.providers.remote.inference.vllm",
                 config_class="llama_stack.providers.remote.inference.vllm.VLLMInferenceAdapterConfig",
                 description="Remote vLLM inference provider for connecting to vLLM servers.",
@@ -151,9 +151,7 @@ def available_providers() -> list[ProviderSpec]:
             api=Api.inference,
             adapter=AdapterSpec(
                 adapter_type="databricks",
-                pip_packages=[
-                    "openai",
-                ],
+                pip_packages=[],
                 module="llama_stack.providers.remote.inference.databricks",
                 config_class="llama_stack.providers.remote.inference.databricks.DatabricksImplConfig",
                 description="Databricks inference provider for running models on Databricks' unified analytics platform.",
@@ -163,9 +161,7 @@ def available_providers() -> list[ProviderSpec]:
             api=Api.inference,
             adapter=AdapterSpec(
                 adapter_type="nvidia",
-                pip_packages=[
-                    "openai",
-                ],
+                pip_packages=[],
                 module="llama_stack.providers.remote.inference.nvidia",
                 config_class="llama_stack.providers.remote.inference.nvidia.NVIDIAConfig",
                 description="NVIDIA inference provider for accessing NVIDIA NIM models and AI services.",
@@ -175,7 +171,7 @@ def available_providers() -> list[ProviderSpec]:
             api=Api.inference,
             adapter=AdapterSpec(
                 adapter_type="runpod",
-                pip_packages=["openai"],
+                pip_packages=[],
                 module="llama_stack.providers.remote.inference.runpod",
                 config_class="llama_stack.providers.remote.inference.runpod.RunpodImplConfig",
                 description="RunPod inference provider for running models on RunPod's cloud GPU platform.",
@@ -207,7 +203,7 @@ def available_providers() -> list[ProviderSpec]:
             api=Api.inference,
             adapter=AdapterSpec(
                 adapter_type="gemini",
-                pip_packages=["litellm", "openai"],
+                pip_packages=["litellm"],
                 module="llama_stack.providers.remote.inference.gemini",
                 config_class="llama_stack.providers.remote.inference.gemini.GeminiConfig",
                 provider_data_validator="llama_stack.providers.remote.inference.gemini.config.GeminiProviderDataValidator",
@@ -218,7 +214,7 @@ def available_providers() -> list[ProviderSpec]:
             api=Api.inference,
             adapter=AdapterSpec(
                 adapter_type="vertexai",
-                pip_packages=["litellm", "google-cloud-aiplatform", "openai"],
+                pip_packages=["litellm", "google-cloud-aiplatform"],
                 module="llama_stack.providers.remote.inference.vertexai",
                 config_class="llama_stack.providers.remote.inference.vertexai.VertexAIConfig",
                 provider_data_validator="llama_stack.providers.remote.inference.vertexai.config.VertexAIProviderDataValidator",
@@ -248,7 +244,7 @@ Available Models:
             api=Api.inference,
             adapter=AdapterSpec(
                 adapter_type="groq",
-                pip_packages=["litellm", "openai"],
+                pip_packages=["litellm"],
                 module="llama_stack.providers.remote.inference.groq",
                 config_class="llama_stack.providers.remote.inference.groq.GroqConfig",
                 provider_data_validator="llama_stack.providers.remote.inference.groq.config.GroqProviderDataValidator",
@@ -270,7 +266,7 @@ Available Models:
             api=Api.inference,
             adapter=AdapterSpec(
                 adapter_type="sambanova",
-                pip_packages=["litellm", "openai"],
+                pip_packages=["litellm"],
                 module="llama_stack.providers.remote.inference.sambanova",
                 config_class="llama_stack.providers.remote.inference.sambanova.SambaNovaImplConfig",
                 provider_data_validator="llama_stack.providers.remote.inference.sambanova.config.SambaNovaProviderDataValidator",
diff --git a/llama_stack/providers/registry/scoring.py b/llama_stack/providers/registry/scoring.py
index 79293d888..a4ec54ed2 100644
--- a/llama_stack/providers/registry/scoring.py
+++ b/llama_stack/providers/registry/scoring.py
@@ -38,7 +38,7 @@ def available_providers() -> list[ProviderSpec]:
         InlineProviderSpec(
             api=Api.scoring,
             provider_type="inline::braintrust",
-            pip_packages=["autoevals", "openai"],
+            pip_packages=["autoevals"],
             module="llama_stack.providers.inline.scoring.braintrust",
             config_class="llama_stack.providers.inline.scoring.braintrust.BraintrustScoringConfig",
             api_dependencies=[
diff --git a/pyproject.toml b/pyproject.toml
index 0414aafb0..72c4f6f9e 100644
--- a/pyproject.toml
+++ b/pyproject.toml
@@ -32,7 +32,7 @@ dependencies = [
     "jinja2>=3.1.6",
     "jsonschema",
     "llama-stack-client>=0.2.21",
-    "openai>=1.99.6",
+    "openai>=1.100.0",                                # for expires_after support
     "prompt-toolkit",
     "python-dotenv",
     "python-jose[cryptography]",
@@ -80,7 +80,6 @@ dev = [
 unit = [
     "sqlite-vec",
     "ollama",
-    "openai",
     "aiosqlite",
     "aiohttp",
     "psycopg2-binary>=2.9.0",
@@ -105,7 +104,6 @@ unit = [
 # separately. If you are using "uv" to execute your tests, you can use the "--group" flag to specify extra
 # dependencies.
 test = [
-    "openai>=1.100.0",  # for expires_after support
     "aiosqlite",
     "aiohttp",
     "torch>=2.6.0",
diff --git a/uv.lock b/uv.lock
index 3d7713f54..065eb3876 100644
--- a/uv.lock
+++ b/uv.lock
@@ -1,5 +1,5 @@
 version = 1
-revision = 3
+revision = 2
 requires-python = ">=3.12"
 resolution-markers = [
     "(python_full_version >= '3.13' and platform_machine != 'aarch64' and sys_platform == 'linux') or (python_full_version >= '3.13' and sys_platform != 'darwin' and sys_platform != 'linux')",
@@ -1839,7 +1839,6 @@ test = [
     { name = "datasets" },
     { name = "mcp" },
     { name = "milvus-lite" },
-    { name = "openai" },
     { name = "psycopg2-binary" },
     { name = "pymilvus" },
     { name = "pypdf" },
@@ -1865,7 +1864,6 @@ unit = [
     { name = "milvus-lite" },
     { name = "moto", extra = ["s3"] },
     { name = "ollama" },
-    { name = "openai" },
     { name = "psycopg2-binary" },
     { name = "pymilvus" },
     { name = "pypdf" },
@@ -1889,7 +1887,7 @@ requires-dist = [
     { name = "jsonschema" },
     { name = "llama-stack-client", specifier = ">=0.2.21" },
     { name = "llama-stack-client", marker = "extra == 'ui'", specifier = ">=0.2.21" },
-    { name = "openai", specifier = ">=1.99.6" },
+    { name = "openai", specifier = ">=1.100.0" },
     { name = "opentelemetry-exporter-otlp-proto-http", specifier = ">=1.30.0" },
     { name = "opentelemetry-sdk", specifier = ">=1.30.0" },
     { name = "pandas", marker = "extra == 'ui'" },
@@ -1959,7 +1957,6 @@ test = [
     { name = "datasets", specifier = ">=4.0.0" },
     { name = "mcp" },
     { name = "milvus-lite", specifier = ">=2.5.0" },
-    { name = "openai", specifier = ">=1.100.0" },
     { name = "psycopg2-binary", specifier = ">=2.9.0" },
     { name = "pymilvus", specifier = ">=2.6.1" },
     { name = "pypdf" },
@@ -1984,7 +1981,6 @@ unit = [
     { name = "milvus-lite", specifier = ">=2.5.0" },
     { name = "moto", extras = ["s3"], specifier = ">=5.1.10" },
     { name = "ollama" },
-    { name = "openai" },
     { name = "psycopg2-binary", specifier = ">=2.9.0" },
     { name = "pymilvus", specifier = ">=2.6.1" },
     { name = "pypdf" },

From 2838d5a20f888c9f8fad666272dd9ca8d3bb4884 Mon Sep 17 00:00:00 2001
From: Sumanth Kamenani <skamenan@redhat.com>
Date: Thu, 11 Sep 2025 05:41:53 -0400
Subject: [PATCH 71/76] fix: AWS Bedrock inference profile ID conversion for
 region-specific endpoints (#3386)

Fixes #3370

AWS switched to requiring region-prefixed inference profile IDs instead
of foundation model IDs for on-demand throughput. This was causing
ValidationException errors.

Added auto-detection based on boto3 client region to convert model IDs
like meta.llama3-1-70b-instruct-v1:0 to
us.meta.llama3-1-70b-instruct-v1:0 depending on the detected region.

Also handles edge cases like ARNs, case insensitive regions, and None
regions.

Tested with this request.
```json
{
  "model_id": "meta.llama3-1-8b-instruct-v1:0",
  "messages": [
    {
      "role": "system",
      "content": "You are a helpful assistant."
    },
    {
      "role": "user",
      "content": "tell me a riddle"
    }
  ],
  "sampling_params": {
     "strategy": {
        "type": "top_p",
        "temperature": 0.7,
        "top_p": 0.9
      },
      "max_tokens": 512
  }
}
```
<img width="1488" height="878" alt="image"
src="https://github.com/user-attachments/assets/0d61beec-3869-4a31-8f37-9f554c280b88"
/>
---
 .../remote/inference/bedrock/bedrock.py       | 51 +++++++++++++++++-
 tests/unit/providers/test_bedrock.py          | 53 +++++++++++++++++++
 2 files changed, 102 insertions(+), 2 deletions(-)
 create mode 100644 tests/unit/providers/test_bedrock.py

diff --git a/llama_stack/providers/remote/inference/bedrock/bedrock.py b/llama_stack/providers/remote/inference/bedrock/bedrock.py
index 63ea196f6..106caed9b 100644
--- a/llama_stack/providers/remote/inference/bedrock/bedrock.py
+++ b/llama_stack/providers/remote/inference/bedrock/bedrock.py
@@ -53,6 +53,43 @@ from llama_stack.providers.utils.inference.prompt_adapter import (
 
 from .models import MODEL_ENTRIES
 
+REGION_PREFIX_MAP = {
+    "us": "us.",
+    "eu": "eu.",
+    "ap": "ap.",
+}
+
+
+def _get_region_prefix(region: str | None) -> str:
+    # AWS requires region prefixes for inference profiles
+    if region is None:
+        return "us."  # default to US when we don't know
+
+    # Handle case insensitive region matching
+    region_lower = region.lower()
+    for prefix in REGION_PREFIX_MAP:
+        if region_lower.startswith(f"{prefix}-"):
+            return REGION_PREFIX_MAP[prefix]
+
+    # Fallback to US for anything we don't recognize
+    return "us."
+
+
+def _to_inference_profile_id(model_id: str, region: str = None) -> str:
+    # Return ARNs unchanged
+    if model_id.startswith("arn:"):
+        return model_id
+
+    # Return inference profile IDs that already have regional prefixes
+    if any(model_id.startswith(p) for p in REGION_PREFIX_MAP.values()):
+        return model_id
+
+    # Default to US East when no region is provided
+    if region is None:
+        region = "us-east-1"
+
+    return _get_region_prefix(region) + model_id
+
 
 class BedrockInferenceAdapter(
     ModelRegistryHelper,
@@ -166,8 +203,13 @@ class BedrockInferenceAdapter(
             options["repetition_penalty"] = sampling_params.repetition_penalty
 
         prompt = await chat_completion_request_to_prompt(request, self.get_llama_model(request.model))
+
+        # Convert foundation model ID to inference profile ID
+        region_name = self.client.meta.region_name
+        inference_profile_id = _to_inference_profile_id(bedrock_model, region_name)
+
         return {
-            "modelId": bedrock_model,
+            "modelId": inference_profile_id,
             "body": json.dumps(
                 {
                     "prompt": prompt,
@@ -185,6 +227,11 @@ class BedrockInferenceAdapter(
         task_type: EmbeddingTaskType | None = None,
     ) -> EmbeddingsResponse:
         model = await self.model_store.get_model(model_id)
+
+        # Convert foundation model ID to inference profile ID
+        region_name = self.client.meta.region_name
+        inference_profile_id = _to_inference_profile_id(model.provider_resource_id, region_name)
+
         embeddings = []
         for content in contents:
             assert not content_has_media(content), "Bedrock does not support media for embeddings"
@@ -193,7 +240,7 @@ class BedrockInferenceAdapter(
             body = json.dumps(input_body)
             response = self.client.invoke_model(
                 body=body,
-                modelId=model.provider_resource_id,
+                modelId=inference_profile_id,
                 accept="application/json",
                 contentType="application/json",
             )
diff --git a/tests/unit/providers/test_bedrock.py b/tests/unit/providers/test_bedrock.py
new file mode 100644
index 000000000..1ff07bbbe
--- /dev/null
+++ b/tests/unit/providers/test_bedrock.py
@@ -0,0 +1,53 @@
+# Copyright (c) Meta Platforms, Inc. and affiliates.
+# All rights reserved.
+#
+# This source code is licensed under the terms described in the LICENSE file in
+# the root directory of this source tree.
+
+from llama_stack.providers.remote.inference.bedrock.bedrock import (
+    _get_region_prefix,
+    _to_inference_profile_id,
+)
+
+
+def test_region_prefixes():
+    assert _get_region_prefix("us-east-1") == "us."
+    assert _get_region_prefix("eu-west-1") == "eu."
+    assert _get_region_prefix("ap-south-1") == "ap."
+    assert _get_region_prefix("ca-central-1") == "us."
+
+    # Test case insensitive
+    assert _get_region_prefix("US-EAST-1") == "us."
+    assert _get_region_prefix("EU-WEST-1") == "eu."
+    assert _get_region_prefix("Ap-South-1") == "ap."
+
+    # Test None region
+    assert _get_region_prefix(None) == "us."
+
+
+def test_model_id_conversion():
+    # Basic conversion
+    assert (
+        _to_inference_profile_id("meta.llama3-1-70b-instruct-v1:0", "us-east-1") == "us.meta.llama3-1-70b-instruct-v1:0"
+    )
+
+    # Already has prefix
+    assert (
+        _to_inference_profile_id("us.meta.llama3-1-70b-instruct-v1:0", "us-east-1")
+        == "us.meta.llama3-1-70b-instruct-v1:0"
+    )
+
+    # ARN should be returned unchanged
+    arn = "arn:aws:bedrock:us-east-1:123456789012:inference-profile/us.meta.llama3-1-70b-instruct-v1:0"
+    assert _to_inference_profile_id(arn, "us-east-1") == arn
+
+    # ARN should be returned unchanged even without region
+    assert _to_inference_profile_id(arn) == arn
+
+    # Optional region parameter defaults to us-east-1
+    assert _to_inference_profile_id("meta.llama3-1-70b-instruct-v1:0") == "us.meta.llama3-1-70b-instruct-v1:0"
+
+    # Different regions work with optional parameter
+    assert (
+        _to_inference_profile_id("meta.llama3-1-70b-instruct-v1:0", "eu-west-1") == "eu.meta.llama3-1-70b-instruct-v1:0"
+    )

From c2d281e01b360ba0a2db177b90df6e7ba4df8501 Mon Sep 17 00:00:00 2001
From: Matthew Farrellee <matt@cs.wisc.edu>
Date: Thu, 11 Sep 2025 07:48:19 -0400
Subject: [PATCH 72/76] chore(replay): improve replay robustness with
 un-validated construction (#3414)

# What does this PR do?

some providers do not produce spec compliant outputs. when this happens
the replay infra will fail to construct the proper types and will return
a dict to the client. the client likely does not expect a dict.

this was discovered with tgi, which returns finish_reason="" when valid
values are "stop", "length" or "content_filter"

## Test Plan

ci
---
 llama_stack/testing/inference_recorder.py | 8 ++++++--
 1 file changed, 6 insertions(+), 2 deletions(-)

diff --git a/llama_stack/testing/inference_recorder.py b/llama_stack/testing/inference_recorder.py
index 298758c92..e78f493a6 100644
--- a/llama_stack/testing/inference_recorder.py
+++ b/llama_stack/testing/inference_recorder.py
@@ -105,8 +105,12 @@ def _deserialize_response(data: dict[str, Any]) -> Any:
 
             return cls.model_validate(data["__data__"])
         except (ImportError, AttributeError, TypeError, ValueError) as e:
-            logger.warning(f"Failed to deserialize object of type {data['__type__']}: {e}")
-            return data["__data__"]
+            logger.warning(f"Failed to deserialize object of type {data['__type__']} with model_validate: {e}")
+            try:
+                return cls.model_construct(**data["__data__"])
+            except Exception as e:
+                logger.warning(f"Failed to deserialize object of type {data['__type__']} with model_construct: {e}")
+                return data["__data__"]
 
     return data
 

From f31bcc11bc9e4a88ce82dadafea8d4b0cb5f7230 Mon Sep 17 00:00:00 2001
From: =?UTF-8?q?S=C3=A9bastien=20Han?= <seb@redhat.com>
Date: Thu, 11 Sep 2025 13:48:38 +0200
Subject: [PATCH 73/76] feat: add Azure OpenAI inference provider support
 (#3396)
MIME-Version: 1.0
Content-Type: text/plain; charset=UTF-8
Content-Transfer-Encoding: 8bit

# What does this PR do?

Llama-stack now supports a new OpenAI compatible endpoint with Azure
OpenAI. The starter distro has been updated to add the new remote
inference provider.

A few tests have been modified and improved.

## Test Plan

Deploy a model in the Aure portal then:

```
$ AZURE_API_KEY=... AZURE_API_BASE=... uv run llama stack build --image-type venv --providers inference=remote::azure --run
...
$ LLAMA_STACK_CONFIG=http://localhost:8321 uv run --group test pytest -v -ra --text-model azure/gpt-4.1 tests/integration/inference/test_openai_completion.py
...

Results:

```
============================================= test session starts
============================================== platform darwin -- Python
3.12.8, pytest-8.4.1, pluggy-1.6.0 --
/Users/leseb/Documents/AI/llama-stack/.venv/bin/python3 cachedir:
.pytest_cache
metadata: {'Python': '3.12.8', 'Platform':
'macOS-15.6.1-arm64-arm-64bit', 'Packages': {'pytest': '8.4.1',
'pluggy': '1.6.0'}, 'Plugins': {'anyio': '4.9.0', 'html': '4.1.1',
'socket': '0.7.0', 'asyncio': '1.1.0', 'json-report': '1.5.0',
'timeout': '2.4.0', 'metadata': '3.1.1', 'cov': '6.2.1', 'nbval':
'0.11.0', 'hydra-core': '1.3.2'}} rootdir:
/Users/leseb/Documents/AI/llama-stack
configfile: pyproject.toml
plugins: anyio-4.9.0, html-4.1.1, socket-0.7.0, asyncio-1.1.0,
json-report-1.5.0, timeout-2.4.0, metadata-3.1.1, cov-6.2.1,
nbval-0.11.0, hydra-core-1.3.2 asyncio: mode=Mode.AUTO,
asyncio_default_fixture_loop_scope=None,
asyncio_default_test_loop_scope=function collected 27 items


tests/integration/inference/test_openai_completion.py::test_openai_completion_non_streaming[txt=azure/gpt-5-mini-inference:completion:sanity]
SKIPPED [ 3%]
tests/integration/inference/test_openai_completion.py::test_openai_completion_non_streaming_suffix[txt=azure/gpt-5-mini-inference:completion:suffix]
SKIPPED [ 7%]
tests/integration/inference/test_openai_completion.py::test_openai_completion_streaming[txt=azure/gpt-5-mini-inference:completion:sanity]
SKIPPED [ 11%]
tests/integration/inference/test_openai_completion.py::test_openai_completion_prompt_logprobs[txt=azure/gpt-5-mini-1]
SKIPPED [ 14%]
tests/integration/inference/test_openai_completion.py::test_openai_completion_guided_choice[txt=azure/gpt-5-mini]
SKIPPED [ 18%]
tests/integration/inference/test_openai_completion.py::test_openai_chat_completion_non_streaming[openai_client-txt=azure/gpt-5-mini-inference:chat_completion:non_streaming_01]
PASSED [ 22%]
tests/integration/inference/test_openai_completion.py::test_openai_chat_completion_streaming[openai_client-txt=azure/gpt-5-mini-inference:chat_completion:streaming_01]
PASSED [ 25%]
tests/integration/inference/test_openai_completion.py::test_openai_chat_completion_streaming_with_n[openai_client-txt=azure/gpt-5-mini-inference:chat_completion:streaming_01]
PASSED [ 29%]
tests/integration/inference/test_openai_completion.py::test_inference_store[openai_client-txt=azure/gpt-5-mini-True]
PASSED [ 33%]
tests/integration/inference/test_openai_completion.py::test_inference_store_tool_calls[openai_client-txt=azure/gpt-5-mini-True]
PASSED [ 37%]
tests/integration/inference/test_openai_completion.py::test_openai_chat_completion_non_streaming_with_file[txt=azure/gpt-5-mini]
SKIPPEDed files.) [ 40%]
tests/integration/inference/test_openai_completion.py::test_openai_completion_prompt_logprobs[txt=azure/gpt-5-mini-0]
SKIPPED [ 44%]
tests/integration/inference/test_openai_completion.py::test_openai_chat_completion_non_streaming[openai_client-txt=azure/gpt-5-mini-inference:chat_completion:non_streaming_02]
PASSED [ 48%]
tests/integration/inference/test_openai_completion.py::test_openai_chat_completion_streaming[openai_client-txt=azure/gpt-5-mini-inference:chat_completion:streaming_02]
PASSED [ 51%]
tests/integration/inference/test_openai_completion.py::test_openai_chat_completion_streaming_with_n[openai_client-txt=azure/gpt-5-mini-inference:chat_completion:streaming_02]
PASSED [ 55%]
tests/integration/inference/test_openai_completion.py::test_inference_store[openai_client-txt=azure/gpt-5-mini-False]
PASSED [ 59%]
tests/integration/inference/test_openai_completion.py::test_inference_store_tool_calls[openai_client-txt=azure/gpt-5-mini-False]
PASSED [ 62%]
tests/integration/inference/test_openai_completion.py::test_openai_chat_completion_non_streaming[client_with_models-txt=azure/gpt-5-mini-inference:chat_completion:non_streaming_01]
PASSED [ 66%]
tests/integration/inference/test_openai_completion.py::test_openai_chat_completion_streaming[client_with_models-txt=azure/gpt-5-mini-inference:chat_completion:streaming_01]
PASSED [ 70%]
tests/integration/inference/test_openai_completion.py::test_openai_chat_completion_streaming_with_n[client_with_models-txt=azure/gpt-5-mini-inference:chat_completion:streaming_01]
PASSED [ 74%]
tests/integration/inference/test_openai_completion.py::test_inference_store[client_with_models-txt=azure/gpt-5-mini-True]
PASSED [ 77%]
tests/integration/inference/test_openai_completion.py::test_inference_store_tool_calls[client_with_models-txt=azure/gpt-5-mini-True]
PASSED [ 81%]
tests/integration/inference/test_openai_completion.py::test_openai_chat_completion_non_streaming[client_with_models-txt=azure/gpt-5-mini-inference:chat_completion:non_streaming_02]
PASSED [ 85%]
tests/integration/inference/test_openai_completion.py::test_openai_chat_completion_streaming[client_with_models-txt=azure/gpt-5-mini-inference:chat_completion:streaming_02]
PASSED [ 88%]
tests/integration/inference/test_openai_completion.py::test_openai_chat_completion_streaming_with_n[client_with_models-txt=azure/gpt-5-mini-inference:chat_completion:streaming_02]
PASSED [ 92%]
tests/integration/inference/test_openai_completion.py::test_inference_store[client_with_models-txt=azure/gpt-5-mini-False]
PASSED [ 96%]
tests/integration/inference/test_openai_completion.py::test_inference_store_tool_calls[client_with_models-txt=azure/gpt-5-mini-False]
PASSED [100%]

=========================================== short test summary info
============================================ SKIPPED [3]
tests/integration/inference/test_openai_completion.py:63: Model
azure/gpt-5-mini hosted by remote::azure doesn't support OpenAI
completions. SKIPPED [3]
tests/integration/inference/test_openai_completion.py:118: Model
azure/gpt-5-mini hosted by remote::azure doesn't support vllm extra_body
parameters. SKIPPED [1]
tests/integration/inference/test_openai_completion.py:124: Model
azure/gpt-5-mini hosted by remote::azure doesn't support chat completion
calls with base64 encoded files. ================================== 20
passed, 7 skipped, 2 warnings in 51.77s
==================================
```

Signed-off-by: Sébastien Han <seb@redhat.com>
---
 docs/source/providers/inference/index.md      |    1 +
 .../providers/inference/remote_azure.md       |   29 +
 llama_stack/distributions/ci-tests/build.yaml |    1 +
 llama_stack/distributions/ci-tests/run.yaml   |    7 +
 .../distributions/starter-gpu/build.yaml      |    1 +
 .../distributions/starter-gpu/run.yaml        |    7 +
 llama_stack/distributions/starter/build.yaml  |    1 +
 llama_stack/distributions/starter/run.yaml    |    7 +
 llama_stack/distributions/starter/starter.py  |   18 +
 llama_stack/providers/registry/inference.py   |   15 +
 .../remote/inference/azure/__init__.py        |   15 +
 .../providers/remote/inference/azure/azure.py |   64 +
 .../remote/inference/azure/config.py          |   63 +
 .../remote/inference/azure/models.py          |   28 +
 .../inference/test_openai_completion.py       |   53 +-
 .../inference/test_text_inference.py          |    3 +-
 .../recordings/responses/0fda25b9241c.json    |   71 +
 .../recordings/responses/2b2ad549510d.json    |  448 ++++
 .../recordings/responses/57b67d1b1a36.json    |   71 +
 .../recordings/responses/8752115f8d0c.json    |   71 +
 .../recordings/responses/94d11daee205.json    | 1178 +++++++++
 .../recordings/responses/9f3d749cc1c8.json    | 1150 +++++++++
 .../recordings/responses/c791119e6359.json    |   98 +
 .../recordings/responses/d3e27b7234e2.json    | 2150 +++++++++++++++++
 .../recordings/responses/fb785db7fafd.json    |  310 +++
 .../recordings/responses/ff3271401fb4.json    |  556 +++++
 26 files changed, 6403 insertions(+), 13 deletions(-)
 create mode 100644 docs/source/providers/inference/remote_azure.md
 create mode 100644 llama_stack/providers/remote/inference/azure/__init__.py
 create mode 100644 llama_stack/providers/remote/inference/azure/azure.py
 create mode 100644 llama_stack/providers/remote/inference/azure/config.py
 create mode 100644 llama_stack/providers/remote/inference/azure/models.py
 create mode 100644 tests/integration/recordings/responses/0fda25b9241c.json
 create mode 100644 tests/integration/recordings/responses/2b2ad549510d.json
 create mode 100644 tests/integration/recordings/responses/57b67d1b1a36.json
 create mode 100644 tests/integration/recordings/responses/8752115f8d0c.json
 create mode 100644 tests/integration/recordings/responses/94d11daee205.json
 create mode 100644 tests/integration/recordings/responses/9f3d749cc1c8.json
 create mode 100644 tests/integration/recordings/responses/c791119e6359.json
 create mode 100644 tests/integration/recordings/responses/d3e27b7234e2.json
 create mode 100644 tests/integration/recordings/responses/fb785db7fafd.json
 create mode 100644 tests/integration/recordings/responses/ff3271401fb4.json

diff --git a/docs/source/providers/inference/index.md b/docs/source/providers/inference/index.md
index b6d215474..c5720daef 100644
--- a/docs/source/providers/inference/index.md
+++ b/docs/source/providers/inference/index.md
@@ -18,6 +18,7 @@ This section contains documentation for all available providers for the **infere
 inline_meta-reference
 inline_sentence-transformers
 remote_anthropic
+remote_azure
 remote_bedrock
 remote_cerebras
 remote_databricks
diff --git a/docs/source/providers/inference/remote_azure.md b/docs/source/providers/inference/remote_azure.md
new file mode 100644
index 000000000..19f8f418b
--- /dev/null
+++ b/docs/source/providers/inference/remote_azure.md
@@ -0,0 +1,29 @@
+# remote::azure
+
+## Description
+
+
+Azure OpenAI inference provider for accessing GPT models and other Azure services.
+Provider documentation
+https://learn.microsoft.com/en-us/azure/ai-foundry/openai/overview
+
+
+## Configuration
+
+| Field | Type | Required | Default | Description |
+|-------|------|----------|---------|-------------|
+| `api_key` | `<class 'pydantic.types.SecretStr'>` | No |  | Azure API key for Azure |
+| `api_base` | `<class 'pydantic.networks.HttpUrl'>` | No |  | Azure API base for Azure (e.g., https://your-resource-name.openai.azure.com) |
+| `api_version` | `str \| None` | No |  | Azure API version for Azure (e.g., 2024-12-01-preview) |
+| `api_type` | `str \| None` | No | azure | Azure API type for Azure (e.g., azure) |
+
+## Sample Configuration
+
+```yaml
+api_key: ${env.AZURE_API_KEY:=}
+api_base: ${env.AZURE_API_BASE:=}
+api_version: ${env.AZURE_API_VERSION:=}
+api_type: ${env.AZURE_API_TYPE:=}
+
+```
+
diff --git a/llama_stack/distributions/ci-tests/build.yaml b/llama_stack/distributions/ci-tests/build.yaml
index 8e6c0bf67..a4d920cd6 100644
--- a/llama_stack/distributions/ci-tests/build.yaml
+++ b/llama_stack/distributions/ci-tests/build.yaml
@@ -17,6 +17,7 @@ distribution_spec:
     - provider_type: remote::vertexai
     - provider_type: remote::groq
     - provider_type: remote::sambanova
+    - provider_type: remote::azure
     - provider_type: inline::sentence-transformers
     vector_io:
     - provider_type: inline::faiss
diff --git a/llama_stack/distributions/ci-tests/run.yaml b/llama_stack/distributions/ci-tests/run.yaml
index 26a677c7a..a478a3872 100644
--- a/llama_stack/distributions/ci-tests/run.yaml
+++ b/llama_stack/distributions/ci-tests/run.yaml
@@ -81,6 +81,13 @@ providers:
     config:
       url: https://api.sambanova.ai/v1
       api_key: ${env.SAMBANOVA_API_KEY:=}
+  - provider_id: ${env.AZURE_API_KEY:+azure}
+    provider_type: remote::azure
+    config:
+      api_key: ${env.AZURE_API_KEY:=}
+      api_base: ${env.AZURE_API_BASE:=}
+      api_version: ${env.AZURE_API_VERSION:=}
+      api_type: ${env.AZURE_API_TYPE:=}
   - provider_id: sentence-transformers
     provider_type: inline::sentence-transformers
   vector_io:
diff --git a/llama_stack/distributions/starter-gpu/build.yaml b/llama_stack/distributions/starter-gpu/build.yaml
index ff7c58e6f..05a2bf180 100644
--- a/llama_stack/distributions/starter-gpu/build.yaml
+++ b/llama_stack/distributions/starter-gpu/build.yaml
@@ -18,6 +18,7 @@ distribution_spec:
     - provider_type: remote::vertexai
     - provider_type: remote::groq
     - provider_type: remote::sambanova
+    - provider_type: remote::azure
     - provider_type: inline::sentence-transformers
     vector_io:
     - provider_type: inline::faiss
diff --git a/llama_stack/distributions/starter-gpu/run.yaml b/llama_stack/distributions/starter-gpu/run.yaml
index 5d9dfcb27..786506706 100644
--- a/llama_stack/distributions/starter-gpu/run.yaml
+++ b/llama_stack/distributions/starter-gpu/run.yaml
@@ -81,6 +81,13 @@ providers:
     config:
       url: https://api.sambanova.ai/v1
       api_key: ${env.SAMBANOVA_API_KEY:=}
+  - provider_id: ${env.AZURE_API_KEY:+azure}
+    provider_type: remote::azure
+    config:
+      api_key: ${env.AZURE_API_KEY:=}
+      api_base: ${env.AZURE_API_BASE:=}
+      api_version: ${env.AZURE_API_VERSION:=}
+      api_type: ${env.AZURE_API_TYPE:=}
   - provider_id: sentence-transformers
     provider_type: inline::sentence-transformers
   vector_io:
diff --git a/llama_stack/distributions/starter/build.yaml b/llama_stack/distributions/starter/build.yaml
index e84e528da..2f0cd24fd 100644
--- a/llama_stack/distributions/starter/build.yaml
+++ b/llama_stack/distributions/starter/build.yaml
@@ -18,6 +18,7 @@ distribution_spec:
     - provider_type: remote::vertexai
     - provider_type: remote::groq
     - provider_type: remote::sambanova
+    - provider_type: remote::azure
     - provider_type: inline::sentence-transformers
     vector_io:
     - provider_type: inline::faiss
diff --git a/llama_stack/distributions/starter/run.yaml b/llama_stack/distributions/starter/run.yaml
index a3962b8aa..2814b2ced 100644
--- a/llama_stack/distributions/starter/run.yaml
+++ b/llama_stack/distributions/starter/run.yaml
@@ -81,6 +81,13 @@ providers:
     config:
       url: https://api.sambanova.ai/v1
       api_key: ${env.SAMBANOVA_API_KEY:=}
+  - provider_id: ${env.AZURE_API_KEY:+azure}
+    provider_type: remote::azure
+    config:
+      api_key: ${env.AZURE_API_KEY:=}
+      api_base: ${env.AZURE_API_BASE:=}
+      api_version: ${env.AZURE_API_VERSION:=}
+      api_type: ${env.AZURE_API_TYPE:=}
   - provider_id: sentence-transformers
     provider_type: inline::sentence-transformers
   vector_io:
diff --git a/llama_stack/distributions/starter/starter.py b/llama_stack/distributions/starter/starter.py
index 2fca52700..c2dfe95ad 100644
--- a/llama_stack/distributions/starter/starter.py
+++ b/llama_stack/distributions/starter/starter.py
@@ -59,6 +59,7 @@ ENABLED_INFERENCE_PROVIDERS = [
     "cerebras",
     "nvidia",
     "bedrock",
+    "azure",
 ]
 
 INFERENCE_PROVIDER_IDS = {
@@ -68,6 +69,7 @@ INFERENCE_PROVIDER_IDS = {
     "cerebras": "${env.CEREBRAS_API_KEY:+cerebras}",
     "nvidia": "${env.NVIDIA_API_KEY:+nvidia}",
     "vertexai": "${env.VERTEX_AI_PROJECT:+vertexai}",
+    "azure": "${env.AZURE_API_KEY:+azure}",
 }
 
 
@@ -277,5 +279,21 @@ def get_distribution_template(name: str = "starter") -> DistributionTemplate:
                 "http://localhost:11434",
                 "Ollama URL",
             ),
+            "AZURE_API_KEY": (
+                "",
+                "Azure API Key",
+            ),
+            "AZURE_API_BASE": (
+                "",
+                "Azure API Base",
+            ),
+            "AZURE_API_VERSION": (
+                "",
+                "Azure API Version",
+            ),
+            "AZURE_API_TYPE": (
+                "azure",
+                "Azure API Type",
+            ),
         },
     )
diff --git a/llama_stack/providers/registry/inference.py b/llama_stack/providers/registry/inference.py
index 8912560cb..64196152b 100644
--- a/llama_stack/providers/registry/inference.py
+++ b/llama_stack/providers/registry/inference.py
@@ -295,4 +295,19 @@ Available Models:
                 description="IBM WatsonX inference provider for accessing AI models on IBM's WatsonX platform.",
             ),
         ),
+        remote_provider_spec(
+            api=Api.inference,
+            adapter=AdapterSpec(
+                adapter_type="azure",
+                pip_packages=["litellm"],
+                module="llama_stack.providers.remote.inference.azure",
+                config_class="llama_stack.providers.remote.inference.azure.AzureConfig",
+                provider_data_validator="llama_stack.providers.remote.inference.azure.config.AzureProviderDataValidator",
+                description="""
+Azure OpenAI inference provider for accessing GPT models and other Azure services.
+Provider documentation
+https://learn.microsoft.com/en-us/azure/ai-foundry/openai/overview
+""",
+            ),
+        ),
     ]
diff --git a/llama_stack/providers/remote/inference/azure/__init__.py b/llama_stack/providers/remote/inference/azure/__init__.py
new file mode 100644
index 000000000..87bcaf309
--- /dev/null
+++ b/llama_stack/providers/remote/inference/azure/__init__.py
@@ -0,0 +1,15 @@
+# Copyright (c) Meta Platforms, Inc. and affiliates.
+# All rights reserved.
+#
+# This source code is licensed under the terms described in the LICENSE file in
+# the root directory of this source tree.
+
+from .config import AzureConfig
+
+
+async def get_adapter_impl(config: AzureConfig, _deps):
+    from .azure import AzureInferenceAdapter
+
+    impl = AzureInferenceAdapter(config)
+    await impl.initialize()
+    return impl
diff --git a/llama_stack/providers/remote/inference/azure/azure.py b/llama_stack/providers/remote/inference/azure/azure.py
new file mode 100644
index 000000000..449bbbb1c
--- /dev/null
+++ b/llama_stack/providers/remote/inference/azure/azure.py
@@ -0,0 +1,64 @@
+# Copyright (c) Meta Platforms, Inc. and affiliates.
+# All rights reserved.
+#
+# This source code is licensed under the terms described in the LICENSE file in
+# the root directory of this source tree.
+
+from typing import Any
+from urllib.parse import urljoin
+
+from llama_stack.apis.inference import ChatCompletionRequest
+from llama_stack.providers.utils.inference.litellm_openai_mixin import (
+    LiteLLMOpenAIMixin,
+)
+from llama_stack.providers.utils.inference.openai_mixin import OpenAIMixin
+
+from .config import AzureConfig
+from .models import MODEL_ENTRIES
+
+
+class AzureInferenceAdapter(OpenAIMixin, LiteLLMOpenAIMixin):
+    def __init__(self, config: AzureConfig) -> None:
+        LiteLLMOpenAIMixin.__init__(
+            self,
+            MODEL_ENTRIES,
+            litellm_provider_name="azure",
+            api_key_from_config=config.api_key.get_secret_value(),
+            provider_data_api_key_field="azure_api_key",
+            openai_compat_api_base=str(config.api_base),
+        )
+        self.config = config
+
+    # Delegate the client data handling get_api_key method to LiteLLMOpenAIMixin
+    get_api_key = LiteLLMOpenAIMixin.get_api_key
+
+    def get_base_url(self) -> str:
+        """
+        Get the Azure API base URL.
+
+        Returns the Azure API base URL from the configuration.
+        """
+        return urljoin(str(self.config.api_base), "/openai/v1")
+
+    async def _get_params(self, request: ChatCompletionRequest) -> dict[str, Any]:
+        # Get base parameters from parent
+        params = await super()._get_params(request)
+
+        # Add Azure specific parameters
+        provider_data = self.get_request_provider_data()
+        if provider_data:
+            if getattr(provider_data, "azure_api_key", None):
+                params["api_key"] = provider_data.azure_api_key
+            if getattr(provider_data, "azure_api_base", None):
+                params["api_base"] = provider_data.azure_api_base
+            if getattr(provider_data, "azure_api_version", None):
+                params["api_version"] = provider_data.azure_api_version
+            if getattr(provider_data, "azure_api_type", None):
+                params["api_type"] = provider_data.azure_api_type
+        else:
+            params["api_key"] = self.config.api_key.get_secret_value()
+            params["api_base"] = str(self.config.api_base)
+            params["api_version"] = self.config.api_version
+            params["api_type"] = self.config.api_type
+
+        return params
diff --git a/llama_stack/providers/remote/inference/azure/config.py b/llama_stack/providers/remote/inference/azure/config.py
new file mode 100644
index 000000000..fe9d61d53
--- /dev/null
+++ b/llama_stack/providers/remote/inference/azure/config.py
@@ -0,0 +1,63 @@
+# Copyright (c) Meta Platforms, Inc. and affiliates.
+# All rights reserved.
+#
+# This source code is licensed under the terms described in the LICENSE file in
+# the root directory of this source tree.
+
+import os
+from typing import Any
+
+from pydantic import BaseModel, Field, HttpUrl, SecretStr
+
+from llama_stack.schema_utils import json_schema_type
+
+
+class AzureProviderDataValidator(BaseModel):
+    azure_api_key: SecretStr = Field(
+        description="Azure API key for Azure",
+    )
+    azure_api_base: HttpUrl = Field(
+        description="Azure API base for Azure (e.g., https://your-resource-name.openai.azure.com)",
+    )
+    azure_api_version: str | None = Field(
+        default=None,
+        description="Azure API version for Azure (e.g., 2024-06-01)",
+    )
+    azure_api_type: str | None = Field(
+        default="azure",
+        description="Azure API type for Azure (e.g., azure)",
+    )
+
+
+@json_schema_type
+class AzureConfig(BaseModel):
+    api_key: SecretStr = Field(
+        description="Azure API key for Azure",
+    )
+    api_base: HttpUrl = Field(
+        description="Azure API base for Azure (e.g., https://your-resource-name.openai.azure.com)",
+    )
+    api_version: str | None = Field(
+        default_factory=lambda: os.getenv("AZURE_API_VERSION"),
+        description="Azure API version for Azure (e.g., 2024-12-01-preview)",
+    )
+    api_type: str | None = Field(
+        default_factory=lambda: os.getenv("AZURE_API_TYPE", "azure"),
+        description="Azure API type for Azure (e.g., azure)",
+    )
+
+    @classmethod
+    def sample_run_config(
+        cls,
+        api_key: str = "${env.AZURE_API_KEY:=}",
+        api_base: str = "${env.AZURE_API_BASE:=}",
+        api_version: str = "${env.AZURE_API_VERSION:=}",
+        api_type: str = "${env.AZURE_API_TYPE:=}",
+        **kwargs,
+    ) -> dict[str, Any]:
+        return {
+            "api_key": api_key,
+            "api_base": api_base,
+            "api_version": api_version,
+            "api_type": api_type,
+        }
diff --git a/llama_stack/providers/remote/inference/azure/models.py b/llama_stack/providers/remote/inference/azure/models.py
new file mode 100644
index 000000000..64c87969b
--- /dev/null
+++ b/llama_stack/providers/remote/inference/azure/models.py
@@ -0,0 +1,28 @@
+# Copyright (c) Meta Platforms, Inc. and affiliates.
+# All rights reserved.
+#
+# This source code is licensed under the terms described in the LICENSE file in
+# the root directory of this source tree.
+
+from llama_stack.providers.utils.inference.model_registry import (
+    ProviderModelEntry,
+)
+
+# https://learn.microsoft.com/en-us/azure/ai-foundry/openai/concepts/models?tabs=global-standard%2Cstandard-chat-completions
+LLM_MODEL_IDS = [
+    "gpt-5",
+    "gpt-5-mini",
+    "gpt-5-nano",
+    "gpt-5-chat",
+    "o1",
+    "o1-mini",
+    "o3-mini",
+    "o4-mini",
+    "gpt-4.1",
+    "gpt-4.1-mini",
+    "gpt-4.1-nano",
+]
+
+SAFETY_MODELS_ENTRIES = list[ProviderModelEntry]()
+
+MODEL_ENTRIES = [ProviderModelEntry(provider_model_id=m) for m in LLM_MODEL_IDS] + SAFETY_MODELS_ENTRIES
diff --git a/tests/integration/inference/test_openai_completion.py b/tests/integration/inference/test_openai_completion.py
index f9c837ebd..22dec8876 100644
--- a/tests/integration/inference/test_openai_completion.py
+++ b/tests/integration/inference/test_openai_completion.py
@@ -6,12 +6,25 @@
 
 
 import time
+import unicodedata
 
 import pytest
 
 from ..test_cases.test_case import TestCase
 
 
+def _normalize_text(text: str) -> str:
+    """
+    Normalize Unicode text by removing diacritical marks for comparison.
+
+    The test case streaming_01 expects the answer "Sol" for the question "What's the name of the Sun
+    in latin?", but the model is returning "sōl" (with a macron over the 'o'), which is the correct
+    Latin spelling. The test is failing because it's doing a simple case-insensitive string search
+    for "sol" but the actual response contains the diacritical mark.
+    """
+    return unicodedata.normalize("NFD", text).encode("ascii", "ignore").decode("ascii").lower()
+
+
 def provider_from_model(client_with_models, model_id):
     models = {m.identifier: m for m in client_with_models.models.list()}
     models.update({m.provider_resource_id: m for m in client_with_models.models.list()})
@@ -42,6 +55,10 @@ def skip_if_model_doesnt_support_openai_completion(client_with_models, model_id)
         "remote::groq",
         "remote::gemini",  # https://generativelanguage.googleapis.com/v1beta/openai/completions -> 404
         "remote::anthropic",  # at least claude-3-{5,7}-{haiku,sonnet}-* / claude-{sonnet,opus}-4-* are not supported
+        "remote::azure",  # {'error': {'code': 'OperationNotSupported', 'message': 'The completion operation
+        #  does not work with the specified model, gpt-5-mini. Please choose different model and try
+        #  again. You can learn more about which models can be used with each operation here:
+        #  https://go.microsoft.com/fwlink/?linkid=2197993.'}}"}
     ):
         pytest.skip(f"Model {model_id} hosted by {provider.provider_type} doesn't support OpenAI completions.")
 
@@ -157,7 +174,8 @@ def test_openai_completion_non_streaming_suffix(llama_stack_client, client_with_
     assert len(response.choices) > 0
     choice = response.choices[0]
     assert len(choice.text) > 5
-    assert "france" in choice.text.lower()
+    normalized_text = _normalize_text(choice.text)
+    assert "france" in normalized_text
 
 
 @pytest.mark.parametrize(
@@ -248,7 +266,9 @@ def test_openai_chat_completion_non_streaming(compat_client, client_with_models,
     )
     message_content = response.choices[0].message.content.lower().strip()
     assert len(message_content) > 0
-    assert expected.lower() in message_content
+    normalized_expected = _normalize_text(expected)
+    normalized_content = _normalize_text(message_content)
+    assert normalized_expected in normalized_content
 
 
 @pytest.mark.parametrize(
@@ -272,10 +292,13 @@ def test_openai_chat_completion_streaming(compat_client, client_with_models, tex
     )
     streamed_content = []
     for chunk in response:
-        if chunk.choices[0].delta.content:
+        # On some providers like Azure, the choices are empty on the first chunk, so we need to check for that
+        if chunk.choices and len(chunk.choices) > 0 and chunk.choices[0].delta.content:
             streamed_content.append(chunk.choices[0].delta.content.lower().strip())
     assert len(streamed_content) > 0
-    assert expected.lower() in "".join(streamed_content)
+    normalized_expected = _normalize_text(expected)
+    normalized_content = _normalize_text("".join(streamed_content))
+    assert normalized_expected in normalized_content
 
 
 @pytest.mark.parametrize(
@@ -308,8 +331,12 @@ def test_openai_chat_completion_streaming_with_n(compat_client, client_with_mode
                     streamed_content.get(choice.index, "") + choice.delta.content.lower().strip()
                 )
     assert len(streamed_content) == 2
+    normalized_expected = _normalize_text(expected)
     for i, content in streamed_content.items():
-        assert expected.lower() in content, f"Choice {i}: Expected {expected.lower()} in {content}"
+        normalized_content = _normalize_text(content)
+        assert normalized_expected in normalized_content, (
+            f"Choice {i}: Expected {normalized_expected} in {normalized_content}"
+        )
 
 
 @pytest.mark.parametrize(
@@ -339,9 +366,9 @@ def test_inference_store(compat_client, client_with_models, text_model_id, strea
         content = ""
         response_id = None
         for chunk in response:
-            if response_id is None:
+            if response_id is None and chunk.id:
                 response_id = chunk.id
-            if chunk.choices[0].delta.content:
+            if chunk.choices and len(chunk.choices) > 0 and chunk.choices[0].delta.content:
                 content += chunk.choices[0].delta.content
     else:
         response_id = response.id
@@ -410,11 +437,12 @@ def test_inference_store_tool_calls(compat_client, client_with_models, text_mode
         content = ""
         response_id = None
         for chunk in response:
-            if response_id is None:
+            if response_id is None and chunk.id:
                 response_id = chunk.id
-            if delta := chunk.choices[0].delta:
-                if delta.content:
-                    content += delta.content
+            if chunk.choices and len(chunk.choices) > 0:
+                if delta := chunk.choices[0].delta:
+                    if delta.content:
+                        content += delta.content
     else:
         response_id = response.id
         content = response.choices[0].message.content
@@ -484,4 +512,5 @@ def test_openai_chat_completion_non_streaming_with_file(openai_client, client_wi
         stream=False,
     )
     message_content = response.choices[0].message.content.lower().strip()
-    assert "hello world" in message_content
+    normalized_content = _normalize_text(message_content)
+    assert "hello world" in normalized_content
diff --git a/tests/integration/inference/test_text_inference.py b/tests/integration/inference/test_text_inference.py
index d7ffe5929..621084231 100644
--- a/tests/integration/inference/test_text_inference.py
+++ b/tests/integration/inference/test_text_inference.py
@@ -32,6 +32,7 @@ def skip_if_model_doesnt_support_completion(client_with_models, model_id):
             "remote::vertexai",
             "remote::groq",
             "remote::sambanova",
+            "remote::azure",
         )
         or "openai-compat" in provider.provider_type
     ):
@@ -44,7 +45,7 @@ def skip_if_model_doesnt_support_json_schema_structured_output(client_with_model
     provider_id = models[model_id].provider_id
     providers = {p.provider_id: p for p in client_with_models.providers.list()}
     provider = providers[provider_id]
-    if provider.provider_type in ("remote::sambanova",):
+    if provider.provider_type in ("remote::sambanova", "remote::azure"):
         pytest.skip(
             f"Model {model_id} hosted by {provider.provider_type} doesn't support json_schema structured output"
         )
diff --git a/tests/integration/recordings/responses/0fda25b9241c.json b/tests/integration/recordings/responses/0fda25b9241c.json
new file mode 100644
index 000000000..b97ee1670
--- /dev/null
+++ b/tests/integration/recordings/responses/0fda25b9241c.json
@@ -0,0 +1,71 @@
+{
+  "request": {
+    "method": "POST",
+    "url": "https://shan-mfbb618r-eastus2.cognitiveservices.azure.com/openai/v1/v1/chat/completions",
+    "headers": {},
+    "body": {
+      "model": "gpt-5-mini",
+      "messages": [
+        {
+          "role": "user",
+          "content": "Which planet do humans live on?"
+        }
+      ],
+      "stream": false
+    },
+    "endpoint": "/v1/chat/completions",
+    "model": "gpt-5-mini"
+  },
+  "response": {
+    "body": {
+      "__type__": "openai.types.chat.chat_completion.ChatCompletion",
+      "__data__": {
+        "id": "chatcmpl-CECIXqfvjuluKkZtG3q2QJoSQhBU0",
+        "choices": [
+          {
+            "finish_reason": "stop",
+            "index": 0,
+            "logprobs": null,
+            "message": {
+              "content": "Humans live on Earth \u2014 the third planet from the Sun. It's the only known planet that naturally supports life, with a breathable atmosphere, liquid water, and temperatures suitable for living organisms.",
+              "refusal": null,
+              "role": "assistant",
+              "annotations": [],
+              "audio": null,
+              "function_call": null,
+              "tool_calls": null
+            },
+            "content_filter_results": {}
+          }
+        ],
+        "created": 1757499901,
+        "model": "gpt-5-mini-2025-08-07",
+        "object": "chat.completion",
+        "service_tier": null,
+        "system_fingerprint": null,
+        "usage": {
+          "completion_tokens": 112,
+          "prompt_tokens": 13,
+          "total_tokens": 125,
+          "completion_tokens_details": {
+            "accepted_prediction_tokens": 0,
+            "audio_tokens": 0,
+            "reasoning_tokens": 64,
+            "rejected_prediction_tokens": 0
+          },
+          "prompt_tokens_details": {
+            "audio_tokens": 0,
+            "cached_tokens": 0
+          }
+        },
+        "prompt_filter_results": [
+          {
+            "prompt_index": 0,
+            "content_filter_results": {}
+          }
+        ]
+      }
+    },
+    "is_streaming": false
+  }
+}
diff --git a/tests/integration/recordings/responses/2b2ad549510d.json b/tests/integration/recordings/responses/2b2ad549510d.json
new file mode 100644
index 000000000..55a9d6426
--- /dev/null
+++ b/tests/integration/recordings/responses/2b2ad549510d.json
@@ -0,0 +1,448 @@
+{
+  "request": {
+    "method": "POST",
+    "url": "https://shan-mfbb618r-eastus2.cognitiveservices.azure.com/openai/v1/v1/chat/completions",
+    "headers": {},
+    "body": {
+      "model": "gpt-5-mini",
+      "messages": [
+        {
+          "role": "user",
+          "content": "Hello, world!"
+        }
+      ],
+      "stream": true
+    },
+    "endpoint": "/v1/chat/completions",
+    "model": "gpt-5-mini"
+  },
+  "response": {
+    "body": [
+      {
+        "__type__": "openai.types.chat.chat_completion_chunk.ChatCompletionChunk",
+        "__data__": {
+          "id": "",
+          "choices": [],
+          "created": 0,
+          "model": "",
+          "object": "",
+          "service_tier": null,
+          "system_fingerprint": null,
+          "usage": null,
+          "prompt_filter_results": [
+            {
+              "prompt_index": 0,
+              "content_filter_results": {}
+            }
+          ]
+        }
+      },
+      {
+        "__type__": "openai.types.chat.chat_completion_chunk.ChatCompletionChunk",
+        "__data__": {
+          "id": "chatcmpl-CECIgeXOClAuSm8xHAS6CYQ87lB8O",
+          "choices": [
+            {
+              "delta": {
+                "content": "",
+                "function_call": null,
+                "refusal": null,
+                "role": "assistant",
+                "tool_calls": null
+              },
+              "finish_reason": null,
+              "index": 0,
+              "logprobs": null,
+              "content_filter_results": {}
+            }
+          ],
+          "created": 1757499910,
+          "model": "gpt-5-mini-2025-08-07",
+          "object": "chat.completion.chunk",
+          "service_tier": null,
+          "system_fingerprint": null,
+          "usage": null
+        }
+      },
+      {
+        "__type__": "openai.types.chat.chat_completion_chunk.ChatCompletionChunk",
+        "__data__": {
+          "id": "chatcmpl-CECIgeXOClAuSm8xHAS6CYQ87lB8O",
+          "choices": [
+            {
+              "delta": {
+                "content": "Hello",
+                "function_call": null,
+                "refusal": null,
+                "role": null,
+                "tool_calls": null
+              },
+              "finish_reason": null,
+              "index": 0,
+              "logprobs": null,
+              "content_filter_results": {}
+            }
+          ],
+          "created": 1757499910,
+          "model": "gpt-5-mini-2025-08-07",
+          "object": "chat.completion.chunk",
+          "service_tier": null,
+          "system_fingerprint": null,
+          "usage": null
+        }
+      },
+      {
+        "__type__": "openai.types.chat.chat_completion_chunk.ChatCompletionChunk",
+        "__data__": {
+          "id": "chatcmpl-CECIgeXOClAuSm8xHAS6CYQ87lB8O",
+          "choices": [
+            {
+              "delta": {
+                "content": ",",
+                "function_call": null,
+                "refusal": null,
+                "role": null,
+                "tool_calls": null
+              },
+              "finish_reason": null,
+              "index": 0,
+              "logprobs": null,
+              "content_filter_results": {}
+            }
+          ],
+          "created": 1757499910,
+          "model": "gpt-5-mini-2025-08-07",
+          "object": "chat.completion.chunk",
+          "service_tier": null,
+          "system_fingerprint": null,
+          "usage": null
+        }
+      },
+      {
+        "__type__": "openai.types.chat.chat_completion_chunk.ChatCompletionChunk",
+        "__data__": {
+          "id": "chatcmpl-CECIgeXOClAuSm8xHAS6CYQ87lB8O",
+          "choices": [
+            {
+              "delta": {
+                "content": " world",
+                "function_call": null,
+                "refusal": null,
+                "role": null,
+                "tool_calls": null
+              },
+              "finish_reason": null,
+              "index": 0,
+              "logprobs": null,
+              "content_filter_results": {}
+            }
+          ],
+          "created": 1757499910,
+          "model": "gpt-5-mini-2025-08-07",
+          "object": "chat.completion.chunk",
+          "service_tier": null,
+          "system_fingerprint": null,
+          "usage": null
+        }
+      },
+      {
+        "__type__": "openai.types.chat.chat_completion_chunk.ChatCompletionChunk",
+        "__data__": {
+          "id": "chatcmpl-CECIgeXOClAuSm8xHAS6CYQ87lB8O",
+          "choices": [
+            {
+              "delta": {
+                "content": "!",
+                "function_call": null,
+                "refusal": null,
+                "role": null,
+                "tool_calls": null
+              },
+              "finish_reason": null,
+              "index": 0,
+              "logprobs": null,
+              "content_filter_results": {}
+            }
+          ],
+          "created": 1757499910,
+          "model": "gpt-5-mini-2025-08-07",
+          "object": "chat.completion.chunk",
+          "service_tier": null,
+          "system_fingerprint": null,
+          "usage": null
+        }
+      },
+      {
+        "__type__": "openai.types.chat.chat_completion_chunk.ChatCompletionChunk",
+        "__data__": {
+          "id": "chatcmpl-CECIgeXOClAuSm8xHAS6CYQ87lB8O",
+          "choices": [
+            {
+              "delta": {
+                "content": " Hi",
+                "function_call": null,
+                "refusal": null,
+                "role": null,
+                "tool_calls": null
+              },
+              "finish_reason": null,
+              "index": 0,
+              "logprobs": null,
+              "content_filter_results": {}
+            }
+          ],
+          "created": 1757499910,
+          "model": "gpt-5-mini-2025-08-07",
+          "object": "chat.completion.chunk",
+          "service_tier": null,
+          "system_fingerprint": null,
+          "usage": null
+        }
+      },
+      {
+        "__type__": "openai.types.chat.chat_completion_chunk.ChatCompletionChunk",
+        "__data__": {
+          "id": "chatcmpl-CECIgeXOClAuSm8xHAS6CYQ87lB8O",
+          "choices": [
+            {
+              "delta": {
+                "content": " \u2014",
+                "function_call": null,
+                "refusal": null,
+                "role": null,
+                "tool_calls": null
+              },
+              "finish_reason": null,
+              "index": 0,
+              "logprobs": null,
+              "content_filter_results": {}
+            }
+          ],
+          "created": 1757499910,
+          "model": "gpt-5-mini-2025-08-07",
+          "object": "chat.completion.chunk",
+          "service_tier": null,
+          "system_fingerprint": null,
+          "usage": null
+        }
+      },
+      {
+        "__type__": "openai.types.chat.chat_completion_chunk.ChatCompletionChunk",
+        "__data__": {
+          "id": "chatcmpl-CECIgeXOClAuSm8xHAS6CYQ87lB8O",
+          "choices": [
+            {
+              "delta": {
+                "content": " how",
+                "function_call": null,
+                "refusal": null,
+                "role": null,
+                "tool_calls": null
+              },
+              "finish_reason": null,
+              "index": 0,
+              "logprobs": null,
+              "content_filter_results": {}
+            }
+          ],
+          "created": 1757499910,
+          "model": "gpt-5-mini-2025-08-07",
+          "object": "chat.completion.chunk",
+          "service_tier": null,
+          "system_fingerprint": null,
+          "usage": null
+        }
+      },
+      {
+        "__type__": "openai.types.chat.chat_completion_chunk.ChatCompletionChunk",
+        "__data__": {
+          "id": "chatcmpl-CECIgeXOClAuSm8xHAS6CYQ87lB8O",
+          "choices": [
+            {
+              "delta": {
+                "content": " can",
+                "function_call": null,
+                "refusal": null,
+                "role": null,
+                "tool_calls": null
+              },
+              "finish_reason": null,
+              "index": 0,
+              "logprobs": null,
+              "content_filter_results": {}
+            }
+          ],
+          "created": 1757499910,
+          "model": "gpt-5-mini-2025-08-07",
+          "object": "chat.completion.chunk",
+          "service_tier": null,
+          "system_fingerprint": null,
+          "usage": null
+        }
+      },
+      {
+        "__type__": "openai.types.chat.chat_completion_chunk.ChatCompletionChunk",
+        "__data__": {
+          "id": "chatcmpl-CECIgeXOClAuSm8xHAS6CYQ87lB8O",
+          "choices": [
+            {
+              "delta": {
+                "content": " I",
+                "function_call": null,
+                "refusal": null,
+                "role": null,
+                "tool_calls": null
+              },
+              "finish_reason": null,
+              "index": 0,
+              "logprobs": null,
+              "content_filter_results": {}
+            }
+          ],
+          "created": 1757499910,
+          "model": "gpt-5-mini-2025-08-07",
+          "object": "chat.completion.chunk",
+          "service_tier": null,
+          "system_fingerprint": null,
+          "usage": null
+        }
+      },
+      {
+        "__type__": "openai.types.chat.chat_completion_chunk.ChatCompletionChunk",
+        "__data__": {
+          "id": "chatcmpl-CECIgeXOClAuSm8xHAS6CYQ87lB8O",
+          "choices": [
+            {
+              "delta": {
+                "content": " help",
+                "function_call": null,
+                "refusal": null,
+                "role": null,
+                "tool_calls": null
+              },
+              "finish_reason": null,
+              "index": 0,
+              "logprobs": null,
+              "content_filter_results": {}
+            }
+          ],
+          "created": 1757499910,
+          "model": "gpt-5-mini-2025-08-07",
+          "object": "chat.completion.chunk",
+          "service_tier": null,
+          "system_fingerprint": null,
+          "usage": null
+        }
+      },
+      {
+        "__type__": "openai.types.chat.chat_completion_chunk.ChatCompletionChunk",
+        "__data__": {
+          "id": "chatcmpl-CECIgeXOClAuSm8xHAS6CYQ87lB8O",
+          "choices": [
+            {
+              "delta": {
+                "content": " you",
+                "function_call": null,
+                "refusal": null,
+                "role": null,
+                "tool_calls": null
+              },
+              "finish_reason": null,
+              "index": 0,
+              "logprobs": null,
+              "content_filter_results": {}
+            }
+          ],
+          "created": 1757499910,
+          "model": "gpt-5-mini-2025-08-07",
+          "object": "chat.completion.chunk",
+          "service_tier": null,
+          "system_fingerprint": null,
+          "usage": null
+        }
+      },
+      {
+        "__type__": "openai.types.chat.chat_completion_chunk.ChatCompletionChunk",
+        "__data__": {
+          "id": "chatcmpl-CECIgeXOClAuSm8xHAS6CYQ87lB8O",
+          "choices": [
+            {
+              "delta": {
+                "content": " today",
+                "function_call": null,
+                "refusal": null,
+                "role": null,
+                "tool_calls": null
+              },
+              "finish_reason": null,
+              "index": 0,
+              "logprobs": null,
+              "content_filter_results": {}
+            }
+          ],
+          "created": 1757499910,
+          "model": "gpt-5-mini-2025-08-07",
+          "object": "chat.completion.chunk",
+          "service_tier": null,
+          "system_fingerprint": null,
+          "usage": null
+        }
+      },
+      {
+        "__type__": "openai.types.chat.chat_completion_chunk.ChatCompletionChunk",
+        "__data__": {
+          "id": "chatcmpl-CECIgeXOClAuSm8xHAS6CYQ87lB8O",
+          "choices": [
+            {
+              "delta": {
+                "content": "?",
+                "function_call": null,
+                "refusal": null,
+                "role": null,
+                "tool_calls": null
+              },
+              "finish_reason": null,
+              "index": 0,
+              "logprobs": null,
+              "content_filter_results": {}
+            }
+          ],
+          "created": 1757499910,
+          "model": "gpt-5-mini-2025-08-07",
+          "object": "chat.completion.chunk",
+          "service_tier": null,
+          "system_fingerprint": null,
+          "usage": null
+        }
+      },
+      {
+        "__type__": "openai.types.chat.chat_completion_chunk.ChatCompletionChunk",
+        "__data__": {
+          "id": "chatcmpl-CECIgeXOClAuSm8xHAS6CYQ87lB8O",
+          "choices": [
+            {
+              "delta": {
+                "content": null,
+                "function_call": null,
+                "refusal": null,
+                "role": null,
+                "tool_calls": null
+              },
+              "finish_reason": "stop",
+              "index": 0,
+              "logprobs": null,
+              "content_filter_results": {}
+            }
+          ],
+          "created": 1757499910,
+          "model": "gpt-5-mini-2025-08-07",
+          "object": "chat.completion.chunk",
+          "service_tier": null,
+          "system_fingerprint": null,
+          "usage": null
+        }
+      }
+    ],
+    "is_streaming": true
+  }
+}
diff --git a/tests/integration/recordings/responses/57b67d1b1a36.json b/tests/integration/recordings/responses/57b67d1b1a36.json
new file mode 100644
index 000000000..14de1d85e
--- /dev/null
+++ b/tests/integration/recordings/responses/57b67d1b1a36.json
@@ -0,0 +1,71 @@
+{
+  "request": {
+    "method": "POST",
+    "url": "https://shan-mfbb618r-eastus2.cognitiveservices.azure.com/openai/v1/v1/chat/completions",
+    "headers": {},
+    "body": {
+      "model": "gpt-5-mini",
+      "messages": [
+        {
+          "role": "user",
+          "content": "Which planet has rings around it with a name starting with letter S?"
+        }
+      ],
+      "stream": false
+    },
+    "endpoint": "/v1/chat/completions",
+    "model": "gpt-5-mini"
+  },
+  "response": {
+    "body": {
+      "__type__": "openai.types.chat.chat_completion.ChatCompletion",
+      "__data__": {
+        "id": "chatcmpl-CECIkT5cbqFazpungtewksVePcUNa",
+        "choices": [
+          {
+            "finish_reason": "stop",
+            "index": 0,
+            "logprobs": null,
+            "message": {
+              "content": "Saturn. It's the planet famous for its prominent ring system made of ice and rock.",
+              "refusal": null,
+              "role": "assistant",
+              "annotations": [],
+              "audio": null,
+              "function_call": null,
+              "tool_calls": null
+            },
+            "content_filter_results": {}
+          }
+        ],
+        "created": 1757499914,
+        "model": "gpt-5-mini-2025-08-07",
+        "object": "chat.completion",
+        "service_tier": null,
+        "system_fingerprint": null,
+        "usage": {
+          "completion_tokens": 156,
+          "prompt_tokens": 20,
+          "total_tokens": 176,
+          "completion_tokens_details": {
+            "accepted_prediction_tokens": 0,
+            "audio_tokens": 0,
+            "reasoning_tokens": 128,
+            "rejected_prediction_tokens": 0
+          },
+          "prompt_tokens_details": {
+            "audio_tokens": 0,
+            "cached_tokens": 0
+          }
+        },
+        "prompt_filter_results": [
+          {
+            "prompt_index": 0,
+            "content_filter_results": {}
+          }
+        ]
+      }
+    },
+    "is_streaming": false
+  }
+}
diff --git a/tests/integration/recordings/responses/8752115f8d0c.json b/tests/integration/recordings/responses/8752115f8d0c.json
new file mode 100644
index 000000000..0e88bbfa6
--- /dev/null
+++ b/tests/integration/recordings/responses/8752115f8d0c.json
@@ -0,0 +1,71 @@
+{
+  "request": {
+    "method": "POST",
+    "url": "https://shan-mfbb618r-eastus2.cognitiveservices.azure.com/openai/v1/v1/chat/completions",
+    "headers": {},
+    "body": {
+      "model": "gpt-5-mini",
+      "messages": [
+        {
+          "role": "user",
+          "content": "Hello, world!"
+        }
+      ],
+      "stream": false
+    },
+    "endpoint": "/v1/chat/completions",
+    "model": "gpt-5-mini"
+  },
+  "response": {
+    "body": {
+      "__type__": "openai.types.chat.chat_completion.ChatCompletion",
+      "__data__": {
+        "id": "chatcmpl-CECIuyylsMNXspa83k8LrD8SQadNY",
+        "choices": [
+          {
+            "finish_reason": "stop",
+            "index": 0,
+            "logprobs": null,
+            "message": {
+              "content": "Hello! \ud83d\udc4b How can I help you today \u2014 answer a question, write or edit something, debug code, brainstorm ideas, or anything else?",
+              "refusal": null,
+              "role": "assistant",
+              "annotations": [],
+              "audio": null,
+              "function_call": null,
+              "tool_calls": null
+            },
+            "content_filter_results": {}
+          }
+        ],
+        "created": 1757499924,
+        "model": "gpt-5-mini-2025-08-07",
+        "object": "chat.completion",
+        "service_tier": null,
+        "system_fingerprint": null,
+        "usage": {
+          "completion_tokens": 40,
+          "prompt_tokens": 10,
+          "total_tokens": 50,
+          "completion_tokens_details": {
+            "accepted_prediction_tokens": 0,
+            "audio_tokens": 0,
+            "reasoning_tokens": 0,
+            "rejected_prediction_tokens": 0
+          },
+          "prompt_tokens_details": {
+            "audio_tokens": 0,
+            "cached_tokens": 0
+          }
+        },
+        "prompt_filter_results": [
+          {
+            "prompt_index": 0,
+            "content_filter_results": {}
+          }
+        ]
+      }
+    },
+    "is_streaming": false
+  }
+}
diff --git a/tests/integration/recordings/responses/94d11daee205.json b/tests/integration/recordings/responses/94d11daee205.json
new file mode 100644
index 000000000..b6a6c3d68
--- /dev/null
+++ b/tests/integration/recordings/responses/94d11daee205.json
@@ -0,0 +1,1178 @@
+{
+  "request": {
+    "method": "POST",
+    "url": "https://shan-mfbb618r-eastus2.cognitiveservices.azure.com/openai/v1/v1/chat/completions",
+    "headers": {},
+    "body": {
+      "model": "gpt-5-mini",
+      "messages": [
+        {
+          "role": "user",
+          "content": "What is the name of the US captial?"
+        }
+      ],
+      "n": 2,
+      "stream": true
+    },
+    "endpoint": "/v1/chat/completions",
+    "model": "gpt-5-mini"
+  },
+  "response": {
+    "body": [
+      {
+        "__type__": "openai.types.chat.chat_completion_chunk.ChatCompletionChunk",
+        "__data__": {
+          "id": "",
+          "choices": [],
+          "created": 0,
+          "model": "",
+          "object": "",
+          "service_tier": null,
+          "system_fingerprint": null,
+          "usage": null,
+          "prompt_filter_results": [
+            {
+              "prompt_index": 0,
+              "content_filter_results": {}
+            }
+          ]
+        }
+      },
+      {
+        "__type__": "openai.types.chat.chat_completion_chunk.ChatCompletionChunk",
+        "__data__": {
+          "id": "chatcmpl-CECIpbpLN9VO3z9pVAidTRslxRHtL",
+          "choices": [
+            {
+              "delta": {
+                "content": "",
+                "function_call": null,
+                "refusal": null,
+                "role": "assistant",
+                "tool_calls": null
+              },
+              "finish_reason": null,
+              "index": 0,
+              "logprobs": null,
+              "content_filter_results": {}
+            }
+          ],
+          "created": 1757499919,
+          "model": "gpt-5-mini-2025-08-07",
+          "object": "chat.completion.chunk",
+          "service_tier": null,
+          "system_fingerprint": null,
+          "usage": null
+        }
+      },
+      {
+        "__type__": "openai.types.chat.chat_completion_chunk.ChatCompletionChunk",
+        "__data__": {
+          "id": "chatcmpl-CECIpbpLN9VO3z9pVAidTRslxRHtL",
+          "choices": [
+            {
+              "delta": {
+                "content": "",
+                "function_call": null,
+                "refusal": null,
+                "role": "assistant",
+                "tool_calls": null
+              },
+              "finish_reason": null,
+              "index": 1,
+              "logprobs": null,
+              "content_filter_results": {}
+            }
+          ],
+          "created": 1757499919,
+          "model": "gpt-5-mini-2025-08-07",
+          "object": "chat.completion.chunk",
+          "service_tier": null,
+          "system_fingerprint": null,
+          "usage": null
+        }
+      },
+      {
+        "__type__": "openai.types.chat.chat_completion_chunk.ChatCompletionChunk",
+        "__data__": {
+          "id": "chatcmpl-CECIpbpLN9VO3z9pVAidTRslxRHtL",
+          "choices": [
+            {
+              "delta": {
+                "content": "The",
+                "function_call": null,
+                "refusal": null,
+                "role": null,
+                "tool_calls": null
+              },
+              "finish_reason": null,
+              "index": 0,
+              "logprobs": null,
+              "content_filter_results": {}
+            }
+          ],
+          "created": 1757499919,
+          "model": "gpt-5-mini-2025-08-07",
+          "object": "chat.completion.chunk",
+          "service_tier": null,
+          "system_fingerprint": null,
+          "usage": null
+        }
+      },
+      {
+        "__type__": "openai.types.chat.chat_completion_chunk.ChatCompletionChunk",
+        "__data__": {
+          "id": "chatcmpl-CECIpbpLN9VO3z9pVAidTRslxRHtL",
+          "choices": [
+            {
+              "delta": {
+                "content": " capital",
+                "function_call": null,
+                "refusal": null,
+                "role": null,
+                "tool_calls": null
+              },
+              "finish_reason": null,
+              "index": 0,
+              "logprobs": null,
+              "content_filter_results": {}
+            }
+          ],
+          "created": 1757499919,
+          "model": "gpt-5-mini-2025-08-07",
+          "object": "chat.completion.chunk",
+          "service_tier": null,
+          "system_fingerprint": null,
+          "usage": null
+        }
+      },
+      {
+        "__type__": "openai.types.chat.chat_completion_chunk.ChatCompletionChunk",
+        "__data__": {
+          "id": "chatcmpl-CECIpbpLN9VO3z9pVAidTRslxRHtL",
+          "choices": [
+            {
+              "delta": {
+                "content": " of",
+                "function_call": null,
+                "refusal": null,
+                "role": null,
+                "tool_calls": null
+              },
+              "finish_reason": null,
+              "index": 0,
+              "logprobs": null,
+              "content_filter_results": {}
+            }
+          ],
+          "created": 1757499919,
+          "model": "gpt-5-mini-2025-08-07",
+          "object": "chat.completion.chunk",
+          "service_tier": null,
+          "system_fingerprint": null,
+          "usage": null
+        }
+      },
+      {
+        "__type__": "openai.types.chat.chat_completion_chunk.ChatCompletionChunk",
+        "__data__": {
+          "id": "chatcmpl-CECIpbpLN9VO3z9pVAidTRslxRHtL",
+          "choices": [
+            {
+              "delta": {
+                "content": " the",
+                "function_call": null,
+                "refusal": null,
+                "role": null,
+                "tool_calls": null
+              },
+              "finish_reason": null,
+              "index": 0,
+              "logprobs": null,
+              "content_filter_results": {}
+            }
+          ],
+          "created": 1757499919,
+          "model": "gpt-5-mini-2025-08-07",
+          "object": "chat.completion.chunk",
+          "service_tier": null,
+          "system_fingerprint": null,
+          "usage": null
+        }
+      },
+      {
+        "__type__": "openai.types.chat.chat_completion_chunk.ChatCompletionChunk",
+        "__data__": {
+          "id": "chatcmpl-CECIpbpLN9VO3z9pVAidTRslxRHtL",
+          "choices": [
+            {
+              "delta": {
+                "content": " United",
+                "function_call": null,
+                "refusal": null,
+                "role": null,
+                "tool_calls": null
+              },
+              "finish_reason": null,
+              "index": 0,
+              "logprobs": null,
+              "content_filter_results": {}
+            }
+          ],
+          "created": 1757499919,
+          "model": "gpt-5-mini-2025-08-07",
+          "object": "chat.completion.chunk",
+          "service_tier": null,
+          "system_fingerprint": null,
+          "usage": null
+        }
+      },
+      {
+        "__type__": "openai.types.chat.chat_completion_chunk.ChatCompletionChunk",
+        "__data__": {
+          "id": "chatcmpl-CECIpbpLN9VO3z9pVAidTRslxRHtL",
+          "choices": [
+            {
+              "delta": {
+                "content": " States",
+                "function_call": null,
+                "refusal": null,
+                "role": null,
+                "tool_calls": null
+              },
+              "finish_reason": null,
+              "index": 0,
+              "logprobs": null,
+              "content_filter_results": {}
+            }
+          ],
+          "created": 1757499919,
+          "model": "gpt-5-mini-2025-08-07",
+          "object": "chat.completion.chunk",
+          "service_tier": null,
+          "system_fingerprint": null,
+          "usage": null
+        }
+      },
+      {
+        "__type__": "openai.types.chat.chat_completion_chunk.ChatCompletionChunk",
+        "__data__": {
+          "id": "chatcmpl-CECIpbpLN9VO3z9pVAidTRslxRHtL",
+          "choices": [
+            {
+              "delta": {
+                "content": "The",
+                "function_call": null,
+                "refusal": null,
+                "role": null,
+                "tool_calls": null
+              },
+              "finish_reason": null,
+              "index": 1,
+              "logprobs": null,
+              "content_filter_results": {}
+            }
+          ],
+          "created": 1757499919,
+          "model": "gpt-5-mini-2025-08-07",
+          "object": "chat.completion.chunk",
+          "service_tier": null,
+          "system_fingerprint": null,
+          "usage": null
+        }
+      },
+      {
+        "__type__": "openai.types.chat.chat_completion_chunk.ChatCompletionChunk",
+        "__data__": {
+          "id": "chatcmpl-CECIpbpLN9VO3z9pVAidTRslxRHtL",
+          "choices": [
+            {
+              "delta": {
+                "content": " capital",
+                "function_call": null,
+                "refusal": null,
+                "role": null,
+                "tool_calls": null
+              },
+              "finish_reason": null,
+              "index": 1,
+              "logprobs": null,
+              "content_filter_results": {}
+            }
+          ],
+          "created": 1757499919,
+          "model": "gpt-5-mini-2025-08-07",
+          "object": "chat.completion.chunk",
+          "service_tier": null,
+          "system_fingerprint": null,
+          "usage": null
+        }
+      },
+      {
+        "__type__": "openai.types.chat.chat_completion_chunk.ChatCompletionChunk",
+        "__data__": {
+          "id": "chatcmpl-CECIpbpLN9VO3z9pVAidTRslxRHtL",
+          "choices": [
+            {
+              "delta": {
+                "content": " of",
+                "function_call": null,
+                "refusal": null,
+                "role": null,
+                "tool_calls": null
+              },
+              "finish_reason": null,
+              "index": 1,
+              "logprobs": null,
+              "content_filter_results": {}
+            }
+          ],
+          "created": 1757499919,
+          "model": "gpt-5-mini-2025-08-07",
+          "object": "chat.completion.chunk",
+          "service_tier": null,
+          "system_fingerprint": null,
+          "usage": null
+        }
+      },
+      {
+        "__type__": "openai.types.chat.chat_completion_chunk.ChatCompletionChunk",
+        "__data__": {
+          "id": "chatcmpl-CECIpbpLN9VO3z9pVAidTRslxRHtL",
+          "choices": [
+            {
+              "delta": {
+                "content": " the",
+                "function_call": null,
+                "refusal": null,
+                "role": null,
+                "tool_calls": null
+              },
+              "finish_reason": null,
+              "index": 1,
+              "logprobs": null,
+              "content_filter_results": {}
+            }
+          ],
+          "created": 1757499919,
+          "model": "gpt-5-mini-2025-08-07",
+          "object": "chat.completion.chunk",
+          "service_tier": null,
+          "system_fingerprint": null,
+          "usage": null
+        }
+      },
+      {
+        "__type__": "openai.types.chat.chat_completion_chunk.ChatCompletionChunk",
+        "__data__": {
+          "id": "chatcmpl-CECIpbpLN9VO3z9pVAidTRslxRHtL",
+          "choices": [
+            {
+              "delta": {
+                "content": " United",
+                "function_call": null,
+                "refusal": null,
+                "role": null,
+                "tool_calls": null
+              },
+              "finish_reason": null,
+              "index": 1,
+              "logprobs": null,
+              "content_filter_results": {}
+            }
+          ],
+          "created": 1757499919,
+          "model": "gpt-5-mini-2025-08-07",
+          "object": "chat.completion.chunk",
+          "service_tier": null,
+          "system_fingerprint": null,
+          "usage": null
+        }
+      },
+      {
+        "__type__": "openai.types.chat.chat_completion_chunk.ChatCompletionChunk",
+        "__data__": {
+          "id": "chatcmpl-CECIpbpLN9VO3z9pVAidTRslxRHtL",
+          "choices": [
+            {
+              "delta": {
+                "content": " is",
+                "function_call": null,
+                "refusal": null,
+                "role": null,
+                "tool_calls": null
+              },
+              "finish_reason": null,
+              "index": 0,
+              "logprobs": null,
+              "content_filter_results": {}
+            }
+          ],
+          "created": 1757499919,
+          "model": "gpt-5-mini-2025-08-07",
+          "object": "chat.completion.chunk",
+          "service_tier": null,
+          "system_fingerprint": null,
+          "usage": null
+        }
+      },
+      {
+        "__type__": "openai.types.chat.chat_completion_chunk.ChatCompletionChunk",
+        "__data__": {
+          "id": "chatcmpl-CECIpbpLN9VO3z9pVAidTRslxRHtL",
+          "choices": [
+            {
+              "delta": {
+                "content": " States",
+                "function_call": null,
+                "refusal": null,
+                "role": null,
+                "tool_calls": null
+              },
+              "finish_reason": null,
+              "index": 1,
+              "logprobs": null,
+              "content_filter_results": {}
+            }
+          ],
+          "created": 1757499919,
+          "model": "gpt-5-mini-2025-08-07",
+          "object": "chat.completion.chunk",
+          "service_tier": null,
+          "system_fingerprint": null,
+          "usage": null
+        }
+      },
+      {
+        "__type__": "openai.types.chat.chat_completion_chunk.ChatCompletionChunk",
+        "__data__": {
+          "id": "chatcmpl-CECIpbpLN9VO3z9pVAidTRslxRHtL",
+          "choices": [
+            {
+              "delta": {
+                "content": " Washington",
+                "function_call": null,
+                "refusal": null,
+                "role": null,
+                "tool_calls": null
+              },
+              "finish_reason": null,
+              "index": 0,
+              "logprobs": null,
+              "content_filter_results": {}
+            }
+          ],
+          "created": 1757499919,
+          "model": "gpt-5-mini-2025-08-07",
+          "object": "chat.completion.chunk",
+          "service_tier": null,
+          "system_fingerprint": null,
+          "usage": null
+        }
+      },
+      {
+        "__type__": "openai.types.chat.chat_completion_chunk.ChatCompletionChunk",
+        "__data__": {
+          "id": "chatcmpl-CECIpbpLN9VO3z9pVAidTRslxRHtL",
+          "choices": [
+            {
+              "delta": {
+                "content": " is",
+                "function_call": null,
+                "refusal": null,
+                "role": null,
+                "tool_calls": null
+              },
+              "finish_reason": null,
+              "index": 1,
+              "logprobs": null,
+              "content_filter_results": {}
+            }
+          ],
+          "created": 1757499919,
+          "model": "gpt-5-mini-2025-08-07",
+          "object": "chat.completion.chunk",
+          "service_tier": null,
+          "system_fingerprint": null,
+          "usage": null
+        }
+      },
+      {
+        "__type__": "openai.types.chat.chat_completion_chunk.ChatCompletionChunk",
+        "__data__": {
+          "id": "chatcmpl-CECIpbpLN9VO3z9pVAidTRslxRHtL",
+          "choices": [
+            {
+              "delta": {
+                "content": ",",
+                "function_call": null,
+                "refusal": null,
+                "role": null,
+                "tool_calls": null
+              },
+              "finish_reason": null,
+              "index": 0,
+              "logprobs": null,
+              "content_filter_results": {}
+            }
+          ],
+          "created": 1757499919,
+          "model": "gpt-5-mini-2025-08-07",
+          "object": "chat.completion.chunk",
+          "service_tier": null,
+          "system_fingerprint": null,
+          "usage": null
+        }
+      },
+      {
+        "__type__": "openai.types.chat.chat_completion_chunk.ChatCompletionChunk",
+        "__data__": {
+          "id": "chatcmpl-CECIpbpLN9VO3z9pVAidTRslxRHtL",
+          "choices": [
+            {
+              "delta": {
+                "content": " Washington",
+                "function_call": null,
+                "refusal": null,
+                "role": null,
+                "tool_calls": null
+              },
+              "finish_reason": null,
+              "index": 1,
+              "logprobs": null,
+              "content_filter_results": {}
+            }
+          ],
+          "created": 1757499919,
+          "model": "gpt-5-mini-2025-08-07",
+          "object": "chat.completion.chunk",
+          "service_tier": null,
+          "system_fingerprint": null,
+          "usage": null
+        }
+      },
+      {
+        "__type__": "openai.types.chat.chat_completion_chunk.ChatCompletionChunk",
+        "__data__": {
+          "id": "chatcmpl-CECIpbpLN9VO3z9pVAidTRslxRHtL",
+          "choices": [
+            {
+              "delta": {
+                "content": " D",
+                "function_call": null,
+                "refusal": null,
+                "role": null,
+                "tool_calls": null
+              },
+              "finish_reason": null,
+              "index": 0,
+              "logprobs": null,
+              "content_filter_results": {}
+            }
+          ],
+          "created": 1757499919,
+          "model": "gpt-5-mini-2025-08-07",
+          "object": "chat.completion.chunk",
+          "service_tier": null,
+          "system_fingerprint": null,
+          "usage": null
+        }
+      },
+      {
+        "__type__": "openai.types.chat.chat_completion_chunk.ChatCompletionChunk",
+        "__data__": {
+          "id": "chatcmpl-CECIpbpLN9VO3z9pVAidTRslxRHtL",
+          "choices": [
+            {
+              "delta": {
+                "content": ",",
+                "function_call": null,
+                "refusal": null,
+                "role": null,
+                "tool_calls": null
+              },
+              "finish_reason": null,
+              "index": 1,
+              "logprobs": null,
+              "content_filter_results": {}
+            }
+          ],
+          "created": 1757499919,
+          "model": "gpt-5-mini-2025-08-07",
+          "object": "chat.completion.chunk",
+          "service_tier": null,
+          "system_fingerprint": null,
+          "usage": null
+        }
+      },
+      {
+        "__type__": "openai.types.chat.chat_completion_chunk.ChatCompletionChunk",
+        "__data__": {
+          "id": "chatcmpl-CECIpbpLN9VO3z9pVAidTRslxRHtL",
+          "choices": [
+            {
+              "delta": {
+                "content": ".C",
+                "function_call": null,
+                "refusal": null,
+                "role": null,
+                "tool_calls": null
+              },
+              "finish_reason": null,
+              "index": 0,
+              "logprobs": null,
+              "content_filter_results": {}
+            }
+          ],
+          "created": 1757499919,
+          "model": "gpt-5-mini-2025-08-07",
+          "object": "chat.completion.chunk",
+          "service_tier": null,
+          "system_fingerprint": null,
+          "usage": null
+        }
+      },
+      {
+        "__type__": "openai.types.chat.chat_completion_chunk.ChatCompletionChunk",
+        "__data__": {
+          "id": "chatcmpl-CECIpbpLN9VO3z9pVAidTRslxRHtL",
+          "choices": [
+            {
+              "delta": {
+                "content": " D",
+                "function_call": null,
+                "refusal": null,
+                "role": null,
+                "tool_calls": null
+              },
+              "finish_reason": null,
+              "index": 1,
+              "logprobs": null,
+              "content_filter_results": {}
+            }
+          ],
+          "created": 1757499919,
+          "model": "gpt-5-mini-2025-08-07",
+          "object": "chat.completion.chunk",
+          "service_tier": null,
+          "system_fingerprint": null,
+          "usage": null
+        }
+      },
+      {
+        "__type__": "openai.types.chat.chat_completion_chunk.ChatCompletionChunk",
+        "__data__": {
+          "id": "chatcmpl-CECIpbpLN9VO3z9pVAidTRslxRHtL",
+          "choices": [
+            {
+              "delta": {
+                "content": ".",
+                "function_call": null,
+                "refusal": null,
+                "role": null,
+                "tool_calls": null
+              },
+              "finish_reason": null,
+              "index": 0,
+              "logprobs": null,
+              "content_filter_results": {}
+            }
+          ],
+          "created": 1757499919,
+          "model": "gpt-5-mini-2025-08-07",
+          "object": "chat.completion.chunk",
+          "service_tier": null,
+          "system_fingerprint": null,
+          "usage": null
+        }
+      },
+      {
+        "__type__": "openai.types.chat.chat_completion_chunk.ChatCompletionChunk",
+        "__data__": {
+          "id": "chatcmpl-CECIpbpLN9VO3z9pVAidTRslxRHtL",
+          "choices": [
+            {
+              "delta": {
+                "content": ".C",
+                "function_call": null,
+                "refusal": null,
+                "role": null,
+                "tool_calls": null
+              },
+              "finish_reason": null,
+              "index": 1,
+              "logprobs": null,
+              "content_filter_results": {}
+            }
+          ],
+          "created": 1757499919,
+          "model": "gpt-5-mini-2025-08-07",
+          "object": "chat.completion.chunk",
+          "service_tier": null,
+          "system_fingerprint": null,
+          "usage": null
+        }
+      },
+      {
+        "__type__": "openai.types.chat.chat_completion_chunk.ChatCompletionChunk",
+        "__data__": {
+          "id": "chatcmpl-CECIpbpLN9VO3z9pVAidTRslxRHtL",
+          "choices": [
+            {
+              "delta": {
+                "content": " (",
+                "function_call": null,
+                "refusal": null,
+                "role": null,
+                "tool_calls": null
+              },
+              "finish_reason": null,
+              "index": 0,
+              "logprobs": null,
+              "content_filter_results": {}
+            }
+          ],
+          "created": 1757499919,
+          "model": "gpt-5-mini-2025-08-07",
+          "object": "chat.completion.chunk",
+          "service_tier": null,
+          "system_fingerprint": null,
+          "usage": null
+        }
+      },
+      {
+        "__type__": "openai.types.chat.chat_completion_chunk.ChatCompletionChunk",
+        "__data__": {
+          "id": "chatcmpl-CECIpbpLN9VO3z9pVAidTRslxRHtL",
+          "choices": [
+            {
+              "delta": {
+                "content": ".",
+                "function_call": null,
+                "refusal": null,
+                "role": null,
+                "tool_calls": null
+              },
+              "finish_reason": null,
+              "index": 1,
+              "logprobs": null,
+              "content_filter_results": {}
+            }
+          ],
+          "created": 1757499919,
+          "model": "gpt-5-mini-2025-08-07",
+          "object": "chat.completion.chunk",
+          "service_tier": null,
+          "system_fingerprint": null,
+          "usage": null
+        }
+      },
+      {
+        "__type__": "openai.types.chat.chat_completion_chunk.ChatCompletionChunk",
+        "__data__": {
+          "id": "chatcmpl-CECIpbpLN9VO3z9pVAidTRslxRHtL",
+          "choices": [
+            {
+              "delta": {
+                "content": "the",
+                "function_call": null,
+                "refusal": null,
+                "role": null,
+                "tool_calls": null
+              },
+              "finish_reason": null,
+              "index": 0,
+              "logprobs": null,
+              "content_filter_results": {}
+            }
+          ],
+          "created": 1757499919,
+          "model": "gpt-5-mini-2025-08-07",
+          "object": "chat.completion.chunk",
+          "service_tier": null,
+          "system_fingerprint": null,
+          "usage": null
+        }
+      },
+      {
+        "__type__": "openai.types.chat.chat_completion_chunk.ChatCompletionChunk",
+        "__data__": {
+          "id": "chatcmpl-CECIpbpLN9VO3z9pVAidTRslxRHtL",
+          "choices": [
+            {
+              "delta": {
+                "content": " (",
+                "function_call": null,
+                "refusal": null,
+                "role": null,
+                "tool_calls": null
+              },
+              "finish_reason": null,
+              "index": 1,
+              "logprobs": null,
+              "content_filter_results": {}
+            }
+          ],
+          "created": 1757499919,
+          "model": "gpt-5-mini-2025-08-07",
+          "object": "chat.completion.chunk",
+          "service_tier": null,
+          "system_fingerprint": null,
+          "usage": null
+        }
+      },
+      {
+        "__type__": "openai.types.chat.chat_completion_chunk.ChatCompletionChunk",
+        "__data__": {
+          "id": "chatcmpl-CECIpbpLN9VO3z9pVAidTRslxRHtL",
+          "choices": [
+            {
+              "delta": {
+                "content": " District",
+                "function_call": null,
+                "refusal": null,
+                "role": null,
+                "tool_calls": null
+              },
+              "finish_reason": null,
+              "index": 0,
+              "logprobs": null,
+              "content_filter_results": {}
+            }
+          ],
+          "created": 1757499919,
+          "model": "gpt-5-mini-2025-08-07",
+          "object": "chat.completion.chunk",
+          "service_tier": null,
+          "system_fingerprint": null,
+          "usage": null
+        }
+      },
+      {
+        "__type__": "openai.types.chat.chat_completion_chunk.ChatCompletionChunk",
+        "__data__": {
+          "id": "chatcmpl-CECIpbpLN9VO3z9pVAidTRslxRHtL",
+          "choices": [
+            {
+              "delta": {
+                "content": "official",
+                "function_call": null,
+                "refusal": null,
+                "role": null,
+                "tool_calls": null
+              },
+              "finish_reason": null,
+              "index": 1,
+              "logprobs": null,
+              "content_filter_results": {}
+            }
+          ],
+          "created": 1757499919,
+          "model": "gpt-5-mini-2025-08-07",
+          "object": "chat.completion.chunk",
+          "service_tier": null,
+          "system_fingerprint": null,
+          "usage": null
+        }
+      },
+      {
+        "__type__": "openai.types.chat.chat_completion_chunk.ChatCompletionChunk",
+        "__data__": {
+          "id": "chatcmpl-CECIpbpLN9VO3z9pVAidTRslxRHtL",
+          "choices": [
+            {
+              "delta": {
+                "content": " of",
+                "function_call": null,
+                "refusal": null,
+                "role": null,
+                "tool_calls": null
+              },
+              "finish_reason": null,
+              "index": 0,
+              "logprobs": null,
+              "content_filter_results": {}
+            }
+          ],
+          "created": 1757499919,
+          "model": "gpt-5-mini-2025-08-07",
+          "object": "chat.completion.chunk",
+          "service_tier": null,
+          "system_fingerprint": null,
+          "usage": null
+        }
+      },
+      {
+        "__type__": "openai.types.chat.chat_completion_chunk.ChatCompletionChunk",
+        "__data__": {
+          "id": "chatcmpl-CECIpbpLN9VO3z9pVAidTRslxRHtL",
+          "choices": [
+            {
+              "delta": {
+                "content": "ly",
+                "function_call": null,
+                "refusal": null,
+                "role": null,
+                "tool_calls": null
+              },
+              "finish_reason": null,
+              "index": 1,
+              "logprobs": null,
+              "content_filter_results": {}
+            }
+          ],
+          "created": 1757499919,
+          "model": "gpt-5-mini-2025-08-07",
+          "object": "chat.completion.chunk",
+          "service_tier": null,
+          "system_fingerprint": null,
+          "usage": null
+        }
+      },
+      {
+        "__type__": "openai.types.chat.chat_completion_chunk.ChatCompletionChunk",
+        "__data__": {
+          "id": "chatcmpl-CECIpbpLN9VO3z9pVAidTRslxRHtL",
+          "choices": [
+            {
+              "delta": {
+                "content": " Columbia",
+                "function_call": null,
+                "refusal": null,
+                "role": null,
+                "tool_calls": null
+              },
+              "finish_reason": null,
+              "index": 0,
+              "logprobs": null,
+              "content_filter_results": {}
+            }
+          ],
+          "created": 1757499919,
+          "model": "gpt-5-mini-2025-08-07",
+          "object": "chat.completion.chunk",
+          "service_tier": null,
+          "system_fingerprint": null,
+          "usage": null
+        }
+      },
+      {
+        "__type__": "openai.types.chat.chat_completion_chunk.ChatCompletionChunk",
+        "__data__": {
+          "id": "chatcmpl-CECIpbpLN9VO3z9pVAidTRslxRHtL",
+          "choices": [
+            {
+              "delta": {
+                "content": " the",
+                "function_call": null,
+                "refusal": null,
+                "role": null,
+                "tool_calls": null
+              },
+              "finish_reason": null,
+              "index": 1,
+              "logprobs": null,
+              "content_filter_results": {}
+            }
+          ],
+          "created": 1757499919,
+          "model": "gpt-5-mini-2025-08-07",
+          "object": "chat.completion.chunk",
+          "service_tier": null,
+          "system_fingerprint": null,
+          "usage": null
+        }
+      },
+      {
+        "__type__": "openai.types.chat.chat_completion_chunk.ChatCompletionChunk",
+        "__data__": {
+          "id": "chatcmpl-CECIpbpLN9VO3z9pVAidTRslxRHtL",
+          "choices": [
+            {
+              "delta": {
+                "content": ").",
+                "function_call": null,
+                "refusal": null,
+                "role": null,
+                "tool_calls": null
+              },
+              "finish_reason": null,
+              "index": 0,
+              "logprobs": null,
+              "content_filter_results": {}
+            }
+          ],
+          "created": 1757499919,
+          "model": "gpt-5-mini-2025-08-07",
+          "object": "chat.completion.chunk",
+          "service_tier": null,
+          "system_fingerprint": null,
+          "usage": null
+        }
+      },
+      {
+        "__type__": "openai.types.chat.chat_completion_chunk.ChatCompletionChunk",
+        "__data__": {
+          "id": "chatcmpl-CECIpbpLN9VO3z9pVAidTRslxRHtL",
+          "choices": [
+            {
+              "delta": {
+                "content": " District",
+                "function_call": null,
+                "refusal": null,
+                "role": null,
+                "tool_calls": null
+              },
+              "finish_reason": null,
+              "index": 1,
+              "logprobs": null,
+              "content_filter_results": {}
+            }
+          ],
+          "created": 1757499919,
+          "model": "gpt-5-mini-2025-08-07",
+          "object": "chat.completion.chunk",
+          "service_tier": null,
+          "system_fingerprint": null,
+          "usage": null
+        }
+      },
+      {
+        "__type__": "openai.types.chat.chat_completion_chunk.ChatCompletionChunk",
+        "__data__": {
+          "id": "chatcmpl-CECIpbpLN9VO3z9pVAidTRslxRHtL",
+          "choices": [
+            {
+              "delta": {
+                "content": " of",
+                "function_call": null,
+                "refusal": null,
+                "role": null,
+                "tool_calls": null
+              },
+              "finish_reason": null,
+              "index": 1,
+              "logprobs": null,
+              "content_filter_results": {}
+            }
+          ],
+          "created": 1757499919,
+          "model": "gpt-5-mini-2025-08-07",
+          "object": "chat.completion.chunk",
+          "service_tier": null,
+          "system_fingerprint": null,
+          "usage": null
+        }
+      },
+      {
+        "__type__": "openai.types.chat.chat_completion_chunk.ChatCompletionChunk",
+        "__data__": {
+          "id": "chatcmpl-CECIpbpLN9VO3z9pVAidTRslxRHtL",
+          "choices": [
+            {
+              "delta": {
+                "content": " Columbia",
+                "function_call": null,
+                "refusal": null,
+                "role": null,
+                "tool_calls": null
+              },
+              "finish_reason": null,
+              "index": 1,
+              "logprobs": null,
+              "content_filter_results": {}
+            }
+          ],
+          "created": 1757499919,
+          "model": "gpt-5-mini-2025-08-07",
+          "object": "chat.completion.chunk",
+          "service_tier": null,
+          "system_fingerprint": null,
+          "usage": null
+        }
+      },
+      {
+        "__type__": "openai.types.chat.chat_completion_chunk.ChatCompletionChunk",
+        "__data__": {
+          "id": "chatcmpl-CECIpbpLN9VO3z9pVAidTRslxRHtL",
+          "choices": [
+            {
+              "delta": {
+                "content": ").",
+                "function_call": null,
+                "refusal": null,
+                "role": null,
+                "tool_calls": null
+              },
+              "finish_reason": null,
+              "index": 1,
+              "logprobs": null,
+              "content_filter_results": {}
+            }
+          ],
+          "created": 1757499919,
+          "model": "gpt-5-mini-2025-08-07",
+          "object": "chat.completion.chunk",
+          "service_tier": null,
+          "system_fingerprint": null,
+          "usage": null
+        }
+      },
+      {
+        "__type__": "openai.types.chat.chat_completion_chunk.ChatCompletionChunk",
+        "__data__": {
+          "id": "chatcmpl-CECIpbpLN9VO3z9pVAidTRslxRHtL",
+          "choices": [
+            {
+              "delta": {
+                "content": null,
+                "function_call": null,
+                "refusal": null,
+                "role": null,
+                "tool_calls": null
+              },
+              "finish_reason": "stop",
+              "index": 0,
+              "logprobs": null,
+              "content_filter_results": {}
+            }
+          ],
+          "created": 1757499919,
+          "model": "gpt-5-mini-2025-08-07",
+          "object": "chat.completion.chunk",
+          "service_tier": null,
+          "system_fingerprint": null,
+          "usage": null
+        }
+      },
+      {
+        "__type__": "openai.types.chat.chat_completion_chunk.ChatCompletionChunk",
+        "__data__": {
+          "id": "chatcmpl-CECIpbpLN9VO3z9pVAidTRslxRHtL",
+          "choices": [
+            {
+              "delta": {
+                "content": null,
+                "function_call": null,
+                "refusal": null,
+                "role": null,
+                "tool_calls": null
+              },
+              "finish_reason": "stop",
+              "index": 1,
+              "logprobs": null,
+              "content_filter_results": {}
+            }
+          ],
+          "created": 1757499919,
+          "model": "gpt-5-mini-2025-08-07",
+          "object": "chat.completion.chunk",
+          "service_tier": null,
+          "system_fingerprint": null,
+          "usage": null
+        }
+      }
+    ],
+    "is_streaming": true
+  }
+}
diff --git a/tests/integration/recordings/responses/9f3d749cc1c8.json b/tests/integration/recordings/responses/9f3d749cc1c8.json
new file mode 100644
index 000000000..9a4539ab0
--- /dev/null
+++ b/tests/integration/recordings/responses/9f3d749cc1c8.json
@@ -0,0 +1,1150 @@
+{
+  "request": {
+    "method": "POST",
+    "url": "https://shan-mfbb618r-eastus2.cognitiveservices.azure.com/openai/v1/v1/chat/completions",
+    "headers": {},
+    "body": {
+      "model": "gpt-5-mini",
+      "messages": [
+        {
+          "role": "user",
+          "content": "What's the name of the Sun in latin?"
+        }
+      ],
+      "stream": true
+    },
+    "endpoint": "/v1/chat/completions",
+    "model": "gpt-5-mini"
+  },
+  "response": {
+    "body": [
+      {
+        "__type__": "openai.types.chat.chat_completion_chunk.ChatCompletionChunk",
+        "__data__": {
+          "id": "",
+          "choices": [],
+          "created": 0,
+          "model": "",
+          "object": "",
+          "service_tier": null,
+          "system_fingerprint": null,
+          "usage": null,
+          "prompt_filter_results": [
+            {
+              "prompt_index": 0,
+              "content_filter_results": {}
+            }
+          ]
+        }
+      },
+      {
+        "__type__": "openai.types.chat.chat_completion_chunk.ChatCompletionChunk",
+        "__data__": {
+          "id": "chatcmpl-CECIZYHVRY3J0EiPODz10HVzL7cIe",
+          "choices": [
+            {
+              "delta": {
+                "content": "",
+                "function_call": null,
+                "refusal": null,
+                "role": "assistant",
+                "tool_calls": null
+              },
+              "finish_reason": null,
+              "index": 0,
+              "logprobs": null,
+              "content_filter_results": {}
+            }
+          ],
+          "created": 1757499903,
+          "model": "gpt-5-mini-2025-08-07",
+          "object": "chat.completion.chunk",
+          "service_tier": null,
+          "system_fingerprint": null,
+          "usage": null
+        }
+      },
+      {
+        "__type__": "openai.types.chat.chat_completion_chunk.ChatCompletionChunk",
+        "__data__": {
+          "id": "chatcmpl-CECIZYHVRY3J0EiPODz10HVzL7cIe",
+          "choices": [
+            {
+              "delta": {
+                "content": "The",
+                "function_call": null,
+                "refusal": null,
+                "role": null,
+                "tool_calls": null
+              },
+              "finish_reason": null,
+              "index": 0,
+              "logprobs": null,
+              "content_filter_results": {}
+            }
+          ],
+          "created": 1757499903,
+          "model": "gpt-5-mini-2025-08-07",
+          "object": "chat.completion.chunk",
+          "service_tier": null,
+          "system_fingerprint": null,
+          "usage": null
+        }
+      },
+      {
+        "__type__": "openai.types.chat.chat_completion_chunk.ChatCompletionChunk",
+        "__data__": {
+          "id": "chatcmpl-CECIZYHVRY3J0EiPODz10HVzL7cIe",
+          "choices": [
+            {
+              "delta": {
+                "content": " Latin",
+                "function_call": null,
+                "refusal": null,
+                "role": null,
+                "tool_calls": null
+              },
+              "finish_reason": null,
+              "index": 0,
+              "logprobs": null,
+              "content_filter_results": {}
+            }
+          ],
+          "created": 1757499903,
+          "model": "gpt-5-mini-2025-08-07",
+          "object": "chat.completion.chunk",
+          "service_tier": null,
+          "system_fingerprint": null,
+          "usage": null
+        }
+      },
+      {
+        "__type__": "openai.types.chat.chat_completion_chunk.ChatCompletionChunk",
+        "__data__": {
+          "id": "chatcmpl-CECIZYHVRY3J0EiPODz10HVzL7cIe",
+          "choices": [
+            {
+              "delta": {
+                "content": " name",
+                "function_call": null,
+                "refusal": null,
+                "role": null,
+                "tool_calls": null
+              },
+              "finish_reason": null,
+              "index": 0,
+              "logprobs": null,
+              "content_filter_results": {}
+            }
+          ],
+          "created": 1757499903,
+          "model": "gpt-5-mini-2025-08-07",
+          "object": "chat.completion.chunk",
+          "service_tier": null,
+          "system_fingerprint": null,
+          "usage": null
+        }
+      },
+      {
+        "__type__": "openai.types.chat.chat_completion_chunk.ChatCompletionChunk",
+        "__data__": {
+          "id": "chatcmpl-CECIZYHVRY3J0EiPODz10HVzL7cIe",
+          "choices": [
+            {
+              "delta": {
+                "content": " is",
+                "function_call": null,
+                "refusal": null,
+                "role": null,
+                "tool_calls": null
+              },
+              "finish_reason": null,
+              "index": 0,
+              "logprobs": null,
+              "content_filter_results": {}
+            }
+          ],
+          "created": 1757499903,
+          "model": "gpt-5-mini-2025-08-07",
+          "object": "chat.completion.chunk",
+          "service_tier": null,
+          "system_fingerprint": null,
+          "usage": null
+        }
+      },
+      {
+        "__type__": "openai.types.chat.chat_completion_chunk.ChatCompletionChunk",
+        "__data__": {
+          "id": "chatcmpl-CECIZYHVRY3J0EiPODz10HVzL7cIe",
+          "choices": [
+            {
+              "delta": {
+                "content": " \"",
+                "function_call": null,
+                "refusal": null,
+                "role": null,
+                "tool_calls": null
+              },
+              "finish_reason": null,
+              "index": 0,
+              "logprobs": null,
+              "content_filter_results": {}
+            }
+          ],
+          "created": 1757499903,
+          "model": "gpt-5-mini-2025-08-07",
+          "object": "chat.completion.chunk",
+          "service_tier": null,
+          "system_fingerprint": null,
+          "usage": null
+        }
+      },
+      {
+        "__type__": "openai.types.chat.chat_completion_chunk.ChatCompletionChunk",
+        "__data__": {
+          "id": "chatcmpl-CECIZYHVRY3J0EiPODz10HVzL7cIe",
+          "choices": [
+            {
+              "delta": {
+                "content": "Sol",
+                "function_call": null,
+                "refusal": null,
+                "role": null,
+                "tool_calls": null
+              },
+              "finish_reason": null,
+              "index": 0,
+              "logprobs": null,
+              "content_filter_results": {}
+            }
+          ],
+          "created": 1757499903,
+          "model": "gpt-5-mini-2025-08-07",
+          "object": "chat.completion.chunk",
+          "service_tier": null,
+          "system_fingerprint": null,
+          "usage": null
+        }
+      },
+      {
+        "__type__": "openai.types.chat.chat_completion_chunk.ChatCompletionChunk",
+        "__data__": {
+          "id": "chatcmpl-CECIZYHVRY3J0EiPODz10HVzL7cIe",
+          "choices": [
+            {
+              "delta": {
+                "content": "\"",
+                "function_call": null,
+                "refusal": null,
+                "role": null,
+                "tool_calls": null
+              },
+              "finish_reason": null,
+              "index": 0,
+              "logprobs": null,
+              "content_filter_results": {}
+            }
+          ],
+          "created": 1757499903,
+          "model": "gpt-5-mini-2025-08-07",
+          "object": "chat.completion.chunk",
+          "service_tier": null,
+          "system_fingerprint": null,
+          "usage": null
+        }
+      },
+      {
+        "__type__": "openai.types.chat.chat_completion_chunk.ChatCompletionChunk",
+        "__data__": {
+          "id": "chatcmpl-CECIZYHVRY3J0EiPODz10HVzL7cIe",
+          "choices": [
+            {
+              "delta": {
+                "content": " (",
+                "function_call": null,
+                "refusal": null,
+                "role": null,
+                "tool_calls": null
+              },
+              "finish_reason": null,
+              "index": 0,
+              "logprobs": null,
+              "content_filter_results": {}
+            }
+          ],
+          "created": 1757499903,
+          "model": "gpt-5-mini-2025-08-07",
+          "object": "chat.completion.chunk",
+          "service_tier": null,
+          "system_fingerprint": null,
+          "usage": null
+        }
+      },
+      {
+        "__type__": "openai.types.chat.chat_completion_chunk.ChatCompletionChunk",
+        "__data__": {
+          "id": "chatcmpl-CECIZYHVRY3J0EiPODz10HVzL7cIe",
+          "choices": [
+            {
+              "delta": {
+                "content": "gen",
+                "function_call": null,
+                "refusal": null,
+                "role": null,
+                "tool_calls": null
+              },
+              "finish_reason": null,
+              "index": 0,
+              "logprobs": null,
+              "content_filter_results": {}
+            }
+          ],
+          "created": 1757499903,
+          "model": "gpt-5-mini-2025-08-07",
+          "object": "chat.completion.chunk",
+          "service_tier": null,
+          "system_fingerprint": null,
+          "usage": null
+        }
+      },
+      {
+        "__type__": "openai.types.chat.chat_completion_chunk.ChatCompletionChunk",
+        "__data__": {
+          "id": "chatcmpl-CECIZYHVRY3J0EiPODz10HVzL7cIe",
+          "choices": [
+            {
+              "delta": {
+                "content": "itive",
+                "function_call": null,
+                "refusal": null,
+                "role": null,
+                "tool_calls": null
+              },
+              "finish_reason": null,
+              "index": 0,
+              "logprobs": null,
+              "content_filter_results": {}
+            }
+          ],
+          "created": 1757499903,
+          "model": "gpt-5-mini-2025-08-07",
+          "object": "chat.completion.chunk",
+          "service_tier": null,
+          "system_fingerprint": null,
+          "usage": null
+        }
+      },
+      {
+        "__type__": "openai.types.chat.chat_completion_chunk.ChatCompletionChunk",
+        "__data__": {
+          "id": "chatcmpl-CECIZYHVRY3J0EiPODz10HVzL7cIe",
+          "choices": [
+            {
+              "delta": {
+                "content": " \"",
+                "function_call": null,
+                "refusal": null,
+                "role": null,
+                "tool_calls": null
+              },
+              "finish_reason": null,
+              "index": 0,
+              "logprobs": null,
+              "content_filter_results": {}
+            }
+          ],
+          "created": 1757499903,
+          "model": "gpt-5-mini-2025-08-07",
+          "object": "chat.completion.chunk",
+          "service_tier": null,
+          "system_fingerprint": null,
+          "usage": null
+        }
+      },
+      {
+        "__type__": "openai.types.chat.chat_completion_chunk.ChatCompletionChunk",
+        "__data__": {
+          "id": "chatcmpl-CECIZYHVRY3J0EiPODz10HVzL7cIe",
+          "choices": [
+            {
+              "delta": {
+                "content": "S",
+                "function_call": null,
+                "refusal": null,
+                "role": null,
+                "tool_calls": null
+              },
+              "finish_reason": null,
+              "index": 0,
+              "logprobs": null,
+              "content_filter_results": {}
+            }
+          ],
+          "created": 1757499903,
+          "model": "gpt-5-mini-2025-08-07",
+          "object": "chat.completion.chunk",
+          "service_tier": null,
+          "system_fingerprint": null,
+          "usage": null
+        }
+      },
+      {
+        "__type__": "openai.types.chat.chat_completion_chunk.ChatCompletionChunk",
+        "__data__": {
+          "id": "chatcmpl-CECIZYHVRY3J0EiPODz10HVzL7cIe",
+          "choices": [
+            {
+              "delta": {
+                "content": "olis",
+                "function_call": null,
+                "refusal": null,
+                "role": null,
+                "tool_calls": null
+              },
+              "finish_reason": null,
+              "index": 0,
+              "logprobs": null,
+              "content_filter_results": {}
+            }
+          ],
+          "created": 1757499903,
+          "model": "gpt-5-mini-2025-08-07",
+          "object": "chat.completion.chunk",
+          "service_tier": null,
+          "system_fingerprint": null,
+          "usage": null
+        }
+      },
+      {
+        "__type__": "openai.types.chat.chat_completion_chunk.ChatCompletionChunk",
+        "__data__": {
+          "id": "chatcmpl-CECIZYHVRY3J0EiPODz10HVzL7cIe",
+          "choices": [
+            {
+              "delta": {
+                "content": "\").",
+                "function_call": null,
+                "refusal": null,
+                "role": null,
+                "tool_calls": null
+              },
+              "finish_reason": null,
+              "index": 0,
+              "logprobs": null,
+              "content_filter_results": {}
+            }
+          ],
+          "created": 1757499903,
+          "model": "gpt-5-mini-2025-08-07",
+          "object": "chat.completion.chunk",
+          "service_tier": null,
+          "system_fingerprint": null,
+          "usage": null
+        }
+      },
+      {
+        "__type__": "openai.types.chat.chat_completion_chunk.ChatCompletionChunk",
+        "__data__": {
+          "id": "chatcmpl-CECIZYHVRY3J0EiPODz10HVzL7cIe",
+          "choices": [
+            {
+              "delta": {
+                "content": " It's",
+                "function_call": null,
+                "refusal": null,
+                "role": null,
+                "tool_calls": null
+              },
+              "finish_reason": null,
+              "index": 0,
+              "logprobs": null,
+              "content_filter_results": {}
+            }
+          ],
+          "created": 1757499903,
+          "model": "gpt-5-mini-2025-08-07",
+          "object": "chat.completion.chunk",
+          "service_tier": null,
+          "system_fingerprint": null,
+          "usage": null
+        }
+      },
+      {
+        "__type__": "openai.types.chat.chat_completion_chunk.ChatCompletionChunk",
+        "__data__": {
+          "id": "chatcmpl-CECIZYHVRY3J0EiPODz10HVzL7cIe",
+          "choices": [
+            {
+              "delta": {
+                "content": " used",
+                "function_call": null,
+                "refusal": null,
+                "role": null,
+                "tool_calls": null
+              },
+              "finish_reason": null,
+              "index": 0,
+              "logprobs": null,
+              "content_filter_results": {}
+            }
+          ],
+          "created": 1757499903,
+          "model": "gpt-5-mini-2025-08-07",
+          "object": "chat.completion.chunk",
+          "service_tier": null,
+          "system_fingerprint": null,
+          "usage": null
+        }
+      },
+      {
+        "__type__": "openai.types.chat.chat_completion_chunk.ChatCompletionChunk",
+        "__data__": {
+          "id": "chatcmpl-CECIZYHVRY3J0EiPODz10HVzL7cIe",
+          "choices": [
+            {
+              "delta": {
+                "content": " as",
+                "function_call": null,
+                "refusal": null,
+                "role": null,
+                "tool_calls": null
+              },
+              "finish_reason": null,
+              "index": 0,
+              "logprobs": null,
+              "content_filter_results": {}
+            }
+          ],
+          "created": 1757499903,
+          "model": "gpt-5-mini-2025-08-07",
+          "object": "chat.completion.chunk",
+          "service_tier": null,
+          "system_fingerprint": null,
+          "usage": null
+        }
+      },
+      {
+        "__type__": "openai.types.chat.chat_completion_chunk.ChatCompletionChunk",
+        "__data__": {
+          "id": "chatcmpl-CECIZYHVRY3J0EiPODz10HVzL7cIe",
+          "choices": [
+            {
+              "delta": {
+                "content": " the",
+                "function_call": null,
+                "refusal": null,
+                "role": null,
+                "tool_calls": null
+              },
+              "finish_reason": null,
+              "index": 0,
+              "logprobs": null,
+              "content_filter_results": {}
+            }
+          ],
+          "created": 1757499903,
+          "model": "gpt-5-mini-2025-08-07",
+          "object": "chat.completion.chunk",
+          "service_tier": null,
+          "system_fingerprint": null,
+          "usage": null
+        }
+      },
+      {
+        "__type__": "openai.types.chat.chat_completion_chunk.ChatCompletionChunk",
+        "__data__": {
+          "id": "chatcmpl-CECIZYHVRY3J0EiPODz10HVzL7cIe",
+          "choices": [
+            {
+              "delta": {
+                "content": " proper",
+                "function_call": null,
+                "refusal": null,
+                "role": null,
+                "tool_calls": null
+              },
+              "finish_reason": null,
+              "index": 0,
+              "logprobs": null,
+              "content_filter_results": {}
+            }
+          ],
+          "created": 1757499903,
+          "model": "gpt-5-mini-2025-08-07",
+          "object": "chat.completion.chunk",
+          "service_tier": null,
+          "system_fingerprint": null,
+          "usage": null
+        }
+      },
+      {
+        "__type__": "openai.types.chat.chat_completion_chunk.ChatCompletionChunk",
+        "__data__": {
+          "id": "chatcmpl-CECIZYHVRY3J0EiPODz10HVzL7cIe",
+          "choices": [
+            {
+              "delta": {
+                "content": " name",
+                "function_call": null,
+                "refusal": null,
+                "role": null,
+                "tool_calls": null
+              },
+              "finish_reason": null,
+              "index": 0,
+              "logprobs": null,
+              "content_filter_results": {}
+            }
+          ],
+          "created": 1757499903,
+          "model": "gpt-5-mini-2025-08-07",
+          "object": "chat.completion.chunk",
+          "service_tier": null,
+          "system_fingerprint": null,
+          "usage": null
+        }
+      },
+      {
+        "__type__": "openai.types.chat.chat_completion_chunk.ChatCompletionChunk",
+        "__data__": {
+          "id": "chatcmpl-CECIZYHVRY3J0EiPODz10HVzL7cIe",
+          "choices": [
+            {
+              "delta": {
+                "content": " of",
+                "function_call": null,
+                "refusal": null,
+                "role": null,
+                "tool_calls": null
+              },
+              "finish_reason": null,
+              "index": 0,
+              "logprobs": null,
+              "content_filter_results": {}
+            }
+          ],
+          "created": 1757499903,
+          "model": "gpt-5-mini-2025-08-07",
+          "object": "chat.completion.chunk",
+          "service_tier": null,
+          "system_fingerprint": null,
+          "usage": null
+        }
+      },
+      {
+        "__type__": "openai.types.chat.chat_completion_chunk.ChatCompletionChunk",
+        "__data__": {
+          "id": "chatcmpl-CECIZYHVRY3J0EiPODz10HVzL7cIe",
+          "choices": [
+            {
+              "delta": {
+                "content": " the",
+                "function_call": null,
+                "refusal": null,
+                "role": null,
+                "tool_calls": null
+              },
+              "finish_reason": null,
+              "index": 0,
+              "logprobs": null,
+              "content_filter_results": {}
+            }
+          ],
+          "created": 1757499903,
+          "model": "gpt-5-mini-2025-08-07",
+          "object": "chat.completion.chunk",
+          "service_tier": null,
+          "system_fingerprint": null,
+          "usage": null
+        }
+      },
+      {
+        "__type__": "openai.types.chat.chat_completion_chunk.ChatCompletionChunk",
+        "__data__": {
+          "id": "chatcmpl-CECIZYHVRY3J0EiPODz10HVzL7cIe",
+          "choices": [
+            {
+              "delta": {
+                "content": " Sun",
+                "function_call": null,
+                "refusal": null,
+                "role": null,
+                "tool_calls": null
+              },
+              "finish_reason": null,
+              "index": 0,
+              "logprobs": null,
+              "content_filter_results": {}
+            }
+          ],
+          "created": 1757499903,
+          "model": "gpt-5-mini-2025-08-07",
+          "object": "chat.completion.chunk",
+          "service_tier": null,
+          "system_fingerprint": null,
+          "usage": null
+        }
+      },
+      {
+        "__type__": "openai.types.chat.chat_completion_chunk.ChatCompletionChunk",
+        "__data__": {
+          "id": "chatcmpl-CECIZYHVRY3J0EiPODz10HVzL7cIe",
+          "choices": [
+            {
+              "delta": {
+                "content": ";",
+                "function_call": null,
+                "refusal": null,
+                "role": null,
+                "tool_calls": null
+              },
+              "finish_reason": null,
+              "index": 0,
+              "logprobs": null,
+              "content_filter_results": {}
+            }
+          ],
+          "created": 1757499903,
+          "model": "gpt-5-mini-2025-08-07",
+          "object": "chat.completion.chunk",
+          "service_tier": null,
+          "system_fingerprint": null,
+          "usage": null
+        }
+      },
+      {
+        "__type__": "openai.types.chat.chat_completion_chunk.ChatCompletionChunk",
+        "__data__": {
+          "id": "chatcmpl-CECIZYHVRY3J0EiPODz10HVzL7cIe",
+          "choices": [
+            {
+              "delta": {
+                "content": " poets",
+                "function_call": null,
+                "refusal": null,
+                "role": null,
+                "tool_calls": null
+              },
+              "finish_reason": null,
+              "index": 0,
+              "logprobs": null,
+              "content_filter_results": {}
+            }
+          ],
+          "created": 1757499903,
+          "model": "gpt-5-mini-2025-08-07",
+          "object": "chat.completion.chunk",
+          "service_tier": null,
+          "system_fingerprint": null,
+          "usage": null
+        }
+      },
+      {
+        "__type__": "openai.types.chat.chat_completion_chunk.ChatCompletionChunk",
+        "__data__": {
+          "id": "chatcmpl-CECIZYHVRY3J0EiPODz10HVzL7cIe",
+          "choices": [
+            {
+              "delta": {
+                "content": " also",
+                "function_call": null,
+                "refusal": null,
+                "role": null,
+                "tool_calls": null
+              },
+              "finish_reason": null,
+              "index": 0,
+              "logprobs": null,
+              "content_filter_results": {}
+            }
+          ],
+          "created": 1757499903,
+          "model": "gpt-5-mini-2025-08-07",
+          "object": "chat.completion.chunk",
+          "service_tier": null,
+          "system_fingerprint": null,
+          "usage": null
+        }
+      },
+      {
+        "__type__": "openai.types.chat.chat_completion_chunk.ChatCompletionChunk",
+        "__data__": {
+          "id": "chatcmpl-CECIZYHVRY3J0EiPODz10HVzL7cIe",
+          "choices": [
+            {
+              "delta": {
+                "content": " sometimes",
+                "function_call": null,
+                "refusal": null,
+                "role": null,
+                "tool_calls": null
+              },
+              "finish_reason": null,
+              "index": 0,
+              "logprobs": null,
+              "content_filter_results": {}
+            }
+          ],
+          "created": 1757499903,
+          "model": "gpt-5-mini-2025-08-07",
+          "object": "chat.completion.chunk",
+          "service_tier": null,
+          "system_fingerprint": null,
+          "usage": null
+        }
+      },
+      {
+        "__type__": "openai.types.chat.chat_completion_chunk.ChatCompletionChunk",
+        "__data__": {
+          "id": "chatcmpl-CECIZYHVRY3J0EiPODz10HVzL7cIe",
+          "choices": [
+            {
+              "delta": {
+                "content": " used",
+                "function_call": null,
+                "refusal": null,
+                "role": null,
+                "tool_calls": null
+              },
+              "finish_reason": null,
+              "index": 0,
+              "logprobs": null,
+              "content_filter_results": {}
+            }
+          ],
+          "created": 1757499903,
+          "model": "gpt-5-mini-2025-08-07",
+          "object": "chat.completion.chunk",
+          "service_tier": null,
+          "system_fingerprint": null,
+          "usage": null
+        }
+      },
+      {
+        "__type__": "openai.types.chat.chat_completion_chunk.ChatCompletionChunk",
+        "__data__": {
+          "id": "chatcmpl-CECIZYHVRY3J0EiPODz10HVzL7cIe",
+          "choices": [
+            {
+              "delta": {
+                "content": " Greek",
+                "function_call": null,
+                "refusal": null,
+                "role": null,
+                "tool_calls": null
+              },
+              "finish_reason": null,
+              "index": 0,
+              "logprobs": null,
+              "content_filter_results": {}
+            }
+          ],
+          "created": 1757499903,
+          "model": "gpt-5-mini-2025-08-07",
+          "object": "chat.completion.chunk",
+          "service_tier": null,
+          "system_fingerprint": null,
+          "usage": null
+        }
+      },
+      {
+        "__type__": "openai.types.chat.chat_completion_chunk.ChatCompletionChunk",
+        "__data__": {
+          "id": "chatcmpl-CECIZYHVRY3J0EiPODz10HVzL7cIe",
+          "choices": [
+            {
+              "delta": {
+                "content": "-derived",
+                "function_call": null,
+                "refusal": null,
+                "role": null,
+                "tool_calls": null
+              },
+              "finish_reason": null,
+              "index": 0,
+              "logprobs": null,
+              "content_filter_results": {}
+            }
+          ],
+          "created": 1757499903,
+          "model": "gpt-5-mini-2025-08-07",
+          "object": "chat.completion.chunk",
+          "service_tier": null,
+          "system_fingerprint": null,
+          "usage": null
+        }
+      },
+      {
+        "__type__": "openai.types.chat.chat_completion_chunk.ChatCompletionChunk",
+        "__data__": {
+          "id": "chatcmpl-CECIZYHVRY3J0EiPODz10HVzL7cIe",
+          "choices": [
+            {
+              "delta": {
+                "content": " ep",
+                "function_call": null,
+                "refusal": null,
+                "role": null,
+                "tool_calls": null
+              },
+              "finish_reason": null,
+              "index": 0,
+              "logprobs": null,
+              "content_filter_results": {}
+            }
+          ],
+          "created": 1757499903,
+          "model": "gpt-5-mini-2025-08-07",
+          "object": "chat.completion.chunk",
+          "service_tier": null,
+          "system_fingerprint": null,
+          "usage": null
+        }
+      },
+      {
+        "__type__": "openai.types.chat.chat_completion_chunk.ChatCompletionChunk",
+        "__data__": {
+          "id": "chatcmpl-CECIZYHVRY3J0EiPODz10HVzL7cIe",
+          "choices": [
+            {
+              "delta": {
+                "content": "ithe",
+                "function_call": null,
+                "refusal": null,
+                "role": null,
+                "tool_calls": null
+              },
+              "finish_reason": null,
+              "index": 0,
+              "logprobs": null,
+              "content_filter_results": {}
+            }
+          ],
+          "created": 1757499903,
+          "model": "gpt-5-mini-2025-08-07",
+          "object": "chat.completion.chunk",
+          "service_tier": null,
+          "system_fingerprint": null,
+          "usage": null
+        }
+      },
+      {
+        "__type__": "openai.types.chat.chat_completion_chunk.ChatCompletionChunk",
+        "__data__": {
+          "id": "chatcmpl-CECIZYHVRY3J0EiPODz10HVzL7cIe",
+          "choices": [
+            {
+              "delta": {
+                "content": "ts",
+                "function_call": null,
+                "refusal": null,
+                "role": null,
+                "tool_calls": null
+              },
+              "finish_reason": null,
+              "index": 0,
+              "logprobs": null,
+              "content_filter_results": {}
+            }
+          ],
+          "created": 1757499903,
+          "model": "gpt-5-mini-2025-08-07",
+          "object": "chat.completion.chunk",
+          "service_tier": null,
+          "system_fingerprint": null,
+          "usage": null
+        }
+      },
+      {
+        "__type__": "openai.types.chat.chat_completion_chunk.ChatCompletionChunk",
+        "__data__": {
+          "id": "chatcmpl-CECIZYHVRY3J0EiPODz10HVzL7cIe",
+          "choices": [
+            {
+              "delta": {
+                "content": " like",
+                "function_call": null,
+                "refusal": null,
+                "role": null,
+                "tool_calls": null
+              },
+              "finish_reason": null,
+              "index": 0,
+              "logprobs": null,
+              "content_filter_results": {}
+            }
+          ],
+          "created": 1757499903,
+          "model": "gpt-5-mini-2025-08-07",
+          "object": "chat.completion.chunk",
+          "service_tier": null,
+          "system_fingerprint": null,
+          "usage": null
+        }
+      },
+      {
+        "__type__": "openai.types.chat.chat_completion_chunk.ChatCompletionChunk",
+        "__data__": {
+          "id": "chatcmpl-CECIZYHVRY3J0EiPODz10HVzL7cIe",
+          "choices": [
+            {
+              "delta": {
+                "content": " \"",
+                "function_call": null,
+                "refusal": null,
+                "role": null,
+                "tool_calls": null
+              },
+              "finish_reason": null,
+              "index": 0,
+              "logprobs": null,
+              "content_filter_results": {}
+            }
+          ],
+          "created": 1757499903,
+          "model": "gpt-5-mini-2025-08-07",
+          "object": "chat.completion.chunk",
+          "service_tier": null,
+          "system_fingerprint": null,
+          "usage": null
+        }
+      },
+      {
+        "__type__": "openai.types.chat.chat_completion_chunk.ChatCompletionChunk",
+        "__data__": {
+          "id": "chatcmpl-CECIZYHVRY3J0EiPODz10HVzL7cIe",
+          "choices": [
+            {
+              "delta": {
+                "content": "Pho",
+                "function_call": null,
+                "refusal": null,
+                "role": null,
+                "tool_calls": null
+              },
+              "finish_reason": null,
+              "index": 0,
+              "logprobs": null,
+              "content_filter_results": {}
+            }
+          ],
+          "created": 1757499903,
+          "model": "gpt-5-mini-2025-08-07",
+          "object": "chat.completion.chunk",
+          "service_tier": null,
+          "system_fingerprint": null,
+          "usage": null
+        }
+      },
+      {
+        "__type__": "openai.types.chat.chat_completion_chunk.ChatCompletionChunk",
+        "__data__": {
+          "id": "chatcmpl-CECIZYHVRY3J0EiPODz10HVzL7cIe",
+          "choices": [
+            {
+              "delta": {
+                "content": "eb",
+                "function_call": null,
+                "refusal": null,
+                "role": null,
+                "tool_calls": null
+              },
+              "finish_reason": null,
+              "index": 0,
+              "logprobs": null,
+              "content_filter_results": {}
+            }
+          ],
+          "created": 1757499903,
+          "model": "gpt-5-mini-2025-08-07",
+          "object": "chat.completion.chunk",
+          "service_tier": null,
+          "system_fingerprint": null,
+          "usage": null
+        }
+      },
+      {
+        "__type__": "openai.types.chat.chat_completion_chunk.ChatCompletionChunk",
+        "__data__": {
+          "id": "chatcmpl-CECIZYHVRY3J0EiPODz10HVzL7cIe",
+          "choices": [
+            {
+              "delta": {
+                "content": "us",
+                "function_call": null,
+                "refusal": null,
+                "role": null,
+                "tool_calls": null
+              },
+              "finish_reason": null,
+              "index": 0,
+              "logprobs": null,
+              "content_filter_results": {}
+            }
+          ],
+          "created": 1757499903,
+          "model": "gpt-5-mini-2025-08-07",
+          "object": "chat.completion.chunk",
+          "service_tier": null,
+          "system_fingerprint": null,
+          "usage": null
+        }
+      },
+      {
+        "__type__": "openai.types.chat.chat_completion_chunk.ChatCompletionChunk",
+        "__data__": {
+          "id": "chatcmpl-CECIZYHVRY3J0EiPODz10HVzL7cIe",
+          "choices": [
+            {
+              "delta": {
+                "content": ".\"",
+                "function_call": null,
+                "refusal": null,
+                "role": null,
+                "tool_calls": null
+              },
+              "finish_reason": null,
+              "index": 0,
+              "logprobs": null,
+              "content_filter_results": {}
+            }
+          ],
+          "created": 1757499903,
+          "model": "gpt-5-mini-2025-08-07",
+          "object": "chat.completion.chunk",
+          "service_tier": null,
+          "system_fingerprint": null,
+          "usage": null
+        }
+      },
+      {
+        "__type__": "openai.types.chat.chat_completion_chunk.ChatCompletionChunk",
+        "__data__": {
+          "id": "chatcmpl-CECIZYHVRY3J0EiPODz10HVzL7cIe",
+          "choices": [
+            {
+              "delta": {
+                "content": null,
+                "function_call": null,
+                "refusal": null,
+                "role": null,
+                "tool_calls": null
+              },
+              "finish_reason": "stop",
+              "index": 0,
+              "logprobs": null,
+              "content_filter_results": {}
+            }
+          ],
+          "created": 1757499903,
+          "model": "gpt-5-mini-2025-08-07",
+          "object": "chat.completion.chunk",
+          "service_tier": null,
+          "system_fingerprint": null,
+          "usage": null
+        }
+      }
+    ],
+    "is_streaming": true
+  }
+}
diff --git a/tests/integration/recordings/responses/c791119e6359.json b/tests/integration/recordings/responses/c791119e6359.json
new file mode 100644
index 000000000..6ac123e92
--- /dev/null
+++ b/tests/integration/recordings/responses/c791119e6359.json
@@ -0,0 +1,98 @@
+{
+  "request": {
+    "method": "POST",
+    "url": "https://shan-mfbb618r-eastus2.cognitiveservices.azure.com/openai/v1/v1/chat/completions",
+    "headers": {},
+    "body": {
+      "model": "gpt-5-mini",
+      "messages": [
+        {
+          "role": "user",
+          "content": "What's the weather in Tokyo? Use the get_weather function to get the weather."
+        }
+      ],
+      "stream": false,
+      "tools": [
+        {
+          "type": "function",
+          "function": {
+            "name": "get_weather",
+            "description": "Get the weather in a given city",
+            "parameters": {
+              "type": "object",
+              "properties": {
+                "city": {
+                  "type": "string",
+                  "description": "The city to get the weather for"
+                }
+              }
+            }
+          }
+        }
+      ]
+    },
+    "endpoint": "/v1/chat/completions",
+    "model": "gpt-5-mini"
+  },
+  "response": {
+    "body": {
+      "__type__": "openai.types.chat.chat_completion.ChatCompletion",
+      "__data__": {
+        "id": "chatcmpl-CECIwq9Odd0mOJMmw7ytv8iEazH4H",
+        "choices": [
+          {
+            "finish_reason": "tool_calls",
+            "index": 0,
+            "logprobs": null,
+            "message": {
+              "content": null,
+              "refusal": null,
+              "role": "assistant",
+              "annotations": [],
+              "audio": null,
+              "function_call": null,
+              "tool_calls": [
+                {
+                  "id": "call_yw18spRc1jjUlEyabbXBhB33",
+                  "function": {
+                    "arguments": "{\"city\":\"Tokyo\"}",
+                    "name": "get_weather"
+                  },
+                  "type": "function"
+                }
+              ]
+            },
+            "content_filter_results": {}
+          }
+        ],
+        "created": 1757499926,
+        "model": "gpt-5-mini-2025-08-07",
+        "object": "chat.completion",
+        "service_tier": null,
+        "system_fingerprint": null,
+        "usage": {
+          "completion_tokens": 88,
+          "prompt_tokens": 151,
+          "total_tokens": 239,
+          "completion_tokens_details": {
+            "accepted_prediction_tokens": 0,
+            "audio_tokens": 0,
+            "reasoning_tokens": 64,
+            "rejected_prediction_tokens": 0
+          },
+          "prompt_tokens_details": {
+            "audio_tokens": 0,
+            "cached_tokens": 0
+          }
+        },
+        "prompt_filter_results": [
+          {
+            "prompt_index": 0,
+            "content_filter_results": {}
+          }
+        ]
+      }
+    },
+    "is_streaming": false
+  }
+}
diff --git a/tests/integration/recordings/responses/d3e27b7234e2.json b/tests/integration/recordings/responses/d3e27b7234e2.json
new file mode 100644
index 000000000..7f266c392
--- /dev/null
+++ b/tests/integration/recordings/responses/d3e27b7234e2.json
@@ -0,0 +1,2150 @@
+{
+  "request": {
+    "method": "POST",
+    "url": "https://shan-mfbb618r-eastus2.cognitiveservices.azure.com/openai/v1/v1/chat/completions",
+    "headers": {},
+    "body": {
+      "model": "gpt-5-mini",
+      "messages": [
+        {
+          "role": "user",
+          "content": "What's the name of the Sun in latin?"
+        }
+      ],
+      "n": 2,
+      "stream": true
+    },
+    "endpoint": "/v1/chat/completions",
+    "model": "gpt-5-mini"
+  },
+  "response": {
+    "body": [
+      {
+        "__type__": "openai.types.chat.chat_completion_chunk.ChatCompletionChunk",
+        "__data__": {
+          "id": "",
+          "choices": [],
+          "created": 0,
+          "model": "",
+          "object": "",
+          "service_tier": null,
+          "system_fingerprint": null,
+          "usage": null,
+          "prompt_filter_results": [
+            {
+              "prompt_index": 0,
+              "content_filter_results": {}
+            }
+          ]
+        }
+      },
+      {
+        "__type__": "openai.types.chat.chat_completion_chunk.ChatCompletionChunk",
+        "__data__": {
+          "id": "chatcmpl-CECIdmgM7bbQr6YefuUbY4cycibvm",
+          "choices": [
+            {
+              "delta": {
+                "content": "",
+                "function_call": null,
+                "refusal": null,
+                "role": "assistant",
+                "tool_calls": null
+              },
+              "finish_reason": null,
+              "index": 0,
+              "logprobs": null,
+              "content_filter_results": {}
+            }
+          ],
+          "created": 1757499907,
+          "model": "gpt-5-mini-2025-08-07",
+          "object": "chat.completion.chunk",
+          "service_tier": null,
+          "system_fingerprint": null,
+          "usage": null
+        }
+      },
+      {
+        "__type__": "openai.types.chat.chat_completion_chunk.ChatCompletionChunk",
+        "__data__": {
+          "id": "chatcmpl-CECIdmgM7bbQr6YefuUbY4cycibvm",
+          "choices": [
+            {
+              "delta": {
+                "content": "In",
+                "function_call": null,
+                "refusal": null,
+                "role": null,
+                "tool_calls": null
+              },
+              "finish_reason": null,
+              "index": 0,
+              "logprobs": null,
+              "content_filter_results": {}
+            }
+          ],
+          "created": 1757499907,
+          "model": "gpt-5-mini-2025-08-07",
+          "object": "chat.completion.chunk",
+          "service_tier": null,
+          "system_fingerprint": null,
+          "usage": null
+        }
+      },
+      {
+        "__type__": "openai.types.chat.chat_completion_chunk.ChatCompletionChunk",
+        "__data__": {
+          "id": "chatcmpl-CECIdmgM7bbQr6YefuUbY4cycibvm",
+          "choices": [
+            {
+              "delta": {
+                "content": " Latin",
+                "function_call": null,
+                "refusal": null,
+                "role": null,
+                "tool_calls": null
+              },
+              "finish_reason": null,
+              "index": 0,
+              "logprobs": null,
+              "content_filter_results": {}
+            }
+          ],
+          "created": 1757499907,
+          "model": "gpt-5-mini-2025-08-07",
+          "object": "chat.completion.chunk",
+          "service_tier": null,
+          "system_fingerprint": null,
+          "usage": null
+        }
+      },
+      {
+        "__type__": "openai.types.chat.chat_completion_chunk.ChatCompletionChunk",
+        "__data__": {
+          "id": "chatcmpl-CECIdmgM7bbQr6YefuUbY4cycibvm",
+          "choices": [
+            {
+              "delta": {
+                "content": " the",
+                "function_call": null,
+                "refusal": null,
+                "role": null,
+                "tool_calls": null
+              },
+              "finish_reason": null,
+              "index": 0,
+              "logprobs": null,
+              "content_filter_results": {}
+            }
+          ],
+          "created": 1757499907,
+          "model": "gpt-5-mini-2025-08-07",
+          "object": "chat.completion.chunk",
+          "service_tier": null,
+          "system_fingerprint": null,
+          "usage": null
+        }
+      },
+      {
+        "__type__": "openai.types.chat.chat_completion_chunk.ChatCompletionChunk",
+        "__data__": {
+          "id": "chatcmpl-CECIdmgM7bbQr6YefuUbY4cycibvm",
+          "choices": [
+            {
+              "delta": {
+                "content": " Sun",
+                "function_call": null,
+                "refusal": null,
+                "role": null,
+                "tool_calls": null
+              },
+              "finish_reason": null,
+              "index": 0,
+              "logprobs": null,
+              "content_filter_results": {}
+            }
+          ],
+          "created": 1757499907,
+          "model": "gpt-5-mini-2025-08-07",
+          "object": "chat.completion.chunk",
+          "service_tier": null,
+          "system_fingerprint": null,
+          "usage": null
+        }
+      },
+      {
+        "__type__": "openai.types.chat.chat_completion_chunk.ChatCompletionChunk",
+        "__data__": {
+          "id": "chatcmpl-CECIdmgM7bbQr6YefuUbY4cycibvm",
+          "choices": [
+            {
+              "delta": {
+                "content": " is",
+                "function_call": null,
+                "refusal": null,
+                "role": null,
+                "tool_calls": null
+              },
+              "finish_reason": null,
+              "index": 0,
+              "logprobs": null,
+              "content_filter_results": {}
+            }
+          ],
+          "created": 1757499907,
+          "model": "gpt-5-mini-2025-08-07",
+          "object": "chat.completion.chunk",
+          "service_tier": null,
+          "system_fingerprint": null,
+          "usage": null
+        }
+      },
+      {
+        "__type__": "openai.types.chat.chat_completion_chunk.ChatCompletionChunk",
+        "__data__": {
+          "id": "chatcmpl-CECIdmgM7bbQr6YefuUbY4cycibvm",
+          "choices": [
+            {
+              "delta": {
+                "content": " called",
+                "function_call": null,
+                "refusal": null,
+                "role": null,
+                "tool_calls": null
+              },
+              "finish_reason": null,
+              "index": 0,
+              "logprobs": null,
+              "content_filter_results": {}
+            }
+          ],
+          "created": 1757499907,
+          "model": "gpt-5-mini-2025-08-07",
+          "object": "chat.completion.chunk",
+          "service_tier": null,
+          "system_fingerprint": null,
+          "usage": null
+        }
+      },
+      {
+        "__type__": "openai.types.chat.chat_completion_chunk.ChatCompletionChunk",
+        "__data__": {
+          "id": "chatcmpl-CECIdmgM7bbQr6YefuUbY4cycibvm",
+          "choices": [
+            {
+              "delta": {
+                "content": " \"",
+                "function_call": null,
+                "refusal": null,
+                "role": null,
+                "tool_calls": null
+              },
+              "finish_reason": null,
+              "index": 0,
+              "logprobs": null,
+              "content_filter_results": {}
+            }
+          ],
+          "created": 1757499907,
+          "model": "gpt-5-mini-2025-08-07",
+          "object": "chat.completion.chunk",
+          "service_tier": null,
+          "system_fingerprint": null,
+          "usage": null
+        }
+      },
+      {
+        "__type__": "openai.types.chat.chat_completion_chunk.ChatCompletionChunk",
+        "__data__": {
+          "id": "chatcmpl-CECIdmgM7bbQr6YefuUbY4cycibvm",
+          "choices": [
+            {
+              "delta": {
+                "content": "Sol",
+                "function_call": null,
+                "refusal": null,
+                "role": null,
+                "tool_calls": null
+              },
+              "finish_reason": null,
+              "index": 0,
+              "logprobs": null,
+              "content_filter_results": {}
+            }
+          ],
+          "created": 1757499907,
+          "model": "gpt-5-mini-2025-08-07",
+          "object": "chat.completion.chunk",
+          "service_tier": null,
+          "system_fingerprint": null,
+          "usage": null
+        }
+      },
+      {
+        "__type__": "openai.types.chat.chat_completion_chunk.ChatCompletionChunk",
+        "__data__": {
+          "id": "chatcmpl-CECIdmgM7bbQr6YefuUbY4cycibvm",
+          "choices": [
+            {
+              "delta": {
+                "content": "\"",
+                "function_call": null,
+                "refusal": null,
+                "role": null,
+                "tool_calls": null
+              },
+              "finish_reason": null,
+              "index": 0,
+              "logprobs": null,
+              "content_filter_results": {}
+            }
+          ],
+          "created": 1757499907,
+          "model": "gpt-5-mini-2025-08-07",
+          "object": "chat.completion.chunk",
+          "service_tier": null,
+          "system_fingerprint": null,
+          "usage": null
+        }
+      },
+      {
+        "__type__": "openai.types.chat.chat_completion_chunk.ChatCompletionChunk",
+        "__data__": {
+          "id": "chatcmpl-CECIdmgM7bbQr6YefuUbY4cycibvm",
+          "choices": [
+            {
+              "delta": {
+                "content": " (",
+                "function_call": null,
+                "refusal": null,
+                "role": null,
+                "tool_calls": null
+              },
+              "finish_reason": null,
+              "index": 0,
+              "logprobs": null,
+              "content_filter_results": {}
+            }
+          ],
+          "created": 1757499907,
+          "model": "gpt-5-mini-2025-08-07",
+          "object": "chat.completion.chunk",
+          "service_tier": null,
+          "system_fingerprint": null,
+          "usage": null
+        }
+      },
+      {
+        "__type__": "openai.types.chat.chat_completion_chunk.ChatCompletionChunk",
+        "__data__": {
+          "id": "chatcmpl-CECIdmgM7bbQr6YefuUbY4cycibvm",
+          "choices": [
+            {
+              "delta": {
+                "content": "sol",
+                "function_call": null,
+                "refusal": null,
+                "role": null,
+                "tool_calls": null
+              },
+              "finish_reason": null,
+              "index": 0,
+              "logprobs": null,
+              "content_filter_results": {}
+            }
+          ],
+          "created": 1757499907,
+          "model": "gpt-5-mini-2025-08-07",
+          "object": "chat.completion.chunk",
+          "service_tier": null,
+          "system_fingerprint": null,
+          "usage": null
+        }
+      },
+      {
+        "__type__": "openai.types.chat.chat_completion_chunk.ChatCompletionChunk",
+        "__data__": {
+          "id": "chatcmpl-CECIdmgM7bbQr6YefuUbY4cycibvm",
+          "choices": [
+            {
+              "delta": {
+                "content": ",",
+                "function_call": null,
+                "refusal": null,
+                "role": null,
+                "tool_calls": null
+              },
+              "finish_reason": null,
+              "index": 0,
+              "logprobs": null,
+              "content_filter_results": {}
+            }
+          ],
+          "created": 1757499907,
+          "model": "gpt-5-mini-2025-08-07",
+          "object": "chat.completion.chunk",
+          "service_tier": null,
+          "system_fingerprint": null,
+          "usage": null
+        }
+      },
+      {
+        "__type__": "openai.types.chat.chat_completion_chunk.ChatCompletionChunk",
+        "__data__": {
+          "id": "chatcmpl-CECIdmgM7bbQr6YefuUbY4cycibvm",
+          "choices": [
+            {
+              "delta": {
+                "content": " gen",
+                "function_call": null,
+                "refusal": null,
+                "role": null,
+                "tool_calls": null
+              },
+              "finish_reason": null,
+              "index": 0,
+              "logprobs": null,
+              "content_filter_results": {}
+            }
+          ],
+          "created": 1757499907,
+          "model": "gpt-5-mini-2025-08-07",
+          "object": "chat.completion.chunk",
+          "service_tier": null,
+          "system_fingerprint": null,
+          "usage": null
+        }
+      },
+      {
+        "__type__": "openai.types.chat.chat_completion_chunk.ChatCompletionChunk",
+        "__data__": {
+          "id": "chatcmpl-CECIdmgM7bbQr6YefuUbY4cycibvm",
+          "choices": [
+            {
+              "delta": {
+                "content": "",
+                "function_call": null,
+                "refusal": null,
+                "role": "assistant",
+                "tool_calls": null
+              },
+              "finish_reason": null,
+              "index": 1,
+              "logprobs": null,
+              "content_filter_results": {}
+            }
+          ],
+          "created": 1757499907,
+          "model": "gpt-5-mini-2025-08-07",
+          "object": "chat.completion.chunk",
+          "service_tier": null,
+          "system_fingerprint": null,
+          "usage": null
+        }
+      },
+      {
+        "__type__": "openai.types.chat.chat_completion_chunk.ChatCompletionChunk",
+        "__data__": {
+          "id": "chatcmpl-CECIdmgM7bbQr6YefuUbY4cycibvm",
+          "choices": [
+            {
+              "delta": {
+                "content": "itive",
+                "function_call": null,
+                "refusal": null,
+                "role": null,
+                "tool_calls": null
+              },
+              "finish_reason": null,
+              "index": 0,
+              "logprobs": null,
+              "content_filter_results": {}
+            }
+          ],
+          "created": 1757499907,
+          "model": "gpt-5-mini-2025-08-07",
+          "object": "chat.completion.chunk",
+          "service_tier": null,
+          "system_fingerprint": null,
+          "usage": null
+        }
+      },
+      {
+        "__type__": "openai.types.chat.chat_completion_chunk.ChatCompletionChunk",
+        "__data__": {
+          "id": "chatcmpl-CECIdmgM7bbQr6YefuUbY4cycibvm",
+          "choices": [
+            {
+              "delta": {
+                "content": " sol",
+                "function_call": null,
+                "refusal": null,
+                "role": null,
+                "tool_calls": null
+              },
+              "finish_reason": null,
+              "index": 0,
+              "logprobs": null,
+              "content_filter_results": {}
+            }
+          ],
+          "created": 1757499907,
+          "model": "gpt-5-mini-2025-08-07",
+          "object": "chat.completion.chunk",
+          "service_tier": null,
+          "system_fingerprint": null,
+          "usage": null
+        }
+      },
+      {
+        "__type__": "openai.types.chat.chat_completion_chunk.ChatCompletionChunk",
+        "__data__": {
+          "id": "chatcmpl-CECIdmgM7bbQr6YefuUbY4cycibvm",
+          "choices": [
+            {
+              "delta": {
+                "content": "is",
+                "function_call": null,
+                "refusal": null,
+                "role": null,
+                "tool_calls": null
+              },
+              "finish_reason": null,
+              "index": 0,
+              "logprobs": null,
+              "content_filter_results": {}
+            }
+          ],
+          "created": 1757499907,
+          "model": "gpt-5-mini-2025-08-07",
+          "object": "chat.completion.chunk",
+          "service_tier": null,
+          "system_fingerprint": null,
+          "usage": null
+        }
+      },
+      {
+        "__type__": "openai.types.chat.chat_completion_chunk.ChatCompletionChunk",
+        "__data__": {
+          "id": "chatcmpl-CECIdmgM7bbQr6YefuUbY4cycibvm",
+          "choices": [
+            {
+              "delta": {
+                "content": "The",
+                "function_call": null,
+                "refusal": null,
+                "role": null,
+                "tool_calls": null
+              },
+              "finish_reason": null,
+              "index": 1,
+              "logprobs": null,
+              "content_filter_results": {}
+            }
+          ],
+          "created": 1757499907,
+          "model": "gpt-5-mini-2025-08-07",
+          "object": "chat.completion.chunk",
+          "service_tier": null,
+          "system_fingerprint": null,
+          "usage": null
+        }
+      },
+      {
+        "__type__": "openai.types.chat.chat_completion_chunk.ChatCompletionChunk",
+        "__data__": {
+          "id": "chatcmpl-CECIdmgM7bbQr6YefuUbY4cycibvm",
+          "choices": [
+            {
+              "delta": {
+                "content": " Latin",
+                "function_call": null,
+                "refusal": null,
+                "role": null,
+                "tool_calls": null
+              },
+              "finish_reason": null,
+              "index": 1,
+              "logprobs": null,
+              "content_filter_results": {}
+            }
+          ],
+          "created": 1757499907,
+          "model": "gpt-5-mini-2025-08-07",
+          "object": "chat.completion.chunk",
+          "service_tier": null,
+          "system_fingerprint": null,
+          "usage": null
+        }
+      },
+      {
+        "__type__": "openai.types.chat.chat_completion_chunk.ChatCompletionChunk",
+        "__data__": {
+          "id": "chatcmpl-CECIdmgM7bbQr6YefuUbY4cycibvm",
+          "choices": [
+            {
+              "delta": {
+                "content": " name",
+                "function_call": null,
+                "refusal": null,
+                "role": null,
+                "tool_calls": null
+              },
+              "finish_reason": null,
+              "index": 1,
+              "logprobs": null,
+              "content_filter_results": {}
+            }
+          ],
+          "created": 1757499907,
+          "model": "gpt-5-mini-2025-08-07",
+          "object": "chat.completion.chunk",
+          "service_tier": null,
+          "system_fingerprint": null,
+          "usage": null
+        }
+      },
+      {
+        "__type__": "openai.types.chat.chat_completion_chunk.ChatCompletionChunk",
+        "__data__": {
+          "id": "chatcmpl-CECIdmgM7bbQr6YefuUbY4cycibvm",
+          "choices": [
+            {
+              "delta": {
+                "content": ",",
+                "function_call": null,
+                "refusal": null,
+                "role": null,
+                "tool_calls": null
+              },
+              "finish_reason": null,
+              "index": 0,
+              "logprobs": null,
+              "content_filter_results": {}
+            }
+          ],
+          "created": 1757499907,
+          "model": "gpt-5-mini-2025-08-07",
+          "object": "chat.completion.chunk",
+          "service_tier": null,
+          "system_fingerprint": null,
+          "usage": null
+        }
+      },
+      {
+        "__type__": "openai.types.chat.chat_completion_chunk.ChatCompletionChunk",
+        "__data__": {
+          "id": "chatcmpl-CECIdmgM7bbQr6YefuUbY4cycibvm",
+          "choices": [
+            {
+              "delta": {
+                "content": " is",
+                "function_call": null,
+                "refusal": null,
+                "role": null,
+                "tool_calls": null
+              },
+              "finish_reason": null,
+              "index": 1,
+              "logprobs": null,
+              "content_filter_results": {}
+            }
+          ],
+          "created": 1757499907,
+          "model": "gpt-5-mini-2025-08-07",
+          "object": "chat.completion.chunk",
+          "service_tier": null,
+          "system_fingerprint": null,
+          "usage": null
+        }
+      },
+      {
+        "__type__": "openai.types.chat.chat_completion_chunk.ChatCompletionChunk",
+        "__data__": {
+          "id": "chatcmpl-CECIdmgM7bbQr6YefuUbY4cycibvm",
+          "choices": [
+            {
+              "delta": {
+                "content": " masculine",
+                "function_call": null,
+                "refusal": null,
+                "role": null,
+                "tool_calls": null
+              },
+              "finish_reason": null,
+              "index": 0,
+              "logprobs": null,
+              "content_filter_results": {}
+            }
+          ],
+          "created": 1757499907,
+          "model": "gpt-5-mini-2025-08-07",
+          "object": "chat.completion.chunk",
+          "service_tier": null,
+          "system_fingerprint": null,
+          "usage": null
+        }
+      },
+      {
+        "__type__": "openai.types.chat.chat_completion_chunk.ChatCompletionChunk",
+        "__data__": {
+          "id": "chatcmpl-CECIdmgM7bbQr6YefuUbY4cycibvm",
+          "choices": [
+            {
+              "delta": {
+                "content": " \"",
+                "function_call": null,
+                "refusal": null,
+                "role": null,
+                "tool_calls": null
+              },
+              "finish_reason": null,
+              "index": 1,
+              "logprobs": null,
+              "content_filter_results": {}
+            }
+          ],
+          "created": 1757499907,
+          "model": "gpt-5-mini-2025-08-07",
+          "object": "chat.completion.chunk",
+          "service_tier": null,
+          "system_fingerprint": null,
+          "usage": null
+        }
+      },
+      {
+        "__type__": "openai.types.chat.chat_completion_chunk.ChatCompletionChunk",
+        "__data__": {
+          "id": "chatcmpl-CECIdmgM7bbQr6YefuUbY4cycibvm",
+          "choices": [
+            {
+              "delta": {
+                "content": ").",
+                "function_call": null,
+                "refusal": null,
+                "role": null,
+                "tool_calls": null
+              },
+              "finish_reason": null,
+              "index": 0,
+              "logprobs": null,
+              "content_filter_results": {}
+            }
+          ],
+          "created": 1757499907,
+          "model": "gpt-5-mini-2025-08-07",
+          "object": "chat.completion.chunk",
+          "service_tier": null,
+          "system_fingerprint": null,
+          "usage": null
+        }
+      },
+      {
+        "__type__": "openai.types.chat.chat_completion_chunk.ChatCompletionChunk",
+        "__data__": {
+          "id": "chatcmpl-CECIdmgM7bbQr6YefuUbY4cycibvm",
+          "choices": [
+            {
+              "delta": {
+                "content": "Sol",
+                "function_call": null,
+                "refusal": null,
+                "role": null,
+                "tool_calls": null
+              },
+              "finish_reason": null,
+              "index": 1,
+              "logprobs": null,
+              "content_filter_results": {}
+            }
+          ],
+          "created": 1757499907,
+          "model": "gpt-5-mini-2025-08-07",
+          "object": "chat.completion.chunk",
+          "service_tier": null,
+          "system_fingerprint": null,
+          "usage": null
+        }
+      },
+      {
+        "__type__": "openai.types.chat.chat_completion_chunk.ChatCompletionChunk",
+        "__data__": {
+          "id": "chatcmpl-CECIdmgM7bbQr6YefuUbY4cycibvm",
+          "choices": [
+            {
+              "delta": {
+                "content": "\"",
+                "function_call": null,
+                "refusal": null,
+                "role": null,
+                "tool_calls": null
+              },
+              "finish_reason": null,
+              "index": 1,
+              "logprobs": null,
+              "content_filter_results": {}
+            }
+          ],
+          "created": 1757499907,
+          "model": "gpt-5-mini-2025-08-07",
+          "object": "chat.completion.chunk",
+          "service_tier": null,
+          "system_fingerprint": null,
+          "usage": null
+        }
+      },
+      {
+        "__type__": "openai.types.chat.chat_completion_chunk.ChatCompletionChunk",
+        "__data__": {
+          "id": "chatcmpl-CECIdmgM7bbQr6YefuUbY4cycibvm",
+          "choices": [
+            {
+              "delta": {
+                "content": " (",
+                "function_call": null,
+                "refusal": null,
+                "role": null,
+                "tool_calls": null
+              },
+              "finish_reason": null,
+              "index": 1,
+              "logprobs": null,
+              "content_filter_results": {}
+            }
+          ],
+          "created": 1757499907,
+          "model": "gpt-5-mini-2025-08-07",
+          "object": "chat.completion.chunk",
+          "service_tier": null,
+          "system_fingerprint": null,
+          "usage": null
+        }
+      },
+      {
+        "__type__": "openai.types.chat.chat_completion_chunk.ChatCompletionChunk",
+        "__data__": {
+          "id": "chatcmpl-CECIdmgM7bbQr6YefuUbY4cycibvm",
+          "choices": [
+            {
+              "delta": {
+                "content": " The",
+                "function_call": null,
+                "refusal": null,
+                "role": null,
+                "tool_calls": null
+              },
+              "finish_reason": null,
+              "index": 0,
+              "logprobs": null,
+              "content_filter_results": {}
+            }
+          ],
+          "created": 1757499907,
+          "model": "gpt-5-mini-2025-08-07",
+          "object": "chat.completion.chunk",
+          "service_tier": null,
+          "system_fingerprint": null,
+          "usage": null
+        }
+      },
+      {
+        "__type__": "openai.types.chat.chat_completion_chunk.ChatCompletionChunk",
+        "__data__": {
+          "id": "chatcmpl-CECIdmgM7bbQr6YefuUbY4cycibvm",
+          "choices": [
+            {
+              "delta": {
+                "content": " name",
+                "function_call": null,
+                "refusal": null,
+                "role": null,
+                "tool_calls": null
+              },
+              "finish_reason": null,
+              "index": 0,
+              "logprobs": null,
+              "content_filter_results": {}
+            }
+          ],
+          "created": 1757499907,
+          "model": "gpt-5-mini-2025-08-07",
+          "object": "chat.completion.chunk",
+          "service_tier": null,
+          "system_fingerprint": null,
+          "usage": null
+        }
+      },
+      {
+        "__type__": "openai.types.chat.chat_completion_chunk.ChatCompletionChunk",
+        "__data__": {
+          "id": "chatcmpl-CECIdmgM7bbQr6YefuUbY4cycibvm",
+          "choices": [
+            {
+              "delta": {
+                "content": " is",
+                "function_call": null,
+                "refusal": null,
+                "role": null,
+                "tool_calls": null
+              },
+              "finish_reason": null,
+              "index": 0,
+              "logprobs": null,
+              "content_filter_results": {}
+            }
+          ],
+          "created": 1757499907,
+          "model": "gpt-5-mini-2025-08-07",
+          "object": "chat.completion.chunk",
+          "service_tier": null,
+          "system_fingerprint": null,
+          "usage": null
+        }
+      },
+      {
+        "__type__": "openai.types.chat.chat_completion_chunk.ChatCompletionChunk",
+        "__data__": {
+          "id": "chatcmpl-CECIdmgM7bbQr6YefuUbY4cycibvm",
+          "choices": [
+            {
+              "delta": {
+                "content": "s",
+                "function_call": null,
+                "refusal": null,
+                "role": null,
+                "tool_calls": null
+              },
+              "finish_reason": null,
+              "index": 1,
+              "logprobs": null,
+              "content_filter_results": {}
+            }
+          ],
+          "created": 1757499907,
+          "model": "gpt-5-mini-2025-08-07",
+          "object": "chat.completion.chunk",
+          "service_tier": null,
+          "system_fingerprint": null,
+          "usage": null
+        }
+      },
+      {
+        "__type__": "openai.types.chat.chat_completion_chunk.ChatCompletionChunk",
+        "__data__": {
+          "id": "chatcmpl-CECIdmgM7bbQr6YefuUbY4cycibvm",
+          "choices": [
+            {
+              "delta": {
+                "content": " also",
+                "function_call": null,
+                "refusal": null,
+                "role": null,
+                "tool_calls": null
+              },
+              "finish_reason": null,
+              "index": 0,
+              "logprobs": null,
+              "content_filter_results": {}
+            }
+          ],
+          "created": 1757499907,
+          "model": "gpt-5-mini-2025-08-07",
+          "object": "chat.completion.chunk",
+          "service_tier": null,
+          "system_fingerprint": null,
+          "usage": null
+        }
+      },
+      {
+        "__type__": "openai.types.chat.chat_completion_chunk.ChatCompletionChunk",
+        "__data__": {
+          "id": "chatcmpl-CECIdmgM7bbQr6YefuUbY4cycibvm",
+          "choices": [
+            {
+              "delta": {
+                "content": "\u014d",
+                "function_call": null,
+                "refusal": null,
+                "role": null,
+                "tool_calls": null
+              },
+              "finish_reason": null,
+              "index": 1,
+              "logprobs": null,
+              "content_filter_results": {}
+            }
+          ],
+          "created": 1757499907,
+          "model": "gpt-5-mini-2025-08-07",
+          "object": "chat.completion.chunk",
+          "service_tier": null,
+          "system_fingerprint": null,
+          "usage": null
+        }
+      },
+      {
+        "__type__": "openai.types.chat.chat_completion_chunk.ChatCompletionChunk",
+        "__data__": {
+          "id": "chatcmpl-CECIdmgM7bbQr6YefuUbY4cycibvm",
+          "choices": [
+            {
+              "delta": {
+                "content": " used",
+                "function_call": null,
+                "refusal": null,
+                "role": null,
+                "tool_calls": null
+              },
+              "finish_reason": null,
+              "index": 0,
+              "logprobs": null,
+              "content_filter_results": {}
+            }
+          ],
+          "created": 1757499907,
+          "model": "gpt-5-mini-2025-08-07",
+          "object": "chat.completion.chunk",
+          "service_tier": null,
+          "system_fingerprint": null,
+          "usage": null
+        }
+      },
+      {
+        "__type__": "openai.types.chat.chat_completion_chunk.ChatCompletionChunk",
+        "__data__": {
+          "id": "chatcmpl-CECIdmgM7bbQr6YefuUbY4cycibvm",
+          "choices": [
+            {
+              "delta": {
+                "content": "l",
+                "function_call": null,
+                "refusal": null,
+                "role": null,
+                "tool_calls": null
+              },
+              "finish_reason": null,
+              "index": 1,
+              "logprobs": null,
+              "content_filter_results": {}
+            }
+          ],
+          "created": 1757499907,
+          "model": "gpt-5-mini-2025-08-07",
+          "object": "chat.completion.chunk",
+          "service_tier": null,
+          "system_fingerprint": null,
+          "usage": null
+        }
+      },
+      {
+        "__type__": "openai.types.chat.chat_completion_chunk.ChatCompletionChunk",
+        "__data__": {
+          "id": "chatcmpl-CECIdmgM7bbQr6YefuUbY4cycibvm",
+          "choices": [
+            {
+              "delta": {
+                "content": " for",
+                "function_call": null,
+                "refusal": null,
+                "role": null,
+                "tool_calls": null
+              },
+              "finish_reason": null,
+              "index": 0,
+              "logprobs": null,
+              "content_filter_results": {}
+            }
+          ],
+          "created": 1757499907,
+          "model": "gpt-5-mini-2025-08-07",
+          "object": "chat.completion.chunk",
+          "service_tier": null,
+          "system_fingerprint": null,
+          "usage": null
+        }
+      },
+      {
+        "__type__": "openai.types.chat.chat_completion_chunk.ChatCompletionChunk",
+        "__data__": {
+          "id": "chatcmpl-CECIdmgM7bbQr6YefuUbY4cycibvm",
+          "choices": [
+            {
+              "delta": {
+                "content": " the",
+                "function_call": null,
+                "refusal": null,
+                "role": null,
+                "tool_calls": null
+              },
+              "finish_reason": null,
+              "index": 0,
+              "logprobs": null,
+              "content_filter_results": {}
+            }
+          ],
+          "created": 1757499907,
+          "model": "gpt-5-mini-2025-08-07",
+          "object": "chat.completion.chunk",
+          "service_tier": null,
+          "system_fingerprint": null,
+          "usage": null
+        }
+      },
+      {
+        "__type__": "openai.types.chat.chat_completion_chunk.ChatCompletionChunk",
+        "__data__": {
+          "id": "chatcmpl-CECIdmgM7bbQr6YefuUbY4cycibvm",
+          "choices": [
+            {
+              "delta": {
+                "content": "),",
+                "function_call": null,
+                "refusal": null,
+                "role": null,
+                "tool_calls": null
+              },
+              "finish_reason": null,
+              "index": 1,
+              "logprobs": null,
+              "content_filter_results": {}
+            }
+          ],
+          "created": 1757499907,
+          "model": "gpt-5-mini-2025-08-07",
+          "object": "chat.completion.chunk",
+          "service_tier": null,
+          "system_fingerprint": null,
+          "usage": null
+        }
+      },
+      {
+        "__type__": "openai.types.chat.chat_completion_chunk.ChatCompletionChunk",
+        "__data__": {
+          "id": "chatcmpl-CECIdmgM7bbQr6YefuUbY4cycibvm",
+          "choices": [
+            {
+              "delta": {
+                "content": " gen",
+                "function_call": null,
+                "refusal": null,
+                "role": null,
+                "tool_calls": null
+              },
+              "finish_reason": null,
+              "index": 1,
+              "logprobs": null,
+              "content_filter_results": {}
+            }
+          ],
+          "created": 1757499907,
+          "model": "gpt-5-mini-2025-08-07",
+          "object": "chat.completion.chunk",
+          "service_tier": null,
+          "system_fingerprint": null,
+          "usage": null
+        }
+      },
+      {
+        "__type__": "openai.types.chat.chat_completion_chunk.ChatCompletionChunk",
+        "__data__": {
+          "id": "chatcmpl-CECIdmgM7bbQr6YefuUbY4cycibvm",
+          "choices": [
+            {
+              "delta": {
+                "content": " Roman",
+                "function_call": null,
+                "refusal": null,
+                "role": null,
+                "tool_calls": null
+              },
+              "finish_reason": null,
+              "index": 0,
+              "logprobs": null,
+              "content_filter_results": {}
+            }
+          ],
+          "created": 1757499907,
+          "model": "gpt-5-mini-2025-08-07",
+          "object": "chat.completion.chunk",
+          "service_tier": null,
+          "system_fingerprint": null,
+          "usage": null
+        }
+      },
+      {
+        "__type__": "openai.types.chat.chat_completion_chunk.ChatCompletionChunk",
+        "__data__": {
+          "id": "chatcmpl-CECIdmgM7bbQr6YefuUbY4cycibvm",
+          "choices": [
+            {
+              "delta": {
+                "content": "itive",
+                "function_call": null,
+                "refusal": null,
+                "role": null,
+                "tool_calls": null
+              },
+              "finish_reason": null,
+              "index": 1,
+              "logprobs": null,
+              "content_filter_results": {}
+            }
+          ],
+          "created": 1757499907,
+          "model": "gpt-5-mini-2025-08-07",
+          "object": "chat.completion.chunk",
+          "service_tier": null,
+          "system_fingerprint": null,
+          "usage": null
+        }
+      },
+      {
+        "__type__": "openai.types.chat.chat_completion_chunk.ChatCompletionChunk",
+        "__data__": {
+          "id": "chatcmpl-CECIdmgM7bbQr6YefuUbY4cycibvm",
+          "choices": [
+            {
+              "delta": {
+                "content": " sun",
+                "function_call": null,
+                "refusal": null,
+                "role": null,
+                "tool_calls": null
+              },
+              "finish_reason": null,
+              "index": 0,
+              "logprobs": null,
+              "content_filter_results": {}
+            }
+          ],
+          "created": 1757499907,
+          "model": "gpt-5-mini-2025-08-07",
+          "object": "chat.completion.chunk",
+          "service_tier": null,
+          "system_fingerprint": null,
+          "usage": null
+        }
+      },
+      {
+        "__type__": "openai.types.chat.chat_completion_chunk.ChatCompletionChunk",
+        "__data__": {
+          "id": "chatcmpl-CECIdmgM7bbQr6YefuUbY4cycibvm",
+          "choices": [
+            {
+              "delta": {
+                "content": " \"",
+                "function_call": null,
+                "refusal": null,
+                "role": null,
+                "tool_calls": null
+              },
+              "finish_reason": null,
+              "index": 1,
+              "logprobs": null,
+              "content_filter_results": {}
+            }
+          ],
+          "created": 1757499907,
+          "model": "gpt-5-mini-2025-08-07",
+          "object": "chat.completion.chunk",
+          "service_tier": null,
+          "system_fingerprint": null,
+          "usage": null
+        }
+      },
+      {
+        "__type__": "openai.types.chat.chat_completion_chunk.ChatCompletionChunk",
+        "__data__": {
+          "id": "chatcmpl-CECIdmgM7bbQr6YefuUbY4cycibvm",
+          "choices": [
+            {
+              "delta": {
+                "content": " god",
+                "function_call": null,
+                "refusal": null,
+                "role": null,
+                "tool_calls": null
+              },
+              "finish_reason": null,
+              "index": 0,
+              "logprobs": null,
+              "content_filter_results": {}
+            }
+          ],
+          "created": 1757499907,
+          "model": "gpt-5-mini-2025-08-07",
+          "object": "chat.completion.chunk",
+          "service_tier": null,
+          "system_fingerprint": null,
+          "usage": null
+        }
+      },
+      {
+        "__type__": "openai.types.chat.chat_completion_chunk.ChatCompletionChunk",
+        "__data__": {
+          "id": "chatcmpl-CECIdmgM7bbQr6YefuUbY4cycibvm",
+          "choices": [
+            {
+              "delta": {
+                "content": "s",
+                "function_call": null,
+                "refusal": null,
+                "role": null,
+                "tool_calls": null
+              },
+              "finish_reason": null,
+              "index": 1,
+              "logprobs": null,
+              "content_filter_results": {}
+            }
+          ],
+          "created": 1757499907,
+          "model": "gpt-5-mini-2025-08-07",
+          "object": "chat.completion.chunk",
+          "service_tier": null,
+          "system_fingerprint": null,
+          "usage": null
+        }
+      },
+      {
+        "__type__": "openai.types.chat.chat_completion_chunk.ChatCompletionChunk",
+        "__data__": {
+          "id": "chatcmpl-CECIdmgM7bbQr6YefuUbY4cycibvm",
+          "choices": [
+            {
+              "delta": {
+                "content": " (",
+                "function_call": null,
+                "refusal": null,
+                "role": null,
+                "tool_calls": null
+              },
+              "finish_reason": null,
+              "index": 0,
+              "logprobs": null,
+              "content_filter_results": {}
+            }
+          ],
+          "created": 1757499907,
+          "model": "gpt-5-mini-2025-08-07",
+          "object": "chat.completion.chunk",
+          "service_tier": null,
+          "system_fingerprint": null,
+          "usage": null
+        }
+      },
+      {
+        "__type__": "openai.types.chat.chat_completion_chunk.ChatCompletionChunk",
+        "__data__": {
+          "id": "chatcmpl-CECIdmgM7bbQr6YefuUbY4cycibvm",
+          "choices": [
+            {
+              "delta": {
+                "content": "\u014d",
+                "function_call": null,
+                "refusal": null,
+                "role": null,
+                "tool_calls": null
+              },
+              "finish_reason": null,
+              "index": 1,
+              "logprobs": null,
+              "content_filter_results": {}
+            }
+          ],
+          "created": 1757499907,
+          "model": "gpt-5-mini-2025-08-07",
+          "object": "chat.completion.chunk",
+          "service_tier": null,
+          "system_fingerprint": null,
+          "usage": null
+        }
+      },
+      {
+        "__type__": "openai.types.chat.chat_completion_chunk.ChatCompletionChunk",
+        "__data__": {
+          "id": "chatcmpl-CECIdmgM7bbQr6YefuUbY4cycibvm",
+          "choices": [
+            {
+              "delta": {
+                "content": "e",
+                "function_call": null,
+                "refusal": null,
+                "role": null,
+                "tool_calls": null
+              },
+              "finish_reason": null,
+              "index": 0,
+              "logprobs": null,
+              "content_filter_results": {}
+            }
+          ],
+          "created": 1757499907,
+          "model": "gpt-5-mini-2025-08-07",
+          "object": "chat.completion.chunk",
+          "service_tier": null,
+          "system_fingerprint": null,
+          "usage": null
+        }
+      },
+      {
+        "__type__": "openai.types.chat.chat_completion_chunk.ChatCompletionChunk",
+        "__data__": {
+          "id": "chatcmpl-CECIdmgM7bbQr6YefuUbY4cycibvm",
+          "choices": [
+            {
+              "delta": {
+                "content": "lis",
+                "function_call": null,
+                "refusal": null,
+                "role": null,
+                "tool_calls": null
+              },
+              "finish_reason": null,
+              "index": 1,
+              "logprobs": null,
+              "content_filter_results": {}
+            }
+          ],
+          "created": 1757499907,
+          "model": "gpt-5-mini-2025-08-07",
+          "object": "chat.completion.chunk",
+          "service_tier": null,
+          "system_fingerprint": null,
+          "usage": null
+        }
+      },
+      {
+        "__type__": "openai.types.chat.chat_completion_chunk.ChatCompletionChunk",
+        "__data__": {
+          "id": "chatcmpl-CECIdmgM7bbQr6YefuUbY4cycibvm",
+          "choices": [
+            {
+              "delta": {
+                "content": ".g",
+                "function_call": null,
+                "refusal": null,
+                "role": null,
+                "tool_calls": null
+              },
+              "finish_reason": null,
+              "index": 0,
+              "logprobs": null,
+              "content_filter_results": {}
+            }
+          ],
+          "created": 1757499907,
+          "model": "gpt-5-mini-2025-08-07",
+          "object": "chat.completion.chunk",
+          "service_tier": null,
+          "system_fingerprint": null,
+          "usage": null
+        }
+      },
+      {
+        "__type__": "openai.types.chat.chat_completion_chunk.ChatCompletionChunk",
+        "__data__": {
+          "id": "chatcmpl-CECIdmgM7bbQr6YefuUbY4cycibvm",
+          "choices": [
+            {
+              "delta": {
+                "content": "\".",
+                "function_call": null,
+                "refusal": null,
+                "role": null,
+                "tool_calls": null
+              },
+              "finish_reason": null,
+              "index": 1,
+              "logprobs": null,
+              "content_filter_results": {}
+            }
+          ],
+          "created": 1757499907,
+          "model": "gpt-5-mini-2025-08-07",
+          "object": "chat.completion.chunk",
+          "service_tier": null,
+          "system_fingerprint": null,
+          "usage": null
+        }
+      },
+      {
+        "__type__": "openai.types.chat.chat_completion_chunk.ChatCompletionChunk",
+        "__data__": {
+          "id": "chatcmpl-CECIdmgM7bbQr6YefuUbY4cycibvm",
+          "choices": [
+            {
+              "delta": {
+                "content": ".,",
+                "function_call": null,
+                "refusal": null,
+                "role": null,
+                "tool_calls": null
+              },
+              "finish_reason": null,
+              "index": 0,
+              "logprobs": null,
+              "content_filter_results": {}
+            }
+          ],
+          "created": 1757499907,
+          "model": "gpt-5-mini-2025-08-07",
+          "object": "chat.completion.chunk",
+          "service_tier": null,
+          "system_fingerprint": null,
+          "usage": null
+        }
+      },
+      {
+        "__type__": "openai.types.chat.chat_completion_chunk.ChatCompletionChunk",
+        "__data__": {
+          "id": "chatcmpl-CECIdmgM7bbQr6YefuUbY4cycibvm",
+          "choices": [
+            {
+              "delta": {
+                "content": " ",
+                "function_call": null,
+                "refusal": null,
+                "role": null,
+                "tool_calls": null
+              },
+              "finish_reason": null,
+              "index": 1,
+              "logprobs": null,
+              "content_filter_results": {}
+            }
+          ],
+          "created": 1757499907,
+          "model": "gpt-5-mini-2025-08-07",
+          "object": "chat.completion.chunk",
+          "service_tier": null,
+          "system_fingerprint": null,
+          "usage": null
+        }
+      },
+      {
+        "__type__": "openai.types.chat.chat_completion_chunk.ChatCompletionChunk",
+        "__data__": {
+          "id": "chatcmpl-CECIdmgM7bbQr6YefuUbY4cycibvm",
+          "choices": [
+            {
+              "delta": {
+                "content": " Sol",
+                "function_call": null,
+                "refusal": null,
+                "role": null,
+                "tool_calls": null
+              },
+              "finish_reason": null,
+              "index": 0,
+              "logprobs": null,
+              "content_filter_results": {}
+            }
+          ],
+          "created": 1757499907,
+          "model": "gpt-5-mini-2025-08-07",
+          "object": "chat.completion.chunk",
+          "service_tier": null,
+          "system_fingerprint": null,
+          "usage": null
+        }
+      },
+      {
+        "__type__": "openai.types.chat.chat_completion_chunk.ChatCompletionChunk",
+        "__data__": {
+          "id": "chatcmpl-CECIdmgM7bbQr6YefuUbY4cycibvm",
+          "choices": [
+            {
+              "delta": {
+                "content": " As",
+                "function_call": null,
+                "refusal": null,
+                "role": null,
+                "tool_calls": null
+              },
+              "finish_reason": null,
+              "index": 1,
+              "logprobs": null,
+              "content_filter_results": {}
+            }
+          ],
+          "created": 1757499907,
+          "model": "gpt-5-mini-2025-08-07",
+          "object": "chat.completion.chunk",
+          "service_tier": null,
+          "system_fingerprint": null,
+          "usage": null
+        }
+      },
+      {
+        "__type__": "openai.types.chat.chat_completion_chunk.ChatCompletionChunk",
+        "__data__": {
+          "id": "chatcmpl-CECIdmgM7bbQr6YefuUbY4cycibvm",
+          "choices": [
+            {
+              "delta": {
+                "content": " Inv",
+                "function_call": null,
+                "refusal": null,
+                "role": null,
+                "tool_calls": null
+              },
+              "finish_reason": null,
+              "index": 0,
+              "logprobs": null,
+              "content_filter_results": {}
+            }
+          ],
+          "created": 1757499907,
+          "model": "gpt-5-mini-2025-08-07",
+          "object": "chat.completion.chunk",
+          "service_tier": null,
+          "system_fingerprint": null,
+          "usage": null
+        }
+      },
+      {
+        "__type__": "openai.types.chat.chat_completion_chunk.ChatCompletionChunk",
+        "__data__": {
+          "id": "chatcmpl-CECIdmgM7bbQr6YefuUbY4cycibvm",
+          "choices": [
+            {
+              "delta": {
+                "content": " an",
+                "function_call": null,
+                "refusal": null,
+                "role": null,
+                "tool_calls": null
+              },
+              "finish_reason": null,
+              "index": 1,
+              "logprobs": null,
+              "content_filter_results": {}
+            }
+          ],
+          "created": 1757499907,
+          "model": "gpt-5-mini-2025-08-07",
+          "object": "chat.completion.chunk",
+          "service_tier": null,
+          "system_fingerprint": null,
+          "usage": null
+        }
+      },
+      {
+        "__type__": "openai.types.chat.chat_completion_chunk.ChatCompletionChunk",
+        "__data__": {
+          "id": "chatcmpl-CECIdmgM7bbQr6YefuUbY4cycibvm",
+          "choices": [
+            {
+              "delta": {
+                "content": "ict",
+                "function_call": null,
+                "refusal": null,
+                "role": null,
+                "tool_calls": null
+              },
+              "finish_reason": null,
+              "index": 0,
+              "logprobs": null,
+              "content_filter_results": {}
+            }
+          ],
+          "created": 1757499907,
+          "model": "gpt-5-mini-2025-08-07",
+          "object": "chat.completion.chunk",
+          "service_tier": null,
+          "system_fingerprint": null,
+          "usage": null
+        }
+      },
+      {
+        "__type__": "openai.types.chat.chat_completion_chunk.ChatCompletionChunk",
+        "__data__": {
+          "id": "chatcmpl-CECIdmgM7bbQr6YefuUbY4cycibvm",
+          "choices": [
+            {
+              "delta": {
+                "content": " epit",
+                "function_call": null,
+                "refusal": null,
+                "role": null,
+                "tool_calls": null
+              },
+              "finish_reason": null,
+              "index": 1,
+              "logprobs": null,
+              "content_filter_results": {}
+            }
+          ],
+          "created": 1757499907,
+          "model": "gpt-5-mini-2025-08-07",
+          "object": "chat.completion.chunk",
+          "service_tier": null,
+          "system_fingerprint": null,
+          "usage": null
+        }
+      },
+      {
+        "__type__": "openai.types.chat.chat_completion_chunk.ChatCompletionChunk",
+        "__data__": {
+          "id": "chatcmpl-CECIdmgM7bbQr6YefuUbY4cycibvm",
+          "choices": [
+            {
+              "delta": {
+                "content": "us",
+                "function_call": null,
+                "refusal": null,
+                "role": null,
+                "tool_calls": null
+              },
+              "finish_reason": null,
+              "index": 0,
+              "logprobs": null,
+              "content_filter_results": {}
+            }
+          ],
+          "created": 1757499907,
+          "model": "gpt-5-mini-2025-08-07",
+          "object": "chat.completion.chunk",
+          "service_tier": null,
+          "system_fingerprint": null,
+          "usage": null
+        }
+      },
+      {
+        "__type__": "openai.types.chat.chat_completion_chunk.ChatCompletionChunk",
+        "__data__": {
+          "id": "chatcmpl-CECIdmgM7bbQr6YefuUbY4cycibvm",
+          "choices": [
+            {
+              "delta": {
+                "content": "het",
+                "function_call": null,
+                "refusal": null,
+                "role": null,
+                "tool_calls": null
+              },
+              "finish_reason": null,
+              "index": 1,
+              "logprobs": null,
+              "content_filter_results": {}
+            }
+          ],
+          "created": 1757499907,
+          "model": "gpt-5-mini-2025-08-07",
+          "object": "chat.completion.chunk",
+          "service_tier": null,
+          "system_fingerprint": null,
+          "usage": null
+        }
+      },
+      {
+        "__type__": "openai.types.chat.chat_completion_chunk.ChatCompletionChunk",
+        "__data__": {
+          "id": "chatcmpl-CECIdmgM7bbQr6YefuUbY4cycibvm",
+          "choices": [
+            {
+              "delta": {
+                "content": ").",
+                "function_call": null,
+                "refusal": null,
+                "role": null,
+                "tool_calls": null
+              },
+              "finish_reason": null,
+              "index": 0,
+              "logprobs": null,
+              "content_filter_results": {}
+            }
+          ],
+          "created": 1757499907,
+          "model": "gpt-5-mini-2025-08-07",
+          "object": "chat.completion.chunk",
+          "service_tier": null,
+          "system_fingerprint": null,
+          "usage": null
+        }
+      },
+      {
+        "__type__": "openai.types.chat.chat_completion_chunk.ChatCompletionChunk",
+        "__data__": {
+          "id": "chatcmpl-CECIdmgM7bbQr6YefuUbY4cycibvm",
+          "choices": [
+            {
+              "delta": {
+                "content": " it",
+                "function_call": null,
+                "refusal": null,
+                "role": null,
+                "tool_calls": null
+              },
+              "finish_reason": null,
+              "index": 1,
+              "logprobs": null,
+              "content_filter_results": {}
+            }
+          ],
+          "created": 1757499907,
+          "model": "gpt-5-mini-2025-08-07",
+          "object": "chat.completion.chunk",
+          "service_tier": null,
+          "system_fingerprint": null,
+          "usage": null
+        }
+      },
+      {
+        "__type__": "openai.types.chat.chat_completion_chunk.ChatCompletionChunk",
+        "__data__": {
+          "id": "chatcmpl-CECIdmgM7bbQr6YefuUbY4cycibvm",
+          "choices": [
+            {
+              "delta": {
+                "content": "\u2019s",
+                "function_call": null,
+                "refusal": null,
+                "role": null,
+                "tool_calls": null
+              },
+              "finish_reason": null,
+              "index": 1,
+              "logprobs": null,
+              "content_filter_results": {}
+            }
+          ],
+          "created": 1757499907,
+          "model": "gpt-5-mini-2025-08-07",
+          "object": "chat.completion.chunk",
+          "service_tier": null,
+          "system_fingerprint": null,
+          "usage": null
+        }
+      },
+      {
+        "__type__": "openai.types.chat.chat_completion_chunk.ChatCompletionChunk",
+        "__data__": {
+          "id": "chatcmpl-CECIdmgM7bbQr6YefuUbY4cycibvm",
+          "choices": [
+            {
+              "delta": {
+                "content": " also",
+                "function_call": null,
+                "refusal": null,
+                "role": null,
+                "tool_calls": null
+              },
+              "finish_reason": null,
+              "index": 1,
+              "logprobs": null,
+              "content_filter_results": {}
+            }
+          ],
+          "created": 1757499907,
+          "model": "gpt-5-mini-2025-08-07",
+          "object": "chat.completion.chunk",
+          "service_tier": null,
+          "system_fingerprint": null,
+          "usage": null
+        }
+      },
+      {
+        "__type__": "openai.types.chat.chat_completion_chunk.ChatCompletionChunk",
+        "__data__": {
+          "id": "chatcmpl-CECIdmgM7bbQr6YefuUbY4cycibvm",
+          "choices": [
+            {
+              "delta": {
+                "content": " called",
+                "function_call": null,
+                "refusal": null,
+                "role": null,
+                "tool_calls": null
+              },
+              "finish_reason": null,
+              "index": 1,
+              "logprobs": null,
+              "content_filter_results": {}
+            }
+          ],
+          "created": 1757499907,
+          "model": "gpt-5-mini-2025-08-07",
+          "object": "chat.completion.chunk",
+          "service_tier": null,
+          "system_fingerprint": null,
+          "usage": null
+        }
+      },
+      {
+        "__type__": "openai.types.chat.chat_completion_chunk.ChatCompletionChunk",
+        "__data__": {
+          "id": "chatcmpl-CECIdmgM7bbQr6YefuUbY4cycibvm",
+          "choices": [
+            {
+              "delta": {
+                "content": " \"",
+                "function_call": null,
+                "refusal": null,
+                "role": null,
+                "tool_calls": null
+              },
+              "finish_reason": null,
+              "index": 1,
+              "logprobs": null,
+              "content_filter_results": {}
+            }
+          ],
+          "created": 1757499907,
+          "model": "gpt-5-mini-2025-08-07",
+          "object": "chat.completion.chunk",
+          "service_tier": null,
+          "system_fingerprint": null,
+          "usage": null
+        }
+      },
+      {
+        "__type__": "openai.types.chat.chat_completion_chunk.ChatCompletionChunk",
+        "__data__": {
+          "id": "chatcmpl-CECIdmgM7bbQr6YefuUbY4cycibvm",
+          "choices": [
+            {
+              "delta": {
+                "content": "Pho",
+                "function_call": null,
+                "refusal": null,
+                "role": null,
+                "tool_calls": null
+              },
+              "finish_reason": null,
+              "index": 1,
+              "logprobs": null,
+              "content_filter_results": {}
+            }
+          ],
+          "created": 1757499907,
+          "model": "gpt-5-mini-2025-08-07",
+          "object": "chat.completion.chunk",
+          "service_tier": null,
+          "system_fingerprint": null,
+          "usage": null
+        }
+      },
+      {
+        "__type__": "openai.types.chat.chat_completion_chunk.ChatCompletionChunk",
+        "__data__": {
+          "id": "chatcmpl-CECIdmgM7bbQr6YefuUbY4cycibvm",
+          "choices": [
+            {
+              "delta": {
+                "content": "eb",
+                "function_call": null,
+                "refusal": null,
+                "role": null,
+                "tool_calls": null
+              },
+              "finish_reason": null,
+              "index": 1,
+              "logprobs": null,
+              "content_filter_results": {}
+            }
+          ],
+          "created": 1757499907,
+          "model": "gpt-5-mini-2025-08-07",
+          "object": "chat.completion.chunk",
+          "service_tier": null,
+          "system_fingerprint": null,
+          "usage": null
+        }
+      },
+      {
+        "__type__": "openai.types.chat.chat_completion_chunk.ChatCompletionChunk",
+        "__data__": {
+          "id": "chatcmpl-CECIdmgM7bbQr6YefuUbY4cycibvm",
+          "choices": [
+            {
+              "delta": {
+                "content": "us",
+                "function_call": null,
+                "refusal": null,
+                "role": null,
+                "tool_calls": null
+              },
+              "finish_reason": null,
+              "index": 1,
+              "logprobs": null,
+              "content_filter_results": {}
+            }
+          ],
+          "created": 1757499907,
+          "model": "gpt-5-mini-2025-08-07",
+          "object": "chat.completion.chunk",
+          "service_tier": null,
+          "system_fingerprint": null,
+          "usage": null
+        }
+      },
+      {
+        "__type__": "openai.types.chat.chat_completion_chunk.ChatCompletionChunk",
+        "__data__": {
+          "id": "chatcmpl-CECIdmgM7bbQr6YefuUbY4cycibvm",
+          "choices": [
+            {
+              "delta": {
+                "content": "\"",
+                "function_call": null,
+                "refusal": null,
+                "role": null,
+                "tool_calls": null
+              },
+              "finish_reason": null,
+              "index": 1,
+              "logprobs": null,
+              "content_filter_results": {}
+            }
+          ],
+          "created": 1757499907,
+          "model": "gpt-5-mini-2025-08-07",
+          "object": "chat.completion.chunk",
+          "service_tier": null,
+          "system_fingerprint": null,
+          "usage": null
+        }
+      },
+      {
+        "__type__": "openai.types.chat.chat_completion_chunk.ChatCompletionChunk",
+        "__data__": {
+          "id": "chatcmpl-CECIdmgM7bbQr6YefuUbY4cycibvm",
+          "choices": [
+            {
+              "delta": {
+                "content": " in",
+                "function_call": null,
+                "refusal": null,
+                "role": null,
+                "tool_calls": null
+              },
+              "finish_reason": null,
+              "index": 1,
+              "logprobs": null,
+              "content_filter_results": {}
+            }
+          ],
+          "created": 1757499907,
+          "model": "gpt-5-mini-2025-08-07",
+          "object": "chat.completion.chunk",
+          "service_tier": null,
+          "system_fingerprint": null,
+          "usage": null
+        }
+      },
+      {
+        "__type__": "openai.types.chat.chat_completion_chunk.ChatCompletionChunk",
+        "__data__": {
+          "id": "chatcmpl-CECIdmgM7bbQr6YefuUbY4cycibvm",
+          "choices": [
+            {
+              "delta": {
+                "content": " poetry",
+                "function_call": null,
+                "refusal": null,
+                "role": null,
+                "tool_calls": null
+              },
+              "finish_reason": null,
+              "index": 1,
+              "logprobs": null,
+              "content_filter_results": {}
+            }
+          ],
+          "created": 1757499907,
+          "model": "gpt-5-mini-2025-08-07",
+          "object": "chat.completion.chunk",
+          "service_tier": null,
+          "system_fingerprint": null,
+          "usage": null
+        }
+      },
+      {
+        "__type__": "openai.types.chat.chat_completion_chunk.ChatCompletionChunk",
+        "__data__": {
+          "id": "chatcmpl-CECIdmgM7bbQr6YefuUbY4cycibvm",
+          "choices": [
+            {
+              "delta": {
+                "content": ".",
+                "function_call": null,
+                "refusal": null,
+                "role": null,
+                "tool_calls": null
+              },
+              "finish_reason": null,
+              "index": 1,
+              "logprobs": null,
+              "content_filter_results": {}
+            }
+          ],
+          "created": 1757499907,
+          "model": "gpt-5-mini-2025-08-07",
+          "object": "chat.completion.chunk",
+          "service_tier": null,
+          "system_fingerprint": null,
+          "usage": null
+        }
+      },
+      {
+        "__type__": "openai.types.chat.chat_completion_chunk.ChatCompletionChunk",
+        "__data__": {
+          "id": "chatcmpl-CECIdmgM7bbQr6YefuUbY4cycibvm",
+          "choices": [
+            {
+              "delta": {
+                "content": null,
+                "function_call": null,
+                "refusal": null,
+                "role": null,
+                "tool_calls": null
+              },
+              "finish_reason": "stop",
+              "index": 0,
+              "logprobs": null,
+              "content_filter_results": {}
+            }
+          ],
+          "created": 1757499907,
+          "model": "gpt-5-mini-2025-08-07",
+          "object": "chat.completion.chunk",
+          "service_tier": null,
+          "system_fingerprint": null,
+          "usage": null
+        }
+      },
+      {
+        "__type__": "openai.types.chat.chat_completion_chunk.ChatCompletionChunk",
+        "__data__": {
+          "id": "chatcmpl-CECIdmgM7bbQr6YefuUbY4cycibvm",
+          "choices": [
+            {
+              "delta": {
+                "content": null,
+                "function_call": null,
+                "refusal": null,
+                "role": null,
+                "tool_calls": null
+              },
+              "finish_reason": "stop",
+              "index": 1,
+              "logprobs": null,
+              "content_filter_results": {}
+            }
+          ],
+          "created": 1757499907,
+          "model": "gpt-5-mini-2025-08-07",
+          "object": "chat.completion.chunk",
+          "service_tier": null,
+          "system_fingerprint": null,
+          "usage": null
+        }
+      }
+    ],
+    "is_streaming": true
+  }
+}
diff --git a/tests/integration/recordings/responses/fb785db7fafd.json b/tests/integration/recordings/responses/fb785db7fafd.json
new file mode 100644
index 000000000..086d211e8
--- /dev/null
+++ b/tests/integration/recordings/responses/fb785db7fafd.json
@@ -0,0 +1,310 @@
+{
+  "request": {
+    "method": "POST",
+    "url": "https://shan-mfbb618r-eastus2.cognitiveservices.azure.com/openai/v1/v1/chat/completions",
+    "headers": {},
+    "body": {
+      "model": "gpt-5-mini",
+      "messages": [
+        {
+          "role": "user",
+          "content": "What's the weather in Tokyo? Use the get_weather function to get the weather."
+        }
+      ],
+      "stream": true,
+      "tools": [
+        {
+          "type": "function",
+          "function": {
+            "name": "get_weather",
+            "description": "Get the weather in a given city",
+            "parameters": {
+              "type": "object",
+              "properties": {
+                "city": {
+                  "type": "string",
+                  "description": "The city to get the weather for"
+                }
+              }
+            }
+          }
+        }
+      ]
+    },
+    "endpoint": "/v1/chat/completions",
+    "model": "gpt-5-mini"
+  },
+  "response": {
+    "body": [
+      {
+        "__type__": "openai.types.chat.chat_completion_chunk.ChatCompletionChunk",
+        "__data__": {
+          "id": "",
+          "choices": [],
+          "created": 0,
+          "model": "",
+          "object": "",
+          "service_tier": null,
+          "system_fingerprint": null,
+          "usage": null,
+          "prompt_filter_results": [
+            {
+              "prompt_index": 0,
+              "content_filter_results": {}
+            }
+          ]
+        }
+      },
+      {
+        "__type__": "openai.types.chat.chat_completion_chunk.ChatCompletionChunk",
+        "__data__": {
+          "id": "chatcmpl-CECIiMMWyfACuKUYWEyYSazcnvRVo",
+          "choices": [
+            {
+              "delta": {
+                "content": null,
+                "function_call": null,
+                "refusal": null,
+                "role": "assistant",
+                "tool_calls": [
+                  {
+                    "index": 0,
+                    "id": "call_TMbEoYn9q0ZKtoxav5LpD9Ts",
+                    "function": {
+                      "arguments": "",
+                      "name": "get_weather"
+                    },
+                    "type": "function"
+                  }
+                ]
+              },
+              "finish_reason": null,
+              "index": 0,
+              "logprobs": null,
+              "content_filter_results": {}
+            }
+          ],
+          "created": 1757499912,
+          "model": "gpt-5-mini-2025-08-07",
+          "object": "chat.completion.chunk",
+          "service_tier": null,
+          "system_fingerprint": null,
+          "usage": null
+        }
+      },
+      {
+        "__type__": "openai.types.chat.chat_completion_chunk.ChatCompletionChunk",
+        "__data__": {
+          "id": "chatcmpl-CECIiMMWyfACuKUYWEyYSazcnvRVo",
+          "choices": [
+            {
+              "delta": {
+                "content": null,
+                "function_call": null,
+                "refusal": null,
+                "role": null,
+                "tool_calls": [
+                  {
+                    "index": 0,
+                    "id": null,
+                    "function": {
+                      "arguments": "{\"",
+                      "name": null
+                    },
+                    "type": null
+                  }
+                ]
+              },
+              "finish_reason": null,
+              "index": 0,
+              "logprobs": null,
+              "content_filter_results": {}
+            }
+          ],
+          "created": 1757499912,
+          "model": "gpt-5-mini-2025-08-07",
+          "object": "chat.completion.chunk",
+          "service_tier": null,
+          "system_fingerprint": null,
+          "usage": null
+        }
+      },
+      {
+        "__type__": "openai.types.chat.chat_completion_chunk.ChatCompletionChunk",
+        "__data__": {
+          "id": "chatcmpl-CECIiMMWyfACuKUYWEyYSazcnvRVo",
+          "choices": [
+            {
+              "delta": {
+                "content": null,
+                "function_call": null,
+                "refusal": null,
+                "role": null,
+                "tool_calls": [
+                  {
+                    "index": 0,
+                    "id": null,
+                    "function": {
+                      "arguments": "city",
+                      "name": null
+                    },
+                    "type": null
+                  }
+                ]
+              },
+              "finish_reason": null,
+              "index": 0,
+              "logprobs": null,
+              "content_filter_results": {}
+            }
+          ],
+          "created": 1757499912,
+          "model": "gpt-5-mini-2025-08-07",
+          "object": "chat.completion.chunk",
+          "service_tier": null,
+          "system_fingerprint": null,
+          "usage": null
+        }
+      },
+      {
+        "__type__": "openai.types.chat.chat_completion_chunk.ChatCompletionChunk",
+        "__data__": {
+          "id": "chatcmpl-CECIiMMWyfACuKUYWEyYSazcnvRVo",
+          "choices": [
+            {
+              "delta": {
+                "content": null,
+                "function_call": null,
+                "refusal": null,
+                "role": null,
+                "tool_calls": [
+                  {
+                    "index": 0,
+                    "id": null,
+                    "function": {
+                      "arguments": "\":\"",
+                      "name": null
+                    },
+                    "type": null
+                  }
+                ]
+              },
+              "finish_reason": null,
+              "index": 0,
+              "logprobs": null,
+              "content_filter_results": {}
+            }
+          ],
+          "created": 1757499912,
+          "model": "gpt-5-mini-2025-08-07",
+          "object": "chat.completion.chunk",
+          "service_tier": null,
+          "system_fingerprint": null,
+          "usage": null
+        }
+      },
+      {
+        "__type__": "openai.types.chat.chat_completion_chunk.ChatCompletionChunk",
+        "__data__": {
+          "id": "chatcmpl-CECIiMMWyfACuKUYWEyYSazcnvRVo",
+          "choices": [
+            {
+              "delta": {
+                "content": null,
+                "function_call": null,
+                "refusal": null,
+                "role": null,
+                "tool_calls": [
+                  {
+                    "index": 0,
+                    "id": null,
+                    "function": {
+                      "arguments": "Tokyo",
+                      "name": null
+                    },
+                    "type": null
+                  }
+                ]
+              },
+              "finish_reason": null,
+              "index": 0,
+              "logprobs": null,
+              "content_filter_results": {}
+            }
+          ],
+          "created": 1757499912,
+          "model": "gpt-5-mini-2025-08-07",
+          "object": "chat.completion.chunk",
+          "service_tier": null,
+          "system_fingerprint": null,
+          "usage": null
+        }
+      },
+      {
+        "__type__": "openai.types.chat.chat_completion_chunk.ChatCompletionChunk",
+        "__data__": {
+          "id": "chatcmpl-CECIiMMWyfACuKUYWEyYSazcnvRVo",
+          "choices": [
+            {
+              "delta": {
+                "content": null,
+                "function_call": null,
+                "refusal": null,
+                "role": null,
+                "tool_calls": [
+                  {
+                    "index": 0,
+                    "id": null,
+                    "function": {
+                      "arguments": "\"}",
+                      "name": null
+                    },
+                    "type": null
+                  }
+                ]
+              },
+              "finish_reason": null,
+              "index": 0,
+              "logprobs": null,
+              "content_filter_results": {}
+            }
+          ],
+          "created": 1757499912,
+          "model": "gpt-5-mini-2025-08-07",
+          "object": "chat.completion.chunk",
+          "service_tier": null,
+          "system_fingerprint": null,
+          "usage": null
+        }
+      },
+      {
+        "__type__": "openai.types.chat.chat_completion_chunk.ChatCompletionChunk",
+        "__data__": {
+          "id": "chatcmpl-CECIiMMWyfACuKUYWEyYSazcnvRVo",
+          "choices": [
+            {
+              "delta": {
+                "content": null,
+                "function_call": null,
+                "refusal": null,
+                "role": null,
+                "tool_calls": null
+              },
+              "finish_reason": "tool_calls",
+              "index": 0,
+              "logprobs": null,
+              "content_filter_results": {}
+            }
+          ],
+          "created": 1757499912,
+          "model": "gpt-5-mini-2025-08-07",
+          "object": "chat.completion.chunk",
+          "service_tier": null,
+          "system_fingerprint": null,
+          "usage": null
+        }
+      }
+    ],
+    "is_streaming": true
+  }
+}
diff --git a/tests/integration/recordings/responses/ff3271401fb4.json b/tests/integration/recordings/responses/ff3271401fb4.json
new file mode 100644
index 000000000..bf7ec89f7
--- /dev/null
+++ b/tests/integration/recordings/responses/ff3271401fb4.json
@@ -0,0 +1,556 @@
+{
+  "request": {
+    "method": "POST",
+    "url": "https://shan-mfbb618r-eastus2.cognitiveservices.azure.com/openai/v1/v1/chat/completions",
+    "headers": {},
+    "body": {
+      "model": "gpt-5-mini",
+      "messages": [
+        {
+          "role": "user",
+          "content": "What is the name of the US captial?"
+        }
+      ],
+      "stream": true
+    },
+    "endpoint": "/v1/chat/completions",
+    "model": "gpt-5-mini"
+  },
+  "response": {
+    "body": [
+      {
+        "__type__": "openai.types.chat.chat_completion_chunk.ChatCompletionChunk",
+        "__data__": {
+          "id": "",
+          "choices": [],
+          "created": 0,
+          "model": "",
+          "object": "",
+          "service_tier": null,
+          "system_fingerprint": null,
+          "usage": null,
+          "prompt_filter_results": [
+            {
+              "prompt_index": 0,
+              "content_filter_results": {}
+            }
+          ]
+        }
+      },
+      {
+        "__type__": "openai.types.chat.chat_completion_chunk.ChatCompletionChunk",
+        "__data__": {
+          "id": "chatcmpl-CECImr5TLfMFiZN3FUlfVdBLr51Fs",
+          "choices": [
+            {
+              "delta": {
+                "content": "",
+                "function_call": null,
+                "refusal": null,
+                "role": "assistant",
+                "tool_calls": null
+              },
+              "finish_reason": null,
+              "index": 0,
+              "logprobs": null,
+              "content_filter_results": {}
+            }
+          ],
+          "created": 1757499916,
+          "model": "gpt-5-mini-2025-08-07",
+          "object": "chat.completion.chunk",
+          "service_tier": null,
+          "system_fingerprint": null,
+          "usage": null
+        }
+      },
+      {
+        "__type__": "openai.types.chat.chat_completion_chunk.ChatCompletionChunk",
+        "__data__": {
+          "id": "chatcmpl-CECImr5TLfMFiZN3FUlfVdBLr51Fs",
+          "choices": [
+            {
+              "delta": {
+                "content": "The",
+                "function_call": null,
+                "refusal": null,
+                "role": null,
+                "tool_calls": null
+              },
+              "finish_reason": null,
+              "index": 0,
+              "logprobs": null,
+              "content_filter_results": {}
+            }
+          ],
+          "created": 1757499916,
+          "model": "gpt-5-mini-2025-08-07",
+          "object": "chat.completion.chunk",
+          "service_tier": null,
+          "system_fingerprint": null,
+          "usage": null
+        }
+      },
+      {
+        "__type__": "openai.types.chat.chat_completion_chunk.ChatCompletionChunk",
+        "__data__": {
+          "id": "chatcmpl-CECImr5TLfMFiZN3FUlfVdBLr51Fs",
+          "choices": [
+            {
+              "delta": {
+                "content": " capital",
+                "function_call": null,
+                "refusal": null,
+                "role": null,
+                "tool_calls": null
+              },
+              "finish_reason": null,
+              "index": 0,
+              "logprobs": null,
+              "content_filter_results": {}
+            }
+          ],
+          "created": 1757499916,
+          "model": "gpt-5-mini-2025-08-07",
+          "object": "chat.completion.chunk",
+          "service_tier": null,
+          "system_fingerprint": null,
+          "usage": null
+        }
+      },
+      {
+        "__type__": "openai.types.chat.chat_completion_chunk.ChatCompletionChunk",
+        "__data__": {
+          "id": "chatcmpl-CECImr5TLfMFiZN3FUlfVdBLr51Fs",
+          "choices": [
+            {
+              "delta": {
+                "content": " of",
+                "function_call": null,
+                "refusal": null,
+                "role": null,
+                "tool_calls": null
+              },
+              "finish_reason": null,
+              "index": 0,
+              "logprobs": null,
+              "content_filter_results": {}
+            }
+          ],
+          "created": 1757499916,
+          "model": "gpt-5-mini-2025-08-07",
+          "object": "chat.completion.chunk",
+          "service_tier": null,
+          "system_fingerprint": null,
+          "usage": null
+        }
+      },
+      {
+        "__type__": "openai.types.chat.chat_completion_chunk.ChatCompletionChunk",
+        "__data__": {
+          "id": "chatcmpl-CECImr5TLfMFiZN3FUlfVdBLr51Fs",
+          "choices": [
+            {
+              "delta": {
+                "content": " the",
+                "function_call": null,
+                "refusal": null,
+                "role": null,
+                "tool_calls": null
+              },
+              "finish_reason": null,
+              "index": 0,
+              "logprobs": null,
+              "content_filter_results": {}
+            }
+          ],
+          "created": 1757499916,
+          "model": "gpt-5-mini-2025-08-07",
+          "object": "chat.completion.chunk",
+          "service_tier": null,
+          "system_fingerprint": null,
+          "usage": null
+        }
+      },
+      {
+        "__type__": "openai.types.chat.chat_completion_chunk.ChatCompletionChunk",
+        "__data__": {
+          "id": "chatcmpl-CECImr5TLfMFiZN3FUlfVdBLr51Fs",
+          "choices": [
+            {
+              "delta": {
+                "content": " United",
+                "function_call": null,
+                "refusal": null,
+                "role": null,
+                "tool_calls": null
+              },
+              "finish_reason": null,
+              "index": 0,
+              "logprobs": null,
+              "content_filter_results": {}
+            }
+          ],
+          "created": 1757499916,
+          "model": "gpt-5-mini-2025-08-07",
+          "object": "chat.completion.chunk",
+          "service_tier": null,
+          "system_fingerprint": null,
+          "usage": null
+        }
+      },
+      {
+        "__type__": "openai.types.chat.chat_completion_chunk.ChatCompletionChunk",
+        "__data__": {
+          "id": "chatcmpl-CECImr5TLfMFiZN3FUlfVdBLr51Fs",
+          "choices": [
+            {
+              "delta": {
+                "content": " States",
+                "function_call": null,
+                "refusal": null,
+                "role": null,
+                "tool_calls": null
+              },
+              "finish_reason": null,
+              "index": 0,
+              "logprobs": null,
+              "content_filter_results": {}
+            }
+          ],
+          "created": 1757499916,
+          "model": "gpt-5-mini-2025-08-07",
+          "object": "chat.completion.chunk",
+          "service_tier": null,
+          "system_fingerprint": null,
+          "usage": null
+        }
+      },
+      {
+        "__type__": "openai.types.chat.chat_completion_chunk.ChatCompletionChunk",
+        "__data__": {
+          "id": "chatcmpl-CECImr5TLfMFiZN3FUlfVdBLr51Fs",
+          "choices": [
+            {
+              "delta": {
+                "content": " is",
+                "function_call": null,
+                "refusal": null,
+                "role": null,
+                "tool_calls": null
+              },
+              "finish_reason": null,
+              "index": 0,
+              "logprobs": null,
+              "content_filter_results": {}
+            }
+          ],
+          "created": 1757499916,
+          "model": "gpt-5-mini-2025-08-07",
+          "object": "chat.completion.chunk",
+          "service_tier": null,
+          "system_fingerprint": null,
+          "usage": null
+        }
+      },
+      {
+        "__type__": "openai.types.chat.chat_completion_chunk.ChatCompletionChunk",
+        "__data__": {
+          "id": "chatcmpl-CECImr5TLfMFiZN3FUlfVdBLr51Fs",
+          "choices": [
+            {
+              "delta": {
+                "content": " Washington",
+                "function_call": null,
+                "refusal": null,
+                "role": null,
+                "tool_calls": null
+              },
+              "finish_reason": null,
+              "index": 0,
+              "logprobs": null,
+              "content_filter_results": {}
+            }
+          ],
+          "created": 1757499916,
+          "model": "gpt-5-mini-2025-08-07",
+          "object": "chat.completion.chunk",
+          "service_tier": null,
+          "system_fingerprint": null,
+          "usage": null
+        }
+      },
+      {
+        "__type__": "openai.types.chat.chat_completion_chunk.ChatCompletionChunk",
+        "__data__": {
+          "id": "chatcmpl-CECImr5TLfMFiZN3FUlfVdBLr51Fs",
+          "choices": [
+            {
+              "delta": {
+                "content": ",",
+                "function_call": null,
+                "refusal": null,
+                "role": null,
+                "tool_calls": null
+              },
+              "finish_reason": null,
+              "index": 0,
+              "logprobs": null,
+              "content_filter_results": {}
+            }
+          ],
+          "created": 1757499916,
+          "model": "gpt-5-mini-2025-08-07",
+          "object": "chat.completion.chunk",
+          "service_tier": null,
+          "system_fingerprint": null,
+          "usage": null
+        }
+      },
+      {
+        "__type__": "openai.types.chat.chat_completion_chunk.ChatCompletionChunk",
+        "__data__": {
+          "id": "chatcmpl-CECImr5TLfMFiZN3FUlfVdBLr51Fs",
+          "choices": [
+            {
+              "delta": {
+                "content": " D",
+                "function_call": null,
+                "refusal": null,
+                "role": null,
+                "tool_calls": null
+              },
+              "finish_reason": null,
+              "index": 0,
+              "logprobs": null,
+              "content_filter_results": {}
+            }
+          ],
+          "created": 1757499916,
+          "model": "gpt-5-mini-2025-08-07",
+          "object": "chat.completion.chunk",
+          "service_tier": null,
+          "system_fingerprint": null,
+          "usage": null
+        }
+      },
+      {
+        "__type__": "openai.types.chat.chat_completion_chunk.ChatCompletionChunk",
+        "__data__": {
+          "id": "chatcmpl-CECImr5TLfMFiZN3FUlfVdBLr51Fs",
+          "choices": [
+            {
+              "delta": {
+                "content": ".C",
+                "function_call": null,
+                "refusal": null,
+                "role": null,
+                "tool_calls": null
+              },
+              "finish_reason": null,
+              "index": 0,
+              "logprobs": null,
+              "content_filter_results": {}
+            }
+          ],
+          "created": 1757499916,
+          "model": "gpt-5-mini-2025-08-07",
+          "object": "chat.completion.chunk",
+          "service_tier": null,
+          "system_fingerprint": null,
+          "usage": null
+        }
+      },
+      {
+        "__type__": "openai.types.chat.chat_completion_chunk.ChatCompletionChunk",
+        "__data__": {
+          "id": "chatcmpl-CECImr5TLfMFiZN3FUlfVdBLr51Fs",
+          "choices": [
+            {
+              "delta": {
+                "content": ".",
+                "function_call": null,
+                "refusal": null,
+                "role": null,
+                "tool_calls": null
+              },
+              "finish_reason": null,
+              "index": 0,
+              "logprobs": null,
+              "content_filter_results": {}
+            }
+          ],
+          "created": 1757499916,
+          "model": "gpt-5-mini-2025-08-07",
+          "object": "chat.completion.chunk",
+          "service_tier": null,
+          "system_fingerprint": null,
+          "usage": null
+        }
+      },
+      {
+        "__type__": "openai.types.chat.chat_completion_chunk.ChatCompletionChunk",
+        "__data__": {
+          "id": "chatcmpl-CECImr5TLfMFiZN3FUlfVdBLr51Fs",
+          "choices": [
+            {
+              "delta": {
+                "content": " (",
+                "function_call": null,
+                "refusal": null,
+                "role": null,
+                "tool_calls": null
+              },
+              "finish_reason": null,
+              "index": 0,
+              "logprobs": null,
+              "content_filter_results": {}
+            }
+          ],
+          "created": 1757499916,
+          "model": "gpt-5-mini-2025-08-07",
+          "object": "chat.completion.chunk",
+          "service_tier": null,
+          "system_fingerprint": null,
+          "usage": null
+        }
+      },
+      {
+        "__type__": "openai.types.chat.chat_completion_chunk.ChatCompletionChunk",
+        "__data__": {
+          "id": "chatcmpl-CECImr5TLfMFiZN3FUlfVdBLr51Fs",
+          "choices": [
+            {
+              "delta": {
+                "content": "District",
+                "function_call": null,
+                "refusal": null,
+                "role": null,
+                "tool_calls": null
+              },
+              "finish_reason": null,
+              "index": 0,
+              "logprobs": null,
+              "content_filter_results": {}
+            }
+          ],
+          "created": 1757499916,
+          "model": "gpt-5-mini-2025-08-07",
+          "object": "chat.completion.chunk",
+          "service_tier": null,
+          "system_fingerprint": null,
+          "usage": null
+        }
+      },
+      {
+        "__type__": "openai.types.chat.chat_completion_chunk.ChatCompletionChunk",
+        "__data__": {
+          "id": "chatcmpl-CECImr5TLfMFiZN3FUlfVdBLr51Fs",
+          "choices": [
+            {
+              "delta": {
+                "content": " of",
+                "function_call": null,
+                "refusal": null,
+                "role": null,
+                "tool_calls": null
+              },
+              "finish_reason": null,
+              "index": 0,
+              "logprobs": null,
+              "content_filter_results": {}
+            }
+          ],
+          "created": 1757499916,
+          "model": "gpt-5-mini-2025-08-07",
+          "object": "chat.completion.chunk",
+          "service_tier": null,
+          "system_fingerprint": null,
+          "usage": null
+        }
+      },
+      {
+        "__type__": "openai.types.chat.chat_completion_chunk.ChatCompletionChunk",
+        "__data__": {
+          "id": "chatcmpl-CECImr5TLfMFiZN3FUlfVdBLr51Fs",
+          "choices": [
+            {
+              "delta": {
+                "content": " Columbia",
+                "function_call": null,
+                "refusal": null,
+                "role": null,
+                "tool_calls": null
+              },
+              "finish_reason": null,
+              "index": 0,
+              "logprobs": null,
+              "content_filter_results": {}
+            }
+          ],
+          "created": 1757499916,
+          "model": "gpt-5-mini-2025-08-07",
+          "object": "chat.completion.chunk",
+          "service_tier": null,
+          "system_fingerprint": null,
+          "usage": null
+        }
+      },
+      {
+        "__type__": "openai.types.chat.chat_completion_chunk.ChatCompletionChunk",
+        "__data__": {
+          "id": "chatcmpl-CECImr5TLfMFiZN3FUlfVdBLr51Fs",
+          "choices": [
+            {
+              "delta": {
+                "content": ").",
+                "function_call": null,
+                "refusal": null,
+                "role": null,
+                "tool_calls": null
+              },
+              "finish_reason": null,
+              "index": 0,
+              "logprobs": null,
+              "content_filter_results": {}
+            }
+          ],
+          "created": 1757499916,
+          "model": "gpt-5-mini-2025-08-07",
+          "object": "chat.completion.chunk",
+          "service_tier": null,
+          "system_fingerprint": null,
+          "usage": null
+        }
+      },
+      {
+        "__type__": "openai.types.chat.chat_completion_chunk.ChatCompletionChunk",
+        "__data__": {
+          "id": "chatcmpl-CECImr5TLfMFiZN3FUlfVdBLr51Fs",
+          "choices": [
+            {
+              "delta": {
+                "content": null,
+                "function_call": null,
+                "refusal": null,
+                "role": null,
+                "tool_calls": null
+              },
+              "finish_reason": "stop",
+              "index": 0,
+              "logprobs": null,
+              "content_filter_results": {}
+            }
+          ],
+          "created": 1757499916,
+          "model": "gpt-5-mini-2025-08-07",
+          "object": "chat.completion.chunk",
+          "service_tier": null,
+          "system_fingerprint": null,
+          "usage": null
+        }
+      }
+    ],
+    "is_streaming": true
+  }
+}

From d15368a3026450d1474f4a4db47b89fd3e6057ca Mon Sep 17 00:00:00 2001
From: Francisco Arceo <arceofrancisco@gmail.com>
Date: Thu, 11 Sep 2025 06:20:11 -0600
Subject: [PATCH 74/76] chore: Updating documentation, adding exception
 handling for Vector Stores in RAG Tool, more tests on migration, and migrate
 off of inference_api for context_retriever for RAG (#3367)

# What does this PR do?

- Updating documentation on migration from RAG Tool to Vector Stores and
Files APIs
- Adding exception handling for Vector Stores in RAG Tool
- Add more tests on migration from RAG Tool to Vector Stores
- Migrate off of inference_api for context_retriever for RAG

<!-- If resolving an issue, uncomment and update the line below -->
<!-- Closes #[issue-number] -->

## Test Plan
Integration and unit tests added

Signed-off-by: Francisco Javier Arceo <farceo@redhat.com>
---
 docs/source/building_applications/rag.md      |  21 ++
 .../tool_runtime/rag/context_retriever.py     |  12 +-
 .../inline/tool_runtime/rag/memory.py         | 121 ++++++----
 .../integration/tool_runtime/test_rag_tool.py | 208 ++++++++++++++++++
 .../utils/memory/test_vector_store.py         |  38 ++++
 5 files changed, 355 insertions(+), 45 deletions(-)

diff --git a/docs/source/building_applications/rag.md b/docs/source/building_applications/rag.md
index 289c38991..802859e87 100644
--- a/docs/source/building_applications/rag.md
+++ b/docs/source/building_applications/rag.md
@@ -93,10 +93,31 @@ chunks_response = client.vector_io.query(
 
 ### Using the RAG Tool
 
+> **⚠️ DEPRECATION NOTICE**: The RAG Tool is being deprecated in favor of directly using the OpenAI-compatible Search
+> API. We recommend migrating to the OpenAI APIs for better compatibility and future support.
+
 A better way to ingest documents is to use the RAG Tool. This tool allows you to ingest documents from URLs, files, etc.
 and automatically chunks them into smaller pieces. More examples for how to format a RAGDocument can be found in the
 [appendix](#more-ragdocument-examples).
 
+#### OpenAI API Integration & Migration
+
+The RAG tool has been updated to use OpenAI-compatible APIs. This provides several benefits:
+
+- **Files API Integration**: Documents are now uploaded using OpenAI's file upload endpoints
+- **Vector Stores API**: Vector storage operations use OpenAI's vector store format with configurable chunking strategies
+- **Error Resilience:** When processing multiple documents, individual failures are logged but don't crash the operation. Failed documents are skipped while successful ones continue processing.
+
+**Migration Path:**
+We recommend migrating to the OpenAI-compatible Search API for:
+1. **Better OpenAI Ecosystem Integration**: Direct compatibility with OpenAI tools and workflows including the Responses API
+2**Future-Proof**: Continued support and feature development
+3**Full OpenAI Compatibility**: Vector Stores, Files, and Search APIs are fully compatible with OpenAI's Responses API
+
+The OpenAI APIs are used under the hood, so you can continue to use your existing RAG Tool code with minimal changes.
+However, we recommend updating your code to use the new OpenAI-compatible APIs for better long-term support. If any
+documents  fail to process, they will be logged in the response but will not cause the entire operation to fail.
+
 ```python
 from llama_stack_client import RAGDocument
 
diff --git a/llama_stack/providers/inline/tool_runtime/rag/context_retriever.py b/llama_stack/providers/inline/tool_runtime/rag/context_retriever.py
index be18430e4..9bc22f979 100644
--- a/llama_stack/providers/inline/tool_runtime/rag/context_retriever.py
+++ b/llama_stack/providers/inline/tool_runtime/rag/context_retriever.py
@@ -8,7 +8,7 @@
 from jinja2 import Template
 
 from llama_stack.apis.common.content_types import InterleavedContent
-from llama_stack.apis.inference import UserMessage
+from llama_stack.apis.inference import OpenAIUserMessageParam
 from llama_stack.apis.tools.rag_tool import (
     DefaultRAGQueryGeneratorConfig,
     LLMRAGQueryGeneratorConfig,
@@ -61,16 +61,16 @@ async def llm_rag_query_generator(
         messages = [interleaved_content_as_str(content)]
 
     template = Template(config.template)
-    content = template.render({"messages": messages})
+    rendered_content: str = template.render({"messages": messages})
 
     model = config.model
-    message = UserMessage(content=content)
-    response = await inference_api.chat_completion(
-        model_id=model,
+    message = OpenAIUserMessageParam(content=rendered_content)
+    response = await inference_api.openai_chat_completion(
+        model=model,
         messages=[message],
         stream=False,
     )
 
-    query = response.completion_message.content
+    query = response.choices[0].message.content
 
     return query
diff --git a/llama_stack/providers/inline/tool_runtime/rag/memory.py b/llama_stack/providers/inline/tool_runtime/rag/memory.py
index aa629cca8..bc68f198d 100644
--- a/llama_stack/providers/inline/tool_runtime/rag/memory.py
+++ b/llama_stack/providers/inline/tool_runtime/rag/memory.py
@@ -45,10 +45,7 @@ from llama_stack.apis.vector_io import (
 from llama_stack.log import get_logger
 from llama_stack.providers.datatypes import ToolGroupsProtocolPrivate
 from llama_stack.providers.utils.inference.prompt_adapter import interleaved_content_as_str
-from llama_stack.providers.utils.memory.vector_store import (
-    content_from_doc,
-    parse_data_url,
-)
+from llama_stack.providers.utils.memory.vector_store import parse_data_url
 
 from .config import RagToolRuntimeConfig
 from .context_retriever import generate_rag_query
@@ -60,6 +57,47 @@ def make_random_string(length: int = 8):
     return "".join(secrets.choice(string.ascii_letters + string.digits) for _ in range(length))
 
 
+async def raw_data_from_doc(doc: RAGDocument) -> tuple[bytes, str]:
+    """Get raw binary data and mime type from a RAGDocument for file upload."""
+    if isinstance(doc.content, URL):
+        if doc.content.uri.startswith("data:"):
+            parts = parse_data_url(doc.content.uri)
+            mime_type = parts["mimetype"]
+            data = parts["data"]
+
+            if parts["is_base64"]:
+                file_data = base64.b64decode(data)
+            else:
+                file_data = data.encode("utf-8")
+
+            return file_data, mime_type
+        else:
+            async with httpx.AsyncClient() as client:
+                r = await client.get(doc.content.uri)
+                r.raise_for_status()
+                mime_type = r.headers.get("content-type", "application/octet-stream")
+                return r.content, mime_type
+    else:
+        if isinstance(doc.content, str):
+            content_str = doc.content
+        else:
+            content_str = interleaved_content_as_str(doc.content)
+
+        if content_str.startswith("data:"):
+            parts = parse_data_url(content_str)
+            mime_type = parts["mimetype"]
+            data = parts["data"]
+
+            if parts["is_base64"]:
+                file_data = base64.b64decode(data)
+            else:
+                file_data = data.encode("utf-8")
+
+            return file_data, mime_type
+        else:
+            return content_str.encode("utf-8"), "text/plain"
+
+
 class MemoryToolRuntimeImpl(ToolGroupsProtocolPrivate, ToolRuntime, RAGToolRuntime):
     def __init__(
         self,
@@ -95,46 +133,52 @@ class MemoryToolRuntimeImpl(ToolGroupsProtocolPrivate, ToolRuntime, RAGToolRunti
             return
 
         for doc in documents:
-            if isinstance(doc.content, URL):
-                if doc.content.uri.startswith("data:"):
-                    parts = parse_data_url(doc.content.uri)
-                    file_data = base64.b64decode(parts["data"]) if parts["is_base64"] else parts["data"].encode()
-                    mime_type = parts["mimetype"]
-                else:
-                    async with httpx.AsyncClient() as client:
-                        response = await client.get(doc.content.uri)
-                        file_data = response.content
-                        mime_type = doc.mime_type or response.headers.get("content-type", "application/octet-stream")
-            else:
-                content_str = await content_from_doc(doc)
-                file_data = content_str.encode("utf-8")
-                mime_type = doc.mime_type or "text/plain"
+            try:
+                try:
+                    file_data, mime_type = await raw_data_from_doc(doc)
+                except Exception as e:
+                    log.error(f"Failed to extract content from document {doc.document_id}: {e}")
+                    continue
 
-            file_extension = mimetypes.guess_extension(mime_type) or ".txt"
-            filename = doc.metadata.get("filename", f"{doc.document_id}{file_extension}")
+                file_extension = mimetypes.guess_extension(mime_type) or ".txt"
+                filename = doc.metadata.get("filename", f"{doc.document_id}{file_extension}")
 
-            file_obj = io.BytesIO(file_data)
-            file_obj.name = filename
+                file_obj = io.BytesIO(file_data)
+                file_obj.name = filename
 
-            upload_file = UploadFile(file=file_obj, filename=filename)
+                upload_file = UploadFile(file=file_obj, filename=filename)
 
-            created_file = await self.files_api.openai_upload_file(
-                file=upload_file, purpose=OpenAIFilePurpose.ASSISTANTS
-            )
+                try:
+                    created_file = await self.files_api.openai_upload_file(
+                        file=upload_file, purpose=OpenAIFilePurpose.ASSISTANTS
+                    )
+                except Exception as e:
+                    log.error(f"Failed to upload file for document {doc.document_id}: {e}")
+                    continue
 
-            chunking_strategy = VectorStoreChunkingStrategyStatic(
-                static=VectorStoreChunkingStrategyStaticConfig(
-                    max_chunk_size_tokens=chunk_size_in_tokens,
-                    chunk_overlap_tokens=chunk_size_in_tokens // 4,
+                chunking_strategy = VectorStoreChunkingStrategyStatic(
+                    static=VectorStoreChunkingStrategyStaticConfig(
+                        max_chunk_size_tokens=chunk_size_in_tokens,
+                        chunk_overlap_tokens=chunk_size_in_tokens // 4,
+                    )
                 )
-            )
 
-            await self.vector_io_api.openai_attach_file_to_vector_store(
-                vector_store_id=vector_db_id,
-                file_id=created_file.id,
-                attributes=doc.metadata,
-                chunking_strategy=chunking_strategy,
-            )
+                try:
+                    await self.vector_io_api.openai_attach_file_to_vector_store(
+                        vector_store_id=vector_db_id,
+                        file_id=created_file.id,
+                        attributes=doc.metadata,
+                        chunking_strategy=chunking_strategy,
+                    )
+                except Exception as e:
+                    log.error(
+                        f"Failed to attach file {created_file.id} to vector store {vector_db_id} for document {doc.document_id}: {e}"
+                    )
+                    continue
+
+            except Exception as e:
+                log.error(f"Unexpected error processing document {doc.document_id}: {e}")
+                continue
 
     async def query(
         self,
@@ -274,7 +318,6 @@ class MemoryToolRuntimeImpl(ToolGroupsProtocolPrivate, ToolRuntime, RAGToolRunti
         if query_config:
             query_config = TypeAdapter(RAGQueryConfig).validate_python(query_config)
         else:
-            # handle someone passing an empty dict
             query_config = RAGQueryConfig()
 
         query = kwargs["query"]
@@ -285,6 +328,6 @@ class MemoryToolRuntimeImpl(ToolGroupsProtocolPrivate, ToolRuntime, RAGToolRunti
         )
 
         return ToolInvocationResult(
-            content=result.content,
+            content=result.content or [],
             metadata=result.metadata,
         )
diff --git a/tests/integration/tool_runtime/test_rag_tool.py b/tests/integration/tool_runtime/test_rag_tool.py
index b208500d8..b78c39af8 100644
--- a/tests/integration/tool_runtime/test_rag_tool.py
+++ b/tests/integration/tool_runtime/test_rag_tool.py
@@ -183,6 +183,110 @@ def test_vector_db_insert_from_url_and_query(
     assert any("llama2" in chunk.content.lower() for chunk in response2.chunks)
 
 
+def test_rag_tool_openai_apis(client_with_empty_registry, embedding_model_id, embedding_dimension):
+    vector_db_id = "test_openai_vector_db"
+
+    client_with_empty_registry.vector_dbs.register(
+        vector_db_id=vector_db_id,
+        embedding_model=embedding_model_id,
+        embedding_dimension=embedding_dimension,
+    )
+
+    available_vector_dbs = [vector_db.identifier for vector_db in client_with_empty_registry.vector_dbs.list()]
+    actual_vector_db_id = available_vector_dbs[0]
+
+    # different document formats that should work with OpenAI APIs
+    documents = [
+        Document(
+            document_id="text-doc",
+            content="This is a plain text document about machine learning algorithms.",
+            metadata={"type": "text", "category": "AI"},
+        ),
+        Document(
+            document_id="url-doc",
+            content="https://raw.githubusercontent.com/pytorch/torchtune/main/docs/source/tutorials/chat.rst",
+            mime_type="text/plain",
+            metadata={"type": "url", "source": "pytorch"},
+        ),
+        Document(
+            document_id="data-url-doc",
+            content="data:text/plain;base64,VGhpcyBpcyBhIGRhdGEgVVJMIGRvY3VtZW50IGFib3V0IGRlZXAgbGVhcm5pbmcu",  # "This is a data URL document about deep learning."
+            metadata={"type": "data_url", "encoding": "base64"},
+        ),
+    ]
+
+    client_with_empty_registry.tool_runtime.rag_tool.insert(
+        documents=documents,
+        vector_db_id=actual_vector_db_id,
+        chunk_size_in_tokens=256,
+    )
+
+    files_list = client_with_empty_registry.files.list()
+    assert len(files_list.data) >= len(documents), (
+        f"Expected at least {len(documents)} files, got {len(files_list.data)}"
+    )
+
+    vector_store_files = client_with_empty_registry.vector_io.openai_list_files_in_vector_store(
+        vector_store_id=actual_vector_db_id
+    )
+    assert len(vector_store_files.data) >= len(documents), f"Expected at least {len(documents)} files in vector store"
+
+    response = client_with_empty_registry.tool_runtime.rag_tool.query(
+        vector_db_ids=[actual_vector_db_id],
+        content="Tell me about machine learning and deep learning",
+    )
+
+    assert_valid_text_response(response)
+    content_text = " ".join([chunk.text for chunk in response.content]).lower()
+    assert "machine learning" in content_text or "deep learning" in content_text
+
+
+def test_rag_tool_exception_handling(client_with_empty_registry, embedding_model_id, embedding_dimension):
+    vector_db_id = "test_exception_handling"
+
+    client_with_empty_registry.vector_dbs.register(
+        vector_db_id=vector_db_id,
+        embedding_model=embedding_model_id,
+        embedding_dimension=embedding_dimension,
+    )
+
+    available_vector_dbs = [vector_db.identifier for vector_db in client_with_empty_registry.vector_dbs.list()]
+    actual_vector_db_id = available_vector_dbs[0]
+
+    documents = [
+        Document(
+            document_id="valid-doc",
+            content="This is a valid document that should be processed successfully.",
+            metadata={"status": "valid"},
+        ),
+        Document(
+            document_id="invalid-url-doc",
+            content="https://nonexistent-domain-12345.com/invalid.txt",
+            metadata={"status": "invalid_url"},
+        ),
+        Document(
+            document_id="another-valid-doc",
+            content="This is another valid document for testing resilience.",
+            metadata={"status": "valid"},
+        ),
+    ]
+
+    client_with_empty_registry.tool_runtime.rag_tool.insert(
+        documents=documents,
+        vector_db_id=actual_vector_db_id,
+        chunk_size_in_tokens=256,
+    )
+
+    response = client_with_empty_registry.tool_runtime.rag_tool.query(
+        vector_db_ids=[actual_vector_db_id],
+        content="valid document",
+    )
+
+    assert_valid_text_response(response)
+    content_text = " ".join([chunk.text for chunk in response.content]).lower()
+    assert "valid document" in content_text
+
+
 def test_rag_tool_insert_and_query(client_with_empty_registry, embedding_model_id, embedding_dimension):
     providers = [p for p in client_with_empty_registry.providers.list() if p.api == "vector_io"]
     assert len(providers) > 0
@@ -249,3 +353,107 @@ def test_rag_tool_insert_and_query(client_with_empty_registry, embedding_model_i
                 "chunk_template": "This should raise a ValueError because it is missing the proper template variables",
             },
         )
+
+
+def test_rag_tool_query_generation(client_with_empty_registry, embedding_model_id, embedding_dimension):
+    vector_db_id = "test_query_generation_db"
+
+    client_with_empty_registry.vector_dbs.register(
+        vector_db_id=vector_db_id,
+        embedding_model=embedding_model_id,
+        embedding_dimension=embedding_dimension,
+    )
+
+    available_vector_dbs = [vector_db.identifier for vector_db in client_with_empty_registry.vector_dbs.list()]
+    actual_vector_db_id = available_vector_dbs[0]
+
+    documents = [
+        Document(
+            document_id="ai-doc",
+            content="Artificial intelligence and machine learning are transforming technology.",
+            metadata={"category": "AI"},
+        ),
+        Document(
+            document_id="banana-doc",
+            content="Don't bring a banana to a knife fight.",
+            metadata={"category": "wisdom"},
+        ),
+    ]
+
+    client_with_empty_registry.tool_runtime.rag_tool.insert(
+        documents=documents,
+        vector_db_id=actual_vector_db_id,
+        chunk_size_in_tokens=256,
+    )
+
+    response = client_with_empty_registry.tool_runtime.rag_tool.query(
+        vector_db_ids=[actual_vector_db_id],
+        content="Tell me about AI",
+    )
+
+    assert_valid_text_response(response)
+    content_text = " ".join([chunk.text for chunk in response.content]).lower()
+    assert "artificial intelligence" in content_text or "machine learning" in content_text
+
+
+def test_rag_tool_pdf_data_url_handling(client_with_empty_registry, embedding_model_id, embedding_dimension):
+    vector_db_id = "test_pdf_data_url_db"
+
+    client_with_empty_registry.vector_dbs.register(
+        vector_db_id=vector_db_id,
+        embedding_model=embedding_model_id,
+        embedding_dimension=embedding_dimension,
+    )
+
+    available_vector_dbs = [vector_db.identifier for vector_db in client_with_empty_registry.vector_dbs.list()]
+    actual_vector_db_id = available_vector_dbs[0]
+
+    sample_pdf = b"%PDF-1.3\n3 0 obj\n<</Type /Page\n/Parent 1 0 R\n/Resources 2 0 R\n/Contents 4 0 R>>\nendobj\n4 0 obj\n<</Filter /FlateDecode /Length 115>>\nstream\nx\x9c\x15\xcc1\x0e\x820\x18@\xe1\x9dS\xbcM]jk$\xd5\xd5(\x83!\x86\xa1\x17\xf8\xa3\xa5`LIh+\xd7W\xc6\xf7\r\xef\xc0\xbd\xd2\xaa\xb6,\xd5\xc5\xb1o\x0c\xa6VZ\xe3znn%\xf3o\xab\xb1\xe7\xa3:Y\xdc\x8bm\xeb\xf3&1\xc8\xd7\xd3\x97\xc82\xe6\x81\x87\xe42\xcb\x87Vb(\x12<\xdd<=}Jc\x0cL\x91\xee\xda$\xb5\xc3\xbd\xd7\xe9\x0f\x8d\x97 $\nendstream\nendobj\n1 0 obj\n<</Type /Pages\n/Kids [3 0 R ]\n/Count 1\n/MediaBox [0 0 595.28 841.89]\n>>\nendobj\n5 0 obj\n<</Type /Font\n/BaseFont /Helvetica\n/Subtype /Type1\n/Encoding /WinAnsiEncoding\n>>\nendobj\n2 0 obj\n<<\n/ProcSet [/PDF /Text /ImageB /ImageC /ImageI]\n/Font <<\n/F1 5 0 R\n>>\n/XObject <<\n>>\n>>\nendobj\n6 0 obj\n<<\n/Producer (PyFPDF 1.7.2 http://pyfpdf.googlecode.com/)\n/Title (This is a sample title.)\n/Author (Llama Stack Developers)\n/CreationDate (D:20250312165548)\n>>\nendobj\n7 0 obj\n<<\n/Type /Catalog\n/Pages 1 0 R\n/OpenAction [3 0 R /FitH null]\n/PageLayout /OneColumn\n>>\nendobj\nxref\n0 8\n0000000000 65535 f \n0000000272 00000 n \n0000000455 00000 n \n0000000009 00000 n \n0000000087 00000 n \n0000000359 00000 n \n0000000559 00000 n \n0000000734 00000 n \ntrailer\n<<\n/Size 8\n/Root 7 0 R\n/Info 6 0 R\n>>\nstartxref\n837\n%%EOF\n"
+
+    import base64
+
+    pdf_base64 = base64.b64encode(sample_pdf).decode("utf-8")
+    pdf_data_url = f"data:application/pdf;base64,{pdf_base64}"
+
+    documents = [
+        Document(
+            document_id="test-pdf-data-url",
+            content=pdf_data_url,
+            metadata={"type": "pdf", "source": "data_url"},
+        ),
+    ]
+
+    client_with_empty_registry.tool_runtime.rag_tool.insert(
+        documents=documents,
+        vector_db_id=actual_vector_db_id,
+        chunk_size_in_tokens=256,
+    )
+
+    files_list = client_with_empty_registry.files.list()
+    assert len(files_list.data) >= 1, "PDF should have been uploaded to Files API"
+
+    pdf_file = None
+    for file in files_list.data:
+        if file.filename and "test-pdf-data-url" in file.filename:
+            pdf_file = file
+            break
+
+    assert pdf_file is not None, "PDF file should be found in Files API"
+    assert pdf_file.bytes == len(sample_pdf), f"File size should match original PDF ({len(sample_pdf)} bytes)"
+
+    file_content = client_with_empty_registry.files.retrieve_content(pdf_file.id)
+    assert file_content.startswith(b"%PDF-"), "Retrieved file should be a valid PDF"
+
+    vector_store_files = client_with_empty_registry.vector_io.openai_list_files_in_vector_store(
+        vector_store_id=actual_vector_db_id
+    )
+    assert len(vector_store_files.data) >= 1, "PDF should be attached to vector store"
+
+    response = client_with_empty_registry.tool_runtime.rag_tool.query(
+        vector_db_ids=[actual_vector_db_id],
+        content="sample title",
+    )
+
+    assert_valid_text_response(response)
+    content_text = " ".join([chunk.text for chunk in response.content]).lower()
+    assert "sample title" in content_text or "title" in content_text
diff --git a/tests/unit/providers/utils/memory/test_vector_store.py b/tests/unit/providers/utils/memory/test_vector_store.py
index 90b229262..590bdd1d2 100644
--- a/tests/unit/providers/utils/memory/test_vector_store.py
+++ b/tests/unit/providers/utils/memory/test_vector_store.py
@@ -178,3 +178,41 @@ def test_content_from_data_and_mime_type_both_encodings_fail():
         # Should raise an exception instead of returning empty string
         with pytest.raises(UnicodeDecodeError):
             content_from_data_and_mime_type(data, mime_type)
+
+
+async def test_memory_tool_error_handling():
+    """Test that memory tool handles various failures gracefully without crashing."""
+    from llama_stack.providers.inline.tool_runtime.rag.config import RagToolRuntimeConfig
+    from llama_stack.providers.inline.tool_runtime.rag.memory import MemoryToolRuntimeImpl
+
+    config = RagToolRuntimeConfig()
+    memory_tool = MemoryToolRuntimeImpl(
+        config=config,
+        vector_io_api=AsyncMock(),
+        inference_api=AsyncMock(),
+        files_api=AsyncMock(),
+    )
+
+    docs = [
+        RAGDocument(document_id="good_doc", content="Good content", metadata={}),
+        RAGDocument(document_id="bad_url_doc", content=URL(uri="https://bad.url"), metadata={}),
+        RAGDocument(document_id="another_good_doc", content="Another good content", metadata={}),
+    ]
+
+    mock_file1 = MagicMock()
+    mock_file1.id = "file_good1"
+    mock_file2 = MagicMock()
+    mock_file2.id = "file_good2"
+    memory_tool.files_api.openai_upload_file.side_effect = [mock_file1, mock_file2]
+
+    with patch("httpx.AsyncClient") as mock_client:
+        mock_instance = AsyncMock()
+        mock_instance.get.side_effect = Exception("Bad URL")
+        mock_client.return_value.__aenter__.return_value = mock_instance
+
+        # won't raise exception despite one document failing
+        await memory_tool.insert(docs, "vector_store_123")
+
+    # processed 2 documents successfully, skipped 1
+    assert memory_tool.files_api.openai_upload_file.call_count == 2
+    assert memory_tool.vector_io_api.openai_attach_file_to_vector_store.call_count == 2

From 8ef1189be7c6ea6e9fb2e3cf3f502123e0e4635a Mon Sep 17 00:00:00 2001
From: Matthew Farrellee <matt@cs.wisc.edu>
Date: Thu, 11 Sep 2025 09:04:38 -0400
Subject: [PATCH 75/76] chore: update the vLLM inference impl to use
 OpenAIMixin for openai-compat functions (#3404)

# What does this PR do?

update vLLM inference provider to use OpenAIMixin for openai-compat
functions

inference recordings from Qwen3-0.6B and vLLM 0.8.3 -
```
docker run --gpus all -v ~/.cache/huggingface:/root/.cache/huggingface -p 8000:8000 --ipc=host \
    vllm/vllm-openai:latest \
    --model Qwen/Qwen3-0.6B --enable-auto-tool-choice --tool-call-parser hermes
```

## Test Plan

```
./scripts/integration-tests.sh --stack-config server:ci-tests --setup vllm --subdirs inference
```
---
 .../providers/remote/inference/vllm/vllm.py   | 197 +-----------------
 .../providers/utils/inference/openai_mixin.py |  28 ++-
 .../providers/inference/test_remote_vllm.py   |  21 +-
 3 files changed, 44 insertions(+), 202 deletions(-)

diff --git a/llama_stack/providers/remote/inference/vllm/vllm.py b/llama_stack/providers/remote/inference/vllm/vllm.py
index 9e9a80ca5..77f5d82af 100644
--- a/llama_stack/providers/remote/inference/vllm/vllm.py
+++ b/llama_stack/providers/remote/inference/vllm/vllm.py
@@ -4,7 +4,7 @@
 # This source code is licensed under the terms described in the LICENSE file in
 # the root directory of this source tree.
 import json
-from collections.abc import AsyncGenerator, AsyncIterator
+from collections.abc import AsyncGenerator
 from typing import Any
 
 import httpx
@@ -38,13 +38,6 @@ from llama_stack.apis.inference import (
     LogProbConfig,
     Message,
     ModelStore,
-    OpenAIChatCompletion,
-    OpenAICompletion,
-    OpenAIEmbeddingData,
-    OpenAIEmbeddingsResponse,
-    OpenAIEmbeddingUsage,
-    OpenAIMessageParam,
-    OpenAIResponseFormatParam,
     ResponseFormat,
     SamplingParams,
     TextTruncation,
@@ -71,11 +64,11 @@ from llama_stack.providers.utils.inference.openai_compat import (
     convert_message_to_openai_dict,
     convert_tool_call,
     get_sampling_options,
-    prepare_openai_completion_params,
     process_chat_completion_stream_response,
     process_completion_response,
     process_completion_stream_response,
 )
+from llama_stack.providers.utils.inference.openai_mixin import OpenAIMixin
 from llama_stack.providers.utils.inference.prompt_adapter import (
     completion_request_to_prompt,
     content_has_media,
@@ -288,7 +281,7 @@ async def _process_vllm_chat_completion_stream_response(
         yield c
 
 
-class VLLMInferenceAdapter(Inference, ModelsProtocolPrivate):
+class VLLMInferenceAdapter(OpenAIMixin, Inference, ModelsProtocolPrivate):
     # automatically set by the resolver when instantiating the provider
     __provider_id__: str
     model_store: ModelStore | None = None
@@ -296,7 +289,6 @@ class VLLMInferenceAdapter(Inference, ModelsProtocolPrivate):
     def __init__(self, config: VLLMInferenceAdapterConfig) -> None:
         self.register_helper = ModelRegistryHelper(build_hf_repo_model_entries())
         self.config = config
-        self.client = None
 
     async def initialize(self) -> None:
         if not self.config.url:
@@ -308,8 +300,6 @@ class VLLMInferenceAdapter(Inference, ModelsProtocolPrivate):
         return self.config.refresh_models
 
     async def list_models(self) -> list[Model] | None:
-        self._lazy_initialize_client()
-        assert self.client is not None  # mypy
         models = []
         async for m in self.client.models.list():
             model_type = ModelType.llm  # unclear how to determine embedding vs. llm models
@@ -340,8 +330,7 @@ class VLLMInferenceAdapter(Inference, ModelsProtocolPrivate):
             HealthResponse: A dictionary containing the health status.
         """
         try:
-            client = self._create_client() if self.client is None else self.client
-            _ = [m async for m in client.models.list()]  # Ensure the client is initialized
+            _ = [m async for m in self.client.models.list()]  # Ensure the client is initialized
             return HealthResponse(status=HealthStatus.OK)
         except Exception as e:
             return HealthResponse(status=HealthStatus.ERROR, message=f"Health check failed: {str(e)}")
@@ -351,19 +340,14 @@ class VLLMInferenceAdapter(Inference, ModelsProtocolPrivate):
             raise ValueError("Model store not set")
         return await self.model_store.get_model(model_id)
 
-    def _lazy_initialize_client(self):
-        if self.client is not None:
-            return
+    def get_api_key(self):
+        return self.config.api_token
 
-        log.info(f"Initializing vLLM client with base_url={self.config.url}")
-        self.client = self._create_client()
+    def get_base_url(self):
+        return self.config.url
 
-    def _create_client(self):
-        return AsyncOpenAI(
-            base_url=self.config.url,
-            api_key=self.config.api_token,
-            http_client=httpx.AsyncClient(verify=self.config.tls_verify),
-        )
+    def get_extra_client_params(self):
+        return {"http_client": httpx.AsyncClient(verify=self.config.tls_verify)}
 
     async def completion(
         self,
@@ -374,7 +358,6 @@ class VLLMInferenceAdapter(Inference, ModelsProtocolPrivate):
         stream: bool | None = False,
         logprobs: LogProbConfig | None = None,
     ) -> CompletionResponse | AsyncGenerator[CompletionResponseStreamChunk, None]:
-        self._lazy_initialize_client()
         if sampling_params is None:
             sampling_params = SamplingParams()
         model = await self._get_model(model_id)
@@ -406,7 +389,6 @@ class VLLMInferenceAdapter(Inference, ModelsProtocolPrivate):
         logprobs: LogProbConfig | None = None,
         tool_config: ToolConfig | None = None,
     ) -> ChatCompletionResponse | AsyncGenerator[ChatCompletionResponseStreamChunk, None]:
-        self._lazy_initialize_client()
         if sampling_params is None:
             sampling_params = SamplingParams()
         model = await self._get_model(model_id)
@@ -479,16 +461,12 @@ class VLLMInferenceAdapter(Inference, ModelsProtocolPrivate):
             yield chunk
 
     async def register_model(self, model: Model) -> Model:
-        # register_model is called during Llama Stack initialization, hence we cannot init self.client if not initialized yet.
-        # self.client should only be created after the initialization is complete to avoid asyncio cross-context errors.
-        # Changing this may lead to unpredictable behavior.
-        client = self._create_client() if self.client is None else self.client
         try:
             model = await self.register_helper.register_model(model)
         except ValueError:
             pass  # Ignore statically unknown model, will check live listing
         try:
-            res = await client.models.list()
+            res = await self.client.models.list()
         except APIConnectionError as e:
             raise ValueError(
                 f"Failed to connect to vLLM at {self.config.url}. Please check if vLLM is running and accessible at that URL."
@@ -543,8 +521,6 @@ class VLLMInferenceAdapter(Inference, ModelsProtocolPrivate):
         output_dimension: int | None = None,
         task_type: EmbeddingTaskType | None = None,
     ) -> EmbeddingsResponse:
-        self._lazy_initialize_client()
-        assert self.client is not None
         model = await self._get_model(model_id)
 
         kwargs = {}
@@ -560,154 +536,3 @@ class VLLMInferenceAdapter(Inference, ModelsProtocolPrivate):
 
         embeddings = [data.embedding for data in response.data]
         return EmbeddingsResponse(embeddings=embeddings)
-
-    async def openai_embeddings(
-        self,
-        model: str,
-        input: str | list[str],
-        encoding_format: str | None = "float",
-        dimensions: int | None = None,
-        user: str | None = None,
-    ) -> OpenAIEmbeddingsResponse:
-        self._lazy_initialize_client()
-        assert self.client is not None
-        model_obj = await self._get_model(model)
-        assert model_obj.model_type == ModelType.embedding
-
-        # Convert input to list if it's a string
-        input_list = [input] if isinstance(input, str) else input
-
-        # Call vLLM embeddings endpoint with encoding_format
-        response = await self.client.embeddings.create(
-            model=model_obj.provider_resource_id,
-            input=input_list,
-            dimensions=dimensions,
-            encoding_format=encoding_format,
-        )
-
-        # Convert response to OpenAI format
-        data = [
-            OpenAIEmbeddingData(
-                embedding=embedding_data.embedding,
-                index=i,
-            )
-            for i, embedding_data in enumerate(response.data)
-        ]
-
-        # Not returning actual token usage since vLLM doesn't provide it
-        usage = OpenAIEmbeddingUsage(prompt_tokens=-1, total_tokens=-1)
-
-        return OpenAIEmbeddingsResponse(
-            data=data,
-            model=model_obj.provider_resource_id,
-            usage=usage,
-        )
-
-    async def openai_completion(
-        self,
-        model: str,
-        prompt: str | list[str] | list[int] | list[list[int]],
-        best_of: int | None = None,
-        echo: bool | None = None,
-        frequency_penalty: float | None = None,
-        logit_bias: dict[str, float] | None = None,
-        logprobs: bool | None = None,
-        max_tokens: int | None = None,
-        n: int | None = None,
-        presence_penalty: float | None = None,
-        seed: int | None = None,
-        stop: str | list[str] | None = None,
-        stream: bool | None = None,
-        stream_options: dict[str, Any] | None = None,
-        temperature: float | None = None,
-        top_p: float | None = None,
-        user: str | None = None,
-        guided_choice: list[str] | None = None,
-        prompt_logprobs: int | None = None,
-        suffix: str | None = None,
-    ) -> OpenAICompletion:
-        self._lazy_initialize_client()
-        model_obj = await self._get_model(model)
-
-        extra_body: dict[str, Any] = {}
-        if prompt_logprobs is not None and prompt_logprobs >= 0:
-            extra_body["prompt_logprobs"] = prompt_logprobs
-        if guided_choice:
-            extra_body["guided_choice"] = guided_choice
-
-        params = await prepare_openai_completion_params(
-            model=model_obj.provider_resource_id,
-            prompt=prompt,
-            best_of=best_of,
-            echo=echo,
-            frequency_penalty=frequency_penalty,
-            logit_bias=logit_bias,
-            logprobs=logprobs,
-            max_tokens=max_tokens,
-            n=n,
-            presence_penalty=presence_penalty,
-            seed=seed,
-            stop=stop,
-            stream=stream,
-            stream_options=stream_options,
-            temperature=temperature,
-            top_p=top_p,
-            user=user,
-            extra_body=extra_body,
-        )
-        return await self.client.completions.create(**params)  # type: ignore
-
-    async def openai_chat_completion(
-        self,
-        model: str,
-        messages: list[OpenAIMessageParam],
-        frequency_penalty: float | None = None,
-        function_call: str | dict[str, Any] | None = None,
-        functions: list[dict[str, Any]] | None = None,
-        logit_bias: dict[str, float] | None = None,
-        logprobs: bool | None = None,
-        max_completion_tokens: int | None = None,
-        max_tokens: int | None = None,
-        n: int | None = None,
-        parallel_tool_calls: bool | None = None,
-        presence_penalty: float | None = None,
-        response_format: OpenAIResponseFormatParam | None = None,
-        seed: int | None = None,
-        stop: str | list[str] | None = None,
-        stream: bool | None = None,
-        stream_options: dict[str, Any] | None = None,
-        temperature: float | None = None,
-        tool_choice: str | dict[str, Any] | None = None,
-        tools: list[dict[str, Any]] | None = None,
-        top_logprobs: int | None = None,
-        top_p: float | None = None,
-        user: str | None = None,
-    ) -> OpenAIChatCompletion | AsyncIterator[OpenAIChatCompletionChunk]:
-        self._lazy_initialize_client()
-        model_obj = await self._get_model(model)
-        params = await prepare_openai_completion_params(
-            model=model_obj.provider_resource_id,
-            messages=messages,
-            frequency_penalty=frequency_penalty,
-            function_call=function_call,
-            functions=functions,
-            logit_bias=logit_bias,
-            logprobs=logprobs,
-            max_completion_tokens=max_completion_tokens,
-            max_tokens=max_tokens,
-            n=n,
-            parallel_tool_calls=parallel_tool_calls,
-            presence_penalty=presence_penalty,
-            response_format=response_format,
-            seed=seed,
-            stop=stop,
-            stream=stream,
-            stream_options=stream_options,
-            temperature=temperature,
-            tool_choice=tool_choice,
-            tools=tools,
-            top_logprobs=top_logprobs,
-            top_p=top_p,
-            user=user,
-        )
-        return await self.client.chat.completions.create(**params)  # type: ignore
diff --git a/llama_stack/providers/utils/inference/openai_mixin.py b/llama_stack/providers/utils/inference/openai_mixin.py
index f60deee6e..a3c0ffadc 100644
--- a/llama_stack/providers/utils/inference/openai_mixin.py
+++ b/llama_stack/providers/utils/inference/openai_mixin.py
@@ -67,6 +67,17 @@ class OpenAIMixin(ABC):
         """
         pass
 
+    def get_extra_client_params(self) -> dict[str, Any]:
+        """
+        Get any extra parameters to pass to the AsyncOpenAI client.
+
+        Child classes can override this method to provide additional parameters
+        such as timeout settings, proxies, etc.
+
+        :return: A dictionary of extra parameters
+        """
+        return {}
+
     @property
     def client(self) -> AsyncOpenAI:
         """
@@ -78,6 +89,7 @@ class OpenAIMixin(ABC):
         return AsyncOpenAI(
             api_key=self.get_api_key(),
             base_url=self.get_base_url(),
+            **self.get_extra_client_params(),
         )
 
     async def _get_provider_model_id(self, model: str) -> str:
@@ -124,10 +136,15 @@ class OpenAIMixin(ABC):
         """
         Direct OpenAI completion API call.
         """
-        if guided_choice is not None:
-            logger.warning("guided_choice is not supported by the OpenAI API. Ignoring.")
-        if prompt_logprobs is not None:
-            logger.warning("prompt_logprobs is not supported by the OpenAI API. Ignoring.")
+        # Handle parameters that are not supported by OpenAI API, but may be by the provider
+        #  prompt_logprobs is supported by vLLM
+        #  guided_choice is supported by vLLM
+        # TODO: test coverage
+        extra_body: dict[str, Any] = {}
+        if prompt_logprobs is not None and prompt_logprobs >= 0:
+            extra_body["prompt_logprobs"] = prompt_logprobs
+        if guided_choice:
+            extra_body["guided_choice"] = guided_choice
 
         # TODO: fix openai_completion to return type compatible with OpenAI's API response
         return await self.client.completions.create(  # type: ignore[no-any-return]
@@ -150,7 +167,8 @@ class OpenAIMixin(ABC):
                 top_p=top_p,
                 user=user,
                 suffix=suffix,
-            )
+            ),
+            extra_body=extra_body,
         )
 
     async def openai_chat_completion(
diff --git a/tests/unit/providers/inference/test_remote_vllm.py b/tests/unit/providers/inference/test_remote_vllm.py
index ce0e930b1..a48af2a1d 100644
--- a/tests/unit/providers/inference/test_remote_vllm.py
+++ b/tests/unit/providers/inference/test_remote_vllm.py
@@ -11,7 +11,7 @@ import threading
 import time
 from http.server import BaseHTTPRequestHandler, HTTPServer
 from typing import Any
-from unittest.mock import AsyncMock, MagicMock, patch
+from unittest.mock import AsyncMock, MagicMock, PropertyMock, patch
 
 import pytest
 from openai.types.chat.chat_completion_chunk import (
@@ -150,10 +150,12 @@ async def test_tool_call_response(vllm_inference_adapter):
     """Verify that tool call arguments from a CompletionMessage are correctly converted
     into the expected JSON format."""
 
-    # Patch the call to vllm so we can inspect the arguments sent were correct
-    with patch.object(
-        vllm_inference_adapter.client.chat.completions, "create", new_callable=AsyncMock
-    ) as mock_nonstream_completion:
+    # Patch the client property to avoid instantiating a real AsyncOpenAI client
+    with patch.object(VLLMInferenceAdapter, "client", new_callable=PropertyMock) as mock_create_client:
+        mock_client = MagicMock()
+        mock_client.chat.completions.create = AsyncMock()
+        mock_create_client.return_value = mock_client
+
         messages = [
             SystemMessage(content="You are a helpful assistant"),
             UserMessage(content="How many?"),
@@ -179,7 +181,7 @@ async def test_tool_call_response(vllm_inference_adapter):
             tool_config=ToolConfig(tool_choice=ToolChoice.auto),
         )
 
-        assert mock_nonstream_completion.call_args.kwargs["messages"][2]["tool_calls"] == [
+        assert mock_client.chat.completions.create.call_args.kwargs["messages"][2]["tool_calls"] == [
             {
                 "id": "foo",
                 "type": "function",
@@ -641,9 +643,7 @@ async def test_health_status_success(vllm_inference_adapter):
     This test verifies that the health method returns a HealthResponse with status OK, only
     when the connection to the vLLM server is successful.
     """
-    # Set vllm_inference_adapter.client to None to ensure _create_client is called
-    vllm_inference_adapter.client = None
-    with patch.object(vllm_inference_adapter, "_create_client") as mock_create_client:
+    with patch.object(VLLMInferenceAdapter, "client", new_callable=PropertyMock) as mock_create_client:
         # Create mock client and models
         mock_client = MagicMock()
         mock_models = MagicMock()
@@ -674,8 +674,7 @@ async def test_health_status_failure(vllm_inference_adapter):
     This test verifies that the health method returns a HealthResponse with status ERROR
     and an appropriate error message when the connection to the vLLM server fails.
     """
-    vllm_inference_adapter.client = None
-    with patch.object(vllm_inference_adapter, "_create_client") as mock_create_client:
+    with patch.object(VLLMInferenceAdapter, "client", new_callable=PropertyMock) as mock_create_client:
         # Create mock client and models
         mock_client = MagicMock()
         mock_models = MagicMock()

From 72387b4bd229bba60b43f95679da62630fc0f3c7 Mon Sep 17 00:00:00 2001
From: Matthew Farrellee <matt@cs.wisc.edu>
Date: Thu, 11 Sep 2025 11:45:16 -0400
Subject: [PATCH 76/76] chore(unit tests): remove network use, update async
 test (#3418)

# What does this PR do?

update the async detection test for vllm

- remove a network access from unit tests
- remove direct logging use

the idea behind the test is to mock inference w/ a sleep, initiate
concurrent inference calls, verify the total execution time is close to
the sleep time. in a non-async env the total time would be closer to
sleep * num concurrent calls.


## Test Plan

ci
---
 .../providers/inference/test_remote_vllm.py   | 160 +++++++-----------
 1 file changed, 60 insertions(+), 100 deletions(-)

diff --git a/tests/unit/providers/inference/test_remote_vllm.py b/tests/unit/providers/inference/test_remote_vllm.py
index a48af2a1d..61b16b5d1 100644
--- a/tests/unit/providers/inference/test_remote_vllm.py
+++ b/tests/unit/providers/inference/test_remote_vllm.py
@@ -6,11 +6,7 @@
 
 import asyncio
 import json
-import logging  # allow-direct-logging
-import threading
 import time
-from http.server import BaseHTTPRequestHandler, HTTPServer
-from typing import Any
 from unittest.mock import AsyncMock, MagicMock, PropertyMock, patch
 
 import pytest
@@ -18,7 +14,7 @@ from openai.types.chat.chat_completion_chunk import (
     ChatCompletionChunk as OpenAIChatCompletionChunk,
 )
 from openai.types.chat.chat_completion_chunk import (
-    Choice as OpenAIChoice,
+    Choice as OpenAIChoiceChunk,
 )
 from openai.types.chat.chat_completion_chunk import (
     ChoiceDelta as OpenAIChoiceDelta,
@@ -35,6 +31,9 @@ from llama_stack.apis.inference import (
     ChatCompletionRequest,
     ChatCompletionResponseEventType,
     CompletionMessage,
+    OpenAIAssistantMessageParam,
+    OpenAIChatCompletion,
+    OpenAIChoice,
     SystemMessage,
     ToolChoice,
     ToolConfig,
@@ -61,41 +60,6 @@ from llama_stack.providers.remote.inference.vllm.vllm import (
 # -v -s --tb=short --disable-warnings
 
 
-class MockInferenceAdapterWithSleep:
-    def __init__(self, sleep_time: int, response: dict[str, Any]):
-        self.httpd = None
-
-        class DelayedRequestHandler(BaseHTTPRequestHandler):
-            # ruff: noqa: N802
-            def do_POST(self):
-                time.sleep(sleep_time)
-                response_body = json.dumps(response).encode("utf-8")
-                self.send_response(code=200)
-                self.send_header("Content-Type", "application/json")
-                self.send_header("Content-Length", len(response_body))
-                self.end_headers()
-                self.wfile.write(response_body)
-
-        self.request_handler = DelayedRequestHandler
-
-    def __enter__(self):
-        httpd = HTTPServer(("", 0), self.request_handler)
-        self.httpd = httpd
-        host, port = httpd.server_address
-        httpd_thread = threading.Thread(target=httpd.serve_forever)
-        httpd_thread.daemon = True  # stop server if this thread terminates
-        httpd_thread.start()
-
-        config = VLLMInferenceAdapterConfig(url=f"http://{host}:{port}")
-        inference_adapter = VLLMInferenceAdapter(config)
-        return inference_adapter
-
-    def __exit__(self, _exc_type, _exc_value, _traceback):
-        if self.httpd:
-            self.httpd.shutdown()
-            self.httpd.server_close()
-
-
 @pytest.fixture(scope="module")
 def mock_openai_models_list():
     with patch("openai.resources.models.AsyncModels.list", new_callable=AsyncMock) as mock_list:
@@ -201,7 +165,7 @@ async def test_tool_call_delta_empty_tool_call_buf():
 
     async def mock_stream():
         delta = OpenAIChoiceDelta(content="", tool_calls=None)
-        choices = [OpenAIChoice(delta=delta, finish_reason="stop", index=0)]
+        choices = [OpenAIChoiceChunk(delta=delta, finish_reason="stop", index=0)]
         mock_chunk = OpenAIChatCompletionChunk(
             id="chunk-1",
             created=1,
@@ -227,7 +191,7 @@ async def test_tool_call_delta_streaming_arguments_dict():
             model="foo",
             object="chat.completion.chunk",
             choices=[
-                OpenAIChoice(
+                OpenAIChoiceChunk(
                     delta=OpenAIChoiceDelta(
                         content="",
                         tool_calls=[
@@ -252,7 +216,7 @@ async def test_tool_call_delta_streaming_arguments_dict():
             model="foo",
             object="chat.completion.chunk",
             choices=[
-                OpenAIChoice(
+                OpenAIChoiceChunk(
                     delta=OpenAIChoiceDelta(
                         content="",
                         tool_calls=[
@@ -277,7 +241,9 @@ async def test_tool_call_delta_streaming_arguments_dict():
             model="foo",
             object="chat.completion.chunk",
             choices=[
-                OpenAIChoice(delta=OpenAIChoiceDelta(content="", tool_calls=None), finish_reason="tool_calls", index=0)
+                OpenAIChoiceChunk(
+                    delta=OpenAIChoiceDelta(content="", tool_calls=None), finish_reason="tool_calls", index=0
+                )
             ],
         )
         for chunk in [mock_chunk_1, mock_chunk_2, mock_chunk_3]:
@@ -301,7 +267,7 @@ async def test_multiple_tool_calls():
             model="foo",
             object="chat.completion.chunk",
             choices=[
-                OpenAIChoice(
+                OpenAIChoiceChunk(
                     delta=OpenAIChoiceDelta(
                         content="",
                         tool_calls=[
@@ -326,7 +292,7 @@ async def test_multiple_tool_calls():
             model="foo",
             object="chat.completion.chunk",
             choices=[
-                OpenAIChoice(
+                OpenAIChoiceChunk(
                     delta=OpenAIChoiceDelta(
                         content="",
                         tool_calls=[
@@ -351,7 +317,9 @@ async def test_multiple_tool_calls():
             model="foo",
             object="chat.completion.chunk",
             choices=[
-                OpenAIChoice(delta=OpenAIChoiceDelta(content="", tool_calls=None), finish_reason="tool_calls", index=0)
+                OpenAIChoiceChunk(
+                    delta=OpenAIChoiceDelta(content="", tool_calls=None), finish_reason="tool_calls", index=0
+                )
             ],
         )
         for chunk in [mock_chunk_1, mock_chunk_2, mock_chunk_3]:
@@ -395,59 +363,6 @@ async def test_process_vllm_chat_completion_stream_response_no_choices():
     assert chunks[0].event.event_type.value == "start"
 
 
-@pytest.mark.allow_network
-def test_chat_completion_doesnt_block_event_loop(caplog):
-    loop = asyncio.new_event_loop()
-    loop.set_debug(True)
-    caplog.set_level(logging.WARNING)
-
-    # Log when event loop is blocked for more than 200ms
-    loop.slow_callback_duration = 0.5
-    # Sleep for 500ms in our delayed http response
-    sleep_time = 0.5
-
-    mock_model = Model(identifier="mock-model", provider_resource_id="mock-model", provider_id="vllm-inference")
-    mock_response = {
-        "id": "chatcmpl-abc123",
-        "object": "chat.completion",
-        "created": 1,
-        "modle": "mock-model",
-        "choices": [
-            {
-                "message": {"content": ""},
-                "logprobs": None,
-                "finish_reason": "stop",
-                "index": 0,
-            }
-        ],
-    }
-
-    async def do_chat_completion():
-        await inference_adapter.chat_completion(
-            "mock-model",
-            [],
-            stream=False,
-            tools=None,
-            tool_config=ToolConfig(tool_choice=ToolChoice.auto),
-        )
-
-    with MockInferenceAdapterWithSleep(sleep_time, mock_response) as inference_adapter:
-        inference_adapter.model_store = AsyncMock()
-        inference_adapter.model_store.get_model.return_value = mock_model
-        loop.run_until_complete(inference_adapter.initialize())
-
-        # Clear the logs so far and run the actual chat completion we care about
-        caplog.clear()
-        loop.run_until_complete(do_chat_completion())
-
-    # Ensure we don't have any asyncio warnings in the captured log
-    # records from our chat completion call. A message gets logged
-    # here any time we exceed the slow_callback_duration configured
-    # above.
-    asyncio_warnings = [record.message for record in caplog.records if record.name == "asyncio"]
-    assert not asyncio_warnings
-
-
 async def test_get_params_empty_tools(vllm_inference_adapter):
     request = ChatCompletionRequest(
         tools=[],
@@ -696,3 +611,48 @@ async def test_health_status_failure(vllm_inference_adapter):
         assert "Health check failed: Connection failed" in health_response["message"]
 
         mock_models.list.assert_called_once()
+
+
+async def test_openai_chat_completion_is_async(vllm_inference_adapter):
+    """
+    Verify that openai_chat_completion is async and doesn't block the event loop.
+
+    To do this we mock the underlying inference with a sleep, start multiple
+    inference calls in parallel, and ensure the total time taken is less
+    than the sum of the individual sleep times.
+    """
+    sleep_time = 0.5
+
+    async def mock_create(*args, **kwargs):
+        await asyncio.sleep(sleep_time)
+        return OpenAIChatCompletion(
+            id="chatcmpl-abc123",
+            created=1,
+            model="mock-model",
+            choices=[
+                OpenAIChoice(
+                    message=OpenAIAssistantMessageParam(
+                        content="nothing interesting",
+                    ),
+                    finish_reason="stop",
+                    index=0,
+                )
+            ],
+        )
+
+    async def do_inference():
+        await vllm_inference_adapter.openai_chat_completion(
+            "mock-model", messages=["one fish", "two fish"], stream=False
+        )
+
+    with patch.object(VLLMInferenceAdapter, "client", new_callable=PropertyMock) as mock_create_client:
+        mock_client = MagicMock()
+        mock_client.chat.completions.create = AsyncMock(side_effect=mock_create)
+        mock_create_client.return_value = mock_client
+
+        start_time = time.time()
+        await asyncio.gather(do_inference(), do_inference(), do_inference(), do_inference())
+        total_time = time.time() - start_time
+
+        assert mock_create_client.call_count == 4  # no cheating
+        assert total_time < (sleep_time * 2), f"Total time taken: {total_time}s exceeded expected max"