feat(tests): auto-merge all model list responses and unify recordings (#3320)

Previously, one needed to specify record-replay related environment variables to run the integration tests. We could not use defaults because integration tests could be run against Ollama instances which could be running different models. For example, text vs. vision tests needed separate instances of Ollama because a single instance typically cannot serve both of these models if you assume the standard CI worker configuration on GitHub. As a result, `client.list()` as returned by the Ollama client would differ between these runs and we'd end up overwriting responses. This PR "solves" it by adding a small amount of complexity -- we store model list responses specially, keyed by the hashes of the models they return. At replay time, we merge all of them and pretend that we have the union of all models available.

## Test Plan

Re-recorded all the tests using `scripts/integration-tests.sh --inference-mode record`, including the vision tests.
2025-10-04 04:04:14 +00:00 · 2025-09-03 11:33:03 -07:00 · 2025-09-03 11:33:03 -07:00 · c3d3a0b833
commit c3d3a0b833
parent d948e63340
122 changed files with 17460 additions and 16129 deletions
--- a/tests/integration/recordings/responses/0b3f2e4754ff.json
+++ b/tests/integration/recordings/responses/0b3f2e4754ff.json
@ -24,7 +24,7 @@
      {
        "__type__": "openai.types.chat.chat_completion_chunk.ChatCompletionChunk",
        "__data__": {
-          "id": "chatcmpl-29",
+          "id": "chatcmpl-414",
          "choices": [
            {
              "delta": {
@ -39,7 +39,7 @@
              "logprobs": null
            }
          ],
-          "created": 1754090031,
+          "created": 1756921333,
          "model": "llama3.2:3b-instruct-fp16",
          "object": "chat.completion.chunk",
          "service_tier": null,
@ -50,7 +50,7 @@
      {
        "__type__": "openai.types.chat.chat_completion_chunk.ChatCompletionChunk",
        "__data__": {
-          "id": "chatcmpl-29",
+          "id": "chatcmpl-414",
          "choices": [
            {
              "delta": {
@ -65,7 +65,7 @@
              "logprobs": null
            }
          ],
-          "created": 1754090031,
+          "created": 1756921333,
          "model": "llama3.2:3b-instruct-fp16",
          "object": "chat.completion.chunk",
          "service_tier": null,
@ -76,7 +76,7 @@
      {
        "__type__": "openai.types.chat.chat_completion_chunk.ChatCompletionChunk",
        "__data__": {
-          "id": "chatcmpl-29",
+          "id": "chatcmpl-414",
          "choices": [
            {
              "delta": {
@ -91,7 +91,7 @@
              "logprobs": null
            }
          ],
-          "created": 1754090031,
+          "created": 1756921333,
          "model": "llama3.2:3b-instruct-fp16",
          "object": "chat.completion.chunk",
          "service_tier": null,
@ -102,7 +102,7 @@
      {
        "__type__": "openai.types.chat.chat_completion_chunk.ChatCompletionChunk",
        "__data__": {
-          "id": "chatcmpl-29",
+          "id": "chatcmpl-414",
          "choices": [
            {
              "delta": {
@ -117,7 +117,7 @@
              "logprobs": null
            }
          ],
-          "created": 1754090031,
+          "created": 1756921333,
          "model": "llama3.2:3b-instruct-fp16",
          "object": "chat.completion.chunk",
          "service_tier": null,
@ -128,7 +128,7 @@
      {
        "__type__": "openai.types.chat.chat_completion_chunk.ChatCompletionChunk",
        "__data__": {
-          "id": "chatcmpl-29",
+          "id": "chatcmpl-414",
          "choices": [
            {
              "delta": {
@ -143,7 +143,7 @@
              "logprobs": null
            }
          ],
-          "created": 1754090031,
+          "created": 1756921334,
          "model": "llama3.2:3b-instruct-fp16",
          "object": "chat.completion.chunk",
          "service_tier": null,
@ -154,7 +154,7 @@
      {
        "__type__": "openai.types.chat.chat_completion_chunk.ChatCompletionChunk",
        "__data__": {
-          "id": "chatcmpl-29",
+          "id": "chatcmpl-414",
          "choices": [
            {
              "delta": {
@ -169,7 +169,7 @@
              "logprobs": null
            }
          ],
-          "created": 1754090031,
+          "created": 1756921334,
          "model": "llama3.2:3b-instruct-fp16",
          "object": "chat.completion.chunk",
          "service_tier": null,
@ -180,7 +180,7 @@
      {
        "__type__": "openai.types.chat.chat_completion_chunk.ChatCompletionChunk",
        "__data__": {
-          "id": "chatcmpl-29",
+          "id": "chatcmpl-414",
          "choices": [
            {
              "delta": {
@ -195,7 +195,7 @@
              "logprobs": null
            }
          ],
-          "created": 1754090031,
+          "created": 1756921334,
          "model": "llama3.2:3b-instruct-fp16",
          "object": "chat.completion.chunk",
          "service_tier": null,
@ -206,7 +206,7 @@
      {
        "__type__": "openai.types.chat.chat_completion_chunk.ChatCompletionChunk",
        "__data__": {
-          "id": "chatcmpl-29",
+          "id": "chatcmpl-414",
          "choices": [
            {
              "delta": {
@ -221,7 +221,7 @@
              "logprobs": null
            }
          ],
-          "created": 1754090031,
+          "created": 1756921334,
          "model": "llama3.2:3b-instruct-fp16",
          "object": "chat.completion.chunk",
          "service_tier": null,