feat(tests): implement test isolation for inference recordings (#3681)

Uses test_id in request hashes and test-scoped subdirectories to prevent
cross-test contamination. Model list endpoints exclude test_id to enable
merging recordings from different servers.

Additionally, this PR adds a very useful `record-if-missing` mode, which
we will use instead of `record` (which records everything).

🤖 Co-authored with [Claude Code](https://claude.com/claude-code)

---------

Co-authored-by: Claude <noreply@anthropic.com>
This commit is contained in:
Ashwin Bharambe 2025-10-04 11:34:18 -07:00 committed by GitHub
parent f176196fba
commit 045a0c1d57
No known key found for this signature in database
GPG key ID: B5690EEEBB952194
428 changed files with 85345 additions and 104330 deletions

File diff suppressed because one or more lines are too long

File diff suppressed because one or more lines are too long

View file

@ -0,0 +1,422 @@
{
"test_id": "tests/integration/inference/test_openai_embeddings.py::test_openai_embeddings_with_user_parameter[llama_stack_client-emb=ollama/all-minilm:l6-v2]",
"request": {
"method": "POST",
"url": "http://0.0.0.0:11434/v1/v1/embeddings",
"headers": {},
"body": {
"model": "all-minilm:l6-v2",
"input": "Test user parameter",
"encoding_format": "float",
"user": "test-user-123"
},
"endpoint": "/v1/embeddings",
"model": "all-minilm:l6-v2"
},
"response": {
"body": {
"__type__": "openai.types.create_embedding_response.CreateEmbeddingResponse",
"__data__": {
"data": [
{
"embedding": [
0.043779343,
0.021533398,
-0.081306435,
0.010584965,
-0.079082854,
-0.03219143,
0.13092613,
0.04234389,
-0.11600539,
-0.07588513,
0.04182356,
-0.08061255,
0.038127176,
-0.010701234,
0.015768763,
-0.04193689,
0.04310592,
-0.033361685,
0.013566423,
-0.010392366,
0.015551022,
-0.037858423,
-0.050305344,
-0.025666261,
-0.047879875,
-0.087179765,
0.016856788,
-0.036765736,
0.006393739,
0.020844297,
0.11262393,
-0.002143682,
-0.07910913,
0.038748607,
0.11532516,
-0.019759571,
0.0066967797,
-0.021164352,
-0.014471563,
-0.0027048697,
-0.034388524,
-0.052571636,
-0.030607725,
0.04747725,
-0.02431059,
0.0109337615,
-0.03946421,
0.071846664,
-0.020690937,
0.01898796,
0.042931512,
-0.0077551426,
0.0025911122,
-0.058268107,
0.0117475465,
-0.022701943,
0.0017815019,
-0.012612941,
0.030724185,
0.017728312,
-0.06155491,
-0.03656162,
0.02583153,
0.02537894,
0.012139213,
0.009105951,
-0.027318193,
-0.093389414,
0.005184693,
0.007488449,
-0.07540277,
0.010159999,
-0.028444426,
0.030260745,
0.0036438918,
-0.022627153,
-0.037846327,
-0.08381657,
-0.012445195,
-0.048908208,
0.029149827,
-0.044437535,
-0.07520237,
-0.020924438,
0.06342514,
0.1629199,
0.060563333,
-0.012817673,
-0.031030292,
0.018368995,
0.11223112,
0.07292473,
-0.062686674,
-0.031803295,
-0.017489262,
0.048433464,
-0.041148387,
-0.04183779,
-0.05994369,
0.15909556,
-0.027785666,
-0.012455991,
0.056005318,
-0.019891974,
0.022063067,
0.006342065,
0.0464118,
-0.07311654,
0.033282198,
0.05949105,
-0.033307947,
0.030738499,
0.008186239,
-0.020268966,
0.056593496,
-0.081526734,
0.023390312,
0.0060836566,
-0.07992586,
0.013986445,
0.052250065,
0.027186505,
-0.049284942,
0.028148174,
0.019493744,
0.05418436,
0.0827222,
-1.8825437e-33,
0.01360945,
-0.010870715,
0.015887791,
0.069373555,
-0.051129147,
0.08999179,
0.044494778,
0.08100757,
0.018944906,
-0.020974122,
-0.017938385,
-0.021756735,
0.010972489,
0.015099965,
0.017018452,
0.094338946,
0.0034407445,
0.010244923,
-0.044709302,
0.0018059182,
0.015817573,
-0.065777056,
-0.004948138,
0.0044092103,
-0.019589791,
-0.092789896,
-0.025898295,
0.044104066,
0.0541385,
-0.007362511,
-0.021487307,
-0.036836285,
-0.09148704,
0.084001675,
-0.018094191,
0.003797567,
0.020257449,
0.04394643,
-0.0772898,
0.0057312953,
-0.054519102,
-0.024835315,
0.0753162,
0.034552757,
-0.081203006,
-0.12210961,
-0.0053012627,
0.00780717,
0.050265096,
0.015569535,
-0.056362487,
0.039800324,
0.013022089,
-0.04015537,
0.014401654,
-0.033209093,
-0.008451782,
-0.037590392,
-0.01965779,
0.01730637,
-0.00896531,
-0.0018413392,
-0.0030382746,
0.030460354,
-0.05112036,
-0.086875,
-0.018338922,
-0.11328767,
0.07325826,
0.046035297,
0.012633494,
-0.06343216,
-0.028439038,
0.020128354,
-0.07883383,
-0.00069870794,
-0.03155447,
0.12306934,
0.004300722,
-0.026421167,
0.078361824,
-0.077461444,
-0.021267027,
0.048929654,
0.02919381,
-0.0092880055,
-0.030666346,
-0.04102384,
-0.03860138,
-0.08042292,
0.023227168,
0.04191858,
-0.058156747,
0.0585743,
0.076342255,
4.465569e-34,
-0.019599343,
0.040230304,
0.01455632,
0.034345042,
0.04392999,
-0.023241352,
0.067749046,
-0.03010354,
-0.09075954,
-0.019227842,
-0.027724287,
-0.00062344945,
0.0042892746,
0.053643614,
0.04075099,
0.032581333,
-0.107116826,
-0.0500636,
-0.016655827,
-0.007782394,
-0.111523,
0.07476429,
-0.016019335,
-0.050536986,
-0.11320647,
-0.0061384854,
0.050886273,
-0.030283457,
0.04318923,
0.03301474,
0.02362771,
0.046507858,
-0.03416386,
0.036145207,
0.023037339,
-0.026803765,
0.06361122,
0.09975251,
0.035269737,
0.1554014,
0.083479255,
0.10931981,
0.046847064,
-0.010136355,
-0.032541983,
0.12926093,
0.031193413,
-0.09971323,
0.010830718,
0.02325219,
-0.011917061,
0.010155018,
0.06883269,
0.009340846,
-0.022698723,
-0.042815465,
-0.048211087,
-0.085067384,
0.05105234,
0.045155898,
-0.03564869,
0.06549556,
0.048875004,
0.037915554,
-0.14071068,
-0.067095764,
0.009898252,
-0.0049653547,
-0.044304688,
0.0039006064,
-0.026903173,
-0.066124685,
0.040738244,
-0.052228633,
0.060485654,
-0.041119356,
-0.04312945,
-0.025152665,
0.08556276,
-0.044942576,
0.06393979,
-0.024227533,
-0.05052092,
-0.0020624825,
-0.078943975,
0.0026753,
0.02068896,
0.102683865,
-0.01237572,
0.056172684,
0.06552171,
0.030940128,
-0.07721113,
-0.061241012,
-0.016143149,
-1.3511957e-08,
-0.050416306,
-0.033628013,
0.046722032,
0.04744138,
-0.04411888,
0.04631675,
-0.0060847937,
-0.053873356,
0.013075445,
0.050437532,
-0.009895477,
-0.0041795173,
0.07229928,
0.021081135,
0.02672776,
-0.07482113,
-0.026757998,
0.052755926,
-0.034690056,
0.039811596,
-0.016370349,
0.045900222,
-0.02250936,
0.023861,
0.04912799,
0.09111738,
-0.0024878879,
0.049395334,
-0.03861115,
0.020867983,
0.076049894,
0.084881924,
-0.051956687,
-0.06878504,
-0.061384037,
0.077220954,
-0.06454818,
0.044513144,
0.008181126,
0.015890416,
-0.04280811,
0.005317184,
0.0034429359,
0.0031937633,
-0.013058055,
-0.09134677,
0.06425565,
-0.054977305,
0.0007087448,
-0.06258866,
-0.034974415,
-0.029966963,
0.044276785,
0.017868131,
-0.027976807,
-0.036579583,
0.021142753,
0.06057356,
-0.03133335,
-0.014331035,
0.034653842,
0.052315667,
-0.036585484,
0.028209662
],
"index": 0,
"object": "embedding"
}
],
"model": "all-minilm:l6-v2",
"object": "list",
"usage": {
"prompt_tokens": 3,
"total_tokens": 3
}
}
},
"is_streaming": false
}
}

View file

@ -0,0 +1,122 @@
{
"request": {
"method": "POST",
"url": "http://0.0.0.0:11434/v1/v1/chat/completions",
"headers": {},
"body": {
"model": "llama3.2:3b-instruct-fp16",
"messages": [
{
"role": "user",
"content": "Use one of the available tools"
}
],
"tools": [
{
"type": "function",
"function": {
"name": "simple",
"parameters": {
"type": "object",
"properties": {
"x": {
"type": "string"
}
}
}
}
},
{
"type": "function",
"function": {
"name": "complex",
"parameters": {
"type": "object",
"properties": {
"data": {
"$ref": "#/$defs/Complex"
}
},
"$defs": {
"Complex": {
"type": "object",
"properties": {
"nested": {
"type": "array",
"items": {
"type": "number"
}
}
}
}
}
}
}
},
{
"type": "function",
"function": {
"name": "with_output",
"parameters": {
"type": "object",
"properties": {
"input": {
"type": "string"
}
}
}
}
}
]
},
"endpoint": "/v1/chat/completions",
"model": "llama3.2:3b-instruct-fp16"
},
"response": {
"body": {
"__type__": "openai.types.chat.chat_completion.ChatCompletion",
"__data__": {
"id": "rec-e0c71820f395",
"choices": [
{
"finish_reason": "tool_calls",
"index": 0,
"logprobs": null,
"message": {
"content": "",
"refusal": null,
"role": "assistant",
"annotations": null,
"audio": null,
"function_call": null,
"tool_calls": [
{
"id": "call_vxiwiifd",
"function": {
"arguments": "{\"x\":\"\"}",
"name": "simple"
},
"type": "function",
"index": 0
}
]
}
}
],
"created": 0,
"model": "llama3.2:3b-instruct-fp16",
"object": "chat.completion",
"service_tier": null,
"system_fingerprint": "fp_ollama",
"usage": {
"completion_tokens": 15,
"prompt_tokens": 246,
"total_tokens": 261,
"completion_tokens_details": null,
"prompt_tokens_details": null
}
}
},
"is_streaming": false
}
}

View file

@ -0,0 +1,78 @@
{
"test_id": "tests/integration/inference/test_openai_embeddings.py::test_openai_embeddings_with_dimensions[llama_stack_client-emb=ollama/all-minilm:l6-v2]",
"request": {
"method": "POST",
"url": "http://localhost:11434/api/ps",
"headers": {},
"body": {},
"endpoint": "/api/ps",
"model": ""
},
"response": {
"body": {
"__type__": "ollama._types.ProcessResponse",
"__data__": {
"models": [
{
"model": "all-minilm:l6-v2",
"name": "all-minilm:l6-v2",
"digest": "1b226e2802dbb772b5fc32a58f103ca1804ef7501331012de126ab22f67475ef",
"expires_at": "2025-10-03T20:06:55.143331-07:00",
"size": 585846784,
"size_vram": 585846784,
"details": {
"parent_model": "",
"format": "gguf",
"family": "bert",
"families": [
"bert"
],
"parameter_size": "23M",
"quantization_level": "F16"
},
"context_length": 256
},
{
"model": "llama3.2:3b-instruct-fp16",
"name": "llama3.2:3b-instruct-fp16",
"digest": "195a8c01d91ec3cb1e0aad4624a51f2602c51fa7d96110f8ab5a20c84081804d",
"expires_at": "2025-10-03T20:06:54.261283-07:00",
"size": 7919570944,
"size_vram": 7919570944,
"details": {
"parent_model": "",
"format": "gguf",
"family": "llama",
"families": [
"llama"
],
"parameter_size": "3.2B",
"quantization_level": "F16"
},
"context_length": 4096
},
{
"model": "llama-guard3:1b",
"name": "llama-guard3:1b",
"digest": "494147e06bf99e10dbe67b63a07ac81c162f18ef3341aa3390007ac828571b3b",
"expires_at": "2025-10-03T20:06:23.356289-07:00",
"size": 2350966784,
"size_vram": 2350966784,
"details": {
"parent_model": "",
"format": "gguf",
"family": "llama",
"families": [
"llama"
],
"parameter_size": "1.5B",
"quantization_level": "Q8_0"
},
"context_length": 4096
}
]
}
},
"is_streaming": false
}
}

View file

@ -0,0 +1,422 @@
{
"test_id": "tests/integration/inference/test_openai_embeddings.py::test_openai_embeddings_with_dimensions[llama_stack_client-emb=ollama/all-minilm:l6-v2]",
"request": {
"method": "POST",
"url": "http://0.0.0.0:11434/v1/v1/embeddings",
"headers": {},
"body": {
"model": "all-minilm:l6-v2",
"input": "Test dimensions parameter",
"encoding_format": "float",
"dimensions": 16
},
"endpoint": "/v1/embeddings",
"model": "all-minilm:l6-v2"
},
"response": {
"body": {
"__type__": "openai.types.create_embedding_response.CreateEmbeddingResponse",
"__data__": {
"data": [
{
"embedding": [
0.04635219,
0.002988263,
-0.054220885,
0.057812735,
-0.0340614,
0.013923248,
-0.005755826,
0.054555666,
-0.09073176,
-0.066910096,
0.046287432,
-0.060912322,
0.0010950539,
0.025724398,
-0.025169374,
-0.026821515,
-0.030190151,
0.0019341545,
-0.0754819,
0.057380512,
0.020332545,
-0.005591279,
-0.0022273492,
0.012063173,
-0.011033521,
-0.03300947,
0.05462081,
0.014426073,
0.024025004,
0.004224287,
0.09837723,
0.08385713,
-0.049175426,
0.03877149,
0.08748876,
-0.0223024,
0.006552746,
-0.0070359865,
0.017893821,
0.015465863,
0.05007282,
-0.019349905,
0.064887345,
0.03184605,
0.0034936152,
0.02317752,
-0.06297051,
0.044468515,
-0.022246253,
-0.017976552,
0.040390052,
-0.0020998395,
-0.05173264,
0.014722753,
0.01640469,
-0.06438627,
-0.043313596,
-0.040564552,
0.044412937,
-0.0031199565,
-0.007237415,
-0.05158015,
0.059660934,
-0.014839656,
0.012902056,
0.028181136,
-0.019578207,
-0.0664231,
-0.06333673,
0.028995825,
-0.114707075,
0.041575413,
-0.022128351,
0.01979776,
0.0630018,
0.011822141,
-0.06492722,
-0.066328146,
0.021114407,
-0.020638306,
-0.009599678,
0.013701863,
-0.060742326,
0.005395315,
0.026589092,
0.11719033,
0.067120634,
0.008300158,
0.036319703,
0.00772981,
0.071582936,
0.019818509,
-0.15945566,
0.047943458,
0.00031571978,
-0.04666597,
0.007148715,
-0.08839544,
0.038042437,
0.06620088,
0.034336157,
-0.035366412,
0.041598067,
0.073756054,
-0.018818064,
-0.017260034,
0.058635473,
-0.01371376,
0.048319146,
-0.023727186,
0.024134034,
0.015763162,
0.06681245,
0.01748244,
0.0825409,
-0.044568237,
0.0015441044,
-0.011225885,
0.0153481,
-0.061364066,
0.05792184,
0.044216745,
-0.047036964,
-0.02634555,
-0.033504363,
0.06713578,
0.030866034,
2.024336e-34,
-0.03532978,
0.021929236,
0.030160688,
0.09271786,
-0.010355268,
0.07196569,
0.052604284,
0.085753724,
0.094942175,
0.053786535,
-0.08900509,
-0.024382822,
-0.008744401,
-0.03167582,
0.01025236,
0.1818434,
-0.0022662894,
0.118558116,
-0.072208576,
-0.005867667,
0.0746222,
-0.024001855,
-0.013938801,
-0.030681474,
-0.029207803,
-0.117624186,
-0.046466038,
-0.002622228,
-0.0902171,
-0.038626853,
-0.037497964,
-0.02418436,
-0.069297835,
0.06424038,
0.0045628003,
-0.0041498984,
-0.01649947,
0.051125433,
-0.0058985935,
-0.0122523345,
-0.047424458,
-0.007806876,
0.07906618,
0.03244041,
-0.044682544,
-0.022625683,
0.028852794,
-0.050480433,
0.043801326,
-0.023512814,
-0.029832385,
0.031089257,
0.07129686,
-0.089649536,
0.011963804,
-0.018448317,
0.019637493,
0.020081993,
0.0012980831,
0.093201645,
-0.064436235,
-0.040581323,
-0.01193043,
0.043884862,
-0.010675756,
-0.030739127,
0.005605308,
-0.110498495,
0.044510514,
0.037110664,
0.04116233,
-0.039460793,
-0.04470639,
-0.027589805,
-0.02073358,
-0.067221105,
0.050390884,
0.031397663,
-0.008031462,
-0.009285899,
0.0013141648,
-0.017254544,
0.010367782,
-0.05940024,
-0.018042587,
-0.15487815,
0.0069424273,
-0.05208202,
0.0014201442,
-0.13956298,
-0.040203292,
0.027910054,
-0.064872995,
-0.016270144,
0.07052549,
5.3188943e-34,
0.012666737,
0.016728623,
-0.013163009,
0.06391275,
-0.043404065,
0.015435096,
0.03720438,
0.05997576,
-0.07789181,
-0.0408386,
0.024137221,
-0.019834999,
-0.034739267,
0.00042199617,
0.048484907,
0.08716056,
-0.101133205,
-0.07535088,
-0.03912376,
-0.031597532,
-0.052266575,
0.022085808,
-0.011040282,
0.005077135,
-0.088432744,
-0.010477913,
0.047780182,
-0.073345095,
0.014382301,
0.038075384,
0.02176859,
-0.029071847,
-0.036925532,
0.14317243,
0.020646103,
-0.08367964,
0.111576855,
-0.009943396,
0.023071144,
0.0926832,
0.011242715,
0.068017475,
-0.007714686,
0.03060742,
-0.011360289,
0.109015204,
0.12930514,
-0.07566831,
0.09001269,
-0.0090979,
0.0148039665,
0.048663232,
0.08894293,
0.038565516,
0.005821986,
0.016084671,
-0.106283545,
-0.033372246,
0.05440088,
-0.005663873,
0.0011572369,
-0.024969472,
0.043092247,
-0.009314855,
-0.11836073,
-0.027310666,
0.009811885,
-0.0052975323,
-0.044883158,
0.066436425,
-0.06750139,
-0.02696421,
0.01402391,
-0.04950559,
-0.084093384,
-0.07380851,
0.04709705,
4.9404687e-05,
0.01672617,
0.01849747,
0.027683195,
0.0047972985,
0.0017495222,
0.07066204,
-0.022430636,
0.06875498,
0.093927115,
0.11101308,
-0.015589739,
0.021178465,
0.033638563,
0.034676168,
-0.026882911,
-0.010514364,
0.0073013064,
-1.2070348e-08,
-0.10034882,
-0.028641108,
-0.061462097,
-0.009792086,
-0.081652306,
-0.011814046,
0.002039501,
0.010384326,
0.01639641,
0.09542911,
0.012538498,
-0.03542602,
0.018125113,
0.062750235,
0.0007333235,
-0.13612862,
-0.049830034,
0.021177148,
0.006589976,
0.007859552,
-0.03270378,
0.024738451,
-0.02542262,
-0.0033008803,
0.030640591,
-0.032442387,
0.04598555,
0.03903257,
0.035755396,
0.01686084,
0.13498692,
0.028296864,
-0.0035224769,
-0.036735818,
-0.046355885,
0.057701495,
0.008000554,
0.047822826,
0.04911064,
0.035214324,
-0.09817153,
0.0050856513,
-0.018094635,
-0.04385158,
0.06649695,
-0.037648164,
-0.006218895,
-0.037976924,
-0.0036204353,
-0.03149386,
0.031777944,
-0.011333557,
0.009081317,
0.022486951,
0.032106593,
0.023041077,
-0.06739943,
0.06294171,
-0.057333894,
-0.041295,
0.060841344,
0.03247397,
-0.05132725,
-0.04992364
],
"index": 0,
"object": "embedding"
}
],
"model": "all-minilm:l6-v2",
"object": "list",
"usage": {
"prompt_tokens": 3,
"total_tokens": 3
}
}
},
"is_streaming": false
}
}

View file

@ -0,0 +1,421 @@
{
"test_id": "tests/integration/inference/test_openai_embeddings.py::test_openai_embeddings_different_inputs_different_outputs[llama_stack_client-emb=ollama/all-minilm:l6-v2]",
"request": {
"method": "POST",
"url": "http://0.0.0.0:11434/v1/v1/embeddings",
"headers": {},
"body": {
"model": "all-minilm:l6-v2",
"input": "This is the first text",
"encoding_format": "float"
},
"endpoint": "/v1/embeddings",
"model": "all-minilm:l6-v2"
},
"response": {
"body": {
"__type__": "openai.types.create_embedding_response.CreateEmbeddingResponse",
"__data__": {
"data": [
{
"embedding": [
-0.0010839553,
0.067364,
0.015185306,
0.037240896,
0.029337138,
0.015160007,
0.0743005,
-0.0032980628,
0.06581814,
-0.021851996,
0.034412965,
0.051005766,
-0.011422501,
-0.025062356,
-0.051756065,
0.027193472,
0.07849549,
-0.05999108,
0.010471458,
-0.003400683,
0.043449093,
0.122919865,
9.668583e-05,
0.002153268,
0.018064681,
0.045069378,
-0.09762388,
0.11186886,
0.049657565,
-0.03485217,
-0.039568134,
0.003532146,
0.15894793,
0.06341193,
0.047953114,
0.011617699,
0.009799243,
0.015377702,
0.009379663,
0.079989135,
0.019207356,
-0.13718612,
0.01730099,
0.013687199,
0.014266827,
-0.00022628276,
-0.017710257,
0.02291068,
0.03590651,
-0.015361055,
-0.00978436,
-0.0401825,
-0.011481894,
0.00014050963,
0.08540761,
0.08730027,
0.0046967245,
0.006164595,
0.003031956,
0.008891807,
-0.006260525,
0.05061661,
0.0005252785,
0.0467754,
0.09363822,
-0.012814104,
0.017708639,
-0.062698044,
-0.11535818,
0.041123625,
-0.014939021,
0.044815876,
-0.020868087,
0.042999975,
-0.061038766,
0.019998673,
-0.068740115,
-0.035516046,
0.041884515,
0.012185281,
-0.029084096,
-0.06643917,
0.030638866,
0.05149607,
-0.12815061,
0.06821646,
-0.047070153,
-0.032925386,
0.007499353,
-0.017841771,
0.038296465,
-0.015792726,
0.07054022,
0.038072467,
-0.11428876,
0.04210153,
-0.11162366,
-0.045723915,
-0.028951947,
0.12735675,
-0.013946637,
-0.027157523,
0.07295939,
0.024098422,
-0.054050542,
-0.13125896,
0.03013205,
-0.023223283,
-0.019072957,
-0.007864101,
-0.021954412,
-0.05329901,
-0.07088355,
-0.0115214065,
-0.023399564,
-0.015638318,
0.05148062,
0.029261008,
0.06481798,
0.064031154,
0.014445124,
-0.058017716,
-0.069921836,
-0.023950975,
-0.08490842,
-0.08779567,
0.048162255,
-6.1240354e-33,
0.010315817,
0.038685724,
0.0031864564,
0.0357421,
0.0050265454,
-0.004210234,
-0.053900674,
-0.02988569,
-0.07548199,
-0.078777455,
-0.012271205,
-0.05056629,
0.020729113,
-0.051866043,
-0.059254467,
-0.059903424,
-0.055699438,
0.032196835,
-0.006328442,
-0.021668624,
-0.059921067,
0.0519611,
0.051227964,
-0.063502096,
-0.04873505,
-0.014265467,
0.0025537873,
-0.024346355,
-0.0055181426,
0.02007461,
-0.10196586,
0.010727814,
-0.023194604,
-0.081025146,
-0.014997581,
0.0017926424,
0.045078833,
-0.052792255,
-0.05368693,
-0.013245513,
-0.019808132,
0.020031843,
-0.00081401254,
-0.10117647,
-0.0007066768,
0.09663035,
-0.03946875,
0.04954661,
0.042237334,
0.007943922,
-0.05234212,
0.051887065,
0.03711589,
0.034850314,
0.063441575,
-0.026583876,
-0.009227281,
-0.0025737104,
-0.056082893,
0.0020716325,
-0.020129146,
0.0012315192,
-0.0017609745,
0.019111704,
0.016572498,
-0.011374,
0.010381644,
-0.007864189,
0.04664868,
-0.046856377,
-0.08523834,
-0.008974813,
0.012022968,
0.013285977,
0.015182303,
0.03708482,
0.026587088,
0.014473839,
-0.013946565,
0.01999883,
-0.06888259,
-0.07111367,
0.012369427,
0.032828625,
-0.03152666,
0.045777358,
0.06801705,
-0.07747748,
0.018461134,
0.06620267,
-0.086365156,
0.008950603,
0.041320425,
0.009541193,
0.0066037327,
4.71081e-33,
-0.026172558,
0.0013145636,
-0.014140948,
-0.024360213,
0.06931815,
0.031448748,
0.037257418,
0.06468137,
0.049403396,
0.11072201,
0.04985356,
0.06679111,
0.04153249,
-0.034106053,
0.070283465,
0.034855895,
0.12902643,
-0.021033453,
0.008940618,
0.030177405,
-0.022881329,
0.036504544,
-0.13194299,
0.045612644,
-0.0127895875,
0.04174139,
0.1232064,
-0.013484046,
-0.007285246,
-0.029776007,
0.025007037,
-0.009516822,
0.02475585,
0.023208592,
-0.019141924,
0.02259424,
0.013740329,
-0.038490705,
-0.014461541,
0.075218394,
0.13589163,
0.009839605,
-0.037563317,
-0.02737327,
-0.016485116,
-0.048845276,
-0.03523722,
-0.05439929,
-0.0017957076,
0.03563579,
-0.010255764,
-0.01859244,
-0.03647324,
-0.055985246,
-0.007833892,
0.009086756,
-0.007333394,
0.050386623,
-0.0002305643,
-0.03637248,
-0.024937423,
0.058877032,
-0.07250415,
0.07401245,
0.053917013,
-0.051895224,
-0.006332244,
0.07850189,
-0.01695057,
-0.006673017,
0.012659739,
-0.014127065,
-0.13639799,
-0.08524976,
-0.017533274,
-0.0046930755,
0.013687301,
0.0009185522,
-0.0719948,
-0.06887779,
0.14208324,
0.03187123,
-0.055919908,
0.030401653,
0.061900012,
0.029921472,
-0.00096237566,
-0.065010294,
-0.020657646,
0.039562404,
-0.123846576,
0.0028867351,
0.051196404,
0.13397509,
-0.088453874,
-1.7590333e-08,
-0.025786474,
-0.080303885,
-0.09164947,
0.031999,
0.00584884,
0.11464121,
0.023377793,
-0.06902527,
-0.055941124,
-0.05787791,
0.014640494,
0.080320895,
0.0037027278,
-0.030824674,
0.024432683,
0.008549355,
-0.05291309,
-0.06636625,
0.0007468212,
-0.02379191,
0.030766092,
0.054053318,
-0.0027251292,
-0.09928475,
-0.0150488615,
0.016240431,
-0.0015727071,
0.01190173,
0.007895162,
0.04894733,
0.00487708,
0.08263861,
-0.014527478,
-0.043879665,
0.004633697,
0.024611989,
0.023827499,
0.02366802,
0.050754935,
-0.051841788,
0.0212632,
-0.0034418616,
-0.021175656,
0.020591663,
-0.06475325,
0.0542002,
0.027792262,
-0.05295982,
0.01509645,
-0.11977527,
-0.03416359,
-0.012206606,
0.047451705,
0.020876253,
-0.026368074,
0.01502373,
0.033982284,
0.059788153,
-0.052526973,
0.03356499,
0.061180886,
0.096336305,
0.116353564,
-0.016122948
],
"index": 0,
"object": "embedding"
}
],
"model": "all-minilm:l6-v2",
"object": "list",
"usage": {
"prompt_tokens": 5,
"total_tokens": 5
}
}
},
"is_streaming": false
}
}

View file

@ -0,0 +1,78 @@
{
"test_id": "tests/integration/inference/test_openai_completion.py::test_openai_chat_completion_streaming[client_with_models-txt=ollama/llama3.2:3b-instruct-fp16-inference:chat_completion:streaming_01]",
"request": {
"method": "POST",
"url": "http://localhost:11434/api/ps",
"headers": {},
"body": {},
"endpoint": "/api/ps",
"model": ""
},
"response": {
"body": {
"__type__": "ollama._types.ProcessResponse",
"__data__": {
"models": [
{
"model": "llama3.2:3b-instruct-fp16",
"name": "llama3.2:3b-instruct-fp16",
"digest": "195a8c01d91ec3cb1e0aad4624a51f2602c51fa7d96110f8ab5a20c84081804d",
"expires_at": "2025-10-03T20:07:01.911896-07:00",
"size": 7919570944,
"size_vram": 7919570944,
"details": {
"parent_model": "",
"format": "gguf",
"family": "llama",
"families": [
"llama"
],
"parameter_size": "3.2B",
"quantization_level": "F16"
},
"context_length": 4096
},
{
"model": "all-minilm:l6-v2",
"name": "all-minilm:l6-v2",
"digest": "1b226e2802dbb772b5fc32a58f103ca1804ef7501331012de126ab22f67475ef",
"expires_at": "2025-10-03T20:06:55.533878-07:00",
"size": 585846784,
"size_vram": 585846784,
"details": {
"parent_model": "",
"format": "gguf",
"family": "bert",
"families": [
"bert"
],
"parameter_size": "23M",
"quantization_level": "F16"
},
"context_length": 256
},
{
"model": "llama-guard3:1b",
"name": "llama-guard3:1b",
"digest": "494147e06bf99e10dbe67b63a07ac81c162f18ef3341aa3390007ac828571b3b",
"expires_at": "2025-10-03T20:06:23.356289-07:00",
"size": 2350966784,
"size_vram": 2350966784,
"details": {
"parent_model": "",
"format": "gguf",
"family": "llama",
"families": [
"llama"
],
"parameter_size": "1.5B",
"quantization_level": "Q8_0"
},
"context_length": 4096
}
]
}
},
"is_streaming": false
}
}

View file

@ -0,0 +1,78 @@
{
"test_id": "tests/integration/inference/test_openai_completion.py::test_inference_store[client_with_models-txt=ollama/llama3.2:3b-instruct-fp16-True]",
"request": {
"method": "POST",
"url": "http://localhost:11434/api/ps",
"headers": {},
"body": {},
"endpoint": "/api/ps",
"model": ""
},
"response": {
"body": {
"__type__": "ollama._types.ProcessResponse",
"__data__": {
"models": [
{
"model": "llama3.2:3b-instruct-fp16",
"name": "llama3.2:3b-instruct-fp16",
"digest": "195a8c01d91ec3cb1e0aad4624a51f2602c51fa7d96110f8ab5a20c84081804d",
"expires_at": "2025-10-03T20:07:02.652559-07:00",
"size": 7919570944,
"size_vram": 7919570944,
"details": {
"parent_model": "",
"format": "gguf",
"family": "llama",
"families": [
"llama"
],
"parameter_size": "3.2B",
"quantization_level": "F16"
},
"context_length": 4096
},
{
"model": "all-minilm:l6-v2",
"name": "all-minilm:l6-v2",
"digest": "1b226e2802dbb772b5fc32a58f103ca1804ef7501331012de126ab22f67475ef",
"expires_at": "2025-10-03T20:06:55.533878-07:00",
"size": 585846784,
"size_vram": 585846784,
"details": {
"parent_model": "",
"format": "gguf",
"family": "bert",
"families": [
"bert"
],
"parameter_size": "23M",
"quantization_level": "F16"
},
"context_length": 256
},
{
"model": "llama-guard3:1b",
"name": "llama-guard3:1b",
"digest": "494147e06bf99e10dbe67b63a07ac81c162f18ef3341aa3390007ac828571b3b",
"expires_at": "2025-10-03T20:06:23.356289-07:00",
"size": 2350966784,
"size_vram": 2350966784,
"details": {
"parent_model": "",
"format": "gguf",
"family": "llama",
"families": [
"llama"
],
"parameter_size": "1.5B",
"quantization_level": "Q8_0"
},
"context_length": 4096
}
]
}
},
"is_streaming": false
}
}

View file

@ -0,0 +1,284 @@
{
"request": {
"method": "POST",
"url": "http://0.0.0.0:11434/v1/v1/chat/completions",
"headers": {},
"body": {
"model": "llama3.2:3b-instruct-fp16",
"messages": [
{
"role": "user",
"content": "Hello, world!"
}
],
"stream": true
},
"endpoint": "/v1/chat/completions",
"model": "llama3.2:3b-instruct-fp16"
},
"response": {
"body": [
{
"__type__": "openai.types.chat.chat_completion_chunk.ChatCompletionChunk",
"__data__": {
"id": "rec-6f96090aa955",
"choices": [
{
"delta": {
"content": "Hello",
"function_call": null,
"refusal": null,
"role": "assistant",
"tool_calls": null
},
"finish_reason": null,
"index": 0,
"logprobs": null
}
],
"created": 0,
"model": "llama3.2:3b-instruct-fp16",
"object": "chat.completion.chunk",
"service_tier": null,
"system_fingerprint": "fp_ollama",
"usage": null
}
},
{
"__type__": "openai.types.chat.chat_completion_chunk.ChatCompletionChunk",
"__data__": {
"id": "rec-6f96090aa955",
"choices": [
{
"delta": {
"content": "!",
"function_call": null,
"refusal": null,
"role": "assistant",
"tool_calls": null
},
"finish_reason": null,
"index": 0,
"logprobs": null
}
],
"created": 0,
"model": "llama3.2:3b-instruct-fp16",
"object": "chat.completion.chunk",
"service_tier": null,
"system_fingerprint": "fp_ollama",
"usage": null
}
},
{
"__type__": "openai.types.chat.chat_completion_chunk.ChatCompletionChunk",
"__data__": {
"id": "rec-6f96090aa955",
"choices": [
{
"delta": {
"content": " How",
"function_call": null,
"refusal": null,
"role": "assistant",
"tool_calls": null
},
"finish_reason": null,
"index": 0,
"logprobs": null
}
],
"created": 0,
"model": "llama3.2:3b-instruct-fp16",
"object": "chat.completion.chunk",
"service_tier": null,
"system_fingerprint": "fp_ollama",
"usage": null
}
},
{
"__type__": "openai.types.chat.chat_completion_chunk.ChatCompletionChunk",
"__data__": {
"id": "rec-6f96090aa955",
"choices": [
{
"delta": {
"content": " can",
"function_call": null,
"refusal": null,
"role": "assistant",
"tool_calls": null
},
"finish_reason": null,
"index": 0,
"logprobs": null
}
],
"created": 0,
"model": "llama3.2:3b-instruct-fp16",
"object": "chat.completion.chunk",
"service_tier": null,
"system_fingerprint": "fp_ollama",
"usage": null
}
},
{
"__type__": "openai.types.chat.chat_completion_chunk.ChatCompletionChunk",
"__data__": {
"id": "rec-6f96090aa955",
"choices": [
{
"delta": {
"content": " I",
"function_call": null,
"refusal": null,
"role": "assistant",
"tool_calls": null
},
"finish_reason": null,
"index": 0,
"logprobs": null
}
],
"created": 0,
"model": "llama3.2:3b-instruct-fp16",
"object": "chat.completion.chunk",
"service_tier": null,
"system_fingerprint": "fp_ollama",
"usage": null
}
},
{
"__type__": "openai.types.chat.chat_completion_chunk.ChatCompletionChunk",
"__data__": {
"id": "rec-6f96090aa955",
"choices": [
{
"delta": {
"content": " assist",
"function_call": null,
"refusal": null,
"role": "assistant",
"tool_calls": null
},
"finish_reason": null,
"index": 0,
"logprobs": null
}
],
"created": 0,
"model": "llama3.2:3b-instruct-fp16",
"object": "chat.completion.chunk",
"service_tier": null,
"system_fingerprint": "fp_ollama",
"usage": null
}
},
{
"__type__": "openai.types.chat.chat_completion_chunk.ChatCompletionChunk",
"__data__": {
"id": "rec-6f96090aa955",
"choices": [
{
"delta": {
"content": " you",
"function_call": null,
"refusal": null,
"role": "assistant",
"tool_calls": null
},
"finish_reason": null,
"index": 0,
"logprobs": null
}
],
"created": 0,
"model": "llama3.2:3b-instruct-fp16",
"object": "chat.completion.chunk",
"service_tier": null,
"system_fingerprint": "fp_ollama",
"usage": null
}
},
{
"__type__": "openai.types.chat.chat_completion_chunk.ChatCompletionChunk",
"__data__": {
"id": "rec-6f96090aa955",
"choices": [
{
"delta": {
"content": " today",
"function_call": null,
"refusal": null,
"role": "assistant",
"tool_calls": null
},
"finish_reason": null,
"index": 0,
"logprobs": null
}
],
"created": 0,
"model": "llama3.2:3b-instruct-fp16",
"object": "chat.completion.chunk",
"service_tier": null,
"system_fingerprint": "fp_ollama",
"usage": null
}
},
{
"__type__": "openai.types.chat.chat_completion_chunk.ChatCompletionChunk",
"__data__": {
"id": "rec-6f96090aa955",
"choices": [
{
"delta": {
"content": "?",
"function_call": null,
"refusal": null,
"role": "assistant",
"tool_calls": null
},
"finish_reason": null,
"index": 0,
"logprobs": null
}
],
"created": 0,
"model": "llama3.2:3b-instruct-fp16",
"object": "chat.completion.chunk",
"service_tier": null,
"system_fingerprint": "fp_ollama",
"usage": null
}
},
{
"__type__": "openai.types.chat.chat_completion_chunk.ChatCompletionChunk",
"__data__": {
"id": "rec-6f96090aa955",
"choices": [
{
"delta": {
"content": "",
"function_call": null,
"refusal": null,
"role": "assistant",
"tool_calls": null
},
"finish_reason": "stop",
"index": 0,
"logprobs": null
}
],
"created": 0,
"model": "llama3.2:3b-instruct-fp16",
"object": "chat.completion.chunk",
"service_tier": null,
"system_fingerprint": "fp_ollama",
"usage": null
}
}
],
"is_streaming": true
}
}

View file

@ -0,0 +1,40 @@
{
"test_id": "tests/integration/inference/test_openai_completion.py::test_openai_chat_completion_non_streaming[client_with_models-txt=ollama/llama3.2:3b-instruct-fp16-inference:chat_completion:non_streaming_01]",
"request": {
"method": "POST",
"url": "http://localhost:11434/api/ps",
"headers": {},
"body": {},
"endpoint": "/api/ps",
"model": ""
},
"response": {
"body": {
"__type__": "ollama._types.ProcessResponse",
"__data__": {
"models": [
{
"model": "llama3.2:3b",
"name": "llama3.2:3b",
"digest": "a80c4f17acd55265feec403c7aef86be0c25983ab279d83f3bcd3abbcb5b8b72",
"expires_at": "2025-10-04T12:20:09.202126-07:00",
"size": 3367856128,
"size_vram": 3367856128,
"details": {
"parent_model": "",
"format": "gguf",
"family": "llama",
"families": [
"llama"
],
"parameter_size": "3.2B",
"quantization_level": "Q4_K_M"
},
"context_length": 4096
}
]
}
},
"is_streaming": false
}
}

View file

@ -0,0 +1,59 @@
{
"test_id": "tests/integration/inference/test_openai_completion.py::test_openai_chat_completion_non_streaming[client_with_models-txt=ollama/llama3.2:3b-instruct-fp16-inference:chat_completion:non_streaming_02]",
"request": {
"method": "POST",
"url": "http://localhost:11434/api/ps",
"headers": {},
"body": {},
"endpoint": "/api/ps",
"model": ""
},
"response": {
"body": {
"__type__": "ollama._types.ProcessResponse",
"__data__": {
"models": [
{
"model": "llama3.2:3b",
"name": "llama3.2:3b",
"digest": "a80c4f17acd55265feec403c7aef86be0c25983ab279d83f3bcd3abbcb5b8b72",
"expires_at": "2025-10-04T12:20:09.202126-07:00",
"size": 3367856128,
"size_vram": 3367856128,
"details": {
"parent_model": "",
"format": "gguf",
"family": "llama",
"families": [
"llama"
],
"parameter_size": "3.2B",
"quantization_level": "Q4_K_M"
},
"context_length": 4096
},
{
"model": "llama3.2:3b-instruct-fp16",
"name": "llama3.2:3b-instruct-fp16",
"digest": "195a8c01d91ec3cb1e0aad4624a51f2602c51fa7d96110f8ab5a20c84081804d",
"expires_at": "2025-10-04T11:27:25.408562-07:00",
"size": 7919570944,
"size_vram": 7919570944,
"details": {
"parent_model": "",
"format": "gguf",
"family": "llama",
"families": [
"llama"
],
"parameter_size": "3.2B",
"quantization_level": "F16"
},
"context_length": 4096
}
]
}
},
"is_streaming": false
}
}

View file

@ -0,0 +1,284 @@
{
"request": {
"method": "POST",
"url": "http://0.0.0.0:11434/v1/v1/completions",
"headers": {},
"body": {
"model": "llama3.2:3b-instruct-fp16",
"messages": [
{
"role": "user",
"content": "What's the name of the Sun in latin?"
}
],
"stream": true
},
"endpoint": "/v1/completions",
"model": "llama3.2:3b-instruct-fp16"
},
"response": {
"body": [
{
"__type__": "openai.types.chat.chat_completion_chunk.ChatCompletionChunk",
"__data__": {
"id": "rec-12913f20f6ac",
"choices": [
{
"delta": {
"content": "The",
"function_call": null,
"refusal": null,
"role": "assistant",
"tool_calls": null
},
"finish_reason": null,
"index": 0,
"logprobs": null
}
],
"created": 0,
"model": "llama3.2:3b-instruct-fp16",
"object": "chat.completion.chunk",
"service_tier": null,
"system_fingerprint": "fp_ollama",
"usage": null
}
},
{
"__type__": "openai.types.chat.chat_completion_chunk.ChatCompletionChunk",
"__data__": {
"id": "rec-12913f20f6ac",
"choices": [
{
"delta": {
"content": " Latin",
"function_call": null,
"refusal": null,
"role": "assistant",
"tool_calls": null
},
"finish_reason": null,
"index": 0,
"logprobs": null
}
],
"created": 0,
"model": "llama3.2:3b-instruct-fp16",
"object": "chat.completion.chunk",
"service_tier": null,
"system_fingerprint": "fp_ollama",
"usage": null
}
},
{
"__type__": "openai.types.chat.chat_completion_chunk.ChatCompletionChunk",
"__data__": {
"id": "rec-12913f20f6ac",
"choices": [
{
"delta": {
"content": " name",
"function_call": null,
"refusal": null,
"role": "assistant",
"tool_calls": null
},
"finish_reason": null,
"index": 0,
"logprobs": null
}
],
"created": 0,
"model": "llama3.2:3b-instruct-fp16",
"object": "chat.completion.chunk",
"service_tier": null,
"system_fingerprint": "fp_ollama",
"usage": null
}
},
{
"__type__": "openai.types.chat.chat_completion_chunk.ChatCompletionChunk",
"__data__": {
"id": "rec-12913f20f6ac",
"choices": [
{
"delta": {
"content": " for",
"function_call": null,
"refusal": null,
"role": "assistant",
"tool_calls": null
},
"finish_reason": null,
"index": 0,
"logprobs": null
}
],
"created": 0,
"model": "llama3.2:3b-instruct-fp16",
"object": "chat.completion.chunk",
"service_tier": null,
"system_fingerprint": "fp_ollama",
"usage": null
}
},
{
"__type__": "openai.types.chat.chat_completion_chunk.ChatCompletionChunk",
"__data__": {
"id": "rec-12913f20f6ac",
"choices": [
{
"delta": {
"content": " the",
"function_call": null,
"refusal": null,
"role": "assistant",
"tool_calls": null
},
"finish_reason": null,
"index": 0,
"logprobs": null
}
],
"created": 0,
"model": "llama3.2:3b-instruct-fp16",
"object": "chat.completion.chunk",
"service_tier": null,
"system_fingerprint": "fp_ollama",
"usage": null
}
},
{
"__type__": "openai.types.chat.chat_completion_chunk.ChatCompletionChunk",
"__data__": {
"id": "rec-12913f20f6ac",
"choices": [
{
"delta": {
"content": " Sun",
"function_call": null,
"refusal": null,
"role": "assistant",
"tool_calls": null
},
"finish_reason": null,
"index": 0,
"logprobs": null
}
],
"created": 0,
"model": "llama3.2:3b-instruct-fp16",
"object": "chat.completion.chunk",
"service_tier": null,
"system_fingerprint": "fp_ollama",
"usage": null
}
},
{
"__type__": "openai.types.chat.chat_completion_chunk.ChatCompletionChunk",
"__data__": {
"id": "rec-12913f20f6ac",
"choices": [
{
"delta": {
"content": " is",
"function_call": null,
"refusal": null,
"role": "assistant",
"tool_calls": null
},
"finish_reason": null,
"index": 0,
"logprobs": null
}
],
"created": 0,
"model": "llama3.2:3b-instruct-fp16",
"object": "chat.completion.chunk",
"service_tier": null,
"system_fingerprint": "fp_ollama",
"usage": null
}
},
{
"__type__": "openai.types.chat.chat_completion_chunk.ChatCompletionChunk",
"__data__": {
"id": "rec-12913f20f6ac",
"choices": [
{
"delta": {
"content": " Sol",
"function_call": null,
"refusal": null,
"role": "assistant",
"tool_calls": null
},
"finish_reason": null,
"index": 0,
"logprobs": null
}
],
"created": 0,
"model": "llama3.2:3b-instruct-fp16",
"object": "chat.completion.chunk",
"service_tier": null,
"system_fingerprint": "fp_ollama",
"usage": null
}
},
{
"__type__": "openai.types.chat.chat_completion_chunk.ChatCompletionChunk",
"__data__": {
"id": "rec-12913f20f6ac",
"choices": [
{
"delta": {
"content": ".",
"function_call": null,
"refusal": null,
"role": "assistant",
"tool_calls": null
},
"finish_reason": null,
"index": 0,
"logprobs": null
}
],
"created": 0,
"model": "llama3.2:3b-instruct-fp16",
"object": "chat.completion.chunk",
"service_tier": null,
"system_fingerprint": "fp_ollama",
"usage": null
}
},
{
"__type__": "openai.types.chat.chat_completion_chunk.ChatCompletionChunk",
"__data__": {
"id": "rec-12913f20f6ac",
"choices": [
{
"delta": {
"content": "",
"function_call": null,
"refusal": null,
"role": "assistant",
"tool_calls": null
},
"finish_reason": "stop",
"index": 0,
"logprobs": null
}
],
"created": 0,
"model": "llama3.2:3b-instruct-fp16",
"object": "chat.completion.chunk",
"service_tier": null,
"system_fingerprint": "fp_ollama",
"usage": null
}
}
],
"is_streaming": true
}
}

View file

@ -0,0 +1,93 @@
{
"request": {
"method": "POST",
"url": "http://0.0.0.0:11434/v1/v1/chat/completions",
"headers": {},
"body": {
"model": "llama3.2:3b-instruct-fp16",
"messages": [
{
"role": "user",
"content": "What time is it in UTC?"
}
],
"stream": true,
"tools": [
{
"type": "function",
"function": {
"name": "get_time",
"description": "Get current time",
"parameters": {
"type": "object",
"properties": {
"timezone": {
"type": "string"
}
}
}
}
}
]
},
"endpoint": "/v1/chat/completions",
"model": "llama3.2:3b-instruct-fp16"
},
"response": {
"body": [
{
"__type__": "openai.types.chat.chat_completion_chunk.ChatCompletionChunk",
"__data__": {
"id": "rec-0fad19b9d308",
"choices": [
{
"delta": {
"content": "{\"name\":\"get_time\",\"parameters\\\":{\\\"timezone\\\":\\\"UTC\\\"}}",
"function_call": null,
"refusal": null,
"role": "assistant",
"tool_calls": null
},
"finish_reason": null,
"index": 0,
"logprobs": null
}
],
"created": 0,
"model": "llama3.2:3b-instruct-fp16",
"object": "chat.completion.chunk",
"service_tier": null,
"system_fingerprint": "fp_ollama",
"usage": null
}
},
{
"__type__": "openai.types.chat.chat_completion_chunk.ChatCompletionChunk",
"__data__": {
"id": "rec-0fad19b9d308",
"choices": [
{
"delta": {
"content": "",
"function_call": null,
"refusal": null,
"role": "assistant",
"tool_calls": null
},
"finish_reason": "stop",
"index": 0,
"logprobs": null
}
],
"created": 0,
"model": "llama3.2:3b-instruct-fp16",
"object": "chat.completion.chunk",
"service_tier": null,
"system_fingerprint": "fp_ollama",
"usage": null
}
}
],
"is_streaming": true
}
}

View file

@ -0,0 +1,544 @@
{
"request": {
"method": "POST",
"url": "http://0.0.0.0:11434/v1/v1/chat/completions",
"headers": {},
"body": {
"model": "llama3.2:3b-instruct-fp16",
"messages": [
{
"role": "user",
"content": "What is the name of the US captial?"
}
],
"stream": true
},
"endpoint": "/v1/chat/completions",
"model": "llama3.2:3b-instruct-fp16"
},
"response": {
"body": [
{
"__type__": "openai.types.chat.chat_completion_chunk.ChatCompletionChunk",
"__data__": {
"id": "rec-325a72db5755",
"choices": [
{
"delta": {
"content": "The",
"function_call": null,
"refusal": null,
"role": "assistant",
"tool_calls": null
},
"finish_reason": null,
"index": 0,
"logprobs": null
}
],
"created": 0,
"model": "llama3.2:3b-instruct-fp16",
"object": "chat.completion.chunk",
"service_tier": null,
"system_fingerprint": "fp_ollama",
"usage": null
}
},
{
"__type__": "openai.types.chat.chat_completion_chunk.ChatCompletionChunk",
"__data__": {
"id": "rec-325a72db5755",
"choices": [
{
"delta": {
"content": " capital",
"function_call": null,
"refusal": null,
"role": "assistant",
"tool_calls": null
},
"finish_reason": null,
"index": 0,
"logprobs": null
}
],
"created": 0,
"model": "llama3.2:3b-instruct-fp16",
"object": "chat.completion.chunk",
"service_tier": null,
"system_fingerprint": "fp_ollama",
"usage": null
}
},
{
"__type__": "openai.types.chat.chat_completion_chunk.ChatCompletionChunk",
"__data__": {
"id": "rec-325a72db5755",
"choices": [
{
"delta": {
"content": " of",
"function_call": null,
"refusal": null,
"role": "assistant",
"tool_calls": null
},
"finish_reason": null,
"index": 0,
"logprobs": null
}
],
"created": 0,
"model": "llama3.2:3b-instruct-fp16",
"object": "chat.completion.chunk",
"service_tier": null,
"system_fingerprint": "fp_ollama",
"usage": null
}
},
{
"__type__": "openai.types.chat.chat_completion_chunk.ChatCompletionChunk",
"__data__": {
"id": "rec-325a72db5755",
"choices": [
{
"delta": {
"content": " the",
"function_call": null,
"refusal": null,
"role": "assistant",
"tool_calls": null
},
"finish_reason": null,
"index": 0,
"logprobs": null
}
],
"created": 0,
"model": "llama3.2:3b-instruct-fp16",
"object": "chat.completion.chunk",
"service_tier": null,
"system_fingerprint": "fp_ollama",
"usage": null
}
},
{
"__type__": "openai.types.chat.chat_completion_chunk.ChatCompletionChunk",
"__data__": {
"id": "rec-325a72db5755",
"choices": [
{
"delta": {
"content": " United",
"function_call": null,
"refusal": null,
"role": "assistant",
"tool_calls": null
},
"finish_reason": null,
"index": 0,
"logprobs": null
}
],
"created": 0,
"model": "llama3.2:3b-instruct-fp16",
"object": "chat.completion.chunk",
"service_tier": null,
"system_fingerprint": "fp_ollama",
"usage": null
}
},
{
"__type__": "openai.types.chat.chat_completion_chunk.ChatCompletionChunk",
"__data__": {
"id": "rec-325a72db5755",
"choices": [
{
"delta": {
"content": " States",
"function_call": null,
"refusal": null,
"role": "assistant",
"tool_calls": null
},
"finish_reason": null,
"index": 0,
"logprobs": null
}
],
"created": 0,
"model": "llama3.2:3b-instruct-fp16",
"object": "chat.completion.chunk",
"service_tier": null,
"system_fingerprint": "fp_ollama",
"usage": null
}
},
{
"__type__": "openai.types.chat.chat_completion_chunk.ChatCompletionChunk",
"__data__": {
"id": "rec-325a72db5755",
"choices": [
{
"delta": {
"content": " is",
"function_call": null,
"refusal": null,
"role": "assistant",
"tool_calls": null
},
"finish_reason": null,
"index": 0,
"logprobs": null
}
],
"created": 0,
"model": "llama3.2:3b-instruct-fp16",
"object": "chat.completion.chunk",
"service_tier": null,
"system_fingerprint": "fp_ollama",
"usage": null
}
},
{
"__type__": "openai.types.chat.chat_completion_chunk.ChatCompletionChunk",
"__data__": {
"id": "rec-325a72db5755",
"choices": [
{
"delta": {
"content": " Washington",
"function_call": null,
"refusal": null,
"role": "assistant",
"tool_calls": null
},
"finish_reason": null,
"index": 0,
"logprobs": null
}
],
"created": 0,
"model": "llama3.2:3b-instruct-fp16",
"object": "chat.completion.chunk",
"service_tier": null,
"system_fingerprint": "fp_ollama",
"usage": null
}
},
{
"__type__": "openai.types.chat.chat_completion_chunk.ChatCompletionChunk",
"__data__": {
"id": "rec-325a72db5755",
"choices": [
{
"delta": {
"content": ",",
"function_call": null,
"refusal": null,
"role": "assistant",
"tool_calls": null
},
"finish_reason": null,
"index": 0,
"logprobs": null
}
],
"created": 0,
"model": "llama3.2:3b-instruct-fp16",
"object": "chat.completion.chunk",
"service_tier": null,
"system_fingerprint": "fp_ollama",
"usage": null
}
},
{
"__type__": "openai.types.chat.chat_completion_chunk.ChatCompletionChunk",
"__data__": {
"id": "rec-325a72db5755",
"choices": [
{
"delta": {
"content": " D",
"function_call": null,
"refusal": null,
"role": "assistant",
"tool_calls": null
},
"finish_reason": null,
"index": 0,
"logprobs": null
}
],
"created": 0,
"model": "llama3.2:3b-instruct-fp16",
"object": "chat.completion.chunk",
"service_tier": null,
"system_fingerprint": "fp_ollama",
"usage": null
}
},
{
"__type__": "openai.types.chat.chat_completion_chunk.ChatCompletionChunk",
"__data__": {
"id": "rec-325a72db5755",
"choices": [
{
"delta": {
"content": ".C",
"function_call": null,
"refusal": null,
"role": "assistant",
"tool_calls": null
},
"finish_reason": null,
"index": 0,
"logprobs": null
}
],
"created": 0,
"model": "llama3.2:3b-instruct-fp16",
"object": "chat.completion.chunk",
"service_tier": null,
"system_fingerprint": "fp_ollama",
"usage": null
}
},
{
"__type__": "openai.types.chat.chat_completion_chunk.ChatCompletionChunk",
"__data__": {
"id": "rec-325a72db5755",
"choices": [
{
"delta": {
"content": ".",
"function_call": null,
"refusal": null,
"role": "assistant",
"tool_calls": null
},
"finish_reason": null,
"index": 0,
"logprobs": null
}
],
"created": 0,
"model": "llama3.2:3b-instruct-fp16",
"object": "chat.completion.chunk",
"service_tier": null,
"system_fingerprint": "fp_ollama",
"usage": null
}
},
{
"__type__": "openai.types.chat.chat_completion_chunk.ChatCompletionChunk",
"__data__": {
"id": "rec-325a72db5755",
"choices": [
{
"delta": {
"content": " (",
"function_call": null,
"refusal": null,
"role": "assistant",
"tool_calls": null
},
"finish_reason": null,
"index": 0,
"logprobs": null
}
],
"created": 0,
"model": "llama3.2:3b-instruct-fp16",
"object": "chat.completion.chunk",
"service_tier": null,
"system_fingerprint": "fp_ollama",
"usage": null
}
},
{
"__type__": "openai.types.chat.chat_completion_chunk.ChatCompletionChunk",
"__data__": {
"id": "rec-325a72db5755",
"choices": [
{
"delta": {
"content": "short",
"function_call": null,
"refusal": null,
"role": "assistant",
"tool_calls": null
},
"finish_reason": null,
"index": 0,
"logprobs": null
}
],
"created": 0,
"model": "llama3.2:3b-instruct-fp16",
"object": "chat.completion.chunk",
"service_tier": null,
"system_fingerprint": "fp_ollama",
"usage": null
}
},
{
"__type__": "openai.types.chat.chat_completion_chunk.ChatCompletionChunk",
"__data__": {
"id": "rec-325a72db5755",
"choices": [
{
"delta": {
"content": " for",
"function_call": null,
"refusal": null,
"role": "assistant",
"tool_calls": null
},
"finish_reason": null,
"index": 0,
"logprobs": null
}
],
"created": 0,
"model": "llama3.2:3b-instruct-fp16",
"object": "chat.completion.chunk",
"service_tier": null,
"system_fingerprint": "fp_ollama",
"usage": null
}
},
{
"__type__": "openai.types.chat.chat_completion_chunk.ChatCompletionChunk",
"__data__": {
"id": "rec-325a72db5755",
"choices": [
{
"delta": {
"content": " District",
"function_call": null,
"refusal": null,
"role": "assistant",
"tool_calls": null
},
"finish_reason": null,
"index": 0,
"logprobs": null
}
],
"created": 0,
"model": "llama3.2:3b-instruct-fp16",
"object": "chat.completion.chunk",
"service_tier": null,
"system_fingerprint": "fp_ollama",
"usage": null
}
},
{
"__type__": "openai.types.chat.chat_completion_chunk.ChatCompletionChunk",
"__data__": {
"id": "rec-325a72db5755",
"choices": [
{
"delta": {
"content": " of",
"function_call": null,
"refusal": null,
"role": "assistant",
"tool_calls": null
},
"finish_reason": null,
"index": 0,
"logprobs": null
}
],
"created": 0,
"model": "llama3.2:3b-instruct-fp16",
"object": "chat.completion.chunk",
"service_tier": null,
"system_fingerprint": "fp_ollama",
"usage": null
}
},
{
"__type__": "openai.types.chat.chat_completion_chunk.ChatCompletionChunk",
"__data__": {
"id": "rec-325a72db5755",
"choices": [
{
"delta": {
"content": " Columbia",
"function_call": null,
"refusal": null,
"role": "assistant",
"tool_calls": null
},
"finish_reason": null,
"index": 0,
"logprobs": null
}
],
"created": 0,
"model": "llama3.2:3b-instruct-fp16",
"object": "chat.completion.chunk",
"service_tier": null,
"system_fingerprint": "fp_ollama",
"usage": null
}
},
{
"__type__": "openai.types.chat.chat_completion_chunk.ChatCompletionChunk",
"__data__": {
"id": "rec-325a72db5755",
"choices": [
{
"delta": {
"content": ").",
"function_call": null,
"refusal": null,
"role": "assistant",
"tool_calls": null
},
"finish_reason": null,
"index": 0,
"logprobs": null
}
],
"created": 0,
"model": "llama3.2:3b-instruct-fp16",
"object": "chat.completion.chunk",
"service_tier": null,
"system_fingerprint": "fp_ollama",
"usage": null
}
},
{
"__type__": "openai.types.chat.chat_completion_chunk.ChatCompletionChunk",
"__data__": {
"id": "rec-325a72db5755",
"choices": [
{
"delta": {
"content": "",
"function_call": null,
"refusal": null,
"role": "assistant",
"tool_calls": null
},
"finish_reason": "stop",
"index": 0,
"logprobs": null
}
],
"created": 0,
"model": "llama3.2:3b-instruct-fp16",
"object": "chat.completion.chunk",
"service_tier": null,
"system_fingerprint": "fp_ollama",
"usage": null
}
}
],
"is_streaming": true
}
}

View file

@ -0,0 +1,78 @@
{
"test_id": "tests/integration/inference/test_openai_completion.py::test_inference_store_tool_calls[client_with_models-txt=ollama/llama3.2:3b-instruct-fp16-True]",
"request": {
"method": "POST",
"url": "http://localhost:11434/api/ps",
"headers": {},
"body": {},
"endpoint": "/api/ps",
"model": ""
},
"response": {
"body": {
"__type__": "ollama._types.ProcessResponse",
"__data__": {
"models": [
{
"model": "llama3.2:3b-instruct-fp16",
"name": "llama3.2:3b-instruct-fp16",
"digest": "195a8c01d91ec3cb1e0aad4624a51f2602c51fa7d96110f8ab5a20c84081804d",
"expires_at": "2025-10-03T20:07:03.361039-07:00",
"size": 7919570944,
"size_vram": 7919570944,
"details": {
"parent_model": "",
"format": "gguf",
"family": "llama",
"families": [
"llama"
],
"parameter_size": "3.2B",
"quantization_level": "F16"
},
"context_length": 4096
},
{
"model": "all-minilm:l6-v2",
"name": "all-minilm:l6-v2",
"digest": "1b226e2802dbb772b5fc32a58f103ca1804ef7501331012de126ab22f67475ef",
"expires_at": "2025-10-03T20:06:55.533878-07:00",
"size": 585846784,
"size_vram": 585846784,
"details": {
"parent_model": "",
"format": "gguf",
"family": "bert",
"families": [
"bert"
],
"parameter_size": "23M",
"quantization_level": "F16"
},
"context_length": 256
},
{
"model": "llama-guard3:1b",
"name": "llama-guard3:1b",
"digest": "494147e06bf99e10dbe67b63a07ac81c162f18ef3341aa3390007ac828571b3b",
"expires_at": "2025-10-03T20:06:23.356289-07:00",
"size": 2350966784,
"size_vram": 2350966784,
"details": {
"parent_model": "",
"format": "gguf",
"family": "llama",
"families": [
"llama"
],
"parameter_size": "1.5B",
"quantization_level": "Q8_0"
},
"context_length": 4096
}
]
}
},
"is_streaming": false
}
}

View file

@ -0,0 +1,84 @@
{
"request": {
"method": "POST",
"url": "http://0.0.0.0:11434/v1/v1/completions",
"headers": {},
"body": {
"model": "llama3.2:3b-instruct-fp16",
"messages": [
{
"role": "user",
"content": "What's the weather in Tokyo? Use the get_weather function to get the weather."
}
],
"stream": false,
"tools": [
{
"type": "function",
"function": {
"name": "get_weather",
"description": "Get the weather in a given city",
"parameters": {
"type": "object",
"properties": {
"city": {
"type": "string",
"description": "The city to get the weather for"
}
}
}
}
}
]
},
"endpoint": "/v1/completions",
"model": "llama3.2:3b-instruct-fp16"
},
"response": {
"body": {
"__type__": "openai.types.chat.chat_completion.ChatCompletion",
"__data__": {
"id": "rec-35db283fef1d",
"choices": [
{
"finish_reason": "tool_calls",
"index": 0,
"logprobs": null,
"message": {
"content": "",
"refusal": null,
"role": "assistant",
"annotations": null,
"audio": null,
"function_call": null,
"tool_calls": [
{
"id": "call_99dd5wna",
"function": {
"arguments": "{\"city\":\"Tokyo\"}",
"name": "get_weather"
},
"type": "function",
"index": 0
}
]
}
}
],
"created": 0,
"model": "llama3.2:3b-instruct-fp16",
"object": "chat.completion",
"service_tier": null,
"system_fingerprint": "fp_ollama",
"usage": {
"completion_tokens": 15,
"prompt_tokens": 177,
"total_tokens": 192,
"completion_tokens_details": null,
"prompt_tokens_details": null
}
}
},
"is_streaming": false
}
}

View file

@ -0,0 +1,78 @@
{
"test_id": "tests/integration/inference/test_openai_completion.py::test_inference_store_tool_calls[client_with_models-txt=ollama/llama3.2:3b-instruct-fp16-False]",
"request": {
"method": "POST",
"url": "http://localhost:11434/api/ps",
"headers": {},
"body": {},
"endpoint": "/api/ps",
"model": ""
},
"response": {
"body": {
"__type__": "ollama._types.ProcessResponse",
"__data__": {
"models": [
{
"model": "llama3.2:3b-instruct-fp16",
"name": "llama3.2:3b-instruct-fp16",
"digest": "195a8c01d91ec3cb1e0aad4624a51f2602c51fa7d96110f8ab5a20c84081804d",
"expires_at": "2025-10-03T20:07:08.369100-07:00",
"size": 7919570944,
"size_vram": 7919570944,
"details": {
"parent_model": "",
"format": "gguf",
"family": "llama",
"families": [
"llama"
],
"parameter_size": "3.2B",
"quantization_level": "F16"
},
"context_length": 4096
},
{
"model": "all-minilm:l6-v2",
"name": "all-minilm:l6-v2",
"digest": "1b226e2802dbb772b5fc32a58f103ca1804ef7501331012de126ab22f67475ef",
"expires_at": "2025-10-03T20:06:55.533878-07:00",
"size": 585846784,
"size_vram": 585846784,
"details": {
"parent_model": "",
"format": "gguf",
"family": "bert",
"families": [
"bert"
],
"parameter_size": "23M",
"quantization_level": "F16"
},
"context_length": 256
},
{
"model": "llama-guard3:1b",
"name": "llama-guard3:1b",
"digest": "494147e06bf99e10dbe67b63a07ac81c162f18ef3341aa3390007ac828571b3b",
"expires_at": "2025-10-03T20:06:23.356289-07:00",
"size": 2350966784,
"size_vram": 2350966784,
"details": {
"parent_model": "",
"format": "gguf",
"family": "llama",
"families": [
"llama"
],
"parameter_size": "1.5B",
"quantization_level": "Q8_0"
},
"context_length": 4096
}
]
}
},
"is_streaming": false
}
}

View file

@ -0,0 +1,78 @@
{
"test_id": "tests/integration/inference/test_openai_embeddings.py::test_openai_embeddings_different_inputs_different_outputs[llama_stack_client-emb=ollama/all-minilm:l6-v2]",
"request": {
"method": "POST",
"url": "http://localhost:11434/api/ps",
"headers": {},
"body": {},
"endpoint": "/api/ps",
"model": ""
},
"response": {
"body": {
"__type__": "ollama._types.ProcessResponse",
"__data__": {
"models": [
{
"model": "all-minilm:l6-v2",
"name": "all-minilm:l6-v2",
"digest": "1b226e2802dbb772b5fc32a58f103ca1804ef7501331012de126ab22f67475ef",
"expires_at": "2025-10-03T20:06:55.330036-07:00",
"size": 585846784,
"size_vram": 585846784,
"details": {
"parent_model": "",
"format": "gguf",
"family": "bert",
"families": [
"bert"
],
"parameter_size": "23M",
"quantization_level": "F16"
},
"context_length": 256
},
{
"model": "llama3.2:3b-instruct-fp16",
"name": "llama3.2:3b-instruct-fp16",
"digest": "195a8c01d91ec3cb1e0aad4624a51f2602c51fa7d96110f8ab5a20c84081804d",
"expires_at": "2025-10-03T20:06:54.261283-07:00",
"size": 7919570944,
"size_vram": 7919570944,
"details": {
"parent_model": "",
"format": "gguf",
"family": "llama",
"families": [
"llama"
],
"parameter_size": "3.2B",
"quantization_level": "F16"
},
"context_length": 4096
},
{
"model": "llama-guard3:1b",
"name": "llama-guard3:1b",
"digest": "494147e06bf99e10dbe67b63a07ac81c162f18ef3341aa3390007ac828571b3b",
"expires_at": "2025-10-03T20:06:23.356289-07:00",
"size": 2350966784,
"size_vram": 2350966784,
"details": {
"parent_model": "",
"format": "gguf",
"family": "llama",
"families": [
"llama"
],
"parameter_size": "1.5B",
"quantization_level": "Q8_0"
},
"context_length": 4096
}
]
}
},
"is_streaming": false
}
}

View file

@ -0,0 +1,40 @@
{
"test_id": "tests/integration/inference/test_openai_completion.py::test_openai_completion_non_streaming_suffix[txt=ollama/llama3.2:3b-instruct-fp16-inference:completion:suffix]",
"request": {
"method": "POST",
"url": "http://localhost:11434/api/ps",
"headers": {},
"body": {},
"endpoint": "/api/ps",
"model": ""
},
"response": {
"body": {
"__type__": "ollama._types.ProcessResponse",
"__data__": {
"models": [
{
"model": "llama3.2:3b-instruct-fp16",
"name": "llama3.2:3b-instruct-fp16",
"digest": "195a8c01d91ec3cb1e0aad4624a51f2602c51fa7d96110f8ab5a20c84081804d",
"expires_at": "2025-10-03T20:05:44.851615-07:00",
"size": 7919570944,
"size_vram": 7919570944,
"details": {
"parent_model": "",
"format": "gguf",
"family": "llama",
"families": [
"llama"
],
"parameter_size": "3.2B",
"quantization_level": "F16"
},
"context_length": 4096
}
]
}
},
"is_streaming": false
}
}

View file

@ -0,0 +1,40 @@
{
"test_id": "tests/integration/inference/test_openai_completion.py::test_openai_completion_streaming[txt=ollama/llama3.2:3b-instruct-fp16-inference:completion:sanity]",
"request": {
"method": "POST",
"url": "http://localhost:11434/api/ps",
"headers": {},
"body": {},
"endpoint": "/api/ps",
"model": ""
},
"response": {
"body": {
"__type__": "ollama._types.ProcessResponse",
"__data__": {
"models": [
{
"model": "llama3.2:3b-instruct-fp16",
"name": "llama3.2:3b-instruct-fp16",
"digest": "195a8c01d91ec3cb1e0aad4624a51f2602c51fa7d96110f8ab5a20c84081804d",
"expires_at": "2025-10-03T20:05:44.851615-07:00",
"size": 7919570944,
"size_vram": 7919570944,
"details": {
"parent_model": "",
"format": "gguf",
"family": "llama",
"families": [
"llama"
],
"parameter_size": "3.2B",
"quantization_level": "F16"
},
"context_length": 4096
}
]
}
},
"is_streaming": false
}
}

View file

@ -0,0 +1,78 @@
{
"test_id": "tests/integration/inference/test_openai_completion.py::test_openai_chat_completion_streaming_with_n[client_with_models-txt=ollama/llama3.2:3b-instruct-fp16-inference:chat_completion:streaming_01]",
"request": {
"method": "POST",
"url": "http://localhost:11434/api/ps",
"headers": {},
"body": {},
"endpoint": "/api/ps",
"model": ""
},
"response": {
"body": {
"__type__": "ollama._types.ProcessResponse",
"__data__": {
"models": [
{
"model": "llama3.2:3b-instruct-fp16",
"name": "llama3.2:3b-instruct-fp16",
"digest": "195a8c01d91ec3cb1e0aad4624a51f2602c51fa7d96110f8ab5a20c84081804d",
"expires_at": "2025-10-03T20:07:02.652559-07:00",
"size": 7919570944,
"size_vram": 7919570944,
"details": {
"parent_model": "",
"format": "gguf",
"family": "llama",
"families": [
"llama"
],
"parameter_size": "3.2B",
"quantization_level": "F16"
},
"context_length": 4096
},
{
"model": "all-minilm:l6-v2",
"name": "all-minilm:l6-v2",
"digest": "1b226e2802dbb772b5fc32a58f103ca1804ef7501331012de126ab22f67475ef",
"expires_at": "2025-10-03T20:06:55.533878-07:00",
"size": 585846784,
"size_vram": 585846784,
"details": {
"parent_model": "",
"format": "gguf",
"family": "bert",
"families": [
"bert"
],
"parameter_size": "23M",
"quantization_level": "F16"
},
"context_length": 256
},
{
"model": "llama-guard3:1b",
"name": "llama-guard3:1b",
"digest": "494147e06bf99e10dbe67b63a07ac81c162f18ef3341aa3390007ac828571b3b",
"expires_at": "2025-10-03T20:06:23.356289-07:00",
"size": 2350966784,
"size_vram": 2350966784,
"details": {
"parent_model": "",
"format": "gguf",
"family": "llama",
"families": [
"llama"
],
"parameter_size": "1.5B",
"quantization_level": "Q8_0"
},
"context_length": 4096
}
]
}
},
"is_streaming": false
}
}

View file

@ -0,0 +1,421 @@
{
"test_id": "tests/integration/inference/test_openai_embeddings.py::test_openai_embeddings_with_encoding_format_float[llama_stack_client-emb=ollama/all-minilm:l6-v2]",
"request": {
"method": "POST",
"url": "http://0.0.0.0:11434/v1/v1/embeddings",
"headers": {},
"body": {
"model": "all-minilm:l6-v2",
"input": "Test encoding format",
"encoding_format": "float"
},
"endpoint": "/v1/embeddings",
"model": "all-minilm:l6-v2"
},
"response": {
"body": {
"__type__": "openai.types.create_embedding_response.CreateEmbeddingResponse",
"__data__": {
"data": [
{
"embedding": [
0.019109152,
-0.0205217,
-0.071471564,
-0.023057504,
-0.06572786,
-0.0057331678,
-0.029395059,
-0.031822033,
-0.015748156,
-0.039123703,
0.02694331,
-0.0641754,
0.013510709,
0.050364953,
-0.03114308,
-0.08322274,
-0.03192984,
0.074970365,
-0.016377378,
-0.0013804765,
0.03850419,
-0.03441017,
-0.0048610102,
-0.03094053,
0.051915165,
0.009193639,
0.0071807485,
0.066353165,
0.024559105,
-0.04767663,
0.0376255,
-0.042586852,
0.078906916,
0.04827334,
0.13389648,
0.013978803,
0.03242126,
-0.08890431,
-0.014188366,
0.03553346,
-0.02476171,
-0.028628638,
0.047652308,
0.026259335,
0.048472118,
0.06663718,
-0.013584004,
0.071824096,
-0.073066786,
-0.050326068,
0.0039502876,
0.03300394,
-0.047816053,
-0.017657546,
0.010284664,
-0.10525716,
-0.010034394,
0.014627846,
-0.053289402,
0.060343288,
-0.10079798,
0.011359217,
-0.007258805,
0.05346498,
-0.0068726647,
0.03697505,
0.024016414,
0.023924585,
-0.011357761,
-0.119573325,
-0.115692526,
-0.06673285,
-0.04233929,
0.09302018,
0.02486003,
0.084047645,
0.0030104683,
-0.06605523,
0.027435688,
-0.032412402,
-0.025584543,
-0.06590182,
0.067799605,
0.0976311,
0.07360619,
0.034108408,
0.056534845,
0.076705806,
-0.05179011,
0.053681813,
0.0054462817,
0.015972052,
0.0035656213,
0.06333522,
-0.01597322,
0.05295729,
0.11539089,
0.055200845,
0.037667733,
0.08083974,
0.035557732,
-0.07982552,
-0.012100598,
-0.07612801,
-0.0695667,
-0.017815348,
0.16996554,
-0.0048157335,
0.09073964,
-0.07196438,
0.020009195,
-0.05956153,
-0.06312686,
-0.07716358,
0.0150949685,
-0.050339524,
-0.05444592,
-0.023078114,
-0.035431463,
-0.030625492,
-0.053284056,
-0.06745872,
-0.08049862,
0.002800386,
-0.0114065055,
-0.029938627,
0.024243163,
-1.5107368e-33,
-0.02984805,
-0.00033025863,
0.0030491,
0.023082128,
-0.04808977,
-0.0027841914,
-0.037461873,
0.016201235,
-0.02998979,
0.015712254,
0.009664366,
-0.03984875,
-0.029493092,
0.03837007,
-0.005226541,
0.06857773,
-0.007891026,
-0.0019036188,
-0.035219382,
0.03627955,
0.05867878,
0.023777487,
0.044425115,
-0.025999734,
-0.025318418,
-0.02685328,
-0.02368557,
-0.094386704,
0.0016880591,
0.0065193563,
-0.09711005,
-0.053493332,
-0.08241291,
0.023502836,
-0.02407441,
0.015992055,
0.0050546136,
0.030476829,
-0.088438906,
0.11427086,
0.028378993,
0.02985018,
0.022821706,
0.018776013,
0.056330692,
-0.020254886,
-0.00070521404,
-0.0864014,
0.020228866,
-0.0039839754,
0.0010032665,
0.065425254,
-0.036518592,
0.032341316,
0.023112345,
0.044507477,
0.09644409,
-0.07272818,
0.03370691,
0.042783204,
-0.052776046,
0.0003352446,
0.061005518,
-0.019623613,
-0.023274273,
-0.11602989,
0.007926991,
-0.12529127,
0.017030548,
0.013484081,
-0.030528491,
-0.024298145,
0.006284904,
-0.015568167,
-0.072781205,
0.012985074,
0.015977127,
0.0051657534,
-0.0026022948,
-0.059578825,
0.06372584,
-0.0019363016,
0.018695941,
-0.009242735,
-0.05887247,
-0.032524884,
-0.009591115,
-0.047377545,
0.020585002,
-0.007134836,
0.050135154,
0.016087264,
-0.0058878902,
-0.07661024,
0.0820671,
1.6053074e-33,
-0.0056476775,
0.06719423,
-0.011510322,
0.05586423,
-0.08886697,
-0.036528286,
0.12134926,
0.028969096,
0.022419011,
0.047327086,
0.07621525,
-0.07937209,
0.0020504447,
-0.023489932,
-0.029759271,
-0.04879825,
-0.034876924,
0.06461666,
0.051493492,
0.008284975,
-0.031793926,
0.098015875,
0.008122038,
0.01032072,
0.059404474,
0.05176487,
0.042960417,
0.0069373515,
0.027306866,
0.039226852,
0.062416088,
0.051797673,
0.0053232666,
0.05965781,
-0.008935817,
-0.0135501,
0.08726531,
0.028408607,
-0.006820522,
0.052098107,
0.049510423,
0.055176627,
-0.016774576,
0.077848226,
0.026121203,
0.031311177,
0.011812256,
-0.0341528,
0.052825138,
0.003484205,
0.09811821,
0.029693138,
-0.031354938,
-0.012068096,
0.018686052,
-0.032609653,
-0.09638639,
0.033928476,
-0.07897009,
-0.008300913,
-0.04915284,
0.02006342,
0.061743837,
-0.018412542,
-0.033583082,
-0.090903476,
0.021116566,
-0.022445552,
-0.011814237,
-0.048816226,
0.048287436,
-0.07294675,
-0.02198573,
0.062477604,
0.023308119,
-0.052141402,
-0.05409648,
0.062339973,
0.052301563,
0.051384836,
-0.02426406,
-0.018824687,
-0.01660311,
0.09330242,
0.008502433,
0.063408315,
0.019377569,
0.047027417,
-0.0058769877,
-0.0034505578,
0.07956527,
0.10210641,
0.015302805,
0.04089992,
0.038895626,
-1.2710905e-08,
-0.019304764,
-0.1217849,
-0.047983564,
-0.053382736,
-0.113197215,
0.05181196,
-0.10498226,
-0.08524135,
0.0061870585,
-0.029899841,
0.064561576,
-0.028730206,
-0.064735174,
-0.024887148,
0.0026119591,
-0.008796896,
0.030246036,
0.009807871,
0.0044631795,
0.0851423,
-0.026132204,
0.11360852,
-0.0045760865,
-0.036643907,
-0.09078616,
0.081466354,
0.012066122,
0.07288108,
0.004079195,
-0.05064171,
0.068772145,
0.029108258,
0.014786602,
-0.11868081,
-0.05042858,
0.05376578,
0.04570744,
0.074074544,
0.028540619,
0.03937392,
0.0291862,
-0.035710927,
-0.09132387,
-0.047720414,
-0.00082342024,
-0.073688805,
0.011024812,
0.015703982,
-0.03590976,
-0.08121826,
0.020365681,
-0.045287356,
-0.024955628,
0.001167751,
0.00037544646,
-0.026392939,
-0.032434102,
0.003407464,
-0.007060387,
0.024250468,
0.076347135,
0.039537415,
0.036043648,
-0.07085338
],
"index": 0,
"object": "embedding"
}
],
"model": "all-minilm:l6-v2",
"object": "list",
"usage": {
"prompt_tokens": 3,
"total_tokens": 3
}
}
},
"is_streaming": false
}
}

View file

@ -0,0 +1,104 @@
{
"request": {
"method": "POST",
"url": "http://0.0.0.0:11434/v1/v1/completions",
"headers": {},
"body": {
"model": "llama3.2:3b-instruct-fp16",
"messages": [
{
"role": "user",
"content": "What's the weather in Tokyo? Use the get_weather function to get the weather."
}
],
"stream": true,
"tools": [
{
"type": "function",
"function": {
"name": "get_weather",
"description": "Get the weather in a given city",
"parameters": {
"type": "object",
"properties": {
"city": {
"type": "string",
"description": "The city to get the weather for"
}
}
}
}
}
]
},
"endpoint": "/v1/completions",
"model": "llama3.2:3b-instruct-fp16"
},
"response": {
"body": [
{
"__type__": "openai.types.chat.chat_completion_chunk.ChatCompletionChunk",
"__data__": {
"id": "rec-4014dd44c15f",
"choices": [
{
"delta": {
"content": "",
"function_call": null,
"refusal": null,
"role": "assistant",
"tool_calls": [
{
"index": 0,
"id": "call_9732h2cb",
"function": {
"arguments": "{\"city\":\"Tokyo\"}",
"name": "get_weather"
},
"type": "function"
}
]
},
"finish_reason": null,
"index": 0,
"logprobs": null
}
],
"created": 0,
"model": "llama3.2:3b-instruct-fp16",
"object": "chat.completion.chunk",
"service_tier": null,
"system_fingerprint": "fp_ollama",
"usage": null
}
},
{
"__type__": "openai.types.chat.chat_completion_chunk.ChatCompletionChunk",
"__data__": {
"id": "rec-4014dd44c15f",
"choices": [
{
"delta": {
"content": "",
"function_call": null,
"refusal": null,
"role": "assistant",
"tool_calls": null
},
"finish_reason": "tool_calls",
"index": 0,
"logprobs": null
}
],
"created": 0,
"model": "llama3.2:3b-instruct-fp16",
"object": "chat.completion.chunk",
"service_tier": null,
"system_fingerprint": "fp_ollama",
"usage": null
}
}
],
"is_streaming": true
}
}

View file

@ -0,0 +1,78 @@
{
"test_id": "tests/integration/inference/test_openai_embeddings.py::test_openai_embeddings_base64_batch_processing[llama_stack_client-emb=ollama/all-minilm:l6-v2]",
"request": {
"method": "POST",
"url": "http://localhost:11434/api/ps",
"headers": {},
"body": {},
"endpoint": "/api/ps",
"model": ""
},
"response": {
"body": {
"__type__": "ollama._types.ProcessResponse",
"__data__": {
"models": [
{
"model": "all-minilm:l6-v2",
"name": "all-minilm:l6-v2",
"digest": "1b226e2802dbb772b5fc32a58f103ca1804ef7501331012de126ab22f67475ef",
"expires_at": "2025-10-03T20:06:55.533878-07:00",
"size": 585846784,
"size_vram": 585846784,
"details": {
"parent_model": "",
"format": "gguf",
"family": "bert",
"families": [
"bert"
],
"parameter_size": "23M",
"quantization_level": "F16"
},
"context_length": 256
},
{
"model": "llama3.2:3b-instruct-fp16",
"name": "llama3.2:3b-instruct-fp16",
"digest": "195a8c01d91ec3cb1e0aad4624a51f2602c51fa7d96110f8ab5a20c84081804d",
"expires_at": "2025-10-03T20:06:54.261283-07:00",
"size": 7919570944,
"size_vram": 7919570944,
"details": {
"parent_model": "",
"format": "gguf",
"family": "llama",
"families": [
"llama"
],
"parameter_size": "3.2B",
"quantization_level": "F16"
},
"context_length": 4096
},
{
"model": "llama-guard3:1b",
"name": "llama-guard3:1b",
"digest": "494147e06bf99e10dbe67b63a07ac81c162f18ef3341aa3390007ac828571b3b",
"expires_at": "2025-10-03T20:06:23.356289-07:00",
"size": 2350966784,
"size_vram": 2350966784,
"details": {
"parent_model": "",
"format": "gguf",
"family": "llama",
"families": [
"llama"
],
"parameter_size": "1.5B",
"quantization_level": "Q8_0"
},
"context_length": 4096
}
]
}
},
"is_streaming": false
}
}

View file

@ -0,0 +1,56 @@
{
"request": {
"method": "POST",
"url": "http://0.0.0.0:11434/v1/v1/chat/completions",
"headers": {},
"body": {
"model": "llama3.2:3b-instruct-fp16",
"messages": [
{
"role": "user",
"content": "Hello, world!"
}
],
"stream": false
},
"endpoint": "/v1/chat/completions",
"model": "llama3.2:3b-instruct-fp16"
},
"response": {
"body": {
"__type__": "openai.types.chat.chat_completion.ChatCompletion",
"__data__": {
"id": "rec-a4c8d19bb1eb",
"choices": [
{
"finish_reason": "stop",
"index": 0,
"logprobs": null,
"message": {
"content": "Hello! It's nice to meet you. Is there something I can help you with or would you like to chat?",
"refusal": null,
"role": "assistant",
"annotations": null,
"audio": null,
"function_call": null,
"tool_calls": null
}
}
],
"created": 0,
"model": "llama3.2:3b-instruct-fp16",
"object": "chat.completion",
"service_tier": null,
"system_fingerprint": "fp_ollama",
"usage": {
"completion_tokens": 25,
"prompt_tokens": 29,
"total_tokens": 54,
"completion_tokens_details": null,
"prompt_tokens_details": null
}
}
},
"is_streaming": false
}
}

View file

@ -0,0 +1,40 @@
{
"test_id": "tests/integration/inference/test_openai_completion.py::test_openai_completion_guided_choice[txt=ollama/llama3.2:3b-instruct-fp16]",
"request": {
"method": "POST",
"url": "http://localhost:11434/api/ps",
"headers": {},
"body": {},
"endpoint": "/api/ps",
"model": ""
},
"response": {
"body": {
"__type__": "ollama._types.ProcessResponse",
"__data__": {
"models": [
{
"model": "llama3.2:3b-instruct-fp16",
"name": "llama3.2:3b-instruct-fp16",
"digest": "195a8c01d91ec3cb1e0aad4624a51f2602c51fa7d96110f8ab5a20c84081804d",
"expires_at": "2025-10-03T20:05:47.301578-07:00",
"size": 7919570944,
"size_vram": 7919570944,
"details": {
"parent_model": "",
"format": "gguf",
"family": "llama",
"families": [
"llama"
],
"parameter_size": "3.2B",
"quantization_level": "F16"
},
"context_length": 4096
}
]
}
},
"is_streaming": false
}
}

View file

@ -0,0 +1,78 @@
{
"test_id": "tests/integration/inference/test_openai_embeddings.py::test_openai_embeddings_invalid_model_error[llama_stack_client-emb=ollama/all-minilm:l6-v2]",
"request": {
"method": "POST",
"url": "http://localhost:11434/api/ps",
"headers": {},
"body": {},
"endpoint": "/api/ps",
"model": ""
},
"response": {
"body": {
"__type__": "ollama._types.ProcessResponse",
"__data__": {
"models": [
{
"model": "all-minilm:l6-v2",
"name": "all-minilm:l6-v2",
"digest": "1b226e2802dbb772b5fc32a58f103ca1804ef7501331012de126ab22f67475ef",
"expires_at": "2025-10-03T20:06:55.330036-07:00",
"size": 585846784,
"size_vram": 585846784,
"details": {
"parent_model": "",
"format": "gguf",
"family": "bert",
"families": [
"bert"
],
"parameter_size": "23M",
"quantization_level": "F16"
},
"context_length": 256
},
{
"model": "llama3.2:3b-instruct-fp16",
"name": "llama3.2:3b-instruct-fp16",
"digest": "195a8c01d91ec3cb1e0aad4624a51f2602c51fa7d96110f8ab5a20c84081804d",
"expires_at": "2025-10-03T20:06:54.261283-07:00",
"size": 7919570944,
"size_vram": 7919570944,
"details": {
"parent_model": "",
"format": "gguf",
"family": "llama",
"families": [
"llama"
],
"parameter_size": "3.2B",
"quantization_level": "F16"
},
"context_length": 4096
},
{
"model": "llama-guard3:1b",
"name": "llama-guard3:1b",
"digest": "494147e06bf99e10dbe67b63a07ac81c162f18ef3341aa3390007ac828571b3b",
"expires_at": "2025-10-03T20:06:23.356289-07:00",
"size": 2350966784,
"size_vram": 2350966784,
"details": {
"parent_model": "",
"format": "gguf",
"family": "llama",
"families": [
"llama"
],
"parameter_size": "1.5B",
"quantization_level": "Q8_0"
},
"context_length": 4096
}
]
}
},
"is_streaming": false
}
}

View file

@ -0,0 +1,78 @@
{
"test_id": "tests/integration/inference/test_openai_embeddings.py::test_openai_embeddings_with_encoding_format_float[llama_stack_client-emb=ollama/all-minilm:l6-v2]",
"request": {
"method": "POST",
"url": "http://localhost:11434/api/ps",
"headers": {},
"body": {},
"endpoint": "/api/ps",
"model": ""
},
"response": {
"body": {
"__type__": "ollama._types.ProcessResponse",
"__data__": {
"models": [
{
"model": "all-minilm:l6-v2",
"name": "all-minilm:l6-v2",
"digest": "1b226e2802dbb772b5fc32a58f103ca1804ef7501331012de126ab22f67475ef",
"expires_at": "2025-10-03T20:06:55.077957-07:00",
"size": 585846784,
"size_vram": 585846784,
"details": {
"parent_model": "",
"format": "gguf",
"family": "bert",
"families": [
"bert"
],
"parameter_size": "23M",
"quantization_level": "F16"
},
"context_length": 256
},
{
"model": "llama3.2:3b-instruct-fp16",
"name": "llama3.2:3b-instruct-fp16",
"digest": "195a8c01d91ec3cb1e0aad4624a51f2602c51fa7d96110f8ab5a20c84081804d",
"expires_at": "2025-10-03T20:06:54.261283-07:00",
"size": 7919570944,
"size_vram": 7919570944,
"details": {
"parent_model": "",
"format": "gguf",
"family": "llama",
"families": [
"llama"
],
"parameter_size": "3.2B",
"quantization_level": "F16"
},
"context_length": 4096
},
{
"model": "llama-guard3:1b",
"name": "llama-guard3:1b",
"digest": "494147e06bf99e10dbe67b63a07ac81c162f18ef3341aa3390007ac828571b3b",
"expires_at": "2025-10-03T20:06:23.356289-07:00",
"size": 2350966784,
"size_vram": 2350966784,
"details": {
"parent_model": "",
"format": "gguf",
"family": "llama",
"families": [
"llama"
],
"parameter_size": "1.5B",
"quantization_level": "Q8_0"
},
"context_length": 4096
}
]
}
},
"is_streaming": false
}
}

View file

@ -0,0 +1,86 @@
{
"request": {
"method": "POST",
"url": "http://0.0.0.0:11434/v1/v1/chat/completions",
"headers": {},
"body": {
"model": "llama3.2:3b-instruct-fp16",
"messages": [
{
"role": "user",
"content": "What's the weather in San Francisco?"
}
],
"tools": [
{
"type": "function",
"function": {
"name": "get_weather",
"description": "Get weather for a location",
"parameters": {
"type": "object",
"properties": {
"location": {
"type": "string",
"description": "City name"
}
},
"required": [
"location"
]
}
}
}
]
},
"endpoint": "/v1/chat/completions",
"model": "llama3.2:3b-instruct-fp16"
},
"response": {
"body": {
"__type__": "openai.types.chat.chat_completion.ChatCompletion",
"__data__": {
"id": "rec-931ac7158789",
"choices": [
{
"finish_reason": "tool_calls",
"index": 0,
"logprobs": null,
"message": {
"content": "",
"refusal": null,
"role": "assistant",
"annotations": null,
"audio": null,
"function_call": null,
"tool_calls": [
{
"id": "call_t7y6oe6q",
"function": {
"arguments": "{\"location\":\"San Francisco\"}",
"name": "get_weather"
},
"type": "function",
"index": 0
}
]
}
}
],
"created": 0,
"model": "llama3.2:3b-instruct-fp16",
"object": "chat.completion",
"service_tier": null,
"system_fingerprint": "fp_ollama",
"usage": {
"completion_tokens": 18,
"prompt_tokens": 161,
"total_tokens": 179,
"completion_tokens_details": null,
"prompt_tokens_details": null
}
}
},
"is_streaming": false
}
}

View file

@ -0,0 +1,78 @@
{
"test_id": "tests/integration/inference/test_openai_embeddings.py::test_openai_embeddings_with_encoding_format_base64[llama_stack_client-emb=ollama/all-minilm:l6-v2]",
"request": {
"method": "POST",
"url": "http://localhost:11434/api/ps",
"headers": {},
"body": {},
"endpoint": "/api/ps",
"model": ""
},
"response": {
"body": {
"__type__": "ollama._types.ProcessResponse",
"__data__": {
"models": [
{
"model": "all-minilm:l6-v2",
"name": "all-minilm:l6-v2",
"digest": "1b226e2802dbb772b5fc32a58f103ca1804ef7501331012de126ab22f67475ef",
"expires_at": "2025-10-03T20:06:55.533878-07:00",
"size": 585846784,
"size_vram": 585846784,
"details": {
"parent_model": "",
"format": "gguf",
"family": "bert",
"families": [
"bert"
],
"parameter_size": "23M",
"quantization_level": "F16"
},
"context_length": 256
},
{
"model": "llama3.2:3b-instruct-fp16",
"name": "llama3.2:3b-instruct-fp16",
"digest": "195a8c01d91ec3cb1e0aad4624a51f2602c51fa7d96110f8ab5a20c84081804d",
"expires_at": "2025-10-03T20:06:54.261283-07:00",
"size": 7919570944,
"size_vram": 7919570944,
"details": {
"parent_model": "",
"format": "gguf",
"family": "llama",
"families": [
"llama"
],
"parameter_size": "3.2B",
"quantization_level": "F16"
},
"context_length": 4096
},
{
"model": "llama-guard3:1b",
"name": "llama-guard3:1b",
"digest": "494147e06bf99e10dbe67b63a07ac81c162f18ef3341aa3390007ac828571b3b",
"expires_at": "2025-10-03T20:06:23.356289-07:00",
"size": 2350966784,
"size_vram": 2350966784,
"details": {
"parent_model": "",
"format": "gguf",
"family": "llama",
"families": [
"llama"
],
"parameter_size": "1.5B",
"quantization_level": "Q8_0"
},
"context_length": 4096
}
]
}
},
"is_streaming": false
}
}

File diff suppressed because one or more lines are too long

View file

@ -0,0 +1,117 @@
{
"request": {
"method": "POST",
"url": "http://0.0.0.0:11434/v1/v1/chat/completions",
"headers": {},
"body": {
"model": "llama3.2:3b-instruct-fp16",
"messages": [
{
"role": "user",
"content": "Book a flight from SFO to JFK for John Doe"
}
],
"tools": [
{
"type": "function",
"function": {
"name": "book_flight",
"description": "Book a flight",
"parameters": {
"type": "object",
"properties": {
"flight": {
"$ref": "#/$defs/FlightInfo"
},
"passenger": {
"$ref": "#/$defs/Passenger"
}
},
"required": [
"flight",
"passenger"
],
"$defs": {
"FlightInfo": {
"type": "object",
"properties": {
"from": {
"type": "string"
},
"to": {
"type": "string"
},
"date": {
"type": "string",
"format": "date"
}
}
},
"Passenger": {
"type": "object",
"properties": {
"name": {
"type": "string"
},
"age": {
"type": "integer"
}
}
}
}
}
}
}
]
},
"endpoint": "/v1/chat/completions",
"model": "llama3.2:3b-instruct-fp16"
},
"response": {
"body": {
"__type__": "openai.types.chat.chat_completion.ChatCompletion",
"__data__": {
"id": "rec-d9e8f66e1d85",
"choices": [
{
"finish_reason": "tool_calls",
"index": 0,
"logprobs": null,
"message": {
"content": "",
"refusal": null,
"role": "assistant",
"annotations": null,
"audio": null,
"function_call": null,
"tool_calls": [
{
"id": "call_bdq6iic2",
"function": {
"arguments": "{\"flight\":\"{\\\"date\\\":\\\"2023-08-20\\\",\\\"from\\\":\\\"SFO\\\",\\\"to\\\":\\\"JFK\\\"}\",\"passenger\":\"{\\\"age\\\":30,\\\"name\\\":\\\"John Doe\\\"}\"}",
"name": "book_flight"
},
"type": "function",
"index": 0
}
]
}
}
],
"created": 0,
"model": "llama3.2:3b-instruct-fp16",
"object": "chat.completion",
"service_tier": null,
"system_fingerprint": "fp_ollama",
"usage": {
"completion_tokens": 52,
"prompt_tokens": 227,
"total_tokens": 279,
"completion_tokens_details": null,
"prompt_tokens_details": null
}
}
},
"is_streaming": false
}
}

View file

@ -0,0 +1,78 @@
{
"test_id": "tests/integration/inference/test_openai_embeddings.py::test_openai_embeddings_empty_list_error[llama_stack_client-emb=ollama/all-minilm:l6-v2]",
"request": {
"method": "POST",
"url": "http://localhost:11434/api/ps",
"headers": {},
"body": {},
"endpoint": "/api/ps",
"model": ""
},
"response": {
"body": {
"__type__": "ollama._types.ProcessResponse",
"__data__": {
"models": [
{
"model": "all-minilm:l6-v2",
"name": "all-minilm:l6-v2",
"digest": "1b226e2802dbb772b5fc32a58f103ca1804ef7501331012de126ab22f67475ef",
"expires_at": "2025-10-03T20:06:55.330036-07:00",
"size": 585846784,
"size_vram": 585846784,
"details": {
"parent_model": "",
"format": "gguf",
"family": "bert",
"families": [
"bert"
],
"parameter_size": "23M",
"quantization_level": "F16"
},
"context_length": 256
},
{
"model": "llama3.2:3b-instruct-fp16",
"name": "llama3.2:3b-instruct-fp16",
"digest": "195a8c01d91ec3cb1e0aad4624a51f2602c51fa7d96110f8ab5a20c84081804d",
"expires_at": "2025-10-03T20:06:54.261283-07:00",
"size": 7919570944,
"size_vram": 7919570944,
"details": {
"parent_model": "",
"format": "gguf",
"family": "llama",
"families": [
"llama"
],
"parameter_size": "3.2B",
"quantization_level": "F16"
},
"context_length": 4096
},
{
"model": "llama-guard3:1b",
"name": "llama-guard3:1b",
"digest": "494147e06bf99e10dbe67b63a07ac81c162f18ef3341aa3390007ac828571b3b",
"expires_at": "2025-10-03T20:06:23.356289-07:00",
"size": 2350966784,
"size_vram": 2350966784,
"details": {
"parent_model": "",
"format": "gguf",
"family": "llama",
"families": [
"llama"
],
"parameter_size": "1.5B",
"quantization_level": "Q8_0"
},
"context_length": 4096
}
]
}
},
"is_streaming": false
}
}

View file

@ -0,0 +1,78 @@
{
"request": {
"method": "POST",
"url": "http://0.0.0.0:11434/v1/v1/chat/completions",
"headers": {},
"body": {
"model": "llama3.2:3b-instruct-fp16",
"messages": [
{
"role": "user",
"content": "Call the no args tool"
}
],
"tools": [
{
"type": "function",
"function": {
"name": "no_args_tool",
"description": "Tool with no arguments",
"parameters": {
"type": "object",
"properties": {}
}
}
}
]
},
"endpoint": "/v1/chat/completions",
"model": "llama3.2:3b-instruct-fp16"
},
"response": {
"body": {
"__type__": "openai.types.chat.chat_completion.ChatCompletion",
"__data__": {
"id": "rec-c4991de37dfb",
"choices": [
{
"finish_reason": "tool_calls",
"index": 0,
"logprobs": null,
"message": {
"content": "",
"refusal": null,
"role": "assistant",
"annotations": null,
"audio": null,
"function_call": null,
"tool_calls": [
{
"id": "call_wbx3rwxz",
"function": {
"arguments": "{}",
"name": "no_args_tool"
},
"type": "function",
"index": 0
}
]
}
}
],
"created": 0,
"model": "llama3.2:3b-instruct-fp16",
"object": "chat.completion",
"service_tier": null,
"system_fingerprint": "fp_ollama",
"usage": {
"completion_tokens": 14,
"prompt_tokens": 148,
"total_tokens": 162,
"completion_tokens_details": null,
"prompt_tokens_details": null
}
}
},
"is_streaming": false
}
}

View file

@ -0,0 +1,59 @@
{
"test_id": "tests/integration/inference/test_openai_embeddings.py::test_openai_embeddings_single_string[llama_stack_client-emb=ollama/all-minilm:l6-v2]",
"request": {
"method": "POST",
"url": "http://localhost:11434/api/ps",
"headers": {},
"body": {},
"endpoint": "/api/ps",
"model": ""
},
"response": {
"body": {
"__type__": "ollama._types.ProcessResponse",
"__data__": {
"models": [
{
"model": "llama3.2:3b-instruct-fp16",
"name": "llama3.2:3b-instruct-fp16",
"digest": "195a8c01d91ec3cb1e0aad4624a51f2602c51fa7d96110f8ab5a20c84081804d",
"expires_at": "2025-10-03T20:06:54.261283-07:00",
"size": 7919570944,
"size_vram": 7919570944,
"details": {
"parent_model": "",
"format": "gguf",
"family": "llama",
"families": [
"llama"
],
"parameter_size": "3.2B",
"quantization_level": "F16"
},
"context_length": 4096
},
{
"model": "llama-guard3:1b",
"name": "llama-guard3:1b",
"digest": "494147e06bf99e10dbe67b63a07ac81c162f18ef3341aa3390007ac828571b3b",
"expires_at": "2025-10-03T20:06:23.356289-07:00",
"size": 2350966784,
"size_vram": 2350966784,
"details": {
"parent_model": "",
"format": "gguf",
"family": "llama",
"families": [
"llama"
],
"parameter_size": "1.5B",
"quantization_level": "Q8_0"
},
"context_length": 4096
}
]
}
},
"is_streaming": false
}
}

View file

@ -0,0 +1,57 @@
{
"test_id": "tests/integration/inference/test_openai_completion.py::test_openai_chat_completion_non_streaming[client_with_models-txt=ollama/llama3.2:3b-instruct-fp16-inference:chat_completion:non_streaming_01]",
"request": {
"method": "POST",
"url": "http://0.0.0.0:11434/v1/v1/chat/completions",
"headers": {},
"body": {
"model": "llama3.2:3b-instruct-fp16",
"messages": [
{
"role": "user",
"content": "Which planet do humans live on?"
}
],
"stream": false
},
"endpoint": "/v1/chat/completions",
"model": "llama3.2:3b-instruct-fp16"
},
"response": {
"body": {
"__type__": "openai.types.chat.chat_completion.ChatCompletion",
"__data__": {
"id": "rec-acdd905b0481",
"choices": [
{
"finish_reason": "stop",
"index": 0,
"logprobs": null,
"message": {
"content": "Humans live on Earth. It is the third planet from the Sun and the only known planet in the universe that supports life.",
"refusal": null,
"role": "assistant",
"annotations": null,
"audio": null,
"function_call": null,
"tool_calls": null
}
}
],
"created": 0,
"model": "llama3.2:3b-instruct-fp16",
"object": "chat.completion",
"service_tier": null,
"system_fingerprint": "fp_ollama",
"usage": {
"completion_tokens": 26,
"prompt_tokens": 32,
"total_tokens": 58,
"completion_tokens_details": null,
"prompt_tokens_details": null
}
}
},
"is_streaming": false
}
}

View file

@ -0,0 +1,989 @@
{
"request": {
"method": "POST",
"url": "http://0.0.0.0:11434/v1/v1/completions",
"headers": {},
"body": {
"model": "llama3.2:3b-instruct-fp16",
"prompt": "Respond to this question and explain your answer. Complete the sentence using one word: Roses are red, violets are ",
"max_tokens": 50,
"stream": true
},
"endpoint": "/v1/completions",
"model": "llama3.2:3b-instruct-fp16"
},
"response": {
"body": [
{
"__type__": "openai.types.completion.Completion",
"__data__": {
"id": "rec-84cab42e1f5c",
"choices": [
{
"finish_reason": null,
"index": 0,
"logprobs": null,
"text": "Blue"
}
],
"created": 0,
"model": "llama3.2:3b-instruct-fp16",
"object": "text_completion",
"system_fingerprint": "fp_ollama",
"usage": null
}
},
{
"__type__": "openai.types.completion.Completion",
"__data__": {
"id": "rec-84cab42e1f5c",
"choices": [
{
"finish_reason": null,
"index": 0,
"logprobs": null,
"text": ".\n\n"
}
],
"created": 0,
"model": "llama3.2:3b-instruct-fp16",
"object": "text_completion",
"system_fingerprint": "fp_ollama",
"usage": null
}
},
{
"__type__": "openai.types.completion.Completion",
"__data__": {
"id": "rec-84cab42e1f5c",
"choices": [
{
"finish_reason": null,
"index": 0,
"logprobs": null,
"text": "My"
}
],
"created": 0,
"model": "llama3.2:3b-instruct-fp16",
"object": "text_completion",
"system_fingerprint": "fp_ollama",
"usage": null
}
},
{
"__type__": "openai.types.completion.Completion",
"__data__": {
"id": "rec-84cab42e1f5c",
"choices": [
{
"finish_reason": null,
"index": 0,
"logprobs": null,
"text": " answer"
}
],
"created": 0,
"model": "llama3.2:3b-instruct-fp16",
"object": "text_completion",
"system_fingerprint": "fp_ollama",
"usage": null
}
},
{
"__type__": "openai.types.completion.Completion",
"__data__": {
"id": "rec-84cab42e1f5c",
"choices": [
{
"finish_reason": null,
"index": 0,
"logprobs": null,
"text": " is"
}
],
"created": 0,
"model": "llama3.2:3b-instruct-fp16",
"object": "text_completion",
"system_fingerprint": "fp_ollama",
"usage": null
}
},
{
"__type__": "openai.types.completion.Completion",
"__data__": {
"id": "rec-84cab42e1f5c",
"choices": [
{
"finish_reason": null,
"index": 0,
"logprobs": null,
"text": " blue"
}
],
"created": 0,
"model": "llama3.2:3b-instruct-fp16",
"object": "text_completion",
"system_fingerprint": "fp_ollama",
"usage": null
}
},
{
"__type__": "openai.types.completion.Completion",
"__data__": {
"id": "rec-84cab42e1f5c",
"choices": [
{
"finish_reason": null,
"index": 0,
"logprobs": null,
"text": " because"
}
],
"created": 0,
"model": "llama3.2:3b-instruct-fp16",
"object": "text_completion",
"system_fingerprint": "fp_ollama",
"usage": null
}
},
{
"__type__": "openai.types.completion.Completion",
"__data__": {
"id": "rec-84cab42e1f5c",
"choices": [
{
"finish_reason": null,
"index": 0,
"logprobs": null,
"text": " it"
}
],
"created": 0,
"model": "llama3.2:3b-instruct-fp16",
"object": "text_completion",
"system_fingerprint": "fp_ollama",
"usage": null
}
},
{
"__type__": "openai.types.completion.Completion",
"__data__": {
"id": "rec-84cab42e1f5c",
"choices": [
{
"finish_reason": null,
"index": 0,
"logprobs": null,
"text": "'s"
}
],
"created": 0,
"model": "llama3.2:3b-instruct-fp16",
"object": "text_completion",
"system_fingerprint": "fp_ollama",
"usage": null
}
},
{
"__type__": "openai.types.completion.Completion",
"__data__": {
"id": "rec-84cab42e1f5c",
"choices": [
{
"finish_reason": null,
"index": 0,
"logprobs": null,
"text": " a"
}
],
"created": 0,
"model": "llama3.2:3b-instruct-fp16",
"object": "text_completion",
"system_fingerprint": "fp_ollama",
"usage": null
}
},
{
"__type__": "openai.types.completion.Completion",
"__data__": {
"id": "rec-84cab42e1f5c",
"choices": [
{
"finish_reason": null,
"index": 0,
"logprobs": null,
"text": " common"
}
],
"created": 0,
"model": "llama3.2:3b-instruct-fp16",
"object": "text_completion",
"system_fingerprint": "fp_ollama",
"usage": null
}
},
{
"__type__": "openai.types.completion.Completion",
"__data__": {
"id": "rec-84cab42e1f5c",
"choices": [
{
"finish_reason": null,
"index": 0,
"logprobs": null,
"text": " and"
}
],
"created": 0,
"model": "llama3.2:3b-instruct-fp16",
"object": "text_completion",
"system_fingerprint": "fp_ollama",
"usage": null
}
},
{
"__type__": "openai.types.completion.Completion",
"__data__": {
"id": "rec-84cab42e1f5c",
"choices": [
{
"finish_reason": null,
"index": 0,
"logprobs": null,
"text": " well"
}
],
"created": 0,
"model": "llama3.2:3b-instruct-fp16",
"object": "text_completion",
"system_fingerprint": "fp_ollama",
"usage": null
}
},
{
"__type__": "openai.types.completion.Completion",
"__data__": {
"id": "rec-84cab42e1f5c",
"choices": [
{
"finish_reason": null,
"index": 0,
"logprobs": null,
"text": "-known"
}
],
"created": 0,
"model": "llama3.2:3b-instruct-fp16",
"object": "text_completion",
"system_fingerprint": "fp_ollama",
"usage": null
}
},
{
"__type__": "openai.types.completion.Completion",
"__data__": {
"id": "rec-84cab42e1f5c",
"choices": [
{
"finish_reason": null,
"index": 0,
"logprobs": null,
"text": " completion"
}
],
"created": 0,
"model": "llama3.2:3b-instruct-fp16",
"object": "text_completion",
"system_fingerprint": "fp_ollama",
"usage": null
}
},
{
"__type__": "openai.types.completion.Completion",
"__data__": {
"id": "rec-84cab42e1f5c",
"choices": [
{
"finish_reason": null,
"index": 0,
"logprobs": null,
"text": " of"
}
],
"created": 0,
"model": "llama3.2:3b-instruct-fp16",
"object": "text_completion",
"system_fingerprint": "fp_ollama",
"usage": null
}
},
{
"__type__": "openai.types.completion.Completion",
"__data__": {
"id": "rec-84cab42e1f5c",
"choices": [
{
"finish_reason": null,
"index": 0,
"logprobs": null,
"text": " the"
}
],
"created": 0,
"model": "llama3.2:3b-instruct-fp16",
"object": "text_completion",
"system_fingerprint": "fp_ollama",
"usage": null
}
},
{
"__type__": "openai.types.completion.Completion",
"__data__": {
"id": "rec-84cab42e1f5c",
"choices": [
{
"finish_reason": null,
"index": 0,
"logprobs": null,
"text": " classic"
}
],
"created": 0,
"model": "llama3.2:3b-instruct-fp16",
"object": "text_completion",
"system_fingerprint": "fp_ollama",
"usage": null
}
},
{
"__type__": "openai.types.completion.Completion",
"__data__": {
"id": "rec-84cab42e1f5c",
"choices": [
{
"finish_reason": null,
"index": 0,
"logprobs": null,
"text": " tongue"
}
],
"created": 0,
"model": "llama3.2:3b-instruct-fp16",
"object": "text_completion",
"system_fingerprint": "fp_ollama",
"usage": null
}
},
{
"__type__": "openai.types.completion.Completion",
"__data__": {
"id": "rec-84cab42e1f5c",
"choices": [
{
"finish_reason": null,
"index": 0,
"logprobs": null,
"text": "-tw"
}
],
"created": 0,
"model": "llama3.2:3b-instruct-fp16",
"object": "text_completion",
"system_fingerprint": "fp_ollama",
"usage": null
}
},
{
"__type__": "openai.types.completion.Completion",
"__data__": {
"id": "rec-84cab42e1f5c",
"choices": [
{
"finish_reason": null,
"index": 0,
"logprobs": null,
"text": "ister"
}
],
"created": 0,
"model": "llama3.2:3b-instruct-fp16",
"object": "text_completion",
"system_fingerprint": "fp_ollama",
"usage": null
}
},
{
"__type__": "openai.types.completion.Completion",
"__data__": {
"id": "rec-84cab42e1f5c",
"choices": [
{
"finish_reason": null,
"index": 0,
"logprobs": null,
"text": " \""
}
],
"created": 0,
"model": "llama3.2:3b-instruct-fp16",
"object": "text_completion",
"system_fingerprint": "fp_ollama",
"usage": null
}
},
{
"__type__": "openai.types.completion.Completion",
"__data__": {
"id": "rec-84cab42e1f5c",
"choices": [
{
"finish_reason": null,
"index": 0,
"logprobs": null,
"text": "R"
}
],
"created": 0,
"model": "llama3.2:3b-instruct-fp16",
"object": "text_completion",
"system_fingerprint": "fp_ollama",
"usage": null
}
},
{
"__type__": "openai.types.completion.Completion",
"__data__": {
"id": "rec-84cab42e1f5c",
"choices": [
{
"finish_reason": null,
"index": 0,
"logprobs": null,
"text": "oses"
}
],
"created": 0,
"model": "llama3.2:3b-instruct-fp16",
"object": "text_completion",
"system_fingerprint": "fp_ollama",
"usage": null
}
},
{
"__type__": "openai.types.completion.Completion",
"__data__": {
"id": "rec-84cab42e1f5c",
"choices": [
{
"finish_reason": null,
"index": 0,
"logprobs": null,
"text": " are"
}
],
"created": 0,
"model": "llama3.2:3b-instruct-fp16",
"object": "text_completion",
"system_fingerprint": "fp_ollama",
"usage": null
}
},
{
"__type__": "openai.types.completion.Completion",
"__data__": {
"id": "rec-84cab42e1f5c",
"choices": [
{
"finish_reason": null,
"index": 0,
"logprobs": null,
"text": " red"
}
],
"created": 0,
"model": "llama3.2:3b-instruct-fp16",
"object": "text_completion",
"system_fingerprint": "fp_ollama",
"usage": null
}
},
{
"__type__": "openai.types.completion.Completion",
"__data__": {
"id": "rec-84cab42e1f5c",
"choices": [
{
"finish_reason": null,
"index": 0,
"logprobs": null,
"text": ","
}
],
"created": 0,
"model": "llama3.2:3b-instruct-fp16",
"object": "text_completion",
"system_fingerprint": "fp_ollama",
"usage": null
}
},
{
"__type__": "openai.types.completion.Completion",
"__data__": {
"id": "rec-84cab42e1f5c",
"choices": [
{
"finish_reason": null,
"index": 0,
"logprobs": null,
"text": " v"
}
],
"created": 0,
"model": "llama3.2:3b-instruct-fp16",
"object": "text_completion",
"system_fingerprint": "fp_ollama",
"usage": null
}
},
{
"__type__": "openai.types.completion.Completion",
"__data__": {
"id": "rec-84cab42e1f5c",
"choices": [
{
"finish_reason": null,
"index": 0,
"logprobs": null,
"text": "io"
}
],
"created": 0,
"model": "llama3.2:3b-instruct-fp16",
"object": "text_completion",
"system_fingerprint": "fp_ollama",
"usage": null
}
},
{
"__type__": "openai.types.completion.Completion",
"__data__": {
"id": "rec-84cab42e1f5c",
"choices": [
{
"finish_reason": null,
"index": 0,
"logprobs": null,
"text": "lets"
}
],
"created": 0,
"model": "llama3.2:3b-instruct-fp16",
"object": "text_completion",
"system_fingerprint": "fp_ollama",
"usage": null
}
},
{
"__type__": "openai.types.completion.Completion",
"__data__": {
"id": "rec-84cab42e1f5c",
"choices": [
{
"finish_reason": null,
"index": 0,
"logprobs": null,
"text": " are"
}
],
"created": 0,
"model": "llama3.2:3b-instruct-fp16",
"object": "text_completion",
"system_fingerprint": "fp_ollama",
"usage": null
}
},
{
"__type__": "openai.types.completion.Completion",
"__data__": {
"id": "rec-84cab42e1f5c",
"choices": [
{
"finish_reason": null,
"index": 0,
"logprobs": null,
"text": "\""
}
],
"created": 0,
"model": "llama3.2:3b-instruct-fp16",
"object": "text_completion",
"system_fingerprint": "fp_ollama",
"usage": null
}
},
{
"__type__": "openai.types.completion.Completion",
"__data__": {
"id": "rec-84cab42e1f5c",
"choices": [
{
"finish_reason": null,
"index": 0,
"logprobs": null,
"text": " \u2013"
}
],
"created": 0,
"model": "llama3.2:3b-instruct-fp16",
"object": "text_completion",
"system_fingerprint": "fp_ollama",
"usage": null
}
},
{
"__type__": "openai.types.completion.Completion",
"__data__": {
"id": "rec-84cab42e1f5c",
"choices": [
{
"finish_reason": null,
"index": 0,
"logprobs": null,
"text": " often"
}
],
"created": 0,
"model": "llama3.2:3b-instruct-fp16",
"object": "text_completion",
"system_fingerprint": "fp_ollama",
"usage": null
}
},
{
"__type__": "openai.types.completion.Completion",
"__data__": {
"id": "rec-84cab42e1f5c",
"choices": [
{
"finish_reason": null,
"index": 0,
"logprobs": null,
"text": " followed"
}
],
"created": 0,
"model": "llama3.2:3b-instruct-fp16",
"object": "text_completion",
"system_fingerprint": "fp_ollama",
"usage": null
}
},
{
"__type__": "openai.types.completion.Completion",
"__data__": {
"id": "rec-84cab42e1f5c",
"choices": [
{
"finish_reason": null,
"index": 0,
"logprobs": null,
"text": " by"
}
],
"created": 0,
"model": "llama3.2:3b-instruct-fp16",
"object": "text_completion",
"system_fingerprint": "fp_ollama",
"usage": null
}
},
{
"__type__": "openai.types.completion.Completion",
"__data__": {
"id": "rec-84cab42e1f5c",
"choices": [
{
"finish_reason": null,
"index": 0,
"logprobs": null,
"text": " the"
}
],
"created": 0,
"model": "llama3.2:3b-instruct-fp16",
"object": "text_completion",
"system_fingerprint": "fp_ollama",
"usage": null
}
},
{
"__type__": "openai.types.completion.Completion",
"__data__": {
"id": "rec-84cab42e1f5c",
"choices": [
{
"finish_reason": null,
"index": 0,
"logprobs": null,
"text": " phrase"
}
],
"created": 0,
"model": "llama3.2:3b-instruct-fp16",
"object": "text_completion",
"system_fingerprint": "fp_ollama",
"usage": null
}
},
{
"__type__": "openai.types.completion.Completion",
"__data__": {
"id": "rec-84cab42e1f5c",
"choices": [
{
"finish_reason": null,
"index": 0,
"logprobs": null,
"text": " \""
}
],
"created": 0,
"model": "llama3.2:3b-instruct-fp16",
"object": "text_completion",
"system_fingerprint": "fp_ollama",
"usage": null
}
},
{
"__type__": "openai.types.completion.Completion",
"__data__": {
"id": "rec-84cab42e1f5c",
"choices": [
{
"finish_reason": null,
"index": 0,
"logprobs": null,
"text": "blue"
}
],
"created": 0,
"model": "llama3.2:3b-instruct-fp16",
"object": "text_completion",
"system_fingerprint": "fp_ollama",
"usage": null
}
},
{
"__type__": "openai.types.completion.Completion",
"__data__": {
"id": "rec-84cab42e1f5c",
"choices": [
{
"finish_reason": null,
"index": 0,
"logprobs": null,
"text": ".\""
}
],
"created": 0,
"model": "llama3.2:3b-instruct-fp16",
"object": "text_completion",
"system_fingerprint": "fp_ollama",
"usage": null
}
},
{
"__type__": "openai.types.completion.Completion",
"__data__": {
"id": "rec-84cab42e1f5c",
"choices": [
{
"finish_reason": null,
"index": 0,
"logprobs": null,
"text": " This"
}
],
"created": 0,
"model": "llama3.2:3b-instruct-fp16",
"object": "text_completion",
"system_fingerprint": "fp_ollama",
"usage": null
}
},
{
"__type__": "openai.types.completion.Completion",
"__data__": {
"id": "rec-84cab42e1f5c",
"choices": [
{
"finish_reason": null,
"index": 0,
"logprobs": null,
"text": " rhyme"
}
],
"created": 0,
"model": "llama3.2:3b-instruct-fp16",
"object": "text_completion",
"system_fingerprint": "fp_ollama",
"usage": null
}
},
{
"__type__": "openai.types.completion.Completion",
"__data__": {
"id": "rec-84cab42e1f5c",
"choices": [
{
"finish_reason": null,
"index": 0,
"logprobs": null,
"text": " has"
}
],
"created": 0,
"model": "llama3.2:3b-instruct-fp16",
"object": "text_completion",
"system_fingerprint": "fp_ollama",
"usage": null
}
},
{
"__type__": "openai.types.completion.Completion",
"__data__": {
"id": "rec-84cab42e1f5c",
"choices": [
{
"finish_reason": null,
"index": 0,
"logprobs": null,
"text": " been"
}
],
"created": 0,
"model": "llama3.2:3b-instruct-fp16",
"object": "text_completion",
"system_fingerprint": "fp_ollama",
"usage": null
}
},
{
"__type__": "openai.types.completion.Completion",
"__data__": {
"id": "rec-84cab42e1f5c",
"choices": [
{
"finish_reason": null,
"index": 0,
"logprobs": null,
"text": " widely"
}
],
"created": 0,
"model": "llama3.2:3b-instruct-fp16",
"object": "text_completion",
"system_fingerprint": "fp_ollama",
"usage": null
}
},
{
"__type__": "openai.types.completion.Completion",
"__data__": {
"id": "rec-84cab42e1f5c",
"choices": [
{
"finish_reason": null,
"index": 0,
"logprobs": null,
"text": " used"
}
],
"created": 0,
"model": "llama3.2:3b-instruct-fp16",
"object": "text_completion",
"system_fingerprint": "fp_ollama",
"usage": null
}
},
{
"__type__": "openai.types.completion.Completion",
"__data__": {
"id": "rec-84cab42e1f5c",
"choices": [
{
"finish_reason": null,
"index": 0,
"logprobs": null,
"text": " in"
}
],
"created": 0,
"model": "llama3.2:3b-instruct-fp16",
"object": "text_completion",
"system_fingerprint": "fp_ollama",
"usage": null
}
},
{
"__type__": "openai.types.completion.Completion",
"__data__": {
"id": "rec-84cab42e1f5c",
"choices": [
{
"finish_reason": null,
"index": 0,
"logprobs": null,
"text": " literature"
}
],
"created": 0,
"model": "llama3.2:3b-instruct-fp16",
"object": "text_completion",
"system_fingerprint": "fp_ollama",
"usage": null
}
},
{
"__type__": "openai.types.completion.Completion",
"__data__": {
"id": "rec-84cab42e1f5c",
"choices": [
{
"finish_reason": null,
"index": 0,
"logprobs": null,
"text": ","
}
],
"created": 0,
"model": "llama3.2:3b-instruct-fp16",
"object": "text_completion",
"system_fingerprint": "fp_ollama",
"usage": null
}
},
{
"__type__": "openai.types.completion.Completion",
"__data__": {
"id": "rec-84cab42e1f5c",
"choices": [
{
"finish_reason": "length",
"index": 0,
"logprobs": null,
"text": ""
}
],
"created": 0,
"model": "llama3.2:3b-instruct-fp16",
"object": "text_completion",
"system_fingerprint": "fp_ollama",
"usage": null
}
}
],
"is_streaming": true
}
}

View file

@ -0,0 +1,43 @@
{
"request": {
"method": "POST",
"url": "http://0.0.0.0:11434/v1/v1/completions",
"headers": {},
"body": {
"model": "llama3.2:3b-instruct-fp16",
"prompt": "Respond to this question and explain your answer. Complete the sentence using one word: Roses are red, violets are ",
"stream": false,
"extra_body": {}
},
"endpoint": "/v1/completions",
"model": "llama3.2:3b-instruct-fp16"
},
"response": {
"body": {
"__type__": "openai.types.completion.Completion",
"__data__": {
"id": "rec-6412295819a1",
"choices": [
{
"finish_reason": "stop",
"index": 0,
"logprobs": null,
"text": "Blue.\n\nMy answer is \"blue\" because it's a classic completion of the traditional nursery rhyme poem:\n\n\"Roses are red, violets are blue\"\n\nThis sentiment suggests that an unseen suitor from the first half of the line has given or will give the speaker roses."
}
],
"created": 0,
"model": "llama3.2:3b-instruct-fp16",
"object": "text_completion",
"system_fingerprint": "fp_ollama",
"usage": {
"completion_tokens": 58,
"prompt_tokens": 50,
"total_tokens": 108,
"completion_tokens_details": null,
"prompt_tokens_details": null
}
}
},
"is_streaming": false
}
}

View file

@ -0,0 +1,78 @@
{
"test_id": "tests/integration/inference/test_openai_completion.py::test_openai_chat_completion_streaming[client_with_models-txt=ollama/llama3.2:3b-instruct-fp16-inference:chat_completion:streaming_02]",
"request": {
"method": "POST",
"url": "http://localhost:11434/api/ps",
"headers": {},
"body": {},
"endpoint": "/api/ps",
"model": ""
},
"response": {
"body": {
"__type__": "ollama._types.ProcessResponse",
"__data__": {
"models": [
{
"model": "llama3.2:3b-instruct-fp16",
"name": "llama3.2:3b-instruct-fp16",
"digest": "195a8c01d91ec3cb1e0aad4624a51f2602c51fa7d96110f8ab5a20c84081804d",
"expires_at": "2025-10-03T20:07:05.551205-07:00",
"size": 7919570944,
"size_vram": 7919570944,
"details": {
"parent_model": "",
"format": "gguf",
"family": "llama",
"families": [
"llama"
],
"parameter_size": "3.2B",
"quantization_level": "F16"
},
"context_length": 4096
},
{
"model": "all-minilm:l6-v2",
"name": "all-minilm:l6-v2",
"digest": "1b226e2802dbb772b5fc32a58f103ca1804ef7501331012de126ab22f67475ef",
"expires_at": "2025-10-03T20:06:55.533878-07:00",
"size": 585846784,
"size_vram": 585846784,
"details": {
"parent_model": "",
"format": "gguf",
"family": "bert",
"families": [
"bert"
],
"parameter_size": "23M",
"quantization_level": "F16"
},
"context_length": 256
},
{
"model": "llama-guard3:1b",
"name": "llama-guard3:1b",
"digest": "494147e06bf99e10dbe67b63a07ac81c162f18ef3341aa3390007ac828571b3b",
"expires_at": "2025-10-03T20:06:23.356289-07:00",
"size": 2350966784,
"size_vram": 2350966784,
"details": {
"parent_model": "",
"format": "gguf",
"family": "llama",
"families": [
"llama"
],
"parameter_size": "1.5B",
"quantization_level": "Q8_0"
},
"context_length": 4096
}
]
}
},
"is_streaming": false
}
}

View file

@ -0,0 +1,421 @@
{
"test_id": "tests/integration/inference/test_openai_embeddings.py::test_openai_embeddings_single_string[llama_stack_client-emb=ollama/all-minilm:l6-v2]",
"request": {
"method": "POST",
"url": "http://0.0.0.0:11434/v1/v1/embeddings",
"headers": {},
"body": {
"model": "all-minilm:l6-v2",
"input": "Hello, world!",
"encoding_format": "float"
},
"endpoint": "/v1/embeddings",
"model": "all-minilm:l6-v2"
},
"response": {
"body": {
"__type__": "openai.types.create_embedding_response.CreateEmbeddingResponse",
"__data__": {
"data": [
{
"embedding": [
-0.038168654,
0.032873917,
-0.0055947267,
0.014366432,
-0.040310103,
-0.116643615,
0.031721067,
0.0019260457,
-0.04255802,
0.029198613,
0.04252229,
0.032184314,
0.029838374,
0.010959321,
-0.053805783,
-0.05028783,
-0.023449864,
0.0107550435,
-0.13774979,
0.0039929547,
0.029302042,
0.066712305,
-0.015410682,
0.048422653,
-0.08814465,
-0.012715775,
0.041334823,
0.040851083,
-0.050064698,
-0.05804616,
0.048728727,
0.06888658,
0.058795262,
0.008804153,
-0.016073612,
0.08514259,
-0.078146815,
-0.07741974,
0.020842256,
0.016201088,
0.032518543,
-0.05346469,
-0.062197812,
-0.024271712,
0.007416788,
0.024103774,
0.006469804,
0.051166162,
0.07284196,
0.034627657,
-0.05475476,
-0.059386417,
-0.0071934434,
0.020163197,
0.035816014,
0.0055927313,
0.010762318,
-0.05274177,
0.010083032,
-0.008742163,
-0.06284565,
0.038426206,
-0.013933317,
0.07342759,
0.09004579,
-0.07995627,
-0.016420787,
0.044767782,
-0.06886435,
-0.03303916,
-0.015482072,
0.011322529,
0.036461752,
0.066346884,
-0.05434455,
0.008740993,
0.012066104,
-0.038101126,
0.0069316486,
0.051146947,
0.07740579,
-0.122950904,
0.016380342,
0.049568996,
0.031634904,
-0.039637603,
0.0016715266,
0.009577405,
-0.032646418,
-0.033988595,
-0.13329837,
0.0072566303,
-0.010266605,
0.038557075,
-0.09338859,
-0.041706774,
0.069941126,
-0.026323376,
-0.14971305,
0.13445398,
0.03748492,
0.052825302,
0.0450506,
0.018712776,
0.05444322,
0.017282845,
-0.032480195,
0.04614526,
-0.046711974,
-0.030566413,
-0.01820007,
-0.04869831,
0.033051647,
-0.0038142777,
0.04999665,
-0.058270358,
-0.010011706,
0.010643473,
-0.040113144,
-0.0015507729,
0.060854245,
-0.045562096,
0.049257778,
0.02612153,
0.01981428,
-0.001660993,
0.059509434,
-6.525298e-33,
0.063519135,
0.0030875143,
0.028961418,
0.1733713,
0.0029763067,
0.027727291,
-0.0951315,
-0.031186627,
0.026689058,
-0.010807322,
0.023850724,
0.023777472,
-0.031174092,
0.049501278,
-0.025049716,
0.10175924,
-0.07919064,
-0.0032249284,
0.042915843,
0.09483459,
-0.06652636,
0.006303593,
0.02220902,
0.06999181,
-0.0074810013,
-0.0017734945,
0.027008688,
-0.07534615,
0.114036545,
0.008552313,
-0.023737878,
-0.04694563,
0.014472103,
0.019855395,
-0.0046694353,
0.0013555645,
-0.034298304,
-0.054142635,
-0.09419824,
-0.028909719,
-0.018876282,
0.0457315,
0.04761082,
-0.0030971593,
-0.033264168,
-0.013539523,
0.051041685,
0.031110944,
0.015244497,
0.054158635,
-0.08499706,
0.013360703,
-0.04759633,
0.07101136,
-0.0131114535,
-0.0023818254,
0.050331973,
-0.041642286,
-0.01419894,
0.032463223,
0.0053973934,
0.091275506,
0.0044798073,
-0.018260129,
-0.015278888,
-0.046306957,
0.038750377,
0.014729783,
0.05204642,
0.0017938613,
-0.014963651,
0.027101943,
0.031203475,
0.023725478,
-0.004601222,
0.03617344,
0.06679477,
-0.0018401983,
0.021265576,
-0.057589985,
0.019155758,
0.031437635,
-0.018444614,
-0.04085069,
0.10393101,
0.011960795,
-0.014898805,
-0.10520497,
-0.012302656,
-0.00043837292,
-0.09508398,
0.058318105,
0.042576887,
-0.025066672,
-0.094555676,
4.0072287e-33,
0.1322281,
0.0053512393,
-0.03312536,
-0.09096454,
-0.031562407,
-0.033949774,
-0.07205118,
0.1259232,
-0.08333555,
0.052797858,
0.001077506,
0.022004265,
0.10402767,
0.013034249,
0.04091762,
0.018705815,
0.11424037,
0.024799824,
0.014582492,
0.006205516,
-0.011202356,
-0.035756435,
-0.03800272,
0.011251353,
-0.0512988,
0.007890417,
0.06736164,
0.0033359542,
-0.09285096,
0.03704081,
-0.022326592,
0.039967872,
-0.030748183,
-0.011446819,
-0.014453254,
0.02498229,
-0.097532175,
-0.035378877,
-0.03757795,
-0.010181498,
-0.06392041,
0.025538994,
0.02061816,
0.03757256,
-0.1043548,
-0.028326731,
-0.05209465,
0.0128473425,
-0.051238894,
-0.029034877,
-0.09633617,
-0.042309195,
0.067165054,
-0.030870603,
-0.010357507,
0.027381465,
-0.028105576,
0.010302046,
0.04306986,
0.022315372,
0.007954779,
0.056068663,
0.04071972,
0.09293905,
0.016536433,
-0.053764775,
0.00047211433,
0.050708972,
0.042510226,
-0.029195962,
0.009274875,
-0.010647389,
-0.037209682,
0.002267011,
-0.030304702,
0.0745741,
0.0026207205,
-0.017582772,
0.0028797672,
0.038404796,
0.00723137,
0.045613218,
0.03998252,
0.014209623,
-0.0142997475,
0.05850862,
0.03630791,
0.055294298,
-0.020075988,
-0.08041808,
-0.030250112,
-0.014920701,
0.022349516,
0.011911506,
-0.06903851,
-1.8806734e-08,
-0.078480355,
0.046674173,
-0.023920896,
0.0634942,
0.02396477,
0.0014517035,
-0.090798445,
-0.06684978,
-0.0801405,
0.005503192,
0.053675175,
0.104841895,
-0.066848256,
0.015522683,
0.067097165,
0.070832625,
-0.03197915,
0.020843629,
-0.0219202,
-0.0073016756,
-0.010645817,
0.0040983153,
0.03313765,
-0.0790081,
0.03878132,
-0.075230986,
-0.015732396,
0.0060099233,
0.0051297406,
-0.061492138,
0.04202211,
0.09544608,
-0.04318599,
0.014424486,
-0.10617826,
-0.027963417,
0.011034413,
0.069576606,
0.06689785,
-0.07479674,
-0.07851099,
0.042766396,
-0.034639932,
-0.10607304,
-0.03577663,
0.051540814,
0.068673156,
-0.049959548,
0.015460458,
-0.064520314,
-0.076010585,
0.026035817,
0.07440218,
-0.012396022,
0.13329679,
0.074770845,
0.05134284,
0.020977058,
-0.026776016,
0.08894323,
0.039937407,
-0.04102053,
0.03194075,
0.018113315
],
"index": 0,
"object": "embedding"
}
],
"model": "all-minilm:l6-v2",
"object": "list",
"usage": {
"prompt_tokens": 4,
"total_tokens": 4
}
}
},
"is_streaming": false
}
}

View file

@ -0,0 +1,78 @@
{
"test_id": "tests/integration/inference/test_openai_completion.py::test_openai_chat_completion_streaming_with_n[client_with_models-txt=ollama/llama3.2:3b-instruct-fp16-inference:chat_completion:streaming_02]",
"request": {
"method": "POST",
"url": "http://localhost:11434/api/ps",
"headers": {},
"body": {},
"endpoint": "/api/ps",
"model": ""
},
"response": {
"body": {
"__type__": "ollama._types.ProcessResponse",
"__data__": {
"models": [
{
"model": "llama3.2:3b-instruct-fp16",
"name": "llama3.2:3b-instruct-fp16",
"digest": "195a8c01d91ec3cb1e0aad4624a51f2602c51fa7d96110f8ab5a20c84081804d",
"expires_at": "2025-10-03T20:07:06.898917-07:00",
"size": 7919570944,
"size_vram": 7919570944,
"details": {
"parent_model": "",
"format": "gguf",
"family": "llama",
"families": [
"llama"
],
"parameter_size": "3.2B",
"quantization_level": "F16"
},
"context_length": 4096
},
{
"model": "all-minilm:l6-v2",
"name": "all-minilm:l6-v2",
"digest": "1b226e2802dbb772b5fc32a58f103ca1804ef7501331012de126ab22f67475ef",
"expires_at": "2025-10-03T20:06:55.533878-07:00",
"size": 585846784,
"size_vram": 585846784,
"details": {
"parent_model": "",
"format": "gguf",
"family": "bert",
"families": [
"bert"
],
"parameter_size": "23M",
"quantization_level": "F16"
},
"context_length": 256
},
{
"model": "llama-guard3:1b",
"name": "llama-guard3:1b",
"digest": "494147e06bf99e10dbe67b63a07ac81c162f18ef3341aa3390007ac828571b3b",
"expires_at": "2025-10-03T20:06:23.356289-07:00",
"size": 2350966784,
"size_vram": 2350966784,
"details": {
"parent_model": "",
"format": "gguf",
"family": "llama",
"families": [
"llama"
],
"parameter_size": "1.5B",
"quantization_level": "Q8_0"
},
"context_length": 4096
}
]
}
},
"is_streaming": false
}
}

View file

@ -0,0 +1,57 @@
{
"test_id": "tests/integration/inference/test_openai_completion.py::test_openai_chat_completion_non_streaming[client_with_models-txt=ollama/llama3.2:3b-instruct-fp16-inference:chat_completion:non_streaming_02]",
"request": {
"method": "POST",
"url": "http://0.0.0.0:11434/v1/v1/chat/completions",
"headers": {},
"body": {
"model": "llama3.2:3b-instruct-fp16",
"messages": [
{
"role": "user",
"content": "Which planet has rings around it with a name starting with letter S?"
}
],
"stream": false
},
"endpoint": "/v1/chat/completions",
"model": "llama3.2:3b-instruct-fp16"
},
"response": {
"body": {
"__type__": "openai.types.chat.chat_completion.ChatCompletion",
"__data__": {
"id": "rec-d94bbf50e754",
"choices": [
{
"finish_reason": "stop",
"index": 0,
"logprobs": null,
"message": {
"content": "You are probably thinking of Saturn. Saturn is the only planet in our solar system with noticeable ring systems, and its main ring system is called the Solar System's S Ring.",
"refusal": null,
"role": "assistant",
"annotations": null,
"audio": null,
"function_call": null,
"tool_calls": null
}
}
],
"created": 0,
"model": "llama3.2:3b-instruct-fp16",
"object": "chat.completion",
"service_tier": null,
"system_fingerprint": "fp_ollama",
"usage": {
"completion_tokens": 36,
"prompt_tokens": 39,
"total_tokens": 75,
"completion_tokens_details": null,
"prompt_tokens_details": null
}
}
},
"is_streaming": false
}
}

View file

@ -0,0 +1,20 @@
{
"test_id": "tests/integration/inference/test_openai_completion.py::test_openai_completion_non_streaming[txt=ollama/llama3.2:3b-instruct-fp16-inference:completion:sanity]",
"request": {
"method": "POST",
"url": "http://localhost:11434/api/ps",
"headers": {},
"body": {},
"endpoint": "/api/ps",
"model": ""
},
"response": {
"body": {
"__type__": "ollama._types.ProcessResponse",
"__data__": {
"models": []
}
},
"is_streaming": false
}
}

View file

@ -0,0 +1,421 @@
{
"test_id": "tests/integration/inference/test_openai_embeddings.py::test_openai_embeddings_different_inputs_different_outputs[llama_stack_client-emb=ollama/all-minilm:l6-v2]",
"request": {
"method": "POST",
"url": "http://0.0.0.0:11434/v1/v1/embeddings",
"headers": {},
"body": {
"model": "all-minilm:l6-v2",
"input": "This is completely different content",
"encoding_format": "float"
},
"endpoint": "/v1/embeddings",
"model": "all-minilm:l6-v2"
},
"response": {
"body": {
"__type__": "openai.types.create_embedding_response.CreateEmbeddingResponse",
"__data__": {
"data": [
{
"embedding": [
0.050927628,
0.038399037,
-0.05559374,
-0.105984606,
0.06944504,
-0.08054001,
-0.025946686,
-0.045175657,
0.068730615,
0.016510814,
-0.0011700827,
0.023414683,
-0.0034143464,
0.06804153,
-0.021997927,
-0.014162646,
0.12356902,
-0.06536738,
-0.082627006,
0.04300477,
-0.039514318,
0.055434275,
-0.008866895,
0.020934915,
0.016280092,
0.09630312,
-0.022835929,
0.09175565,
0.06409549,
-0.06226981,
0.010888244,
0.07833004,
0.08844764,
-0.008459277,
-0.07542651,
0.04800223,
0.0042286967,
0.037884884,
0.0023502677,
0.032233667,
0.0047689923,
-0.070404515,
-0.06513966,
0.061046362,
0.021522248,
0.10113185,
-0.07537441,
-0.04074795,
-0.0055522234,
-0.0037093374,
-0.021283673,
-0.018193243,
-0.03323253,
-0.015658593,
0.0032862085,
0.037399907,
-0.021028537,
0.052572608,
0.10211333,
-0.018634265,
0.03612266,
0.08958185,
0.050681055,
0.019839589,
0.10220134,
-0.059074707,
-0.045562137,
-0.024107283,
-0.059917513,
-0.09795064,
-0.002078402,
0.032211803,
0.04863422,
0.08062527,
0.022614514,
0.0005379622,
-0.0015465368,
0.010018953,
-0.089729026,
0.023838207,
-0.015227461,
-0.020540234,
0.08525423,
-0.08025672,
-0.002200058,
0.0649954,
-0.023069935,
-0.06201302,
-0.06545048,
-0.029986514,
0.0045501734,
0.09718718,
0.09153336,
-0.0059684636,
-0.048185453,
-0.011855243,
-0.03170323,
-0.010363732,
0.029717747,
0.103405535,
-0.029072085,
0.005597891,
-0.03075466,
-0.011073092,
-0.038647823,
-0.01590583,
0.0008562756,
0.03479237,
0.0039463183,
-0.020063022,
-0.048164852,
0.026510539,
-0.061183933,
-0.046969693,
0.02144617,
-0.048452575,
0.02205527,
0.015723849,
0.056344535,
0.055321235,
0.037136998,
-0.08872732,
0.011813868,
0.0064246035,
-0.020590257,
-0.059401207,
0.012338125,
-2.4301395e-33,
0.068363585,
-0.05303797,
0.011494271,
0.06953355,
0.013304427,
0.0020351785,
-0.020783585,
0.028951883,
0.034663863,
-0.03274387,
0.00095708756,
0.008672852,
0.007618213,
-0.024579093,
0.030253874,
-0.034167152,
-0.0315152,
0.1105276,
0.03499844,
0.045135163,
0.00044455956,
0.051429555,
0.015050582,
-0.009024664,
0.023132037,
0.05141033,
-0.00417506,
0.004720958,
-0.016197585,
-0.025692327,
-0.024077175,
-0.00953031,
0.05060433,
-0.058328744,
0.04903431,
0.07964924,
0.03599398,
-0.065374464,
-0.035382472,
-0.07028972,
-0.009750123,
-0.031909473,
-0.04101604,
-0.041144423,
-0.036323845,
0.06685511,
0.016679594,
-0.048498012,
-0.015474575,
-0.00048608257,
0.03267068,
-0.010890426,
0.016646467,
-0.057286758,
0.008073807,
0.008808943,
-0.061580453,
-0.010815387,
0.0717443,
0.08607838,
0.014073375,
0.014896061,
-0.098295614,
-0.046653833,
0.033601493,
0.0647405,
-0.007525925,
0.025440095,
0.04171436,
-0.033113986,
-0.014553822,
0.024878975,
0.045614205,
-0.042929318,
-0.040504646,
-0.06304663,
-0.022389242,
0.010583584,
-0.032525852,
-0.03146621,
0.0081922775,
0.021094568,
0.0095269885,
-0.08290188,
-0.021351986,
0.008777032,
0.060185786,
-0.062182017,
0.004518251,
0.05684528,
-0.013033095,
0.01867297,
-0.008998785,
-0.076766245,
0.051622886,
1.6926977e-33,
-0.12588808,
0.011676749,
-0.079886116,
0.02304184,
0.029238446,
0.08721121,
0.06906221,
0.032533444,
0.047794122,
0.13212898,
0.03129717,
-0.0125368,
0.0035920327,
-0.016413208,
-0.038557872,
0.016005918,
0.09166447,
0.047558285,
-0.054981478,
0.06797876,
0.017968502,
0.118666455,
-0.069318265,
0.043814093,
0.04150938,
-0.017812226,
0.051738504,
0.06795029,
0.080493495,
0.005386888,
0.08878265,
-0.036075104,
-0.07708273,
-0.09101018,
-0.09597232,
-0.0937606,
-0.06200779,
0.06722552,
-0.0006647803,
0.029067127,
0.08179574,
-0.06488274,
-0.050375167,
-0.002403243,
-0.026110265,
-0.007630271,
0.011972527,
-0.08573929,
0.04107404,
0.024723932,
-0.02222756,
-0.11560156,
0.006753066,
-0.04589066,
-0.06369223,
0.053635046,
0.005769477,
0.06325056,
0.0048679966,
-0.057087842,
0.041931894,
0.022344982,
-0.14709935,
0.026361033,
0.106274396,
-0.0059068515,
0.020035667,
0.034950804,
-0.03342695,
-0.03884034,
-0.076072656,
-0.11173452,
-0.038953967,
-0.10270519,
0.04714134,
-0.049391687,
0.074747935,
0.041724026,
-0.031083144,
0.0033830043,
0.055804495,
-0.031882074,
-0.02541756,
0.050101582,
0.035991114,
0.09143438,
-0.07581111,
-0.050589707,
0.0074097887,
-0.0014020415,
-0.05036443,
-0.0015289022,
0.005471816,
0.07689256,
0.014164922,
-1.8297508e-08,
0.029913928,
-0.057959806,
-0.06846765,
0.026196472,
-0.0035178436,
0.11374637,
0.056845777,
-0.09315407,
0.0027757618,
0.10895455,
-0.033027817,
0.005051668,
-0.043633904,
-0.048978273,
0.011912417,
0.059747256,
-0.08661686,
-0.052748058,
0.026321623,
0.042173225,
-0.0035451513,
0.03797019,
0.022595786,
-0.0614702,
0.01268269,
0.040893063,
-0.084825225,
0.041167296,
-0.038163006,
0.008364558,
0.01014753,
0.024994388,
-0.012504467,
-0.045078665,
0.0102669485,
-0.046302866,
0.061438397,
0.016235871,
-0.0011558776,
0.007455159,
-0.019448454,
-0.06798961,
0.05472832,
0.09646006,
-0.04711737,
0.060088705,
0.0030213061,
-0.08877283,
0.037262574,
-0.009947699,
0.0035697597,
-0.07833652,
0.02169359,
-0.013075168,
0.072521746,
-0.0649658,
-0.029920656,
-0.017777385,
0.033904497,
0.02919506,
0.08793891,
0.008437021,
0.064442866,
-0.01656208
],
"index": 0,
"object": "embedding"
}
],
"model": "all-minilm:l6-v2",
"object": "list",
"usage": {
"prompt_tokens": 5,
"total_tokens": 5
}
}
},
"is_streaming": false
}
}

View file

@ -0,0 +1,78 @@
{
"test_id": "tests/integration/inference/test_openai_embeddings.py::test_openai_embeddings_multiple_strings[llama_stack_client-emb=ollama/all-minilm:l6-v2]",
"request": {
"method": "POST",
"url": "http://localhost:11434/api/ps",
"headers": {},
"body": {},
"endpoint": "/api/ps",
"model": ""
},
"response": {
"body": {
"__type__": "ollama._types.ProcessResponse",
"__data__": {
"models": [
{
"model": "all-minilm:l6-v2",
"name": "all-minilm:l6-v2",
"digest": "1b226e2802dbb772b5fc32a58f103ca1804ef7501331012de126ab22f67475ef",
"expires_at": "2025-10-03T20:06:54.969937-07:00",
"size": 585846784,
"size_vram": 585846784,
"details": {
"parent_model": "",
"format": "gguf",
"family": "bert",
"families": [
"bert"
],
"parameter_size": "23M",
"quantization_level": "F16"
},
"context_length": 256
},
{
"model": "llama3.2:3b-instruct-fp16",
"name": "llama3.2:3b-instruct-fp16",
"digest": "195a8c01d91ec3cb1e0aad4624a51f2602c51fa7d96110f8ab5a20c84081804d",
"expires_at": "2025-10-03T20:06:54.261283-07:00",
"size": 7919570944,
"size_vram": 7919570944,
"details": {
"parent_model": "",
"format": "gguf",
"family": "llama",
"families": [
"llama"
],
"parameter_size": "3.2B",
"quantization_level": "F16"
},
"context_length": 4096
},
{
"model": "llama-guard3:1b",
"name": "llama-guard3:1b",
"digest": "494147e06bf99e10dbe67b63a07ac81c162f18ef3341aa3390007ac828571b3b",
"expires_at": "2025-10-03T20:06:23.356289-07:00",
"size": 2350966784,
"size_vram": 2350966784,
"details": {
"parent_model": "",
"format": "gguf",
"family": "llama",
"families": [
"llama"
],
"parameter_size": "1.5B",
"quantization_level": "Q8_0"
},
"context_length": 4096
}
]
}
},
"is_streaming": false
}
}

View file

@ -0,0 +1,97 @@
{
"request": {
"method": "POST",
"url": "http://0.0.0.0:11434/v1/v1/chat/completions",
"headers": {},
"body": {
"model": "llama3.2:3b-instruct-fp16",
"messages": [
{
"role": "user",
"content": "Calculate 5 + 3"
}
],
"tools": [
{
"type": "function",
"function": {
"name": "calculate",
"description": "",
"parameters": {
"properties": {
"x": {
"title": "X",
"type": "number"
},
"y": {
"title": "Y",
"type": "number"
},
"operation": {
"title": "Operation",
"type": "string"
}
},
"required": [
"x",
"y",
"operation"
],
"title": "calculateArguments",
"type": "object"
}
}
}
]
},
"endpoint": "/v1/chat/completions",
"model": "llama3.2:3b-instruct-fp16"
},
"response": {
"body": {
"__type__": "openai.types.chat.chat_completion.ChatCompletion",
"__data__": {
"id": "rec-cca0267555a6",
"choices": [
{
"finish_reason": "tool_calls",
"index": 0,
"logprobs": null,
"message": {
"content": "",
"refusal": null,
"role": "assistant",
"annotations": null,
"audio": null,
"function_call": null,
"tool_calls": [
{
"id": "call_px63ad04",
"function": {
"arguments": "{\"operation\":\"+\",\"x\":\"5\",\"y\":\"3\"}",
"name": "calculate"
},
"type": "function",
"index": 0
}
]
}
}
],
"created": 0,
"model": "llama3.2:3b-instruct-fp16",
"object": "chat.completion",
"service_tier": null,
"system_fingerprint": "fp_ollama",
"usage": {
"completion_tokens": 27,
"prompt_tokens": 172,
"total_tokens": 199,
"completion_tokens_details": null,
"prompt_tokens_details": null
}
}
},
"is_streaming": false
}
}

View file

@ -0,0 +1,78 @@
{
"test_id": "tests/integration/inference/test_openai_embeddings.py::test_openai_embeddings_with_user_parameter[llama_stack_client-emb=ollama/all-minilm:l6-v2]",
"request": {
"method": "POST",
"url": "http://localhost:11434/api/ps",
"headers": {},
"body": {},
"endpoint": "/api/ps",
"model": ""
},
"response": {
"body": {
"__type__": "ollama._types.ProcessResponse",
"__data__": {
"models": [
{
"model": "all-minilm:l6-v2",
"name": "all-minilm:l6-v2",
"digest": "1b226e2802dbb772b5fc32a58f103ca1804ef7501331012de126ab22f67475ef",
"expires_at": "2025-10-03T20:06:55.245344-07:00",
"size": 585846784,
"size_vram": 585846784,
"details": {
"parent_model": "",
"format": "gguf",
"family": "bert",
"families": [
"bert"
],
"parameter_size": "23M",
"quantization_level": "F16"
},
"context_length": 256
},
{
"model": "llama3.2:3b-instruct-fp16",
"name": "llama3.2:3b-instruct-fp16",
"digest": "195a8c01d91ec3cb1e0aad4624a51f2602c51fa7d96110f8ab5a20c84081804d",
"expires_at": "2025-10-03T20:06:54.261283-07:00",
"size": 7919570944,
"size_vram": 7919570944,
"details": {
"parent_model": "",
"format": "gguf",
"family": "llama",
"families": [
"llama"
],
"parameter_size": "3.2B",
"quantization_level": "F16"
},
"context_length": 4096
},
{
"model": "llama-guard3:1b",
"name": "llama-guard3:1b",
"digest": "494147e06bf99e10dbe67b63a07ac81c162f18ef3341aa3390007ac828571b3b",
"expires_at": "2025-10-03T20:06:23.356289-07:00",
"size": 2350966784,
"size_vram": 2350966784,
"details": {
"parent_model": "",
"format": "gguf",
"family": "llama",
"families": [
"llama"
],
"parameter_size": "1.5B",
"quantization_level": "Q8_0"
},
"context_length": 4096
}
]
}
},
"is_streaming": false
}
}

View file

@ -0,0 +1,78 @@
{
"test_id": "tests/integration/inference/test_openai_completion.py::test_inference_store[client_with_models-txt=ollama/llama3.2:3b-instruct-fp16-False]",
"request": {
"method": "POST",
"url": "http://localhost:11434/api/ps",
"headers": {},
"body": {},
"endpoint": "/api/ps",
"model": ""
},
"response": {
"body": {
"__type__": "ollama._types.ProcessResponse",
"__data__": {
"models": [
{
"model": "llama3.2:3b-instruct-fp16",
"name": "llama3.2:3b-instruct-fp16",
"digest": "195a8c01d91ec3cb1e0aad4624a51f2602c51fa7d96110f8ab5a20c84081804d",
"expires_at": "2025-10-03T20:07:06.898917-07:00",
"size": 7919570944,
"size_vram": 7919570944,
"details": {
"parent_model": "",
"format": "gguf",
"family": "llama",
"families": [
"llama"
],
"parameter_size": "3.2B",
"quantization_level": "F16"
},
"context_length": 4096
},
{
"model": "all-minilm:l6-v2",
"name": "all-minilm:l6-v2",
"digest": "1b226e2802dbb772b5fc32a58f103ca1804ef7501331012de126ab22f67475ef",
"expires_at": "2025-10-03T20:06:55.533878-07:00",
"size": 585846784,
"size_vram": 585846784,
"details": {
"parent_model": "",
"format": "gguf",
"family": "bert",
"families": [
"bert"
],
"parameter_size": "23M",
"quantization_level": "F16"
},
"context_length": 256
},
{
"model": "llama-guard3:1b",
"name": "llama-guard3:1b",
"digest": "494147e06bf99e10dbe67b63a07ac81c162f18ef3341aa3390007ac828571b3b",
"expires_at": "2025-10-03T20:06:23.356289-07:00",
"size": 2350966784,
"size_vram": 2350966784,
"details": {
"parent_model": "",
"format": "gguf",
"family": "llama",
"families": [
"llama"
],
"parameter_size": "1.5B",
"quantization_level": "Q8_0"
},
"context_length": 4096
}
]
}
},
"is_streaming": false
}
}