mirror of
https://github.com/meta-llama/llama-stack.git
synced 2025-10-14 06:23:45 +00:00
# What does this PR do? Allows passing through extra_body parameters to inference providers. closes #2720 ## Test Plan CI and added new test
80 lines
1.9 KiB
JSON
80 lines
1.9 KiB
JSON
{
|
|
"test_id": null,
|
|
"request": {
|
|
"method": "POST",
|
|
"url": "http://0.0.0.0:11434/v1/v1/models",
|
|
"headers": {},
|
|
"body": {},
|
|
"endpoint": "/v1/models",
|
|
"model": ""
|
|
},
|
|
"response": {
|
|
"body": [
|
|
{
|
|
"__type__": "openai.types.model.Model",
|
|
"__data__": {
|
|
"id": "llama3.2-vision:11b",
|
|
"created": 1759959879,
|
|
"object": "model",
|
|
"owned_by": "library"
|
|
}
|
|
},
|
|
{
|
|
"__type__": "openai.types.model.Model",
|
|
"__data__": {
|
|
"id": "nomic-embed-text:latest",
|
|
"created": 1754610899,
|
|
"object": "model",
|
|
"owned_by": "library"
|
|
}
|
|
},
|
|
{
|
|
"__type__": "openai.types.model.Model",
|
|
"__data__": {
|
|
"id": "llama-guard3:1b",
|
|
"created": 1754088388,
|
|
"object": "model",
|
|
"owned_by": "library"
|
|
}
|
|
},
|
|
{
|
|
"__type__": "openai.types.model.Model",
|
|
"__data__": {
|
|
"id": "all-minilm:l6-v2",
|
|
"created": 1753826826,
|
|
"object": "model",
|
|
"owned_by": "library"
|
|
}
|
|
},
|
|
{
|
|
"__type__": "openai.types.model.Model",
|
|
"__data__": {
|
|
"id": "all-minilm:latest",
|
|
"created": 1749064003,
|
|
"object": "model",
|
|
"owned_by": "library"
|
|
}
|
|
},
|
|
{
|
|
"__type__": "openai.types.model.Model",
|
|
"__data__": {
|
|
"id": "llama3.1:8b-instruct-fp16",
|
|
"created": 1739575404,
|
|
"object": "model",
|
|
"owned_by": "library"
|
|
}
|
|
},
|
|
{
|
|
"__type__": "openai.types.model.Model",
|
|
"__data__": {
|
|
"id": "llama3.2:3b-instruct-fp16",
|
|
"created": 1737496003,
|
|
"object": "model",
|
|
"owned_by": "library"
|
|
}
|
|
}
|
|
],
|
|
"is_streaming": false
|
|
},
|
|
"id_normalization_mapping": {}
|
|
}
|