diff --git a/docs/static/llama-stack-spec.html b/docs/static/llama-stack-spec.html
index 9e28e0f42..c7e2b5ea2 100644
--- a/docs/static/llama-stack-spec.html
+++ b/docs/static/llama-stack-spec.html
@@ -427,7 +427,7 @@
}
}
},
- "/v1/openai/v1/responses": {
+ "/v1/responses": {
"get": {
"responses": {
"200": {
@@ -809,7 +809,7 @@
]
}
},
- "/v1/openai/v1/responses/{response_id}": {
+ "/v1/responses/{response_id}": {
"get": {
"responses": {
"200": {
@@ -1478,7 +1478,7 @@
]
}
},
- "/v1/openai/v1/chat/completions/{completion_id}": {
+ "/v1/chat/completions/{completion_id}": {
"get": {
"responses": {
"200": {
@@ -3193,7 +3193,7 @@
}
}
},
- "/v1/openai/v1/chat/completions": {
+ "/v1/chat/completions": {
"get": {
"responses": {
"200": {
@@ -3393,11 +3393,11 @@
"get": {
"responses": {
"200": {
- "description": "A ListModelsResponse.",
+ "description": "A OpenAIListModelsResponse.",
"content": {
"application/json": {
"schema": {
- "$ref": "#/components/schemas/ListModelsResponse"
+ "$ref": "#/components/schemas/OpenAIListModelsResponse"
}
}
}
@@ -3418,8 +3418,8 @@
"tags": [
"Models"
],
- "summary": "List all models.",
- "description": "List all models.",
+ "summary": "List models using the OpenAI API.",
+ "description": "List models using the OpenAI API.",
"parameters": []
},
"post": {
@@ -3465,7 +3465,7 @@
}
}
},
- "/v1/openai/v1/responses/{response_id}/input_items": {
+ "/v1/responses/{response_id}/input_items": {
"get": {
"responses": {
"200": {
@@ -4093,7 +4093,7 @@
}
}
},
- "/v1/openai/v1/vector_stores/{vector_store_id}/files": {
+ "/v1/vector_stores/{vector_store_id}/files": {
"get": {
"responses": {
"200": {
@@ -4234,7 +4234,7 @@
}
}
},
- "/v1/openai/v1/completions": {
+ "/v1/completions": {
"post": {
"responses": {
"200": {
@@ -4278,7 +4278,7 @@
}
}
},
- "/v1/openai/v1/vector_stores": {
+ "/v1/vector_stores": {
"get": {
"responses": {
"200": {
@@ -4391,7 +4391,7 @@
}
}
},
- "/v1/openai/v1/files/{file_id}": {
+ "/v1/files/{file_id}": {
"get": {
"responses": {
"200": {
@@ -4477,7 +4477,7 @@
]
}
},
- "/v1/openai/v1/vector_stores/{vector_store_id}": {
+ "/v1/vector_stores/{vector_store_id}": {
"get": {
"responses": {
"200": {
@@ -4615,7 +4615,7 @@
]
}
},
- "/v1/openai/v1/vector_stores/{vector_store_id}/files/{file_id}": {
+ "/v1/vector_stores/{vector_store_id}/files/{file_id}": {
"get": {
"responses": {
"200": {
@@ -4780,7 +4780,7 @@
]
}
},
- "/v1/openai/v1/embeddings": {
+ "/v1/embeddings": {
"post": {
"responses": {
"200": {
@@ -4824,7 +4824,7 @@
}
}
},
- "/v1/openai/v1/files": {
+ "/v1/files": {
"get": {
"responses": {
"200": {
@@ -4972,41 +4972,7 @@
}
}
},
- "/v1/openai/v1/models": {
- "get": {
- "responses": {
- "200": {
- "description": "A OpenAIListModelsResponse.",
- "content": {
- "application/json": {
- "schema": {
- "$ref": "#/components/schemas/OpenAIListModelsResponse"
- }
- }
- }
- },
- "400": {
- "$ref": "#/components/responses/BadRequest400"
- },
- "429": {
- "$ref": "#/components/responses/TooManyRequests429"
- },
- "500": {
- "$ref": "#/components/responses/InternalServerError500"
- },
- "default": {
- "$ref": "#/components/responses/DefaultError"
- }
- },
- "tags": [
- "Models"
- ],
- "summary": "List models using the OpenAI API.",
- "description": "List models using the OpenAI API.",
- "parameters": []
- }
- },
- "/v1/openai/v1/files/{file_id}/content": {
+ "/v1/files/{file_id}/content": {
"get": {
"responses": {
"200": {
@@ -5050,7 +5016,7 @@
]
}
},
- "/v1/openai/v1/vector_stores/{vector_store_id}/files/{file_id}/content": {
+ "/v1/vector_stores/{vector_store_id}/files/{file_id}/content": {
"get": {
"responses": {
"200": {
@@ -5103,7 +5069,7 @@
]
}
},
- "/v1/openai/v1/vector_stores/{vector_store_id}/search": {
+ "/v1/vector_stores/{vector_store_id}/search": {
"post": {
"responses": {
"200": {
@@ -5704,7 +5670,7 @@
}
}
},
- "/v1/openai/v1/moderations": {
+ "/v1/moderations": {
"post": {
"responses": {
"200": {
diff --git a/docs/static/llama-stack-spec.yaml b/docs/static/llama-stack-spec.yaml
index 1c06c74a5..fc6114e43 100644
--- a/docs/static/llama-stack-spec.yaml
+++ b/docs/static/llama-stack-spec.yaml
@@ -286,7 +286,7 @@ paths:
schema:
$ref: '#/components/schemas/CreateAgentTurnRequest'
required: true
- /v1/openai/v1/responses:
+ /v1/responses:
get:
responses:
'200':
@@ -558,7 +558,7 @@ paths:
required: true
schema:
type: string
- /v1/openai/v1/responses/{response_id}:
+ /v1/responses/{response_id}:
get:
responses:
'200':
@@ -1033,7 +1033,7 @@ paths:
required: true
schema:
type: string
- /v1/openai/v1/chat/completions/{completion_id}:
+ /v1/chat/completions/{completion_id}:
get:
responses:
'200':
@@ -2259,7 +2259,7 @@ paths:
schema:
$ref: '#/components/schemas/RegisterBenchmarkRequest'
required: true
- /v1/openai/v1/chat/completions:
+ /v1/chat/completions:
get:
responses:
'200':
@@ -2403,11 +2403,11 @@ paths:
get:
responses:
'200':
- description: A ListModelsResponse.
+ description: A OpenAIListModelsResponse.
content:
application/json:
schema:
- $ref: '#/components/schemas/ListModelsResponse'
+ $ref: '#/components/schemas/OpenAIListModelsResponse'
'400':
$ref: '#/components/responses/BadRequest400'
'429':
@@ -2420,8 +2420,8 @@ paths:
$ref: '#/components/responses/DefaultError'
tags:
- Models
- summary: List all models.
- description: List all models.
+ summary: List models using the OpenAI API.
+ description: List models using the OpenAI API.
parameters: []
post:
responses:
@@ -2452,7 +2452,7 @@ paths:
schema:
$ref: '#/components/schemas/RegisterModelRequest'
required: true
- /v1/openai/v1/responses/{response_id}/input_items:
+ /v1/responses/{response_id}/input_items:
get:
responses:
'200':
@@ -2906,7 +2906,7 @@ paths:
schema:
$ref: '#/components/schemas/LogEventRequest'
required: true
- /v1/openai/v1/vector_stores/{vector_store_id}/files:
+ /v1/vector_stores/{vector_store_id}/files:
get:
responses:
'200':
@@ -3015,7 +3015,7 @@ paths:
schema:
$ref: '#/components/schemas/OpenaiAttachFileToVectorStoreRequest'
required: true
- /v1/openai/v1/completions:
+ /v1/completions:
post:
responses:
'200':
@@ -3049,7 +3049,7 @@ paths:
schema:
$ref: '#/components/schemas/OpenaiCompletionRequest'
required: true
- /v1/openai/v1/vector_stores:
+ /v1/vector_stores:
get:
responses:
'200':
@@ -3136,7 +3136,7 @@ paths:
schema:
$ref: '#/components/schemas/OpenaiCreateVectorStoreRequest'
required: true
- /v1/openai/v1/files/{file_id}:
+ /v1/files/{file_id}:
get:
responses:
'200':
@@ -3201,7 +3201,7 @@ paths:
required: true
schema:
type: string
- /v1/openai/v1/vector_stores/{vector_store_id}:
+ /v1/vector_stores/{vector_store_id}:
get:
responses:
'200':
@@ -3298,7 +3298,7 @@ paths:
required: true
schema:
type: string
- /v1/openai/v1/vector_stores/{vector_store_id}/files/{file_id}:
+ /v1/vector_stores/{vector_store_id}/files/{file_id}:
get:
responses:
'200':
@@ -3416,7 +3416,7 @@ paths:
required: true
schema:
type: string
- /v1/openai/v1/embeddings:
+ /v1/embeddings:
post:
responses:
'200':
@@ -3451,7 +3451,7 @@ paths:
schema:
$ref: '#/components/schemas/OpenaiEmbeddingsRequest'
required: true
- /v1/openai/v1/files:
+ /v1/files:
get:
responses:
'200':
@@ -3572,31 +3572,7 @@ paths:
- expires_after_anchor
- expires_after_seconds
required: true
- /v1/openai/v1/models:
- get:
- responses:
- '200':
- description: A OpenAIListModelsResponse.
- content:
- application/json:
- schema:
- $ref: '#/components/schemas/OpenAIListModelsResponse'
- '400':
- $ref: '#/components/responses/BadRequest400'
- '429':
- $ref: >-
- #/components/responses/TooManyRequests429
- '500':
- $ref: >-
- #/components/responses/InternalServerError500
- default:
- $ref: '#/components/responses/DefaultError'
- tags:
- - Models
- summary: List models using the OpenAI API.
- description: List models using the OpenAI API.
- parameters: []
- /v1/openai/v1/files/{file_id}/content:
+ /v1/files/{file_id}/content:
get:
responses:
'200':
@@ -3630,7 +3606,7 @@ paths:
required: true
schema:
type: string
- /v1/openai/v1/vector_stores/{vector_store_id}/files/{file_id}/content:
+ /v1/vector_stores/{vector_store_id}/files/{file_id}/content:
get:
responses:
'200':
@@ -3670,7 +3646,7 @@ paths:
required: true
schema:
type: string
- /v1/openai/v1/vector_stores/{vector_store_id}/search:
+ /v1/vector_stores/{vector_store_id}/search:
post:
responses:
'200':
@@ -4098,7 +4074,7 @@ paths:
schema:
$ref: '#/components/schemas/RunEvalRequest'
required: true
- /v1/openai/v1/moderations:
+ /v1/moderations:
post:
responses:
'200':
diff --git a/llama_stack/apis/vector_io/vector_io.py b/llama_stack/apis/vector_io/vector_io.py
index 6371880ed..cea2a6917 100644
--- a/llama_stack/apis/vector_io/vector_io.py
+++ b/llama_stack/apis/vector_io/vector_io.py
@@ -625,9 +625,7 @@ class VectorIO(Protocol):
"""
...
- @webmethod(
- route="/vector_stores/{vector_store_id}/files/{file_id}", method="GET", level=LLAMA_STACK_API_V1
- )
+ @webmethod(route="/vector_stores/{vector_store_id}/files/{file_id}", method="GET", level=LLAMA_STACK_API_V1)
async def openai_retrieve_vector_store_file(
self,
vector_store_id: str,
@@ -659,9 +657,7 @@ class VectorIO(Protocol):
"""
...
- @webmethod(
- route="/vector_stores/{vector_store_id}/files/{file_id}", method="POST", level=LLAMA_STACK_API_V1
- )
+ @webmethod(route="/vector_stores/{vector_store_id}/files/{file_id}", method="POST", level=LLAMA_STACK_API_V1)
async def openai_update_vector_store_file(
self,
vector_store_id: str,
@@ -677,9 +673,7 @@ class VectorIO(Protocol):
"""
...
- @webmethod(
- route="/vector_stores/{vector_store_id}/files/{file_id}", method="DELETE", level=LLAMA_STACK_API_V1
- )
+ @webmethod(route="/vector_stores/{vector_store_id}/files/{file_id}", method="DELETE", level=LLAMA_STACK_API_V1)
async def openai_delete_vector_store_file(
self,
vector_store_id: str,