refine

2025-08-11 12:38:02 +00:00 · 2025-03-11 20:46:19 -07:00 · 2025-03-11 20:46:19 -07:00 · 8667b137f6
commit 8667b137f6
parent 3ca640be7f
1 changed file with 5 additions and 0 deletions
--- a/llama_stack/providers/remote/inference/passthrough/passthrough.py
+++ b/llama_stack/providers/remote/inference/passthrough/passthrough.py
@@ -159,7 +159,10 @@ class PassthroughInferenceAdapter(Inference):
    async def _nonstream_chat_completion(self, json_params: Dict[str, Any]) -> ChatCompletionResponse:
        client = self._get_client()
        response = await client.inference.chat_completion(**json_params)
+
        response = response.to_dict()
+
+        # temporary hack: overwrite the response's metrics with an empty list
        response["metrics"] = []

        return convert_to_pydantic(ChatCompletionResponse, response)
@@ -170,6 +173,8 @@ class PassthroughInferenceAdapter(Inference):

        async for chunk in stream_response:
            chunk = chunk.to_dict()
+
+            # temporary hack: overwrite each chunk's metrics with an empty list
            chunk["metrics"] = []
            chunk = convert_to_pydantic(ChatCompletionResponseStreamChunk, chunk)
            yield chunk