Mirror of https://github.com/meta-llama/llama-stack.git
test

# What does this PR do?

## Test Plan
Commit 1e891489a8 (parent 96886afaca)
13 changed files with 170 additions and 4 deletions
@@ -277,6 +277,7 @@ class InferenceRouter(Inference):
         top_logprobs: int | None = None,
         top_p: float | None = None,
         user: str | None = None,
+        **kwargs: Any,
     ) -> OpenAIChatCompletion | AsyncIterator[OpenAIChatCompletionChunk]:
         logger.debug(
             f"InferenceRouter.openai_chat_completion: {model=}, {stream=}, {messages=}",
@@ -323,6 +324,7 @@ class InferenceRouter(Inference):
             top_logprobs=top_logprobs,
             top_p=top_p,
             user=user,
+            **kwargs,
         )
         provider = await self.routing_table.get_provider_impl(model_obj.identifier)
         if stream:
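Based on the hunks above, the change appears to add a `**kwargs` parameter to `InferenceRouter.openai_chat_completion` and forward it to the request that reaches the provider, so keyword arguments the router does not model explicitly are passed through rather than dropped. Below is a minimal sketch of that passthrough pattern; `ToyRouter` and `ToyProvider` are hypothetical stand-ins for illustration, not the actual llama-stack classes.

```python
import asyncio
from typing import Any


class ToyProvider:
    """Hypothetical provider implementation; not the actual llama-stack provider class."""

    async def openai_chat_completion(self, model: str, messages: list[dict], **kwargs: Any) -> dict:
        # A real provider would forward kwargs (e.g. vendor-specific sampling options) to its backend.
        return {"model": model, "extra_params": kwargs}


class ToyRouter:
    """Hypothetical router showing the **kwargs passthrough pattern from the diff above."""

    def __init__(self, provider: ToyProvider) -> None:
        self.provider = provider

    async def openai_chat_completion(
        self,
        model: str,
        messages: list[dict],
        user: str | None = None,
        **kwargs: Any,  # extra keyword arguments are forwarded rather than rejected
    ) -> dict:
        return await self.provider.openai_chat_completion(model=model, messages=messages, **kwargs)


async def main() -> None:
    router = ToyRouter(ToyProvider())
    # `top_k` is not an explicit router parameter, but it still reaches the provider via **kwargs.
    result = await router.openai_chat_completion(
        model="example-model",
        messages=[{"role": "user", "content": "hi"}],
        top_k=5,
    )
    print(result)


if __name__ == "__main__":
    asyncio.run(main())
```

The design choice here is to keep the router signature stable while still letting provider-specific parameters flow through end to end.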