completion() for tgi (#295)

2024-10-24 16:02:41 -07:00 · 2024-10-24 16:02:41 -07:00 · 3e1c3fdb3f
commit 3e1c3fdb3f
parent cb84034567
9 changed files with 173 additions and 35 deletions
--- a/llama_stack/providers/adapters/inference/together/together.py
+++ b/llama_stack/providers/adapters/inference/together/together.py
@@ -131,7 +131,7 @@ class TogetherInferenceAdapter(
            yield chunk

    def _get_params(self, request: ChatCompletionRequest) -> dict:
-        options = get_sampling_options(request)
+        options = get_sampling_options(request.sampling_params)
        if fmt := request.response_format:
            if fmt.type == ResponseFormatType.json_schema.value:
                options["response_format"] = {