mirror of
https://github.com/meta-llama/llama-stack.git
synced 2025-12-19 04:29:40 +00:00
add chat completion support for JsonSchemaResponseFormat request_format
This commit is contained in:
parent
a6f47f1090
commit
e6b82a44eb
3 changed files with 18 additions and 0 deletions
|
|
@ -159,6 +159,7 @@ class NVIDIAInferenceAdapter(Inference, ModelRegistryHelper):
|
|||
model=self.get_provider_model_id(model_id),
|
||||
messages=messages,
|
||||
sampling_params=sampling_params,
|
||||
response_format=response_format,
|
||||
tools=tools,
|
||||
tool_choice=tool_choice,
|
||||
tool_prompt_format=tool_prompt_format,
|
||||
|
|
|
|||
Loading…
Add table
Add a link
Reference in a new issue