mirror of
https://github.com/meta-llama/llama-stack.git
synced 2026-01-02 04:10:01 +00:00
nvidia fix
This commit is contained in:
parent
965644ce68
commit
5cce5a1f78
5 changed files with 355 additions and 262 deletions
|
|
@@ -279,7 +279,6 @@ def convert_chat_completion_request(
|
|||
nvext.update(top_k=strategy.top_k)
|
||||
elif isinstance(strategy, GreedySamplingStrategy):
|
||||
nvext.update(top_k=-1)
|
||||
payload.update(temperature=strategy.temperature)
|
||||
else:
|
||||
raise ValueError(f"Unsupported sampling strategy: {strategy}")
|
||||
|
||||
|
|
|
|||
Loading…
Add table
Add a link
Reference in a new issue