nvidia fix

This commit is contained in:
Xi Yan 2025-01-15 17:26:31 -08:00
parent 965644ce68
commit 5cce5a1f78
5 changed files with 355 additions and 262 deletions

View file

@@ -279,7 +279,6 @@ def convert_chat_completion_request(
nvext.update(top_k=strategy.top_k)
elif isinstance(strategy, GreedySamplingStrategy):
nvext.update(top_k=-1)
payload.update(temperature=strategy.temperature)
else:
raise ValueError(f"Unsupported sampling strategy: {strategy}")