In progress: Add NVIDIA e2e notebook

This commit is contained in:
Jash Gulabrai 2025-04-03 11:19:43 -04:00
parent 66d6c2580e
commit 861962fa80
18 changed files with 4888 additions and 7 deletions

View file

@@ -243,7 +243,7 @@ class NVIDIAInferenceAdapter(Inference, ModelRegistryHelper):
provider_model_id = self.get_provider_model_id(model_id)
request = await convert_chat_completion_request(
request=ChatCompletionRequest(
-model=self.get_provider_model_id(model_id),
+model=provider_model_id,
messages=messages,
sampling_params=sampling_params,
response_format=response_format,