Minor fix: pass the model's provider_resource_id to ChatCompletionRequest

This commit is contained in:
Jinan Zhou 2024-11-20 23:41:36 +00:00
parent 111e32ffe5
commit f2ac4e2a94

View file

@@ -73,8 +73,9 @@ class NutanixInferenceAdapter(ModelRegistryHelper, Inference):
stream: Optional[bool] = False,
logprobs: Optional[LogProbConfig] = None,
) -> AsyncGenerator:
model = await self.model_store.get_model(model_id)
request = ChatCompletionRequest(
model=model,
model=model.provider_resource_id,
messages=messages,
sampling_params=sampling_params,
tools=tools or [],