Minor fix: look up the model via the model store and pass its provider_resource_id to ChatCompletionRequest

This commit is contained in:
Jinan Zhou 2024-11-20 23:41:36 +00:00
parent 111e32ffe5
commit f2ac4e2a94

View file

@@ -73,8 +73,9 @@ class NutanixInferenceAdapter(ModelRegistryHelper, Inference):
stream: Optional[bool] = False, stream: Optional[bool] = False,
logprobs: Optional[LogProbConfig] = None, logprobs: Optional[LogProbConfig] = None,
) -> AsyncGenerator: ) -> AsyncGenerator:
model = await self.model_store.get_model(model_id)
request = ChatCompletionRequest( request = ChatCompletionRequest(
model=model, model=model.provider_resource_id,
messages=messages, messages=messages,
sampling_params=sampling_params, sampling_params=sampling_params,
tools=tools or [], tools=tools or [],