From 73b51308d3600d266cd88d78adeebdc09f5d45e0 Mon Sep 17 00:00:00 2001
From: seyeong-han
Date: Sun, 24 Nov 2024 01:31:47 -0600
Subject: [PATCH] fix: model to model_id

---
 .../providers/remote/inference/ssambanova/ssambanova.py | 8 ++++----
 1 file changed, 4 insertions(+), 4 deletions(-)

diff --git a/llama_stack/providers/remote/inference/ssambanova/ssambanova.py b/llama_stack/providers/remote/inference/ssambanova/ssambanova.py
index c25e5ffe5..39e2abf34 100644
--- a/llama_stack/providers/remote/inference/ssambanova/ssambanova.py
+++ b/llama_stack/providers/remote/inference/ssambanova/ssambanova.py
@@ -74,7 +74,7 @@ class SsambanovaInferenceAdapter(ModelRegistryHelper, Inference):
 
     async def completion(
         self,
-        model: str,
+        model_id: str,
         content: InterleavedTextMedia,
         sampling_params: Optional[SamplingParams] = SamplingParams(),
         response_format: Optional[ResponseFormat] = None,
@@ -85,7 +85,7 @@ class SsambanovaInferenceAdapter(ModelRegistryHelper, Inference):
 
     async def chat_completion(
         self,
-        model: str,
+        model_id: str,
         messages: List[Message],
         sampling_params: Optional[SamplingParams] = SamplingParams(),
         response_format: Optional[ResponseFormat] = None,
@@ -96,7 +96,7 @@ class SsambanovaInferenceAdapter(ModelRegistryHelper, Inference):
         logprobs: Optional[LogProbConfig] = None,
     ) -> AsyncGenerator:
         request = ChatCompletionRequest(
-            model=model,
+            model=model_id,
             messages=messages,
             sampling_params=sampling_params,
             tools=tools or [],
@@ -147,7 +147,7 @@ class SsambanovaInferenceAdapter(ModelRegistryHelper, Inference):
 
     async def embeddings(
         self,
-        model: str,
+        model_id: str,
         contents: List[InterleavedTextMedia],
     ) -> EmbeddingsResponse:
         raise NotImplementedError()