From 1f52582aac38cf1fc82ec154c66788b8314535ee Mon Sep 17 00:00:00 2001 From: Yuan Tang Date: Thu, 13 Feb 2025 11:09:40 -0500 Subject: [PATCH] Update groq.py --- llama_stack/providers/remote/inference/groq/groq.py | 5 +++-- 1 file changed, 3 insertions(+), 2 deletions(-) diff --git a/llama_stack/providers/remote/inference/groq/groq.py b/llama_stack/providers/remote/inference/groq/groq.py index 87c4d0d00..9b3c1abbf 100644 --- a/llama_stack/providers/remote/inference/groq/groq.py +++ b/llama_stack/providers/remote/inference/groq/groq.py @@ -65,7 +65,7 @@ _MODEL_ALIASES = [ # TODO(aidand): Replace this with a stable model once Groq supports it build_model_alias( "llama-3.2-3b-preview", - CoreModelId.llama3_2_3b.value, + CoreModelId.llama3_2_3b_instruct.value, ), ] @@ -105,9 +105,10 @@ class GroqInferenceAdapter(Inference, ModelRegistryHelper, NeedsRequestProviderD model_id = self.get_provider_model_id(model_id) if model_id == "llama-3.2-3b-preview": warnings.warn( - "Groq only contains a preview version for llama-3.2-3b. " + "Groq only contains a preview version for llama-3.2-3b-instruct. " "Preview models aren't recommended for production use. " "They can be discontinued on short notice." + " More details: https://console.groq.com/docs/models" ) request = convert_chat_completion_request(