Add Groq provider - chat completions

2025-12-17 18:32:41 +00:00 · 2024-12-12 21:15:09 +11:00 · 2024-12-12 21:15:09 +11:00 · 378150e23c
commit 378150e23c
parent c294a01c4b
10 changed files with 727 additions and 31 deletions
--- a/llama_stack/providers/tests/inference/fixtures.py
+++ b/llama_stack/providers/tests/inference/fixtures.py
@ -19,6 +19,7 @@ from llama_stack.providers.remote.inference.bedrock import BedrockConfig

 from llama_stack.providers.remote.inference.cerebras import CerebrasImplConfig
 from llama_stack.providers.remote.inference.fireworks import FireworksImplConfig
+from llama_stack.providers.remote.inference.groq import GroqConfig
 from llama_stack.providers.remote.inference.nvidia import NVIDIAConfig
 from llama_stack.providers.remote.inference.ollama import OllamaImplConfig
 from llama_stack.providers.remote.inference.tgi import TGIImplConfig
@ -150,6 +151,22 @@ def inference_together() -> ProviderFixture:
    )


+@pytest.fixture(scope="session")
+def inference_groq() -> ProviderFixture:
+    return ProviderFixture(
+        providers=[
+            Provider(
+                provider_id="groq",
+                provider_type="remote::groq",
+                config=GroqConfig().model_dump(),
+            )
+        ],
+        provider_data=dict(
+            groq_api_key=get_env_or_fail("GROQ_API_KEY"),
+        ),
+    )
+
+
@pytest.fixture(scope="session")
 def inference_bedrock() -> ProviderFixture:
    return ProviderFixture(
@ -222,6 +239,7 @@ INFERENCE_FIXTURES = [
    "ollama",
    "fireworks",
    "together",
+    "groq",
    "vllm_remote",
    "remote",
    "bedrock",