diff --git a/docs/my-website/docs/providers/groq.md b/docs/my-website/docs/providers/groq.md index 4a2888312..e09cf9f8a 100644 --- a/docs/my-website/docs/providers/groq.md +++ b/docs/my-website/docs/providers/groq.md @@ -1,6 +1,8 @@ # Groq https://groq.com/ +**We support ALL Groq models, just set `groq/` as a prefix when sending completion requests** + ## API Key ```python # env variable @@ -47,3 +49,4 @@ We support ALL Groq models, just set `groq/` as a prefix when sending completion | Model Name | Function Call | |--------------------------|------------------------------------------------------------------------------------------------------------------------------------------------------------------| | llama2-70b-4096 | `completion(model="groq/llama2-70b-4096", messages)` | +| mixtral-8x7b-32768 | `completion(model="groq/mixtral-8x7b-32768", messages)` | diff --git a/litellm/model_prices_and_context_window_backup.json b/litellm/model_prices_and_context_window_backup.json index 15b969980..4870025cb 100644 --- a/litellm/model_prices_and_context_window_backup.json +++ b/litellm/model_prices_and_context_window_backup.json @@ -580,6 +580,20 @@ "litellm_provider": "mistral", "mode": "embedding" }, + "groq/llama2-70b-4096": { + "max_tokens": 4096, + "input_cost_per_token": 0.00000070, + "output_cost_per_token": 0.00000080, + "litellm_provider": "groq", + "mode": "chat" + }, + "groq/mixtral-8x7b-32768": { + "max_tokens": 32768, + "input_cost_per_token": 0.00000027, + "output_cost_per_token": 0.00000027, + "litellm_provider": "groq", + "mode": "chat" + }, "claude-instant-1.2": { "max_tokens": 100000, "max_output_tokens": 8191, diff --git a/model_prices_and_context_window.json b/model_prices_and_context_window.json index 15b969980..4870025cb 100644 --- a/model_prices_and_context_window.json +++ b/model_prices_and_context_window.json @@ -580,6 +580,20 @@ "litellm_provider": "mistral", "mode": "embedding" }, + "groq/llama2-70b-4096": { + "max_tokens": 4096, + "input_cost_per_token": 0.00000070, + "output_cost_per_token": 0.00000080, + "litellm_provider": "groq", + "mode": "chat" + }, + "groq/mixtral-8x7b-32768": { + "max_tokens": 32768, + "input_cost_per_token": 0.00000027, + "output_cost_per_token": 0.00000027, + "litellm_provider": "groq", + "mode": "chat" + }, "claude-instant-1.2": { "max_tokens": 100000, "max_output_tokens": 8191,