Update Groq models in model_prices_and_context_window.json

Add support for 6 new models, add deprecation dates to 12 models, and update context windows/max tokens for 3 models.
This commit is contained in:
naliotopier 2025-04-16 14:19:38 -07:00
parent ef80d25f16
commit 2f9dd03b2a

View file

@ -3423,25 +3423,24 @@
"supports_prompt_caching": true "supports_prompt_caching": true
}, },
"groq/deepseek-r1-distill-llama-70b": { "groq/deepseek-r1-distill-llama-70b": {
"max_tokens": 131072, "max_tokens": 128000,
"max_input_tokens": 131072, "max_input_tokens": 128000,
"max_output_tokens": 131072, "max_output_tokens": 128000,
"input_cost_per_token": 0.00000075, "input_cost_per_token": 7.5e-07,
"output_cost_per_token": 0.00000099, "output_cost_per_token": 9.9e-07,
"litellm_provider": "groq", "litellm_provider": "groq",
"mode": "chat", "mode": "chat",
"supports_system_messages": false, "supports_function_calling": true,
"supports_function_calling": false, "supports_response_schema": true,
"supports_reasoning": true, "supports_reasoning": true,
"supports_response_schema": false,
"supports_tool_choice": true "supports_tool_choice": true
}, },
"groq/llama-3.3-70b-versatile": { "groq/llama-3.3-70b-versatile": {
"max_tokens": 8192, "max_tokens": 32768,
"max_input_tokens": 128000, "max_input_tokens": 128000,
"max_output_tokens": 8192, "max_output_tokens": 32768,
"input_cost_per_token": 0.00000059, "input_cost_per_token": 5.9e-07,
"output_cost_per_token": 0.00000079, "output_cost_per_token": 7.900000000000001e-07,
"litellm_provider": "groq", "litellm_provider": "groq",
"mode": "chat", "mode": "chat",
"supports_function_calling": true, "supports_function_calling": true,
@ -3452,11 +3451,21 @@
"max_tokens": 8192, "max_tokens": 8192,
"max_input_tokens": 8192, "max_input_tokens": 8192,
"max_output_tokens": 8192, "max_output_tokens": 8192,
"input_cost_per_token": 0.00000059, "input_cost_per_token": 5.9e-07,
"output_cost_per_token": 0.00000099, "output_cost_per_token": 9.9e-07,
"litellm_provider": "groq", "litellm_provider": "groq",
"mode": "chat", "mode": "chat",
"supports_tool_choice": true "supports_tool_choice": true,
"deprecation_date": "2025-04-14"
},
"groq/llama-guard-3-8b": {
"max_tokens": 8192,
"max_input_tokens": 8192,
"max_output_tokens": 8192,
"input_cost_per_token": 2e-07,
"output_cost_per_token": 2e-07,
"litellm_provider": "groq",
"mode": "chat"
}, },
"groq/llama2-70b-4096": { "groq/llama2-70b-4096": {
"max_tokens": 4096, "max_tokens": 4096,
@ -3474,106 +3483,106 @@
"max_tokens": 8192, "max_tokens": 8192,
"max_input_tokens": 8192, "max_input_tokens": 8192,
"max_output_tokens": 8192, "max_output_tokens": 8192,
"input_cost_per_token": 0.00000005, "input_cost_per_token": 5.0000000000000004e-08,
"output_cost_per_token": 0.00000008, "output_cost_per_token": 8e-08,
"litellm_provider": "groq", "litellm_provider": "groq",
"mode": "chat", "mode": "chat"
"supports_function_calling": true,
"supports_response_schema": true,
"supports_tool_choice": true
}, },
"groq/llama-3.2-1b-preview": { "groq/llama-3.2-1b-preview": {
"max_tokens": 8192, "max_tokens": 8192,
"max_input_tokens": 8192, "max_input_tokens": 8192,
"max_output_tokens": 8192, "max_output_tokens": 8192,
"input_cost_per_token": 0.00000004, "input_cost_per_token": 4e-08,
"output_cost_per_token": 0.00000004, "output_cost_per_token": 4e-08,
"litellm_provider": "groq", "litellm_provider": "groq",
"mode": "chat", "mode": "chat",
"supports_function_calling": true, "supports_function_calling": true,
"supports_response_schema": true, "supports_response_schema": true,
"supports_tool_choice": true "supports_tool_choice": true,
"deprecation_date": "2025-04-14"
}, },
"groq/llama-3.2-3b-preview": { "groq/llama-3.2-3b-preview": {
"max_tokens": 8192, "max_tokens": 8192,
"max_input_tokens": 8192, "max_input_tokens": 8192,
"max_output_tokens": 8192, "max_output_tokens": 8192,
"input_cost_per_token": 0.00000006, "input_cost_per_token": 6e-08,
"output_cost_per_token": 0.00000006, "output_cost_per_token": 6e-08,
"litellm_provider": "groq", "litellm_provider": "groq",
"mode": "chat", "mode": "chat",
"supports_function_calling": true, "supports_function_calling": true,
"supports_response_schema": true, "supports_response_schema": true,
"supports_tool_choice": true "supports_tool_choice": true,
"deprecation_date": "2025-04-14"
}, },
"groq/llama-3.2-11b-text-preview": { "groq/llama-3.2-11b-text-preview": {
"max_tokens": 8192, "max_tokens": 8192,
"max_input_tokens": 8192, "max_input_tokens": 8192,
"max_output_tokens": 8192, "max_output_tokens": 8192,
"input_cost_per_token": 0.00000018, "input_cost_per_token": 1.8e-07,
"output_cost_per_token": 0.00000018, "output_cost_per_token": 1.8e-07,
"litellm_provider": "groq", "litellm_provider": "groq",
"mode": "chat", "mode": "chat",
"supports_function_calling": true, "supports_function_calling": true,
"supports_response_schema": true, "supports_response_schema": true,
"supports_tool_choice": true "supports_tool_choice": true,
"deprecation_date": "2024-10-28"
}, },
"groq/llama-3.2-11b-vision-preview": { "groq/llama-3.2-11b-vision-preview": {
"max_tokens": 8192, "max_tokens": 8192,
"max_input_tokens": 8192, "max_input_tokens": 8192,
"max_output_tokens": 8192, "max_output_tokens": 8192,
"input_cost_per_token": 0.00000018, "input_cost_per_token": 1.8e-07,
"output_cost_per_token": 0.00000018, "output_cost_per_token": 1.8e-07,
"litellm_provider": "groq", "litellm_provider": "groq",
"mode": "chat", "mode": "chat",
"supports_function_calling": true, "supports_function_calling": true,
"supports_response_schema": true, "supports_response_schema": true,
"supports_vision": true, "supports_vision": true,
"supports_tool_choice": true "supports_tool_choice": true,
"deprecation_date": "2025-04-14"
}, },
"groq/llama-3.2-90b-text-preview": { "groq/llama-3.2-90b-text-preview": {
"max_tokens": 8192, "max_tokens": 8192,
"max_input_tokens": 8192, "max_input_tokens": 8192,
"max_output_tokens": 8192, "max_output_tokens": 8192,
"input_cost_per_token": 0.0000009, "input_cost_per_token": 9e-07,
"output_cost_per_token": 0.0000009, "output_cost_per_token": 9e-07,
"litellm_provider": "groq", "litellm_provider": "groq",
"mode": "chat", "mode": "chat",
"supports_function_calling": true, "supports_function_calling": true,
"supports_response_schema": true, "supports_response_schema": true,
"supports_tool_choice": true "supports_tool_choice": true,
"deprecation_date": "2024-11-25"
}, },
"groq/llama-3.2-90b-vision-preview": { "groq/llama-3.2-90b-vision-preview": {
"max_tokens": 8192, "max_tokens": 8192,
"max_input_tokens": 8192, "max_input_tokens": 8192,
"max_output_tokens": 8192, "max_output_tokens": 8192,
"input_cost_per_token": 0.0000009, "input_cost_per_token": 9e-07,
"output_cost_per_token": 0.0000009, "output_cost_per_token": 9e-07,
"litellm_provider": "groq", "litellm_provider": "groq",
"mode": "chat", "mode": "chat",
"supports_function_calling": true, "supports_function_calling": true,
"supports_response_schema": true, "supports_response_schema": true,
"supports_vision": true, "supports_vision": true,
"supports_tool_choice": true "supports_tool_choice": true,
"deprecation_date": "2025-04-14"
}, },
"groq/llama3-70b-8192": { "groq/llama3-70b-8192": {
"max_tokens": 8192, "max_tokens": 8192,
"max_input_tokens": 8192, "max_input_tokens": 8192,
"max_output_tokens": 8192, "max_output_tokens": 8192,
"input_cost_per_token": 0.00000059, "input_cost_per_token": 5.9e-07,
"output_cost_per_token": 0.00000079, "output_cost_per_token": 7.900000000000001e-07,
"litellm_provider": "groq", "litellm_provider": "groq",
"mode": "chat", "mode": "chat"
"supports_function_calling": true,
"supports_response_schema": true,
"supports_tool_choice": true
}, },
"groq/llama-3.1-8b-instant": { "groq/llama-3.1-8b-instant": {
"max_tokens": 8192, "max_tokens": 8192,
"max_input_tokens": 8192, "max_input_tokens": 128000,
"max_output_tokens": 8192, "max_output_tokens": 8192,
"input_cost_per_token": 0.00000005, "input_cost_per_token": 5.0000000000000004e-08,
"output_cost_per_token": 0.00000008, "output_cost_per_token": 8e-08,
"litellm_provider": "groq", "litellm_provider": "groq",
"mode": "chat", "mode": "chat",
"supports_function_calling": true, "supports_function_calling": true,
@ -3584,13 +3593,14 @@
"max_tokens": 8192, "max_tokens": 8192,
"max_input_tokens": 8192, "max_input_tokens": 8192,
"max_output_tokens": 8192, "max_output_tokens": 8192,
"input_cost_per_token": 0.00000059, "input_cost_per_token": 5.9e-07,
"output_cost_per_token": 0.00000079, "output_cost_per_token": 7.9e-07,
"litellm_provider": "groq", "litellm_provider": "groq",
"mode": "chat", "mode": "chat",
"supports_function_calling": true, "supports_function_calling": true,
"supports_response_schema": true, "supports_response_schema": true,
"supports_tool_choice": true "supports_tool_choice": true,
"deprecation_date": "2025-01-24"
}, },
"groq/llama-3.1-405b-reasoning": { "groq/llama-3.1-405b-reasoning": {
"max_tokens": 8192, "max_tokens": 8192,
@ -3604,83 +3614,141 @@
"supports_response_schema": true, "supports_response_schema": true,
"supports_tool_choice": true "supports_tool_choice": true
}, },
"groq/mixtral-8x7b-32768": { "groq/meta-llama/llama-4-scout-17b-16e-instruct": {
"max_tokens": 32768, "max_tokens": 8192,
"max_input_tokens": 32768, "max_input_tokens": 131072,
"max_output_tokens": 32768, "max_output_tokens": 8192,
"input_cost_per_token": 0.00000024, "input_cost_per_token": 1.1e-07,
"output_cost_per_token": 0.00000024, "output_cost_per_token": 3.4000000000000003e-07,
"litellm_provider": "groq", "litellm_provider": "groq",
"mode": "chat", "mode": "chat",
"supports_function_calling": true, "supports_function_calling": true,
"supports_response_schema": true, "supports_response_schema": true,
"supports_tool_choice": true "supports_tool_choice": true
}, },
"groq/meta-llama/llama-4-maverick-17b-128e-instruct": {
"max_tokens": 8192,
"max_input_tokens": 131072,
"max_output_tokens": 8192,
"input_cost_per_token": 2e-07,
"output_cost_per_token": 6e-07,
"litellm_provider": "groq",
"mode": "chat",
"supports_function_calling": true,
"supports_response_schema": true,
"supports_tool_choice": true
},
"groq/mistral-saba-24b": {
"max_tokens": 32000,
"max_input_tokens": 32000,
"max_output_tokens": 32000,
"input_cost_per_token": 7.9e-07,
"output_cost_per_token": 7.9e-07,
"litellm_provider": "groq",
"mode": "chat"
},
"groq/mixtral-8x7b-32768": {
"max_tokens": 32768,
"max_input_tokens": 32768,
"max_output_tokens": 32768,
"input_cost_per_token": 2.4e-07,
"output_cost_per_token": 2.4e-07,
"litellm_provider": "groq",
"mode": "chat",
"supports_function_calling": true,
"supports_response_schema": true,
"supports_tool_choice": true,
"deprecation_date": "2025-03-20"
},
"groq/gemma-7b-it": { "groq/gemma-7b-it": {
"max_tokens": 8192, "max_tokens": 8192,
"max_input_tokens": 8192, "max_input_tokens": 8192,
"max_output_tokens": 8192, "max_output_tokens": 8192,
"input_cost_per_token": 0.00000007, "input_cost_per_token": 7e-08,
"output_cost_per_token": 0.00000007, "output_cost_per_token": 7e-08,
"litellm_provider": "groq", "litellm_provider": "groq",
"mode": "chat", "mode": "chat",
"supports_function_calling": true, "supports_function_calling": true,
"supports_response_schema": true, "supports_response_schema": true,
"supports_tool_choice": true "supports_tool_choice": true,
"deprecation_date": "2024-12-18"
}, },
"groq/gemma2-9b-it": { "groq/gemma2-9b-it": {
"max_tokens": 8192, "max_tokens": 8192,
"max_input_tokens": 8192, "max_input_tokens": 8192,
"max_output_tokens": 8192, "max_output_tokens": 8192,
"input_cost_per_token": 0.00000020, "input_cost_per_token": 2.0000000000000002e-07,
"output_cost_per_token": 0.00000020, "output_cost_per_token": 2.0000000000000002e-07,
"litellm_provider": "groq", "litellm_provider": "groq",
"mode": "chat", "mode": "chat",
"supports_function_calling": true, "supports_function_calling": false,
"supports_response_schema": true, "supports_response_schema": true,
"supports_tool_choice": true "supports_tool_choice": false
}, },
"groq/llama3-groq-70b-8192-tool-use-preview": { "groq/llama3-groq-70b-8192-tool-use-preview": {
"max_tokens": 8192, "max_tokens": 8192,
"max_input_tokens": 8192, "max_input_tokens": 8192,
"max_output_tokens": 8192, "max_output_tokens": 8192,
"input_cost_per_token": 0.00000089, "input_cost_per_token": 8.9e-07,
"output_cost_per_token": 0.00000089, "output_cost_per_token": 8.9e-07,
"litellm_provider": "groq", "litellm_provider": "groq",
"mode": "chat", "mode": "chat",
"supports_function_calling": true, "supports_function_calling": true,
"supports_response_schema": true, "supports_response_schema": true,
"supports_tool_choice": true "supports_tool_choice": true,
"deprecation_date": "2025-01-06"
}, },
"groq/llama3-groq-8b-8192-tool-use-preview": { "groq/llama3-groq-8b-8192-tool-use-preview": {
"max_tokens": 8192, "max_tokens": 8192,
"max_input_tokens": 8192, "max_input_tokens": 8192,
"max_output_tokens": 8192, "max_output_tokens": 8192,
"input_cost_per_token": 0.00000019, "input_cost_per_token": 1.9e-07,
"output_cost_per_token": 0.00000019, "output_cost_per_token": 1.9e-07,
"litellm_provider": "groq", "litellm_provider": "groq",
"mode": "chat", "mode": "chat",
"supports_function_calling": true, "supports_function_calling": true,
"supports_response_schema": true, "supports_response_schema": true,
"supports_tool_choice": true,
"deprecation_date": "2025-01-06"
},
"groq/qwen-qwq-32b": {
"max_tokens": 128000,
"max_input_tokens": 128000,
"max_output_tokens": 128000,
"input_cost_per_token": 2.9e-07,
"output_cost_per_token": 3.9e-07,
"litellm_provider": "groq",
"mode": "chat",
"supports_function_calling": true,
"supports_response_schema": true,
"supports_reasoning": true,
"supports_tool_choice": true "supports_tool_choice": true
}, },
"groq/playai-tts": {
"max_tokens": 10000,
"max_input_tokens": 10000,
"max_output_tokens": 10000,
"input_cost_per_character": 5e-05,
"litellm_provider": "groq",
"mode": "audio_speech"
},
"groq/whisper-large-v3": { "groq/whisper-large-v3": {
"mode": "audio_transcription", "input_cost_per_second": 3.0833333333333335e-05,
"input_cost_per_second": 0.00003083, "output_cost_per_second": 0.0,
"output_cost_per_second": 0, "litellm_provider": "groq",
"litellm_provider": "groq" "mode": "audio_transcription"
}, },
"groq/whisper-large-v3-turbo": { "groq/whisper-large-v3-turbo": {
"mode": "audio_transcription", "input_cost_per_second": 1.1111111111111112e-05,
"input_cost_per_second": 0.00001111, "output_cost_per_second": 0.0,
"output_cost_per_second": 0, "litellm_provider": "groq",
"litellm_provider": "groq" "mode": "audio_transcription"
}, },
"groq/distil-whisper-large-v3-en": { "groq/distil-whisper-large-v3-en": {
"mode": "audio_transcription", "input_cost_per_second": 5.555555555555556e-06,
"input_cost_per_second": 0.00000556, "output_cost_per_second": 0.0,
"output_cost_per_second": 0, "litellm_provider": "groq",
"litellm_provider": "groq" "mode": "audio_transcription"
}, },
"cerebras/llama3.1-8b": { "cerebras/llama3.1-8b": {
"max_tokens": 128000, "max_tokens": 128000,