[Feat] add fireworks llama 3.2 models + cost tracking (#5905)

* add fireworks llama 3.2 vision models
* add new llama3.2 models
* docs add new llama 3.2 vision models
2024-09-25 17:59:46 -07:00 · 2024-09-25 17:59:46 -07:00 · a8dd495eae
commit a8dd495eae
parent 4bdeefd7e4
3 changed files with 96 additions and 0 deletions
--- a/docs/my-website/docs/providers/fireworks_ai.md
+++ b/docs/my-website/docs/providers/fireworks_ai.md
@@ -148,6 +148,10 @@ We support ALL Fireworks AI models, just set `fireworks_ai/` as a prefix when se

 | Model Name               | Function Call                                                                                                                                                      |
 |--------------------------|------------------------------------------------------------------------------------------------------------------------------------------------------------------|
+| llama-v3p2-1b-instruct | `completion(model="fireworks_ai/llama-v3p2-1b-instruct", messages)` |
+| llama-v3p2-3b-instruct | `completion(model="fireworks_ai/llama-v3p2-3b-instruct", messages)` |
+| llama-v3p2-11b-vision-instruct | `completion(model="fireworks_ai/llama-v3p2-11b-vision-instruct", messages)` |
+| llama-v3p2-90b-vision-instruct | `completion(model="fireworks_ai/llama-v3p2-90b-vision-instruct", messages)` |
 | mixtral-8x7b-instruct | `completion(model="fireworks_ai/mixtral-8x7b-instruct", messages)` | 
 | firefunction-v1 | `completion(model="fireworks_ai/firefunction-v1", messages)` |
 | llama-v2-70b-chat | `completion(model="fireworks_ai/llama-v2-70b-chat", messages)` |  
--- a/litellm/model_prices_and_context_window_backup.json
+++ b/litellm/model_prices_and_context_window_backup.json
@@ -5473,6 +5473,52 @@
        "litellm_provider": "perplexity",
        "mode": "chat"
    },
+    "fireworks_ai/accounts/fireworks/models/llama-v3p2-1b-instruct": {
+        "max_tokens": 16384,
+        "max_input_tokens": 16384,
+        "max_output_tokens": 16384,
+        "input_cost_per_token": 0.0000001, 
+        "output_cost_per_token": 0.0000001,
+        "litellm_provider": "fireworks_ai", 
+        "mode": "chat",
+        "supports_function_calling": true,
+        "source": "https://fireworks.ai/pricing"
+    },
+    "fireworks_ai/accounts/fireworks/models/llama-v3p2-3b-instruct": {
+        "max_tokens": 16384,
+        "max_input_tokens": 16384,
+        "max_output_tokens": 16384,
+        "input_cost_per_token": 0.0000001, 
+        "output_cost_per_token": 0.0000001,
+        "litellm_provider": "fireworks_ai", 
+        "mode": "chat",
+        "supports_function_calling": true,
+        "source": "https://fireworks.ai/pricing"
+    },
+    "fireworks_ai/accounts/fireworks/models/llama-v3p2-11b-vision-instruct": {
+        "max_tokens": 16384,
+        "max_input_tokens": 16384,
+        "max_output_tokens": 16384,
+        "input_cost_per_token": 0.0000002, 
+        "output_cost_per_token": 0.0000002,
+        "litellm_provider": "fireworks_ai", 
+        "mode": "chat",
+        "supports_function_calling": true,
+        "supports_vision": true,
+        "source": "https://fireworks.ai/pricing"
+    },
+    "fireworks_ai/accounts/fireworks/models/llama-v3p2-90b-vision-instruct": {
+        "max_tokens": 16384,
+        "max_input_tokens": 16384,
+        "max_output_tokens": 16384,
+        "input_cost_per_token": 0.0000009, 
+        "output_cost_per_token": 0.0000009,
+        "litellm_provider": "fireworks_ai", 
+        "mode": "chat",
+        "supports_function_calling": true,
+        "supports_vision": true,
+        "source": "https://fireworks.ai/pricing"
+    },
    "fireworks_ai/accounts/fireworks/models/firefunction-v2": {
        "max_tokens": 8192,
        "max_input_tokens": 8192,
--- a/model_prices_and_context_window.json
+++ b/model_prices_and_context_window.json
@@ -5473,6 +5473,52 @@
        "litellm_provider": "perplexity",
        "mode": "chat"
    },
+    "fireworks_ai/accounts/fireworks/models/llama-v3p2-1b-instruct": {
+        "max_tokens": 16384,
+        "max_input_tokens": 16384,
+        "max_output_tokens": 16384,
+        "input_cost_per_token": 0.0000001, 
+        "output_cost_per_token": 0.0000001,
+        "litellm_provider": "fireworks_ai", 
+        "mode": "chat",
+        "supports_function_calling": true,
+        "source": "https://fireworks.ai/pricing"
+    },
+    "fireworks_ai/accounts/fireworks/models/llama-v3p2-3b-instruct": {
+        "max_tokens": 16384,
+        "max_input_tokens": 16384,
+        "max_output_tokens": 16384,
+        "input_cost_per_token": 0.0000001, 
+        "output_cost_per_token": 0.0000001,
+        "litellm_provider": "fireworks_ai", 
+        "mode": "chat",
+        "supports_function_calling": true,
+        "source": "https://fireworks.ai/pricing"
+    },
+    "fireworks_ai/accounts/fireworks/models/llama-v3p2-11b-vision-instruct": {
+        "max_tokens": 16384,
+        "max_input_tokens": 16384,
+        "max_output_tokens": 16384,
+        "input_cost_per_token": 0.0000002, 
+        "output_cost_per_token": 0.0000002,
+        "litellm_provider": "fireworks_ai", 
+        "mode": "chat",
+        "supports_function_calling": true,
+        "supports_vision": true,
+        "source": "https://fireworks.ai/pricing"
+    },
+    "fireworks_ai/accounts/fireworks/models/llama-v3p2-90b-vision-instruct": {
+        "max_tokens": 16384,
+        "max_input_tokens": 16384,
+        "max_output_tokens": 16384,
+        "input_cost_per_token": 0.0000009, 
+        "output_cost_per_token": 0.0000009,
+        "litellm_provider": "fireworks_ai", 
+        "mode": "chat",
+        "supports_function_calling": true,
+        "supports_vision": true,
+        "source": "https://fireworks.ai/pricing"
+    },
    "fireworks_ai/accounts/fireworks/models/firefunction-v2": {
        "max_tokens": 8192,
        "max_input_tokens": 8192,