[Feat] add fireworks llama 3.2 models + cost tracking (#5905)

* add fireworks llama 3.2 vision models

* add new llama3.2 models

* docs add new llama 3.2 vision models
This commit is contained in:
Ishaan Jaff 2024-09-25 17:59:46 -07:00 committed by GitHub
parent 4bdeefd7e4
commit a8dd495eae
No known key found for this signature in database
GPG key ID: B5690EEEBB952194
3 changed files with 96 additions and 0 deletions

View file

@ -148,6 +148,10 @@ We support ALL Fireworks AI models, just set `fireworks_ai/` as a prefix when se
| Model Name | Function Call |
|--------------------------|------------------------------------------------------------------------------------------------------------------------------------------------------------------|
| llama-v3p2-1b-instruct | `completion(model="fireworks_ai/llama-v3p2-1b-instruct", messages)` |
| llama-v3p2-3b-instruct | `completion(model="fireworks_ai/llama-v3p2-3b-instruct", messages)` |
| llama-v3p2-11b-vision-instruct | `completion(model="fireworks_ai/llama-v3p2-11b-vision-instruct", messages)` |
| llama-v3p2-90b-vision-instruct | `completion(model="fireworks_ai/llama-v3p2-90b-vision-instruct", messages)` |
| mixtral-8x7b-instruct | `completion(model="fireworks_ai/mixtral-8x7b-instruct", messages)` |
| firefunction-v1 | `completion(model="fireworks_ai/firefunction-v1", messages)` |
| llama-v2-70b-chat | `completion(model="fireworks_ai/llama-v2-70b-chat", messages)` |

View file

@ -5473,6 +5473,52 @@
"litellm_provider": "perplexity",
"mode": "chat"
},
"fireworks_ai/accounts/fireworks/models/llama-v3p2-1b-instruct": {
"max_tokens": 16384,
"max_input_tokens": 16384,
"max_output_tokens": 16384,
"input_cost_per_token": 0.0000001,
"output_cost_per_token": 0.0000001,
"litellm_provider": "fireworks_ai",
"mode": "chat",
"supports_function_calling": true,
"source": "https://fireworks.ai/pricing"
},
"fireworks_ai/accounts/fireworks/models/llama-v3p2-3b-instruct": {
"max_tokens": 16384,
"max_input_tokens": 16384,
"max_output_tokens": 16384,
"input_cost_per_token": 0.0000001,
"output_cost_per_token": 0.0000001,
"litellm_provider": "fireworks_ai",
"mode": "chat",
"supports_function_calling": true,
"source": "https://fireworks.ai/pricing"
},
"fireworks_ai/accounts/fireworks/models/llama-v3p2-11b-vision-instruct": {
"max_tokens": 16384,
"max_input_tokens": 16384,
"max_output_tokens": 16384,
"input_cost_per_token": 0.0000002,
"output_cost_per_token": 0.0000002,
"litellm_provider": "fireworks_ai",
"mode": "chat",
"supports_function_calling": true,
"supports_vision": true,
"source": "https://fireworks.ai/pricing"
},
"fireworks_ai/accounts/fireworks/models/llama-v3p2-90b-vision-instruct": {
"max_tokens": 16384,
"max_input_tokens": 16384,
"max_output_tokens": 16384,
"input_cost_per_token": 0.0000009,
"output_cost_per_token": 0.0000009,
"litellm_provider": "fireworks_ai",
"mode": "chat",
"supports_function_calling": true,
"supports_vision": true,
"source": "https://fireworks.ai/pricing"
},
"fireworks_ai/accounts/fireworks/models/firefunction-v2": {
"max_tokens": 8192,
"max_input_tokens": 8192,

View file

@ -5473,6 +5473,52 @@
"litellm_provider": "perplexity",
"mode": "chat"
},
"fireworks_ai/accounts/fireworks/models/llama-v3p2-1b-instruct": {
"max_tokens": 16384,
"max_input_tokens": 16384,
"max_output_tokens": 16384,
"input_cost_per_token": 0.0000001,
"output_cost_per_token": 0.0000001,
"litellm_provider": "fireworks_ai",
"mode": "chat",
"supports_function_calling": true,
"source": "https://fireworks.ai/pricing"
},
"fireworks_ai/accounts/fireworks/models/llama-v3p2-3b-instruct": {
"max_tokens": 16384,
"max_input_tokens": 16384,
"max_output_tokens": 16384,
"input_cost_per_token": 0.0000001,
"output_cost_per_token": 0.0000001,
"litellm_provider": "fireworks_ai",
"mode": "chat",
"supports_function_calling": true,
"source": "https://fireworks.ai/pricing"
},
"fireworks_ai/accounts/fireworks/models/llama-v3p2-11b-vision-instruct": {
"max_tokens": 16384,
"max_input_tokens": 16384,
"max_output_tokens": 16384,
"input_cost_per_token": 0.0000002,
"output_cost_per_token": 0.0000002,
"litellm_provider": "fireworks_ai",
"mode": "chat",
"supports_function_calling": true,
"supports_vision": true,
"source": "https://fireworks.ai/pricing"
},
"fireworks_ai/accounts/fireworks/models/llama-v3p2-90b-vision-instruct": {
"max_tokens": 16384,
"max_input_tokens": 16384,
"max_output_tokens": 16384,
"input_cost_per_token": 0.0000009,
"output_cost_per_token": 0.0000009,
"litellm_provider": "fireworks_ai",
"mode": "chat",
"supports_function_calling": true,
"supports_vision": true,
"source": "https://fireworks.ai/pricing"
},
"fireworks_ai/accounts/fireworks/models/firefunction-v2": {
"max_tokens": 8192,
"max_input_tokens": 8192,