build(model_prices_and_context_window.json): add mistral-large on vertex ai pricing

This commit is contained in:
Krrish Dholakia 2024-07-27 10:32:38 -07:00
parent 3f39e61b15
commit 2719860c46
4 changed files with 40 additions and 13 deletions

View file

@ -2028,6 +2028,16 @@
"mode": "chat",
"source": "https://cloud.google.com/vertex-ai/generative-ai/pricing#partner-models"
},
"vertex_ai/mistral-large@2407": {
"max_tokens": 8191,
"max_input_tokens": 128000,
"max_output_tokens": 8191,
"input_cost_per_token": 0.000003,
"output_cost_per_token": 0.000009,
"litellm_provider": "vertex_ai-mistral_models",
"mode": "chat",
"supports_function_calling": true
},
"vertex_ai/imagegeneration@006": {
"cost_per_image": 0.020,
"litellm_provider": "vertex_ai-image-models",
@ -2994,7 +3004,8 @@
"input_cost_per_token": 0.000008,
"output_cost_per_token": 0.000024,
"litellm_provider": "bedrock",
"mode": "chat"
"mode": "chat",
"supports_function_calling": true
},
"mistral.mistral-large-2407-v1:0": {
"max_tokens": 8191,
@ -3003,7 +3014,8 @@
"input_cost_per_token": 0.000003,
"output_cost_per_token": 0.000009,
"litellm_provider": "bedrock",
"mode": "chat"
"mode": "chat",
"supports_function_calling": true
},
"bedrock/us-west-2/mistral.mixtral-8x7b-instruct-v0:1": {
"max_tokens": 8191,
@ -3075,7 +3087,8 @@
"input_cost_per_token": 0.000008,
"output_cost_per_token": 0.000024,
"litellm_provider": "bedrock",
"mode": "chat"
"mode": "chat",
"supports_function_calling": true
},
"bedrock/eu-west-3/mistral.mistral-large-2402-v1:0": {
"max_tokens": 8191,
@ -3084,7 +3097,8 @@
"input_cost_per_token": 0.0000104,
"output_cost_per_token": 0.0000312,
"litellm_provider": "bedrock",
"mode": "chat"
"mode": "chat",
"supports_function_calling": true
},
"anthropic.claude-3-sonnet-20240229-v1:0": {
"max_tokens": 4096,

View file

@ -1,6 +1,5 @@
model_list:
- model_name: "llama3.1"
- model_name: "*"
litellm_params:
model: "ollama_chat/llama3.1"
model_info:
supports_function_calling: true
model: "*"

View file

@ -10,7 +10,6 @@ import json
import os
from typing import Optional
import jwt
from cryptography import x509
from cryptography.hazmat.backends import default_backend
from cryptography.hazmat.primitives import serialization
@ -195,6 +194,7 @@ class JWTHandler:
if audience is None:
decode_options = {"verify_aud": False}
import jwt
from jwt.algorithms import RSAAlgorithm
header = jwt.get_unverified_header(token)

View file

@ -2028,6 +2028,16 @@
"mode": "chat",
"source": "https://cloud.google.com/vertex-ai/generative-ai/pricing#partner-models"
},
"vertex_ai/mistral-large@2407": {
"max_tokens": 8191,
"max_input_tokens": 128000,
"max_output_tokens": 8191,
"input_cost_per_token": 0.000003,
"output_cost_per_token": 0.000009,
"litellm_provider": "vertex_ai-mistral_models",
"mode": "chat",
"supports_function_calling": true
},
"vertex_ai/imagegeneration@006": {
"cost_per_image": 0.020,
"litellm_provider": "vertex_ai-image-models",
@ -2994,7 +3004,8 @@
"input_cost_per_token": 0.000008,
"output_cost_per_token": 0.000024,
"litellm_provider": "bedrock",
"mode": "chat"
"mode": "chat",
"supports_function_calling": true
},
"mistral.mistral-large-2407-v1:0": {
"max_tokens": 8191,
@ -3003,7 +3014,8 @@
"input_cost_per_token": 0.000003,
"output_cost_per_token": 0.000009,
"litellm_provider": "bedrock",
"mode": "chat"
"mode": "chat",
"supports_function_calling": true
},
"bedrock/us-west-2/mistral.mixtral-8x7b-instruct-v0:1": {
"max_tokens": 8191,
@ -3075,7 +3087,8 @@
"input_cost_per_token": 0.000008,
"output_cost_per_token": 0.000024,
"litellm_provider": "bedrock",
"mode": "chat"
"mode": "chat",
"supports_function_calling": true
},
"bedrock/eu-west-3/mistral.mistral-large-2402-v1:0": {
"max_tokens": 8191,
@ -3084,7 +3097,8 @@
"input_cost_per_token": 0.0000104,
"output_cost_per_token": 0.0000312,
"litellm_provider": "bedrock",
"mode": "chat"
"mode": "chat",
"supports_function_calling": true
},
"anthropic.claude-3-sonnet-20240229-v1:0": {
"max_tokens": 4096,