Merge pull request #5221 from kiriloman/adjust-pricing-file

[PRICING] Use specific llama2 and llama3 model names in Ollama
This commit is contained in:
Krish Dholakia 2024-08-17 14:03:20 -07:00 committed by GitHub
commit 5731287f1b
No known key found for this signature in database
GPG key ID: B5690EEEBB952194

View file

@ -4201,6 +4201,15 @@
"litellm_provider": "ollama",
"mode": "completion"
},
"ollama/llama2:7b": {
"max_tokens": 4096,
"max_input_tokens": 4096,
"max_output_tokens": 4096,
"input_cost_per_token": 0.0,
"output_cost_per_token": 0.0,
"litellm_provider": "ollama",
"mode": "completion"
},
"ollama/llama2:13b": {
"max_tokens": 4096,
"max_input_tokens": 4096,
@ -4237,6 +4246,15 @@
"litellm_provider": "ollama",
"mode": "chat"
},
"ollama/llama3:8b": {
"max_tokens": 8192,
"max_input_tokens": 8192,
"max_output_tokens": 8192,
"input_cost_per_token": 0.0,
"output_cost_per_token": 0.0,
"litellm_provider": "ollama",
"mode": "chat"
},
"ollama/llama3:70b": {
"max_tokens": 8192,
"max_input_tokens": 8192,