mirror of
https://github.com/BerriAI/litellm.git
synced 2025-04-24 18:24:20 +00:00
(docs) add deepinfra models + pricing
This commit is contained in:
parent
1e7bae4aea
commit
8251e71a2a
2 changed files with 60 additions and 6 deletions
|
@ -1,5 +1,12 @@
|
||||||
# DeepInfra
|
# DeepInfra
|
||||||
https://deepinfra.com/
|
https://deepinfra.com/
|
||||||
|
|
||||||
|
## API Key
|
||||||
|
```python
|
||||||
|
# env variable
|
||||||
|
os.environ['DEEPINFRA_API_KEY'] = "your-deepinfra-api-key"
|
||||||
|
```
|
||||||
|
|
||||||
## Sample Usage
|
## Sample Usage
|
||||||
```python
|
```python
|
||||||
from litellm import completion
|
from litellm import completion
|
||||||
|
@ -29,10 +36,15 @@ for chunk in response:
|
||||||
```
|
```
|
||||||
|
|
||||||
## Chat Models
|
## Chat Models
|
||||||
| Model Name | Function Call | Required OS Variables |
|
| Model Name | Function Call |
|
||||||
|------------------|--------------------------------------|-------------------------|
|
|------------------|--------------------------------------|
|
||||||
| meta-llama/Llama-2-70b-chat-hf | `completion(model="deepinfra/meta-llama/Llama-2-70b-chat-hf", messages)` | `os.environ['DEEPINFRA_API_KEY']` |
|
| meta-llama/Llama-2-70b-chat-hf | `completion(model="deepinfra/meta-llama/Llama-2-70b-chat-hf", messages)` |
|
||||||
| meta-llama/Llama-2-7b-chat-hf | `completion(model="deepinfra/meta-llama/Llama-2-7b-chat-hf", messages)` | `os.environ['DEEPINFRA_API_KEY']` |
|
| meta-llama/Llama-2-7b-chat-hf | `completion(model="deepinfra/meta-llama/Llama-2-7b-chat-hf", messages)` |
|
||||||
| codellama/CodeLlama-34b-Instruct-hf | `completion(model="deepinfra/codellama/CodeLlama-34b-Instruct-hf", messages)` | `os.environ['DEEPINFRA_API_KEY']` |
|
| meta-llama/Llama-2-13b-chat-hf | `completion(model="deepinfra/meta-llama/Llama-2-13b-chat-hf", messages)` |
|
||||||
|
| codellama/CodeLlama-34b-Instruct-hf | `completion(model="deepinfra/codellama/CodeLlama-34b-Instruct-hf", messages)` |
|
||||||
|
| mistralai/Mistral-7B-Instruct-v0.1 | `completion(model="deepinfra/mistralai/Mistral-7B-Instruct-v0.1", messages)` |
|
||||||
|
| jondurbin/airoboros-l2-70b-gpt4-1.4.1 | `completion(model="deepinfra/jondurbin/airoboros-l2-70b-gpt4-1.4.1", messages)` |
|
||||||
|
|
||||||
|
|
||||||
|
|
||||||
|
|
||||||
|
|
|
@ -570,5 +570,47 @@
|
||||||
"output_cost_per_token": 0.0,
|
"output_cost_per_token": 0.0,
|
||||||
"litellm_provider": "ollama",
|
"litellm_provider": "ollama",
|
||||||
"mode": "completion"
|
"mode": "completion"
|
||||||
}
|
},
|
||||||
|
"deepinfra/meta-llama/Llama-2-70b-chat-hf": {
|
||||||
|
"max_tokens": 6144,
|
||||||
|
"input_cost_per_token": 0.000001875,
|
||||||
|
"output_cost_per_token": 0.000001875,
|
||||||
|
"litellm_provider": "deepinfra",
|
||||||
|
"mode": "chat"
|
||||||
|
},
|
||||||
|
"deepinfra/codellama/CodeLlama-34b-Instruct-hf": {
|
||||||
|
"max_tokens": 4096,
|
||||||
|
"input_cost_per_token": 0.0000006,
|
||||||
|
"output_cost_per_token": 0.0000006,
|
||||||
|
"litellm_provider": "deepinfra",
|
||||||
|
"mode": "chat"
|
||||||
|
},
|
||||||
|
"deepinfra/meta-llama/Llama-2-13b-chat-hf": {
|
||||||
|
"max_tokens": 4096,
|
||||||
|
"input_cost_per_token": 0.00000035,
|
||||||
|
"output_cost_per_token": 0.00000035,
|
||||||
|
"litellm_provider": "deepinfra",
|
||||||
|
"mode": "chat"
|
||||||
|
},
|
||||||
|
"deepinfra/meta-llama/Llama-2-7b-chat-hf": {
|
||||||
|
"max_tokens": 4096,
|
||||||
|
"input_cost_per_token": 0.0000002,
|
||||||
|
"output_cost_per_token": 0.0000002,
|
||||||
|
"litellm_provider": "deepinfra",
|
||||||
|
"mode": "chat"
|
||||||
|
},
|
||||||
|
"deepinfra/mistralai/Mistral-7B-Instruct-v0.1": {
|
||||||
|
"max_tokens": 4096,
|
||||||
|
"input_cost_per_token": 0.0000002,
|
||||||
|
"output_cost_per_token": 0.0000002,
|
||||||
|
"litellm_provider": "deepinfra",
|
||||||
|
"mode": "chat"
|
||||||
|
},
|
||||||
|
"deepinfra/jondurbin/airoboros-l2-70b-gpt4-1.4.1": {
|
||||||
|
"max_tokens": 4096,
|
||||||
|
"input_cost_per_token": 0.0000007,
|
||||||
|
"output_cost_per_token": 0.00000095,
|
||||||
|
"litellm_provider": "deepinfra",
|
||||||
|
"mode": "chat"
|
||||||
|
}
|
||||||
}
|
}
|
||||||
|
|
Loading…
Add table
Add a link
Reference in a new issue