From e09f220600f90f2bd6dc04fa69c267d1c82b4517 Mon Sep 17 00:00:00 2001 From: lucca Date: Thu, 13 Jun 2024 21:24:07 -0300 Subject: [PATCH] llama 3 --- ...model_prices_and_context_window_backup.json | 18 ++++++++++++++++++ model_prices_and_context_window.json | 18 ++++++++++++++++++ 2 files changed, 36 insertions(+) diff --git a/litellm/model_prices_and_context_window_backup.json b/litellm/model_prices_and_context_window_backup.json index 385dc2ead..98da8d69c 100644 --- a/litellm/model_prices_and_context_window_backup.json +++ b/litellm/model_prices_and_context_window_backup.json @@ -3347,6 +3347,24 @@ "litellm_provider": "deepinfra", "mode": "chat" }, + "deepinfra/meta-llama/Meta-Llama-3-8B-Instruct": { + "max_tokens": 8191, + "max_input_tokens": 8191, + "max_output_tokens": 4096, + "input_cost_per_token": 0.00000008, + "output_cost_per_token": 0.00000008, + "litellm_provider": "deepinfra", + "mode": "chat" + }, + "deepinfra/meta-llama/Meta-Llama-3-70B-Instruct": { + "max_tokens": 8191, + "max_input_tokens": 8191, + "max_output_tokens": 4096, + "input_cost_per_token": 0.00000059, + "output_cost_per_token": 0.00000079, + "litellm_provider": "deepinfra", + "mode": "chat" + }, "deepinfra/01-ai/Yi-34B-200K": { "max_tokens": 4096, "max_input_tokens": 200000, diff --git a/model_prices_and_context_window.json b/model_prices_and_context_window.json index 385dc2ead..98da8d69c 100644 --- a/model_prices_and_context_window.json +++ b/model_prices_and_context_window.json @@ -3347,6 +3347,24 @@ "litellm_provider": "deepinfra", "mode": "chat" }, + "deepinfra/meta-llama/Meta-Llama-3-8B-Instruct": { + "max_tokens": 8191, + "max_input_tokens": 8191, + "max_output_tokens": 4096, + "input_cost_per_token": 0.00000008, + "output_cost_per_token": 0.00000008, + "litellm_provider": "deepinfra", + "mode": "chat" + }, + "deepinfra/meta-llama/Meta-Llama-3-70B-Instruct": { + "max_tokens": 8191, + "max_input_tokens": 8191, + "max_output_tokens": 4096, + "input_cost_per_token": 0.00000059, + "output_cost_per_token": 0.00000079, + "litellm_provider": "deepinfra", + "mode": "chat" + }, "deepinfra/01-ai/Yi-34B-200K": { "max_tokens": 4096, "max_input_tokens": 200000,