From e14ef3eeda8d921ef3feaf3fae7bfe820ec69169 Mon Sep 17 00:00:00 2001 From: Wanis Elabbar <70503629+elabbarw@users.noreply.github.com> Date: Tue, 23 Jul 2024 23:57:50 +0100 Subject: [PATCH] feat - add azure_ai llama v3.1 8B 70B and 405B --- model_prices_and_context_window.json | 27 +++++++++++++++++++++++++++ 1 file changed, 27 insertions(+) diff --git a/model_prices_and_context_window.json b/model_prices_and_context_window.json index f86ea8bd7..4c6dd8fdb 100644 --- a/model_prices_and_context_window.json +++ b/model_prices_and_context_window.json @@ -760,6 +760,33 @@ "litellm_provider": "azure_ai", "mode": "chat" }, + "azure_ai/Meta-Llama-31-8B-Instruct": { + "max_tokens": 128000, + "max_input_tokens": 128000, + "max_output_tokens": 128000, + "input_cost_per_token": 0.0000003, + "output_cost_per_token": 0.00000061, + "litellm_provider": "azure_ai", + "mode": "chat" + }, + "azure_ai/Meta-Llama-31-70B-Instruct": { + "max_tokens": 128000, + "max_input_tokens": 128000, + "max_output_tokens": 128000, + "input_cost_per_token": 0.00000268, + "output_cost_per_token": 0.00000354, + "litellm_provider": "azure_ai", + "mode": "chat" + }, + "azure_ai/Meta-Llama-31-405B-Instruct": { + "max_tokens": 128000, + "max_input_tokens": 128000, + "max_output_tokens": 128000, + "input_cost_per_token": 0.00000533, + "output_cost_per_token": 0.000016, + "litellm_provider": "azure_ai", + "mode": "chat" + }, "babbage-002": { "max_tokens": 16384, "max_input_tokens": 16384,