fix(utils.py): fix sagemaker async logging for sync streaming

https://github.com/BerriAI/litellm/issues/1592
2024-01-25 12:49:45 -08:00 · 2024-01-25 12:49:45 -08:00 · 09ec6d6458
commit 09ec6d6458
parent 39d5407e67
10 changed files with 247 additions and 64 deletions
--- a/proxy_server_config.yaml
+++ b/proxy_server_config.yaml
@@ -11,6 +11,10 @@ model_list:
      api_base: https://openai-gpt-4-test-v-1.openai.azure.com/
      api_version: "2023-05-15"
      api_key: os.environ/AZURE_API_KEY # The `os.environ/` prefix tells litellm to read this from the env. See https://docs.litellm.ai/docs/simple_proxy#load-api-keys-from-vault
+  - model_name: sagemaker-completion-model  # name of this model_list entry
+    litellm_params:
+      model: sagemaker/berri-benchmarking-Llama-2-70b-chat-hf-4  # presumably <provider>/<endpoint name>, like `azure/gpt-turbo` below — confirm
+      input_cost_per_second: 0.000420  # NOTE(review): per-second input cost going by the key name; currency/unit not stated here — confirm
  - model_name: gpt-4
    litellm_params:
      model: azure/gpt-turbo