(fix) together_ai use sync generator

2024-01-23 20:07:26 -08:00 · 2024-01-23 20:07:26 -08:00 · 2d26875eb0
commit 2d26875eb0
parent fcd66eac7d
2 changed files with 10 additions and 8 deletions
--- a/litellm/proxy/proxy_config.yaml
+++ b/litellm/proxy/proxy_config.yaml
@ -25,6 +25,9 @@ model_list:
  - model_name: BEDROCK_GROUP
    litellm_params:
      model: bedrock/cohere.command-text-v14
+  - model_name: tg-ai
+    litellm_params:
+      model: together_ai/mistralai/Mistral-7B-Instruct-v0.1
  - model_name: sagemaker
    litellm_params:
      model: sagemaker/berri-benchmarking-Llama-2-70b-chat-hf-4
--- a/litellm/proxy/proxy_server.py
+++ b/litellm/proxy/proxy_server.py
@ -1450,10 +1450,9 @@ async def async_data_generator(response, user_api_key_dict):
 def select_data_generator(response, user_api_key_dict):
    try:
        # since boto3 - sagemaker does not support async calls, we should use a sync data_generator
-        if (
+        if hasattr(
-            hasattr(response, "custom_llm_provider")
+            response, "custom_llm_provider"
-            and response.custom_llm_provider == "sagemaker"
+        ) and response.custom_llm_provider in ["sagemaker", "together_ai"]:
-        ):
            return data_generator(
                response=response,
            )
@ -2243,13 +2242,14 @@ async def generate_key_fn(
        if "max_budget" in data_json:
            data_json["key_max_budget"] = data_json.pop("max_budget", None)
        if "budget_duration" in data_json:
            data_json["key_budget_duration"] = data_json.pop("budget_duration", None)
        response = await generate_key_helper_fn(**data_json)
        return GenerateKeyResponse(
-            key=response["token"], expires=response["expires"], user_id=response["user_id"]
+            key=response["token"],
            expires=response["expires"],
            user_id=response["user_id"],
        )
    except Exception as e:
        if isinstance(e, HTTPException):
@ -2269,7 +2269,6 @@ async def generate_key_fn(
        )
@router.post(
    "/key/update", tags=["key management"], dependencies=[Depends(user_api_key_auth)]
 )