Merge pull request #2877 from BerriAI/litellm_fix_text_completion

[Feat] Text-Completion-OpenAI - Re-use OpenAI Client
2025-04-26 11:14:04 +00:00 · 2024-04-06 12:15:52 -07:00 · 2024-04-06 12:15:52 -07:00 · a2c63075ef
commit a2c63075ef
parent b49e47b634 c2f978fd5a
5 changed files with 99 additions and 1 deletions
--- a/docs/my-website/docs/providers/openai.md
+++ b/docs/my-website/docs/providers/openai.md
@@ -44,7 +44,11 @@ export OPENAI_API_KEY=""
 model_list:
  - model_name: gpt-3.5-turbo
    litellm_params:
-      model: gpt-3.5-turbo
+      model: openai/gpt-3.5-turbo                          # The `openai/` prefix will call openai.chat.completions.create
      api_key: os.environ/OPENAI_API_KEY
  - model_name: gpt-3.5-turbo-instruct
    litellm_params:
      model: text-completion-openai/gpt-3.5-turbo-instruct # The `text-completion-openai/` prefix will call openai.completions.create
      api_key: os.environ/OPENAI_API_KEY
 ```
 </TabItem>
--- a/litellm/main.py
+++ b/litellm/main.py
@@ -1060,6 +1060,7 @@ def completion(
                api_key=api_key,
                api_base=api_base,
                acompletion=acompletion,
                client=client,  # pass AsyncOpenAI, OpenAI client
                logging_obj=logging,
                optional_params=optional_params,
                litellm_params=litellm_params,
--- a/litellm/router.py
+++ b/litellm/router.py
@@ -1769,6 +1769,7 @@ class Router:
            or custom_llm_provider == "azure"
            or custom_llm_provider == "custom_openai"
            or custom_llm_provider == "openai"
            or custom_llm_provider == "text-completion-openai"
            or "ft:gpt-3.5-turbo" in model_name
            or model_name in litellm.open_ai_embedding_models
        ):
--- a/litellm/tests/test_router.py
+++ b/litellm/tests/test_router.py
@@ -1228,3 +1228,35 @@ def test_router_add_deployment():
    assert len(new_model_id_list) > len(init_model_id_list)
    assert new_model_id_list[1] != new_model_id_list[0]
@pytest.mark.asyncio
async def test_router_text_completion_client():
    """Send 300 concurrent text completions through a single Router deployment.

    Checks that the async OpenAI client is re-used across requests: the test
    is expected to fail when a new async OpenAI client is created per request.
    Any exception raised while building the router or awaiting the requests
    is reported as a test failure.
    """
    try:
        deployment = {
            "model_name": "fake-openai-endpoint",
            "litellm_params": {
                "model": "text-completion-openai/gpt-3.5-turbo-instruct",
                "api_key": os.getenv("OPENAI_API_KEY", None),
                "api_base": "https://exampleopenaiendpoint-production.up.railway.app/",
            },
        }
        router = Router(
            model_list=[deployment],
            debug_level="DEBUG",
            set_verbose=True,
        )

        # Build every coroutine up front so they are all awaited concurrently.
        pending = [
            router.atext_completion(
                model="fake-openai-endpoint",
                prompt="hello from litellm test",
            )
            for _ in range(300)
        ]
        responses = await asyncio.gather(*pending)
        print(responses)
    except Exception as e:
        pytest.fail(f"Error occurred: {e}")
--- a/litellm/tests/test_router_init.py
+++ b/litellm/tests/test_router_init.py
@@ -490,3 +490,63 @@ def test_init_clients_azure_command_r_plus():
    except Exception as e:
        traceback.print_exc()
        pytest.fail(f"Error occurred: {e}")
@pytest.mark.asyncio
async def test_text_completion_with_organization():
    """Check that a deployment's ``organization`` is applied to text completions.

    Two deployments use the same model and API key but different
    organizations: a hard-coded one that the test expects the API to reject,
    and the one read from ``OPENAI_ORGANIZATION``. The test asserts that:

    * the client returned for the first deployment carries its organization,
    * a request through that deployment fails with a
      "No such organization" error,
    * a request through the second deployment completes.

    Any other exception is reported as a test failure.
    """
    try:
        print("Testing Text OpenAI with organization")

        # Deployment alias -> organization; insertion order fixes list order.
        org_by_alias = {
            "openai-bad-org": "org-ikDc4ex8NB",
            "openai-good-org": os.getenv("OPENAI_ORGANIZATION", None),
        }
        model_list = [
            {
                "model_name": alias,
                "litellm_params": {
                    "model": "text-completion-openai/gpt-3.5-turbo-instruct",
                    "api_key": os.getenv("OPENAI_API_KEY", None),
                    "organization": organization,
                },
            }
            for alias, organization in org_by_alias.items()
        ]

        router = Router(model_list=model_list)
        print(router.model_list)
        bad_org_deployment = router.model_list[0]
        print(bad_org_deployment)

        client = router._get_client(
            deployment=bad_org_deployment,
            kwargs={"input": ["hello"], "model": "openai-bad-org"},
        )
        print(vars(client))
        assert client.organization == "org-ikDc4ex8NB"

        # The bad organization must be rejected by the API.
        try:
            await router.atext_completion(
                model="openai-bad-org",
                prompt="this is a test",
            )
            pytest.fail("Request should have failed - This organization does not exist")
        except Exception as e:
            print("Got exception: " + str(e))
            assert "No such organization: org-ikDc4ex8NB" in str(e)

        # The good organization must go through.
        good_response = await router.atext_completion(
            model="openai-good-org",
            prompt="this is a test",
            max_tokens=5,
        )
        print("working response: ", good_response)
    except Exception as e:
        pytest.fail(f"Error occurred: {e}")