From ad7302cdc8cd1818250e83a18d11b57b97566cf5 Mon Sep 17 00:00:00 2001
From: Ishaan Jaff <ishaanjaffer0324@gmail.com>
Date: Sat, 6 Apr 2024 11:25:33 -0700
Subject: [PATCH 1/5] feat - re-use openai client for text completion

---
 litellm/main.py | 1 +
 1 file changed, 1 insertion(+)

diff --git a/litellm/main.py b/litellm/main.py
index 24243d0d6f..c3865c77bb 100644
--- a/litellm/main.py
+++ b/litellm/main.py
@@ -1059,6 +1059,7 @@ def completion(
                 api_key=api_key,
                 api_base=api_base,
                 acompletion=acompletion,
+                client=client,  # pass AsyncOpenAI, OpenAI client
                 logging_obj=logging,
                 optional_params=optional_params,
                 litellm_params=litellm_params,

From 01fef1a9f872551e882c45deca46ecbc313b4d15 Mon Sep 17 00:00:00 2001
From: Ishaan Jaff <ishaanjaffer0324@gmail.com>
Date: Sat, 6 Apr 2024 11:28:25 -0700
Subject: [PATCH 2/5] feat - re-use openai client for text completion

---
 litellm/router.py | 1 +
 1 file changed, 1 insertion(+)

diff --git a/litellm/router.py b/litellm/router.py
index 8c7c1be589..452251a7e4 100644
--- a/litellm/router.py
+++ b/litellm/router.py
@@ -1769,6 +1769,7 @@ class Router:
             or custom_llm_provider == "azure"
             or custom_llm_provider == "custom_openai"
             or custom_llm_provider == "openai"
+            or custom_llm_provider == "text-completion-openai"
             or "ft:gpt-3.5-turbo" in model_name
             or model_name in litellm.open_ai_embedding_models
         ):

From a55f3cdace4cb2b7df3dff16add88fa5dd2ba76a Mon Sep 17 00:00:00 2001
From: Ishaan Jaff <ishaanjaffer0324@gmail.com>
Date: Sat, 6 Apr 2024 11:33:17 -0700
Subject: [PATCH 3/5] test - router re-use openai client

---
 litellm/tests/test_router.py | 32 ++++++++++++++++++++++++++++++++
 1 file changed, 32 insertions(+)

diff --git a/litellm/tests/test_router.py b/litellm/tests/test_router.py
index 3a6043b5a7..97e058ec39 100644
--- a/litellm/tests/test_router.py
+++ b/litellm/tests/test_router.py
@@ -1228,3 +1228,35 @@ def test_router_add_deployment():
     assert len(new_model_id_list) > len(init_model_id_list)
 
     assert new_model_id_list[1] != new_model_id_list[0]
+
+
+@pytest.mark.asyncio
+async def test_router_text_completion_client():
+    # This tests if we re-use the Async OpenAI client
+    # This test fails when we create a new Async OpenAI client per request
+    try:
+        model_list = [
+            {
+                "model_name": "fake-openai-endpoint",
+                "litellm_params": {
+                    "model": "text-completion-openai/gpt-3.5-turbo-instruct",
+                    "api_key": os.getenv("OPENAI_API_KEY", None),
+                    "api_base": "https://exampleopenaiendpoint-production.up.railway.app/",
+                },
+            }
+        ]
+        router = Router(model_list=model_list, debug_level="DEBUG", set_verbose=True)
+        tasks = []
+        for _ in range(300):
+            tasks.append(
+                router.atext_completion(
+                    model="fake-openai-endpoint",
+                    prompt="hello from litellm test",
+                )
+            )
+
+        # Execute all coroutines concurrently
+        responses = await asyncio.gather(*tasks)
+        print(responses)
+    except Exception as e:
+        pytest.fail(f"Error occurred: {e}")

From 3b622556bef8e4ea586a81969f2a8a0530af3c72 Mon Sep 17 00:00:00 2001
From: Ishaan Jaff <ishaanjaffer0324@gmail.com>
Date: Sat, 6 Apr 2024 11:53:26 -0700
Subject: [PATCH 4/5] test - setting org for openai text completion

---
 litellm/tests/test_router_init.py | 60 +++++++++++++++++++++++++++++++
 1 file changed, 60 insertions(+)

diff --git a/litellm/tests/test_router_init.py b/litellm/tests/test_router_init.py
index 0e5ca21a2d..862d7e9658 100644
--- a/litellm/tests/test_router_init.py
+++ b/litellm/tests/test_router_init.py
@@ -490,3 +490,63 @@ def test_init_clients_azure_command_r_plus():
     except Exception as e:
         traceback.print_exc()
         pytest.fail(f"Error occurred: {e}")
+
+
+@pytest.mark.asyncio
+async def test_text_completion_with_organization():
+    try:
+        print("Testing Text OpenAI with organization")
+        model_list = [
+            {
+                "model_name": "openai-bad-org",
+                "litellm_params": {
+                    "model": "text-completion-openai/gpt-3.5-turbo-instruct",
+                    "api_key": os.getenv("OPENAI_API_KEY", None),
+                    "organization": "org-ikDc4ex8NB",
+                },
+            },
+            {
+                "model_name": "openai-good-org",
+                "litellm_params": {
+                    "model": "text-completion-openai/gpt-3.5-turbo-instruct",
+                    "api_key": os.getenv("OPENAI_API_KEY", None),
+                    "organization": os.getenv("OPENAI_ORGANIZATION", None),
+                },
+            },
+        ]
+
+        router = Router(model_list=model_list)
+
+        print(router.model_list)
+        print(router.model_list[0])
+
+        openai_client = router._get_client(
+            deployment=router.model_list[0],
+            kwargs={"input": ["hello"], "model": "openai-bad-org"},
+        )
+        print(vars(openai_client))
+
+        assert openai_client.organization == "org-ikDc4ex8NB"
+
+        # bad org raises error
+
+        try:
+            response = await router.atext_completion(
+                model="openai-bad-org",
+                prompt="this is a test",
+            )
+            pytest.fail("Request should have failed - This organization does not exist")
+        except Exception as e:
+            print("Got exception: " + str(e))
+            assert "No such organization: org-ikDc4ex8NB" in str(e)
+
+        # good org works
+        response = await router.atext_completion(
+            model="openai-good-org",
+            prompt="this is a test",
+            max_tokens=5,
+        )
+        print("working response: ", response)
+
+    except Exception as e:
+        pytest.fail(f"Error occurred: {e}")

From c2f978fd5aadf0fbc509942b7fbe13de83bd27af Mon Sep 17 00:00:00 2001
From: Ishaan Jaff <ishaanjaffer0324@gmail.com>
Date: Sat, 6 Apr 2024 12:07:20 -0700
Subject: [PATCH 5/5] (docs) use text completion with litellm proxy

---
 docs/my-website/docs/providers/openai.md | 6 +++++-
 1 file changed, 5 insertions(+), 1 deletion(-)

diff --git a/docs/my-website/docs/providers/openai.md b/docs/my-website/docs/providers/openai.md
index ccb2c418bc..17ad678463 100644
--- a/docs/my-website/docs/providers/openai.md
+++ b/docs/my-website/docs/providers/openai.md
@@ -44,7 +44,11 @@ export OPENAI_API_KEY=""
 model_list:
   - model_name: gpt-3.5-turbo
     litellm_params:
-      model: gpt-3.5-turbo
+      model: openai/gpt-3.5-turbo                          # The `openai/` prefix will call openai.chat.completions.create
+      api_key: os.environ/OPENAI_API_KEY
+  - model_name: gpt-3.5-turbo-instruct
+    litellm_params:
+      model: text-completion-openai/gpt-3.5-turbo-instruct # The `text-completion-openai/` prefix will call openai.completions.create
       api_key: os.environ/OPENAI_API_KEY
 ```
 </TabItem>