Mirror of https://github.com/BerriAI/litellm.git (synced 2025-04-27 03:34:10 +00:00)
adding support for completions endpoint in proxy
This commit is contained in:
parent b08aea851f
commit c737462beb
5 changed files with 42 additions and 4 deletions
Binary file not shown.
```diff
@@ -1431,7 +1431,25 @@ def text_completion(*args, **kwargs):
         messages = [{"role": "system", "content": kwargs["prompt"]}]
         kwargs["messages"] = messages
         kwargs.pop("prompt")
-        return completion(*args, **kwargs)
+        response = completion(*args, **kwargs) # assume the response is the openai response object
+        response_2 = {
+            "id": response["id"],
+            "object": "text_completion",
+            "created": response["created"],
+            "model": response["model"],
+            "choices": [
+                {
+                    "text": response["choices"][0]["message"]["content"],
+                    "index": response["choices"][0]["index"],
+                    "logprobs": None,
+                    "finish_reason": response["choices"][0]["finish_reason"]
+                }
+            ],
+            "usage": response["usage"]
+        }
+        return response_2
     else:
         raise ValueError("please pass prompt into the `text_completion` endpoint - `text_completion(model, prompt='hello world')`")
 
 ##### Moderation #######################
 def moderation(input: str, api_key: Optional[str]=None):
```
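To illustrate how the reshaped response above would be consumed, here is a minimal sketch; the model name and prompt are placeholders, and it assumes `text_completion` is exported from the top-level `litellm` package, as the proxy hunk further down suggests.

```python
import litellm

# text_completion maps `prompt` into a chat-style `messages` list, calls
# completion(), and reshapes the chat response into a text_completion-style dict.
response = litellm.text_completion(model="gpt-3.5-turbo", prompt="hello world")

# The generated text now lives under choices[0]["text"], mirroring the
# OpenAI text-completion schema constructed in the hunk above.
print(response["choices"][0]["text"])
print(response["usage"])
```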
```diff
@@ -7,7 +7,8 @@ load_dotenv()
 @click.option('--api_base', default=None, help='API base URL.')
 @click.option('--model', required=True, help='The model name to pass to litellm expects')
 def run_server(port, api_base, model):
-    from .proxy_server import app, initialize
+    # from .proxy_server import app, initialize
+    from proxy_server import app, initialize
     initialize(model, api_base)
     try:
         import uvicorn
```
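For reference, a rough sketch of what `run_server` does once invoked, assuming `proxy_server` is importable from the working directory (as the changed import implies) and that `initialize` simply records the model and api_base for later requests; the model name, host, and port below are placeholders, since the CLI's `--port` default is not shown in this hunk.

```python
import uvicorn
from proxy_server import app, initialize  # same import style the CLI now uses

# Record which model (and optional api_base) the proxy should route requests to.
initialize("gpt-3.5-turbo", None)  # placeholder model, no custom api_base

# Serve the FastAPI app; host and port are assumptions for illustration.
uvicorn.run(app, host="0.0.0.0", port=8000)
```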
```diff
@@ -1,4 +1,10 @@
+import sys, os
+sys.path.insert(
+    0, os.path.abspath("../..")
+) # Adds the parent directory to the system path
+
 import litellm
+print(litellm.__file__)
 from fastapi import FastAPI, Request
 from fastapi.responses import StreamingResponse
 import json
```
```diff
@@ -25,8 +31,21 @@ def model_list():
         object="list",
     )
 
-@app.post("/chat/completions")
+@app.post("/completions")
+async def completion(request: Request):
+    data = await request.json()
+    if (user_model is None):
+        raise ValueError("Proxy model needs to be set")
+    data["model"] = user_model
+    if user_api_base:
+        data["api_base"] = user_api_base
+    response = litellm.text_completion(**data)
+    if 'stream' in data and data['stream'] == True: # use generate_responses to stream responses
+        return StreamingResponse(data_generator(response), media_type='text/event-stream')
+    return response
+
+@app.post("/chat/completions")
 async def chat_completion(request: Request):
     data = await request.json()
     if (user_model is None):
         raise ValueError("Proxy model needs to be set")
```
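To exercise the new `/completions` route from a client, a hedged sketch using `requests` (not part of this diff); the proxy address `http://localhost:8000` is an assumption, and the payload carries only text_completion-style fields because the proxy injects `model` (and `api_base`, if set) server-side.

```python
import requests

# Minimal non-streaming call to the new /completions endpoint.
resp = requests.post(
    "http://localhost:8000/completions",  # proxy address is an assumption
    json={"prompt": "hello world"},
)
print(resp.json()["choices"][0]["text"])
```

Sending `"stream": true` in the payload would instead return a `text/event-stream` response, which a client reads incrementally.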
```diff
@@ -1,6 +1,6 @@
 [tool.poetry]
 name = "litellm"
-version = "0.1.789"
+version = "0.1.790"
 description = "Library to easily interface with LLM API providers"
 authors = ["BerriAI"]
 license = "MIT License"
```