feat(proxy_cli.py): when user calls ollama model, run ollama serve

Krrish Dholakia 2023-10-06 16:45:26 -07:00
parent 56c87febae
commit 52b0bcb5ec
4 changed files with 8 additions and 0 deletions


@@ -13,6 +13,12 @@ config_filename = ".env.litellm"
config_dir = appdirs.user_config_dir("litellm")
user_config_path = os.path.join(config_dir, config_filename)

def run_ollama_serve():
    command = ['ollama', 'serve']
    with open(os.devnull, 'w') as devnull:
        process = subprocess.Popen(command, stdout=devnull, stderr=devnull)

def load_config():
    try:
        if not os.path.exists(user_config_path):
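
For reference, a minimal sketch of a more defensive variant of the new helper is shown below; the FileNotFoundError guard, the name run_ollama_serve_safe, and the warning message are assumptions for illustration and are not part of this commit.

import os
import subprocess

def run_ollama_serve_safe():
    # Same idea as run_ollama_serve above: start `ollama serve` in the
    # background and discard its output, but skip gracefully when the
    # `ollama` binary is not on PATH (hypothetical hardening).
    command = ['ollama', 'serve']
    try:
        with open(os.devnull, 'w') as devnull:
            subprocess.Popen(command, stdout=devnull, stderr=devnull)
    except FileNotFoundError:
        print("LiteLLM: `ollama` not found on PATH; skipping `ollama serve`")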
@@ -82,6 +88,8 @@ def run_server(port, api_base, model, deploy, debug, temperature, max_tokens, te
        print(f"\033[32mLiteLLM: Test your URL using the following: \"litellm --test {url}\"\033[0m")
        return
    if "ollama" in model:
        run_ollama_serve()
    if test != False:
        click.echo('LiteLLM: Making a test ChatCompletions request to your proxy')
        import openai
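
Taken together, the change means any model string containing "ollama" now starts the local server before the proxy begins handling requests. A rough sketch of that dispatch, using a hypothetical model value, is below.

# Illustrative only: mirrors the new branch in run_server().
model = "ollama/llama2"   # hypothetical CLI value, e.g. `litellm --model ollama/llama2`
if "ollama" in model:     # simple substring check added by this commit
    run_ollama_serve()    # spawn `ollama serve` in the background first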