fix(pattern_match_deployments.py): default to user input if unable to… (#6632)
* fix(pattern_match_deployments.py): default to user input if unable to map based on wildcards (sketched below)
* test: fix test
* test: reset test name
* test: update conftest to reload proxy server module between tests (see the conftest sketch below)
* ci(config.yml): move langfuse out of local_testing to reduce ci/cd time
* ci(config.yml): clean up langfuse ci/cd tests
* fix: update test to not use global proxy_server app module
* ci: move caching to a separate test pipeline to speed up the ci pipeline
* test: update conftest to check if the proxy_server attr exists before reloading
* build(conftest.py): don't block on inability to reload proxy_server
* ci(config.yml): update caching unit test filter to also match the 'cache' keyword
* fix(encrypt_decrypt_utils.py): use a function to get the salt key
* test: mark flaky test
* test: handle anthropic overloaded errors
* refactor: create a separate ci/cd pipeline for proxy unit tests to make ci/cd faster
* ci(config.yml): add litellm_proxy_unit_testing to build_and_test jobs
* ci(config.yml): generate prisma binaries for proxy unit tests
* test: re-add vertex_key.json
* ci(config.yml): remove `-s` from the proxy_unit_test cmd to speed up tests
* ci: remove any 'debug' logging flags to speed up the ci pipeline
* test: fix test
* test(test_braintrust.py): rerun
* test: add delay for braintrust test
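The headline fix is the wildcard fallback. A minimal sketch of the described behavior, using a hypothetical pattern table (PATTERN_DEPLOYMENTS) and helper (match_deployment) rather than LiteLLM's actual implementation:

import re

# Hypothetical table mapping wildcard model patterns to deployment names.
# Illustrative only; LiteLLM's real pattern router is more involved.
PATTERN_DEPLOYMENTS = {
    "openai/*": "openai-deployment",
    "anthropic/*": "anthropic-deployment",
}

def match_deployment(requested_model: str) -> str:
    """Return the deployment for a wildcard match, else the user's input."""
    for pattern, deployment in PATTERN_DEPLOYMENTS.items():
        # Translate the glob-style wildcard into an anchored regex.
        regex = "^" + re.escape(pattern).replace(r"\*", ".*") + "$"
        if re.match(regex, requested_model):
            return deployment
    # The fix described above: default to the user's input instead of
    # failing when no wildcard pattern maps the requested model.
    return requested_model

assert match_deployment("openai/gpt-4o") == "openai-deployment"
assert match_deployment("my-custom-model") == "my-custom-model"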
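Several of the conftest changes guard the proxy_server module reload between tests. A minimal sketch of that pattern, assuming a hypothetical conftest.py fixture (the real conftest differs):

import importlib
import sys

import pytest

@pytest.fixture(autouse=True)
def reload_proxy_server():
    """Reload litellm.proxy.proxy_server between tests so module-level
    state set by one test doesn't leak into the next."""
    module = sys.modules.get("litellm.proxy.proxy_server")
    # Check the module is actually loaded before reloading, and don't
    # block the test run if the reload fails for any reason.
    if module is not None:
        try:
            importlib.reload(module)
        except Exception:
            pass
    yield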
This commit is contained in:
parent 44840d615d
commit 27e18358ab
77 changed files with 2861 additions and 76 deletions
@@ -1,104 +0,0 @@
#### What this tests ####
# This tests using caching w/ litellm, which requires SSL=True
import sys, os
import traceback
from dotenv import load_dotenv

load_dotenv()
import os, io

# this file is to test litellm/proxy

sys.path.insert(
    0, os.path.abspath("../..")
)  # Adds the parent directory to the system path
import pytest, logging, asyncio
import litellm
from litellm import embedding, completion, completion_cost, Timeout
from litellm import RateLimitError

# Configure logging
logging.basicConfig(
    level=logging.DEBUG,  # Set the desired logging level
    format="%(asctime)s - %(levelname)s - %(message)s",
)

# test /chat/completions requests to the proxy
from fastapi.testclient import TestClient
from fastapi import FastAPI
from litellm.proxy.proxy_server import (
    router,
    save_worker_config,
    initialize,
)  # Replace with the actual module where your FastAPI router is defined

# Your bearer token
token = "sk-1234"

headers = {"Authorization": f"Bearer {token}"}


@pytest.fixture(scope="function")
def client_no_auth():
    # Assuming litellm.proxy.proxy_server is an object
    from litellm.proxy.proxy_server import cleanup_router_config_variables

    cleanup_router_config_variables()
    filepath = os.path.dirname(os.path.abspath(__file__))
    config_fp = f"{filepath}/test_configs/test_cloudflare_azure_with_cache_config.yaml"
    # initialize can run in parallel; it sets variables specific to the FastAPI
    # app, so when it runs in parallel, different tests can pick up the wrong variables
    asyncio.run(initialize(config=config_fp, debug=True))
    app = FastAPI()
    app.include_router(router)  # Include your router in the test app

    return TestClient(app)


def generate_random_word(length=4):
    import string, random

    letters = string.ascii_lowercase
    return "".join(random.choice(letters) for _ in range(length))


@pytest.mark.skip(reason="AWS Suspended Account")
def test_chat_completion(client_no_auth):
    global headers
    try:
        user_message = f"Write a poem about {generate_random_word()}"
        messages = [{"content": user_message, "role": "user"}]
        # Your test data
        test_data = {
            "model": "azure-cloudflare",
            "messages": messages,
            "max_tokens": 10,
        }

        print("testing proxy server with chat completions")
        response = client_no_auth.post("/v1/chat/completions", json=test_data)
        print(f"response - {response.text}")
        assert response.status_code == 200

        response = response.json()
        print(response)

        content = response["choices"][0]["message"]["content"]
        response1_id = response["id"]

        print("\n content", content)

        assert len(content) > 1

        print("\nmaking 2nd request to proxy. Testing caching + non streaming")
        response = client_no_auth.post("/v1/chat/completions", json=test_data)
        print(f"response - {response.text}")
        assert response.status_code == 200

        response = response.json()
        print(response)
        response2_id = response["id"]
        assert response1_id == response2_id
        litellm.disable_cache()

    except Exception as e:
        pytest.fail(f"LiteLLM Proxy test failed. Exception - {str(e)}")
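A note on the deleted test's cache check: it works because LiteLLM returns the cached response verbatim on the second, identical request, so the second response's `id` equals the first's, whereas a fresh completion would carry a new id. One possible hardening, not present in the original, is to run cleanup in a finally block so a failed assertion can't leave caching enabled for later tests:

# Sketch only: run the test body through try/finally so the cache is
# always disabled, even when an assertion fails mid-test.
try:
    run_cache_assertions()  # hypothetical stand-in for the request/assert steps above
finally:
    litellm.disable_cache()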