diff --git a/.github/workflows/load_test.yml b/.github/workflows/load_test.yml index 3e4ae97f6..38adb6906 100644 --- a/.github/workflows/load_test.yml +++ b/.github/workflows/load_test.yml @@ -23,7 +23,7 @@ jobs: with: LOCUSTFILE: ".github/workflows/locustfile.py" URL: "https://litellm-database-docker-build-production.up.railway.app/" - USERS: "2000" + USERS: "200" RATE: "20" RUNTIME: "300s" - name: Process Load Test Stats diff --git a/.github/workflows/locustfile.py b/.github/workflows/locustfile.py index e25ae9bbf..ad7dd98f6 100644 --- a/.github/workflows/locustfile.py +++ b/.github/workflows/locustfile.py @@ -4,9 +4,7 @@ import time class MyUser(HttpUser): - wait_time = between(1, 5) - - @task(2) + @task(20) def chat_completion(self): headers = { "Content-Type": "application/json", @@ -29,13 +27,13 @@ class MyUser(HttpUser): # Print or log the response if needed - @task(10) + @task(40) def health_readiness(self): start_time = time.time() response = self.client.get("health/readiness") response_time = time.time() - start_time - @task(10) + @task(40) def health_liveliness(self): start_time = time.time() response = self.client.get("health/liveliness")