From 8fb237b6fbda905e28fc0bf86d01e6fbf5a08d97 Mon Sep 17 00:00:00 2001 From: r-bit-rry Date: Mon, 17 Nov 2025 11:53:12 +0200 Subject: [PATCH] Warn when SQLite is used with multiple Gunicorn workers --- src/llama_stack/cli/stack/run.py | 4 ++++ 1 file changed, 4 insertions(+) diff --git a/src/llama_stack/cli/stack/run.py b/src/llama_stack/cli/stack/run.py index 4778abc06..b3a60f54e 100644 --- a/src/llama_stack/cli/stack/run.py +++ b/src/llama_stack/cli/stack/run.py @@ -375,6 +375,10 @@ class StackRun(Subcommand): logger.info(f"Worker recycling: every {max_requests}±{max_requests_jitter} requests (prevents memory leaks)") logger.info(f"Total concurrent capacity: {num_workers * worker_connections} connections") + # Warn if using SQLite with multiple workers + if num_workers > 1 and os.getenv("SQLITE_STORE_DIR"): + logger.warning("SQLite detected with multiple GUNICORN workers - writes will be serialized.") + # Execute the Gunicorn command # If Gunicorn is not found or fails to start, raise the exception for the caller to handle subprocess.run(gunicorn_command, check=True)