mirror of
https://github.com/BerriAI/litellm.git
synced 2025-04-25 18:54:30 +00:00
* ci(config.yml): add a 'check_code_quality' step Addresses https://github.com/BerriAI/litellm/issues/5991 * ci(config.yml): check why circle ci doesn't pick up this test * ci(config.yml): fix to run 'check_code_quality' tests * fix(__init__.py): fix unprotected import * fix(__init__.py): don't remove unused imports * build(ruff.toml): update ruff.toml to ignore unused imports * fix: fix: ruff + pyright - fix linting + type-checking errors * fix: fix linting errors * fix(lago.py): fix module init error * fix: fix linting errors * ci(config.yml): cd into correct dir for checks * fix(proxy_server.py): fix linting error * fix(utils.py): fix bare except causes ruff linting errors * fix: ruff - fix remaining linting errors * fix(clickhouse.py): use standard logging object * fix(__init__.py): fix unprotected import * fix: ruff - fix linting errors * fix: fix linting errors * ci(config.yml): cleanup code qa step (formatting handled in local_testing) * fix(_health_endpoints.py): fix ruff linting errors * ci(config.yml): just use ruff in check_code_quality pipeline for now * build(custom_guardrail.py): include missing file * style(embedding_handler.py): fix ruff check
53 lines
1.6 KiB
Python
53 lines
1.6 KiB
Python
import traceback
|
|
|
|
from fastapi import HTTPException
|
|
|
|
import litellm
|
|
from litellm import verbose_logger
|
|
from litellm.caching import DualCache
|
|
from litellm.integrations.custom_logger import CustomLogger
|
|
from litellm.proxy._types import UserAPIKeyAuth
|
|
|
|
|
|
class _PROXY_MaxBudgetLimiter(CustomLogger):
    """Pre-call hook that rejects requests from users who exhausted their budget.

    The user's row is read from the cache passed to the hook; when the row's
    ``spend`` has reached its ``max_budget`` the request is refused with an
    HTTP 429.
    """

    # No class-level attributes; the limiter keeps no state of its own.

    def __init__(self):
        """Create the limiter (nothing to initialise)."""

    def print_verbose(self, print_statement):
        """Print ``print_statement`` only when ``litellm.set_verbose`` is True."""
        if litellm.set_verbose is not True:
            return
        print(print_statement)  # noqa

    async def async_pre_call_hook(
        self,
        user_api_key_dict: UserAPIKeyAuth,
        cache: DualCache,
        data: dict,
        call_type: str,
    ):
        """Block the call when the cached user row shows the budget is used up.

        Args:
            user_api_key_dict: Auth info for the caller; its ``user_id`` is
                used to build the cache key.
            cache: Cache queried (via ``get_cache``) for the user's row.
            data: Request payload. Not read by this hook.
            call_type: Kind of call being made. Not read by this hook.

        Returns:
            None. The hook returns without raising when the request is
            allowed or when no budget information is available.

        Raises:
            HTTPException: 429 when ``spend`` >= ``max_budget``.

        Any other exception raised while checking is logged through
        ``verbose_logger`` and swallowed, so the request is not blocked.
        """
        try:
            self.print_verbose("Inside Max Budget Limiter Pre-Call Hook")

            user_cache_key = f"{user_api_key_dict.user_id}_user_api_key_user_id"
            cached_user = cache.get_cache(user_cache_key)
            if cached_user is None:  # value not yet cached
                return

            budget_cap = cached_user["max_budget"]
            spend_so_far = cached_user["spend"]

            # Without both a budget and a recorded spend there is nothing to enforce.
            if budget_cap is None or spend_so_far is None:
                return

            # CHECK IF REQUEST ALLOWED
            if spend_so_far >= budget_cap:
                raise HTTPException(status_code=429, detail="Max budget limit reached.")
        except HTTPException as budget_error:
            # Let the 429 propagate to the caller untouched.
            raise budget_error
        except Exception as unexpected_error:
            log_message = "litellm.proxy.hooks.max_budget_limiter.py::async_pre_call_hook(): Exception occured - {}".format(
                str(unexpected_error)
            )
            verbose_logger.exception(log_message)
|