fix(proxy_server.py): track cost for global proxy

This commit is contained in:
Krrish Dholakia 2024-01-24 16:06:10 -08:00
parent ba24037baf
commit 574208f005
3 changed files with 44 additions and 22 deletions

View file

@@ -636,29 +636,39 @@ async def update_database(
### UPDATE USER SPEND ### ### UPDATE USER SPEND ###
async def _update_user_db(): async def _update_user_db():
if user_id is None: """
return - Update that user's row
if prisma_client is not None: - Update litellm-proxy-budget row (global proxy spend)
existing_spend_obj = await prisma_client.get_data(user_id=user_id) """
elif custom_db_client is not None: user_ids = [user_id, "litellm-proxy-budget"]
existing_spend_obj = await custom_db_client.get_data( data_list = []
key=user_id, table_name="user" for id in user_ids:
) if id is None:
if existing_spend_obj is None: continue
existing_spend = 0 if prisma_client is not None:
else: existing_spend_obj = await prisma_client.get_data(user_id=id)
existing_spend = existing_spend_obj.spend elif custom_db_client is not None:
existing_spend_obj = await custom_db_client.get_data(
key=id, table_name="user"
)
if existing_spend_obj is None:
existing_spend = 0
else:
existing_spend = existing_spend_obj.spend
# Calculate the new cost by adding the existing cost and response_cost # Calculate the new cost by adding the existing cost and response_cost
new_spend = existing_spend + response_cost existing_spend_obj.spend = existing_spend + response_cost
verbose_proxy_logger.debug(f"new cost: {existing_spend_obj.spend}")
data_list.append(existing_spend_obj)
verbose_proxy_logger.debug(f"new cost: {new_spend}")
# Update the cost column for the given user id # Update the cost column for the given user id
if prisma_client is not None: if prisma_client is not None:
await prisma_client.update_data( await prisma_client.update_data(
user_id=user_id, data={"spend": new_spend} data_list=data_list, query_type="update_many", table_name="user"
) )
elif custom_db_client is not None: elif custom_db_client is not None and user_id is not None:
new_spend = data_list[0].spend
await custom_db_client.update_data( await custom_db_client.update_data(
key=user_id, value={"spend": new_spend}, table_name="user" key=user_id, value={"spend": new_spend}, table_name="user"
) )
@@ -1563,7 +1573,13 @@ async def startup_event():
if prisma_client is not None and master_key is not None: if prisma_client is not None and master_key is not None:
# add master key to db # add master key to db
await generate_key_helper_fn( await generate_key_helper_fn(
duration=None, models=[], aliases={}, config={}, spend=0, token=master_key duration=None,
models=[],
aliases={},
config={},
spend=0,
token=master_key,
user_id="default_user_id",
) )
if ( if (

View file

@@ -634,7 +634,7 @@ class PrismaClient:
"update": {}, # don't do anything if it already exists "update": {}, # don't do anything if it already exists
}, },
) )
print_verbose( verbose_proxy_logger.info(
"\033[91m" "\033[91m"
+ f"DB User Table - update succeeded {update_user_row}" + f"DB User Table - update succeeded {update_user_row}"
+ "\033[0m" + "\033[0m"
@@ -678,6 +678,7 @@ class PrismaClient:
Batch write update queries Batch write update queries
""" """
batcher = self.db.batch_() batcher = self.db.batch_()
verbose_proxy_logger.debug(f"data list for user table: {data_list}")
for idx, user in enumerate(data_list): for idx, user in enumerate(data_list):
try: try:
data_json = self.jsonify_object(data=user.model_dump()) data_json = self.jsonify_object(data=user.model_dump())
@@ -688,8 +689,8 @@ class PrismaClient:
data={**data_json}, # type: ignore data={**data_json}, # type: ignore
) )
await batcher.commit() await batcher.commit()
print_verbose( verbose_proxy_logger.info(
"\033[91m" + f"DB User Table update succeeded" + "\033[0m" "\033[91m" + f"DB User Table Batch update succeeded" + "\033[0m"
) )
except Exception as e: except Exception as e:
asyncio.create_task( asyncio.create_task(

View file

@@ -1090,7 +1090,12 @@ class Logging:
else: # streaming chunks + image gen. else: # streaming chunks + image gen.
self.model_call_details["response_cost"] = None self.model_call_details["response_cost"] = None
if litellm.max_budget and self.stream: if (
litellm.max_budget
and self.stream
and result is not None
and "content" in result
):
time_diff = (end_time - start_time).total_seconds() time_diff = (end_time - start_time).total_seconds()
float_diff = float(time_diff) float_diff = float(time_diff)
litellm._current_cost += litellm.completion_cost( litellm._current_cost += litellm.completion_cost(