build: migrate all constants into constants.py

2025-04-25 18:54:30 +00:00 · 2025-03-24 18:11:21 -07:00 · 2025-03-24 18:11:21 -07:00 · c11e0de69d
commit c11e0de69d
parent 7882bdc787
3 changed files with 11 additions and 5 deletions
--- a/litellm/constants.py
+++ b/litellm/constants.py
@@ -18,9 +18,13 @@ MAX_SIZE_PER_ITEM_IN_MEMORY_CACHE_IN_KB = 1024  # 1MB = 1024KB
 SINGLE_DEPLOYMENT_TRAFFIC_FAILURE_THRESHOLD = 1000  # Minimum number of requests to consider "reasonable traffic". Used for single-deployment cooldown logic.
 #### RELIABILITY ####
 REPEATED_STREAMING_CHUNK_LIMIT = 100  # catch if model starts looping the same chunk while streaming. Uses high default to prevent false positives.
+DEFAULT_MAX_LRU_CACHE_SIZE = 16
 #### Networking settings ####
 request_timeout: float = 6000  # time in seconds
 STREAM_SSE_DONE_STRING: str = "[DONE]"
+#### SPEND TRACKING ####
+DEFAULT_REPLICATE_GPU_PRICE_PER_SECOND = 0.001400  # price per second for an A100 80GB GPU
+

 LITELLM_CHAT_PROVIDERS = [
    "openai",