anthropic prompt caching cost tracking (#5453)

* fix(utils.py): support 'drop_params' for embedding requests

Fixes https://github.com/BerriAI/litellm/issues/5444

* feat(anthropic/cost_calculation.py): Support calculating cost for prompt caching on anthropic

* feat(types/utils.py): allows us to migrate to openai's equivalent, once that comes out

* fix: fix linting errors

* test: mark flaky test
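
For context on the prompt-caching cost bullet above: Anthropic reports prompt-caching usage in separate counters alongside the normal input/output token counts, and cache writes and cache reads are billed at different rates than ordinary input tokens. The sketch below only illustrates the general shape of such a calculation; it is not the code added in `anthropic/cost_calculation.py`, and the function name, usage field access, and rate multipliers are assumptions made for illustration.

```python
# Illustrative sketch only -- not the implementation added in this commit.
# Field names and rate multipliers are assumptions for demonstration.

CACHE_WRITE_MULTIPLIER = 1.25  # assumed surcharge for writing a prompt-cache entry
CACHE_READ_MULTIPLIER = 0.10   # assumed discount for reading from the prompt cache


def estimate_anthropic_cost(
    usage: dict,
    input_cost_per_token: float,
    output_cost_per_token: float,
) -> float:
    """Price a request whose usage block carries prompt-caching counters."""
    uncached_input = usage.get("input_tokens", 0)
    cache_writes = usage.get("cache_creation_input_tokens", 0)
    cache_reads = usage.get("cache_read_input_tokens", 0)
    output_tokens = usage.get("output_tokens", 0)

    # Price the three input-token buckets separately, then add completion cost.
    prompt_cost = (
        uncached_input * input_cost_per_token
        + cache_writes * input_cost_per_token * CACHE_WRITE_MULTIPLIER
        + cache_reads * input_cost_per_token * CACHE_READ_MULTIPLIER
    )
    return prompt_cost + output_tokens * output_cost_per_token


# Example: a request that wrote a 2,000-token prompt segment to the cache.
usage = {
    "input_tokens": 120,
    "cache_creation_input_tokens": 2000,
    "cache_read_input_tokens": 0,
    "output_tokens": 350,
}
print(estimate_anthropic_cost(usage, input_cost_per_token=3e-06, output_cost_per_token=15e-06))
```
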
Krish Dholakia 2024-08-31 14:09:35 -07:00 committed by Ishaan Jaff
parent 6aaa7a75cd
commit aa9f1896c6
17 changed files with 432 additions and 84 deletions


@@ -1,11 +1,14 @@
 ## This is a template base class to be used for adding new LLM providers via API calls
+from typing import Any, Optional, Union
+import httpx
+import requests
 import litellm
-import httpx, requests
-from typing import Optional, Union
-from litellm.litellm_core_utils.litellm_logging import Logging
 class BaseLLM:
     _client_session: Optional[httpx.Client] = None
     def process_response(
@@ -14,7 +17,7 @@ class BaseLLM:
         response: Union[requests.Response, httpx.Response],
         model_response: litellm.utils.ModelResponse,
         stream: bool,
-        logging_obj: Logging,
+        logging_obj: Any,
         optional_params: dict,
         api_key: str,
         data: Union[dict, str],
@@ -33,7 +36,7 @@ class BaseLLM:
         response: Union[requests.Response, httpx.Response],
         model_response: litellm.utils.TextCompletionResponse,
         stream: bool,
-        logging_obj: Logging,
+        logging_obj: Any,
         optional_params: dict,
         api_key: str,
         data: Union[dict, str],