Auto-expand the model name to its full Vertex AI resource path in cachedContents requests

2025-04-26 11:14:04 +00:00 · 2024-08-08 15:56:46 -07:00 · 2024-08-08 15:56:46 -07:00 · cae941f4c0
commit cae941f4c0
parent 0d662368ac
1 changed file with 6 additions and 0 deletions
--- a/litellm/llms/fine_tuning_apis/vertex_ai.py
+++ b/litellm/llms/fine_tuning_apis/vertex_ai.py
@@ -279,6 +279,12 @@ class VertexFineTuningAPI(VertexLLM):
        elif "countTokens" in request_route:
            url = f"https://{vertex_location}-aiplatform.googleapis.com/v1/projects/{vertex_project}/locations/{vertex_location}{request_route}"
        elif "cachedContents" in request_route:
+            _model = request_data.get("model")
+            if _model is not None and "/publishers/google/models/" not in _model:
+                request_data["model"] = (
+                    f"projects/{vertex_project}/locations/{vertex_location}/publishers/google/models/{_model}"
+                )
+
            url = f"https://{vertex_location}-aiplatform.googleapis.com/v1beta1/projects/{vertex_project}/locations/{vertex_location}{request_route}"
        else:
            raise ValueError(f"Unsupported Vertex AI request route: {request_route}")