fix(proxy_server.py): restrict proxy to just listed models

Krrish Dholakia 2024-02-12 09:30:59 -08:00
parent 5d59fa166c
commit 8f989235ea

@@ -2372,8 +2372,13 @@ async def chat_completion(
             llm_router is not None and data["model"] in llm_router.deployment_names
         ):  # model in router deployments, calling a specific deployment on the router
             response = await llm_router.acompletion(**data, specific_deployment=True)
-        else:  # router is not set
+        elif user_model is not None:  # `litellm --model <your-model-name>`
             response = await litellm.acompletion(**data)
+        else:
+            raise HTTPException(
+                status_code=status.HTTP_422_UNPROCESSABLE_ENTITY,
+                detail={"message": "Invalid model name passed in"},
+            )
 
         # Post Call Processing
         data["litellm_status"] = "success"  # used for alerting
@@ -2584,8 +2589,13 @@ async def embeddings(
             llm_router is not None and data["model"] in llm_router.deployment_names
         ):  # model in router deployments, calling a specific deployment on the router
             response = await llm_router.aembedding(**data, specific_deployment=True)
-        else:
+        elif user_model is not None:  # `litellm --model <your-model-name>`
             response = await litellm.aembedding(**data)
+        else:
+            raise HTTPException(
+                status_code=status.HTTP_422_UNPROCESSABLE_ENTITY,
+                detail={"message": "Invalid model name passed in"},
+            )
 
         ### ALERTING ###
         data["litellm_status"] = "success"  # used for alerting
@@ -2719,8 +2729,13 @@ async def image_generation(
             response = await llm_router.aimage_generation(
                 **data
             )  # ensure this goes the llm_router, router will do the correct alias mapping
-        else:
+        elif user_model is not None:  # `litellm --model <your-model-name>`
            response = await litellm.aimage_generation(**data)
+        else:
+            raise HTTPException(
+                status_code=status.HTTP_422_UNPROCESSABLE_ENTITY,
+                detail={"message": "Invalid model name passed in"},
+            )
 
         ### ALERTING ###
         data["litellm_status"] = "success"  # used for alerting