fix: Unregister a model from the registry if it is not being served by vLLM

Signed-off-by: Yuan Tang <terrytangyuan@gmail.com>
This commit is contained in:
Yuan Tang 2025-02-20 13:04:15 -05:00
parent b890d7a611
commit 6abfe0c43b
No known key found for this signature in database

View file

@ -231,7 +231,7 @@ class VLLMInferenceAdapter(Inference, ModelsProtocolPrivate):
pass pass
async def unregister_model(self, model_id: str) -> None: async def unregister_model(self, model_id: str) -> None:
pass await self.register_helper.unregister_model(model_id)
async def completion( async def completion(
self, self,
@ -342,6 +342,7 @@ class VLLMInferenceAdapter(Inference, ModelsProtocolPrivate):
res = self.client.models.list() res = self.client.models.list()
available_models = [m.id for m in res] available_models = [m.id for m in res]
if model.provider_resource_id not in available_models: if model.provider_resource_id not in available_models:
await self.unregister_model(model.provider_resource_id)
raise ValueError( raise ValueError(
f"Model {model.provider_resource_id} is not being served by vLLM. " f"Model {model.provider_resource_id} is not being served by vLLM. "
f"Available models: {', '.join(available_models)}" f"Available models: {', '.join(available_models)}"