Since we are pushing for HF repos, we should accept them in inference configs (#497)
# What does this PR do?
As the title says: since we are pushing users towards HuggingFace repos, inference provider configs should accept HF repo IDs in addition to model descriptors.
## Test Plan
This needs 8752149f58 to land as well; the next package release (0.0.54) will then make this work properly.
The test is:
```bash
pytest -v -s -m "llama_3b and meta_reference" test_model_registration.py
```
Parent: b3f9e8b2f2
Commit: e84d4436b5

5 changed files with 14 additions and 8 deletions
One of the hunks, from the `VLLMConfig` model validator:

```diff
@@ -48,8 +48,11 @@ class VLLMConfig(BaseModel):
     @classmethod
     def validate_model(cls, model: str) -> str:
         permitted_models = supported_inference_models()
-        if model not in permitted_models:
-            model_list = "\n\t".join(permitted_models)
+
+        descriptors = [m.descriptor() for m in permitted_models]
+        repos = [m.huggingface_repo for m in permitted_models]
+        if model not in (descriptors + repos):
+            model_list = "\n\t".join(repos)
             raise ValueError(
                 f"Unknown model: `{model}`. Choose from [\n\t{model_list}\n]"
             )
```
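For reference, here is a minimal, self-contained sketch of the new validation behavior. The `Model` dataclass and `SUPPORTED` list below are illustrative stand-ins for llama-stack's model registry (`supported_inference_models()`), not the actual definitions:

```python
from dataclasses import dataclass


@dataclass
class Model:
    # Stand-in for llama-stack's model entries, which expose a
    # descriptor() and a huggingface_repo attribute.
    core_id: str
    huggingface_repo: str

    def descriptor(self) -> str:
        return self.core_id


# Illustrative subset; the real list comes from supported_inference_models().
SUPPORTED = [
    Model("Llama3.2-3B-Instruct", "meta-llama/Llama-3.2-3B-Instruct"),
    Model("Llama3.1-8B-Instruct", "meta-llama/Llama-3.1-8B-Instruct"),
]


def validate_model(model: str) -> str:
    # Mirrors the new check: accept either the descriptor or the HF repo id.
    descriptors = [m.descriptor() for m in SUPPORTED]
    repos = [m.huggingface_repo for m in SUPPORTED]
    if model not in (descriptors + repos):
        model_list = "\n\t".join(repos)
        raise ValueError(f"Unknown model: `{model}`. Choose from [\n\t{model_list}\n]")
    return model


# Both identifier forms now validate:
print(validate_model("Llama3.2-3B-Instruct"))              # descriptor form
print(validate_model("meta-llama/Llama-3.2-3B-Instruct"))  # HF repo form, newly accepted
```

The error message deliberately lists the HF repo IDs rather than the descriptors, consistent with nudging users towards the HF naming.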