dell tgi fix

2025-12-13 04:22:35 +00:00 · 2024-10-16 15:37:05 -07:00 · 2024-10-16 15:37:05 -07:00 · cfc97df6d5
commit cfc97df6d5
parent c4d5d6bb91
3 changed files with 55 additions and 1 deletions
--- a/llama_stack/providers/adapters/inference/tgi/tgi.py
+++ b/llama_stack/providers/adapters/inference/tgi/tgi.py
@@ -52,6 +52,10 @@ class _HfAdapter(Inference, ModelsProtocolPrivate):

    async def list_models(self) -> List[ModelDef]:
        repo = self.model_id
+        # HACK (temporary, to support Dell): fall back to a known repo when model_id is not in the mapping
+        if repo not in self.huggingface_repo_to_llama_model_id:
+            repo = "meta-llama/Llama-3.1-8B-Instruct"
+
        identifier = self.huggingface_repo_to_llama_model_id[repo]
        return [
            ModelDef(