Dell TGI fix

This commit is contained in:
Xi Yan 2024-10-16 15:37:05 -07:00
parent c4d5d6bb91
commit cfc97df6d5
3 changed files with 55 additions and 1 deletions

View file

@ -52,6 +52,10 @@ class _HfAdapter(Inference, ModelsProtocolPrivate):
async def list_models(self) -> List[ModelDef]:
repo = self.model_id
# Temporary hack to support Dell: fall back to a known repo when model_id is not in the mapping.
if repo not in self.huggingface_repo_to_llama_model_id:
repo = "meta-llama/Llama-3.1-8B-Instruct"
identifier = self.huggingface_repo_to_llama_model_id[repo]
return [
ModelDef(