Mirror of https://github.com/meta-llama/llama-stack.git, synced 2025-12-23 00:52:26 +00:00
Fix Dell distro and TGI inference
This commit is contained in:
parent 9b70bb9d4b
commit ad66968909

2 changed files with 4 additions and 1 deletion
@@ -309,7 +309,7 @@ class TGIAdapter(_HfAdapter):
             raise ValueError("You must provide a URL in run.yaml (or via the TGI_URL environment variable) to use TGI.")
         log.info(f"Initializing TGI client with url={config.url}")
         self.client = AsyncInferenceClient(
-            model=config.url,
+            model=config.url,provider="hf-inference"
         )
         endpoint_info = await self.client.get_endpoint_info()
         self.max_tokens = endpoint_info["max_total_tokens"]
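For context, the one functional change above adds provider="hf-inference" to the AsyncInferenceClient constructor, presumably so that newer huggingface_hub releases, which can route requests through named inference providers, keep calling the configured TGI URL directly. Below is a minimal standalone sketch of the patched initialization, assuming huggingface_hub >= 0.28 (where AsyncInferenceClient accepts a provider argument) and a hypothetical TGI server at http://localhost:8080; it is an illustration, not the adapter's actual code.

# Minimal sketch of the patched client setup. Assumptions: huggingface_hub
# >= 0.28 (AsyncInferenceClient accepts `provider`) and a TGI server running
# at the hypothetical URL http://localhost:8080.
import asyncio

from huggingface_hub import AsyncInferenceClient


async def main() -> None:
    # Passing the endpoint URL as `model` together with provider="hf-inference"
    # makes the client call that URL directly instead of resolving a model id
    # through a third-party inference provider.
    client = AsyncInferenceClient(
        model="http://localhost:8080",  # hypothetical stand-in for config.url / TGI_URL
        provider="hf-inference",
    )
    # TGI serves its runtime configuration from its /info endpoint; the adapter
    # reads max_total_tokens from it to learn the endpoint's context limit.
    endpoint_info = await client.get_endpoint_info()
    print(endpoint_info["max_total_tokens"])


asyncio.run(main())

The adapter does the same with config.url taken from run.yaml (or the TGI_URL environment variable), then caches max_total_tokens as self.max_tokens.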