Use huggingface_hub inference client for TGI inference

2025-10-05 12:21:52 +00:00 · 2024-09-05 18:29:04 +02:00 · 2024-09-05 18:29:04 +02:00 · e5bcfdac21
commit e5bcfdac21
parent 21bedc1596
6 changed files with 179 additions and 142 deletions
--- a/llama_toolchain/inference/adapters/tgi/config.py
+++ b/llama_toolchain/inference/adapters/tgi/config.py
@@ -0,0 +1,22 @@
+# Copyright (c) Meta Platforms, Inc. and affiliates.
+# All rights reserved.
+#
+# This source code is licensed under the terms described in the LICENSE file in
+# the root directory of this source tree.
+
+from typing import Optional
+
+from llama_models.schema_utils import json_schema_type
+from pydantic import BaseModel, Field, field_validator
+
+
+@json_schema_type
+class TGIImplConfig(BaseModel):  # Config for the TGI inference adapter: endpoint URL plus an optional HF token.
+    url: str = Field(  # TGI endpoint URL; the default is the api-inference.huggingface.co host.
+        default="https://api-inference.huggingface.co",
+        description="The URL for the TGI endpoint",
+    )
+    api_token: Optional[str] = Field(  # NOTE(review): typed Optional but defaults to "" rather than None; confirm callers treat both as "no token".
+        default="",
+        description="The HF token for Hugging Face Inference Endpoints",
+    )