Use huggingface_hub inference client for TGI inference

This commit is contained in:
Celina Hanouti 2024-09-05 18:29:04 +02:00
parent 21bedc1596
commit e5bcfdac21
6 changed files with 179 additions and 142 deletions

View file

@@ -0,0 +1,22 @@
# Copyright (c) Meta Platforms, Inc. and affiliates.
# All rights reserved.
#
# This source code is licensed under the terms described in the LICENSE file in
# the root directory of this source tree.
from typing import Optional
from llama_models.schema_utils import json_schema_type
from pydantic import BaseModel, Field, field_validator
# Settings for the TGI inference implementation: the endpoint address and an
# optional Hugging Face token. Both fields declare defaults, so the model can
# be constructed without arguments.
@json_schema_type
class TGIImplConfig(BaseModel):
    # Endpoint address; falls back to the hosted Hugging Face inference API URL.
    url: str = Field(
        description="The URL for the TGI endpoint",
        default="https://api-inference.huggingface.co",
    )
    # Hugging Face token. The default is an empty string rather than None,
    # although the annotation also accepts None.
    api_token: Optional[str] = Field(
        description="The HF token for Hugging Face Inference Endpoints",
        default="",
    )