mirror of
https://github.com/meta-llama/llama-stack.git
synced 2025-10-04 12:07:34 +00:00
Use huggingface_hub inference client for TGI inference
This commit is contained in:
parent
21bedc1596
commit
e5bcfdac21
6 changed files with 179 additions and 142 deletions
|
@@ -39,8 +39,9 @@ def available_inference_providers() -> List[ProviderSpec]:
|
|||
api=Api.inference,
|
||||
adapter=AdapterSpec(
|
||||
adapter_id="tgi",
|
||||
- pip_packages=["text-generation"],
|
||||
+ pip_packages=["huggingface_hub"],
|
||||
module="llama_toolchain.inference.adapters.tgi",
|
||||
config_class="llama_toolchain.inference.adapters.tgi.TGIImplConfig",
|
||||
),
|
||||
),
|
||||
remote_provider_spec(
|
||||
|
|
Loading…
Add table
Add a link
Reference in a new issue