Use the lower-level generate_stream() method for correct tool calling

This commit is contained in:
Ashwin Bharambe 2024-09-04 17:36:45 -07:00
parent f355b9b844
commit 046afcb945
2 changed files with 80 additions and 70 deletions

View file

@@ -39,7 +39,7 @@ def available_inference_providers() -> List[ProviderSpec]:
api=Api.inference,
adapter=AdapterSpec(
adapter_id="tgi",
-pip_packages=["huggingface-hub"],
+pip_packages=["text-generation"],
module="llama_toolchain.inference.adapters.tgi",
),
),