Add inference test fixture for tgi

2025-12-17 05:32:36 +00:00 · 2024-11-23 22:52:06 -08:00 · 2024-11-23 22:52:06 -08:00 · 3cace74458
commit 3cace74458
parent 9ddda91180
1 changed files with 18 additions and 0 deletions
--- a/llama_stack/providers/tests/inference/fixtures.py
+++ b/llama_stack/providers/tests/inference/fixtures.py
@ -20,6 +20,7 @@ from llama_stack.providers.remote.inference.bedrock import BedrockConfig
 from llama_stack.providers.remote.inference.fireworks import FireworksImplConfig
 from llama_stack.providers.remote.inference.nvidia import NVIDIAConfig
 from llama_stack.providers.remote.inference.ollama import OllamaImplConfig
 from llama_stack.providers.remote.inference.tgi import TGIImplConfig
 from llama_stack.providers.remote.inference.together import TogetherImplConfig
 from llama_stack.providers.remote.inference.vllm import VLLMInferenceAdapterConfig
 from llama_stack.providers.tests.resolver import construct_stack_for_test
@ -156,6 +157,22 @@ def inference_nvidia() -> ProviderFixture:
    )
@pytest.fixture(scope="session")
 def inference_tgi() -> ProviderFixture:
    return ProviderFixture(
        providers=[
            Provider(
                provider_id="tgi",
                provider_type="remote::tgi",
                config=TGIImplConfig(
                    url=get_env_or_fail("TGI_URL"),
                    api_token=get_env_or_fail("TGI_API_TOKEN"),
                ).model_dump(),
            )
        ],
    )
 def get_model_short_name(model_name: str) -> str:
    """Convert model name to a short test identifier.
@ -190,6 +207,7 @@ INFERENCE_FIXTURES = [
    "remote",
    "bedrock",
    "nvidia",
    "tgi",
 ]