forked from phoenix-oss/llama-stack-mirror
		
	# What does this PR do? - Configured ruff linter to automatically fix import sorting issues. - Set --exit-non-zero-on-fix to ensure non-zero exit code when fixes are applied. - Enabled the 'I' selection to focus on import-related linting rules. - Ran the linter, and formatted all codebase imports accordingly. - Removed the black dep from the "dev" group since we use ruff Signed-off-by: Sébastien Han <seb@redhat.com> [//]: # (If resolving an issue, uncomment and update the line below) [//]: # (Closes #[issue-number]) ## Test Plan [Describe the tests you ran to verify your changes with result summaries. *Provide clear instructions so the plan can be easily re-executed.*] [//]: # (## Documentation) [//]: # (- [ ] Added a Changelog entry if the change is significant) Signed-off-by: Sébastien Han <seb@redhat.com>
		
			
				
	
	
		
			100 lines
		
	
	
	
		
			2.7 KiB
		
	
	
	
		
			Python
		
	
	
	
	
	
			
		
		
	
	
			100 lines
		
	
	
	
		
			2.7 KiB
		
	
	
	
		
			Python
		
	
	
	
	
	
| # Copyright (c) Meta Platforms, Inc. and affiliates.
 | |
| # All rights reserved.
 | |
| #
 | |
| # This source code is licensed under the terms described in the LICENSE file in
 | |
| # the root directory of this source tree.
 | |
| 
 | |
| import pytest
 | |
| import pytest_asyncio
 | |
| 
 | |
| from llama_stack.apis.models import ModelInput
 | |
| from llama_stack.distribution.datatypes import Api, Provider
 | |
| from llama_stack.providers.inline.scoring.braintrust import BraintrustScoringConfig
 | |
| from llama_stack.providers.tests.resolver import construct_stack_for_test
 | |
| 
 | |
| from ..conftest import ProviderFixture, remote_stack_fixture
 | |
| from ..env import get_env_or_fail
 | |
| 
 | |
| 
 | |
| @pytest.fixture(scope="session")
 | |
| def scoring_remote() -> ProviderFixture:
 | |
|     return remote_stack_fixture()
 | |
| 
 | |
| 
 | |
| @pytest.fixture(scope="session")
 | |
| def judge_model(request):
 | |
|     if hasattr(request, "param"):
 | |
|         return request.param
 | |
|     return request.config.getoption("--judge-model", None)
 | |
| 
 | |
| 
 | |
| @pytest.fixture(scope="session")
 | |
| def scoring_basic() -> ProviderFixture:
 | |
|     return ProviderFixture(
 | |
|         providers=[
 | |
|             Provider(
 | |
|                 provider_id="basic",
 | |
|                 provider_type="inline::basic",
 | |
|                 config={},
 | |
|             )
 | |
|         ],
 | |
|     )
 | |
| 
 | |
| 
 | |
| @pytest.fixture(scope="session")
 | |
| def scoring_braintrust() -> ProviderFixture:
 | |
|     return ProviderFixture(
 | |
|         providers=[
 | |
|             Provider(
 | |
|                 provider_id="braintrust",
 | |
|                 provider_type="inline::braintrust",
 | |
|                 config=BraintrustScoringConfig(
 | |
|                     openai_api_key=get_env_or_fail("OPENAI_API_KEY"),
 | |
|                 ).model_dump(),
 | |
|             )
 | |
|         ],
 | |
|     )
 | |
| 
 | |
| 
 | |
| @pytest.fixture(scope="session")
 | |
| def scoring_llm_as_judge() -> ProviderFixture:
 | |
|     return ProviderFixture(
 | |
|         providers=[
 | |
|             Provider(
 | |
|                 provider_id="llm-as-judge",
 | |
|                 provider_type="inline::llm-as-judge",
 | |
|                 config={},
 | |
|             )
 | |
|         ],
 | |
|     )
 | |
| 
 | |
| 
 | |
| SCORING_FIXTURES = ["basic", "remote", "braintrust", "llm_as_judge"]
 | |
| 
 | |
| 
 | |
| @pytest_asyncio.fixture(scope="session")
 | |
| async def scoring_stack(request, inference_model, judge_model):
 | |
|     fixture_dict = request.param
 | |
| 
 | |
|     providers = {}
 | |
|     provider_data = {}
 | |
|     for key in ["datasetio", "scoring", "inference"]:
 | |
|         fixture = request.getfixturevalue(f"{key}_{fixture_dict[key]}")
 | |
|         providers[key] = fixture.providers
 | |
|         if fixture.provider_data:
 | |
|             provider_data.update(fixture.provider_data)
 | |
| 
 | |
|     test_stack = await construct_stack_for_test(
 | |
|         [Api.scoring, Api.datasetio, Api.inference],
 | |
|         providers,
 | |
|         provider_data,
 | |
|         models=[
 | |
|             ModelInput(model_id=model)
 | |
|             for model in [
 | |
|                 inference_model,
 | |
|                 judge_model,
 | |
|             ]
 | |
|         ],
 | |
|     )
 | |
| 
 | |
|     return test_stack.impls
 |