mirror of
https://github.com/meta-llama/llama-stack.git
synced 2025-12-09 19:29:18 +00:00
rag correctness scorer w/ custom dataset
This commit is contained in:
parent
ec6c63ba57
commit
9cc0a54f0b
4 changed files with 18 additions and 4 deletions
|
|
@@ -136,6 +136,9 @@ async def run_main(host: str, port: int, eval_dataset_path: str = ""):
|
|||
dataset_def=CustomDatasetDef(
|
||||
identifier="rag-evals",
|
||||
url=data_url_from_file(eval_dataset_path),
|
||||
rename_columns_map={
|
||||
"query": "input_query",
|
||||
},
|
||||
)
|
||||
)
|
||||
cprint(response, "cyan")
|
||||
|
|
@@ -150,6 +153,9 @@ async def run_main(host: str, port: int, eval_dataset_path: str = ""):
|
|||
eval_scoring_config=EvaluateScoringConfig(
|
||||
scorer_config_list=[
|
||||
EvaluateSingleScorerConfig(scorer_name="accuracy"),
|
||||
EvaluateSingleScorerConfig(
|
||||
scorer_name="braintrust::answer-correctness"
|
||||
),
|
||||
]
|
||||
),
|
||||
)
|
||||
|
|
|
|||
Loading…
Add table
Add a link
Reference in a new issue