From 85cad639ca9b6bca62c5eb4d816476aa552943ee Mon Sep 17 00:00:00 2001 From: Xi Yan Date: Tue, 18 Mar 2025 20:16:08 -0700 Subject: [PATCH] Update llama_stack/apis/evaluation/evaluation.py Co-authored-by: Ashwin Bharambe --- llama_stack/apis/evaluation/evaluation.py | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/llama_stack/apis/evaluation/evaluation.py b/llama_stack/apis/evaluation/evaluation.py index 6b2190417..51f5c371c 100644 --- a/llama_stack/apis/evaluation/evaluation.py +++ b/llama_stack/apis/evaluation/evaluation.py @@ -51,7 +51,7 @@ EvaluationCandidate = register_schema( class EvaluationTask(BaseModel): """ A task for evaluation. To specify a task, one of the following must be provided: - - `benchmark_id`: Run evaluation task against a benchmark_id + - `benchmark_id`: Run evaluation task against a benchmark_id. Use this when you have a curated dataset and have settled on the graders. - `dataset_id` and `grader_ids`: Run evaluation task against a dataset_id and a list of grader_ids - `data_source` and `grader_ids`: Run evaluation task against a data source (e.g. rows, uri, etc.) and a list of grader_ids