update EvaluationTask

2025-03-18 19:30:01 -07:00 · 2025-03-18 19:30:01 -07:00 · d994499f09
commit d994499f09
parent f107e3229b
3 changed files with 32 additions and 5 deletions
--- a/llama_stack/apis/evaluation/evaluation.py
+++ b/llama_stack/apis/evaluation/evaluation.py
@@ -49,6 +49,18 @@ EvaluationCandidate = register_schema(

@json_schema_type
 class EvaluationTask(BaseModel):
+    """
+    A task for evaluation. To specify a task, one of the following must be provided:
+    - `benchmark_id`: Run evaluation task against a benchmark_id
+    - `dataset_id` and `grader_ids`: Run evaluation task against a dataset_id and a list of grader_ids
+    - `data_source` and `grader_ids`: Run evaluation task against a data source (e.g. rows, uri, etc.) and a list of grader_ids
+
+    :param benchmark_id: The benchmark ID to evaluate.
+    :param dataset_id: The dataset ID to evaluate.
+    :param data_source: The data source to evaluate.
+    :param grader_ids: The grader IDs to evaluate.
+    """
+
    benchmark_id: Optional[str] = None
    dataset_id: Optional[str] = None
    data_source: Optional[DataSource] = None