forked from phoenix-oss/llama-stack-mirror
update EvaluationTask
This commit is contained in:
parent
f107e3229b
commit
d994499f09
3 changed files with 32 additions and 5 deletions
|
@ -49,6 +49,18 @@ EvaluationCandidate = register_schema(
|
|||
|
||||
@json_schema_type
|
||||
class EvaluationTask(BaseModel):
|
||||
"""
|
||||
A task for evaluation. To specify a task, one of the following must be provided:
|
||||
- `benchmark_id`: Run evaluation task against a benchmark_id
|
||||
- `dataset_id` and `grader_ids`: Run evaluation task against a dataset_id and a list of grader_ids
|
||||
- `data_source` and `grader_ids`: Run evaluation task against a data source (e.g. rows, uri, etc.) and a list of grader_ids
|
||||
|
||||
:param benchmark_id: The benchmark ID to evaluate.
|
||||
:param dataset_id: The dataset ID to evaluate.
|
||||
:param data_source: The data source to evaluate.
|
||||
:param grader_ids: The grader IDs to evaluate.
|
||||
"""
|
||||
|
||||
benchmark_id: Optional[str] = None
|
||||
dataset_id: Optional[str] = None
|
||||
data_source: Optional[DataSource] = None
|
||||
|
|
Loading…
Add table
Add a link
Reference in a new issue