forked from phoenix-oss/llama-stack-mirror
update
This commit is contained in:
parent
398319fe7a
commit
5e817cd56a
3 changed files with 187 additions and 187 deletions
|
@ -148,9 +148,9 @@ class Evaluation(Protocol):
|
|||
...
|
||||
|
||||
@webmethod(route="/evaluation/grading", method="POST")
|
||||
async def grading(self, task: EvaluationTask) -> EvaluationJob:
|
||||
async def grade(self, task: EvaluationTask) -> EvaluationJob:
|
||||
"""
|
||||
Schedule a grading job, by grading generated results. The generated results are expected to be in the dataset.
|
||||
Schedule a grading job, by grading generated (model or agent) results. The generated results are expected to be in the dataset.
|
||||
|
||||
:param task: The task to evaluate. One of:
|
||||
- BenchmarkEvaluationTask: Run evaluation task against a benchmark_id
|
||||
|
|
Loading…
Add table
Add a link
Reference in a new issue