huggingface provider

2025-12-17 14:52:37 +00:00 · 2024-11-07 15:20:22 -08:00 · 2024-11-07 15:20:22 -08:00 · d1633dc412
commit d1633dc412
parent cc6edf6287
5 changed files with 99 additions and 34 deletions
--- a/llama_stack/apis/eval/eval.py
+++ b/llama_stack/apis/eval/eval.py
@@ -40,6 +40,10 @@ EvalCandidate = Annotated[
 class BenchmarkEvalTaskConfig(BaseModel):
    type: Literal["benchmark"] = "benchmark"
    eval_candidate: EvalCandidate
+    num_examples: Optional[int] = Field(
+        description="Number of examples to evaluate (useful for quick debugging), if not provided, all examples in the dataset will be evaluated",
+        default=None,
+    )


@json_schema_type
@@ -50,6 +54,10 @@ class AppEvalTaskConfig(BaseModel):
        description="Map between scoring function id and parameters for each scoring function you want to run",
        default_factory=dict,
    )
+    num_examples: Optional[int] = Field(
+        description="Number of examples to evaluate (useful for quick debugging), if not provided, all examples in the dataset will be evaluated",
+        default=None,
+    )
    # we could optionally add any specific dataset config here