huggingface provider

This commit is contained in:
Xi Yan 2024-11-07 15:20:22 -08:00
parent cc6edf6287
commit d1633dc412
5 changed files with 99 additions and 34 deletions

View file

@ -40,6 +40,10 @@ EvalCandidate = Annotated[
class BenchmarkEvalTaskConfig(BaseModel):
    # Configuration for an eval task of the "benchmark" kind.

    # Discriminator tag; fixed to "benchmark" for this config variant.
    type: Literal["benchmark"] = "benchmark"

    # The candidate to evaluate (see the EvalCandidate annotated type).
    eval_candidate: EvalCandidate

    # Optional cap on how many examples are evaluated; None means no cap.
    num_examples: Optional[int] = Field(
        default=None,
        description="Number of examples to evaluate (useful for quick debugging), if not provided, all examples in the dataset will be evaluated",
    )
@json_schema_type
@ -50,6 +54,10 @@ class AppEvalTaskConfig(BaseModel):
description="Map between scoring function id and parameters for each scoring function you want to run",
default_factory=dict,
)
num_examples: Optional[int] = Field(
description="Number of examples to evaluate (useful for quick debugging), if not provided, all examples in the dataset will be evaluated",
default=None,
)
# we could optionally add any specific dataset config here