This commit is contained in:
Xi Yan 2025-03-11 22:45:48 -07:00
parent 11e57e17e6
commit f9ea90c4f7
3 changed files with 90 additions and 20 deletions

View file

@ -6348,7 +6348,8 @@
"categorical_count",
"accuracy"
],
"title": "AggregationFunctionType"
"title": "AggregationFunctionType",
"description": "A type of aggregation function."
},
"BasicScoringFnParams": {
"type": "object",
@ -6362,14 +6363,16 @@
"type": "array",
"items": {
"$ref": "#/components/schemas/AggregationFunctionType"
}
},
"description": "(Optional) Aggregation functions to apply to the scores of each row. No aggregation for results is calculated if not provided."
}
},
"additionalProperties": false,
"required": [
"type"
],
"title": "BasicScoringFnParams"
"title": "BasicScoringFnParams",
"description": "Parameters for a non-parameterized scoring function."
},
"BenchmarkConfig": {
"type": "object",
@ -6420,26 +6423,30 @@
"properties": {
"type": {
"type": "string",
"const": "llm_as_judge",
"default": "llm_as_judge"
"const": "custom_llm_as_judge",
"default": "custom_llm_as_judge"
},
"judge_model": {
"type": "string"
"type": "string",
"description": "The model to use for scoring."
},
"prompt_template": {
"type": "string"
"type": "string",
"description": "(Optional) The prompt template to use for scoring."
},
"judge_score_regexes": {
"type": "array",
"items": {
"type": "string"
}
},
"description": "(Optional) Regexes to extract the score from the judge model's response."
},
"aggregation_functions": {
"type": "array",
"items": {
"$ref": "#/components/schemas/AggregationFunctionType"
}
},
"description": "(Optional) Aggregation functions to apply to the scores of each row. No aggregation for results is calculated if not provided."
}
},
"additionalProperties": false,
@ -6447,7 +6454,8 @@
"type",
"judge_model"
],
"title": "LLMAsJudgeScoringFnParams"
"title": "LLMAsJudgeScoringFnParams",
"description": "Parameters for a scoring function that uses a judge model to score the answer."
},
"ModelCandidate": {
"type": "object",
@ -6491,20 +6499,23 @@
"type": "array",
"items": {
"type": "string"
}
},
"description": "Regexes to extract the answer from the generated response."
},
"aggregation_functions": {
"type": "array",
"items": {
"$ref": "#/components/schemas/AggregationFunctionType"
}
},
"description": "(Optional) Aggregation functions to apply to the scores of each row. No aggregation for results is calculated if not provided."
}
},
"additionalProperties": false,
"required": [
"type"
],
"title": "RegexParserScoringFnParams"
"title": "RegexParserScoringFnParams",
"description": "Parameters for a scoring function that parses the answer from the generated response using regexes and checks it against the expected answer."
},
"ScoringFnParams": {
"oneOf": [
@ -6521,7 +6532,7 @@
"discriminator": {
"propertyName": "type",
"mapping": {
"llm_as_judge": "#/components/schemas/LLMAsJudgeScoringFnParams",
"custom_llm_as_judge": "#/components/schemas/LLMAsJudgeScoringFnParams",
"regex_parser": "#/components/schemas/RegexParserScoringFnParams",
"basic": "#/components/schemas/BasicScoringFnParams"
}