single type

This commit is contained in:
Xi Yan 2025-03-11 23:20:16 -07:00
parent bc71980769
commit bec5a46915
3 changed files with 639 additions and 166 deletions

View file

@ -6351,28 +6351,71 @@
"title": "AggregationFunctionType",
"description": "A type of aggregation function."
},
"BasicScoringFnParams": {
"AnswerCorrectnessScoringFnParams": {
"type": "object",
"properties": {
"type": {
"type": "string",
"const": "basic",
"default": "basic"
},
"aggregation_functions": {
"type": "array",
"items": {
"$ref": "#/components/schemas/AggregationFunctionType"
},
"description": "(Optional) Aggregation functions to apply to the scores of each row. No aggregation for results is calculated if not provided."
"description": "(Optional) Aggregation functions to apply to the scores of each row. If not provided, no aggregation will be performed."
},
"type": {
"type": "string",
"const": "answer_correctness",
"default": "answer_correctness"
}
},
"additionalProperties": false,
"required": [
"type"
],
"title": "BasicScoringFnParams",
"description": "Parameters for a non-parameterized scoring function."
"title": "AnswerCorrectnessScoringFnParams"
},
"AnswerRelevancyScoringFnParams": {
"type": "object",
"properties": {
"aggregation_functions": {
"type": "array",
"items": {
"$ref": "#/components/schemas/AggregationFunctionType"
},
"description": "(Optional) Aggregation functions to apply to the scores of each row. If not provided, no aggregation will be performed."
},
"type": {
"type": "string",
"const": "answer_relevancy",
"default": "answer_relevancy"
}
},
"additionalProperties": false,
"required": [
"type"
],
"title": "AnswerRelevancyScoringFnParams"
},
"AnswerSimilarityScoringFnParams": {
"type": "object",
"properties": {
"aggregation_functions": {
"type": "array",
"items": {
"$ref": "#/components/schemas/AggregationFunctionType"
},
"description": "(Optional) Aggregation functions to apply to the scores of each row. If not provided, no aggregation will be performed."
},
"type": {
"type": "string",
"const": "answer_similarity",
"default": "answer_similarity"
}
},
"additionalProperties": false,
"required": [
"type"
],
"title": "AnswerSimilarityScoringFnParams"
},
"BenchmarkConfig": {
"type": "object",
@ -6401,6 +6444,116 @@
"title": "BenchmarkConfig",
"description": "A benchmark configuration for evaluation."
},
"ContextEntityRecallScoringFnParams": {
"type": "object",
"properties": {
"aggregation_functions": {
"type": "array",
"items": {
"$ref": "#/components/schemas/AggregationFunctionType"
},
"description": "(Optional) Aggregation functions to apply to the scores of each row. If not provided, no aggregation will be performed."
},
"type": {
"type": "string",
"const": "context_entity_recall",
"default": "context_entity_recall"
}
},
"additionalProperties": false,
"required": [
"type"
],
"title": "ContextEntityRecallScoringFnParams"
},
"ContextPrecisionScoringFnParams": {
"type": "object",
"properties": {
"aggregation_functions": {
"type": "array",
"items": {
"$ref": "#/components/schemas/AggregationFunctionType"
},
"description": "(Optional) Aggregation functions to apply to the scores of each row. If not provided, no aggregation will be performed."
},
"type": {
"type": "string",
"const": "context_precision",
"default": "context_precision"
}
},
"additionalProperties": false,
"required": [
"type"
],
"title": "ContextPrecisionScoringFnParams"
},
"ContextRecallScoringFnParams": {
"type": "object",
"properties": {
"aggregation_functions": {
"type": "array",
"items": {
"$ref": "#/components/schemas/AggregationFunctionType"
},
"description": "(Optional) Aggregation functions to apply to the scores of each row. If not provided, no aggregation will be performed."
},
"type": {
"type": "string",
"const": "context_recall",
"default": "context_recall"
}
},
"additionalProperties": false,
"required": [
"type"
],
"title": "ContextRecallScoringFnParams"
},
"ContextRelevancyScoringFnParams": {
"type": "object",
"properties": {
"aggregation_functions": {
"type": "array",
"items": {
"$ref": "#/components/schemas/AggregationFunctionType"
},
"description": "(Optional) Aggregation functions to apply to the scores of each row. If not provided, no aggregation will be performed."
},
"type": {
"type": "string",
"const": "context_relevancy",
"default": "context_relevancy"
}
},
"additionalProperties": false,
"required": [
"type"
],
"title": "ContextRelevancyScoringFnParams"
},
"EqualityScoringFnParams": {
"type": "object",
"properties": {
"aggregation_functions": {
"type": "array",
"items": {
"$ref": "#/components/schemas/AggregationFunctionType"
},
"description": "(Optional) Aggregation functions to apply to the scores of each row. If not provided, no aggregation will be performed."
},
"type": {
"type": "string",
"const": "equality",
"default": "equality"
}
},
"additionalProperties": false,
"required": [
"type"
],
"title": "EqualityScoringFnParams"
},
"EvalCandidate": {
"oneOf": [
{
@ -6418,6 +6571,50 @@
}
}
},
"FactualityScoringFnParams": {
"type": "object",
"properties": {
"aggregation_functions": {
"type": "array",
"items": {
"$ref": "#/components/schemas/AggregationFunctionType"
},
"description": "(Optional) Aggregation functions to apply to the scores of each row. If not provided, no aggregation will be performed."
},
"type": {
"type": "string",
"const": "factuality",
"default": "factuality"
}
},
"additionalProperties": false,
"required": [
"type"
],
"title": "FactualityScoringFnParams"
},
"FaithfulnessScoringFnParams": {
"type": "object",
"properties": {
"aggregation_functions": {
"type": "array",
"items": {
"$ref": "#/components/schemas/AggregationFunctionType"
},
"description": "(Optional) Aggregation functions to apply to the scores of each row. If not provided, no aggregation will be performed."
},
"type": {
"type": "string",
"const": "faithfulness",
"default": "faithfulness"
}
},
"additionalProperties": false,
"required": [
"type"
],
"title": "FaithfulnessScoringFnParams"
},
"LLMAsJudgeScoringFnParams": {
"type": "object",
"properties": {
@ -6427,26 +6624,22 @@
"default": "custom_llm_as_judge"
},
"judge_model": {
"type": "string",
"description": "The model to use for scoring."
"type": "string"
},
"prompt_template": {
"type": "string",
"description": "(Optional) The prompt template to use for scoring."
"type": "string"
},
"judge_score_regexes": {
"type": "array",
"items": {
"type": "string"
},
"description": "(Optional) Regexes to extract the score from the judge model's response."
}
},
"aggregation_functions": {
"type": "array",
"items": {
"$ref": "#/components/schemas/AggregationFunctionType"
},
"description": "(Optional) Aggregation functions to apply to the scores of each row. No aggregation for results is calculated if not provided."
}
}
},
"additionalProperties": false,
@ -6454,8 +6647,7 @@
"type",
"judge_model"
],
"title": "LLMAsJudgeScoringFnParams",
"description": "Parameters for a scoring function that uses a judge model to score the answer."
"title": "LLMAsJudgeScoringFnParams"
},
"ModelCandidate": {
"type": "object",
@ -6487,35 +6679,65 @@
"title": "ModelCandidate",
"description": "A model candidate for evaluation."
},
"RegexParserScoringFnParams": {
"RegexParserMathScoringFnParams": {
"type": "object",
"properties": {
"type": {
"type": "string",
"const": "regex_parser",
"default": "regex_parser"
},
"parsing_regexes": {
"type": "array",
"items": {
"type": "string"
},
"description": "Regexes to extract the answer from generated response"
"description": "(Optional) Regexes to extract the answer from generated response."
},
"aggregation_functions": {
"type": "array",
"items": {
"$ref": "#/components/schemas/AggregationFunctionType"
},
"description": "(Optional) Aggregation functions to apply to the scores of each row. No aggregation for results is calculated if not provided."
"description": "(Optional) Aggregation functions to apply to the scores of each row. If not provided, no aggregation will be performed."
},
"type": {
"type": "string",
"const": "regex_parser_math_response",
"default": "regex_parser_math_response"
}
},
"additionalProperties": false,
"required": [
"parsing_regexes",
"type"
],
"title": "RegexParserScoringFnParams",
"description": "Parameters for a scoring function that parses the answer from the generated response using regexes, and checks against the expected answer."
"title": "RegexParserMathScoringFnParams"
},
"RegexParserScoringFnParams": {
"type": "object",
"properties": {
"parsing_regexes": {
"type": "array",
"items": {
"type": "string"
},
"description": "(Optional) Regexes to extract the answer from generated response."
},
"aggregation_functions": {
"type": "array",
"items": {
"$ref": "#/components/schemas/AggregationFunctionType"
},
"description": "(Optional) Aggregation functions to apply to the scores of each row. If not provided, no aggregation will be performed."
},
"type": {
"type": "string",
"const": "regex_parser",
"default": "regex_parser"
}
},
"additionalProperties": false,
"required": [
"parsing_regexes",
"type"
],
"title": "RegexParserScoringFnParams"
},
"ScoringFnParams": {
"oneOf": [
@ -6526,7 +6748,40 @@
"$ref": "#/components/schemas/RegexParserScoringFnParams"
},
{
"$ref": "#/components/schemas/BasicScoringFnParams"
"$ref": "#/components/schemas/RegexParserMathScoringFnParams"
},
{
"$ref": "#/components/schemas/EqualityScoringFnParams"
},
{
"$ref": "#/components/schemas/SubsetOfcoringFnParams"
},
{
"$ref": "#/components/schemas/FactualityScoringFnParams"
},
{
"$ref": "#/components/schemas/FaithfulnessScoringFnParams"
},
{
"$ref": "#/components/schemas/AnswerCorrectnessScoringFnParams"
},
{
"$ref": "#/components/schemas/AnswerRelevancyScoringFnParams"
},
{
"$ref": "#/components/schemas/AnswerSimilarityScoringFnParams"
},
{
"$ref": "#/components/schemas/ContextEntityRecallScoringFnParams"
},
{
"$ref": "#/components/schemas/ContextPrecisionScoringFnParams"
},
{
"$ref": "#/components/schemas/ContextRecallScoringFnParams"
},
{
"$ref": "#/components/schemas/ContextRelevancyScoringFnParams"
}
],
"discriminator": {
@ -6534,10 +6789,43 @@
"mapping": {
"custom_llm_as_judge": "#/components/schemas/LLMAsJudgeScoringFnParams",
"regex_parser": "#/components/schemas/RegexParserScoringFnParams",
"basic": "#/components/schemas/BasicScoringFnParams"
"regex_parser_math_response": "#/components/schemas/RegexParserMathScoringFnParams",
"equality": "#/components/schemas/EqualityScoringFnParams",
"subset_of": "#/components/schemas/SubsetOfcoringFnParams",
"factuality": "#/components/schemas/FactualityScoringFnParams",
"faithfulness": "#/components/schemas/FaithfulnessScoringFnParams",
"answer_correctness": "#/components/schemas/AnswerCorrectnessScoringFnParams",
"answer_relevancy": "#/components/schemas/AnswerRelevancyScoringFnParams",
"answer_similarity": "#/components/schemas/AnswerSimilarityScoringFnParams",
"context_entity_recall": "#/components/schemas/ContextEntityRecallScoringFnParams",
"context_precision": "#/components/schemas/ContextPrecisionScoringFnParams",
"context_recall": "#/components/schemas/ContextRecallScoringFnParams",
"context_relevancy": "#/components/schemas/ContextRelevancyScoringFnParams"
}
}
},
"SubsetOfcoringFnParams": {
"type": "object",
"properties": {
"aggregation_functions": {
"type": "array",
"items": {
"$ref": "#/components/schemas/AggregationFunctionType"
},
"description": "(Optional) Aggregation functions to apply to the scores of each row. If not provided, no aggregation will be performed."
},
"type": {
"type": "string",
"const": "subset_of",
"default": "subset_of"
}
},
"additionalProperties": false,
"required": [
"type"
],
"title": "SubsetOfcoringFnParams"
},
"EvaluateRowsRequest": {
"type": "object",
"properties": {
@ -9371,7 +9659,8 @@
},
"additionalProperties": false,
"required": [
"scoring_fn_type"
"scoring_fn_type",
"params"
],
"title": "RegisterScoringFunctionRequest"
},