single type

2026-01-08 08:21:30 +00:00 · 2025-03-11 23:20:16 -07:00 · 2025-03-11 23:20:16 -07:00 · bec5a46915
commit bec5a46915
parent bc71980769
3 changed files with 639 additions and 166 deletions
--- a/docs/_static/llama-stack-spec.html
+++ b/docs/_static/llama-stack-spec.html
@ -6351,28 +6351,71 @@
                "title": "AggregationFunctionType",
                "description": "A type of aggregation function."
            },
-            "BasicScoringFnParams": {
+            "AnswerCorrectnessScoringFnParams": {
                "type": "object",
                "properties": {
                    "type": {
                        "type": "string",
                        "const": "basic",
                        "default": "basic"
                    },
                    "aggregation_functions": {
                        "type": "array",
                        "items": {
                            "$ref": "#/components/schemas/AggregationFunctionType"
                        },
-                        "description": "(Optional) Aggregation functions to apply to the scores of each row. No aggregation for results is calculated if not provided."
+                        "description": "(Optional) Aggregation functions to apply to the scores of each row. If not provided, no aggregation will be performed."
                    },
                    "type": {
                        "type": "string",
                        "const": "answer_correctness",
                        "default": "answer_correctness"
                    }
                },
                "additionalProperties": false,
                "required": [
                    "type"
                ],
-                "title": "BasicScoringFnParams",
+                "title": "AnswerCorrectnessScoringFnParams"
-                "description": "Parameters for a non-parameterized scoring function."
+            },
            "AnswerRelevancyScoringFnParams": {
                "type": "object",
                "properties": {
                    "aggregation_functions": {
                        "type": "array",
                        "items": {
                            "$ref": "#/components/schemas/AggregationFunctionType"
                        },
                        "description": "(Optional) Aggregation functions to apply to the scores of each row. If not provided, no aggregation will be performed."
                    },
                    "type": {
                        "type": "string",
                        "const": "answer_relevancy",
                        "default": "answer_relevancy"
                    }
                },
                "additionalProperties": false,
                "required": [
                    "type"
                ],
                "title": "AnswerRelevancyScoringFnParams"
            },
            "AnswerSimilarityScoringFnParams": {
                "type": "object",
                "properties": {
                    "aggregation_functions": {
                        "type": "array",
                        "items": {
                            "$ref": "#/components/schemas/AggregationFunctionType"
                        },
                        "description": "(Optional) Aggregation functions to apply to the scores of each row. If not provided, no aggregation will be performed."
                    },
                    "type": {
                        "type": "string",
                        "const": "answer_similarity",
                        "default": "answer_similarity"
                    }
                },
                "additionalProperties": false,
                "required": [
                    "type"
                ],
                "title": "AnswerSimilarityScoringFnParams"
            },
            "BenchmarkConfig": {
                "type": "object",
@ -6401,6 +6444,116 @@
                "title": "BenchmarkConfig",
                "description": "A benchmark configuration for evaluation."
            },
            "ContextEntityRecallScoringFnParams": {
                "type": "object",
                "properties": {
                    "aggregation_functions": {
                        "type": "array",
                        "items": {
                            "$ref": "#/components/schemas/AggregationFunctionType"
                        },
                        "description": "(Optional) Aggregation functions to apply to the scores of each row. If not provided, no aggregation will be performed."
                    },
                    "type": {
                        "type": "string",
                        "const": "context_entity_recall",
                        "default": "context_entity_recall"
                    }
                },
                "additionalProperties": false,
                "required": [
                    "type"
                ],
                "title": "ContextEntityRecallScoringFnParams"
            },
            "ContextPrecisionScoringFnParams": {
                "type": "object",
                "properties": {
                    "aggregation_functions": {
                        "type": "array",
                        "items": {
                            "$ref": "#/components/schemas/AggregationFunctionType"
                        },
                        "description": "(Optional) Aggregation functions to apply to the scores of each row. If not provided, no aggregation will be performed."
                    },
                    "type": {
                        "type": "string",
                        "const": "context_precision",
                        "default": "context_precision"
                    }
                },
                "additionalProperties": false,
                "required": [
                    "type"
                ],
                "title": "ContextPrecisionScoringFnParams"
            },
            "ContextRecallScoringFnParams": {
                "type": "object",
                "properties": {
                    "aggregation_functions": {
                        "type": "array",
                        "items": {
                            "$ref": "#/components/schemas/AggregationFunctionType"
                        },
                        "description": "(Optional) Aggregation functions to apply to the scores of each row. If not provided, no aggregation will be performed."
                    },
                    "type": {
                        "type": "string",
                        "const": "context_recall",
                        "default": "context_recall"
                    }
                },
                "additionalProperties": false,
                "required": [
                    "type"
                ],
                "title": "ContextRecallScoringFnParams"
            },
            "ContextRelevancyScoringFnParams": {
                "type": "object",
                "properties": {
                    "aggregation_functions": {
                        "type": "array",
                        "items": {
                            "$ref": "#/components/schemas/AggregationFunctionType"
                        },
                        "description": "(Optional) Aggregation functions to apply to the scores of each row. If not provided, no aggregation will be performed."
                    },
                    "type": {
                        "type": "string",
                        "const": "context_relevancy",
                        "default": "context_relevancy"
                    }
                },
                "additionalProperties": false,
                "required": [
                    "type"
                ],
                "title": "ContextRelevancyScoringFnParams"
            },
            "EqualityScoringFnParams": {
                "type": "object",
                "properties": {
                    "aggregation_functions": {
                        "type": "array",
                        "items": {
                            "$ref": "#/components/schemas/AggregationFunctionType"
                        },
                        "description": "(Optional) Aggregation functions to apply to the scores of each row. If not provided, no aggregation will be performed."
                    },
                    "type": {
                        "type": "string",
                        "const": "equality",
                        "default": "equality"
                    }
                },
                "additionalProperties": false,
                "required": [
                    "type"
                ],
                "title": "EqualityScoringFnParams"
            },
            "EvalCandidate": {
                "oneOf": [
                    {
@ -6418,6 +6571,50 @@
                    }
                }
            },
            "FactualityScoringFnParams": {
                "type": "object",
                "properties": {
                    "aggregation_functions": {
                        "type": "array",
                        "items": {
                            "$ref": "#/components/schemas/AggregationFunctionType"
                        },
                        "description": "(Optional) Aggregation functions to apply to the scores of each row. If not provided, no aggregation will be performed."
                    },
                    "type": {
                        "type": "string",
                        "const": "factuality",
                        "default": "factuality"
                    }
                },
                "additionalProperties": false,
                "required": [
                    "type"
                ],
                "title": "FactualityScoringFnParams"
            },
            "FaithfulnessScoringFnParams": {
                "type": "object",
                "properties": {
                    "aggregation_functions": {
                        "type": "array",
                        "items": {
                            "$ref": "#/components/schemas/AggregationFunctionType"
                        },
                        "description": "(Optional) Aggregation functions to apply to the scores of each row. If not provided, no aggregation will be performed."
                    },
                    "type": {
                        "type": "string",
                        "const": "faithfulness",
                        "default": "faithfulness"
                    }
                },
                "additionalProperties": false,
                "required": [
                    "type"
                ],
                "title": "FaithfulnessScoringFnParams"
            },
            "LLMAsJudgeScoringFnParams": {
                "type": "object",
                "properties": {
@ -6427,26 +6624,22 @@
                        "default": "custom_llm_as_judge"
                    },
                    "judge_model": {
-                        "type": "string",
+                        "type": "string"
                        "description": "The model to use for scoring."
                    },
                    "prompt_template": {
-                        "type": "string",
+                        "type": "string"
                        "description": "(Optional) The prompt template to use for scoring."
                    },
                    "judge_score_regexes": {
                        "type": "array",
                        "items": {
                            "type": "string"
-                        },
+                        }
                        "description": "(Optional) Regexes to extract the score from the judge model's response."
                    },
                    "aggregation_functions": {
                        "type": "array",
                        "items": {
                            "$ref": "#/components/schemas/AggregationFunctionType"
-                        },
+                        }
                        "description": "(Optional) Aggregation functions to apply to the scores of each row. No aggregation for results is calculated if not provided."
                    }
                },
                "additionalProperties": false,
@ -6454,8 +6647,7 @@
                    "type",
                    "judge_model"
                ],
-                "title": "LLMAsJudgeScoringFnParams",
+                "title": "LLMAsJudgeScoringFnParams"
                "description": "Parameters for a scoring function that uses a judge model to score the answer."
            },
            "ModelCandidate": {
                "type": "object",
@ -6487,35 +6679,65 @@
                "title": "ModelCandidate",
                "description": "A model candidate for evaluation."
            },
-            "RegexParserScoringFnParams": {
+            "RegexParserMathScoringFnParams": {
                "type": "object",
                "properties": {
                    "type": {
                        "type": "string",
                        "const": "regex_parser",
                        "default": "regex_parser"
                    },
                    "parsing_regexes": {
                        "type": "array",
                        "items": {
                            "type": "string"
                        },
-                        "description": "Regexes to extract the answer from generated response"
+                        "description": "(Optional) Regexes to extract the answer from generated response."
                    },
                    "aggregation_functions": {
                        "type": "array",
                        "items": {
                            "$ref": "#/components/schemas/AggregationFunctionType"
                        },
-                        "description": "(Optional) Aggregation functions to apply to the scores of each row. No aggregation for results is calculated if not provided."
+                        "description": "(Optional) Aggregation functions to apply to the scores of each row. If not provided, no aggregation will be performed."
                    },
                    "type": {
                        "type": "string",
                        "const": "regex_parser_math_response",
                        "default": "regex_parser_math_response"
                    }
                },
                "additionalProperties": false,
                "required": [
                    "parsing_regexes",
                    "type"
                ],
-                "title": "RegexParserScoringFnParams",
+                "title": "RegexParserMathScoringFnParams"
-                "description": "Parameters for a scoring function that parses the answer from the generated response using regexes, and checks against the expected answer."
+            },
            "RegexParserScoringFnParams": {
                "type": "object",
                "properties": {
                    "parsing_regexes": {
                        "type": "array",
                        "items": {
                            "type": "string"
                        },
                        "description": "(Optional) Regexes to extract the answer from generated response."
                    },
                    "aggregation_functions": {
                        "type": "array",
                        "items": {
                            "$ref": "#/components/schemas/AggregationFunctionType"
                        },
                        "description": "(Optional) Aggregation functions to apply to the scores of each row. If not provided, no aggregation will be performed."
                    },
                    "type": {
                        "type": "string",
                        "const": "regex_parser",
                        "default": "regex_parser"
                    }
                },
                "additionalProperties": false,
                "required": [
                    "parsing_regexes",
                    "type"
                ],
                "title": "RegexParserScoringFnParams"
            },
            "ScoringFnParams": {
                "oneOf": [
@ -6526,7 +6748,40 @@
                        "$ref": "#/components/schemas/RegexParserScoringFnParams"
                    },
                    {
-                        "$ref": "#/components/schemas/BasicScoringFnParams"
+                        "$ref": "#/components/schemas/RegexParserMathScoringFnParams"
                    },
                    {
                        "$ref": "#/components/schemas/EqualityScoringFnParams"
                    },
                    {
                        "$ref": "#/components/schemas/SubsetOfcoringFnParams"
                    },
                    {
                        "$ref": "#/components/schemas/FactualityScoringFnParams"
                    },
                    {
                        "$ref": "#/components/schemas/FaithfulnessScoringFnParams"
                    },
                    {
                        "$ref": "#/components/schemas/AnswerCorrectnessScoringFnParams"
                    },
                    {
                        "$ref": "#/components/schemas/AnswerRelevancyScoringFnParams"
                    },
                    {
                        "$ref": "#/components/schemas/AnswerSimilarityScoringFnParams"
                    },
                    {
                        "$ref": "#/components/schemas/ContextEntityRecallScoringFnParams"
                    },
                    {
                        "$ref": "#/components/schemas/ContextPrecisionScoringFnParams"
                    },
                    {
                        "$ref": "#/components/schemas/ContextRecallScoringFnParams"
                    },
                    {
                        "$ref": "#/components/schemas/ContextRelevancyScoringFnParams"
                    }
                ],
                "discriminator": {
@ -6534,10 +6789,43 @@
                    "mapping": {
                        "custom_llm_as_judge": "#/components/schemas/LLMAsJudgeScoringFnParams",
                        "regex_parser": "#/components/schemas/RegexParserScoringFnParams",
-                        "basic": "#/components/schemas/BasicScoringFnParams"
+                        "regex_parser_math_response": "#/components/schemas/RegexParserMathScoringFnParams",
                        "equality": "#/components/schemas/EqualityScoringFnParams",
                        "subset_of": "#/components/schemas/SubsetOfcoringFnParams",
                        "factuality": "#/components/schemas/FactualityScoringFnParams",
                        "faithfulness": "#/components/schemas/FaithfulnessScoringFnParams",
                        "answer_correctness": "#/components/schemas/AnswerCorrectnessScoringFnParams",
                        "answer_relevancy": "#/components/schemas/AnswerRelevancyScoringFnParams",
                        "answer_similarity": "#/components/schemas/AnswerSimilarityScoringFnParams",
                        "context_entity_recall": "#/components/schemas/ContextEntityRecallScoringFnParams",
                        "context_precision": "#/components/schemas/ContextPrecisionScoringFnParams",
                        "context_recall": "#/components/schemas/ContextRecallScoringFnParams",
                        "context_relevancy": "#/components/schemas/ContextRelevancyScoringFnParams"
                    }
                }
            },
            "SubsetOfcoringFnParams": {
                "type": "object",
                "properties": {
                    "aggregation_functions": {
                        "type": "array",
                        "items": {
                            "$ref": "#/components/schemas/AggregationFunctionType"
                        },
                        "description": "(Optional) Aggregation functions to apply to the scores of each row. If not provided, no aggregation will be performed."
                    },
                    "type": {
                        "type": "string",
                        "const": "subset_of",
                        "default": "subset_of"
                    }
                },
                "additionalProperties": false,
                "required": [
                    "type"
                ],
                "title": "SubsetOfcoringFnParams"
            },
            "EvaluateRowsRequest": {
                "type": "object",
                "properties": {
@ -9371,7 +9659,8 @@
                },
                "additionalProperties": false,
                "required": [
-                    "scoring_fn_type"
+                    "scoring_fn_type",
                    "params"
                ],
                "title": "RegisterScoringFunctionRequest"
            },
--- a/docs/_static/llama-stack-spec.yaml
+++ b/docs/_static/llama-stack-spec.yaml
@ -4420,26 +4420,60 @@ components:
        - accuracy
      title: AggregationFunctionType
      description: A type of aggregation function.
-    BasicScoringFnParams:
+    AnswerCorrectnessScoringFnParams:
      type: object
      properties:
        type:
          type: string
          const: basic
          default: basic
        aggregation_functions:
          type: array
          items:
            $ref: '#/components/schemas/AggregationFunctionType'
          description: >-
-            (Optional) Aggregation functions to apply to the scores of each row. No
+            (Optional) Aggregation functions to apply to the scores of each row. If
-            aggregation for results is calculated if not provided.
+            not provided, no aggregation will be performed.
        type:
          type: string
          const: answer_correctness
          default: answer_correctness
      additionalProperties: false
      required:
        - type
-      title: BasicScoringFnParams
+      title: AnswerCorrectnessScoringFnParams
    AnswerRelevancyScoringFnParams:
      type: object
      properties:
        aggregation_functions:
          type: array
          items:
            $ref: '#/components/schemas/AggregationFunctionType'
          description: >-
-        Parameters for a non-parameterized scoring function.
+            (Optional) Aggregation functions to apply to the scores of each row. If
            not provided, no aggregation will be performed.
        type:
          type: string
          const: answer_relevancy
          default: answer_relevancy
      additionalProperties: false
      required:
        - type
      title: AnswerRelevancyScoringFnParams
    AnswerSimilarityScoringFnParams:
      type: object
      properties:
        aggregation_functions:
          type: array
          items:
            $ref: '#/components/schemas/AggregationFunctionType'
          description: >-
            (Optional) Aggregation functions to apply to the scores of each row. If
            not provided, no aggregation will be performed.
        type:
          type: string
          const: answer_similarity
          default: answer_similarity
      additionalProperties: false
      required:
        - type
      title: AnswerSimilarityScoringFnParams
    BenchmarkConfig:
      type: object
      properties:
@ -4465,6 +4499,96 @@ components:
      title: BenchmarkConfig
      description: >-
        A benchmark configuration for evaluation.
    ContextEntityRecallScoringFnParams:
      type: object
      properties:
        aggregation_functions:
          type: array
          items:
            $ref: '#/components/schemas/AggregationFunctionType'
          description: >-
            (Optional) Aggregation functions to apply to the scores of each row. If
            not provided, no aggregation will be performed.
        type:
          type: string
          const: context_entity_recall
          default: context_entity_recall
      additionalProperties: false
      required:
        - type
      title: ContextEntityRecallScoringFnParams
    ContextPrecisionScoringFnParams:
      type: object
      properties:
        aggregation_functions:
          type: array
          items:
            $ref: '#/components/schemas/AggregationFunctionType'
          description: >-
            (Optional) Aggregation functions to apply to the scores of each row. If
            not provided, no aggregation will be performed.
        type:
          type: string
          const: context_precision
          default: context_precision
      additionalProperties: false
      required:
        - type
      title: ContextPrecisionScoringFnParams
    ContextRecallScoringFnParams:
      type: object
      properties:
        aggregation_functions:
          type: array
          items:
            $ref: '#/components/schemas/AggregationFunctionType'
          description: >-
            (Optional) Aggregation functions to apply to the scores of each row. If
            not provided, no aggregation will be performed.
        type:
          type: string
          const: context_recall
          default: context_recall
      additionalProperties: false
      required:
        - type
      title: ContextRecallScoringFnParams
    ContextRelevancyScoringFnParams:
      type: object
      properties:
        aggregation_functions:
          type: array
          items:
            $ref: '#/components/schemas/AggregationFunctionType'
          description: >-
            (Optional) Aggregation functions to apply to the scores of each row. If
            not provided, no aggregation will be performed.
        type:
          type: string
          const: context_relevancy
          default: context_relevancy
      additionalProperties: false
      required:
        - type
      title: ContextRelevancyScoringFnParams
    EqualityScoringFnParams:
      type: object
      properties:
        aggregation_functions:
          type: array
          items:
            $ref: '#/components/schemas/AggregationFunctionType'
          description: >-
            (Optional) Aggregation functions to apply to the scores of each row. If
            not provided, no aggregation will be performed.
        type:
          type: string
          const: equality
          default: equality
      additionalProperties: false
      required:
        - type
      title: EqualityScoringFnParams
    EvalCandidate:
      oneOf:
        - $ref: '#/components/schemas/ModelCandidate'
@ -4474,6 +4598,42 @@ components:
        mapping:
          model: '#/components/schemas/ModelCandidate'
          agent: '#/components/schemas/AgentCandidate'
    FactualityScoringFnParams:
      type: object
      properties:
        aggregation_functions:
          type: array
          items:
            $ref: '#/components/schemas/AggregationFunctionType'
          description: >-
            (Optional) Aggregation functions to apply to the scores of each row. If
            not provided, no aggregation will be performed.
        type:
          type: string
          const: factuality
          default: factuality
      additionalProperties: false
      required:
        - type
      title: FactualityScoringFnParams
    FaithfulnessScoringFnParams:
      type: object
      properties:
        aggregation_functions:
          type: array
          items:
            $ref: '#/components/schemas/AggregationFunctionType'
          description: >-
            (Optional) Aggregation functions to apply to the scores of each row. If
            not provided, no aggregation will be performed.
        type:
          type: string
          const: faithfulness
          default: faithfulness
      additionalProperties: false
      required:
        - type
      title: FaithfulnessScoringFnParams
    LLMAsJudgeScoringFnParams:
      type: object
      properties:
@ -4483,31 +4643,21 @@ components:
          default: custom_llm_as_judge
        judge_model:
          type: string
          description: The model to use for scoring.
        prompt_template:
          type: string
          description: >-
            (Optional) The prompt template to use for scoring.
        judge_score_regexes:
          type: array
          items:
            type: string
          description: >-
            (Optional) Regexes to extract the score from the judge model's response.
        aggregation_functions:
          type: array
          items:
            $ref: '#/components/schemas/AggregationFunctionType'
          description: >-
            (Optional) Aggregation functions to apply to the scores of each row. No
            aggregation for results is calculated if not provided.
      additionalProperties: false
      required:
        - type
        - judge_model
      title: LLMAsJudgeScoringFnParams
      description: >-
        Parameters for a scoring function that uses a judge model to score the answer.
    ModelCandidate:
      type: object
      properties:
@ -4533,44 +4683,107 @@ components:
        - sampling_params
      title: ModelCandidate
      description: A model candidate for evaluation.
-    RegexParserScoringFnParams:
+    RegexParserMathScoringFnParams:
      type: object
      properties:
        type:
          type: string
          const: regex_parser
          default: regex_parser
        parsing_regexes:
          type: array
          items:
            type: string
          description: >-
-            Regexes to extract the answer from generated response
+            (Optional) Regexes to extract the answer from generated response.
        aggregation_functions:
          type: array
          items:
            $ref: '#/components/schemas/AggregationFunctionType'
          description: >-
-            (Optional) Aggregation functions to apply to the scores of each row. No
+            (Optional) Aggregation functions to apply to the scores of each row. If
-            aggregation for results is calculated if not provided.
+            not provided, no aggregation will be performed.
        type:
          type: string
          const: regex_parser_math_response
          default: regex_parser_math_response
      additionalProperties: false
      required:
        - parsing_regexes
        - type
      title: RegexParserMathScoringFnParams
    RegexParserScoringFnParams:
      type: object
      properties:
        parsing_regexes:
          type: array
          items:
            type: string
          description: >-
            (Optional) Regexes to extract the answer from generated response.
        aggregation_functions:
          type: array
          items:
            $ref: '#/components/schemas/AggregationFunctionType'
          description: >-
            (Optional) Aggregation functions to apply to the scores of each row. If
            not provided, no aggregation will be performed.
        type:
          type: string
          const: regex_parser
          default: regex_parser
      additionalProperties: false
      required:
        - parsing_regexes
        - type
      title: RegexParserScoringFnParams
      description: >-
        Parameters for a scoring function that parses the answer from the generated
        response using regexes, and checks against the expected answer.
    ScoringFnParams:
      oneOf:
        - $ref: '#/components/schemas/LLMAsJudgeScoringFnParams'
        - $ref: '#/components/schemas/RegexParserScoringFnParams'
-        - $ref: '#/components/schemas/BasicScoringFnParams'
+        - $ref: '#/components/schemas/RegexParserMathScoringFnParams'
        - $ref: '#/components/schemas/EqualityScoringFnParams'
        - $ref: '#/components/schemas/SubsetOfcoringFnParams'
        - $ref: '#/components/schemas/FactualityScoringFnParams'
        - $ref: '#/components/schemas/FaithfulnessScoringFnParams'
        - $ref: '#/components/schemas/AnswerCorrectnessScoringFnParams'
        - $ref: '#/components/schemas/AnswerRelevancyScoringFnParams'
        - $ref: '#/components/schemas/AnswerSimilarityScoringFnParams'
        - $ref: '#/components/schemas/ContextEntityRecallScoringFnParams'
        - $ref: '#/components/schemas/ContextPrecisionScoringFnParams'
        - $ref: '#/components/schemas/ContextRecallScoringFnParams'
        - $ref: '#/components/schemas/ContextRelevancyScoringFnParams'
      discriminator:
        propertyName: type
        mapping:
          custom_llm_as_judge: '#/components/schemas/LLMAsJudgeScoringFnParams'
          regex_parser: '#/components/schemas/RegexParserScoringFnParams'
-          basic: '#/components/schemas/BasicScoringFnParams'
+          regex_parser_math_response: '#/components/schemas/RegexParserMathScoringFnParams'
          equality: '#/components/schemas/EqualityScoringFnParams'
          subset_of: '#/components/schemas/SubsetOfcoringFnParams'
          factuality: '#/components/schemas/FactualityScoringFnParams'
          faithfulness: '#/components/schemas/FaithfulnessScoringFnParams'
          answer_correctness: '#/components/schemas/AnswerCorrectnessScoringFnParams'
          answer_relevancy: '#/components/schemas/AnswerRelevancyScoringFnParams'
          answer_similarity: '#/components/schemas/AnswerSimilarityScoringFnParams'
          context_entity_recall: '#/components/schemas/ContextEntityRecallScoringFnParams'
          context_precision: '#/components/schemas/ContextPrecisionScoringFnParams'
          context_recall: '#/components/schemas/ContextRecallScoringFnParams'
          context_relevancy: '#/components/schemas/ContextRelevancyScoringFnParams'
    SubsetOfcoringFnParams:
      type: object
      properties:
        aggregation_functions:
          type: array
          items:
            $ref: '#/components/schemas/AggregationFunctionType'
          description: >-
            (Optional) Aggregation functions to apply to the scores of each row. If
            not provided, no aggregation will be performed.
        type:
          type: string
          const: subset_of
          default: subset_of
      additionalProperties: false
      required:
        - type
      title: SubsetOfcoringFnParams
    EvaluateRowsRequest:
      type: object
      properties:
@ -6364,6 +6577,7 @@ components:
      additionalProperties: false
      required:
        - scoring_fn_type
        - params
      title: RegisterScoringFunctionRequest
    RegisterShieldRequest:
      type: object
--- a/llama_stack/apis/scoring_functions/scoring_functions.py
+++ b/llama_stack/apis/scoring_functions/scoring_functions.py
@ -68,110 +68,27 @@ class AggregationFunctionType(Enum):
    accuracy = "accuracy"
-# TODO(xiyan):
+class BasicScoringFnParamsCommon(BaseModel):
-# ============= OPTION 1: SEPARATE ScoringFnParamsType + ScoringFunctionType =============
+    """
-# class ScoringFnParamsType(Enum):
+    :param aggregation_functions: (Optional) Aggregation functions to apply to the scores of each row. If not provided, no aggregation will be performed.
-#     """
+    """
 #     A type of scoring function parameters.
 #     :cvar llm_as_judge: Provide judge model and prompt template.
 #     :cvar regex_parser: Provide regexes to parse the answer from the generated response.
 #     :cvar basic: Parameters for basic non-parameterized scoring function.
 #     """
 #     custom_llm_as_judge = "custom_llm_as_judge"
 #     regex_parser = "regex_parser"
 #     basic = "basic"
 # @json_schema_type
 # class LLMAsJudgeScoringFnParams(BaseModel):
 #     """
 #     Parameters for a scoring function that uses a judge model to score the answer.
 #     :param judge_model: The model to use for scoring.
 #     :param prompt_template: (Optional) The prompt template to use for scoring.
 #     :param judge_score_regexes: (Optional) Regexes to extract the score from the judge model's response.
 #     :param aggregation_functions: (Optional) Aggregation functions to apply to the scores of each row. No aggregation for results is calculated if not provided.
 #     """
 #     type: Literal["custom_llm_as_judge"] = "custom_llm_as_judge"
 #     judge_model: str
 #     prompt_template: Optional[str] = None
 #     judge_score_regexes: Optional[List[str]] = Field(
 #         description="Regexes to extract the answer from generated response",
 #         default_factory=list,
 #     )
 #     aggregation_functions: Optional[List[AggregationFunctionType]] = Field(
 #         description="Aggregation functions to apply to the scores of each row",
 #         default_factory=list,
 #     )
 # @json_schema_type
 # class RegexParserScoringFnParams(BaseModel):
 #     """
 #     Parameters for a scoring function that parses the answer from the generated response using regexes, and checks against the expected answer.
 #     :param parsing_regexes: Regexes to extract the answer from generated response
 #     :param aggregation_functions: (Optional) Aggregation functions to apply to the scores of each row. No aggregation for results is calculated if not provided.
 #     """
 #     type: Literal["regex_parser"] = "regex_parser"
 #     parsing_regexes: Optional[List[str]] = Field(
 #         description="Regexes to extract the answer from generated response",
 #         default_factory=list,
 #     )
 #     aggregation_functions: Optional[List[AggregationFunctionType]] = Field(
 #         description="Aggregation functions to apply to the scores of each row",
 #         default_factory=list,
 #     )
 # @json_schema_type
 # class BasicScoringFnParams(BaseModel):
 #     """
 #     Parameters for a non-parameterized scoring function.
 #     :param aggregation_functions: (Optional) Aggregation functions to apply to the scores of each row. No aggregation for results is calculated if not provided.
 #     """
 #     type: Literal["basic"] = "basic"
 #     aggregation_functions: Optional[List[AggregationFunctionType]] = Field(
 #         description="Aggregation functions to apply to the scores of each row",
 #         default_factory=list,
 #     )
 # ScoringFnParams = register_schema(
 #     Annotated[
 #         Union[
 #             LLMAsJudgeScoringFnParams,
 #             RegexParserScoringFnParams,
 #             BasicScoringFnParams,
 #         ],
 #         Field(discriminator="type"),
 #     ],
 #     name="ScoringFnParams",
 # )
 # ============= END OF OPTION 1 =============
 # TODO(xiyan):
 # ============= OPTION 2: MERGE ScoringFnParamsType + ScoringFunctionType into ScoringFunctionType =============
 class RegexParserScoringFnParamsCommon(BaseModel):
    parsing_regexes: Optional[List[str]] = Field(
        description="Regexes to extract the answer from generated response",
        default_factory=list,
    )
    aggregation_functions: Optional[List[AggregationFunctionType]] = Field(
        description="Aggregation functions to apply to the scores of each row",
        default_factory=list,
    )
-class BasicScoringFnParamsCommon(BaseModel):
+class RegexParserScoringFnParamsCommon(BaseModel):
    """
    :param parsing_regexes: (Optional) Regexes to extract the answer from generated response.
    :param aggregation_functions: (Optional) Aggregation functions to apply to the scores of each row. If not provided, no aggregation will be performed.
    """
    parsing_regexes: List[str] = Field(
        description="Regexes to extract the answer from generated response",
        default_factory=list,
    )
    aggregation_functions: Optional[List[AggregationFunctionType]] = Field(
        description="Aggregation functions to apply to the scores of each row",
        default_factory=list,
@ -198,6 +115,51 @@ class SubsetOfcoringFnParams(BasicScoringFnParamsCommon):
    type: Literal["subset_of"] = "subset_of"
@json_schema_type
 class FactualityScoringFnParams(BasicScoringFnParamsCommon):
    type: Literal["factuality"] = "factuality"
@json_schema_type
 class FaithfulnessScoringFnParams(BasicScoringFnParamsCommon):
    type: Literal["faithfulness"] = "faithfulness"
@json_schema_type
 class AnswerCorrectnessScoringFnParams(BasicScoringFnParamsCommon):
    type: Literal["answer_correctness"] = "answer_correctness"
@json_schema_type
 class AnswerRelevancyScoringFnParams(BasicScoringFnParamsCommon):
    type: Literal["answer_relevancy"] = "answer_relevancy"
@json_schema_type
 class AnswerSimilarityScoringFnParams(BasicScoringFnParamsCommon):
    type: Literal["answer_similarity"] = "answer_similarity"
@json_schema_type
 class ContextEntityRecallScoringFnParams(BasicScoringFnParamsCommon):
    type: Literal["context_entity_recall"] = "context_entity_recall"
@json_schema_type
 class ContextPrecisionScoringFnParams(BasicScoringFnParamsCommon):
    type: Literal["context_precision"] = "context_precision"
@json_schema_type
 class ContextRecallScoringFnParams(BasicScoringFnParamsCommon):
    type: Literal["context_recall"] = "context_recall"
@json_schema_type
 class ContextRelevancyScoringFnParams(BasicScoringFnParamsCommon):
    type: Literal["context_relevancy"] = "context_relevancy"
@json_schema_type
 class LLMAsJudgeScoringFnParams(BaseModel):
    type: Literal["custom_llm_as_judge"] = "custom_llm_as_judge"
@ -221,6 +183,15 @@ ScoringFnParams = register_schema(
            RegexParserMathScoringFnParams,
            EqualityScoringFnParams,
            SubsetOfcoringFnParams,
            FactualityScoringFnParams,
            FaithfulnessScoringFnParams,
            AnswerCorrectnessScoringFnParams,
            AnswerRelevancyScoringFnParams,
            AnswerSimilarityScoringFnParams,
            ContextEntityRecallScoringFnParams,
            ContextPrecisionScoringFnParams,
            ContextRecallScoringFnParams,
            ContextRelevancyScoringFnParams,
        ],
        Field(discriminator="type"),
    ],
@ -284,9 +255,8 @@ class ScoringFunctions(Protocol):
    @webmethod(route="/scoring-functions", method="POST")
    async def register_scoring_function(
        self,
-        # TODO(xiyan): scoring_fn_type will not be needed for OPTION 2
+        scoring_fn_type: ScoringFunctionType,
-        # scoring_fn_type: ScoringFunctionType,
+        params: ScoringFnParams = None,
        params: Optional[ScoringFnParams] = None,
        scoring_fn_id: Optional[str] = None,
        metadata: Optional[Dict[str, Any]] = None,
    ) -> ScoringFn:
@ -294,7 +264,7 @@ class ScoringFunctions(Protocol):
        Register a new scoring function with given parameters.
        Only valid scoring function type that can be parameterized can be registered.
-        # :param scoring_fn_type: The type of scoring function to register.
+        :param scoring_fn_type: The type of scoring function to register.
        :param params: The parameters for the scoring function.
        :param scoring_fn_id: (Optional) The ID of the scoring function to register. If not provided, a random ID will be generated.
        :param metadata: (Optional) Any additional metadata to be associated with the scoring function.