This commit is contained in:
Xi Yan 2025-03-13 00:03:06 -07:00
parent 10f6528164
commit c87b7006fc
3 changed files with 21 additions and 21 deletions

View file

@ -6813,8 +6813,8 @@
"post-training/messages", "post-training/messages",
"eval/question-answer", "eval/question-answer",
"eval/messages-answer", "eval/messages-answer",
"scoring/question-generation-answer", "scoring/question-answer-generation",
"scoring/messages-generation-answer", "scoring/messages-answer-generation",
"scoring/generation-answer" "scoring/generation-answer"
], ],
"title": "DatasetPurpose", "title": "DatasetPurpose",
@ -8797,8 +8797,8 @@
"post-training/messages", "post-training/messages",
"eval/question-answer", "eval/question-answer",
"eval/messages-answer", "eval/messages-answer",
"scoring/question-generation-answer", "scoring/question-answer-generation",
"scoring/messages-generation-answer", "scoring/messages-answer-generation",
"scoring/generation-answer" "scoring/generation-answer"
], ],
"title": "DatasetPurpose", "title": "DatasetPurpose",
@ -9895,11 +9895,11 @@
"post-training/messages", "post-training/messages",
"eval/question-answer", "eval/question-answer",
"eval/messages-answer", "eval/messages-answer",
"scoring/question-generation-answer", "scoring/question-answer-generation",
"scoring/messages-generation-answer", "scoring/messages-answer-generation",
"scoring/generation-answer" "scoring/generation-answer"
], ],
"description": "The purpose of the dataset. One of - \"post-training/messages\": The dataset contains a messages column with list of messages for post-training. { \"messages\": [ {\"role\": \"user\", \"content\": \"Hello, world!\"}, {\"role\": \"assistant\", \"content\": \"Hello, world!\"}, ] } - \"eval/question-answer\": The dataset contains a question column and an answer column for evaluation. { \"question\": \"What is the capital of France?\", \"answer\": \"Paris\" } - \"eval/messages-answer\": The dataset contains a messages column with list of messages and an answer column for evaluation. { \"messages\": [ {\"role\": \"user\", \"content\": \"Hello, my name is John Doe.\"}, {\"role\": \"assistant\", \"content\": \"Hello, John Doe. How can I help you today?\"}, {\"role\": \"user\", \"content\": \"What's my name?\"}, ], \"answer\": \"John Doe\" } - \"scoring/question-generation-answer\": The dataset contains a question column, a generation column and an answer column for scoring. { \"question\": \"What is the capital of France?\", \"generation\": \"Paris\", \"answer\": \"Paris\" } - \"scoring/messages-generation-answer\": The dataset contains a messages column with list of messages, a generation column and an answer column for scoring. { \"messages\": [ {\"role\": \"user\", \"content\": \"Hello, my name is John Doe.\"}, {\"role\": \"assistant\", \"content\": \"Hello, John Doe. How can I help you today?\"}, {\"role\": \"user\", \"content\": \"What's my name?\"}, ], \"generation\": \"John Doe\", \"answer\": \"John Doe\" } - \"scoring/generation-answer\": The dataset contains a generation column and an answer column for scoring. { \"generation\": \"Paris\", \"answer\": \"Paris\" }" "description": "The purpose of the dataset. One of - \"post-training/messages\": The dataset contains a messages column with list of messages for post-training. { \"messages\": [ {\"role\": \"user\", \"content\": \"Hello, world!\"}, {\"role\": \"assistant\", \"content\": \"Hello, world!\"}, ] } - \"eval/question-answer\": The dataset contains a question column and an answer column for evaluation. { \"question\": \"What is the capital of France?\", \"answer\": \"Paris\" } - \"eval/messages-answer\": The dataset contains a messages column with list of messages and an answer column for evaluation. { \"messages\": [ {\"role\": \"user\", \"content\": \"Hello, my name is John Doe.\"}, {\"role\": \"assistant\", \"content\": \"Hello, John Doe. How can I help you today?\"}, {\"role\": \"user\", \"content\": \"What's my name?\"}, ], \"answer\": \"John Doe\" } - \"scoring/question-answer-generation\": The dataset contains a question column, a generation column and an answer column for scoring. { \"question\": \"What is the capital of France?\", \"generation\": \"Paris\", \"answer\": \"Paris\" } - \"scoring/messages-answer-generation\": The dataset contains a messages column with list of messages, a generation column and an answer column for scoring. { \"messages\": [ {\"role\": \"user\", \"content\": \"Hello, my name is John Doe.\"}, {\"role\": \"assistant\", \"content\": \"Hello, John Doe. How can I help you today?\"}, {\"role\": \"user\", \"content\": \"What's my name?\"}, ], \"generation\": \"John Doe\", \"answer\": \"John Doe\" } - \"scoring/generation-answer\": The dataset contains a generation column and an answer column for scoring. { \"generation\": \"Paris\", \"answer\": \"Paris\" }"
}, },
"source": { "source": {
"$ref": "#/components/schemas/DataSource", "$ref": "#/components/schemas/DataSource",

View file

@ -4718,8 +4718,8 @@ components:
- post-training/messages - post-training/messages
- eval/question-answer - eval/question-answer
- eval/messages-answer - eval/messages-answer
- scoring/question-generation-answer - scoring/question-answer-generation
- scoring/messages-generation-answer - scoring/messages-answer-generation
- scoring/generation-answer - scoring/generation-answer
title: DatasetPurpose title: DatasetPurpose
description: >- description: >-
@ -6075,8 +6075,8 @@ components:
- post-training/messages - post-training/messages
- eval/question-answer - eval/question-answer
- eval/messages-answer - eval/messages-answer
- scoring/question-generation-answer - scoring/question-answer-generation
- scoring/messages-generation-answer - scoring/messages-answer-generation
- scoring/generation-answer - scoring/generation-answer
title: DatasetPurpose title: DatasetPurpose
description: >- description: >-
@ -6786,8 +6786,8 @@ components:
- post-training/messages - post-training/messages
- eval/question-answer - eval/question-answer
- eval/messages-answer - eval/messages-answer
- scoring/question-generation-answer - scoring/question-answer-generation
- scoring/messages-generation-answer - scoring/messages-answer-generation
- scoring/generation-answer - scoring/generation-answer
description: >- description: >-
The purpose of the dataset. One of - "post-training/messages": The dataset The purpose of the dataset. One of - "post-training/messages": The dataset
@ -6800,10 +6800,10 @@ components:
column for evaluation. { "messages": [ {"role": "user", "content": "Hello, column for evaluation. { "messages": [ {"role": "user", "content": "Hello,
my name is John Doe."}, {"role": "assistant", "content": "Hello, John my name is John Doe."}, {"role": "assistant", "content": "Hello, John
Doe. How can I help you today?"}, {"role": "user", "content": "What's Doe. How can I help you today?"}, {"role": "user", "content": "What's
my name?"}, ], "answer": "John Doe" } - "scoring/question-generation-answer": my name?"}, ], "answer": "John Doe" } - "scoring/question-answer-generation":
The dataset contains a question column, a generation column and an answer The dataset contains a question column, a generation column and an answer
column for scoring. { "question": "What is the capital of France?", "generation": column for scoring. { "question": "What is the capital of France?", "generation":
"Paris", "answer": "Paris" } - "scoring/messages-generation-answer": The "Paris", "answer": "Paris" } - "scoring/messages-answer-generation": The
dataset contains a messages column with list of messages, a generation dataset contains a messages column with list of messages, a generation
column and an answer column for scoring. { "messages": [ {"role": "user", column and an answer column for scoring. { "messages": [ {"role": "user",
"content": "Hello, my name is John Doe."}, {"role": "assistant", "content": "content": "Hello, my name is John Doe."}, {"role": "assistant", "content":

View file

@ -38,13 +38,13 @@ class DatasetPurpose(Enum):
], ],
"answer": "John Doe" "answer": "John Doe"
} }
:cvar scoring/question-generation-answer: The dataset contains a question column, a generation column and an answer column. :cvar scoring/question-answer-generation: The dataset contains a question column, a generation column and an answer column.
{ {
"question": "What is the capital of France?", "question": "What is the capital of France?",
"generation": "Paris", "generation": "Paris",
"answer": "Paris" "answer": "Paris"
} }
:cvar scoring/messages-generation-answer: The dataset contains a messages column with list of messages, a generation column and an answer column. :cvar scoring/messages-answer-generation: The dataset contains a messages column with list of messages, a generation column and an answer column.
{ {
"messages": [ "messages": [
{"role": "user", "content": "Hello, my name is John Doe."}, {"role": "user", "content": "Hello, my name is John Doe."},
@ -65,8 +65,8 @@ class DatasetPurpose(Enum):
eval_question_answer = "eval/question-answer" eval_question_answer = "eval/question-answer"
eval_messages_answer = "eval/messages-answer" eval_messages_answer = "eval/messages-answer"
scoring_question_generation_answer = "scoring/question-generation-answer" scoring_question_answer_generation = "scoring/question-answer-generation"
scoring_messages_generation_answer = "scoring/messages-generation-answer" scoring_messages_answer_generation = "scoring/messages-answer-generation"
scoring_generation_answer = "scoring/generation-answer" scoring_generation_answer = "scoring/generation-answer"
# TODO: add more schemas here # TODO: add more schemas here
@ -206,13 +206,13 @@ class Datasets(Protocol):
], ],
"answer": "John Doe" "answer": "John Doe"
} }
- "scoring/question-generation-answer": The dataset contains a question column, a generation column and an answer column for scoring. - "scoring/question-answer-generation": The dataset contains a question column, a generation column and an answer column for scoring.
{ {
"question": "What is the capital of France?", "question": "What is the capital of France?",
"generation": "Paris", "generation": "Paris",
"answer": "Paris" "answer": "Paris"
} }
- "scoring/messages-generation-answer": The dataset contains a messages column with list of messages, a generation column and an answer column for scoring. - "scoring/messages-answer-generation": The dataset contains a messages column with list of messages, a generation column and an answer column for scoring.
{ {
"messages": [ "messages": [
{"role": "user", "content": "Hello, my name is John Doe."}, {"role": "user", "content": "Hello, my name is John Doe."},