rebase onto new dataset schema

This commit is contained in:
Yang Yang 2025-03-18 10:40:41 -07:00
parent dd75008a44
commit a550f17128
2 changed files with 9 additions and 19 deletions

View file

@@ -206,15 +206,10 @@ def get_distribution_template() -> DistributionTemplate:
DatasetInput(
dataset_id="docvqa",
provider_id="huggingface",
url=URL(uri="https://huggingface.co/datasets/llamastack/docvqa"),
metadata={
"path": "llamastack/docvqa",
"split": "val",
},
dataset_schema={
"chat_completion_input": {"type": "string"},
"expected_answer": {"type": "string"},
},
purpose=DatasetPurpose.eval_messages_answer,
source=URIDataSource(
uri="huggingface://datasets/llamastack/docvqa?split=val",
),
),
]

View file

@@ -191,16 +191,11 @@ datasets:
<<<<<<< HEAD
=======
provider_id: huggingface
- dataset_schema:
chat_completion_input:
type: string
expected_answer:
type: string
url:
uri: https://huggingface.co/datasets/llamastack/docvqa
metadata:
path: llamastack/docvqa
split: val
- purpose: eval/messages-answer
source:
type: uri
uri: huggingface://datasets/llamastack/docvqa?split=val
metadata: {}
dataset_id: docvqa
provider_id: huggingface
>>>>>>> 81df5a4e (add DocVQA scoring)