mirror of
https://github.com/meta-llama/llama-stack.git
synced 2026-01-02 13:40:01 +00:00
add DocVQA scoring
This commit is contained in:
parent
ab777ef5cd
commit
74ccc7e26a
6 changed files with 305 additions and 1 deletions
|
|
@@ -203,6 +203,19 @@ def get_distribution_template() -> DistributionTemplate:
|
|||
uri="huggingface://datasets/llamastack/bfcl_v3?split=train",
|
||||
),
|
||||
),
|
||||
DatasetInput(
|
||||
dataset_id="docvqa",
|
||||
provider_id="huggingface",
|
||||
url=URL(uri="https://huggingface.co/datasets/llamastack/docvqa"),
|
||||
metadata={
|
||||
"path": "llamastack/docvqa",
|
||||
"split": "train",
|
||||
},
|
||||
dataset_schema={
|
||||
"chat_completion_input": {"type": "string"},
|
||||
"expected_answer": {"type": "string"},
|
||||
},
|
||||
),
|
||||
]
|
||||
|
||||
default_benchmarks = [
|
||||
|
|
@@ -231,6 +244,11 @@ def get_distribution_template() -> DistributionTemplate:
|
|||
dataset_id="bfcl",
|
||||
scoring_functions=["basic::bfcl"],
|
||||
),
|
||||
BenchmarkInput(
|
||||
benchmark_id="meta-reference-docvqa",
|
||||
dataset_id="docvqa",
|
||||
scoring_functions=["basic::docvqa"],
|
||||
),
|
||||
]
|
||||
return DistributionTemplate(
|
||||
name=name,
|
||||
|
|
|
|||
|
|
@@ -188,6 +188,22 @@ datasets:
|
|||
uri: huggingface://datasets/llamastack/bfcl_v3?split=train
|
||||
metadata: {}
|
||||
dataset_id: bfcl
|
||||
provider_id: huggingface
|
||||
- dataset_schema:
|
||||
chat_completion_input:
|
||||
type: string
|
||||
expected_answer:
|
||||
type: string
|
||||
url:
|
||||
uri: https://huggingface.co/datasets/llamastack/docvqa
|
||||
metadata:
|
||||
path: llamastack/docvqa
|
||||
split: train
|
||||
dataset_id: docvqa
|
||||
|
||||
provider_id: huggingface
|
||||
scoring_fns: []
|
||||
benchmarks:
|
||||
- dataset_id: simpleqa
|
||||
|
|
@@ -215,6 +231,11 @@ benchmarks:
|
|||
- basic::bfcl
|
||||
metadata: {}
|
||||
benchmark_id: meta-reference-bfcl
|
||||
- dataset_id: docvqa
|
||||
scoring_functions:
|
||||
- basic::docvqa
|
||||
metadata: {}
|
||||
benchmark_id: meta-reference-docvqa
|
||||
tool_groups:
|
||||
- toolgroup_id: builtin::websearch
|
||||
provider_id: tavily-search
|
||||
|
|
|
|||
Loading…
Add table
Add a link
Reference in a new issue