From 5ec1881c852aca9d7f05785623fda294f1c7bcab Mon Sep 17 00:00:00 2001 From: Yang Yang Date: Wed, 12 Mar 2025 11:49:57 -0700 Subject: [PATCH] prepare for autogen llama_stack/templates/open-benchmark/run.yaml instead --- .../open-benchmark/open_benchmark.py | 21 +++++++++++++++++++ 1 file changed, 21 insertions(+) diff --git a/llama_stack/templates/open-benchmark/open_benchmark.py b/llama_stack/templates/open-benchmark/open_benchmark.py index 2b40797f9..b78418d55 100644 --- a/llama_stack/templates/open-benchmark/open_benchmark.py +++ b/llama_stack/templates/open-benchmark/open_benchmark.py @@ -226,6 +226,22 @@ def get_distribution_template() -> DistributionTemplate: "chat_completion_input": {"type": "string"}, }, ), + DatasetInput( + dataset_id="bfcl", + provider_id="huggingface", + url={"uri": "https://huggingface.co/datasets/llamastack/bfcl_v3"}, + metadata={ + "path": "llamastack/bfcl_v3", + "split": "train", + }, + dataset_schema={ + "function": {"type": "string"}, + "language": {"type": "string"}, + "ground_truth": {"type": "string"}, + "id": {"type": "string"}, + "chat_completion_input": {"type": "string"}, + }, + ), ] default_benchmarks = [ @@ -249,6 +265,11 @@ def get_distribution_template() -> DistributionTemplate: dataset_id="math_500", scoring_functions=["basic::regex_parser_math_response"], ), + BenchmarkInput( + benchmark_id="meta-reference-bfcl", + dataset_id="bfcl", + scoring_functions=["basic::bfcl"], + ), ] return DistributionTemplate( name=name,