delete preregistered dataset/eval task

2025-12-16 01:12:37 +00:00 · 2024-11-11 11:05:47 -05:00 · 2024-11-11 11:05:47 -05:00 · 9ff903e63b
commit 9ff903e63b
parent 8bebe3fd1f
5 changed files with 4 additions and 64 deletions
--- a/llama_stack/providers/adapters/datasetio/huggingface/benchmarks/__init__.py
+++ b/llama_stack/providers/adapters/datasetio/huggingface/benchmarks/__init__.py
@@ -1,12 +0,0 @@
-# Copyright (c) Meta Platforms, Inc. and affiliates.
-# All rights reserved.
-#
-# This source code is licensed under the terms described in the LICENSE file in
-# the root directory of this source tree.
-
-# # Copyright (c) Meta Platforms, Inc. and affiliates.
-# # All rights reserved.
-# #
-# # This source code is licensed under the terms described in the LICENSE file in
-# # the root directory of this source tree.
-# from .mmlu import mmlu  # noqa: F401
--- a/llama_stack/providers/adapters/datasetio/huggingface/benchmarks/mmlu.py
+++ b/llama_stack/providers/adapters/datasetio/huggingface/benchmarks/mmlu.py
@@ -1,30 +0,0 @@
-# Copyright (c) Meta Platforms, Inc. and affiliates.
-# All rights reserved.
-#
-# This source code is licensed under the terms described in the LICENSE file in
-# the root directory of this source tree.
-
-# # Copyright (c) Meta Platforms, Inc. and affiliates.
-# # All rights reserved.
-# #
-# # This source code is licensed under the terms described in the LICENSE file in
-# # the root directory of this source tree.
-
-# from llama_models.llama3.api.datatypes import URL
-# from llama_stack.apis.common.type_system import ChatCompletionInputType, StringType
-# from llama_stack.apis.datasetio import DatasetDef
-
-# mmlu = DatasetDef(
-#     identifier="mmlu",
-#     url=URL(uri="https://huggingface.co/datasets/llamastack/evals"),
-#     dataset_schema={
-#         "input_query": StringType(),
-#         "expected_answer": StringType(),
-#         "chat_completion_input": ChatCompletionInputType(),
-#     },
-#     metadata={
-#         "path": "llamastack/evals",
-#         "name": "evals__mmlu__details",
-#         "split": "train",
-#     },
-# )
--- a/llama_stack/providers/inline/meta_reference/eval/eval.py
+++ b/llama_stack/providers/inline/meta_reference/eval/eval.py
@@ -19,7 +19,6 @@ from llama_stack.apis.scoring import Scoring
 from llama_stack.providers.datatypes import EvalTasksProtocolPrivate

 from .config import MetaReferenceEvalConfig
-from .eval_task_defs.meta_reference_mmlu import meta_reference_mmlu


 class ColumnName(Enum):
@@ -51,9 +50,10 @@ class MetaReferenceEvalImpl(Eval, EvalTasksProtocolPrivate):
        self.eval_tasks = {}

    async def initialize(self) -> None:
-        # pre-register eval tasks
-        benchmark_tasks = [meta_reference_mmlu]
-        self.eval_tasks = {x.identifier: x for x in benchmark_tasks}
+        pass
+        # # pre-register eval tasks
+        # benchmark_tasks = [meta_reference_mmlu]
+        # self.eval_tasks = {x.identifier: x for x in benchmark_tasks}

    async def shutdown(self) -> None: ...

--- a/llama_stack/providers/inline/meta_reference/eval/eval_task_defs/__init__.py
+++ b/llama_stack/providers/inline/meta_reference/eval/eval_task_defs/__init__.py
@@ -1,5 +0,0 @@
-# Copyright (c) Meta Platforms, Inc. and affiliates.
-# All rights reserved.
-#
-# This source code is licensed under the terms described in the LICENSE file in
-# the root directory of this source tree.
--- a/llama_stack/providers/inline/meta_reference/eval/eval_task_defs/meta_reference_mmlu.py
+++ b/llama_stack/providers/inline/meta_reference/eval/eval_task_defs/meta_reference_mmlu.py
@@ -1,13 +0,0 @@
-# Copyright (c) Meta Platforms, Inc. and affiliates.
-# All rights reserved.
-#
-# This source code is licensed under the terms described in the LICENSE file in
-# the root directory of this source tree.
-
-from llama_stack.apis.eval import EvalTaskDef
-
-meta_reference_mmlu = EvalTaskDef(
-    identifier="meta-reference-mmlu",
-    dataset_id="mmlu",
-    scoring_functions=["meta-reference::regex_parser_multiple_choice_answer"],
-)