mirror of
https://github.com/meta-llama/llama-stack.git
synced 2025-12-15 23:59:26 +00:00
llm judge llamastack scorer
This commit is contained in:
parent
0c4ed66ecc
commit
fa68809a2e
10 changed files with 199 additions and 7 deletions
|
|
@ -13,6 +13,7 @@ GeneratorProcessorRegistry = Registry[BaseGeneratorProcessor]()
|
|||
|
||||
PROCESSOR_REGISTRY = {
|
||||
"mmlu": MMLUProcessor,
|
||||
"judge": JudgeProcessor,
|
||||
}
|
||||
|
||||
for k, v in PROCESSOR_REGISTRY.items():
|
||||
|
|
|
|||
|
|
@ -7,6 +7,7 @@
|
|||
from llama_stack.apis.evals import * # noqa: F403
|
||||
from llama_stack.providers.impls.meta_reference.evals.scorer.basic_scorers import * # noqa: F403
|
||||
from llama_stack.providers.impls.meta_reference.evals.scorer.braintrust_scorer import * # noqa: F403
|
||||
from llama_stack.providers.impls.meta_reference.evals.scorer.llm_judge_scorer import * # noqa: F403
|
||||
|
||||
from ..registry import Registry
|
||||
|
||||
|
|
@ -16,6 +17,7 @@ ScorerRegistry = Registry[BaseScorer]()
|
|||
SCORER_REGISTRY = {
|
||||
"accuracy": AccuracyScorer,
|
||||
"random": RandomScorer,
|
||||
"llamastack-llm-judge": LlamaStackLLMJudgeScorer,
|
||||
"braintrust::factuality": BraintrustFactualityScorer,
|
||||
"braintrust::answer-correctness": BraintrustAnswerCorrectnessScorer,
|
||||
}
|
||||
|
|
|
|||
Loading…
Add table
Add a link
Reference in a new issue