Add LLM judge LlamaStack scorer

This commit is contained in:
Xi Yan 2024-10-15 13:25:46 -07:00
parent 0c4ed66ecc
commit fa68809a2e
10 changed files with 199 additions and 7 deletions

View file

@ -13,6 +13,7 @@ GeneratorProcessorRegistry = Registry[BaseGeneratorProcessor]()
# Lookup table keyed by processor name; each value is the processor entry
# exposed under that name.
# NOTE(review): values are presumably BaseGeneratorProcessor subclasses
# defined elsewhere in the package — confirm against their definitions.
PROCESSOR_REGISTRY = {
    "mmlu": MMLUProcessor,
    "judge": JudgeProcessor,
}
for k, v in PROCESSOR_REGISTRY.items():

View file

@ -7,6 +7,7 @@
from llama_stack.apis.evals import * # noqa: F403
from llama_stack.providers.impls.meta_reference.evals.scorer.basic_scorers import * # noqa: F403
from llama_stack.providers.impls.meta_reference.evals.scorer.braintrust_scorer import * # noqa: F403
from llama_stack.providers.impls.meta_reference.evals.scorer.llm_judge_scorer import * # noqa: F403
from ..registry import Registry
@ -16,6 +17,7 @@ ScorerRegistry = Registry[BaseScorer]()
# Lookup table keyed by scorer identifier string; each value is the scorer
# entry exposed under that identifier. Keys prefixed with "braintrust::"
# map to the Braintrust-named scorers.
# NOTE(review): values are presumably BaseScorer subclasses brought in by the
# star imports at the top of the module — confirm against their definitions.
SCORER_REGISTRY = {
    "accuracy": AccuracyScorer,
    "random": RandomScorer,
    "llamastack-llm-judge": LlamaStackLLMJudgeScorer,
    "braintrust::factuality": BraintrustFactualityScorer,
    "braintrust::answer-correctness": BraintrustAnswerCorrectnessScorer,
}