mirror of
https://github.com/meta-llama/llama-stack.git
synced 2025-07-30 07:39:38 +00:00
json -> class
This commit is contained in:
parent
0dad0d0d67
commit
e2f6c04e1c
6 changed files with 47 additions and 23 deletions
|
@ -20,6 +20,12 @@ from llama_stack.apis.scoring_functions import * # noqa: F403
|
||||||
from llama_stack.apis.common.type_system import * # noqa: F403
|
from llama_stack.apis.common.type_system import * # noqa: F403
|
||||||
from autoevals.llm import Factuality
|
from autoevals.llm import Factuality
|
||||||
from autoevals.ragas import AnswerCorrectness
|
from autoevals.ragas import AnswerCorrectness
|
||||||
|
from llama_stack.providers.impls.braintrust.scoring.scoring_fn.fn_defs.answer_correctness import (
|
||||||
|
answer_correctness_fn_def,
|
||||||
|
)
|
||||||
|
from llama_stack.providers.impls.braintrust.scoring.scoring_fn.fn_defs.factuality import (
|
||||||
|
factuality_fn_def,
|
||||||
|
)
|
||||||
|
|
||||||
|
|
||||||
BRAINTRUST_FN_DEFS_PATH = Path(__file__).parent / "fn_defs"
|
BRAINTRUST_FN_DEFS_PATH = Path(__file__).parent / "fn_defs"
|
||||||
|
@ -36,9 +42,10 @@ class BraintrustScoringFn(BaseScoringFn):
|
||||||
"braintrust::factuality": Factuality(),
|
"braintrust::factuality": Factuality(),
|
||||||
"braintrust::answer-correctness": AnswerCorrectness(),
|
"braintrust::answer-correctness": AnswerCorrectness(),
|
||||||
}
|
}
|
||||||
self.defs_paths = [
|
self.supported_fn_defs_registry = {
|
||||||
str(x) for x in sorted(BRAINTRUST_FN_DEFS_PATH.glob("*.json"))
|
factuality_fn_def.identifier: factuality_fn_def,
|
||||||
]
|
answer_correctness_fn_def.identifier: answer_correctness_fn_def,
|
||||||
|
}
|
||||||
|
|
||||||
async def score_row(
|
async def score_row(
|
||||||
self,
|
self,
|
||||||
|
|
|
@ -0,0 +1,5 @@
|
||||||
|
# Copyright (c) Meta Platforms, Inc. and affiliates.
|
||||||
|
# All rights reserved.
|
||||||
|
#
|
||||||
|
# This source code is licensed under the terms described in the LICENSE file in
|
||||||
|
# the root directory of this source tree.
|
|
@ -1,10 +0,0 @@
|
||||||
{
|
|
||||||
"identifier": "braintrust::answer-correctness",
|
|
||||||
"description": "Test whether an output is factual, compared to an original (`expected`) value. One of Braintrust LLM basd scorer https://github.com/braintrustdata/autoevals/blob/main/py/autoevals/llm.py",
|
|
||||||
"metadata": {},
|
|
||||||
"parameters": [],
|
|
||||||
"return_type": {
|
|
||||||
"type": "number"
|
|
||||||
},
|
|
||||||
"context": null
|
|
||||||
}
|
|
|
@ -0,0 +1,16 @@
|
||||||
|
# Copyright (c) Meta Platforms, Inc. and affiliates.
|
||||||
|
# All rights reserved.
|
||||||
|
#
|
||||||
|
# This source code is licensed under the terms described in the LICENSE file in
|
||||||
|
# the root directory of this source tree.
|
||||||
|
|
||||||
|
from llama_stack.apis.common.type_system import NumberType
|
||||||
|
from llama_stack.apis.scoring_functions import ScoringFnDef
|
||||||
|
|
||||||
|
|
||||||
|
answer_correctness_fn_def = ScoringFnDef(
|
||||||
|
identifier="braintrust::answer-correctness",
|
||||||
|
description="Test whether an output is factual, compared to an original (`expected`) value. One of Braintrust LLM basd scorer https://github.com/braintrustdata/autoevals/blob/main/py/autoevals/llm.py",
|
||||||
|
parameters=[],
|
||||||
|
return_type=NumberType(),
|
||||||
|
)
|
|
@ -1,10 +0,0 @@
|
||||||
{
|
|
||||||
"identifier": "braintrust::factuality",
|
|
||||||
"description": "Test whether an output is factual, compared to an original (`expected`) value. One of Braintrust LLM basd scorer https://github.com/braintrustdata/autoevals/blob/main/py/autoevals/llm.py",
|
|
||||||
"metadata": {},
|
|
||||||
"parameters": [],
|
|
||||||
"return_type": {
|
|
||||||
"type": "number"
|
|
||||||
},
|
|
||||||
"context": null
|
|
||||||
}
|
|
|
@ -0,0 +1,16 @@
|
||||||
|
# Copyright (c) Meta Platforms, Inc. and affiliates.
|
||||||
|
# All rights reserved.
|
||||||
|
#
|
||||||
|
# This source code is licensed under the terms described in the LICENSE file in
|
||||||
|
# the root directory of this source tree.
|
||||||
|
|
||||||
|
from llama_stack.apis.common.type_system import NumberType
|
||||||
|
from llama_stack.apis.scoring_functions import ScoringFnDef
|
||||||
|
|
||||||
|
|
||||||
|
factuality_fn_def = ScoringFnDef(
|
||||||
|
identifier="braintrust::factuality",
|
||||||
|
description="Test whether an output is factual, compared to an original (`expected`) value. One of Braintrust LLM basd scorer https://github.com/braintrustdata/autoevals/blob/main/py/autoevals/llm.py",
|
||||||
|
parameters=[],
|
||||||
|
return_type=NumberType(),
|
||||||
|
)
|
Loading…
Add table
Add a link
Reference in a new issue