diff --git a/llama_stack/providers/inline/scoring/basic/scoring_fn/docvqa_scoring_fn.py b/llama_stack/providers/inline/scoring/basic/scoring_fn/docvqa_scoring_fn.py index 937580d71..9f7b99879 100644 --- a/llama_stack/providers/inline/scoring/basic/scoring_fn/docvqa_scoring_fn.py +++ b/llama_stack/providers/inline/scoring/basic/scoring_fn/docvqa_scoring_fn.py @@ -235,7 +235,7 @@ class DocVQAScoringFn(RegisteredBaseScoringFn): print("SCORE_ROW ======") print(input_row) expected_answers = json.loads(input_row["expected_answer"]) - generated_answer = input_row["generated_answer"].text + generated_answer = input_row["generated_answer"] score = 1.0 if normalize_answer(generated_answer) in [normalize_answer(s) for s in expected_answers] else 0.0 return { "score": score,