From 060c7c3b1f16d26283235c746edf7f523a299509 Mon Sep 17 00:00:00 2001 From: KaiMao LEE <361204176@qq.com> Date: Sun, 30 Nov 2025 17:06:39 +0800 Subject: [PATCH] Update accuracy_reward.py MIME-Version: 1.0 Content-Type: text/plain; charset=UTF-8 Content-Transfer-Encoding: 8bit 原先基于编辑距离的准确率计算有误:它直接把归一化编辑距离(即不相似度)当作得分,现改为使用相似度 1 - dist / length。 --- .../tools/reasoning_data_pipeline/utils/accuracy_reward.py | 3 ++- 1 file changed, 2 insertions(+), 1 deletion(-) diff --git a/internvl_chat/tools/reasoning_data_pipeline/utils/accuracy_reward.py b/internvl_chat/tools/reasoning_data_pipeline/utils/accuracy_reward.py index 32c0ec0b..e88b1628 100644 --- a/internvl_chat/tools/reasoning_data_pipeline/utils/accuracy_reward.py +++ b/internvl_chat/tools/reasoning_data_pipeline/utils/accuracy_reward.py @@ -512,7 +512,8 @@ def check_answer(answer_pred, answer_gt, mode): det_answer = ' '.join(answer_pred.strip().lower().split()) dist = levenshtein_distance(gt_answer, det_answer) length = max(len(answer_gt.upper()), len(answer_pred.upper())) - accuracy = max(accuracy, float(dist) / float(length)) + similarity = 1 - float(dist) / float(length) + accuracy = max(accuracy, similarity) if 'mc_score' in mode: accuracy = max(accuracy, multi_choice_score(answer_pred, answer_gt))