From fb14606ee98e364112d71263ffc3a3364af732df Mon Sep 17 00:00:00 2001 From: F0undLinks <2862323246@qq.com> Date: Thu, 18 Jun 2026 09:39:52 +0800 Subject: [PATCH 1/2] Update cmmlu_gen_5_shot_cot_chat_prompt.py debug --- .../configs/datasets/cmmlu/cmmlu_gen_5_shot_cot_chat_prompt.py | 3 ++- 1 file changed, 2 insertions(+), 1 deletion(-) diff --git a/ais_bench/benchmark/configs/datasets/cmmlu/cmmlu_gen_5_shot_cot_chat_prompt.py b/ais_bench/benchmark/configs/datasets/cmmlu/cmmlu_gen_5_shot_cot_chat_prompt.py index c5bc0714..22d28514 100644 --- a/ais_bench/benchmark/configs/datasets/cmmlu/cmmlu_gen_5_shot_cot_chat_prompt.py +++ b/ais_bench/benchmark/configs/datasets/cmmlu/cmmlu_gen_5_shot_cot_chat_prompt.py @@ -120,7 +120,8 @@ evaluator=dict(type=AccEvaluator), pred_postprocessor=dict( type=match_answer_pattern, - answer_pattern=r'(?i)答案\s*:\s*[\W]*([A-D])[\W]*', + #answer_pattern=r'(?i)答案\s*:\s*[\W]*([A-D])[\W]*', + answer_pattern=r'(?i)答案\s*[::]\s*[\W]*([A-D])[\W]*', ) ) cmmlu_datasets.append( From 687540c3f998fd2a3976e706fd5b96ed263494fb Mon Sep 17 00:00:00 2001 From: F0undLinks <2862323246@qq.com> Date: Thu, 18 Jun 2026 09:47:31 +0800 Subject: [PATCH 2/2] Update ais_bench/benchmark/configs/datasets/cmmlu/cmmlu_gen_5_shot_cot_chat_prompt.py Co-authored-by: gemini-code-assist[bot] <176961590+gemini-code-assist[bot]@users.noreply.github.com> --- .../configs/datasets/cmmlu/cmmlu_gen_5_shot_cot_chat_prompt.py | 1 - 1 file changed, 1 deletion(-) diff --git a/ais_bench/benchmark/configs/datasets/cmmlu/cmmlu_gen_5_shot_cot_chat_prompt.py b/ais_bench/benchmark/configs/datasets/cmmlu/cmmlu_gen_5_shot_cot_chat_prompt.py index 22d28514..b5be5f33 100644 --- a/ais_bench/benchmark/configs/datasets/cmmlu/cmmlu_gen_5_shot_cot_chat_prompt.py +++ b/ais_bench/benchmark/configs/datasets/cmmlu/cmmlu_gen_5_shot_cot_chat_prompt.py @@ -120,7 +120,6 @@ evaluator=dict(type=AccEvaluator), pred_postprocessor=dict( type=match_answer_pattern, - #answer_pattern=r'(?i)答案\s*:\s*[\W]*([A-D])[\W]*', 
answer_pattern=r'(?i)答案\s*[::]\s*[\W]*([A-D])[\W]*', ) )