diff --git a/ais_bench/benchmark/configs/datasets/cmmlu/cmmlu_gen_5_shot_cot_chat_prompt.py b/ais_bench/benchmark/configs/datasets/cmmlu/cmmlu_gen_5_shot_cot_chat_prompt.py index c5bc0714..b5be5f33 100644 --- a/ais_bench/benchmark/configs/datasets/cmmlu/cmmlu_gen_5_shot_cot_chat_prompt.py +++ b/ais_bench/benchmark/configs/datasets/cmmlu/cmmlu_gen_5_shot_cot_chat_prompt.py @@ -120,7 +120,7 @@ evaluator=dict(type=AccEvaluator), pred_postprocessor=dict( type=match_answer_pattern, - answer_pattern=r'(?i)答案\s*:\s*[\W]*([A-D])[\W]*', + answer_pattern=r'(?i)答案\s*[::]\s*[\W]*([A-D])[\W]*', ) ) cmmlu_datasets.append(