diff --git a/ais_bench/benchmark/configs/datasets/cmmlu/cmmlu_gen_0_shot_cot_chat_prompt.py b/ais_bench/benchmark/configs/datasets/cmmlu/cmmlu_gen_0_shot_cot_chat_prompt.py index 9ee0996c..aabbe360 100644 --- a/ais_bench/benchmark/configs/datasets/cmmlu/cmmlu_gen_0_shot_cot_chat_prompt.py +++ b/ais_bench/benchmark/configs/datasets/cmmlu/cmmlu_gen_0_shot_cot_chat_prompt.py @@ -108,7 +108,7 @@ evaluator=dict(type=AccEvaluator), pred_postprocessor=dict( type=match_answer_pattern, - answer_pattern=r'(?i)答案\s*:\s*[\W]*([A-D])[\W]*', + answer_pattern=r'(?i)答案\s*[::]\s*[\W]*([A-D])[\W]*', ) ) cmmlu_datasets.append(