OpenCompass/opencompass/datasets/calm/evaluation/error/basic_adversarial/CLADDER.py
Peng Bo 07c96ac659
Calm dataset (#1385)
* Add CALM Dataset
2024-08-01 10:03:21 +08:00

44 lines
1.0 KiB
Python

import re
def check_standalization(model_response, prompt_style, type):
if model_response.startswith(('no', '', 'yes', '')):
return 0
else:
return 1
def check_empty(model_response):
if model_response == '':
return 1
else:
return 0
def check_repetition(model_response):
if any(response in model_response for response in
['answer (yes or no ?)', 'input info', '输入信息:', '答案(是或否?)']):
return 1
else:
return 0
def contains_chinese(text):
chinese_pattern = re.compile(r'[\u4e00-\u9fff]+')
result = 1 if chinese_pattern.search(text) is not None else 0
return result
def contains_english(text):
english_pattern = re.compile(r'[A-Za-z]{2,}')
result = 1 if english_pattern.search(text) is not None else 0
return result
def check_abnormality(preds):
abnormalities = 'All Yes' if all(pred == 1 for pred in preds) else \
'All No' if all(pred == 0 for pred in preds) else 0
return abnormalities