fix lint

2025-05-30 16:03:24 +08:00 · 2025-05-08 11:12:17 +00:00 · 2025-05-08 11:12:17 +00:00 · 724472ee5d
commit 724472ee5d
parent b9aa1c17f7
2 changed files with 13 additions and 15 deletions
--- a/opencompass/configs/datasets/MedCalc_Bench/MedCalcBench_official_gen_a5155f.py
+++ b/opencompass/configs/datasets/MedCalc_Bench/MedCalcBench_official_gen_a5155f.py
@ -4,7 +4,6 @@ from opencompass.openicl.icl_prompt_template import PromptTemplate
 from opencompass.openicl.icl_retriever import ZeroRetriever
 ZERO_SHOT_PROMPT = 'You are a helpful assistant for calculating a score for a given patient note. Please think step-by-step to solve the question and then generate the required score. Your output should only contain a JSON dict formatted as {"step_by_step_thinking": str(your_step_by_step_thinking_procress_to_solve_the_question), "answer": str(short_and_direct_answer_of_the_question)}. \n Here is the patient note:\n{patient_note}\n\nHere is the task:\n{question}\n\nPlease directly output the JSON dict formatted as {"step_by_step_thinking": str(your_step_by_step_thinking_procress_to_solve_the_question), "answer": str(short_and_direct_answer_of_the_question)}:'
 # Reader configuration
 reader_cfg = dict(
        input_columns=[
--- a/opencompass/datasets/MedCalc_Bench.py
+++ b/opencompass/datasets/MedCalc_Bench.py
@ -1,16 +1,12 @@
 import argparse
 import math
 import os
 import re
 from datetime import datetime
 import numpy as np
-import pandas as pd
+from datasets import load_dataset
 from datasets import Dataset, load_dataset
 from opencompass.openicl import BaseEvaluator
-from opencompass.registry import LOAD_DATASET, TEXT_POSTPROCESSORS
+from opencompass.registry import LOAD_DATASET
 from opencompass.utils import get_logger
 from .base import BaseDataset
 """
@ -97,7 +93,13 @@ def extract_answer(answer, calid):
        extracted_answer = 'Not Found'
    else:
        extracted_answer = extracted_answer[-1].strip().strip('"')
-        if extracted_answer == 'str(short_and_direct_answer_of_the_question)' or extracted_answer == 'str(value which is the answer to the question)' or extracted_answer == 'X.XX':
+        if extracted_answer == 'str(short_and_direct\
                _answer_of_the_question)':
            extracted_answer = 'Not Found'
        if extracted_answer == 'str(value which is\
                the answer to the question)':
            extracted_answer = 'Not Found'
        if extracted_answer == 'X.XX':
            extracted_answer = 'Not Found'
    if calid in [13, 68]:
@ -116,9 +118,8 @@ def extract_answer(answer, calid):
    elif calid in [69]:
        # Output Type: integer (A, B)
        match = re.search(
-            r"\(?[\"\']?(\d+)\s*(weeks?)?[\"\']?,?\s*[\"\']?(\d+)\s*(days?)?[\"\']?\s*\)?",
+            r"\(?[\"\']?(\d+)\s*(weeks?)?[\"\']?,\?\s*[\"\']?(\d+)\s*(days?)?[\"\']?\s*\)?",
            extracted_answer)
        ground_truth = f'({match.group(1)}, {match.group(3)})'
        extracted_answer = extracted_answer.replace('[', '(').replace(
            ']', ')').replace("'", '').replace('"', '')
        match = re.search(
@ -157,7 +158,7 @@ def extract_answer(answer, calid):
    ]:
        # Output Type: decimal
        match = re.search(r'str\((.*)\)', extracted_answer)
-        if match:  # cases like "str(round((140 * (3.15 - 136) / 1400) * 72.36)"
+        if match:
            expression = match.group(1).replace('^', '**').replace(
                'is odd', '% 2 == 1').replace('is even', '% 2 == 0').replace(
                    'sqrt', 'math.sqrt').replace('.math', '').replace(
@ -166,9 +167,7 @@ def extract_answer(answer, calid):
                            'g/dl', '').replace('mmol/L', '').replace(
                                'kg', '').replace('g',
                                                  '').replace('mEq/L', '')
-            expression = expression.split(
+            expression = expression.split('#')[0]
                '#'
            )[0]  # cases like round(45.5 * 166 - 45.3 + 0.4 * (75 - (45.5 * 166 - 45.3))))) # Calculation: ...
            if expression.count('(') > expression.count(')'):  # add missing ')
                expression += ')' * (expression.count('(') -
                                     expression.count(')'))
@ -188,7 +187,7 @@ def extract_answer(answer, calid):
                    'np': np,
                    'numpy': np
                })
-            except:
+            except Exception:
                print(f'Error in evaluating expression: {expression}')
                answer = 'N/A'
        else: