# OpenCompass/opencompass/tasks/base.py

import copy
import os
import re
from abc import abstractmethod
from typing import List, Optional

from mmengine.config import ConfigDict

from opencompass.utils import get_infer_output_path, task_abbr_from_cfg


def extract_role_pred(s: str, begin_str: Optional[str],
                      end_str: Optional[str]) -> str:
    """Extract the role prediction from the full prediction string.

    The role prediction is the substring located between ``begin_str`` and
    ``end_str``. A marker that is ``None``, empty, or consists solely of
    whitespace is ignored. A marker that does not occur in ``s`` leaves the
    corresponding boundary at the start (or end) of ``s``.

    Args:
        s (str): Full prediction string.
        begin_str (str, optional): The beginning string of the role.
        end_str (str, optional): The ending string of the role.

    Returns:
        str: The extracted role prediction.
    """
    start = 0
    end = len(s)

    # NOTE: `re.match` with the pattern \s* always succeeds (zero-width match
    # at position 0), so comparing its result to None never detects anything.
    # `re.fullmatch` returns None exactly when the marker contains at least
    # one non-whitespace character, which is the case we want to act on.
    if begin_str and re.fullmatch(r'\s*', begin_str) is None:
        begin_idx = s.find(begin_str)
        if begin_idx != -1:
            # Skip past the marker itself.
            start = begin_idx + len(begin_str)

    if end_str and re.fullmatch(r'\s*', end_str) is None:
        # TODO: Support calling tokenizer for the accurate eos token
        # and avoid such hardcode
        # Only look for the end marker after the chosen start position.
        end_idx = s.find(end_str, start)
        if end_idx != -1:
            end = end_idx

    return s[start:end]


class BaseTask:
    """Common base class shared by every task.

    A task can be executed in one of two ways:
    1. In-process, by invoking the `run` method.
    2. Through the shell, by asking `get_command` for a command string
        and then executing that command.

    Args:
        cfg (ConfigDict): Config dict.
    """

    # Prefix placed in front of the task abbreviation to build the name.
    name_prefix: str = None
    # Subdirectory of the work directory in which log files are stored.
    log_subdir: str = None
    # Subdirectory of the work directory in which output files are stored.
    output_subdir: str = None

    def __init__(self, cfg: ConfigDict):
        # Keep a private deep copy so later changes to the task's config do
        # not leak back into the object supplied by the caller.
        self.cfg = copy.deepcopy(cfg)
        self.model_cfgs = self.cfg['models']
        self.dataset_cfgs = self.cfg['datasets']
        self.work_dir = self.cfg['work_dir']

    @abstractmethod
    def run(self):
        """Execute the task."""

    @abstractmethod
    def get_command(self, cfg_path, template) -> str:
        """Build the shell command for the task.

        Args:
            cfg_path (str): Path to the task's config file.
            template (str): A template containing the '{task_cmd}'
                placeholder that is used to format the command.
        """

    @property
    def name(self) -> str:
        """Task name: `name_prefix` followed by the task abbreviation."""
        prefix = self.name_prefix
        abbr = task_abbr_from_cfg(
            dict(models=self.model_cfgs, datasets=self.dataset_cfgs))
        return prefix + abbr

    def __repr__(self) -> str:
        cls_name = self.__class__.__name__
        return f'{cls_name}({self.cfg})'

    def get_log_path(self, file_extension: str = 'json') -> str:
        """Return the path of the task's log file.

        The path is derived from the first model and the first dataset of
        the first dataset group, rooted at `work_dir/log_subdir`.

        Args:
            file_extension (str): Extension of the log file.
                Default: 'json'.
        """
        first_model = self.model_cfgs[0]
        first_dataset = self.dataset_cfgs[0][0]
        log_root = os.path.join(self.work_dir, self.log_subdir)
        return get_infer_output_path(first_model, first_dataset, log_root,
                                     file_extension)

    def get_output_paths(self, file_extension: str = 'json') -> List[str]:
        """Return the path of every output file of the task.

        All of these files should exist once the task has succeeded. Models
        are paired positionally with their dataset groups, and one path is
        produced per (model, dataset) combination under
        `work_dir/output_subdir`.

        Args:
            file_extension (str): Extension of the output files.
                Default: 'json'.
        """
        return [
            get_infer_output_path(
                model_cfg, dataset_cfg,
                os.path.join(self.work_dir, self.output_subdir),
                file_extension)
            for model_cfg, dataset_group in zip(self.model_cfgs,
                                                self.dataset_cfgs)
            for dataset_cfg in dataset_group
        ]
[Fix] Use a copy of the config object in Task (#174) 2023-08-09 15:24:49 +08:00			`import copy`
Add release contribution 2023-07-05 10:33:12 +08:00			`import os`
[Update] Update Skywork/Qwen-QwQ (#1728) * Update JuderBench * Support O1-style Prompts * Update Code * Update OpenAI * Update BigCodeBench * Update BigCodeBench * Update BigCodeBench * Update BigCodeBench * Update BigCodeBench * Update 2024-12-05 19:30:43 +08:00			`import re`
Add release contribution 2023-07-05 10:33:12 +08:00			`from abc import abstractmethod`
[Update] Update Skywork/Qwen-QwQ (#1728) * Update JuderBench * Support O1-style Prompts * Update Code * Update OpenAI * Update BigCodeBench * Update BigCodeBench * Update BigCodeBench * Update BigCodeBench * Update BigCodeBench * Update 2024-12-05 19:30:43 +08:00			`from typing import List, Optional`
Add release contribution 2023-07-05 10:33:12 +08:00
			`from mmengine.config import ConfigDict`

			`from opencompass.utils import get_infer_output_path, task_abbr_from_cfg`


[Update] Update Skywork/Qwen-QwQ (#1728) * Update JuderBench * Support O1-style Prompts * Update Code * Update OpenAI * Update BigCodeBench * Update BigCodeBench * Update BigCodeBench * Update BigCodeBench * Update BigCodeBench * Update 2024-12-05 19:30:43 +08:00			`def extract_role_pred(s: str, begin_str: Optional[str],`
			`end_str: Optional[str]) -> str:`
			`"""Extract the role prediction from the full prediction string. The role`
			`prediction may be the substring between the begin and end string.`

			`Args:`
			`s (str): Full prediction string.`
			`begin_str (str): The beginning string of the role`
			`end_str (str): The ending string of the role.`

			`Returns:`
			`str: The extracted role prediction.`
			`"""`
			`start = 0`
			`end = len(s)`

			`if begin_str and re.match(r'\s*', begin_str) is None:`
			`begin_idx = s.find(begin_str)`
			`if begin_idx != -1:`
			`start = begin_idx + len(begin_str)`

			`if end_str and re.match(r'\s*', end_str) is None:`
			`# TODO: Support calling tokenizer for the accurate eos token`
			`# and avoid such hardcode`
			`end_idx = s.find(end_str, start)`
			`if end_idx != -1:`
			`end = end_idx`

			`return s[start:end]`


Add release contribution 2023-07-05 10:33:12 +08:00			`class BaseTask:`
			`"""Base class for all tasks. There are two ways to run the task:`
			1. Directly by calling the `run` method.
Auto re-generate port number during retry (#24) * Auto re-generate port number during retry * Fix slurm command 2023-07-07 17:25:56 +08:00			2. Calling the `get_command` method to get the command,
Add release contribution 2023-07-05 10:33:12 +08:00			`and then run the command in the shell.`

			`Args:`
			`cfg (ConfigDict): Config dict.`
			`"""`

			`# The prefix of the task name.`
			`name_prefix: str = None`
			`# The subdirectory of the work directory to store the log files.`
			`log_subdir: str = None`
			`# The subdirectory of the work directory to store the output files.`
			`output_subdir: str = None`

			`def __init__(self, cfg: ConfigDict):`
[Fix] Use a copy of the config object in Task (#174) 2023-08-09 15:24:49 +08:00			`cfg = copy.deepcopy(cfg)`
Add release contribution 2023-07-05 10:33:12 +08:00			`self.cfg = cfg`
			`self.model_cfgs = cfg['models']`
			`self.dataset_cfgs = cfg['datasets']`
			`self.work_dir = cfg['work_dir']`

			`@abstractmethod`
			`def run(self):`
			`"""Run the task."""`

			`@abstractmethod`
Auto re-generate port number during retry (#24) * Auto re-generate port number during retry * Fix slurm command 2023-07-07 17:25:56 +08:00			`def get_command(self, cfg_path, template) -> str:`
Add release contribution 2023-07-05 10:33:12 +08:00			`"""Get the command template for the task.`

Auto re-generate port number during retry (#24) * Auto re-generate port number during retry * Fix slurm command 2023-07-07 17:25:56 +08:00			`Args:`
			`cfg_path (str): The path to the config file of the task.`
			`template (str): The template which have '{task_cmd}' to format`
			`the command.`
Add release contribution 2023-07-05 10:33:12 +08:00			`"""`

			`@property`
			`def name(self) -> str:`
			`return self.name_prefix + task_abbr_from_cfg(`
			`{`
			`'models': self.model_cfgs,`
			`'datasets': self.dataset_cfgs`
			`})`

			`def __repr__(self) -> str:`
			`return f'{self.__class__.__name__}({self.cfg})'`

			`def get_log_path(self, file_extension: str = 'json') -> str:`
			`"""Get the path to the log file.`

			`Args:`
			`file_extension (str): The file extension of the log file.`
			`Default: 'json'.`
			`"""`
			`return get_infer_output_path(`
			`self.model_cfgs[0], self.dataset_cfgs[0][0],`
			`os.path.join(self.work_dir, self.log_subdir), file_extension)`

			`def get_output_paths(self, file_extension: str = 'json') -> List[str]:`
			`"""Get the paths to the output files. Every file should exist if the`
			`task succeeds.`

			`Args:`
			`file_extension (str): The file extension of the output files.`
			`Default: 'json'.`
			`"""`
			`output_paths = []`
			`for model, datasets in zip(self.model_cfgs, self.dataset_cfgs):`
			`for dataset in datasets:`
			`output_paths.append(`
			`get_infer_output_path(`
			`model, dataset,`
			`os.path.join(self.work_dir, self.output_subdir),`
			`file_extension))`
			`return output_paths`