OpenCompass/opencompass/tasks/base.py
Songyang Zhang fb43dd1906
[Update] Update Skywork/Qwen-QwQ (#1728)
* Update JuderBench

* Support O1-style Prompts

* Update Code

* Update OpenAI

* Update BigCodeBench

* Update BigCodeBench

* Update BigCodeBench

* Update BigCodeBench

* Update BigCodeBench

* Update
2024-12-05 19:30:43 +08:00

120 lines
3.7 KiB
Python

import copy
import os
import re
from abc import abstractmethod
from typing import List, Optional
from mmengine.config import ConfigDict
from opencompass.utils import get_infer_output_path, task_abbr_from_cfg
def extract_role_pred(s: str, begin_str: Optional[str],
                      end_str: Optional[str]) -> str:
    """Extract the role prediction from the full prediction string.

    The role prediction is the substring of ``s`` that lies between the
    first occurrence of ``begin_str`` and the first subsequent occurrence
    of ``end_str``. A marker that is ``None``, empty, or consists solely of
    whitespace is ignored. A marker that does not occur in ``s`` leaves the
    corresponding boundary at the start / end of ``s``.

    Args:
        s (str): Full prediction string.
        begin_str (str, optional): The beginning string of the role.
        end_str (str, optional): The ending string of the role.

    Returns:
        str: The extracted role prediction.
    """
    start = 0
    end = len(s)

    # NOTE: ``re.fullmatch`` is required here. ``re.match(r'\s*', x)`` always
    # succeeds (``\s*`` matches the empty prefix of any string), so comparing
    # its result with None would disable the extraction entirely.
    if begin_str and re.fullmatch(r'\s*', begin_str) is None:
        begin_idx = s.find(begin_str)
        if begin_idx != -1:
            # Skip past the marker itself.
            start = begin_idx + len(begin_str)

    if end_str and re.fullmatch(r'\s*', end_str) is None:
        # TODO: Support calling tokenizer for the accurate eos token
        # and avoid such hardcode
        # Only look for the end marker after the start of the prediction.
        end_idx = s.find(end_str, start)
        if end_idx != -1:
            end = end_idx

    return s[start:end]
class BaseTask:
    """Common base class of all tasks.

    A task can be executed in either of two ways:

    1. In-process, by calling :meth:`run`.
    2. Via the shell, by obtaining a command from :meth:`get_command` and
       running that command.

    Args:
        cfg (ConfigDict): Config dict. It is deep-copied on construction and
            must provide the ``'models'``, ``'datasets'`` and ``'work_dir'``
            entries.
    """

    # The prefix of the task name (concatenated in front of the
    # abbreviation by the ``name`` property).
    name_prefix: str = None
    # The subdirectory of the work directory to store the log files.
    log_subdir: str = None
    # The subdirectory of the work directory to store the output files.
    output_subdir: str = None

    def __init__(self, cfg: ConfigDict):
        # Hold a deep copy rather than the object handed in by the caller.
        own_cfg = copy.deepcopy(cfg)
        self.cfg = own_cfg
        self.model_cfgs = own_cfg['models']
        self.dataset_cfgs = own_cfg['datasets']
        self.work_dir = own_cfg['work_dir']

    @abstractmethod
    def run(self):
        """Run the task."""

    @abstractmethod
    def get_command(self, cfg_path, template) -> str:
        """Get the command template for the task.

        Args:
            cfg_path (str): The path to the config file of the task.
            template (str): The template which have '{task_cmd}' to format
                the command.
        """

    @property
    def name(self) -> str:
        """Task name: ``name_prefix`` followed by the abbreviation that
        ``task_abbr_from_cfg`` produces for this task's models and
        datasets."""
        abbr_cfg = {
            'models': self.model_cfgs,
            'datasets': self.dataset_cfgs,
        }
        return self.name_prefix + task_abbr_from_cfg(abbr_cfg)

    def __repr__(self) -> str:
        cls_name = self.__class__.__name__
        return f'{cls_name}({self.cfg})'

    def get_log_path(self, file_extension: str = 'json') -> str:
        """Get the path to the log file.

        The path is built by ``get_infer_output_path`` from the first model
        config and the first dataset of the first dataset group, rooted at
        ``work_dir/log_subdir``.

        Args:
            file_extension (str): The file extension of the log file.
                Default: 'json'.
        """
        first_model = self.model_cfgs[0]
        first_dataset = self.dataset_cfgs[0][0]
        log_root = os.path.join(self.work_dir, self.log_subdir)
        return get_infer_output_path(first_model, first_dataset, log_root,
                                     file_extension)

    def get_output_paths(self, file_extension: str = 'json') -> List[str]:
        """Get the paths to the output files. Every file should exist if the
        task succeeds.

        One path is produced per (model, dataset) pair, where the i-th model
        is paired with every dataset in the i-th dataset group.

        Args:
            file_extension (str): The file extension of the output files.
                Default: 'json'.
        """
        return [
            get_infer_output_path(
                model_cfg, dataset_cfg,
                os.path.join(self.work_dir, self.output_subdir),
                file_extension)
            for model_cfg, dataset_group in zip(self.model_cfgs,
                                                self.dataset_cfgs)
            for dataset_cfg in dataset_group
        ]