import os
from typing import List, Union

import tabulate
from mmengine.config import Config

from opencompass.datasets.custom import make_custom_dataset_config
from opencompass.models import VLLM, HuggingFaceCausalLM, TurboMindModel
from opencompass.partitioners import NaivePartitioner, SizePartitioner
from opencompass.runners import DLCRunner, LocalRunner, SlurmRunner
from opencompass.tasks import OpenICLEvalTask, OpenICLInferTask
from opencompass.utils import get_logger, match_files


def match_cfg_file(workdir: str, pattern: Union[str, List[str]]) -> List[str]:
    """Match config files under ``workdir`` recursively, given the pattern.

    Additionally, if a pattern itself points to an existing file, that file
    is returned directly.
    """
    if isinstance(pattern, str):
        pattern = [pattern]
    pattern = [p + '.py' if not p.endswith('.py') else p for p in pattern]
    files = match_files(workdir, pattern, fuzzy=False)
    if len(files) != len(pattern):
        nomatched = []
        ambiguous = []
        err_msg = ('The provided pattern matched no config, or more than '
                   'one. Please verify your pattern and try again. '
                   'You may use tools/list_configs.py to list or '
                   'locate the configurations.\n')
        for p in pattern:
            files = match_files(workdir, p, fuzzy=False)
            if len(files) == 0:
                nomatched.append([p[:-3]])
            elif len(files) > 1:
                ambiguous.append([p[:-3], '\n'.join(f[1] for f in files)])
        if nomatched:
            table = [['Not matched patterns'], *nomatched]
            err_msg += tabulate.tabulate(table,
                                         headers='firstrow',
                                         tablefmt='psql')
        if ambiguous:
            table = [['Ambiguous patterns', 'Matched files'], *ambiguous]
            err_msg += tabulate.tabulate(table,
                                         headers='firstrow',
                                         tablefmt='psql')
        raise ValueError(err_msg)
    return files


def try_fill_in_custom_cfgs(config):
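    """Expand dataset entries that lack a ``type`` field into full custom
    dataset configs via ``make_custom_dataset_config``."""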
    for i, dataset in enumerate(config['datasets']):
        if 'type' not in dataset:
            config['datasets'][i] = make_custom_dataset_config(dataset)
    if 'model_dataset_combinations' not in config:
        return config
    for mdc in config['model_dataset_combinations']:
        for i, dataset in enumerate(mdc['datasets']):
            if 'type' not in dataset:
                mdc['datasets'][i] = make_custom_dataset_config(dataset)
    return config


def get_config_from_arg(args) -> Config:
    """Get the config object given args.

    Only a few argument combinations are accepted (priority from high to
    low):
    1. args.config
    2. args.models and args.datasets
    3. HuggingFace parameter groups and args.datasets
    """
    if args.config:
        config = Config.fromfile(args.config, format_python_code=False)
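        # expand dataset entries that lack a ``type`` into full custom
        # dataset configs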
        config = try_fill_in_custom_cfgs(config)
        # set infer accelerator if needed
        if args.accelerator in ['vllm', 'lmdeploy']:
            config['models'] = change_accelerator(config['models'],
                                                  args.accelerator)
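        # the eval-stage partitioner may carry its own model lists
        # (``models`` / ``judge_models``); convert those as well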
        if 'eval' in config and 'partitioner' in config['eval']:
            if 'models' in config['eval']['partitioner']:
                config['eval']['partitioner']['models'] = change_accelerator(
                    config['eval']['partitioner']['models'],
                    args.accelerator)
            if 'judge_models' in config['eval']['partitioner']:
                config['eval']['partitioner'][
                    'judge_models'] = change_accelerator(
                        config['eval']['partitioner']['judge_models'],
                        args.accelerator)
        return config

    # parse dataset args
    if not args.datasets and not args.custom_dataset_path:
        raise ValueError('You must specify "--datasets" or '
                         '"--custom-dataset-path" if you do not specify a '
                         'config file path.')
    datasets = []
    if args.datasets:
        datasets_dir = os.path.join(args.config_dir, 'datasets')
        for dataset_arg in args.datasets:
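            # a dataset arg may be "name" or "name/key_suffix"; the suffix
            # selects which dataset variable(s) to read from the config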
            if '/' in dataset_arg:
                dataset_name, dataset_key_suffix = dataset_arg.split('/', 1)
            else:
                dataset_name = dataset_arg
                dataset_key_suffix = '_datasets'

            for dataset in match_cfg_file(datasets_dir, [dataset_name]):
                get_logger().info(f'Loading {dataset[0]}: {dataset[1]}')
                cfg = Config.fromfile(dataset[1])
                for k in cfg.keys():
                    if k.endswith(dataset_key_suffix):
                        datasets += cfg[k]
    else:
        dataset = {'path': args.custom_dataset_path}
        if args.custom_dataset_infer_method is not None:
            dataset['infer_method'] = args.custom_dataset_infer_method
        if args.custom_dataset_data_type is not None:
            dataset['data_type'] = args.custom_dataset_data_type
        if args.custom_dataset_meta_path is not None:
            dataset['meta_path'] = args.custom_dataset_meta_path
        dataset = make_custom_dataset_config(dataset)
        datasets.append(dataset)

    # parse model args
    if not args.models and not args.hf_path:
        raise ValueError('You must specify a config file path, '
                         'or specify --models and --datasets, or '
                         'specify HuggingFace model parameters and '
                         '--datasets.')
    models = []
    if args.models:
        model_dir = os.path.join(args.config_dir, 'models')
        for model in match_cfg_file(model_dir, args.models):
            get_logger().info(f'Loading {model[0]}: {model[1]}')
            cfg = Config.fromfile(model[1])
            if 'models' not in cfg:
                raise ValueError(
                    f'Config file {model[1]} does not contain "models" field')
            models += cfg['models']
    else:
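        # build a HuggingFace model config directly from CLI arguments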
        from opencompass.models import HuggingFace
        model = dict(type=f'{HuggingFace.__module__}.{HuggingFace.__name__}',
                     path=args.hf_path,
                     peft_path=args.peft_path,
                     tokenizer_path=args.tokenizer_path,
                     model_kwargs=args.model_kwargs,
                     tokenizer_kwargs=args.tokenizer_kwargs,
                     max_seq_len=args.max_seq_len,
                     max_out_len=args.max_out_len,
                     batch_padding=not args.no_batch_padding,
                     batch_size=args.batch_size,
                     pad_token_id=args.pad_token_id,
                     run_cfg=dict(num_gpus=args.num_gpus))
        models.append(model)

    # set infer accelerator if needed
    if args.accelerator in ['vllm', 'lmdeploy']:
        models = change_accelerator(models, args.accelerator)

    # parse summarizer args
    summarizer_arg = args.summarizer if args.summarizer is not None \
        else 'example'
    summarizers_dir = os.path.join(args.config_dir, 'summarizers')

    # a summarizer arg may be "file" or "file/key"; the part after '/'
    # names the summarizer variable inside the config file
    if '/' in summarizer_arg:
        summarizer_file, summarizer_key = summarizer_arg.split('/', 1)
    else:
        # without '/', fall back to the conventional ``summarizer`` key
        summarizer_key = 'summarizer'
        summarizer_file = summarizer_arg

    s = match_cfg_file(summarizers_dir, [summarizer_file])[0]
    get_logger().info(f'Loading {s[0]}: {s[1]}')
    cfg = Config.fromfile(s[1])
    # Use summarizer_key to retrieve the summarizer definition
    # from the configuration file
    summarizer = cfg[summarizer_key]

    return Config(dict(models=models, datasets=datasets,
                       summarizer=summarizer),
                  format_python_code=False)


def change_accelerator(models, accelerator):
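    """Rewrite HuggingFace model configs into their vLLM or LMDeploy
    (TurboMind) equivalents for accelerated inference."""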
    models = models.copy()
    model_accels = []
    for model in models:
        get_logger().info(f'Transforming {model["abbr"]} to {accelerator}')
        # change HuggingFace model to VLLM or TurboMindModel
        if model['type'] is HuggingFaceCausalLM:
            gen_args = dict()
            if model.get('generation_kwargs') is not None:
                generation_kwargs = model['generation_kwargs'].copy()
                # fall back to near-greedy decoding defaults for any
                # missing fields
                gen_args['temperature'] = generation_kwargs.get(
                    'temperature', 0.001)
                gen_args['top_k'] = generation_kwargs.get('top_k', 1)
                gen_args['top_p'] = generation_kwargs.get('top_p', 0.9)
                # vLLM/LMDeploy expect `stop_token_ids` instead of
                # `eos_token_id`; pop with a default so a missing key does
                # not raise KeyError
                gen_args['stop_token_ids'] = generation_kwargs.pop(
                    'eos_token_id', None)
                generation_kwargs['stop_token_ids'] = gen_args[
                    'stop_token_ids']
            else:
                # if generation_kwargs is not provided, set default values
                generation_kwargs = dict()
                gen_args['temperature'] = 0.0
                gen_args['top_k'] = 1
                gen_args['top_p'] = 0.9
                gen_args['stop_token_ids'] = None

            if accelerator == 'lmdeploy':
                get_logger().info(
                    f'Transforming {model["abbr"]} to {accelerator}')
                # build the TurboMind config under a new name so optional
                # fields can still be copied from the original below
                acc_model = dict(
                    type=get_config_type(TurboMindModel),
                    abbr=model['abbr'].replace('hf', 'lmdeploy')
                    if '-hf' in model['abbr'] else model['abbr'] + '-lmdeploy',
                    path=model['path'],
                    engine_config=dict(session_len=model['max_seq_len'],
                                       max_batch_size=model['batch_size'],
                                       tp=model['run_cfg']['num_gpus']),
                    gen_config=dict(top_k=gen_args['top_k'],
                                    temperature=gen_args['temperature'],
                                    top_p=gen_args['top_p'],
                                    max_new_tokens=model['max_out_len'],
                                    stop_words=gen_args['stop_token_ids']),
                    max_out_len=model['max_out_len'],
                    max_seq_len=model['max_seq_len'],
                    batch_size=model['batch_size'],
                    concurrency=model['batch_size'],
                    run_cfg=model['run_cfg'],
                )
                for item in ['meta_template']:
                    if model.get(item) is not None:
                        acc_model[item] = model[item]
                model = acc_model
            elif accelerator == 'vllm':
                get_logger().info(
                    f'Transforming {model["abbr"]} to {accelerator}')
                acc_model = dict(
                    type=get_config_type(VLLM),
                    abbr=model['abbr'].replace('hf', 'vllm')
                    if '-hf' in model['abbr'] else model['abbr'] + '-vllm',
                    path=model['path'],
                    model_kwargs=dict(
                        tensor_parallel_size=model['run_cfg']['num_gpus']),
                    max_out_len=model['max_out_len'],
                    max_seq_len=model['max_seq_len'],
                    batch_size=model['batch_size'],
                    generation_kwargs=generation_kwargs,
                    run_cfg=model['run_cfg'],
                )
                for item in ['meta_template', 'end_str']:
                    if model.get(item) is not None:
                        acc_model[item] = model[item]
                generation_kwargs.update(
                    dict(temperature=gen_args['temperature']))
                model = acc_model
            else:
                raise ValueError(f'Unsupported accelerator {accelerator}')
        model_accels.append(model)
    return model_accels


def get_config_type(obj) -> str:
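    """Return the fully qualified ``module.ClassName`` string for ``obj``."""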
    return f'{obj.__module__}.{obj.__name__}'


def fill_infer_cfg(cfg, args):
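    """Fill the ``infer`` stage (partitioner and runner) of ``cfg`` from CLI
    arguments; ``cfg`` is modified in place."""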
    new_cfg = dict(infer=dict(
        partitioner=dict(type=get_config_type(SizePartitioner),
                         max_task_size=args.max_partition_size,
                         gen_task_coef=args.gen_task_coef),
        runner=dict(
            max_num_workers=args.max_num_workers,
            debug=args.debug,
            task=dict(type=get_config_type(OpenICLInferTask)),
            lark_bot_url=cfg['lark_bot_url'],
        )), )
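    # choose the runner backend: Slurm, Aliyun DLC, or local execution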
    if args.slurm:
        new_cfg['infer']['runner']['type'] = get_config_type(SlurmRunner)
        new_cfg['infer']['runner']['partition'] = args.partition
        new_cfg['infer']['runner']['quotatype'] = args.quotatype
        new_cfg['infer']['runner']['qos'] = args.qos
        new_cfg['infer']['runner']['retry'] = args.retry
    elif args.dlc:
        new_cfg['infer']['runner']['type'] = get_config_type(DLCRunner)
        new_cfg['infer']['runner']['aliyun_cfg'] = Config.fromfile(
            args.aliyun_cfg)
        new_cfg['infer']['runner']['retry'] = args.retry
    else:
        new_cfg['infer']['runner']['type'] = get_config_type(LocalRunner)
        new_cfg['infer']['runner'][
            'max_workers_per_gpu'] = args.max_workers_per_gpu
    cfg.merge_from_dict(new_cfg)


def fill_eval_cfg(cfg, args):
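    """Fill the ``eval`` stage (partitioner and runner) of ``cfg`` from CLI
    arguments; ``cfg`` is modified in place."""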
    new_cfg = dict(
        eval=dict(partitioner=dict(type=get_config_type(NaivePartitioner)),
                  runner=dict(
                      max_num_workers=args.max_num_workers,
                      debug=args.debug,
                      task=dict(type=get_config_type(OpenICLEvalTask)),
                      lark_bot_url=cfg['lark_bot_url'],
                  )))
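    # choose the runner backend: Slurm, Aliyun DLC, or local execution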
    if args.slurm:
        new_cfg['eval']['runner']['type'] = get_config_type(SlurmRunner)
        new_cfg['eval']['runner']['partition'] = args.partition
        new_cfg['eval']['runner']['quotatype'] = args.quotatype
        new_cfg['eval']['runner']['qos'] = args.qos
        new_cfg['eval']['runner']['retry'] = args.retry
    elif args.dlc:
        new_cfg['eval']['runner']['type'] = get_config_type(DLCRunner)
        new_cfg['eval']['runner']['aliyun_cfg'] = Config.fromfile(
            args.aliyun_cfg)
        new_cfg['eval']['runner']['retry'] = args.retry
    else:
        new_cfg['eval']['runner']['type'] = get_config_type(LocalRunner)
        new_cfg['eval']['runner'][
            'max_workers_per_gpu'] = args.max_workers_per_gpu
    cfg.merge_from_dict(new_cfg)