mirror of
https://github.com/open-compass/opencompass.git
synced 2025-05-30 16:03:24 +08:00

* [Feature] Add Ruler datasets * pre-commit fixed * Add model specific tokenizer to dataset * pre-commit modified * remove unused import * fix linting * add trust_remote to tokenizer load * lint fix * comments resolved * fix lint * Add readme * Fix lint * ruler refactorize * fix lint * lint fix * updated * lint fix * fix wonderwords import issue * prompt modified * update * readme updated * update * ruler dataset added * Update --------- Co-authored-by: tonysy <sy.zhangbuaa@gmail.com>
39 lines
1.2 KiB
Python
39 lines
1.2 KiB
Python
# Config helper first, then the project's own partitioner / runner / task
# classes referenced by the `infer` and `eval` sections of this config.
from mmengine.config import read_base

from opencompass.partitioners import NaivePartitioner, NumWorkerPartitioner
from opencompass.runners import LocalRunner
from opencompass.tasks import OpenICLEvalTask, OpenICLInferTask

# Bring in the model list, the combined RULER datasets and the RULER summary
# groups from other config modules. `ruler_combined_datasets` and
# `ruler_summary_groups` look unused, but they are collected further down by
# the name-suffix scans over `locals()` (`_datasets` / `_summary_groups`).
# NOTE(review): two imports are rooted at `..configs` while the dataset import
# is rooted at `.datasets` -- confirm both resolve from this file's location.
with read_base():
    from ..configs.models.hf_internlm.lmdeploy_internlm2_5_7b_chat_1m import (
        models as internlm2_5_7b_chat_1m,
    )
    from .datasets.ruler.ruler_combined_gen import ruler_combined_datasets
    from ..configs.summarizers.groups.ruler import ruler_summary_groups

# Concatenate every list bound at this scope whose name ends in `_datasets`
# into one flat list. A generator expression keeps the loop variables out of
# the module namespace.
datasets = sum(
    (value for name, value in locals().items() if name.endswith('_datasets')),
    [],
)
# Evaluate the model list imported under the alias `internlm2_5_7b_chat_1m`.
models = internlm2_5_7b_chat_1m
# Output directory for this run.
work_dir = './outputs/ruler'

# Inference stage: NumWorkerPartitioner configured with num_worker=2, run by
# a LocalRunner (max_num_workers=16, retry=5) executing OpenICLInferTask.
infer = dict(
    partitioner=dict(type=NumWorkerPartitioner, num_worker=2),
    runner=dict(
        type=LocalRunner,
        max_num_workers=16,
        task=dict(type=OpenICLInferTask),
        retry=5,
    ),
)

# Evaluation stage: NaivePartitioner, run by a LocalRunner
# (max_num_workers=32) executing OpenICLEvalTask.
# NOTE(review): the name `eval` shadows the builtin; presumably the framework
# looks this key up by name, so it is kept as-is -- confirm before renaming.
eval = dict(
    partitioner=dict(type=NaivePartitioner),
    runner=dict(
        type=LocalRunner,
        max_num_workers=32,
        task=dict(type=OpenICLEvalTask),
    ),
)

# Summary section: list the four RULER context-length entries and attach
# every list bound at this scope whose name ends in `_summary_groups`,
# concatenated into one flat list.
summarizer = dict(
    dataset_abbrs=['ruler_4k', 'ruler_8k', 'ruler_16k', 'ruler_32k'],
    summary_groups=sum(
        (
            value
            for name, value in locals().items()
            if name.endswith('_summary_groups')
        ),
        [],
    ),
)