2024-12-31 15:17:39 +08:00
|
|
|
from mmengine.config import read_base
|
|
|
|
|
2025-01-20 19:17:38 +08:00
|
|
|
from opencompass.models import OpenAISDK
|
2024-12-31 15:17:39 +08:00
|
|
|
|
|
|
|
# Base-config imports: names imported inside read_base() are pulled from other
# OpenCompass config modules and used below as plain module-level variables.
with read_base():
    # Choose a list of datasets.
    from opencompass.configs.datasets.livestembench.livestembench_gen_3e3c50 import \
        livestembench_datasets
    # Choose the models of interest.
    from opencompass.configs.models.qwen2_5.lmdeploy_qwen2_5_7b_instruct import \
        models as qwen2_5_7b_instruct_lmdeploy_model
    from opencompass.configs.models.qwen2_5.lmdeploy_qwen2_5_72b_instruct import \
        models as qwen2_5_72b_instruct_lmdeploy_model
|
2024-12-31 15:17:39 +08:00
|
|
|
|
|
|
|
# Flatten every module-level variable whose name ends in `_datasets` into one
# list. locals() is the generator's outermost iterable, so it is evaluated
# here at module scope, not inside the generator.
datasets = sum(
    (entries for name, entries in locals().items()
     if name.endswith('_datasets')),
    [],
)
|
2025-01-20 19:17:38 +08:00
|
|
|
# Models to evaluate: the entries of both imported Qwen2.5 model lists,
# unpacked into a single flat list.
models = [
    *qwen2_5_7b_instruct_lmdeploy_model,
    *qwen2_5_72b_instruct_lmdeploy_model,
]
|
2024-12-31 15:17:39 +08:00
|
|
|
|
|
|
|
# Judge model configuration.
# Meta template passed to the judge model: one round consists of a HUMAN entry
# followed by a BOT entry; the BOT entry carries generate=True.
api_meta_template = dict(
    round=[
        dict(role='HUMAN', api_role='HUMAN'),
        dict(role='BOT', api_role='BOT', generate=True),
    ],
)
|
|
|
|
|
|
|
|
# Settings for the judge model, accessed through the OpenAISDK model wrapper.
# `path` and `openai_api_base` are placeholders to be replaced with the values
# of your own deployment.
judge_cfg = dict(
    abbr='qwen2-5-72b-instruct',
    type=OpenAISDK,
    path='YOUR_SERVER_MODEL_NAME',  # name of the model you deployed
    key='None',  # literal string, not the None object
    openai_api_base=[
        'http://localhost:23333/v1',  # address where your model is served
    ],
    meta_template=api_meta_template,
    query_per_second=16,
    batch_size=16,
    temperature=0.001,
    max_completion_tokens=32768,
)
|
|
|
|
|
|
|
|
# Attach the judge settings to the evaluator config of every dataset.
# All datasets reference the same judge_cfg dict object; no copy is made.
for dataset in datasets:
    dataset['eval_cfg']['evaluator']['judge_cfg'] = judge_cfg
|
|
|
|
|
|
|
|
# -------------Inference Stage ----------------------------------------
|
|
|
|
|
2025-01-20 19:17:38 +08:00
|
|
|
from opencompass.partitioners import NaivePartitioner, NumWorkerPartitioner
|
2024-12-31 15:17:39 +08:00
|
|
|
from opencompass.runners import LocalRunner
|
2025-01-20 19:17:38 +08:00
|
|
|
from opencompass.tasks import OpenICLEvalTask, OpenICLInferTask
|
2024-12-31 15:17:39 +08:00
|
|
|
|
|
|
|
# Inference stage: NumWorkerPartitioner configured with num_worker=8, run by a
# LocalRunner with at most 8 workers executing OpenICLInferTask.
infer = dict(
    partitioner=dict(type=NumWorkerPartitioner, num_worker=8),
    runner=dict(
        type=LocalRunner,
        max_num_workers=8,
        task=dict(type=OpenICLInferTask),
    ),
)
|
|
|
|
|
|
|
|
# Evaluation stage: NaivePartitioner configured with n=8, run by a LocalRunner
# with at most 256 workers executing OpenICLEvalTask.
# NOTE(review): the name shadows the builtin `eval`; it is kept because it is
# presumably the key the framework reads from this config - do not rename.
eval = dict(
    partitioner=dict(type=NaivePartitioner, n=8),
    runner=dict(
        type=LocalRunner,
        max_num_workers=256,
        task=dict(type=OpenICLEvalTask),
    ),
)
|
|
|
|
|
|
|
|
# Working directory for this run (presumably where outputs are written;
# confirm against the OpenCompass runner).
work_dir = './outputs/livestembench'
|