OpenCompass/opencompass/configs/models/qwen/lmdeploy_qwen1_5_110b.py

16 lines
467 B
Python
Raw Normal View History

from opencompass.models import TurboMindModel
# Evaluation entry for the Qwen1.5-110B base checkpoint, run through the
# TurboMindModel wrapper imported above.
models = [
    dict(
        type=TurboMindModel,
        abbr='qwen1.5-110b-turbomind',
        path='Qwen/Qwen1.5-110B',
        # Engine-side limits; session_len, max_batch_size and tp are kept
        # equal to max_seq_len, batch_size and run_cfg.num_gpus below.
        engine_config=dict(
            session_len=7168,
            max_batch_size=8,
            tp=8,
            cache_max_entry_count=0.6,
        ),
        # top_k=1 with a near-zero temperature — presumably intended to make
        # decoding effectively greedy; max_new_tokens equals max_out_len.
        gen_config=dict(
            top_k=1,
            temperature=1e-6,
            top_p=0.9,
            max_new_tokens=1024,
        ),
        max_seq_len=7168,
        max_out_len=1024,
        batch_size=8,
        run_cfg=dict(num_gpus=8),
    ),
]