"""OpenCompass model config: InternLM2-Chat-7B served through TurboMind.

Defines the chat prompt template (``_meta_template``) and the ``models``
list holding the single model entry described below.
"""
from opencompass.models.turbomind import TurboMindModel


# Chat prompt layout: each turn is wrapped in <|im_start|>{role}\n ... <|im_end|>\n.
# The BOT role is flagged generate=True, i.e. it is the turn the model produces.
_meta_template = dict(
    round=[
        dict(role='HUMAN', begin='<|im_start|>user\n', end='<|im_end|>\n'),
        dict(
            role='BOT',
            begin='<|im_start|>assistant\n',
            end='<|im_end|>\n',
            generate=True,
        ),
    ],
)

models = [
    dict(
        type=TurboMindModel,
        abbr='internlm2-chat-7b-turbomind',
        path='internlm/internlm2-chat-7b',
        meta_template=_meta_template,
        # Settings forwarded to the inference engine.
        engine_config=dict(
            session_len=32768,
            max_batch_size=32,
            model_name='internlm2-chat-7b',
            tp=1,
            # NOTE(review): presumably the token ids for end-of-sequence and
            # <|im_end|> in the InternLM2 tokenizer -- confirm against the
            # tokenizer, and confirm the installed engine version accepts
            # `stop_words` inside engine_config.
            stop_words=[2, 92542],
        ),
        # Decoding settings. max_new_tokens matches max_out_len below.
        gen_config=dict(
            top_k=1,
            top_p=0.8,
            temperature=1.0,
            max_new_tokens=2000,
        ),
        max_out_len=2000,
        # Same value as engine_config.session_len above.
        max_seq_len=32768,
        # Same value as engine_config.max_batch_size above.
        batch_size=32,
        concurrency=8,
        run_cfg=dict(num_gpus=1, num_procs=1),
    ),
]