2024-06-28 14:16:34 +08:00
|
|
|
from opencompass.models import TurboMindModelwithChatTemplate
|
2024-05-14 14:50:16 +08:00
|
|
|
|
|
|
|
# Model list for this config: a single entry describing
# Meta-Llama-3-8B-Instruct wrapped by TurboMindModelwithChatTemplate.
models = [
    {
        # Wrapper class, plus the short name and model path for this entry.
        'type': TurboMindModelwithChatTemplate,
        'abbr': 'llama-3-8b-instruct-turbomind',
        'path': 'meta-llama/Meta-Llama-3-8B-Instruct',
        # Engine options; max_batch_size equals batch_size below and
        # tp equals run_cfg's num_gpus.
        'engine_config': {'max_batch_size': 16, 'tp': 1},
        # Generation options. top_k=1 with temperature=1e-6 is presumably
        # meant to make decoding effectively deterministic -- confirm
        # against the inference backend. max_new_tokens equals max_out_len.
        'gen_config': {
            'top_k': 1,
            'temperature': 1e-6,
            'top_p': 0.9,
            'max_new_tokens': 4096,
        },
        # Length limits for the whole sequence and for the generated output.
        'max_seq_len': 16384,
        'max_out_len': 4096,
        'batch_size': 16,
        'run_cfg': {'num_gpus': 1},
        # Strings listed as stop words for this model.
        'stop_words': ['<|end_of_text|>', '<|eot_id|>'],
    },
]
|