mirror of
https://github.com/open-compass/opencompass.git
synced 2025-05-30 16:03:24 +08:00
[Feature] Support 3 models (#34)
opencompass/configs/models/deepseek/lmdeploy_deepseek_r1_distill_llama_70b_instruct.py
opencompass/configs/models/deepseek/lmdeploy_deepseek_r1_distill_qwen_14b_instruct.py
opencompass/configs/models/hf_llama/llama3_3_70b_api_siliconflow.py
This commit is contained in:
parent
879b181c1b
commit
362b281e55
@ -0,0 +1,16 @@
|
||||
from opencompass.models import TurboMindModelwithChatTemplate
|
||||
|
||||
# Evaluation entry for DeepSeek-R1-Distill-Llama-70B served through the
# TurboMindModelwithChatTemplate wrapper.
models = [
    dict(
        type=TurboMindModelwithChatTemplate,
        abbr='deepseek_r1_distill_llama_70b_turbomind',
        path='deepseek-ai/DeepSeek-R1-Distill-Llama-70B',
        # session_len is set explicitly to the same value as max_seq_len
        # below instead of relying on the engine default; tp equals
        # run_cfg.num_gpus and max_batch_size equals batch_size.
        engine_config=dict(session_len=16384, max_batch_size=16, tp=4),
        # top_k=1 with a tiny temperature: presumably intended as
        # near-greedy decoding. max_new_tokens mirrors max_out_len.
        gen_config=dict(
            top_k=1,
            temperature=1e-6,
            top_p=0.9,
            max_new_tokens=8192,
        ),
        max_seq_len=16384,
        max_out_len=8192,
        batch_size=16,
        run_cfg=dict(num_gpus=4),
        # NOTE(review): these look like Llama-3 style terminator tokens;
        # confirm they exist in this checkpoint's tokenizer.
        stop_words=['<|end_of_text|>', '<|eot_id|>', '<|eom_id|>'],
    )
]
|
@ -0,0 +1,15 @@
|
||||
from opencompass.models import TurboMindModelwithChatTemplate
|
||||
|
||||
# Evaluation entry for DeepSeek-R1-Distill-Qwen-14B served through the
# TurboMindModelwithChatTemplate wrapper.
models = [
    dict(
        type=TurboMindModelwithChatTemplate,
        abbr='deepseek_r1_distill_qwen_14b_turbomind',
        path='deepseek-ai/DeepSeek-R1-Distill-Qwen-14B',
        # Engine settings: session_len equals max_seq_len, max_batch_size
        # equals batch_size, and tp equals run_cfg.num_gpus.
        engine_config=dict(
            session_len=16384,
            max_batch_size=16,
            tp=2,
        ),
        # top_k=1 with a tiny temperature: presumably intended as
        # near-greedy decoding. max_new_tokens mirrors max_out_len.
        gen_config=dict(
            top_k=1,
            temperature=1e-6,
            top_p=0.9,
            max_new_tokens=4096,
        ),
        max_seq_len=16384,
        max_out_len=4096,
        batch_size=16,
        run_cfg=dict(num_gpus=2),
    )
]
|
@ -0,0 +1,17 @@
|
||||
from opencompass.models import OpenAISDK
|
||||
|
||||
# Evaluation entry for Llama-3.3-70B-Instruct reached through the
# OpenAISDK wrapper pointed at the SiliconFlow endpoint.
models = [
    dict(
        abbr='llama3_3_70b_api_siliconflow',
        type=OpenAISDK,
        path='meta-llama/Llama-3.3-70B-Instruct',
        # NOTE(review): 'ENV_SILICONFLOW' looks like a placeholder naming an
        # environment variable; confirm the wrapper resolves it rather than
        # sending the literal string as the API key.
        key='ENV_SILICONFLOW',
        openai_api_base='https://api.siliconflow.cn/v1/',
        # Requests are throttled and issued one at a time.
        query_per_second=1,
        # NOTE(review): max_seq_len equals max_out_len here; confirm this
        # leaves the intended room for the prompt.
        max_out_len=4096,
        max_seq_len=4096,
        batch_size=1,
        retry=30,
        verbose=True,
    ),
]
|
Loading…
Reference in New Issue
Block a user