mirror of
https://github.com/open-compass/opencompass.git
synced 2025-05-30 16:03:24 +08:00
[Update] Add lmdeploy DeepSeek configs (#1656)
* [Update] Add lmdeploy DeepSeek configs
* Update max out length
This commit is contained in:
parent
a0853c939d
commit
695738a89b
18
opencompass/configs/models/deepseek/lmdeploy_deepseek_v2.py
Normal file
18
opencompass/configs/models/deepseek/lmdeploy_deepseek_v2.py
Normal file
@@ -0,0 +1,18 @@
|
||||
# flake8: noqa
|
||||
from mmengine.config import read_base
|
||||
from opencompass.models import (
|
||||
TurboMindModel,
|
||||
)
|
||||
# Model entry for DeepSeek-V2 run through TurboMindModel.
#
# The paired values below are identical in this config and should be changed
# together:
#   * engine_config.session_len    == max_seq_len      (7168)
#   * engine_config.max_batch_size == batch_size       (4)
#   * engine_config.tp             == run_cfg.num_gpus (8)
# NOTE(review): tp is presumably the tensor-parallel degree, which is why it
# matches num_gpus -- confirm against the engine documentation.
lmdeploy_deepseek_v2_model = [
    dict(
        type=TurboMindModel,
        abbr='deepseek-v2-turbomind',
        path='deepseek-ai/DeepSeek-V2',
        engine_config=dict(
            session_len=7168,
            max_batch_size=4,
            tp=8,
            cache_max_entry_count=0.7,
        ),
        # top_k=1 with a near-zero temperature; presumably intended to make
        # decoding effectively deterministic -- TODO confirm.
        gen_config=dict(top_k=1, temperature=1e-6, top_p=0.9),
        max_seq_len=7168,
        max_out_len=2048,
        batch_size=4,
        run_cfg=dict(num_gpus=8),
    )
]

# Also publish the list under the conventional `models` name so this file can
# be consumed the same way as configs that export `models`. The original
# `lmdeploy_deepseek_v2_model` name is kept for existing importers.
# NOTE(review): tooling that loads a model config by file name presumably
# looks up `models` -- confirm against the loader.
models = lmdeploy_deepseek_v2_model
|
@@ -0,0 +1,20 @@
|
||||
from opencompass.models import TurboMindModelwithChatTemplate
|
||||
|
||||
# Model entry for DeepSeek-V2.5 run through TurboMindModelwithChatTemplate.
#
# Values that appear twice in this entry and should be edited together:
# session_len / max_seq_len (7168), max_batch_size / batch_size (4),
# tp / num_gpus (8).
models = [
    dict(
        # --- identity -----------------------------------------------------
        type=TurboMindModelwithChatTemplate,
        abbr='deepseek-v2_5-turbomind',
        path='deepseek-ai/DeepSeek-V2.5',
        # --- inference engine settings -------------------------------------
        engine_config=dict(
            session_len=7168, max_batch_size=4,
            tp=8, cache_max_entry_count=0.7,
        ),
        # --- sampling settings ---------------------------------------------
        gen_config=dict(
            top_k=1,
            temperature=1e-6,
            top_p=0.9,
        ),
        # --- sequence and batch limits ---------------------------------------
        max_seq_len=7168,
        max_out_len=2048,
        batch_size=4,
        # --- resources requested for the run ---------------------------------
        run_cfg=dict(
            num_gpus=8,
        ),
    ),
]
|
Loading…
Reference in New Issue
Block a user