mirror of
https://github.com/open-compass/opencompass.git
synced 2025-05-30 16:03:24 +08:00
[Update] Add lmdeploy DeepSeek configs (#1656)
* [Update] Add lmdeploy DeepSeek configs
* update max out length
This commit is contained in:
parent
a0853c939d
commit
695738a89b
18
opencompass/configs/models/deepseek/lmdeploy_deepseek_v2.py
Normal file
18
opencompass/configs/models/deepseek/lmdeploy_deepseek_v2.py
Normal file
@@ -0,0 +1,18 @@
|
|||||||
|
# flake8: noqa
from mmengine.config import read_base

from opencompass.models import (
    TurboMindModel,
)

# Model entry for 'deepseek-ai/DeepSeek-V2' using the TurboMindModel wrapper.
lmdeploy_deepseek_v2_model = [
    dict(
        type=TurboMindModel,
        abbr='deepseek-v2-turbomind',
        path='deepseek-ai/DeepSeek-V2',
        # session_len mirrors max_seq_len below, max_batch_size mirrors
        # batch_size, and tp mirrors run_cfg.num_gpus; keep them in sync.
        engine_config=dict(
            session_len=7168,
            max_batch_size=4,
            tp=8,
            cache_max_entry_count=0.7,
        ),
        # NOTE(review): top_k=1 with a near-zero temperature presumably aims
        # at effectively greedy decoding -- confirm against the LMDeploy docs.
        gen_config=dict(top_k=1, temperature=1e-6, top_p=0.9),
        max_seq_len=7168,
        max_out_len=2048,
        batch_size=4,
        run_cfg=dict(num_gpus=8),
    )
]
|
@@ -0,0 +1,20 @@
|
|||||||
|
from opencompass.models import TurboMindModelwithChatTemplate

# Model entry for 'deepseek-ai/DeepSeek-V2.5' using the
# TurboMindModelwithChatTemplate wrapper.
models = [
    dict(
        type=TurboMindModelwithChatTemplate,
        abbr='deepseek-v2_5-turbomind',
        path='deepseek-ai/DeepSeek-V2.5',
        # session_len mirrors max_seq_len below, max_batch_size mirrors
        # batch_size, and tp mirrors run_cfg.num_gpus; keep them in sync.
        engine_config=dict(
            session_len=7168,
            max_batch_size=4,
            tp=8,
            cache_max_entry_count=0.7,
        ),
        # NOTE(review): top_k=1 with a near-zero temperature presumably aims
        # at effectively greedy decoding -- confirm against the LMDeploy docs.
        gen_config=dict(top_k=1, temperature=1e-6, top_p=0.9),
        max_seq_len=7168,
        max_out_len=2048,
        batch_size=4,
        run_cfg=dict(num_gpus=8),
    )
]
|
Loading…
Reference in New Issue
Block a user