[Update] Add lmdeploy DeepSeek configs (#1656)

* [Update] Add lmdeploy DeepSeek configs

* update max out length
This commit is contained in:
Linchen Xiao 2024-11-01 15:34:23 +08:00 committed by GitHub
parent a0853c939d
commit 695738a89b
No known key found for this signature in database
GPG Key ID: B5690EEEBB952194
2 changed files with 38 additions and 0 deletions

View File

@@ -0,0 +1,18 @@
# flake8: noqa
from mmengine.config import read_base
from opencompass.models import (
TurboMindModel,
)
# Model entry for evaluating DeepSeek-V2 through the TurboMindModel wrapper.
lmdeploy_deepseek_v2_model = [
    dict(
        type=TurboMindModel,
        abbr='deepseek-v2-turbomind',
        path='deepseek-ai/DeepSeek-V2',
        # Engine-side limits are kept in step with the evaluator-side values
        # below: session_len == max_seq_len, max_batch_size == batch_size and
        # tp == run_cfg.num_gpus.
        engine_config=dict(
            session_len=7168,
            max_batch_size=4,
            tp=8,
            cache_max_entry_count=0.7,
        ),
        # top_k=1 with a near-zero temperature: presumably intended to make
        # decoding effectively greedy -- TODO confirm against lmdeploy docs.
        gen_config=dict(top_k=1, temperature=1e-6, top_p=0.9),
        max_seq_len=7168,
        max_out_len=2048,
        batch_size=4,
        run_cfg=dict(num_gpus=8),
    )
]

# Also publish the list under `models`, the name the sibling DeepSeek-V2.5
# config uses, so both configs can be consumed the same way. The original
# name is kept so existing imports continue to work.
# NOTE(review): OpenCompass appears to look up a `models` field when a config
# is selected by file name -- confirm against the OpenCompass docs.
models = lmdeploy_deepseek_v2_model

View File

@@ -0,0 +1,20 @@
from opencompass.models import TurboMindModelwithChatTemplate
# Single-entry model list: DeepSeek-V2.5 evaluated through the
# TurboMindModelwithChatTemplate wrapper.
models = [
    dict(
        # Wrapper class and identification of the checkpoint.
        type=TurboMindModelwithChatTemplate,
        abbr='deepseek-v2_5-turbomind',
        path='deepseek-ai/DeepSeek-V2.5',

        # Options forwarded as the engine configuration. Note that
        # session_len, max_batch_size and tp carry the same values as
        # max_seq_len, batch_size and run_cfg.num_gpus further down.
        engine_config=dict(
            session_len=7168, max_batch_size=4, tp=8,
            cache_max_entry_count=0.7,
        ),

        # Sampling options forwarded as the generation configuration.
        gen_config=dict(
            top_k=1,
            temperature=1e-6,
            top_p=0.9,
        ),

        # Evaluator-side sequence and batching limits.
        max_seq_len=7168,
        max_out_len=2048,
        batch_size=4,

        # Resources requested for the run.
        run_cfg=dict(num_gpus=8),
    ),
]