From b83396f57ca5836ee74b01e8a32ce6f26117cf58 Mon Sep 17 00:00:00 2001
From: Mo Li <2568818204@qq.com>
Date: Wed, 31 Jul 2024 14:53:51 +0800
Subject: [PATCH] add 1m config (#1383)

---
 configs/models/hf_internlm/lmdeploy_internlm2_5_7b_chat_1m.py | 2 +-
 1 file changed, 1 insertion(+), 1 deletion(-)

diff --git a/configs/models/hf_internlm/lmdeploy_internlm2_5_7b_chat_1m.py b/configs/models/hf_internlm/lmdeploy_internlm2_5_7b_chat_1m.py
index 09d34dd1..6d96de28 100644
--- a/configs/models/hf_internlm/lmdeploy_internlm2_5_7b_chat_1m.py
+++ b/configs/models/hf_internlm/lmdeploy_internlm2_5_7b_chat_1m.py
@@ -5,7 +5,7 @@ models = [
         type=TurboMindModelwithChatTemplate,
         abbr='internlm2_5-7b-chat-1m-turbomind',
         path='internlm/internlm2_5-7b-chat-1m',
-        engine_config=dict(rope_scaling_factor=2.5, session_len=1048576, max_batch_size=1, tp=4), # 1M context length
+        engine_config=dict(rope_scaling_factor=2.5, session_len=1048576, max_batch_size=1, cache_max_entry_count=0.7, tp=4), # 1M context length
         gen_config=dict(top_k=1, temperature=1e-6, top_p=0.9, max_new_tokens=2048),
         max_seq_len=1048576,
         max_out_len=2048,