mirror of
https://github.com/open-compass/opencompass.git
synced 2025-05-30 16:03:24 +08:00
add rwkv-5-3b model (#666)
* support rwkv5-3b leaderboard * update rwkv-5-3b config * update config * refine * fix bug * update config * refine * reduce batch size * refine * reduce batch size to avoid oom in special datasets * Update huggingface.py * Update huggingface.py
This commit is contained in:
parent
4780b39eda
commit
82a533a690
6
configs/eval_rwkv5_3b.py
Normal file
6
configs/eval_rwkv5_3b.py
Normal file
@ -0,0 +1,6 @@
|
|||||||
|
from mmengine.config import read_base
|
||||||
|
|
||||||
|
# Assemble the evaluation config from shared base configs. The names imported
# inside the read_base() context (models, datasets, summarizer) become the
# top-level entries of this config.
with read_base():
    # Model under evaluation: the RWKV-5 3B definition.
    from .models.rwkv.rwkv5_3b import models
    # Dataset collection to run the model on.
    from .datasets.collections.base_medium_llama import datasets
    # Summarizer used to report the results.
    from .summarizers.leaderboard import summarizer
|
25
configs/models/rwkv/rwkv5_3b.py
Normal file
25
configs/models/rwkv/rwkv5_3b.py
Normal file
@ -0,0 +1,25 @@
|
|||||||
|
from opencompass.models import HuggingFaceCausalLM
|
||||||
|
|
||||||
|
# Model list consumed by the evaluation config; it holds a single entry for
# the RWKV-5 World 3B checkpoint, wrapped by HuggingFaceCausalLM.
models = [
    dict(
        type=HuggingFaceCausalLM,
        abbr='rwkv-5-3b',
        # Model weights and tokenizer come from the same repository id.
        path="RWKV/rwkv-5-world-3b",
        tokenizer_path='RWKV/rwkv-5-world-3b',
        # Keyword arguments for model loading.
        # NOTE(review): trust_remote_code presumably is needed because the
        # checkpoint ships its own modeling code -- confirm.
        model_kwargs=dict(
            device_map='auto',
            trust_remote_code=True,
        ),
        # Keyword arguments for tokenizer loading: pad and truncate on the
        # left side, and do not use the fast tokenizer implementation.
        tokenizer_kwargs=dict(
            padding_side='left',
            truncation_side='left',
            trust_remote_code=True,
            use_fast=False,
        ),
        # Length limits; presumably counted in tokens -- confirm against the
        # HuggingFaceCausalLM wrapper.
        max_out_len=100,
        max_seq_len=2048,
        batch_padding=True,
        # The commit history mentions reducing the batch size to avoid OOM on
        # some datasets; 16 is the resulting value.
        batch_size=16,
        # Resources requested per evaluation task.
        run_cfg=dict(num_gpus=1, num_procs=1),
    )
]
|
Loading…
Reference in New Issue
Block a user