from opencompass.models import HuggingFaceCausalLM

# Model entries defined by this config: a single LLaMA 30B entry.
models = [
    # LLaMA 30B
    dict(
        type=HuggingFaceCausalLM,
        abbr='llama-30b-hf',
        # Model and tokenizer are loaded from the same identifier.
        path='huggyllama/llama-30b',
        tokenizer_path='huggyllama/llama-30b',
        tokenizer_kwargs=dict(
            padding_side='left',
            truncation_side='left',
            use_fast=False,
        ),
        max_out_len=100,
        max_seq_len=2048,
        batch_size=8,
        model_kwargs=dict(device_map='auto'),
        # If False, inference runs in a for-loop without batch padding.
        batch_padding=False,
        run_cfg=dict(num_gpus=4, num_procs=1),
    ),
]