OpenCompass/configs/models/qwen/hf_qwen_7b.py

from opencompass.models import HuggingFaceCausalLM

# NOTE: The model revision is pinned deliberately. During our evaluations on
# 2023-08-27, we found that newer revisions of the model score more than
# 5 points lower on datasets such as GaokaoBench and mbpp.
# We have not yet determined whether this drop is caused by incorrect logic in
# how OpenCompass calls Qwen or by something else, so we are flagging it here.

# Model entries defined by this config: a single Qwen/Qwen-7B entry that uses
# the HuggingFaceCausalLM type.
models = [
    {
        'type': HuggingFaceCausalLM,
        'abbr': 'qwen-7b-hf',
        # Weights and tokenizer both point at the same repository id.
        'path': 'Qwen/Qwen-7B',
        'tokenizer_path': 'Qwen/Qwen-7B',
        'tokenizer_kwargs': {
            # Pad and truncate on the left side of the sequence.
            'padding_side': 'left',
            'truncation_side': 'left',
            'trust_remote_code': True,
            'use_fast': False,
            # Pinned to the same commit hash as the one in model_kwargs.
            'revision': '39fc5fdcb95c8c367bbdb3bfc0db71d96266de09',
        },
        # NOTE(review): presumably the id of a Qwen special token used for
        # padding -- confirm against the tokenizer vocabulary.
        'pad_token_id': 151643,
        'max_out_len': 100,
        'max_seq_len': 2048,
        'batch_size': 8,
        'model_kwargs': {
            'device_map': 'auto',
            'trust_remote_code': True,
            # Pinned to the same commit hash as the one in tokenizer_kwargs.
            'revision': '39fc5fdcb95c8c367bbdb3bfc0db71d96266de09',
        },
        # One GPU and one process are requested for this model.
        'run_cfg': {'num_gpus': 1, 'num_procs': 1},
    },
]
[Feature] Add qwen & qwen-chat support (#286) * add and apply update suffix tool * add tool doc * add qwen configs * add cmmlu * rename bbh * update datasets * delete * update hf_qwen_7b.py 2023-08-31 11:29:05 +08:00			`from opencompass.models import HuggingFaceCausalLM`

			`# Please note that we have specified the revision here. Recently (on 20230827),`
			`# during our evaluations, we found that the newer revision models have a drop`
			`# of more than 5 points on datasets like GaokaoBench / mbpp.`
			`# We are not yet sure whether this drop is due to incorrect logic in OpenCompass`
			`# calling qwen or some other reasons. We would like to highlight this.`

			`models = [`
			`dict(`
			`type=HuggingFaceCausalLM,`
			`abbr='qwen-7b-hf',`
			`path="Qwen/Qwen-7B",`
			`tokenizer_path='Qwen/Qwen-7B',`
			`tokenizer_kwargs=dict(`
			`padding_side='left',`
			`truncation_side='left',`
			`trust_remote_code=True,`
			`use_fast=False,`
			`revision='39fc5fdcb95c8c367bbdb3bfc0db71d96266de09'`
			`),`
[Fix] update qwen config (#358) 2023-09-05 10:15:19 +08:00			`pad_token_id=151643,`
[Feature] Add qwen & qwen-chat support (#286) * add and apply update suffix tool * add tool doc * add qwen configs * add cmmlu * rename bbh * update datasets * delete * update hf_qwen_7b.py 2023-08-31 11:29:05 +08:00			`max_out_len=100,`
			`max_seq_len=2048,`
			`batch_size=8,`
			`model_kwargs=dict(`
			`device_map='auto',`
			`trust_remote_code=True,`
			`revision='39fc5fdcb95c8c367bbdb3bfc0db71d96266de09'`
			`),`
			`run_cfg=dict(num_gpus=1, num_procs=1),`
			`)`
			`]`