mirror of
https://github.com/open-compass/opencompass.git
synced 2025-05-30 16:03:24 +08:00
Update datasets_info & hf_path
This commit is contained in:
parent
442c829e0f
commit
b6d1bc60dc
@ -128,6 +128,24 @@
|
|||||||
paper: https://arxiv.org/abs/2501.18362
|
paper: https://arxiv.org/abs/2501.18362
|
||||||
configpath: opencompass/configs/datasets/MedXpertQA/MedXpertQA_gen.py
|
configpath: opencompass/configs/datasets/MedXpertQA/MedXpertQA_gen.py
|
||||||
configpath_llmjudge: opencompass/configs/datasets/MedXpertQA/MedXpertQA_llmjudge_gen.py
|
configpath_llmjudge: opencompass/configs/datasets/MedXpertQA/MedXpertQA_llmjudge_gen.py
|
||||||
|
- ClinicBench:
|
||||||
|
name: ClinicBench
|
||||||
|
category: Knowledge / Medicine
|
||||||
|
paper: https://arxiv.org/abs/2405.00716
|
||||||
|
configpath: ''
|
||||||
|
configpath_llmjudge: opencompass/configs/datasets/ClinicBench/ClinicBench_llmjudge_gen.py
|
||||||
|
- ScienceQA:
|
||||||
|
name: ScienceQA
|
||||||
|
category: Knowledge / Medicine
|
||||||
|
paper: https://arxiv.org/abs/2209.09513
|
||||||
|
configpath: ''
|
||||||
|
configpath_llmjudge: opencompass/configs/datasets/ScienceQA/ScienceQA_llmjudge_gen.py
|
||||||
|
- PubMedQA:
|
||||||
|
name: PubMedQA
|
||||||
|
category: Knowledge / Medicine
|
||||||
|
paper: https://arxiv.org/abs/1909.06146
|
||||||
|
configpath: ''
|
||||||
|
configpath_llmjudge: opencompass/configs/datasets/PubMedQA/PubMedQA_llmjudge_gen.py
|
||||||
- musr:
|
- musr:
|
||||||
name: MuSR
|
name: MuSR
|
||||||
category: Reasoning
|
category: Reasoning
|
||||||
|
@ -45,7 +45,6 @@ ClinicBench_datasets = []
|
|||||||
ClinicBench_reader_cfg = dict(
|
ClinicBench_reader_cfg = dict(
|
||||||
input_columns=['question', 'choices'],
|
input_columns=['question', 'choices'],
|
||||||
output_column='label',
|
output_column='label',
|
||||||
test_split='validation',
|
|
||||||
)
|
)
|
||||||
|
|
||||||
ClinicBench_infer_cfg = dict(
|
ClinicBench_infer_cfg = dict(
|
||||||
|
@ -39,7 +39,6 @@ PubMedQA_datasets = []
|
|||||||
PubMedQA_reader_cfg = dict(
|
PubMedQA_reader_cfg = dict(
|
||||||
input_columns=['question', 'choices'],
|
input_columns=['question', 'choices'],
|
||||||
output_column='label',
|
output_column='label',
|
||||||
test_split='validation',
|
|
||||||
)
|
)
|
||||||
|
|
||||||
PubMedQA_infer_cfg = dict(
|
PubMedQA_infer_cfg = dict(
|
||||||
|
@ -39,7 +39,6 @@ ScienceQA_datasets = []
|
|||||||
ScienceQA_reader_cfg = dict(
|
ScienceQA_reader_cfg = dict(
|
||||||
input_columns=['question', 'choices'],
|
input_columns=['question', 'choices'],
|
||||||
output_column='label',
|
output_column='label',
|
||||||
test_split='validation',
|
|
||||||
)
|
)
|
||||||
|
|
||||||
ScienceQA_infer_cfg = dict(
|
ScienceQA_infer_cfg = dict(
|
||||||
|
@ -1,6 +1,7 @@
|
|||||||
from datasets import Dataset, DatasetDict, load_dataset
|
from datasets import load_dataset
|
||||||
|
|
||||||
from opencompass.registry import LOAD_DATASET
|
from opencompass.registry import LOAD_DATASET
|
||||||
|
from opencompass.utils import get_data_path
|
||||||
|
|
||||||
from .base import BaseDataset
|
from .base import BaseDataset
|
||||||
|
|
||||||
@ -9,16 +10,12 @@ from .base import BaseDataset
|
|||||||
class ClinicBenchDataset(BaseDataset):
|
class ClinicBenchDataset(BaseDataset):
|
||||||
|
|
||||||
@staticmethod
|
@staticmethod
|
||||||
def load_single():
|
def load_single(path):
|
||||||
dataset = load_dataset('xuxuxuxuxu/Pharmacology-QA')['train']
|
dataset = load_dataset(path)['train']
|
||||||
return dataset
|
return dataset
|
||||||
|
|
||||||
@staticmethod
|
@staticmethod
|
||||||
def load(path):
|
def load(path):
|
||||||
train_dataset = Dataset.from_list([])
|
path = get_data_path(path)
|
||||||
val_dataset = ClinicBenchDataset.load_single()
|
dataset = ClinicBenchDataset.load_single(path)
|
||||||
dataset = DatasetDict({
|
|
||||||
'train': train_dataset,
|
|
||||||
'validation': val_dataset
|
|
||||||
})
|
|
||||||
return dataset
|
return dataset
|
||||||
|
@ -1,6 +1,7 @@
|
|||||||
from datasets import Dataset, DatasetDict, load_dataset
|
from datasets import Dataset, load_dataset
|
||||||
|
|
||||||
from opencompass.registry import LOAD_DATASET
|
from opencompass.registry import LOAD_DATASET
|
||||||
|
from opencompass.utils import get_data_path
|
||||||
|
|
||||||
from .base import BaseDataset
|
from .base import BaseDataset
|
||||||
|
|
||||||
@ -9,9 +10,9 @@ from .base import BaseDataset
|
|||||||
class PubMedQADataset(BaseDataset):
|
class PubMedQADataset(BaseDataset):
|
||||||
|
|
||||||
@staticmethod
|
@staticmethod
|
||||||
def load_single():
|
def load_single(path):
|
||||||
dataset = []
|
dataset = []
|
||||||
ds = load_dataset('qiaojin/PubMedQA', 'pqa_labeled')
|
ds = load_dataset(path, 'pqa_labeled')
|
||||||
for data in ds['train']:
|
for data in ds['train']:
|
||||||
data['question'] = (f"CONTEXTS: {data['context']}\n"
|
data['question'] = (f"CONTEXTS: {data['context']}\n"
|
||||||
f"QUESTION: {data['question']}")
|
f"QUESTION: {data['question']}")
|
||||||
@ -30,10 +31,6 @@ class PubMedQADataset(BaseDataset):
|
|||||||
|
|
||||||
@staticmethod
|
@staticmethod
|
||||||
def load(path):
|
def load(path):
|
||||||
train_dataset = Dataset.from_list([])
|
path = get_data_path(path)
|
||||||
val_dataset = PubMedQADataset.load_single()
|
dataset = PubMedQADataset.load_single(path)
|
||||||
dataset = DatasetDict({
|
|
||||||
'train': train_dataset,
|
|
||||||
'validation': val_dataset
|
|
||||||
})
|
|
||||||
return dataset
|
return dataset
|
||||||
|
@ -1,6 +1,7 @@
|
|||||||
from datasets import Dataset, DatasetDict, load_dataset
|
from datasets import Dataset, load_dataset
|
||||||
|
|
||||||
from opencompass.registry import LOAD_DATASET
|
from opencompass.registry import LOAD_DATASET
|
||||||
|
from opencompass.utils import get_data_path
|
||||||
|
|
||||||
from .base import BaseDataset
|
from .base import BaseDataset
|
||||||
|
|
||||||
@ -9,9 +10,9 @@ from .base import BaseDataset
|
|||||||
class ScienceQADataset(BaseDataset):
|
class ScienceQADataset(BaseDataset):
|
||||||
|
|
||||||
@staticmethod
|
@staticmethod
|
||||||
def load_single():
|
def load_single(path):
|
||||||
dataset = []
|
dataset = []
|
||||||
ds = load_dataset('derek-thomas/ScienceQA')
|
ds = load_dataset(path)
|
||||||
for data in ds['test']:
|
for data in ds['test']:
|
||||||
if data['image'] is None:
|
if data['image'] is None:
|
||||||
data['label'] = chr(65 + data['answer']
|
data['label'] = chr(65 + data['answer']
|
||||||
@ -28,10 +29,6 @@ class ScienceQADataset(BaseDataset):
|
|||||||
|
|
||||||
@staticmethod
|
@staticmethod
|
||||||
def load(path):
|
def load(path):
|
||||||
train_dataset = Dataset.from_list([])
|
path = get_data_path(path)
|
||||||
val_dataset = ScienceQADataset.load_single()
|
dataset = ScienceQADataset.load_single(path)
|
||||||
dataset = DatasetDict({
|
|
||||||
'train': train_dataset,
|
|
||||||
'validation': val_dataset
|
|
||||||
})
|
|
||||||
return dataset
|
return dataset
|
||||||
|
@ -446,6 +446,21 @@ DATASETS_MAPPING = {
|
|||||||
"hf_id": "",
|
"hf_id": "",
|
||||||
"local": "./data/ChemBench4K",
|
"local": "./data/ChemBench4K",
|
||||||
},
|
},
|
||||||
|
"opencompass/ClinicBench": {
|
||||||
|
"ms_id": "",
|
||||||
|
"hf_id": "xuxuxuxuxu/Pharmacology-QA",
|
||||||
|
"local": "",
|
||||||
|
},
|
||||||
|
"opencompass/ScienceQA": {
|
||||||
|
"ms_id": "",
|
||||||
|
"hf_id": "derek-thomas/ScienceQA",
|
||||||
|
"local": "",
|
||||||
|
},
|
||||||
|
"opencompass/PubMedQA": {
|
||||||
|
"ms_id": "",
|
||||||
|
"hf_id": "qiaojin/PubMedQA",
|
||||||
|
"local": "",
|
||||||
|
},
|
||||||
|
|
||||||
}
|
}
|
||||||
|
|
||||||
|
Loading…
Reference in New Issue
Block a user