2023-07-05 10:33:12 +08:00
|
|
|
from typing import Dict, Optional, Union
|
|
|
|
|
|
|
|
from datasets import Dataset, DatasetDict
|
|
|
|
|
|
|
|
from opencompass.openicl import DatasetReader
|
|
|
|
|
|
|
|
|
|
|
|
class BaseDataset:
    """Base wrapper that loads a dataset and attaches a ``DatasetReader``.

    Construction calls :meth:`load` with the extra keyword arguments, stores
    the result on ``self.dataset``, and then builds ``self.reader`` from it
    via :meth:`_init_reader`.
    """

    def __init__(self, reader_cfg: Optional[Dict] = None, **kwargs):
        """Load the dataset and initialise its reader.

        Args:
            reader_cfg: Keyword arguments forwarded to ``DatasetReader``.
                ``None`` (the default) is treated as an empty configuration.
            **kwargs: Forwarded unchanged to :meth:`load`.
        """
        self.dataset = self.load(**kwargs)
        # ``**`` unpacking needs a mapping; normalise ``None`` so that the
        # ``Optional`` annotation is actually honoured instead of raising
        # ``TypeError``. Using ``None`` as the default also avoids sharing a
        # single mutable dict between calls.
        self._init_reader(**(reader_cfg or {}))

    def _init_reader(self, **kwargs):
        """Create ``self.reader`` from ``self.dataset``.

        Args:
            **kwargs: Passed through to the ``DatasetReader`` constructor.
        """
        self.reader = DatasetReader(self.dataset, **kwargs)

    @property
    def train(self):
        """Return the ``'train'`` entry of the reader's dataset."""
        return self.reader.dataset['train']

    @property
    def test(self):
        """Return the ``'test'`` entry of the reader's dataset."""
        return self.reader.dataset['test']

    @staticmethod
    def load(**kwargs) -> Union[Dataset, DatasetDict]:
        """Load and return the underlying dataset.

        The base implementation is a placeholder that returns ``None``;
        subclasses are expected to override it and return the object that
        ``__init__`` stores on ``self.dataset``.
        """
        pass
|