OpenCompass/opencompass/datasets/lmeval.py

from typing import List, Optional

from datasets import Dataset, DatasetDict

from opencompass.datasets import BaseDataset


class LMEvalDataset(BaseDataset):
    """Adapter that packages evaluator inputs as a dataset.

    Intended for OpenCompass's internal use: it turns raw prediction (and
    optionally reference) lists into the dataset container built by
    ``load``.
    """

    @staticmethod
    def load(predictions: List, references: Optional[List] = None):
        """Build a ``DatasetDict`` holding a single ``test`` split.

        Args:
            predictions: Values stored under the ``prediction`` column.
            references: Values stored under the ``reference`` column. The
                column is omitted entirely when this is ``None`` or empty.

        Returns:
            A ``DatasetDict`` whose only key is ``test``.
        """
        # Truthiness (not an ``is None`` check) is intentional: an empty
        # reference list is treated the same as no references at all.
        if references:
            columns = {'prediction': predictions, 'reference': references}
        else:
            columns = {'prediction': predictions}

        test_split = Dataset.from_dict(columns)
        return DatasetDict({'test': test_split})
[Sync] Initial support of subjective evaluation (#421) Co-authored-by: Leymore <zfz-960727@163.com> 2023-09-22 15:42:31 +08:00
			`from typing import List, Optional`

			`from datasets import Dataset, DatasetDict`

			`from opencompass.datasets import BaseDataset`


			`class LMEvalDataset(BaseDataset):`
			`"""A dataset wrapper around the evaluator inputs, designed for`
			`OpenCompass's internal use."""`

			`@staticmethod`
			`def load(predictions: List, references: Optional[List] = None):`
			`content = {'prediction': predictions}`
			`if references:`
			`content['reference'] = references`
			`return DatasetDict(dict(test=Dataset.from_dict(content)))`