[Fix] SubSizePartition fix (#746)

* fix subjective_eval * subject_eval partition situation fixed * subject_eval partition situation fixed
2025-05-30 16:03:24 +08:00 · 2023-12-28 11:46:46 +08:00 · 2023-12-28 11:46:46 +08:00 · db919f0191
commit db919f0191
parent 0a525985e8
1 changed files with 58 additions and 29 deletions
--- a/opencompass/tasks/subjective_eval.py
+++ b/opencompass/tasks/subjective_eval.py
@ -97,23 +97,42 @@ class SubjectiveEvalTask(BaseTask):
                for m in model_cfg
            ]
        # Load predictions
        filename = get_infer_output_path(
            model_cfg, dataset_cfg, osp.join(self.work_dir, 'predictions'))
        # in case the prediction is partial
        root, ext = osp.splitext(filename)
        partial_filename = root + '_0' + ext
        pred_strs = None
        # There will be 5 situations, so we need to deal with them
        # 1.There are no partitions in infer and judge stage
        # 2.No partition in infer stage, but use partition in judge stage
        # 3.Use partition in infer stage, but not use partition in judge stage
        # 4.Use both partition, with same partition size
        # 5.Use both partition, but different partition size
        # If take SubjectSizePartition, get new filename without _0
        if 'test_range' in dataset_cfg['reader_cfg']:
            filename = get_infer_output_path(
                model_cfg, dataset_cfg, osp.join(self.work_dir, 'predictions'))
            root, ext = osp.splitext(filename)
            filename = root[:-2] + ext
        # If take SubjectNaivePartition, get filename
        else:
            filename = get_infer_output_path(
                model_cfg, dataset_cfg, osp.join(self.work_dir, 'predictions'))
        # Get partition name
        root, ext = osp.splitext(filename)
        partial_filename = root + '_0' + ext
        # If no predictions get in predictions dir
        if not osp.exists(osp.realpath(filename)) and not osp.exists(
                osp.realpath(partial_filename)):
            return {'error': 'No predictions found.'}
        else:
            # If use Naive partition in infer stage
            if osp.exists(osp.realpath(filename)):
                preds = mmengine.load(filename)
                pred_strs = [
                    preds[str(i)]['prediction'] for i in range(len(preds))
                ]
            # If use Size partition in infer stage
            else:
                filename = partial_filename
                pred_strs = []
@ -125,31 +144,41 @@ class SubjectiveEvalTask(BaseTask):
                    pred_strs += [
                        preds[str(i)]['prediction'] for i in range(len(preds))
                    ]
        # Get all predictions in pred_strs
-            if ('pred_role' in eval_cfg and 'meta_template' in model_cfg
+        # If take SubjectSizePartition, get new pred_strs based on test_range
-                    and not MODELS.get(model_cfg['type']).is_api):
+        if 'test_range' in dataset_cfg['reader_cfg']:
-                # Create a prompt template for role config parsing
+            test_range = dataset_cfg['reader_cfg']['test_range']
-                from opencompass.models.base import LMTemplateParser
+            pred_strs = eval('pred_strs' + test_range)
-                parser = LMTemplateParser(model_cfg['meta_template'])
+        # If take SubjectNaivePartition, get all pred_strs
-                role = parser.roles[eval_cfg['pred_role']]
+        else:
-                pred_strs = [
+            pred_strs = pred_strs
-                    self._extract_role_pred(pred, role.get('begin', None),
+
-                                            role.get('end', None))
+        if ('pred_role' in eval_cfg and 'meta_template' in model_cfg
-                    for pred in pred_strs
+                and not MODELS.get(model_cfg['type']).is_api):
-                ]
+            # Create a prompt template for role config parsing
            from opencompass.models.base import LMTemplateParser
            parser = LMTemplateParser(model_cfg['meta_template'])
            role = parser.roles[eval_cfg['pred_role']]
            pred_strs = [
                self._extract_role_pred(pred, role.get('begin', None),
                                        role.get('end', None))
                for pred in pred_strs
            ]
        # Postprocess predictions if necessary
        ds_abbr = dataset_abbr_from_cfg(dataset_cfg)
        model_postprocessors = model_cfg.get('pred_postprocessor', {})
        pred_postprocessor = None
        for pattern in model_postprocessors.keys():
            if fnmatch.fnmatch(ds_abbr, pattern):
                pred_postprocessor = model_postprocessors[pattern]
                break
        if 'pred_postprocessor' in eval_cfg or pred_postprocessor:
            kwargs = pred_postprocessor or eval_cfg['pred_postprocessor']
            proc = TEXT_POSTPROCESSORS.get(kwargs.pop('type'))
            pred_strs = [proc(s, **kwargs) for s in pred_strs]
            # Postprocess predictions if necessary
            ds_abbr = dataset_abbr_from_cfg(dataset_cfg)
            model_postprocessors = model_cfg.get('pred_postprocessor', {})
            pred_postprocessor = None
            for pattern in model_postprocessors.keys():
                if fnmatch.fnmatch(ds_abbr, pattern):
                    pred_postprocessor = model_postprocessors[pattern]
                    break
            if 'pred_postprocessor' in eval_cfg or pred_postprocessor:
                kwargs = pred_postprocessor or eval_cfg['pred_postprocessor']
                proc = TEXT_POSTPROCESSORS.get(kwargs.pop('type'))
                pred_strs = [proc(s, **kwargs) for s in pred_strs]
        return {
            'model_name': model_abbr_from_cfg(model_cfg),
            'model_preds': pred_strs