feat save_to_station

2025-05-30 16:03:24 +08:00 · 2025-02-27 14:44:24 +00:00 · 2025-02-27 14:44:24 +00:00 · 2aaab41dc9
commit 2aaab41dc9
parent 114cf1366c
3 changed files with 144 additions and 1 deletions
--- a/opencompass/cli/main.py
+++ b/opencompass/cli/main.py
@ -12,7 +12,7 @@ from mmengine.config import Config, DictAction
 from opencompass.registry import PARTITIONERS, RUNNERS, build_from_cfg
 from opencompass.runners import SlurmRunner
 from opencompass.summarizers import DefaultSummarizer
-from opencompass.utils import LarkReporter, get_logger
+from opencompass.utils import LarkReporter, get_logger, Save_To_Station
 from opencompass.utils.run import (fill_eval_cfg, fill_infer_cfg,
                                   get_config_from_arg)

@ -127,6 +127,26 @@ def parse_args():
        'correctness of each sample, bpb, etc.',
        action='store_true',
    )
+    parser.add_argument(
+        '--save-to-station',
+        help='Whether to save the evaluation results to the '
+             'data station.',
+        action='store_true',
+    )
+    parser.add_argument(
+        '--read-station',
+        help='Whether to read the evaluation results from the '
+             'data station.',
+        action='store_true',
+    )
+    parser.add_argument(
+        '--station-path',
+        help='Path to your reuslts station.',
+        type=str,
+        default=None,
+    )
+
+
    # set srun args
    slurm_parser = parser.add_argument_group('slurm_args')
    parse_slurm_args(slurm_parser)
@ -269,6 +289,7 @@ def main():
        content = f'{getpass.getuser()}\'s task has been launched!'
        LarkReporter(cfg['lark_bot_url']).post(content)

+    # infer
    if args.mode in ['all', 'infer']:
        # When user have specified --slurm or --dlc, or have not set
        # "infer" in config, we will provide a default configuration
@ -350,6 +371,15 @@ def main():
        else:
            runner(tasks)

+    # save to station
+    if args.save_to_station:
+        if Save_To_Station(cfg, args):
+            logger.info('Successfully saved to station.')
+        else:
+            logger.warning('Failed to save result to station.')
+
+
+
    # visualize
    if args.mode in ['all', 'eval', 'viz']:
        summarizer_cfg = cfg.get('summarizer', {})
--- a/opencompass/utils/init.py
+++ b/opencompass/utils/init.py
@ -15,3 +15,4 @@ from .network import *  # noqa
 from .postprocessors import *  # noqa
 from .prompt import *  # noqa
 from .text_postprocessors import *  # noqa
+from .result_station import *  # noqa
--- a/opencompass/utils/result_station.py
+++ b/opencompass/utils/result_station.py
@ -0,0 +1,112 @@
+import os
+import os.path as osp
+from typing import List, Tuple, Union
+from mmengine.config import Config
+import json
+import re
+
+
+
+
+
+def Save_To_Station(cfg, args):
+    from dotenv import load_dotenv
+    load_dotenv()
+    station_path = os.getenv('RESULTS_STATION_PATH')
+    assert station_path != None or args.station_path != None
+    station_path = args.station_path if station_path == None else station_path
+
+
+    work_dict = cfg['work_dir']
+    model_list = [i['abbr'] for i in cfg['models']]
+    dataset_list = [i['abbr'] for i in cfg['datasets']]
+
+
+    for dataset in dataset_list:
+        result_path = osp.join(station_path, dataset)
+        if not osp.exists(result_path):
+            os.makedirs(result_path)
+
+        for model in model_list:
+            result_file_name = model + '.json'
+            if osp.exists(osp.join(result_path, result_file_name)):
+                print('result of {} with {} already exists'.format(dataset, model))
+                continue
+            else:
+
+                # get result dict
+                local_result_path = work_dict + '/results/' + model + '/'
+                local_result_json = local_result_path + dataset + '.json'
+                if not osp.exists(local_result_json):
+                    raise ValueError('invalid file: {}'.format(local_result_json))
+                with open(local_result_json, 'r') as f:
+                    this_result = json.load(f)
+                f.close()
+
+                # get prediction list
+                local_prediction_path = work_dict + '/predictions/' + model + '/'
+                local_prediction_regex = rf"^{re.escape(dataset)}(?:_\d+)?\.json$"
+                local_prediction_json = find_files_by_regex(local_prediction_path, local_prediction_regex)
+                if not check_filenames(dataset, local_prediction_json):
+                    raise ValueError('invalid filelist: {}'.format(local_prediction_json))
+
+                this_prediction = []
+                for prediction_json in local_prediction_json:
+                    with open(local_prediction_path + prediction_json, 'r') as f:
+                        this_prediction_load_json = json.load(f)
+                    f.close()
+                    for prekey in this_prediction_load_json.keys():
+                        this_prediction.append(this_prediction_load_json[prekey])
+
+                # dict combine
+                data_model_results = {
+                        'predictions': this_prediction,
+                        'results': this_result
+                }
+                with open(osp.join(result_path, result_file_name), 'w') as f:
+                    json.dump(data_model_results, f, ensure_ascii=False, indent=4)
+                f.close()
+
+    return True
+
+
+def find_files_by_regex(directory, pattern):
+
+    regex = re.compile(pattern)
+
+    matched_files = []
+    for filename in os.listdir(directory):
+        if regex.match(filename):
+            matched_files.append(filename)
+
+    return matched_files
+
+
+def check_filenames(x, filenames):
+
+    if not filenames:
+        return False
+
+    single_pattern = re.compile(rf"^{re.escape(x)}\.json$")
+    numbered_pattern = re.compile(rf"^{re.escape(x)}_(\d+)\.json$")
+
+    is_single = all(single_pattern.match(name) for name in filenames)
+    is_numbered = all(numbered_pattern.match(name) for name in filenames)
+
+    if not (is_single or is_numbered):
+        return False
+
+    if is_single:
+        return len(filenames) == 1
+
+    if is_numbered:
+        numbers = []
+        for name in filenames:
+            match = numbered_pattern.match(name)
+            if match:
+                numbers.append(int(match.group(1)))
+
+        if sorted(numbers) != list(range(len(numbers))):
+            return False
+
+    return True