From db8d9a9798a60891bd4ca77c1f43d444b5aa6e86 Mon Sep 17 00:00:00 2001
From: Shiyao Ma
Date: Wed, 22 May 2024 11:28:09 +0800
Subject: [PATCH 1/2] change max_task_size to dynamic

---
 opencompass/partitioners/size.py | 19 +++++++++++++++++++
 1 file changed, 19 insertions(+)

diff --git a/opencompass/partitioners/size.py b/opencompass/partitioners/size.py
index 10e64a2f..56659ca0 100644
--- a/opencompass/partitioners/size.py
+++ b/opencompass/partitioners/size.py
@@ -91,6 +91,25 @@ class SizePartitioner(BasePartitioner):
                                       key=lambda x: self.get_cost(x),
                                       reverse=True)
             for model in comb['models']:
+                # To maximize GPU utilization, turn the constant
+                # max_task_size into a dynamic value based on the model
+                # config: if the model needs X GPUs and Y GPUs are
+                # available, up to Y // X tasks can run in parallel, so
+                # max_task_size must produce at least Y // X tasks.
+                X = model['run_cfg']['num_gpus']
+                Y = torch.cuda.device_count()
+                min_num_parallel_tasks = Y // X
+                if min_num_parallel_tasks > 1:
+                    num_datasets = len(model_dataset_combinations[0]['datasets'])
+                    total_estimated_size = num_datasets * \
+                        min(
+                            model['batch_size'],
+                            sum([ele['num_repeats_per_file'] for ele in model_dataset_combinations[0]['datasets']]) //
+                            len([ele['num_repeats_per_file'] for ele in model_dataset_combinations[0]['datasets']])
+                        ) * \
+                        self.gen_task_coef
+                    self.max_task_size = total_estimated_size // min_num_parallel_tasks - 1
+
                 chunks = []  # elements: tuple(size, dataset_chunk)
                 for dataset in comb['datasets']:
                     filename = get_infer_output_path(model, dataset, out_dir)

From 78e89ce8b5610a71005e14a3b7df20d1fd7321d1 Mon Sep 17 00:00:00 2001
From: disperaller
Date: Wed, 22 May 2024 13:55:05 +0800
Subject: [PATCH 2/2] change max_task_size to dynamic value

---
 opencompass/partitioners/size.py | 1 +
 1 file changed, 1 insertion(+)

diff --git a/opencompass/partitioners/size.py b/opencompass/partitioners/size.py
index 56659ca0..3efba82a 100644
--- a/opencompass/partitioners/size.py
+++ b/opencompass/partitioners/size.py
@@ -1,6 +1,7 @@
 import copy
 import math
 import os.path as osp
+import torch
 from fnmatch import fnmatch
 from typing import Dict, List, Optional, Tuple, Union
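
For reference, a minimal standalone sketch of the heuristic these patches implement. All names here (dynamic_max_task_size, gpus_per_model, and so on), the 40000 default, and the example numbers are illustrative assumptions rather than OpenCompass API; the formula simply mirrors the added code, dividing the estimated total workload by the number of parallel GPU slots (Y // X) and subtracting one.

    # Illustrative sketch only: names and the 40000 default are assumptions,
    # not part of the OpenCompass codebase.


    def dynamic_max_task_size(num_datasets: int,
                              batch_size: int,
                              avg_repeats_per_dataset: int,
                              gen_task_coef: int,
                              gpus_per_model: int,
                              gpus_available: int,
                              default_max_task_size: int = 40000) -> int:
        """Pick a max_task_size that yields at least one task per GPU slot."""
        # With X GPUs per model and Y GPUs visible, at most Y // X tasks
        # can run side by side.
        min_parallel_tasks = gpus_available // gpus_per_model
        if min_parallel_tasks <= 1:
            # No room for parallelism; keep the configured constant.
            return default_max_task_size
        # Same estimate as the patch: datasets * min(batch size, average
        # repeats per dataset file) * generation-task coefficient.
        total_estimated_size = (num_datasets *
                                min(batch_size, avg_repeats_per_dataset) *
                                gen_task_coef)
        # The "- 1" nudges the partitioner to split the workload into at
        # least min_parallel_tasks chunks rather than one fewer.
        return total_estimated_size // min_parallel_tasks - 1


    # Example: 8 visible GPUs, a 2-GPU model, 10 datasets, batch size 32,
    # ~16 repeats per dataset file, gen_task_coef 20:
    # 10 * min(32, 16) * 20 // (8 // 2) - 1 = 3200 // 4 - 1 = 799
    print(dynamic_max_task_size(10, 32, 16, 20, 2, 8))  # -> 799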