@@ -288,15 +288,20 @@ def read_and_norm_algo_scores(
288
288
algo : read_milestone_from_yaml (dir , algo , milestone )
289
289
for algo in algos
290
290
}
291
+
292
+ task_scores = defaultdict (list )
293
+ for algo in algos :
294
+ for task , scores in algo_scores [algo ].items ():
295
+ task_scores [task ] += scores
296
+
291
297
normalized_algo_scores = deepcopy (algo_scores )
292
- for algo in normalized_algo_scores :
293
- normalized_algo_scores [algo ] = \
294
- {task : norm_func (task , scores )
295
- for task , scores in normalized_algo_scores [algo ].items ()}
296
- for algo , task_scores in algo_scores .items ():
297
- for task , scores in task_scores .items ():
298
- assert np .argmax (algo_scores [algo ][task ]) \
299
- == np .argmax (normalized_algo_scores [algo ][task ])
298
+ for task , scores in task_scores .items ():
299
+ normalized_scores = norm_func (task , scores )
300
+ num_runs = normalized_scores .shape [0 ] // len (algos )
301
+ normalized_scores = \
302
+ normalized_scores .reshape (len (algos ), num_runs , - 1 ).squeeze ()
303
+ for idx , algo in enumerate (normalized_algo_scores ):
304
+ normalized_algo_scores [algo ][task ] = normalized_scores [idx ].tolist ()
300
305
301
306
# num_runs * num_tasks
302
307
algo_scores = \
0 commit comments