gaoqiong / lm-evaluation-harness
Commit 0eb94c8b: "process aggregate fix"
Authored Aug 01, 2023 by lintangsutawika
Parent: b2598de8
Showing 1 changed file with 1 addition and 4 deletions: lm_eval/evaluator.py (+1, -4)
@@ -386,9 +386,6 @@ def evaluate(
...
            task_score = task.aggregation()[metric](items)
            results[task_name][metric + "," + key] = task_score
            # if task_name not in benchmark_agg:
            #     benchmark[] = [task_score]
            # Need to put back in results
            # pythia | acc
            #        | perplexity
...
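The hunk above stores each per-task score under a compound key built from the metric name and a subset key joined by a comma. A minimal sketch of that keying scheme; the task name "lambada", the key "none", and the score value are made up for illustration:

```python
# Hypothetical illustration of the compound-key pattern in the hunk above:
# results[task_name][metric + "," + key] = task_score.
results = {"lambada": {}}

task_name, metric, key = "lambada", "acc", "none"  # assumed example values
task_score = 0.72  # stand-in for task.aggregation()[metric](items)

# The metric and subset key are joined with a comma to form one dict key.
results[task_name][metric + "," + key] = task_score

assert results == {"lambada": {"acc,none": 0.72}}
```

Keeping metric and key in a single comma-joined string means `results[task_name]` stays a flat dict, at the cost of callers having to split the key back apart when they need the parts separately.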
@@ -415,7 +412,7 @@ def evaluate(
...
            if stderr is not None:
                results[task_name][metric + "_stderr" + "," + key] = stderr(items)

-    if not bool(aggregate):
+    if bool(aggregate):
        for group in aggregate.keys():
            for metric in aggregate[group].keys():
                aggregate[group][metric] = np.average(aggregate[group][metric])
...
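The one-line fix flips the guard: the old `if not bool(aggregate):` ran the averaging loop only when `aggregate` was empty, i.e. exactly when there was nothing to aggregate, so populated groups were never reduced. A minimal sketch of the corrected behavior; the group name "pythia", its metrics, and the score lists are made up for illustration:

```python
# Sketch of the aggregation step this commit fixes. The group/metric
# names and values below are hypothetical, not taken from the repo.
import numpy as np

# Per-group, per-metric lists of task scores collected during evaluation.
aggregate = {
    "pythia": {"acc": [0.61, 0.55, 0.70], "perplexity": [12.3, 9.8]},
}

# Corrected guard: aggregate only when the dict is non-empty. The old
# `if not bool(aggregate):` skipped precisely this populated case.
if bool(aggregate):
    for group in aggregate.keys():
        for metric in aggregate[group].keys():
            # Collapse each score list into its mean.
            aggregate[group][metric] = np.average(aggregate[group][metric])
```

After the loop, `aggregate["pythia"]["acc"]` holds the mean of the three accuracy scores rather than the raw list, which is the shape the surrounding reporting code expects.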