Commit e184c501 authored by lintangsutawika
Browse files

removed " " in make_table

parent ac1a1cef
...@@ -678,7 +678,11 @@ def evaluate( ...@@ -678,7 +678,11 @@ def evaluate(
# results[group][stderr] = lm_eval.api.metrics.combined_sample_stderr(stderrs, sizes, metrics=metrics) # results[group][stderr] = lm_eval.api.metrics.combined_sample_stderr(stderrs, sizes, metrics=metrics)
results[group_or_task]["samples"] = sum(sizes) results[group_or_task]["samples"] = sum(sizes)
versions[group_or_task] = group_config["version"] group_metadata = group_config.get("metadata", None)
if group_metadata is not None:
versions[group_or_task] = group_metadata.get(
"version", None
)
return results, versions, show_group_table, task_aggregation_list return results, versions, show_group_table, task_aggregation_list
results, versions, show_group_table, *_ = process_group( results, versions, show_group_table, *_ = process_group(
......
...@@ -304,16 +304,13 @@ def make_table(result_dict, column: str = "results", sort_results: bool = False) ...@@ -304,16 +304,13 @@ def make_table(result_dict, column: str = "results", sort_results: bool = False)
m, _, f = mf.partition(",") m, _, f = mf.partition(",")
if m.endswith("_stderr"): if m.endswith("_stderr"):
continue continue
if v != " ":
v = "%.4f" % v
hib = HIGHER_IS_BETTER_SYMBOLS.get(higher_is_better.get(m), "") hib = HIGHER_IS_BETTER_SYMBOLS.get(higher_is_better.get(m), "")
if m + "_stderr" + "," + f in dic: if m + "_stderr" + "," + f in dic:
se = dic[m + "_stderr" + "," + f] se = dic[m + "_stderr" + "," + f]
if se != "N/A": se = " N/A" if se == "N/A" else "%.4f" % se
se = "%.4f" % se values.append([k, version, f, n, m, hib, "%.4f" % v, "±", se])
values.append([k, version, f, n, m, hib, v, "±", se])
else: else:
values.append([k, version, f, n, m, hib, v, "", ""]) values.append([k, version, f, n, m, hib, v, "", ""])
k = "" k = ""
......
Markdown is supported
0% Try again or attach a new file.
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or sign in to comment