Commit a0787a9f authored by baberabb
Browse files

Merge remote-tracking branch 'origin/big-refactor' into big-refactor_dp

parents 6359f083 dc5b3d5d
......@@ -27,3 +27,5 @@ metric_list:
higher_is_better: true
ignore_case: true
ignore_punctuation: true
metadata:
- version: 2.0
......@@ -75,3 +75,5 @@ metric_list:
- metric: rougeL_diff
aggregation: mean
higher_is_better: true
metadata:
- version: 2.0
......@@ -32,3 +32,5 @@ metric_list:
- metric: acc
aggregation: mean
higher_is_better: true
metadata:
- version: 2.0
......@@ -9,3 +9,5 @@ metric_list:
- metric: acc
aggregation: mean
higher_is_better: true
metadata:
- version: 2.0
......@@ -16,3 +16,5 @@ metric_list:
higher_is_better: true
ignore_case: false
ignore_punctuation: false
metadata:
- version: 1.0
......@@ -16,3 +16,5 @@ metric_list:
higher_is_better: true
ignore_case: false
ignore_punctuation: false
metadata:
- version: 1.0
......@@ -16,3 +16,5 @@ metric_list:
higher_is_better: true
ignore_case: false
ignore_punctuation: false
metadata:
- version: 1.0
......@@ -16,3 +16,5 @@ metric_list:
higher_is_better: true
ignore_case: false
ignore_punctuation: false
metadata:
- version: 1.0
......@@ -16,3 +16,5 @@ metric_list:
higher_is_better: true
ignore_case: false
ignore_punctuation: false
metadata:
- version: 1.0
......@@ -16,3 +16,5 @@ metric_list:
- metric: exact_match
aggregation: mean
higher_is_better: true
metadata:
- version: 1.0
......@@ -14,3 +14,5 @@ metric_list:
- metric: word_perplexity
- metric: byte_perplexity
- metric: bits_per_byte
metadata:
- version: 2.0
......@@ -13,3 +13,5 @@ metric_list:
- metric: acc
aggregation: mean
higher_is_better: true
metadata:
- version: 1.0
......@@ -15,3 +15,5 @@ metric_list:
- metric: !function metrics.bleu
aggregation: !function metrics.agg_bleu
higher_is_better: true
metadata:
- version: 0.0
......@@ -13,3 +13,5 @@ metric_list:
- metric: acc
aggregation: mean
higher_is_better: true
metadata:
- version: 1.0
......@@ -10,3 +10,5 @@ doc_to_target: label
doc_to_choice: !function utils.doc_to_choice
metric_list:
- metric: acc
metadata:
- version: 1.0
......@@ -15,3 +15,5 @@ metric_list:
- metric: acc
aggregation: mean
higher_is_better: true
metadata:
- version: 1.0
......@@ -14,3 +14,5 @@ metric_list:
- metric: acc
aggregation: mean
higher_is_better: true
metadata:
- version: 1.0
......@@ -16,3 +16,5 @@ metric_list:
- metric: acc
aggregation: mean
higher_is_better: true
metadata:
- version: 1.0
......@@ -339,31 +339,27 @@ def make_table(result_dict, column: str = "results"):
elif column == "groups":
column_name = "Groups"
md_writer = MarkdownTableWriter()
latex_writer = LatexTableWriter()
md_writer.headers = [
column_name,
"Version",
"Filter",
"Metric",
"Value",
"",
"Stderr",
]
latex_writer.headers = [
all_headers = [
column_name,
"Version",
"Filter",
"n-shot",
"Metric",
"Value",
"",
"Stderr",
]
md_writer = MarkdownTableWriter()
latex_writer = LatexTableWriter()
md_writer.headers = all_headers
latex_writer.headers = all_headers
values = []
for k, dic in result_dict[column].items():
version = result_dict["versions"][k]
n = str(result_dict["n-shot"][k])
if "alias" in dic:
k = dic.pop("alias")
......@@ -375,9 +371,9 @@ def make_table(result_dict, column: str = "results"):
if m + "_stderr" + "," + f in dic:
se = dic[m + "_stderr" + "," + f]
values.append([k, version, f, m, "%.4f" % v, "±", "%.4f" % se])
values.append([k, version, f, n, m, "%.4f" % v, "±", "%.4f" % se])
else:
values.append([k, version, f, m, "%.4f" % v, "", ""])
values.append([k, version, f, n, m, "%.4f" % v, "", ""])
k = ""
version = ""
md_writer.value_matrix = values
......
Markdown is supported
0% Try again or attach a new file.
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or sign in to comment