Commit 6998762a authored by lintangsutawika
Browse files

merged cont-metrics here

parent 2184b8de
...@@ -109,9 +109,9 @@ def ter(items): ...@@ -109,9 +109,9 @@ def ter(items):
@register_aggregation("brier_score") @register_aggregation("brier_score")
def brier_score(items): # This is a passthrough function def brier_score(items): # This is a passthrough function
gold, predictions = list(zip(*items)) gold, predictions = list(zip(*items))
gold = list(gold) gold = np.array(gold)
gold_one_hot = np.eye(np.max(gold) + 1)[gold] predictions = np.array(predictions)
predictions = list(zip(*items))[1] gold_one_hot = np.eye(len(predictions[0]))[gold]
return np.mean(np.sum((predictions - gold_one_hot) ** 2, axis=1)) return np.mean(np.sum((predictions - gold_one_hot) ** 2, axis=1))
......
...@@ -468,6 +468,8 @@ def evaluate( ...@@ -468,6 +468,8 @@ def evaluate(
if stderr is not None: if stderr is not None:
results[task_name][metric + "_stderr" + "," + key] = stderr(items) results[task_name][metric + "_stderr" + "," + key] = stderr(items)
else:
results[task_name][metric + "_stderr" + "," + key] = 0
if bool(results): if bool(results):
......
...@@ -10,6 +10,4 @@ metric_list: ...@@ -10,6 +10,4 @@ metric_list:
- metric: acc - metric: acc
aggregation: mean aggregation: mean
higher_is_better: true higher_is_better: true
- metric: acc_norm - metric: brier_score
aggregation: mean
higher_is_better: true
...@@ -10,6 +10,4 @@ metric_list: ...@@ -10,6 +10,4 @@ metric_list:
- metric: acc - metric: acc
aggregation: mean aggregation: mean
higher_is_better: true higher_is_better: true
- metric: acc_norm - metric: brier_score
aggregation: mean
higher_is_better: true
...@@ -10,6 +10,4 @@ metric_list: ...@@ -10,6 +10,4 @@ metric_list:
- metric: acc - metric: acc
aggregation: mean aggregation: mean
higher_is_better: true higher_is_better: true
- metric: acc_norm - metric: brier_score
aggregation: mean
higher_is_better: true
...@@ -10,6 +10,4 @@ metric_list: ...@@ -10,6 +10,4 @@ metric_list:
- metric: acc - metric: acc
aggregation: mean aggregation: mean
higher_is_better: true higher_is_better: true
- metric: acc_norm - metric: brier_score
aggregation: mean
higher_is_better: true
...@@ -10,6 +10,4 @@ metric_list: ...@@ -10,6 +10,4 @@ metric_list:
- metric: acc - metric: acc
aggregation: mean aggregation: mean
higher_is_better: true higher_is_better: true
- metric: acc_norm - metric: brier_score
aggregation: mean
higher_is_better: true
...@@ -10,6 +10,4 @@ metric_list: ...@@ -10,6 +10,4 @@ metric_list:
- metric: acc - metric: acc
aggregation: mean aggregation: mean
higher_is_better: true higher_is_better: true
- metric: acc_norm - metric: brier_score
aggregation: mean
higher_is_better: true
...@@ -10,6 +10,4 @@ metric_list: ...@@ -10,6 +10,4 @@ metric_list:
- metric: acc - metric: acc
aggregation: mean aggregation: mean
higher_is_better: true higher_is_better: true
- metric: acc_norm - metric: brier_score
aggregation: mean
higher_is_better: true
...@@ -10,6 +10,4 @@ metric_list: ...@@ -10,6 +10,4 @@ metric_list:
- metric: acc - metric: acc
aggregation: mean aggregation: mean
higher_is_better: true higher_is_better: true
- metric: acc_norm - metric: brier_score
aggregation: mean
higher_is_better: true
...@@ -10,6 +10,4 @@ metric_list: ...@@ -10,6 +10,4 @@ metric_list:
- metric: acc - metric: acc
aggregation: mean aggregation: mean
higher_is_better: true higher_is_better: true
- metric: acc_norm - metric: brier_score
aggregation: mean
higher_is_better: true
...@@ -10,6 +10,4 @@ metric_list: ...@@ -10,6 +10,4 @@ metric_list:
- metric: acc - metric: acc
aggregation: mean aggregation: mean
higher_is_better: true higher_is_better: true
- metric: acc_norm - metric: brier_score
aggregation: mean
higher_is_better: true
Markdown is supported
0% Try again or attach a new file.
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or sign in to comment