Commit 0d03a9f3 authored by lintangsutawika
Browse files

add versions

parent bf26d979
......@@ -17,3 +17,5 @@ metric_list:
- metric: !function bleu.smoothed_bleu_4
aggregation: mean
higher_is_better: True
metadata:
- version: 0.0
\ No newline at end of file
......@@ -17,3 +17,5 @@ metric_list:
- metric: !function bleu.smoothed_bleu_4
aggregation: mean
higher_is_better: True
metadata:
- version: 2.0
\ No newline at end of file
......@@ -18,3 +18,5 @@ metric_list:
- metric: f1
aggregation: mean
higher_is_better: true
metadata:
- version: 2.0
\ No newline at end of file
......@@ -19,3 +19,5 @@ metric_list:
- metric: pct_stereotype
aggregation: mean
higher_is_better: false
metadata:
- version: 1.0
\ No newline at end of file
......@@ -13,3 +13,5 @@ metric_list:
- metric: acc_norm
aggregation: mean
higher_is_better: true
metadata:
- version: 0.0
\ No newline at end of file
......@@ -20,3 +20,5 @@ metric_list:
- metric: f1
aggregation: mean
higher_is_better: true
metadata:
- version: 2.0
\ No newline at end of file
......@@ -12,3 +12,5 @@ should_decontaminate: true
doc_to_decontamination_query: sentence
metric_list:
- metric: mcc
metadata:
- version: 1.0
\ No newline at end of file
......@@ -10,3 +10,5 @@ doc_to_target: label
doc_to_choice: ["True", "Neither", "False"]
metric_list:
- metric: acc
metadata:
- version: 1.0
\ No newline at end of file
......@@ -11,3 +11,5 @@ doc_to_choice: ["no", "yes"]
metric_list:
- metric: acc
- metric: f1
metadata:
- version: 1.0
\ No newline at end of file
......@@ -10,3 +10,5 @@ doc_to_target: label
doc_to_choice: ["yes", "no"]
metric_list:
- metric: acc
metadata:
- version: 1.0
\ No newline at end of file
......@@ -12,3 +12,5 @@ doc_to_choice: ["no", "yes"]
metric_list:
- metric: acc
- metric: f1
metadata:
- version: 1.0
\ No newline at end of file
......@@ -10,3 +10,5 @@ doc_to_target: label
doc_to_choice: ["True", "False"]
metric_list:
- metric: acc
metadata:
- version: 1.0
\ No newline at end of file
......@@ -10,3 +10,5 @@ doc_to_target: label
doc_to_choice: ["negative", "positive"]
metric_list:
- metric: acc
metadata:
- version: 1.0
\ No newline at end of file
......@@ -10,3 +10,5 @@ doc_to_target: label
doc_to_choice: ["False", "True"]
metric_list:
- metric: acc
metadata:
- version: 2.0
\ No newline at end of file
......@@ -30,3 +30,5 @@ filter_list:
regex_pattern: "The answer is (\\-?[0-9\\.\\,]*[0-9]+)"
- function: "majority_vote"
- function: "take_first"
metadata:
- version: 0.0
\ No newline at end of file
......@@ -40,3 +40,5 @@ filter_list:
- function: "regex"
regex_pattern: "The answer is (\\-?[0-9\\.\\,]+)."
- function: "take_first"
metadata:
- version: 0.0
\ No newline at end of file
......@@ -33,3 +33,5 @@ filter_list:
- function: "regex"
regex_pattern: "#### (\\-?[0-9\\.\\,]+)"
- function: "take_first"
metadata:
- version: 1.0
\ No newline at end of file
......@@ -19,3 +19,5 @@ metric_list:
- metric: acc_norm
aggregation: mean
higher_is_better: true
metadata:
- version: 1.0
\ No newline at end of file
......@@ -18,3 +18,5 @@ metric_list:
- metric: acc_norm
aggregation: mean
higher_is_better: true
metadata:
- version: 1.0
\ No newline at end of file
......@@ -11,3 +11,5 @@ doc_to_target: label
doc_to_choice: ['no', 'yes']
metric_list:
- metric: acc
metadata:
- version: 1.0
\ No newline at end of file
Markdown is supported
0% Try again or attach a new file.
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or sign in to comment