Commit 835cc40e authored by lintangsutawika
Browse files

merged latest and added altworld files

parents 8da401e0 c9bbec6e
# Generated by utils.py # Generated by utils.py
dataset_name: tough_vs_raising_2 dataset_name: tough_vs_raising_2
include: template_yaml include: _template_yaml
task: blimp_tough_vs_raising_2 task: blimp_tough_vs_raising_2
# Generated by utils.py # Generated by utils.py
dataset_name: transitive dataset_name: transitive
include: template_yaml include: _template_yaml
task: blimp_transitive task: blimp_transitive
# Generated by utils.py # Generated by utils.py
dataset_name: wh_island dataset_name: wh_island
include: template_yaml include: _template_yaml
task: blimp_wh_island task: blimp_wh_island
# Generated by utils.py # Generated by utils.py
dataset_name: wh_questions_object_gap dataset_name: wh_questions_object_gap
include: template_yaml include: _template_yaml
task: blimp_wh_questions_object_gap task: blimp_wh_questions_object_gap
# Generated by utils.py # Generated by utils.py
dataset_name: wh_questions_subject_gap dataset_name: wh_questions_subject_gap
include: template_yaml include: _template_yaml
task: blimp_wh_questions_subject_gap task: blimp_wh_questions_subject_gap
# Generated by utils.py # Generated by utils.py
dataset_name: wh_questions_subject_gap_long_distance dataset_name: wh_questions_subject_gap_long_distance
include: template_yaml include: _template_yaml
task: blimp_wh_questions_subject_gap_long_distance task: blimp_wh_questions_subject_gap_long_distance
# Generated by utils.py # Generated by utils.py
dataset_name: wh_vs_that_no_gap dataset_name: wh_vs_that_no_gap
include: template_yaml include: _template_yaml
task: blimp_wh_vs_that_no_gap task: blimp_wh_vs_that_no_gap
# Generated by utils.py # Generated by utils.py
dataset_name: wh_vs_that_no_gap_long_distance dataset_name: wh_vs_that_no_gap_long_distance
include: template_yaml include: _template_yaml
task: blimp_wh_vs_that_no_gap_long_distance task: blimp_wh_vs_that_no_gap_long_distance
# Generated by utils.py # Generated by utils.py
dataset_name: wh_vs_that_with_gap dataset_name: wh_vs_that_with_gap
include: template_yaml include: _template_yaml
task: blimp_wh_vs_that_with_gap task: blimp_wh_vs_that_with_gap
# Generated by utils.py # Generated by utils.py
dataset_name: wh_vs_that_with_gap_long_distance dataset_name: wh_vs_that_with_gap_long_distance
include: template_yaml include: _template_yaml
task: blimp_wh_vs_that_with_gap_long_distance task: blimp_wh_vs_that_with_gap_long_distance
...@@ -16,4 +16,4 @@ metric_list: ...@@ -16,4 +16,4 @@ metric_list:
aggregation: mean aggregation: mean
higher_is_better: true higher_is_better: true
metadata: metadata:
version: "1.0" - version: 1.0
...@@ -15,3 +15,5 @@ metric_list: ...@@ -15,3 +15,5 @@ metric_list:
- metric: acc_norm - metric: acc_norm
aggregation: mean aggregation: mean
higher_is_better: true higher_is_better: true
metadata:
- version: 0.0
...@@ -17,3 +17,5 @@ metric_list: ...@@ -17,3 +17,5 @@ metric_list:
- metric: !function bleu.smoothed_bleu_4 - metric: !function bleu.smoothed_bleu_4
aggregation: mean aggregation: mean
higher_is_better: True higher_is_better: True
metadata:
- version: 0.0
...@@ -17,3 +17,5 @@ metric_list: ...@@ -17,3 +17,5 @@ metric_list:
- metric: !function bleu.smoothed_bleu_4 - metric: !function bleu.smoothed_bleu_4
aggregation: mean aggregation: mean
higher_is_better: True higher_is_better: True
metadata:
- version: 0.0
...@@ -17,3 +17,5 @@ metric_list: ...@@ -17,3 +17,5 @@ metric_list:
- metric: !function bleu.smoothed_bleu_4 - metric: !function bleu.smoothed_bleu_4
aggregation: mean aggregation: mean
higher_is_better: True higher_is_better: True
metadata:
- version: 0.0
...@@ -17,3 +17,5 @@ metric_list: ...@@ -17,3 +17,5 @@ metric_list:
- metric: !function bleu.smoothed_bleu_4 - metric: !function bleu.smoothed_bleu_4
aggregation: mean aggregation: mean
higher_is_better: True higher_is_better: True
metadata:
- version: 0.0
...@@ -17,3 +17,5 @@ metric_list: ...@@ -17,3 +17,5 @@ metric_list:
- metric: !function bleu.smoothed_bleu_4 - metric: !function bleu.smoothed_bleu_4
aggregation: mean aggregation: mean
higher_is_better: True higher_is_better: True
metadata:
- version: 0.0
...@@ -17,3 +17,5 @@ metric_list: ...@@ -17,3 +17,5 @@ metric_list:
- metric: !function bleu.smoothed_bleu_4 - metric: !function bleu.smoothed_bleu_4
aggregation: mean aggregation: mean
higher_is_better: True higher_is_better: True
metadata:
- version: 2.0
...@@ -18,3 +18,5 @@ metric_list: ...@@ -18,3 +18,5 @@ metric_list:
- metric: f1 - metric: f1
aggregation: mean aggregation: mean
higher_is_better: true higher_is_better: true
metadata:
- version: 2.0
...@@ -19,3 +19,5 @@ metric_list: ...@@ -19,3 +19,5 @@ metric_list:
- metric: pct_stereotype - metric: pct_stereotype
aggregation: mean aggregation: mean
higher_is_better: false higher_is_better: false
metadata:
- version: 1.0
Markdown is supported
0% Try again or attach a new file.
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or sign in to comment