Commit 2493c6cc authored by lintangsutawika
Browse files

changed default to 5-shot

parent f2c396ab
...@@ -3,10 +3,11 @@ task: ...@@ -3,10 +3,11 @@ task:
# BBH # BBH
- bbh_flan_zeroshot - bbh_flan_zeroshot
- bbh_flan_fewshot - bbh_flan_fewshot
# - bbh_flan_cot_fewshot - bbh_flan_cot_fewshot
# - bbh_flan_cot_zeroshot - bbh_flan_cot_zeroshot
# MMLU # MMLU
- mmlu
- mmlu_flan_n_shot_generative - mmlu_flan_n_shot_generative
- mmlu_flan_n_shot_loglikelihood - mmlu_flan_n_shot_loglikelihood
# - mmlu_flan_cot_zeroshot - mmlu_flan_cot_zeroshot
# - mmlu_flan_cot_fewshot - mmlu_flan_cot_fewshot
...@@ -15,3 +15,4 @@ metric_list: ...@@ -15,3 +15,4 @@ metric_list:
- metric: acc_norm - metric: acc_norm
aggregation: mean aggregation: mean
higher_is_better: true higher_is_better: true
num_fewshot: 5
...@@ -12,3 +12,4 @@ metric_list: ...@@ -12,3 +12,4 @@ metric_list:
- metric: exact_match - metric: exact_match
aggregation: mean aggregation: mean
higher_is_better: true higher_is_better: true
num_fewshot: 5
...@@ -13,3 +13,4 @@ metric_list: ...@@ -13,3 +13,4 @@ metric_list:
- metric: acc_norm - metric: acc_norm
aggregation: mean aggregation: mean
higher_is_better: true higher_is_better: true
num_fewshot: 5
Markdown is supported
0% or .
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or sign in to comment