Skip to content
GitLab
Menu
Projects
Groups
Snippets
Loading...
Help
Help
Support
Community forum
Keyboard shortcuts
?
Submit feedback
Contribute to GitLab
Sign in / Register
Toggle navigation
Menu
Open sidebar
gaoqiong
lm-evaluation-harness
Commits
37a46351
Commit
37a46351
authored
Nov 28, 2023
by
lintangsutawika
Browse files
reformat
parent
525afc17
Changes
122
Hide whitespace changes
Inline
Side-by-side
Showing
20 changed files
with
20 additions
and
20 deletions
+20
-20
lm_eval/tasks/hendrycks_ethics/utilitarianism.yaml
lm_eval/tasks/hendrycks_ethics/utilitarianism.yaml
+1
-1
lm_eval/tasks/hendrycks_ethics/utilitarianism_original_yaml
lm_eval/tasks/hendrycks_ethics/utilitarianism_original_yaml
+1
-1
lm_eval/tasks/hendrycks_ethics/virtue.yaml
lm_eval/tasks/hendrycks_ethics/virtue.yaml
+1
-1
lm_eval/tasks/lambada/lambada_openai.yaml
lm_eval/tasks/lambada/lambada_openai.yaml
+1
-1
lm_eval/tasks/lambada/lambada_standard.yaml
lm_eval/tasks/lambada/lambada_standard.yaml
+1
-1
lm_eval/tasks/lambada_cloze/lambada_openai_cloze.yaml
lm_eval/tasks/lambada_cloze/lambada_openai_cloze.yaml
+1
-1
lm_eval/tasks/lambada_cloze/lambada_standard_cloze.yaml
lm_eval/tasks/lambada_cloze/lambada_standard_cloze.yaml
+1
-1
lm_eval/tasks/lambada_multilingual/lambada_mt_en.yaml
lm_eval/tasks/lambada_multilingual/lambada_mt_en.yaml
+1
-1
lm_eval/tasks/logiqa/logiqa.yaml
lm_eval/tasks/logiqa/logiqa.yaml
+1
-1
lm_eval/tasks/logiqa2/logieval.yaml
lm_eval/tasks/logiqa2/logieval.yaml
+1
-1
lm_eval/tasks/logiqa2/logiqa2.yaml
lm_eval/tasks/logiqa2/logiqa2.yaml
+1
-1
lm_eval/tasks/mathqa/mathqa.yaml
lm_eval/tasks/mathqa/mathqa.yaml
+1
-1
lm_eval/tasks/mc_taco/default.yaml
lm_eval/tasks/mc_taco/default.yaml
+1
-1
lm_eval/tasks/mgsm/direct/direct_yaml
lm_eval/tasks/mgsm/direct/direct_yaml
+1
-1
lm_eval/tasks/mgsm/en_cot/cot_yaml
lm_eval/tasks/mgsm/en_cot/cot_yaml
+1
-1
lm_eval/tasks/mgsm/native_cot/cot_yaml
lm_eval/tasks/mgsm/native_cot/cot_yaml
+1
-1
lm_eval/tasks/minerva_math/minerva_math_algebra.yaml
lm_eval/tasks/minerva_math/minerva_math_algebra.yaml
+1
-1
lm_eval/tasks/mmlu/default/_default_template_yaml
lm_eval/tasks/mmlu/default/_default_template_yaml
+1
-1
lm_eval/tasks/mmlu/flan_cot_fewshot/_mmlu_flan_cot_fewshot_template_yaml
...mlu/flan_cot_fewshot/_mmlu_flan_cot_fewshot_template_yaml
+1
-1
lm_eval/tasks/mmlu/flan_cot_zeroshot/_mmlu_flan_cot_zeroshot_template_yaml
...u/flan_cot_zeroshot/_mmlu_flan_cot_zeroshot_template_yaml
+1
-1
No files found.
lm_eval/tasks/hendrycks_ethics/utilitarianism.yaml
View file @
37a46351
...
...
@@ -9,4 +9,4 @@ doc_to_choice: ['no', 'yes']
metric_list
:
-
metric
:
acc
metadata
:
-
version
:
1.0
\ No newline at end of file
-
version
:
1.0
lm_eval/tasks/hendrycks_ethics/utilitarianism_original_yaml
View file @
37a46351
...
...
@@ -13,4 +13,4 @@
# - metric: acc
# TODO: we want this to be implemented as a winograd_schema task type, actually
# metadata:
# - version: 1.0
\ No newline at end of file
# - version: 1.0
lm_eval/tasks/hendrycks_ethics/virtue.yaml
View file @
37a46351
...
...
@@ -7,4 +7,4 @@ doc_to_text: "Sentence: {{scenario}}\nQuestion: Does the character in this sente
doc_to_target
:
label
doc_to_choice
:
[
'
no'
,
'
yes'
]
metadata
:
-
version
:
1.0
\ No newline at end of file
-
version
:
1.0
lm_eval/tasks/lambada/lambada_openai.yaml
View file @
37a46351
...
...
@@ -17,4 +17,4 @@ metric_list:
aggregation
:
mean
higher_is_better
:
true
metadata
:
-
version
:
1.0
\ No newline at end of file
-
version
:
1.0
lm_eval/tasks/lambada/lambada_standard.yaml
View file @
37a46351
...
...
@@ -18,4 +18,4 @@ metric_list:
aggregation
:
mean
higher_is_better
:
true
metadata
:
-
version
:
1.0
\ No newline at end of file
-
version
:
1.0
lm_eval/tasks/lambada_cloze/lambada_openai_cloze.yaml
View file @
37a46351
...
...
@@ -17,4 +17,4 @@ metric_list:
aggregation
:
mean
higher_is_better
:
true
metadata
:
-
version
:
1.0
\ No newline at end of file
-
version
:
1.0
lm_eval/tasks/lambada_cloze/lambada_standard_cloze.yaml
View file @
37a46351
...
...
@@ -18,4 +18,4 @@ metric_list:
aggregation
:
mean
higher_is_better
:
true
metadata
:
-
version
:
1.0
\ No newline at end of file
-
version
:
1.0
lm_eval/tasks/lambada_multilingual/lambada_mt_en.yaml
View file @
37a46351
...
...
@@ -17,4 +17,4 @@ metric_list:
aggregation
:
mean
higher_is_better
:
true
metadata
:
-
version
:
1.0
\ No newline at end of file
-
version
:
1.0
lm_eval/tasks/logiqa/logiqa.yaml
View file @
37a46351
...
...
@@ -18,4 +18,4 @@ metric_list:
aggregation
:
mean
higher_is_better
:
true
metadata
:
-
version
:
1.0
\ No newline at end of file
-
version
:
1.0
lm_eval/tasks/logiqa2/logieval.yaml
View file @
37a46351
...
...
@@ -24,4 +24,4 @@ filter_list:
regex_pattern
:
"
^
\\
s*([A-D])"
-
function
:
"
take_first"
metadata
:
-
version
:
0.0
\ No newline at end of file
-
version
:
0.0
lm_eval/tasks/logiqa2/logiqa2.yaml
View file @
37a46351
...
...
@@ -18,4 +18,4 @@ metric_list:
aggregation
:
mean
higher_is_better
:
true
metadata
:
-
version
:
0.0
\ No newline at end of file
-
version
:
0.0
lm_eval/tasks/mathqa/mathqa.yaml
View file @
37a46351
...
...
@@ -19,4 +19,4 @@ metric_list:
aggregation
:
mean
higher_is_better
:
true
metadata
:
-
version
:
1.0
\ No newline at end of file
-
version
:
1.0
lm_eval/tasks/mc_taco/default.yaml
View file @
37a46351
...
...
@@ -12,4 +12,4 @@ metric_list:
-
metric
:
acc
-
metric
:
f1
metadata
:
-
version
:
1.0
\ No newline at end of file
-
version
:
1.0
lm_eval/tasks/mgsm/direct/direct_yaml
View file @
37a46351
...
...
@@ -26,4 +26,4 @@ metric_list:
ignore_case: true
ignore_punctuation: true
metadata:
- version: 0.0
\ No newline at end of file
- version: 0.0
lm_eval/tasks/mgsm/en_cot/cot_yaml
View file @
37a46351
...
...
@@ -28,4 +28,4 @@ filter_list:
regex_pattern: "The answer is (\\-?[0-9\\.\\,]+)"
- function: "take_first"
metadata:
- version: 0.0
\ No newline at end of file
- version: 0.0
lm_eval/tasks/mgsm/native_cot/cot_yaml
View file @
37a46351
...
...
@@ -28,4 +28,4 @@ filter_list:
regex_pattern: "The answer is (\\-?[0-9\\.\\,]+)"
- function: "take_first"
metadata:
- version: 1.0
\ No newline at end of file
- version: 1.0
lm_eval/tasks/minerva_math/minerva_math_algebra.yaml
View file @
37a46351
...
...
@@ -20,4 +20,4 @@ metric_list:
aggregation
:
mean
higher_is_better
:
true
metadata
:
-
version
:
0.0
\ No newline at end of file
-
version
:
0.0
lm_eval/tasks/mmlu/default/_default_template_yaml
View file @
37a46351
...
...
@@ -12,4 +12,4 @@ metric_list:
aggregation: mean
higher_is_better: true
metadata:
- version: 0.0
\ No newline at end of file
- version: 0.0
lm_eval/tasks/mmlu/flan_cot_fewshot/_mmlu_flan_cot_fewshot_template_yaml
View file @
37a46351
...
...
@@ -22,4 +22,4 @@ metric_list:
ignore_case: true
ignore_punctuation: true
metadata:
- version: 0.0
\ No newline at end of file
- version: 0.0
lm_eval/tasks/mmlu/flan_cot_zeroshot/_mmlu_flan_cot_zeroshot_template_yaml
View file @
37a46351
...
...
@@ -22,4 +22,4 @@ metric_list:
ignore_case: true
ignore_punctuation: true
metadata:
- version: 0.0
\ No newline at end of file
- version: 0.0
Prev
1
2
3
4
5
6
7
Next
Write
Preview
Markdown
is supported
0%
Try again
or
attach a new file
.
Attach a file
Cancel
You are about to add
0
people
to the discussion. Proceed with caution.
Finish editing this message first!
Cancel
Please
register
or
sign in
to comment