Commit b0597a94 authored by lintangsutawika
Browse files

adjustments for super_glue

parent ee633332
...@@ -23,6 +23,7 @@ from lm_eval.api.filter import FilterEnsemble ...@@ -23,6 +23,7 @@ from lm_eval.api.filter import FilterEnsemble
from lm_eval.logger import eval_logger from lm_eval.logger import eval_logger
from lm_eval.prompts import get_prompt from lm_eval.prompts import get_prompt
from lm_eval.filters import build_filter_ensemble from lm_eval.filters import build_filter_ensemble
from lm_eval.metrics import metric_max_over_ground_truths
from lm_eval.api.metrics import ( from lm_eval.api.metrics import (
mean, mean,
weighted_perplexity, weighted_perplexity,
......
...@@ -8,7 +8,7 @@ training_split: train ...@@ -8,7 +8,7 @@ training_split: train
validation_split: validation validation_split: validation
doc_to_text: "{{passage}}\nQuestion: {{question}}?\nAnswer:" doc_to_text: "{{passage}}\nQuestion: {{question}}?\nAnswer:"
doc_to_target: label doc_to_target: label
doc_to_choice: {0: "no", 1: "yes"} doc_to_choice: ["no", "yes"]
should_decontaminate: true should_decontaminate: true
doc_to_decontamination_query: passage doc_to_decontamination_query: passage
metric_list: metric_list:
......
...@@ -8,6 +8,6 @@ training_split: train ...@@ -8,6 +8,6 @@ training_split: train
validation_split: validation validation_split: validation
doc_to_text: "{{paragraph}}\nQuestion: {{question}}\nAnswer:" doc_to_text: "{{paragraph}}\nQuestion: {{question}}\nAnswer:"
doc_to_target: label doc_to_target: label
doc_to_choice: "[\"{{answer}}\\nIs the answer correct? yes\", \"{{answer}}\\nIs the answer correct? no\"]" doc_to_choice: "['''{{answer}}\\nIs the answer correct? yes''', '''{{answer}}\\nIs the answer correct? no''']"
metric_list: metric_list:
- metric: acc - metric: acc
group: # group:
- super-glue-lm-eval-v1 # - super-glue-lm-eval-v1
task: record task: record
dataset_path: super_glue dataset_path: super_glue
dataset_name: record dataset_name: record
......
Markdown is supported
0% Try again or attach a new file.
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or sign in to comment