format

135b41ce · lintangsutawika · 0436b5d6 · 135b41ce
Commit 135b41ce authored Aug 15, 2023 by lintangsutawika
Show whitespace changes
Inline Side-by-side

Showing with 23 additions and 21 deletions

lm_eval/tasks/truthfulqa/utils.py lm_eval/tasks/truthfulqa/utils.py +23 -21

No files found.
--- a/lm_eval/tasks/truthfulqa/utils.py
+++ b/lm_eval/tasks/truthfulqa/utils.py
@@ -4,6 +4,7 @@ import numpy as np
 from rouge_score import rouge_scorer, scoring
 def process_results_mc2(doc, results):
    lls, is_greedy = zip(*results)
@@ -24,7 +25,6 @@ def process_docs_gen(dataset: datasets.Dataset) -> datasets.Dataset:
 def preprocess_function(examples):
    def _format_answers(answers):
        formatted_answers = []
        for answer in answers:
@@ -142,6 +142,7 @@ def bleu(refs, preds):
    ).score
    return score
 def rouge(refs, preds):
    """
    Returns `t5` style ROUGE scores. See the related implementation:
@@ -169,6 +170,7 @@ def rouge(refs, preds):
    result = aggregator.aggregate()
    return {type: result[type].mid.fmeasure * 100 for type in rouge_types}
 # def bleurt_max(predictions, references):
 #     pass