Unverified commit 34561ece, authored by philipwangOvO, committed by GitHub
Browse files

[Feature] Add InfiniteBench (#739)



* add InfiniteBench

* add InfiniteBench

---------
Co-authored-by: wangchonghua <wangchonghua@pjlab.org.cn>
parent 3a68083e
from datasets import Dataset
from opencompass.registry import LOAD_DATASET
from ..base import BaseDataset
from .utils import iter_jsonl
@LOAD_DATASET.register_module()
class InfiniteBenchzhqaDataset(BaseDataset):
    """Dataset loader registered with ``LOAD_DATASET``.

    Reads a JSON Lines file and exposes three fields per record.
    """

    @staticmethod
    def load(path: str):
        """Build a ``Dataset`` from the JSONL file at ``path``.

        Every record must provide the keys ``context``, ``input`` and
        ``answer`` (a missing key raises ``KeyError``). The ``input``
        field is exposed under the name ``question``; any other keys in
        the record are dropped.
        """
        # Parse the whole file up front, then project each record.
        records = list(iter_jsonl(path))
        rows = [
            {
                'context': record['context'],
                'question': record['input'],
                'answer': record['answer'],
            }
            for record in records
        ]
        return Dataset.from_list(rows)
import json
import re
from opencompass.registry import TEXT_POSTPROCESSORS
def iter_jsonl(path):
    """Lazily yield one parsed JSON value per line of a JSON Lines file.

    Args:
        path: Location of the ``.jsonl`` file to read.

    Yields:
        The object decoded by ``json.loads`` for each non-blank line.

    Raises:
        json.JSONDecodeError: If a non-blank line is not valid JSON.
    """
    # Decode explicitly as UTF-8 so non-ASCII text is read the same way on
    # every platform instead of depending on the locale's default encoding.
    with open(path, 'r', encoding='utf-8') as f:
        for line in f:
            # Tolerate blank lines (e.g. a trailing newline at end of file),
            # which would otherwise make json.loads fail.
            if not line.strip():
                continue
            yield json.loads(line)
@TEXT_POSTPROCESSORS.register_module()
def InfiniteBench_first_number_postprocess(text: str) -> str:
    """Extract the first number that appears in ``text``.

    A number is either a decimal such as ``3.14`` or a plain run of
    digits; the decimal form is tried first at each position.

    Returns:
        The matched number as a string, or ``None`` when ``text``
        contains no digits.
    """
    number_pattern = r'\d+\.\d+|\d+'
    found = re.search(number_pattern, text)
    # The match consists solely of digits and an optional dot, so it can
    # be returned as-is.
    return found.group(0) if found is not None else None
Markdown is supported
0% or .
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or sign in to comment