Unverified commit 19ad7f96, authored by Fengzhe Zhou, committed by GitHub
Browse files

fix cmb dataset (#587)

parent 14e6fe6f
...@@ -18,7 +18,6 @@ class CMBDataset(BaseDataset): ...@@ -18,7 +18,6 @@ class CMBDataset(BaseDataset):
for d in val_data: for d in val_data:
d['option_str'] = '\n'.join( d['option_str'] = '\n'.join(
[f'{k}. {v}' for k, v in d['option'].items() if len(v) > 1]) [f'{k}. {v}' for k, v in d['option'].items() if len(v) > 1])
d['answer'] = 'NULL'
val_dataset = Dataset.from_list(val_data) val_dataset = Dataset.from_list(val_data)
with open(osp.join(path, 'test.json'), 'r', encoding='utf-8') as f: with open(osp.join(path, 'test.json'), 'r', encoding='utf-8') as f:
...@@ -26,6 +25,7 @@ class CMBDataset(BaseDataset): ...@@ -26,6 +25,7 @@ class CMBDataset(BaseDataset):
for d in test_data: for d in test_data:
d['option_str'] = '\n'.join( d['option_str'] = '\n'.join(
[f'{k}. {v}' for k, v in d['option'].items() if len(v) > 1]) [f'{k}. {v}' for k, v in d['option'].items() if len(v) > 1])
d['answer'] = 'NULL'
test_dataset = Dataset.from_list(test_data) test_dataset = Dataset.from_list(test_data)
return DatasetDict({'val': val_dataset, 'test': test_dataset}) return DatasetDict({'val': val_dataset, 'test': test_dataset})
Markdown is supported
0% Try again or attach a new file.
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or sign in to comment