Commit b58e5556 authored by Baber
Browse files

Merge branch 'main' into tasklist

# Conflicts:
#	pyproject.toml
parents 6e1866f5 4f8195f1
include: _template_yaml
dataset_name: tpn
task: multiblimp_tpn
include: _template_yaml
dataset_name: ttc
task: multiblimp_ttc
include: _template_yaml
dataset_name: tur
task: multiblimp_tur
include: _template_yaml
dataset_name: uig
task: multiblimp_uig
include: _template_yaml
dataset_name: ukr
task: multiblimp_ukr
include: _template_yaml
dataset_name: urb
task: multiblimp_urb
include: _template_yaml
dataset_name: urd
task: multiblimp_urd
include: _template_yaml
dataset_name: uzb
task: multiblimp_uzb
include: _template_yaml
dataset_name: vep
task: multiblimp_vep
include: _template_yaml
dataset_name: wbp
task: multiblimp_wbp
include: _template_yaml
dataset_name: wol
task: multiblimp_wol
include: _template_yaml
dataset_name: xcl
task: multiblimp_xcl
include: _template_yaml
dataset_name: xnr
task: multiblimp_xnr
include: _template_yaml
dataset_name: xpg
task: multiblimp_xpg
include: _template_yaml
dataset_name: yrl
task: multiblimp_yrl
...@@ -23,5 +23,3 @@ metric_list: ...@@ -23,5 +23,3 @@ metric_list:
higher_is_better: true higher_is_better: true
metadata: metadata:
version: 2.0 version: 2.0
dataset_kwargs:
trust_remote_code: true
...@@ -2,8 +2,6 @@ dataset_path: Helsinki-NLP/tatoeba_mt ...@@ -2,8 +2,6 @@ dataset_path: Helsinki-NLP/tatoeba_mt
training_split: validation training_split: validation
test_split: test test_split: test
output_type: generate_until output_type: generate_until
dataset_kwargs:
trust_remote_code: true
metric_list: metric_list:
- metric: bleu - metric: bleu
higher_is_better: true higher_is_better: true
......
...@@ -12,7 +12,9 @@ try: ...@@ -12,7 +12,9 @@ try:
except (ModuleNotFoundError, ImportError): except (ModuleNotFoundError, ImportError):
raise ModuleNotFoundError( raise ModuleNotFoundError(
"Please install evaluation metrics via pip install evaluate and pip install bert-score", "Please install evaluation metrics via pip install evaluate bert-score "
"rouge_score>=0.1.2 nltk absl-py "
"git+https://github.com/google-research/bleurt.git"
) )
except Exception as e: except Exception as e:
raise RuntimeError( raise RuntimeError(
......
...@@ -19,5 +19,3 @@ metric_list: ...@@ -19,5 +19,3 @@ metric_list:
higher_is_better: true higher_is_better: true
metadata: metadata:
version: 1.0 version: 1.0
dataset_kwargs:
trust_remote_code: true
...@@ -23,5 +23,3 @@ metric_list: ...@@ -23,5 +23,3 @@ metric_list:
higher_is_better: true higher_is_better: true
metadata: metadata:
version: 1.0 version: 1.0
dataset_kwargs:
trust_remote_code: true
Markdown is supported
0% or .
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or sign in to comment