Unverified commit ad506a13, authored by Baber Abbasi, committed by GitHub
Browse files

remove duplicate tags/groups (#3343)

parent d5ddccd9
group: longbench2 group: longbench2
task: task:
- longbench2_history - longbench2_history_tasks
- longbench2_incontext - longbench2_incontext_tasks
- longbench2_multi - longbench2_multi_tasks
- longbench2_single - longbench2_single_tasks
- longbench2_structured - longbench2_structured_tasks
- longbench2_code - longbench2_code
aggregate_metric_list: aggregate_metric_list:
- metric: acc - metric: acc
......
include: _longbench_common_yaml include: _longbench_common_yaml
tag: tag:
- longbench2 - longbench2_tasks
- longbench2_multi - longbench2_multi_tasks
task: longbench2_academic_multi task: longbench2_academic_multi
dataset_name: academic_multi dataset_name: academic_multi
include: _longbench_common_yaml include: _longbench_common_yaml
tag: tag:
- longbench2 - longbench2_tasks
- longbench2_single - longbench2_single_tasks
task: longbench2_academic_single task: longbench2_academic_single
dataset_name: academic_single dataset_name: academic_single
include: _longbench_common_yaml include: _longbench_common_yaml
tag: tag:
- longbench2 - longbench2_tasks
- longbench2_history - longbench2_history_tasks
task: longbench2_agent_history task: longbench2_agent_history
dataset_name: agent_history_qa dataset_name: agent_history_qa
include: _longbench_common_yaml include: _longbench_common_yaml
tag: tag:
- longbench2 - longbench2_tasks
- longbench2_single - longbench2_single_tasks
task: longbench2_detective task: longbench2_detective
dataset_name: detective dataset_name: detective
include: _longbench_common_yaml include: _longbench_common_yaml
tag: tag:
- longbench2 - longbench2_tasks
- longbench2_history - longbench2_history_tasks
task: longbench2_dialogue_history task: longbench2_dialogue_history
dataset_name: dialogue_history_qa dataset_name: dialogue_history_qa
include: _longbench_common_yaml include: _longbench_common_yaml
tag: tag:
- longbench2 - longbench2_tasks
- longbench2_single - longbench2_single_tasks
task: longbench2_event_order task: longbench2_event_order
dataset_name: event_ordering dataset_name: event_ordering
include: _longbench_common_yaml include: _longbench_common_yaml
tag: tag:
- longbench2 - longbench2_tasks
- longbench2_multi - longbench2_multi_tasks
task: longbench2_fin_multi task: longbench2_fin_multi
dataset_name: financial_multi dataset_name: financial_multi
include: _longbench_common_yaml include: _longbench_common_yaml
tag: tag:
- longbench2 - longbench2_tasks
- longbench2_single - longbench2_single_tasks
task: longbench2_fin_single task: longbench2_fin_single
dataset_name: financial_single dataset_name: financial_single
include: _longbench_common_yaml include: _longbench_common_yaml
tag: tag:
- longbench2 - longbench2_tasks
- longbench2_multi - longbench2_multi_tasks
task: longbench2_govt_multi task: longbench2_govt_multi
dataset_name: government_multi dataset_name: government_multi
include: _longbench_common_yaml include: _longbench_common_yaml
tag: tag:
- longbench2 - longbench2_tasks
- longbench2_single - longbench2_single_tasks
task: longbench2_govt_single task: longbench2_govt_single
dataset_name: government_single dataset_name: government_single
include: _longbench_common_yaml include: _longbench_common_yaml
tag: tag:
- longbench2 - longbench2_tasks
- longbench2_structured - longbench2_structured_tasks
task: longbench2_graph task: longbench2_graph
dataset_name: graph_reasoning dataset_name: graph_reasoning
include: _longbench_common_yaml include: _longbench_common_yaml
tag: tag:
- longbench2 - longbench2_tasks
- longbench2_multi - longbench2_multi_tasks
task: longbench2_legal_multi task: longbench2_legal_multi
dataset_name: legal_multi dataset_name: legal_multi
include: _longbench_common_yaml include: _longbench_common_yaml
tag: tag:
- longbench2 - longbench2_tasks
- longbench2_single - longbench2_single_tasks
task: longbench2_legal_single task: longbench2_legal_single
dataset_name: legal_single dataset_name: legal_single
include: _longbench_common_yaml include: _longbench_common_yaml
tag: tag:
- longbench2 - longbench2_tasks
- longbench2_single - longbench2_single_tasks
task: longbench2_lit_single task: longbench2_lit_single
dataset_name: literary dataset_name: literary
include: _longbench_common_yaml include: _longbench_common_yaml
tag: tag:
- longbench2 - longbench2_tasks
task: longbench2_code task: longbench2_code
dataset_name: code_repo_qa dataset_name: code_repo_qa
include: _longbench_common_yaml include: _longbench_common_yaml
tag: tag:
- longbench2 - longbench2_tasks
- longbench2_incontext - longbench2_incontext_tasks
task: longbench2_many_shot task: longbench2_many_shot
dataset_name: manyshot_learning dataset_name: manyshot_learning
include: _longbench_common_yaml include: _longbench_common_yaml
tag: tag:
- longbench2 - longbench2_tasks
- longbench2_multi - longbench2_multi_tasks
task: longbench2_news_multi task: longbench2_news_multi
dataset_name: multinews dataset_name: multinews
include: _longbench_common_yaml include: _longbench_common_yaml
tag: tag:
- longbench2 - longbench2_tasks
- longbench2_structured - longbench2_structured_tasks
task: longbench2_table task: longbench2_table
dataset_name: table_qa dataset_name: table_qa
include: _longbench_common_yaml include: _longbench_common_yaml
tag: tag:
- longbench2 - longbench2_tasks
- longbench2_incontext - longbench2_incontext_tasks
task: longbench2_translate task: longbench2_translate
dataset_name: new_language_translation dataset_name: new_language_translation
Markdown is supported
0% Try again or attach a new file.
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or sign in to comment