# Task configuration for `pile_github`: rolling log-likelihood (perplexity-style)
# scoring over the `pile_github` configuration of `EleutherAI/the_pile`.

# Group(s) this task is listed under.
group:
  - pile
task: pile_github

# Dataset location and the named configuration to load.
dataset_path: EleutherAI/the_pile
dataset_name: pile_github

output_type: loglikelihood_rolling

# NOTE(review): the test split is mapped to the dataset's `train` split.
# Presumably intentional for this dataset layout - confirm.
test_split: train

# NOTE(review): left as an empty string; confirm the consumer still reads it.
template_aliases: ""

# No prompt/context is supplied: the scored target is the document's
# `text` field in full.
doc_to_text: ""
doc_to_target: "{{text}}"

# Decontamination is enabled and queries on the same `text` field.
should_decontaminate: true
doc_to_decontamination_query: "{{text}}"

# Reported metrics. All three are marked lower-is-better.
metric_list:
  - metric: word_perplexity
    aggregation: weighted_perplexity
    higher_is_better: false
  - metric: byte_perplexity
    aggregation: weighted_perplexity
    higher_is_better: false
  - metric: bits_per_byte
    aggregation: bits_per_byte
    higher_is_better: false