"test/git@developer.sourcefind.cn:zhaoyu6/sglang.git" did not exist on "de9217334b28f9a1d9e3ab7c9a249abd4f71730b"
Commit 79545adb authored by Benjamin Fattori
Browse files

Merge remote-tracking branch 'upstream/big-refactor' into seq2seq-refactor

parents eb7b9095 761f0087
import re import re
def wikitext_detokenizer(doc): def wikitext_detokenizer(doc):
string = doc["page"] string = doc["page"]
# contractions # contractions
......
group: group:
- wikitext_group - wikitext_group
task: wikitext_yaml task: default
dataset_path: EleutherAI/wikitext_document_level dataset_path: EleutherAI/wikitext_document_level
dataset_name: wikitext-2-raw-v1 dataset_name: wikitext-2-raw-v1
output_type: loglikelihood_rolling output_type: loglikelihood_rolling
...@@ -14,11 +14,5 @@ should_decontaminate: true ...@@ -14,11 +14,5 @@ should_decontaminate: true
doc_to_decontamination_query: "{{page}}" doc_to_decontamination_query: "{{page}}"
metric_list: metric_list:
- metric: word_perplexity - metric: word_perplexity
aggregation: weighted_perplexity
higher_is_better: false
- metric: byte_perplexity - metric: byte_perplexity
aggregation: weighted_perplexity
higher_is_better: false
- metric: bits_per_byte - metric: bits_per_byte
aggregation: bits_per_byte
higher_is_better: false
\ No newline at end of file
...@@ -157,22 +157,32 @@ def make_table(result_dict): ...@@ -157,22 +157,32 @@ def make_table(result_dict):
md_writer = MarkdownTableWriter() md_writer = MarkdownTableWriter()
latex_writer = LatexTableWriter() latex_writer = LatexTableWriter()
md_writer.headers = ["Task", "Version", "Metric", "Value", "", "Stderr"] md_writer.headers = ["Task", "Version", "Filter", "Metric", "Value", "", "Stderr"]
latex_writer.headers = ["Task", "Version", "Metric", "Value", "", "Stderr"] latex_writer.headers = [
"Task",
"Version",
"Filter",
"Metric",
"Value",
"",
"Stderr",
]
values = [] values = []
for k, dic in result_dict["results"].items(): for k, dic in result_dict["results"].items():
version = result_dict["versions"][k] version = result_dict["versions"][k]
for m, v in dic.items(): for (mf), v in dic.items():
m, _, f = mf.partition(",")
print(m, f)
if m.endswith("_stderr"): if m.endswith("_stderr"):
continue continue
if m + "_stderr" in dic: if m + "_stderr" + "," + f in dic:
se = dic[m + "_stderr"] se = dic[m + "_stderr" + "," + f]
values.append([k, version, m, "%.4f" % v, "±", "%.4f" % se]) values.append([k, version, f, m, "%.4f" % v, "±", "%.4f" % se])
else: else:
values.append([k, version, m, "%.4f" % v, "", ""]) values.append([k, version, f, m, "%.4f" % v, "", ""])
k = "" k = ""
version = "" version = ""
md_writer.value_matrix = values md_writer.value_matrix = values
......
...@@ -19,7 +19,9 @@ class MultiChoice: ...@@ -19,7 +19,9 @@ class MultiChoice:
for value in values.split(","): for value in values.split(","):
if len(fnmatch.filter(self.choices, value)) == 0: if len(fnmatch.filter(self.choices, value)) == 0:
eval_logger.warning("{} is not in task list.".format(value)) eval_logger.warning("{} is not in task list.".format(value))
# eval_logger.info(f"{choices} is this") eval_logger.info(f"Available tasks to choose:")
for choice in self.choices:
eval_logger.info(f" {choice}")
return True return True
......
Markdown is supported
0% Try again or attach a new file.
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or sign in to comment