"vscode:/vscode.git/clone" did not exist on "bd408076e8d06246d5a88bbb112d02af9be43fa2"
Commit b474a00a authored by quyuan's avatar quyuan
Browse files

update ci

parent 8e21c09d
import zipfile import zipfile
import os import os
import shutil import shutil
import json
import markdown_calculate
code_path = os.environ.get('GITHUB_WORKSPACE') code_path = os.environ.get('GITHUB_WORKSPACE')
#code_path = "/home/quyuan/actions-runner/_work/Magic-PDF/Magic-PDF.bk" #code_path = "/home/quyuan/actions-runner/_work/Magic-PDF/Magic-PDF.bk"
#评测集存放路径 #评测集存放路径
...@@ -34,8 +36,10 @@ def calculate_score(): ...@@ -34,8 +36,10 @@ def calculate_score():
os.system(cmd) os.system(cmd)
cmd = "cd %s && export PYTHONPATH=. && python tools/clean_photo.py --tool_name magicpdf --download_dir %s" % (code_path, data_path) cmd = "cd %s && export PYTHONPATH=. && python tools/clean_photo.py --tool_name magicpdf --download_dir %s" % (code_path, data_path)
os.system(cmd) os.system(cmd)
cmd = "cd %s && export PYTHONPATH=. && python tools/markdown_calculate.py --tool_name magicpdf --download_dir %s --results %s" % (code_path, data_path, os.path.join(data_path, "result.json")) score = markdown_calculate.Scoring()
os.system(cmd) score.calculate_similarity_total("magicpdf", file_types, os.path.join(data_path, "result.json"))
res = score.summary_scores()
return res
def extrat_zip(zip_file_path, extract_to_path): def extrat_zip(zip_file_path, extract_to_path):
...@@ -49,9 +53,24 @@ def extrat_zip(zip_file_path, extract_to_path): ...@@ -49,9 +53,24 @@ def extrat_zip(zip_file_path, extract_to_path):
def ci_ben(): def ci_ben():
fr = open(os.path.join(pdf_dev_path, "ci", "result.json"), "r").read() fr = open(os.path.join(pdf_dev_path, "ci", "result.json"), "r").read()
lines = fr.readlines()
last_line = lines[-1].strip()
if __name__ == "__main__": last_score = json.loads(last_line)
print ("last_score:", last_score)
last_simscore = last_score["average_sim_score"]
last_editdistance = last_score["average_edit_distance"]
last_bleu = last_score["average_bleu_score"]
extrat_zip(os.path.join(pdf_dev_path, 'output.zip'), os.path.join(pdf_dev_path)) extrat_zip(os.path.join(pdf_dev_path, 'output.zip'), os.path.join(pdf_dev_path))
test_cli() test_cli()
calculate_score() now_score = calculate_score()
print ("now_score:", now_score)
now_simscore = now_score["average_sim_score"]
now_editdistance = now_score["average_edit_distance"]
now_bleu = now_score["average_bleu_score"]
assert last_simscore <= now_simscore
assert last_editdistance <= now_editdistance
assert last_bleu <= now_bleu
if __name__ == "__main__":
ci_ben()
...@@ -116,7 +116,7 @@ class Scoring: ...@@ -116,7 +116,7 @@ class Scoring:
over_all_dict["average_bleu_score"] = average_bleu_score over_all_dict["average_bleu_score"] = average_bleu_score
over_all_dict["average_sim_score"] = average_sim_score over_all_dict["average_sim_score"] = average_sim_score
fw.write(json.dumps(over_all_dict, ensure_ascii=False) + "\n") fw.write(json.dumps(over_all_dict, ensure_ascii=False) + "\n")
return over_all_dict
def calculate_similarity_total(self, tool_type, file_types, download_dir): def calculate_similarity_total(self, tool_type, file_types, download_dir):
for file_type in file_types: for file_type in file_types:
......
Markdown is supported
0% or .
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or to comment