"app/vscode:/vscode.git/clone" did not exist on "3b6a9154dde490da393630e7790136e7f516d3c1"
get_ci_error_statistics.py 10.2 KB
Newer Older
1
2
3
4
5
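"""Collect error statistics from the test reports of a `transformers` GitHub Actions workflow run.

The script downloads the artifacts of a workflow run, extracts the failed tests and their
errors, and writes the aggregated results (JSON files and GitHub-flavored Markdown tables)
to the output directory. A minimal invocation (placeholders, not real values):

    python get_ci_error_statistics.py --workflow_run_id <RUN_ID> --output_dir ci_reports --token <GITHUB_TOKEN>
"""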
import argparse
import json
import math
import os
import time
import traceback
import zipfile
from collections import Counter

import requests


def get_job_links(workflow_run_id, token=None):
    """Extract job names and their job links in a GitHub Actions workflow run"""

    headers = None
    if token is not None:
        headers = {"Accept": "application/vnd.github+json", "Authorization": f"Bearer {token}"}

    url = f"https://api.github.com/repos/huggingface/transformers/actions/runs/{workflow_run_id}/jobs?per_page=100"
    result = requests.get(url, headers=headers).json()
    job_links = {}

    try:
        job_links.update({job["name"]: job["html_url"] for job in result["jobs"]})
        pages_to_iterate_over = math.ceil((result["total_count"] - 100) / 100)

        for i in range(pages_to_iterate_over):
            result = requests.get(url + f"&page={i + 2}", headers=headers).json()
            job_links.update({job["name"]: job["html_url"] for job in result["jobs"]})

        return job_links
    except Exception:
        print(f"Unknown error, could not fetch links:\n{traceback.format_exc()}")

    return {}


def get_artifacts_links(workflow_run_id, token=None):
    """Get all artifact links from a workflow run"""

    headers = None
    if token is not None:
        headers = {"Accept": "application/vnd.github+json", "Authorization": f"Bearer {token}"}

    url = f"https://api.github.com/repos/huggingface/transformers/actions/runs/{worflow_run_id}/artifacts?per_page=100"
    result = requests.get(url, headers=headers).json()
    artifacts = {}

    try:
        artifacts.update({artifact["name"]: artifact["archive_download_url"] for artifact in result["artifacts"]})
        pages_to_iterate_over = math.ceil((result["total_count"] - 100) / 100)

        for i in range(pages_to_iterate_over):
            result = requests.get(url + f"&page={i + 2}", headers=headers).json()
            artifacts.update({artifact["name"]: artifact["archive_download_url"] for artifact in result["artifacts"]})

        return artifacts
    except Exception:
        print(f"Unknown error, could not fetch links:\n{traceback.format_exc()}")

    return {}


def download_artifact(artifact_name, artifact_url, output_dir, token):
    """Download a GitHub Action artifact from a URL.

    The URL is of the form `https://api.github.com/repos/huggingface/transformers/actions/artifacts/{ARTIFACT_ID}/zip`,
    but it can't be used to download directly. We need to get a redirect URL first.
    See https://docs.github.com/en/rest/actions/artifacts#download-an-artifact
    """
    headers = None
    if token is not None:
        headers = {"Accept": "application/vnd.github+json", "Authorization": f"Bearer {token}"}

    result = requests.get(artifact_url, headers=headers, allow_redirects=False)
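    # The artifact endpoint answers with a redirect; the `Location` header holds the actual download URL.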
    download_url = result.headers["Location"]
    response = requests.get(download_url, allow_redirects=True)
    file_path = os.path.join(output_dir, f"{artifact_name}.zip")
    with open(file_path, "wb") as fp:
        fp.write(response.content)


def get_errors_from_single_artifact(artifact_zip_path, job_links=None):
    """Extract errors from a downloaded artifact (in .zip format)"""
    errors = []
    failed_tests = []
    job_name = None

    with zipfile.ZipFile(artifact_zip_path) as z:
        for filename in z.namelist():
            # Zip entries that are directories end with "/"; keep only regular files.
            if not filename.endswith("/"):
                # read the file
                if filename in ["failures_line.txt", "summary_short.txt", "job_name.txt"]:
                    with z.open(filename) as f:
                        for line in f:
                            line = line.decode("UTF-8").strip()
                            if filename == "failures_line.txt":
                                try:
                                    # `error_line` is the place where `error` occurs
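                                    # (assumed report format) e.g. `tests/test_x.py:42: AssertionError: ...`
                                    # gives error_line `tests/test_x.py:42` and error `AssertionError: ...`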
                                    error_line = line[: line.index(": ")]
                                    error = line[line.index(": ") + len(": ") :]
                                    errors.append([error_line, error])
                                except Exception:
                                    # skip un-related lines
                                    pass
                            elif filename == "summary_short.txt" and line.startswith("FAILED "):
                                # `test` is the test method that failed
                                test = line[len("FAILED ") :]
                                failed_tests.append(test)
                            elif filename == "job_name.txt":
                                job_name = line

    if len(errors) != len(failed_tests):
        raise ValueError(
            f"`errors` and `failed_tests` should have the same number of elements. Got {len(errors)} for `errors` "
            f"and {len(failed_tests)} for `failed_tests` instead. The test reports in {artifact_zip_path} have some"
            " problem."
        )

    job_link = None
    if job_name and job_links:
        job_link = job_links.get(job_name, None)

    # A list with elements of the form [error_line, error, failed_test, job_link]
    result = [x + [y] + [job_link] for x, y in zip(errors, failed_tests)]

    return result


def get_all_errors(artifact_dir, job_links=None):
    """Extract errors from all artifact files"""

    errors = []

    paths = [os.path.join(artifact_dir, p) for p in os.listdir(artifact_dir) if p.endswith(".zip")]
    for p in paths:
        errors.extend(get_errors_from_single_artifact(p, job_links=job_links))

    return errors


def reduce_by_error(logs, error_filter=None):
    """count each error"""

    counter = Counter()
    counter.update([x[1] for x in logs])
    counts = counter.most_common()
    r = {}
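    # Map each error to its total count and the (failed test, error line) pairs in which it occurred.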
    for error, count in counts:
        if error_filter is None or error not in error_filter:
            r[error] = {"count": count, "failed_tests": [(x[2], x[0]) for x in logs if x[1] == error]}

    r = dict(sorted(r.items(), key=lambda item: item[1]["count"], reverse=True))
    return r


def get_model(test):
    """Get the model name from a test method"""
    test = test.split("::")[0]
    if test.startswith("tests/models/"):
        test = test.split("/")[2]
    else:
        test = None

    return test


def reduce_by_model(logs, error_filter=None):
    """count each error per model"""

    logs = [(x[0], x[1], get_model(x[2])) for x in logs]
    logs = [x for x in logs if x[2] is not None]
    tests = {x[2] for x in logs}

    r = {}
    for test in tests:
        counter = Counter()
        # count by errors in `test`
        counter.update([x[1] for x in logs if x[2] == test])
        counts = counter.most_common()
        error_counts = {error: count for error, count in counts if (error_filter is None or error not in error_filter)}
        n_errors = sum(error_counts.values())
        if n_errors > 0:
            r[test] = {"count": n_errors, "errors": error_counts}

    r = dict(sorted(r.items(), key=lambda item: item[1]["count"], reverse=True))
    return r


def make_github_table(reduced_by_error):
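    """Render `reduced_by_error` as a Markdown table: count, truncated error message, and an empty status column."""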
    header = "| no. | error | status |"
    sep = "|-:|:-|:-|"
    lines = [header, sep]
    for error in reduced_by_error:
        count = reduced_by_error[error]["count"]
        line = f"| {count} | {error[:100]} |  |"
        lines.append(line)

    return "\n".join(lines)


def make_github_table_per_model(reduced_by_model):
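    """Render `reduced_by_model` as a Markdown table: per model, the total error count and its most frequent error."""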
    header = "| model | no. of errors | major error | count |"
    sep = "|-:|-:|-:|-:|"
    lines = [header, sep]
    for model in reduced_by_model:
        count = reduced_by_model[model]["count"]
        error, _count = list(reduced_by_model[model]["errors"].items())[0]
        line = f"| {model} | {count} | {error[:60]} | {_count} |"
        lines.append(line)

    return "\n".join(lines)


if __name__ == "__main__":
    parser = argparse.ArgumentParser()
    # Required parameters
    parser.add_argument("--workflow_run_id", type=str, required=True, help="A GitHub Actions workflow run id.")
    parser.add_argument(
        "--output_dir",
        type=str,
        required=True,
        help="Where to store the downloaded artifacts and other result files.",
    )
    parser.add_argument("--token", default=None, type=str, help="A token that has actions:read permission.")
    args = parser.parse_args()

    os.makedirs(args.output_dir, exist_ok=True)

    _job_links = get_job_links(args.workflow_run_id, token=args.token)
    job_links = {}
    # To deal with `workflow_call` event, where a job name is the combination of the job names in the caller and callee.
    # For example, `PyTorch 1.11 / Model tests (models/albert, single-gpu)`.
    if _job_links:
        for k, v in _job_links.items():
            # This is how GitHub Actions combines job names.
            if " / " in k:
                index = k.find(" / ")
                k = k[index + len(" / ") :]
            job_links[k] = v
    with open(os.path.join(args.output_dir, "job_links.json"), "w", encoding="UTF-8") as fp:
        json.dump(job_links, fp, ensure_ascii=False, indent=4)

    artifacts = get_artifacts_links(args.workflow_run_id, token=args.token)
    with open(os.path.join(args.output_dir, "artifacts.json"), "w", encoding="UTF-8") as fp:
        json.dump(artifacts, fp, ensure_ascii=False, indent=4)

    for idx, (name, url) in enumerate(artifacts.items()):
        download_artifact(name, url, args.output_dir, args.token)
        # Be gentle to GitHub
        time.sleep(1)

    errors = get_all_errors(args.output_dir, job_links=job_links)

    # Each entry of `errors` has the form [error_line, error, failed_test, job_link]; `e[1]` is the error message.
    counter = Counter()
    counter.update([e[1] for e in errors])

    # print the top 30 most common test errors
    most_common = counter.most_common(30)
    for item in most_common:
        print(item)

    with open(os.path.join(args.output_dir, "errors.json"), "w", encoding="UTF-8") as fp:
        json.dump(errors, fp, ensure_ascii=False, indent=4)

    reduced_by_error = reduce_by_error(errors)
    reduced_by_model = reduce_by_model(errors)

    s1 = make_github_table(reduced_by_error)
    s2 = make_github_table_per_model(reduced_by_model)

    with open(os.path.join(args.output_dir, "reduced_by_error.txt"), "w", encoding="UTF-8") as fp:
        fp.write(s1)
    with open(os.path.join(args.output_dir, "reduced_by_model.txt"), "w", encoding="UTF-8") as fp:
        fp.write(s2)