# collect_model_urls.py
import pathlib
import re
import sys

# Matches links to ``.pth`` files under https://download.pytorch.org/models/.
# The non-greedy ``.*?`` stops at the first ".pth", so several URLs on the same
# line are reported as separate matches.
MODEL_URL_PATTERN = re.compile(r"https://download[.]pytorch[.]org/models/.*?[.]pth")


def main(root):
    """Print the model URLs found in the Python files below ``root``.

    The directory tree is searched recursively. Only regular files with a
    ``.py`` suffix are read, and files whose name starts with an underscore
    are skipped. Each file is scanned line by line for
    ``MODEL_URL_PATTERN``; the unique matches are printed to stdout in sorted
    order, one per line.

    Args:
        root: Path of the directory to search.
    """
    model_urls = set()
    for path in pathlib.Path(root).glob("**/*"):
        if path.name.startswith("_") or path.suffix != ".py":
            continue
        # The glob also yields directories; one named like ``foo.py`` would
        # make ``open`` fail, so only regular files are read.
        if not path.is_file():
            continue

        # Decode explicitly so the result does not depend on the platform's
        # default encoding. The URLs are plain ASCII, so replacing undecodable
        # bytes elsewhere in a file cannot hide or alter a match.
        with open(path, "r", encoding="utf-8", errors="replace") as file:
            for line in file:
                model_urls.update(MODEL_URL_PATTERN.findall(line))

    print("\n".join(sorted(model_urls)))


if __name__ == "__main__":
    # Exit with a short usage message instead of an IndexError traceback when
    # the root directory argument is missing. Extra arguments are ignored.
    if len(sys.argv) < 2:
        sys.exit("usage: {} ROOT".format(sys.argv[0]))
    main(sys.argv[1])