download_test_data.py 838 Bytes
Newer Older
wuxk1's avatar
wuxk1 committed
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
import os
from pathlib import Path

import wget
import yaml
from tqdm import tqdm


def main():
    """Download the test images listed in ``test_data/images.yaml``.

    The config file is looked up in the ``test_data`` directory that sits
    next to this script's parent directory. It is expected to contain an
    ``images`` list; each entry (group) provides:

    * ``base_url`` -- a format string with a ``{filename}`` placeholder,
    * ``files`` -- the file names to download,
    * ``download_dir`` -- optional target directory (default ``"input"``);
      a relative value is resolved against the current working directory.

    Files that already exist at their target path are skipped, so the
    script can be re-run safely after a partial download.

    Raises:
        FileNotFoundError: if the config file does not exist.
        KeyError: if a group is missing ``base_url`` or ``files``.
    """
    config_path = Path(__file__).resolve().parent.parent / "test_data" / "images.yaml"
    with open(config_path, "r", encoding="utf-8") as f:
        # safe_load returns None for an empty document; treat that the same
        # as a config with no image groups instead of crashing on .get().
        config = yaml.safe_load(f) or {}
    # `images:` with no value parses to None, hence `or []` rather than a
    # .get() default (which only applies when the key is absent).
    for group in config.get("images") or []:
        base_url = group["base_url"]
        download_dir = group.get("download_dir", "input")
        for filename in tqdm(group["files"], desc="Downloading"):
            output_path = os.path.join(download_dir, filename)
            if os.path.exists(output_path):
                print(f"File {filename} already exists, skipping download.")
                continue
            # The downloader writes to `out` as given and does not create
            # missing directories, so make sure the parent exists first.
            # Using the parent of output_path (not just download_dir) also
            # covers file names that contain sub-directories.
            target_dir = os.path.dirname(output_path)
            if target_dir:
                os.makedirs(target_dir, exist_ok=True)
            print(f"Downloading {filename}...")
            full_url = base_url.format(filename=filename)
            wget.download(full_url, out=output_path)


# Run the download only when executed as a script, not when imported.
if __name__ == "__main__":
    main()