metafile.yml 3.09 KB
Newer Older
renzhc's avatar
renzhc committed
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
# Collection shared by the VAN entries in this file; each item under
# `Models` points back to it through its `In Collection` key.
Collections:
  - Name: Visual-Attention-Network
    # Properties common to every model in the collection.
    Metadata:
      Training Data: ImageNet-1k
      Training Techniques:
        - AdamW
        - Weight Decay
      Architecture:
        - Visual Attention Network
    # Publication that introduces the architecture.
    Paper:
      URL: https://arxiv.org/abs/2202.09741
      Title: Visual Attention Network
    README: configs/van/README.md
    # Backbone implementation, pinned to the release named in `Version`.
    Code:
      URL: https://github.com/open-mmlab/mmpretrain/blob/v0.23.0/mmcls/models/backbones/van.py
      Version: v0.23.0

# One entry per released checkpoint; every entry belongs to the
# Visual-Attention-Network collection.
Models:
  # Tiny variant; `Converted From` records where the checkpoint came from.
  - Name: van-tiny_3rdparty_in1k
    Metadata:
      Parameters: 4110000  # 4.11M
      FLOPs: 880000000  # 0.88G
    In Collection: Visual-Attention-Network
    Results:
      - Dataset: ImageNet-1k
        Metrics:
          Top 1 Accuracy: 75.41
          Top 5 Accuracy: 93.02
        Task: Image Classification
    Weights: https://download.openmmlab.com/mmclassification/v0/van/van-tiny_8xb128_in1k_20220501-385941af.pth
    Config: configs/van/van-tiny_8xb128_in1k.py
    # Original code repository and weight file used for the conversion.
    Converted From:
      Code: https://github.com/Visual-Attention-Network/VAN-Classification
      Weights: https://cloud.tsinghua.edu.cn/f/aada2242a16245d6a561/?dl=1
  # Small variant; `Converted From` records where the checkpoint came from.
  - Name: van-small_3rdparty_in1k
    Metadata:
      Parameters: 13860000  # 13.86M
      FLOPs: 2520000000  # 2.52G
    In Collection: Visual-Attention-Network
    # Sequence items sit two spaces under their key, matching the other
    # sequences in this file.
    Results:
      - Dataset: ImageNet-1k
        Metrics:
          Top 1 Accuracy: 81.01
          Top 5 Accuracy: 95.63
        Task: Image Classification
    Weights: https://download.openmmlab.com/mmclassification/v0/van/van-small_8xb128_in1k_20220501-17bc91aa.pth
    Config: configs/van/van-small_8xb128_in1k.py
    # Original code repository and weight file used for the conversion.
    Converted From:
      Code: https://github.com/Visual-Attention-Network/VAN-Classification
      Weights: https://cloud.tsinghua.edu.cn/f/dd3eb73692f74a2499c9/?dl=1
  # Base variant; `Converted From` records where the checkpoint came from.
  - Name: van-base_3rdparty_in1k
    Metadata:
      Parameters: 26580000  # 26.58M
      FLOPs: 5030000000  # 5.03G
    In Collection: Visual-Attention-Network
    # Sequence items sit two spaces under their key, matching the other
    # sequences in this file.
    Results:
      - Dataset: ImageNet-1k
        Metrics:
          Top 1 Accuracy: 82.80
          Top 5 Accuracy: 96.21
        Task: Image Classification
    Weights: https://download.openmmlab.com/mmclassification/v0/van/van-base_8xb128_in1k_20220501-6a4cc31b.pth
    Config: configs/van/van-base_8xb128_in1k.py
    # Original code repository and weight file used for the conversion.
    Converted From:
      Code: https://github.com/Visual-Attention-Network/VAN-Classification
      Weights: https://cloud.tsinghua.edu.cn/f/58e7acceaf334ecdba89/?dl=1
  # Large variant; `Converted From` records where the checkpoint came from.
  - Name: van-large_3rdparty_in1k
    Metadata:
      Parameters: 44770000  # 44.77M
      FLOPs: 8990000000  # 8.99G
    In Collection: Visual-Attention-Network
    # Sequence items sit two spaces under their key, matching the other
    # sequences in this file.
    Results:
      - Dataset: ImageNet-1k
        Metrics:
          Top 1 Accuracy: 83.86
          Top 5 Accuracy: 96.73
        Task: Image Classification
    Weights: https://download.openmmlab.com/mmclassification/v0/van/van-large_8xb128_in1k_20220501-f212ba21.pth
    Config: configs/van/van-large_8xb128_in1k.py
    # Original code repository and weight file used for the conversion.
    Converted From:
      Code: https://github.com/Visual-Attention-Network/VAN-Classification
      Weights: https://cloud.tsinghua.edu.cn/f/0201745f6920482490a0/?dl=1