Skip to content
GitLab
Menu
Projects
Groups
Snippets
Loading...
Help
Help
Support
Community forum
Keyboard shortcuts
?
Submit feedback
Contribute to GitLab
Sign in / Register
Toggle navigation
Menu
Open sidebar
OpenDAS
MMPretrain-MMCV
Commits
dff2c686
Commit
dff2c686
authored
Sep 03, 2024
by
renzhc
Browse files
first commit
parent
8f9dd0ed
Pipeline
#1665
canceled with stages
Changes
1000
Pipelines
2
Hide whitespace changes
Inline
Side-by-side
Showing
20 changed files
with
384 additions
and
0 deletions
+384
-0
configs/_base_/models/itpn_hivit-base-p16.py
configs/_base_/models/itpn_hivit-base-p16.py
+33
-0
configs/_base_/models/levit-256-p16.py
configs/_base_/models/levit-256-p16.py
+26
-0
configs/_base_/models/mae_hivit-base-p16.py
configs/_base_/models/mae_hivit-base-p16.py
+24
-0
configs/_base_/models/mae_vit-base-p16.py
configs/_base_/models/mae_vit-base-p16.py
+23
-0
configs/_base_/models/mixmim/mixmim_base.py
configs/_base_/models/mixmim/mixmim_base.py
+20
-0
configs/_base_/models/mlp_mixer_base_patch16.py
configs/_base_/models/mlp_mixer_base_patch16.py
+25
-0
configs/_base_/models/mlp_mixer_large_patch16.py
configs/_base_/models/mlp_mixer_large_patch16.py
+25
-0
configs/_base_/models/mobilenet_v2_1x.py
configs/_base_/models/mobilenet_v2_1x.py
+12
-0
configs/_base_/models/mobilenet_v3/mobilenet_v3_large_imagenet.py
..._base_/models/mobilenet_v3/mobilenet_v3_large_imagenet.py
+16
-0
configs/_base_/models/mobilenet_v3/mobilenet_v3_small_050_imagenet.py
...e_/models/mobilenet_v3/mobilenet_v3_small_050_imagenet.py
+16
-0
configs/_base_/models/mobilenet_v3/mobilenet_v3_small_075_imagenet.py
...e_/models/mobilenet_v3/mobilenet_v3_small_075_imagenet.py
+16
-0
configs/_base_/models/mobilenet_v3/mobilenet_v3_small_cifar.py
...gs/_base_/models/mobilenet_v3/mobilenet_v3_small_cifar.py
+13
-0
configs/_base_/models/mobilenet_v3/mobilenet_v3_small_imagenet.py
..._base_/models/mobilenet_v3/mobilenet_v3_small_imagenet.py
+16
-0
configs/_base_/models/mobileone/mobileone_s0.py
configs/_base_/models/mobileone/mobileone_s0.py
+19
-0
configs/_base_/models/mobileone/mobileone_s1.py
configs/_base_/models/mobileone/mobileone_s1.py
+19
-0
configs/_base_/models/mobileone/mobileone_s2.py
configs/_base_/models/mobileone/mobileone_s2.py
+19
-0
configs/_base_/models/mobileone/mobileone_s3.py
configs/_base_/models/mobileone/mobileone_s3.py
+19
-0
configs/_base_/models/mobileone/mobileone_s4.py
configs/_base_/models/mobileone/mobileone_s4.py
+19
-0
configs/_base_/models/mobilevit/mobilevit_s.py
configs/_base_/models/mobilevit/mobilevit_s.py
+12
-0
configs/_base_/models/mobilevit/mobilevit_xs.py
configs/_base_/models/mobilevit/mobilevit_xs.py
+12
-0
No files found.
Too many changes to show.
To preserve performance only
1000 of 1000+
files are displayed.
Plain diff
Email patch
configs/_base_/models/itpn_hivit-base-p16.py
0 → 100644
View file @
dff2c686
# model settings
model
=
dict
(
type
=
'iTPN'
,
backbone
=
dict
(
type
=
'iTPNHiViT'
,
arch
=
'base'
,
reconstruction_type
=
'pixel'
,
mask_ratio
=
0.75
),
neck
=
dict
(
type
=
'iTPNPretrainDecoder'
,
num_patches
=
196
,
patch_size
=
16
,
in_chans
=
3
,
embed_dim
=
512
,
decoder_embed_dim
=
512
,
decoder_depth
=
6
,
decoder_num_heads
=
16
,
mlp_ratio
=
4.
,
reconstruction_type
=
'pixel'
,
# transformer pyramid
fpn_dim
=
256
,
fpn_depth
=
2
,
num_outs
=
3
,
),
head
=
dict
(
type
=
'MAEPretrainHead'
,
norm_pix
=
True
,
patch_size
=
16
,
loss
=
dict
(
type
=
'PixelReconstructionLoss'
,
criterion
=
'L2'
)),
init_cfg
=
[
dict
(
type
=
'Xavier'
,
layer
=
'Linear'
,
distribution
=
'uniform'
),
dict
(
type
=
'Constant'
,
layer
=
'LayerNorm'
,
val
=
1.0
,
bias
=
0.0
)
])
configs/_base_/models/levit-256-p16.py
0 → 100644
View file @
dff2c686
# model settings
model
=
dict
(
type
=
'ImageClassifier'
,
backbone
=
dict
(
type
=
'LeViT'
,
arch
=
'256'
,
img_size
=
224
,
patch_size
=
16
,
drop_path_rate
=
0
,
attn_ratio
=
2
,
mlp_ratio
=
2
,
out_indices
=
(
2
,
)),
neck
=
dict
(
type
=
'GlobalAveragePooling'
),
head
=
dict
(
type
=
'LeViTClsHead'
,
num_classes
=
1000
,
in_channels
=
512
,
distillation
=
True
,
loss
=
dict
(
type
=
'LabelSmoothLoss'
,
label_smooth_val
=
0.1
,
loss_weight
=
1.0
),
topk
=
(
1
,
5
),
),
train_cfg
=
dict
(
augments
=
[
dict
(
type
=
'Mixup'
,
alpha
=
0.8
),
dict
(
type
=
'CutMix'
,
alpha
=
1.0
),
]))
configs/_base_/models/mae_hivit-base-p16.py
0 → 100644
View file @
dff2c686
# model settings
model
=
dict
(
type
=
'MAE'
,
backbone
=
dict
(
type
=
'MAEHiViT'
,
patch_size
=
16
,
arch
=
'base'
,
mask_ratio
=
0.75
),
neck
=
dict
(
type
=
'MAEPretrainDecoder'
,
patch_size
=
16
,
in_chans
=
3
,
embed_dim
=
512
,
decoder_embed_dim
=
512
,
decoder_depth
=
6
,
decoder_num_heads
=
16
,
mlp_ratio
=
4.
,
),
head
=
dict
(
type
=
'MAEPretrainHead'
,
norm_pix
=
True
,
patch_size
=
16
,
loss
=
dict
(
type
=
'PixelReconstructionLoss'
,
criterion
=
'L2'
)),
init_cfg
=
[
dict
(
type
=
'Xavier'
,
layer
=
'Linear'
,
distribution
=
'uniform'
),
dict
(
type
=
'Constant'
,
layer
=
'LayerNorm'
,
val
=
1.0
,
bias
=
0.0
)
])
configs/_base_/models/mae_vit-base-p16.py
0 → 100644
View file @
dff2c686
# model settings
model
=
dict
(
type
=
'MAE'
,
backbone
=
dict
(
type
=
'MAEViT'
,
arch
=
'b'
,
patch_size
=
16
,
mask_ratio
=
0.75
),
neck
=
dict
(
type
=
'MAEPretrainDecoder'
,
patch_size
=
16
,
in_chans
=
3
,
embed_dim
=
768
,
decoder_embed_dim
=
512
,
decoder_depth
=
8
,
decoder_num_heads
=
16
,
mlp_ratio
=
4.
,
),
head
=
dict
(
type
=
'MAEPretrainHead'
,
norm_pix
=
True
,
patch_size
=
16
,
loss
=
dict
(
type
=
'PixelReconstructionLoss'
,
criterion
=
'L2'
)),
init_cfg
=
[
dict
(
type
=
'Xavier'
,
layer
=
'Linear'
,
distribution
=
'uniform'
),
dict
(
type
=
'Constant'
,
layer
=
'LayerNorm'
,
val
=
1.0
,
bias
=
0.0
)
])
configs/_base_/models/mixmim/mixmim_base.py
0 → 100644
View file @
dff2c686
model
=
dict
(
type
=
'ImageClassifier'
,
backbone
=
dict
(
type
=
'MixMIMTransformer'
,
arch
=
'B'
,
drop_rate
=
0.0
,
drop_path_rate
=
0.1
),
head
=
dict
(
type
=
'LinearClsHead'
,
num_classes
=
1000
,
in_channels
=
1024
,
init_cfg
=
None
,
loss
=
dict
(
type
=
'LabelSmoothLoss'
,
label_smooth_val
=
0.1
,
mode
=
'original'
),
cal_acc
=
False
),
init_cfg
=
[
dict
(
type
=
'TruncNormal'
,
layer
=
'Linear'
,
std
=
0.02
,
bias
=
0.
),
dict
(
type
=
'Constant'
,
layer
=
'LayerNorm'
,
val
=
1.
,
bias
=
0.
)
],
train_cfg
=
dict
(
augments
=
[
dict
(
type
=
'Mixup'
,
alpha
=
0.8
),
dict
(
type
=
'CutMix'
,
alpha
=
1.0
)
]))
configs/_base_/models/mlp_mixer_base_patch16.py
0 → 100644
View file @
dff2c686
# model settings
model
=
dict
(
type
=
'ImageClassifier'
,
backbone
=
dict
(
type
=
'MlpMixer'
,
arch
=
'b'
,
img_size
=
224
,
patch_size
=
16
,
drop_rate
=
0.1
,
init_cfg
=
[
dict
(
type
=
'Kaiming'
,
layer
=
'Conv2d'
,
mode
=
'fan_in'
,
nonlinearity
=
'linear'
)
]),
neck
=
dict
(
type
=
'GlobalAveragePooling'
,
dim
=
1
),
head
=
dict
(
type
=
'LinearClsHead'
,
num_classes
=
1000
,
in_channels
=
768
,
loss
=
dict
(
type
=
'CrossEntropyLoss'
,
loss_weight
=
1.0
),
topk
=
(
1
,
5
),
),
)
configs/_base_/models/mlp_mixer_large_patch16.py
0 → 100644
View file @
dff2c686
# model settings
model
=
dict
(
type
=
'ImageClassifier'
,
backbone
=
dict
(
type
=
'MlpMixer'
,
arch
=
'l'
,
img_size
=
224
,
patch_size
=
16
,
drop_rate
=
0.1
,
init_cfg
=
[
dict
(
type
=
'Kaiming'
,
layer
=
'Conv2d'
,
mode
=
'fan_in'
,
nonlinearity
=
'linear'
)
]),
neck
=
dict
(
type
=
'GlobalAveragePooling'
,
dim
=
1
),
head
=
dict
(
type
=
'LinearClsHead'
,
num_classes
=
1000
,
in_channels
=
1024
,
loss
=
dict
(
type
=
'CrossEntropyLoss'
,
loss_weight
=
1.0
),
topk
=
(
1
,
5
),
),
)
configs/_base_/models/mobilenet_v2_1x.py
0 → 100644
View file @
dff2c686
# model settings
model
=
dict
(
type
=
'ImageClassifier'
,
backbone
=
dict
(
type
=
'MobileNetV2'
,
widen_factor
=
1.0
),
neck
=
dict
(
type
=
'GlobalAveragePooling'
),
head
=
dict
(
type
=
'LinearClsHead'
,
num_classes
=
1000
,
in_channels
=
1280
,
loss
=
dict
(
type
=
'CrossEntropyLoss'
,
loss_weight
=
1.0
),
topk
=
(
1
,
5
),
))
configs/_base_/models/mobilenet_v3/mobilenet_v3_large_imagenet.py
0 → 100644
View file @
dff2c686
# model settings
model
=
dict
(
type
=
'ImageClassifier'
,
backbone
=
dict
(
type
=
'MobileNetV3'
,
arch
=
'large'
),
neck
=
dict
(
type
=
'GlobalAveragePooling'
),
head
=
dict
(
type
=
'StackedLinearClsHead'
,
num_classes
=
1000
,
in_channels
=
960
,
mid_channels
=
[
1280
],
dropout_rate
=
0.2
,
act_cfg
=
dict
(
type
=
'HSwish'
),
loss
=
dict
(
type
=
'CrossEntropyLoss'
,
loss_weight
=
1.0
),
init_cfg
=
dict
(
type
=
'Normal'
,
layer
=
'Linear'
,
mean
=
0.
,
std
=
0.01
,
bias
=
0.
),
topk
=
(
1
,
5
)))
configs/_base_/models/mobilenet_v3/mobilenet_v3_small_050_imagenet.py
0 → 100644
View file @
dff2c686
# model settings
model
=
dict
(
type
=
'ImageClassifier'
,
backbone
=
dict
(
type
=
'MobileNetV3'
,
arch
=
'small_050'
),
neck
=
dict
(
type
=
'GlobalAveragePooling'
),
head
=
dict
(
type
=
'StackedLinearClsHead'
,
num_classes
=
1000
,
in_channels
=
288
,
mid_channels
=
[
1024
],
dropout_rate
=
0.2
,
act_cfg
=
dict
(
type
=
'HSwish'
),
loss
=
dict
(
type
=
'CrossEntropyLoss'
,
loss_weight
=
1.0
),
init_cfg
=
dict
(
type
=
'Normal'
,
layer
=
'Linear'
,
mean
=
0.
,
std
=
0.01
,
bias
=
0.
),
topk
=
(
1
,
5
)))
configs/_base_/models/mobilenet_v3/mobilenet_v3_small_075_imagenet.py
0 → 100644
View file @
dff2c686
# model settings
model
=
dict
(
type
=
'ImageClassifier'
,
backbone
=
dict
(
type
=
'MobileNetV3'
,
arch
=
'small_075'
),
neck
=
dict
(
type
=
'GlobalAveragePooling'
),
head
=
dict
(
type
=
'StackedLinearClsHead'
,
num_classes
=
1000
,
in_channels
=
432
,
mid_channels
=
[
1024
],
dropout_rate
=
0.2
,
act_cfg
=
dict
(
type
=
'HSwish'
),
loss
=
dict
(
type
=
'CrossEntropyLoss'
,
loss_weight
=
1.0
),
init_cfg
=
dict
(
type
=
'Normal'
,
layer
=
'Linear'
,
mean
=
0.
,
std
=
0.01
,
bias
=
0.
),
topk
=
(
1
,
5
)))
configs/_base_/models/mobilenet_v3/mobilenet_v3_small_cifar.py
0 → 100644
View file @
dff2c686
# model settings
model
=
dict
(
type
=
'ImageClassifier'
,
backbone
=
dict
(
type
=
'MobileNetV3'
,
arch
=
'small'
),
neck
=
dict
(
type
=
'GlobalAveragePooling'
),
head
=
dict
(
type
=
'StackedLinearClsHead'
,
num_classes
=
10
,
in_channels
=
576
,
mid_channels
=
[
1280
],
act_cfg
=
dict
(
type
=
'HSwish'
),
loss
=
dict
(
type
=
'CrossEntropyLoss'
,
loss_weight
=
1.0
),
topk
=
(
1
,
5
)))
configs/_base_/models/mobilenet_v3/mobilenet_v3_small_imagenet.py
0 → 100644
View file @
dff2c686
# model settings
model
=
dict
(
type
=
'ImageClassifier'
,
backbone
=
dict
(
type
=
'MobileNetV3'
,
arch
=
'small'
),
neck
=
dict
(
type
=
'GlobalAveragePooling'
),
head
=
dict
(
type
=
'StackedLinearClsHead'
,
num_classes
=
1000
,
in_channels
=
576
,
mid_channels
=
[
1024
],
dropout_rate
=
0.2
,
act_cfg
=
dict
(
type
=
'HSwish'
),
loss
=
dict
(
type
=
'CrossEntropyLoss'
,
loss_weight
=
1.0
),
init_cfg
=
dict
(
type
=
'Normal'
,
layer
=
'Linear'
,
mean
=
0.
,
std
=
0.01
,
bias
=
0.
),
topk
=
(
1
,
5
)))
configs/_base_/models/mobileone/mobileone_s0.py
0 → 100644
View file @
dff2c686
model
=
dict
(
type
=
'ImageClassifier'
,
backbone
=
dict
(
type
=
'MobileOne'
,
arch
=
's0'
,
out_indices
=
(
3
,
),
),
neck
=
dict
(
type
=
'GlobalAveragePooling'
),
head
=
dict
(
type
=
'LinearClsHead'
,
num_classes
=
1000
,
in_channels
=
1024
,
loss
=
dict
(
type
=
'LabelSmoothLoss'
,
label_smooth_val
=
0.1
,
mode
=
'original'
,
),
topk
=
(
1
,
5
),
))
configs/_base_/models/mobileone/mobileone_s1.py
0 → 100644
View file @
dff2c686
model
=
dict
(
type
=
'ImageClassifier'
,
backbone
=
dict
(
type
=
'MobileOne'
,
arch
=
's1'
,
out_indices
=
(
3
,
),
),
neck
=
dict
(
type
=
'GlobalAveragePooling'
),
head
=
dict
(
type
=
'LinearClsHead'
,
num_classes
=
1000
,
in_channels
=
1280
,
loss
=
dict
(
type
=
'LabelSmoothLoss'
,
label_smooth_val
=
0.1
,
mode
=
'original'
,
),
topk
=
(
1
,
5
),
))
configs/_base_/models/mobileone/mobileone_s2.py
0 → 100644
View file @
dff2c686
model
=
dict
(
type
=
'ImageClassifier'
,
backbone
=
dict
(
type
=
'MobileOne'
,
arch
=
's2'
,
out_indices
=
(
3
,
),
),
neck
=
dict
(
type
=
'GlobalAveragePooling'
),
head
=
dict
(
type
=
'LinearClsHead'
,
num_classes
=
1000
,
in_channels
=
2048
,
loss
=
dict
(
type
=
'LabelSmoothLoss'
,
label_smooth_val
=
0.1
,
mode
=
'original'
,
),
topk
=
(
1
,
5
),
))
configs/_base_/models/mobileone/mobileone_s3.py
0 → 100644
View file @
dff2c686
model
=
dict
(
type
=
'ImageClassifier'
,
backbone
=
dict
(
type
=
'MobileOne'
,
arch
=
's3'
,
out_indices
=
(
3
,
),
),
neck
=
dict
(
type
=
'GlobalAveragePooling'
),
head
=
dict
(
type
=
'LinearClsHead'
,
num_classes
=
1000
,
in_channels
=
2048
,
loss
=
dict
(
type
=
'LabelSmoothLoss'
,
label_smooth_val
=
0.1
,
mode
=
'original'
,
),
topk
=
(
1
,
5
),
))
configs/_base_/models/mobileone/mobileone_s4.py
0 → 100644
View file @
dff2c686
model
=
dict
(
type
=
'ImageClassifier'
,
backbone
=
dict
(
type
=
'MobileOne'
,
arch
=
's4'
,
out_indices
=
(
3
,
),
),
neck
=
dict
(
type
=
'GlobalAveragePooling'
),
head
=
dict
(
type
=
'LinearClsHead'
,
num_classes
=
1000
,
in_channels
=
2048
,
loss
=
dict
(
type
=
'LabelSmoothLoss'
,
label_smooth_val
=
0.1
,
mode
=
'original'
,
),
topk
=
(
1
,
5
),
))
configs/_base_/models/mobilevit/mobilevit_s.py
0 → 100644
View file @
dff2c686
# model settings
model
=
dict
(
type
=
'ImageClassifier'
,
backbone
=
dict
(
type
=
'MobileViT'
,
arch
=
'small'
),
neck
=
dict
(
type
=
'GlobalAveragePooling'
),
head
=
dict
(
type
=
'LinearClsHead'
,
num_classes
=
1000
,
in_channels
=
640
,
loss
=
dict
(
type
=
'CrossEntropyLoss'
,
loss_weight
=
1.0
),
topk
=
(
1
,
5
),
))
configs/_base_/models/mobilevit/mobilevit_xs.py
0 → 100644
View file @
dff2c686
# model settings
model
=
dict
(
type
=
'ImageClassifier'
,
backbone
=
dict
(
type
=
'MobileViT'
,
arch
=
'x_small'
),
neck
=
dict
(
type
=
'GlobalAveragePooling'
),
head
=
dict
(
type
=
'LinearClsHead'
,
num_classes
=
1000
,
in_channels
=
384
,
loss
=
dict
(
type
=
'CrossEntropyLoss'
,
loss_weight
=
1.0
),
topk
=
(
1
,
5
),
))
Prev
1
…
5
6
7
8
9
10
11
12
13
…
50
Next
Write
Preview
Markdown
is supported
0%
Try again
or
attach a new file
.
Attach a file
Cancel
You are about to add
0
people
to the discussion. Proceed with caution.
Finish editing this message first!
Cancel
Please
register
or
sign in
to comment