Skip to content
GitLab
Menu
Projects
Groups
Snippets
Loading...
Help
Help
Support
Community forum
Keyboard shortcuts
?
Submit feedback
Contribute to GitLab
Sign in / Register
Toggle navigation
Menu
Open sidebar
ModelZoo
InternVL3_pytorch
Commits
26e59280
"web/vscode:/vscode.git/clone" did not exist on "a1f12e370dc694a26528c382e81b2e5e297934e0"
Commit
26e59280
authored
Apr 24, 2025
by
wanglch
Browse files
Initial commit
parents
Pipeline
#2674
failed with stages
in 0 seconds
Changes
841
Pipelines
1
Hide whitespace changes
Inline
Side-by-side
Showing
20 changed files
with
737 additions
and
0 deletions
+737
-0
classification/configs/linear_probing/linear_probing_intern_vit_6b_224px_in1k_224to448_64gpu_imagenet_r.yaml
...g_intern_vit_6b_224px_in1k_224to448_64gpu_imagenet_r.yaml
+37
-0
classification/configs/linear_probing/linear_probing_intern_vit_6b_224px_in1k_224to448_64gpu_imagenet_real.yaml
...ntern_vit_6b_224px_in1k_224to448_64gpu_imagenet_real.yaml
+37
-0
classification/configs/linear_probing/linear_probing_intern_vit_6b_224px_in1k_224to448_64gpu_imagenet_sketch.yaml
...ern_vit_6b_224px_in1k_224to448_64gpu_imagenet_sketch.yaml
+37
-0
classification/configs/linear_probing/linear_probing_intern_vit_6b_224px_in1k_224to448_64gpu_imagenetv2.yaml
...g_intern_vit_6b_224px_in1k_224to448_64gpu_imagenetv2.yaml
+37
-0
classification/configs/linear_probing/linear_probing_intern_vit_6b_448px_v1_0_in1k_448_64gpu.yaml
...near_probing_intern_vit_6b_448px_v1_0_in1k_448_64gpu.yaml
+36
-0
classification/configs/linear_probing/linear_probing_intern_vit_6b_448px_v1_0_in1k_448_64gpu_imagenet_a.yaml
...g_intern_vit_6b_448px_v1_0_in1k_448_64gpu_imagenet_a.yaml
+37
-0
classification/configs/linear_probing/linear_probing_intern_vit_6b_448px_v1_0_in1k_448_64gpu_imagenet_r.yaml
...g_intern_vit_6b_448px_v1_0_in1k_448_64gpu_imagenet_r.yaml
+37
-0
classification/configs/linear_probing/linear_probing_intern_vit_6b_448px_v1_0_in1k_448_64gpu_imagenet_real.yaml
...ntern_vit_6b_448px_v1_0_in1k_448_64gpu_imagenet_real.yaml
+37
-0
classification/configs/linear_probing/linear_probing_intern_vit_6b_448px_v1_0_in1k_448_64gpu_imagenet_sketch.yaml
...ern_vit_6b_448px_v1_0_in1k_448_64gpu_imagenet_sketch.yaml
+37
-0
classification/configs/linear_probing/linear_probing_intern_vit_6b_448px_v1_0_in1k_448_64gpu_imagenetv2.yaml
...g_intern_vit_6b_448px_v1_0_in1k_448_64gpu_imagenetv2.yaml
+37
-0
classification/configs/linear_probing/linear_probing_intern_vit_6b_448px_v1_2_in1k_448_64gpu.yaml
...near_probing_intern_vit_6b_448px_v1_2_in1k_448_64gpu.yaml
+36
-0
classification/configs/linear_probing/linear_probing_intern_vit_6b_448px_v1_2_in1k_448_64gpu_imagenet_a.yaml
...g_intern_vit_6b_448px_v1_2_in1k_448_64gpu_imagenet_a.yaml
+37
-0
classification/configs/linear_probing/linear_probing_intern_vit_6b_448px_v1_2_in1k_448_64gpu_imagenet_r.yaml
...g_intern_vit_6b_448px_v1_2_in1k_448_64gpu_imagenet_r.yaml
+37
-0
classification/configs/linear_probing/linear_probing_intern_vit_6b_448px_v1_2_in1k_448_64gpu_imagenet_real.yaml
...ntern_vit_6b_448px_v1_2_in1k_448_64gpu_imagenet_real.yaml
+37
-0
classification/configs/linear_probing/linear_probing_intern_vit_6b_448px_v1_2_in1k_448_64gpu_imagenet_sketch.yaml
...ern_vit_6b_448px_v1_2_in1k_448_64gpu_imagenet_sketch.yaml
+37
-0
classification/configs/linear_probing/linear_probing_intern_vit_6b_448px_v1_2_in1k_448_64gpu_imagenetv2.yaml
...g_intern_vit_6b_448px_v1_2_in1k_448_64gpu_imagenetv2.yaml
+37
-0
classification/configs/linear_probing/linear_probing_intern_vit_6b_448px_v1_5_in1k_448_64gpu.yaml
...near_probing_intern_vit_6b_448px_v1_5_in1k_448_64gpu.yaml
+36
-0
classification/configs/linear_probing/linear_probing_intern_vit_6b_448px_v1_5_in1k_448_64gpu_imagenet_a.yaml
...g_intern_vit_6b_448px_v1_5_in1k_448_64gpu_imagenet_a.yaml
+37
-0
classification/configs/linear_probing/linear_probing_intern_vit_6b_448px_v1_5_in1k_448_64gpu_imagenet_r.yaml
...g_intern_vit_6b_448px_v1_5_in1k_448_64gpu_imagenet_r.yaml
+37
-0
classification/configs/linear_probing/linear_probing_intern_vit_6b_448px_v1_5_in1k_448_64gpu_imagenet_real.yaml
...ntern_vit_6b_448px_v1_5_in1k_448_64gpu_imagenet_real.yaml
+37
-0
No files found.
classification/configs/linear_probing/linear_probing_intern_vit_6b_224px_in1k_224to448_64gpu_imagenet_r.yaml
0 → 100644
View file @
26e59280
DATA
:
IMG_ON_MEMORY
:
False
BATCH_SIZE
:
16
# single GPU batch size
DATASET
:
'
imagenet_r'
TRANSFORM
:
'
build_transform_for_linear_probe'
DATA_PATH
:
'
./data/imagenet-r'
IMG_SIZE
:
448
MODEL
:
TYPE
:
intern_vit_6b
DROP_PATH_RATE
:
0.0
INTERN_VIT_6B
:
FREEZE_VIT
:
True
PATCH_SIZE
:
14
PRETRAIN_SIZE
:
224
QKV_BIAS
:
False
EMBED_DIM
:
3200
NUM_HEADS
:
25
MLP_RATIO
:
4
INIT_VALUES
:
0.1
QK_NORMALIZATION
:
True
DEPTH
:
48
USE_FLASH_ATTN
:
True
PRETRAINED
:
"
./pretrained/intern_vit_6b_224px.pth"
CLS_TARGET
:
'
cls_patch_concat'
TRAIN
:
EMA
:
ENABLE
:
True
DECAY
:
0.998
EPOCHS
:
10
WARMUP_EPOCHS
:
1
WEIGHT_DECAY
:
0.0
BASE_LR
:
0.1
# 512
WARMUP_LR
:
.0
MIN_LR
:
.0
LR_LAYER_DECAY
:
false
OPTIMIZER
:
NAME
:
'
sgd'
classification/configs/linear_probing/linear_probing_intern_vit_6b_224px_in1k_224to448_64gpu_imagenet_real.yaml
0 → 100644
View file @
26e59280
DATA
:
IMG_ON_MEMORY
:
False
BATCH_SIZE
:
16
# single GPU batch size
DATASET
:
'
imagenet-real'
TRANSFORM
:
'
build_transform_for_linear_probe'
DATA_PATH
:
'
./data/imagenet-1k'
IMG_SIZE
:
448
MODEL
:
TYPE
:
intern_vit_6b
DROP_PATH_RATE
:
0.0
INTERN_VIT_6B
:
FREEZE_VIT
:
True
PATCH_SIZE
:
14
PRETRAIN_SIZE
:
224
QKV_BIAS
:
False
EMBED_DIM
:
3200
NUM_HEADS
:
25
MLP_RATIO
:
4
INIT_VALUES
:
0.1
QK_NORMALIZATION
:
True
DEPTH
:
48
USE_FLASH_ATTN
:
True
PRETRAINED
:
"
./pretrained/intern_vit_6b_224px.pth"
CLS_TARGET
:
'
cls_patch_concat'
TRAIN
:
EMA
:
ENABLE
:
True
DECAY
:
0.998
EPOCHS
:
10
WARMUP_EPOCHS
:
1
WEIGHT_DECAY
:
0.0
BASE_LR
:
0.1
# 512
WARMUP_LR
:
.0
MIN_LR
:
.0
LR_LAYER_DECAY
:
false
OPTIMIZER
:
NAME
:
'
sgd'
classification/configs/linear_probing/linear_probing_intern_vit_6b_224px_in1k_224to448_64gpu_imagenet_sketch.yaml
0 → 100644
View file @
26e59280
DATA
:
IMG_ON_MEMORY
:
False
BATCH_SIZE
:
16
# single GPU batch size
DATASET
:
'
imagenet_sketch'
TRANSFORM
:
'
build_transform_for_linear_probe'
DATA_PATH
:
'
./data/imagenet-sketch'
IMG_SIZE
:
448
MODEL
:
TYPE
:
intern_vit_6b
DROP_PATH_RATE
:
0.0
INTERN_VIT_6B
:
FREEZE_VIT
:
True
PATCH_SIZE
:
14
PRETRAIN_SIZE
:
224
QKV_BIAS
:
False
EMBED_DIM
:
3200
NUM_HEADS
:
25
MLP_RATIO
:
4
INIT_VALUES
:
0.1
QK_NORMALIZATION
:
True
DEPTH
:
48
USE_FLASH_ATTN
:
True
PRETRAINED
:
"
./pretrained/intern_vit_6b_224px.pth"
CLS_TARGET
:
'
cls_patch_concat'
TRAIN
:
EMA
:
ENABLE
:
True
DECAY
:
0.998
EPOCHS
:
10
WARMUP_EPOCHS
:
1
WEIGHT_DECAY
:
0.0
BASE_LR
:
0.1
# 512
WARMUP_LR
:
.0
MIN_LR
:
.0
LR_LAYER_DECAY
:
false
OPTIMIZER
:
NAME
:
'
sgd'
classification/configs/linear_probing/linear_probing_intern_vit_6b_224px_in1k_224to448_64gpu_imagenetv2.yaml
0 → 100644
View file @
26e59280
DATA
:
IMG_ON_MEMORY
:
False
BATCH_SIZE
:
16
# single GPU batch size
DATASET
:
'
imagenetv2'
TRANSFORM
:
'
build_transform_for_linear_probe'
DATA_PATH
:
'
./data/imagenetv2'
IMG_SIZE
:
448
MODEL
:
TYPE
:
intern_vit_6b
DROP_PATH_RATE
:
0.0
INTERN_VIT_6B
:
FREEZE_VIT
:
True
PATCH_SIZE
:
14
PRETRAIN_SIZE
:
224
QKV_BIAS
:
False
EMBED_DIM
:
3200
NUM_HEADS
:
25
MLP_RATIO
:
4
INIT_VALUES
:
0.1
QK_NORMALIZATION
:
True
DEPTH
:
48
USE_FLASH_ATTN
:
True
PRETRAINED
:
"
./pretrained/intern_vit_6b_224px.pth"
CLS_TARGET
:
'
cls_patch_concat'
TRAIN
:
EMA
:
ENABLE
:
True
DECAY
:
0.998
EPOCHS
:
10
WARMUP_EPOCHS
:
1
WEIGHT_DECAY
:
0.0
BASE_LR
:
0.1
# 512
WARMUP_LR
:
.0
MIN_LR
:
.0
LR_LAYER_DECAY
:
false
OPTIMIZER
:
NAME
:
'
sgd'
classification/configs/linear_probing/linear_probing_intern_vit_6b_448px_v1_0_in1k_448_64gpu.yaml
0 → 100644
View file @
26e59280
DATA
:
IMG_ON_MEMORY
:
False
BATCH_SIZE
:
16
# single GPU batch size
TRANSFORM
:
'
build_transform_for_linear_probe'
DATA_PATH
:
'
./data/imagenet-1k'
IMG_SIZE
:
448
MODEL
:
TYPE
:
intern_vit_6b
DROP_PATH_RATE
:
0.0
INTERN_VIT_6B
:
FREEZE_VIT
:
True
PATCH_SIZE
:
14
PRETRAIN_SIZE
:
448
QKV_BIAS
:
False
EMBED_DIM
:
3200
NUM_HEADS
:
25
MLP_RATIO
:
4
INIT_VALUES
:
0.1
QK_NORMALIZATION
:
True
DEPTH
:
45
USE_FLASH_ATTN
:
True
PRETRAINED
:
"
./pretrained/intern_vit_6b_448px_v1_0.pth"
CLS_TARGET
:
'
cls_patch_concat'
TRAIN
:
EMA
:
ENABLE
:
True
DECAY
:
0.998
EPOCHS
:
10
WARMUP_EPOCHS
:
1
WEIGHT_DECAY
:
0.0
BASE_LR
:
0.1
# 512
WARMUP_LR
:
.0
MIN_LR
:
.0
LR_LAYER_DECAY
:
false
OPTIMIZER
:
NAME
:
'
sgd'
classification/configs/linear_probing/linear_probing_intern_vit_6b_448px_v1_0_in1k_448_64gpu_imagenet_a.yaml
0 → 100644
View file @
26e59280
DATA
:
IMG_ON_MEMORY
:
False
BATCH_SIZE
:
16
# single GPU batch size
DATASET
:
'
imagenet_a'
TRANSFORM
:
'
build_transform_for_linear_probe'
DATA_PATH
:
'
./data/imagenet-a'
IMG_SIZE
:
448
MODEL
:
TYPE
:
intern_vit_6b
DROP_PATH_RATE
:
0.0
INTERN_VIT_6B
:
FREEZE_VIT
:
True
PATCH_SIZE
:
14
PRETRAIN_SIZE
:
448
QKV_BIAS
:
False
EMBED_DIM
:
3200
NUM_HEADS
:
25
MLP_RATIO
:
4
INIT_VALUES
:
0.1
QK_NORMALIZATION
:
True
DEPTH
:
45
USE_FLASH_ATTN
:
True
PRETRAINED
:
"
./pretrained/intern_vit_6b_448px_v1_0.pth"
CLS_TARGET
:
'
cls_patch_concat'
TRAIN
:
EMA
:
ENABLE
:
True
DECAY
:
0.998
EPOCHS
:
10
WARMUP_EPOCHS
:
1
WEIGHT_DECAY
:
0.0
BASE_LR
:
0.1
# 512
WARMUP_LR
:
.0
MIN_LR
:
.0
LR_LAYER_DECAY
:
false
OPTIMIZER
:
NAME
:
'
sgd'
classification/configs/linear_probing/linear_probing_intern_vit_6b_448px_v1_0_in1k_448_64gpu_imagenet_r.yaml
0 → 100644
View file @
26e59280
DATA
:
IMG_ON_MEMORY
:
False
BATCH_SIZE
:
16
# single GPU batch size
DATASET
:
'
imagenet_r'
TRANSFORM
:
'
build_transform_for_linear_probe'
DATA_PATH
:
'
./data/imagenet-r'
IMG_SIZE
:
448
MODEL
:
TYPE
:
intern_vit_6b
DROP_PATH_RATE
:
0.0
INTERN_VIT_6B
:
FREEZE_VIT
:
True
PATCH_SIZE
:
14
PRETRAIN_SIZE
:
448
QKV_BIAS
:
False
EMBED_DIM
:
3200
NUM_HEADS
:
25
MLP_RATIO
:
4
INIT_VALUES
:
0.1
QK_NORMALIZATION
:
True
DEPTH
:
45
USE_FLASH_ATTN
:
True
PRETRAINED
:
"
./pretrained/intern_vit_6b_448px_v1_0.pth"
CLS_TARGET
:
'
cls_patch_concat'
TRAIN
:
EMA
:
ENABLE
:
True
DECAY
:
0.998
EPOCHS
:
10
WARMUP_EPOCHS
:
1
WEIGHT_DECAY
:
0.0
BASE_LR
:
0.1
# 512
WARMUP_LR
:
.0
MIN_LR
:
.0
LR_LAYER_DECAY
:
false
OPTIMIZER
:
NAME
:
'
sgd'
classification/configs/linear_probing/linear_probing_intern_vit_6b_448px_v1_0_in1k_448_64gpu_imagenet_real.yaml
0 → 100644
View file @
26e59280
DATA
:
IMG_ON_MEMORY
:
False
BATCH_SIZE
:
16
# single GPU batch size
DATASET
:
'
imagenet-real'
TRANSFORM
:
'
build_transform_for_linear_probe'
DATA_PATH
:
'
./data/imagenet-1k'
IMG_SIZE
:
448
MODEL
:
TYPE
:
intern_vit_6b
DROP_PATH_RATE
:
0.0
INTERN_VIT_6B
:
FREEZE_VIT
:
True
PATCH_SIZE
:
14
PRETRAIN_SIZE
:
448
QKV_BIAS
:
False
EMBED_DIM
:
3200
NUM_HEADS
:
25
MLP_RATIO
:
4
INIT_VALUES
:
0.1
QK_NORMALIZATION
:
True
DEPTH
:
45
USE_FLASH_ATTN
:
True
PRETRAINED
:
"
./pretrained/intern_vit_6b_448px_v1_0.pth"
CLS_TARGET
:
'
cls_patch_concat'
TRAIN
:
EMA
:
ENABLE
:
True
DECAY
:
0.998
EPOCHS
:
10
WARMUP_EPOCHS
:
1
WEIGHT_DECAY
:
0.0
BASE_LR
:
0.1
# 512
WARMUP_LR
:
.0
MIN_LR
:
.0
LR_LAYER_DECAY
:
false
OPTIMIZER
:
NAME
:
'
sgd'
classification/configs/linear_probing/linear_probing_intern_vit_6b_448px_v1_0_in1k_448_64gpu_imagenet_sketch.yaml
0 → 100644
View file @
26e59280
DATA
:
IMG_ON_MEMORY
:
False
BATCH_SIZE
:
16
# single GPU batch size
DATASET
:
'
imagenet_sketch'
TRANSFORM
:
'
build_transform_for_linear_probe'
DATA_PATH
:
'
./data/imagenet-sketch'
IMG_SIZE
:
448
MODEL
:
TYPE
:
intern_vit_6b
DROP_PATH_RATE
:
0.0
INTERN_VIT_6B
:
FREEZE_VIT
:
True
PATCH_SIZE
:
14
PRETRAIN_SIZE
:
448
QKV_BIAS
:
False
EMBED_DIM
:
3200
NUM_HEADS
:
25
MLP_RATIO
:
4
INIT_VALUES
:
0.1
QK_NORMALIZATION
:
True
DEPTH
:
45
USE_FLASH_ATTN
:
True
PRETRAINED
:
"
./pretrained/intern_vit_6b_448px_v1_0.pth"
CLS_TARGET
:
'
cls_patch_concat'
TRAIN
:
EMA
:
ENABLE
:
True
DECAY
:
0.998
EPOCHS
:
10
WARMUP_EPOCHS
:
1
WEIGHT_DECAY
:
0.0
BASE_LR
:
0.1
# 512
WARMUP_LR
:
.0
MIN_LR
:
.0
LR_LAYER_DECAY
:
false
OPTIMIZER
:
NAME
:
'
sgd'
classification/configs/linear_probing/linear_probing_intern_vit_6b_448px_v1_0_in1k_448_64gpu_imagenetv2.yaml
0 → 100644
View file @
26e59280
DATA
:
IMG_ON_MEMORY
:
False
BATCH_SIZE
:
16
# single GPU batch size
DATASET
:
'
imagenetv2'
TRANSFORM
:
'
build_transform_for_linear_probe'
DATA_PATH
:
'
./data/imagenetv2'
IMG_SIZE
:
448
MODEL
:
TYPE
:
intern_vit_6b
DROP_PATH_RATE
:
0.0
INTERN_VIT_6B
:
FREEZE_VIT
:
True
PATCH_SIZE
:
14
PRETRAIN_SIZE
:
448
QKV_BIAS
:
False
EMBED_DIM
:
3200
NUM_HEADS
:
25
MLP_RATIO
:
4
INIT_VALUES
:
0.1
QK_NORMALIZATION
:
True
DEPTH
:
45
USE_FLASH_ATTN
:
True
PRETRAINED
:
"
./pretrained/intern_vit_6b_448px_v1_0.pth"
CLS_TARGET
:
'
cls_patch_concat'
TRAIN
:
EMA
:
ENABLE
:
True
DECAY
:
0.998
EPOCHS
:
10
WARMUP_EPOCHS
:
1
WEIGHT_DECAY
:
0.0
BASE_LR
:
0.1
# 512
WARMUP_LR
:
.0
MIN_LR
:
.0
LR_LAYER_DECAY
:
false
OPTIMIZER
:
NAME
:
'
sgd'
classification/configs/linear_probing/linear_probing_intern_vit_6b_448px_v1_2_in1k_448_64gpu.yaml
0 → 100644
View file @
26e59280
DATA
:
IMG_ON_MEMORY
:
False
BATCH_SIZE
:
16
# single GPU batch size
TRANSFORM
:
'
build_transform_for_linear_probe'
DATA_PATH
:
'
./data/imagenet-1k'
IMG_SIZE
:
448
MODEL
:
TYPE
:
intern_vit_6b
DROP_PATH_RATE
:
0.0
INTERN_VIT_6B
:
FREEZE_VIT
:
True
PATCH_SIZE
:
14
PRETRAIN_SIZE
:
448
QKV_BIAS
:
False
EMBED_DIM
:
3200
NUM_HEADS
:
25
MLP_RATIO
:
4
INIT_VALUES
:
0.1
QK_NORMALIZATION
:
True
DEPTH
:
45
USE_FLASH_ATTN
:
True
PRETRAINED
:
"
./pretrained/intern_vit_6b_448px_v1_2.pth"
CLS_TARGET
:
'
cls_patch_concat'
TRAIN
:
EMA
:
ENABLE
:
True
DECAY
:
0.998
EPOCHS
:
10
WARMUP_EPOCHS
:
1
WEIGHT_DECAY
:
0.0
BASE_LR
:
0.1
# 512
WARMUP_LR
:
.0
MIN_LR
:
.0
LR_LAYER_DECAY
:
false
OPTIMIZER
:
NAME
:
'
sgd'
classification/configs/linear_probing/linear_probing_intern_vit_6b_448px_v1_2_in1k_448_64gpu_imagenet_a.yaml
0 → 100644
View file @
26e59280
DATA
:
IMG_ON_MEMORY
:
False
BATCH_SIZE
:
16
# single GPU batch size
DATASET
:
'
imagenet_a'
TRANSFORM
:
'
build_transform_for_linear_probe'
DATA_PATH
:
'
./data/imagenet-a'
IMG_SIZE
:
448
MODEL
:
TYPE
:
intern_vit_6b
DROP_PATH_RATE
:
0.0
INTERN_VIT_6B
:
FREEZE_VIT
:
True
PATCH_SIZE
:
14
PRETRAIN_SIZE
:
448
QKV_BIAS
:
False
EMBED_DIM
:
3200
NUM_HEADS
:
25
MLP_RATIO
:
4
INIT_VALUES
:
0.1
QK_NORMALIZATION
:
True
DEPTH
:
45
USE_FLASH_ATTN
:
True
PRETRAINED
:
"
./pretrained/intern_vit_6b_448px_v1_2.pth"
CLS_TARGET
:
'
cls_patch_concat'
TRAIN
:
EMA
:
ENABLE
:
True
DECAY
:
0.998
EPOCHS
:
10
WARMUP_EPOCHS
:
1
WEIGHT_DECAY
:
0.0
BASE_LR
:
0.1
# 512
WARMUP_LR
:
.0
MIN_LR
:
.0
LR_LAYER_DECAY
:
false
OPTIMIZER
:
NAME
:
'
sgd'
classification/configs/linear_probing/linear_probing_intern_vit_6b_448px_v1_2_in1k_448_64gpu_imagenet_r.yaml
0 → 100644
View file @
26e59280
DATA
:
IMG_ON_MEMORY
:
False
BATCH_SIZE
:
16
# single GPU batch size
DATASET
:
'
imagenet_r'
TRANSFORM
:
'
build_transform_for_linear_probe'
DATA_PATH
:
'
./data/imagenet-r'
IMG_SIZE
:
448
MODEL
:
TYPE
:
intern_vit_6b
DROP_PATH_RATE
:
0.0
INTERN_VIT_6B
:
FREEZE_VIT
:
True
PATCH_SIZE
:
14
PRETRAIN_SIZE
:
448
QKV_BIAS
:
False
EMBED_DIM
:
3200
NUM_HEADS
:
25
MLP_RATIO
:
4
INIT_VALUES
:
0.1
QK_NORMALIZATION
:
True
DEPTH
:
45
USE_FLASH_ATTN
:
True
PRETRAINED
:
"
./pretrained/intern_vit_6b_448px_v1_2.pth"
CLS_TARGET
:
'
cls_patch_concat'
TRAIN
:
EMA
:
ENABLE
:
True
DECAY
:
0.998
EPOCHS
:
10
WARMUP_EPOCHS
:
1
WEIGHT_DECAY
:
0.0
BASE_LR
:
0.1
# 512
WARMUP_LR
:
.0
MIN_LR
:
.0
LR_LAYER_DECAY
:
false
OPTIMIZER
:
NAME
:
'
sgd'
classification/configs/linear_probing/linear_probing_intern_vit_6b_448px_v1_2_in1k_448_64gpu_imagenet_real.yaml
0 → 100644
View file @
26e59280
DATA
:
IMG_ON_MEMORY
:
False
BATCH_SIZE
:
16
# single GPU batch size
DATASET
:
'
imagenet-real'
TRANSFORM
:
'
build_transform_for_linear_probe'
DATA_PATH
:
'
./data/imagenet-1k'
IMG_SIZE
:
448
MODEL
:
TYPE
:
intern_vit_6b
DROP_PATH_RATE
:
0.0
INTERN_VIT_6B
:
FREEZE_VIT
:
True
PATCH_SIZE
:
14
PRETRAIN_SIZE
:
448
QKV_BIAS
:
False
EMBED_DIM
:
3200
NUM_HEADS
:
25
MLP_RATIO
:
4
INIT_VALUES
:
0.1
QK_NORMALIZATION
:
True
DEPTH
:
45
USE_FLASH_ATTN
:
True
PRETRAINED
:
"
./pretrained/intern_vit_6b_448px_v1_2.pth"
CLS_TARGET
:
'
cls_patch_concat'
TRAIN
:
EMA
:
ENABLE
:
True
DECAY
:
0.998
EPOCHS
:
10
WARMUP_EPOCHS
:
1
WEIGHT_DECAY
:
0.0
BASE_LR
:
0.1
# 512
WARMUP_LR
:
.0
MIN_LR
:
.0
LR_LAYER_DECAY
:
false
OPTIMIZER
:
NAME
:
'
sgd'
classification/configs/linear_probing/linear_probing_intern_vit_6b_448px_v1_2_in1k_448_64gpu_imagenet_sketch.yaml
0 → 100644
View file @
26e59280
DATA
:
IMG_ON_MEMORY
:
False
BATCH_SIZE
:
16
# single GPU batch size
DATASET
:
'
imagenet_sketch'
TRANSFORM
:
'
build_transform_for_linear_probe'
DATA_PATH
:
'
./data/imagenet-sketch'
IMG_SIZE
:
448
MODEL
:
TYPE
:
intern_vit_6b
DROP_PATH_RATE
:
0.0
INTERN_VIT_6B
:
FREEZE_VIT
:
True
PATCH_SIZE
:
14
PRETRAIN_SIZE
:
448
QKV_BIAS
:
False
EMBED_DIM
:
3200
NUM_HEADS
:
25
MLP_RATIO
:
4
INIT_VALUES
:
0.1
QK_NORMALIZATION
:
True
DEPTH
:
45
USE_FLASH_ATTN
:
True
PRETRAINED
:
"
./pretrained/intern_vit_6b_448px_v1_2.pth"
CLS_TARGET
:
'
cls_patch_concat'
TRAIN
:
EMA
:
ENABLE
:
True
DECAY
:
0.998
EPOCHS
:
10
WARMUP_EPOCHS
:
1
WEIGHT_DECAY
:
0.0
BASE_LR
:
0.1
# 512
WARMUP_LR
:
.0
MIN_LR
:
.0
LR_LAYER_DECAY
:
false
OPTIMIZER
:
NAME
:
'
sgd'
classification/configs/linear_probing/linear_probing_intern_vit_6b_448px_v1_2_in1k_448_64gpu_imagenetv2.yaml
0 → 100644
View file @
26e59280
DATA
:
IMG_ON_MEMORY
:
False
BATCH_SIZE
:
16
# single GPU batch size
DATASET
:
'
imagenetv2'
TRANSFORM
:
'
build_transform_for_linear_probe'
DATA_PATH
:
'
./data/imagenetv2'
IMG_SIZE
:
448
MODEL
:
TYPE
:
intern_vit_6b
DROP_PATH_RATE
:
0.0
INTERN_VIT_6B
:
FREEZE_VIT
:
True
PATCH_SIZE
:
14
PRETRAIN_SIZE
:
448
QKV_BIAS
:
False
EMBED_DIM
:
3200
NUM_HEADS
:
25
MLP_RATIO
:
4
INIT_VALUES
:
0.1
QK_NORMALIZATION
:
True
DEPTH
:
45
USE_FLASH_ATTN
:
True
PRETRAINED
:
"
./pretrained/intern_vit_6b_448px_v1_2.pth"
CLS_TARGET
:
'
cls_patch_concat'
TRAIN
:
EMA
:
ENABLE
:
True
DECAY
:
0.998
EPOCHS
:
10
WARMUP_EPOCHS
:
1
WEIGHT_DECAY
:
0.0
BASE_LR
:
0.1
# 512
WARMUP_LR
:
.0
MIN_LR
:
.0
LR_LAYER_DECAY
:
false
OPTIMIZER
:
NAME
:
'
sgd'
classification/configs/linear_probing/linear_probing_intern_vit_6b_448px_v1_5_in1k_448_64gpu.yaml
0 → 100644
View file @
26e59280
DATA
:
IMG_ON_MEMORY
:
False
BATCH_SIZE
:
16
# single GPU batch size
TRANSFORM
:
'
build_transform_for_linear_probe'
DATA_PATH
:
'
./data/imagenet-1k'
IMG_SIZE
:
448
MODEL
:
TYPE
:
intern_vit_6b
DROP_PATH_RATE
:
0.0
INTERN_VIT_6B
:
FREEZE_VIT
:
True
PATCH_SIZE
:
14
PRETRAIN_SIZE
:
448
QKV_BIAS
:
False
EMBED_DIM
:
3200
NUM_HEADS
:
25
MLP_RATIO
:
4
INIT_VALUES
:
0.1
QK_NORMALIZATION
:
True
DEPTH
:
45
USE_FLASH_ATTN
:
True
PRETRAINED
:
"
./pretrained/intern_vit_6b_448px_v1_5.pth"
CLS_TARGET
:
'
cls_patch_concat'
TRAIN
:
EMA
:
ENABLE
:
True
DECAY
:
0.998
EPOCHS
:
10
WARMUP_EPOCHS
:
1
WEIGHT_DECAY
:
0.0
BASE_LR
:
0.1
# 512
WARMUP_LR
:
.0
MIN_LR
:
.0
LR_LAYER_DECAY
:
false
OPTIMIZER
:
NAME
:
'
sgd'
classification/configs/linear_probing/linear_probing_intern_vit_6b_448px_v1_5_in1k_448_64gpu_imagenet_a.yaml
0 → 100644
View file @
26e59280
DATA
:
IMG_ON_MEMORY
:
False
BATCH_SIZE
:
16
# single GPU batch size
DATASET
:
'
imagenet_a'
TRANSFORM
:
'
build_transform_for_linear_probe'
DATA_PATH
:
'
./data/imagenet-a'
IMG_SIZE
:
448
MODEL
:
TYPE
:
intern_vit_6b
DROP_PATH_RATE
:
0.0
INTERN_VIT_6B
:
FREEZE_VIT
:
True
PATCH_SIZE
:
14
PRETRAIN_SIZE
:
448
QKV_BIAS
:
False
EMBED_DIM
:
3200
NUM_HEADS
:
25
MLP_RATIO
:
4
INIT_VALUES
:
0.1
QK_NORMALIZATION
:
True
DEPTH
:
45
USE_FLASH_ATTN
:
True
PRETRAINED
:
"
./pretrained/intern_vit_6b_448px_v1_5.pth"
CLS_TARGET
:
'
cls_patch_concat'
TRAIN
:
EMA
:
ENABLE
:
True
DECAY
:
0.998
EPOCHS
:
10
WARMUP_EPOCHS
:
1
WEIGHT_DECAY
:
0.0
BASE_LR
:
0.1
# 512
WARMUP_LR
:
.0
MIN_LR
:
.0
LR_LAYER_DECAY
:
false
OPTIMIZER
:
NAME
:
'
sgd'
classification/configs/linear_probing/linear_probing_intern_vit_6b_448px_v1_5_in1k_448_64gpu_imagenet_r.yaml
0 → 100644
View file @
26e59280
DATA
:
IMG_ON_MEMORY
:
False
BATCH_SIZE
:
16
# single GPU batch size
DATASET
:
'
imagenet_r'
TRANSFORM
:
'
build_transform_for_linear_probe'
DATA_PATH
:
'
./data/imagenet-r'
IMG_SIZE
:
448
MODEL
:
TYPE
:
intern_vit_6b
DROP_PATH_RATE
:
0.0
INTERN_VIT_6B
:
FREEZE_VIT
:
True
PATCH_SIZE
:
14
PRETRAIN_SIZE
:
448
QKV_BIAS
:
False
EMBED_DIM
:
3200
NUM_HEADS
:
25
MLP_RATIO
:
4
INIT_VALUES
:
0.1
QK_NORMALIZATION
:
True
DEPTH
:
45
USE_FLASH_ATTN
:
True
PRETRAINED
:
"
./pretrained/intern_vit_6b_448px_v1_5.pth"
CLS_TARGET
:
'
cls_patch_concat'
TRAIN
:
EMA
:
ENABLE
:
True
DECAY
:
0.998
EPOCHS
:
10
WARMUP_EPOCHS
:
1
WEIGHT_DECAY
:
0.0
BASE_LR
:
0.1
# 512
WARMUP_LR
:
.0
MIN_LR
:
.0
LR_LAYER_DECAY
:
false
OPTIMIZER
:
NAME
:
'
sgd'
classification/configs/linear_probing/linear_probing_intern_vit_6b_448px_v1_5_in1k_448_64gpu_imagenet_real.yaml
0 → 100644
View file @
26e59280
DATA
:
IMG_ON_MEMORY
:
False
BATCH_SIZE
:
16
# single GPU batch size
DATASET
:
'
imagenet-real'
TRANSFORM
:
'
build_transform_for_linear_probe'
DATA_PATH
:
'
./data/imagenet-1k'
IMG_SIZE
:
448
MODEL
:
TYPE
:
intern_vit_6b
DROP_PATH_RATE
:
0.0
INTERN_VIT_6B
:
FREEZE_VIT
:
True
PATCH_SIZE
:
14
PRETRAIN_SIZE
:
448
QKV_BIAS
:
False
EMBED_DIM
:
3200
NUM_HEADS
:
25
MLP_RATIO
:
4
INIT_VALUES
:
0.1
QK_NORMALIZATION
:
True
DEPTH
:
45
USE_FLASH_ATTN
:
True
PRETRAINED
:
"
./pretrained/intern_vit_6b_448px_v1_5.pth"
CLS_TARGET
:
'
cls_patch_concat'
TRAIN
:
EMA
:
ENABLE
:
True
DECAY
:
0.998
EPOCHS
:
10
WARMUP_EPOCHS
:
1
WEIGHT_DECAY
:
0.0
BASE_LR
:
0.1
# 512
WARMUP_LR
:
.0
MIN_LR
:
.0
LR_LAYER_DECAY
:
false
OPTIMIZER
:
NAME
:
'
sgd'
Prev
1
2
3
4
5
6
7
8
…
43
Next
Write
Preview
Markdown
is supported
0%
Try again
or
attach a new file
.
Attach a file
Cancel
You are about to add
0
people
to the discussion. Proceed with caution.
Finish editing this message first!
Cancel
Please
register
or
sign in
to comment