Skip to content
GitLab
Menu
Projects
Groups
Snippets
Loading...
Help
Help
Support
Community forum
Keyboard shortcuts
?
Submit feedback
Contribute to GitLab
Sign in / Register
Toggle navigation
Menu
Open sidebar
ModelZoo
open_clip_pytorch
Commits
6f43e8fa
Commit
6f43e8fa
authored
Sep 14, 2024
by
mashun1
Browse files
open_clip
parents
Pipeline
#1689
canceled with stages
Changes
217
Pipelines
1
Hide whitespace changes
Inline
Side-by-side
Showing
20 changed files
with
436 additions
and
0 deletions
+436
-0
src/open_clip/model_configs/ViT-L-14-CLIPA-336.json
src/open_clip/model_configs/ViT-L-14-CLIPA-336.json
+26
-0
src/open_clip/model_configs/ViT-L-14-CLIPA.json
src/open_clip/model_configs/ViT-L-14-CLIPA.json
+26
-0
src/open_clip/model_configs/ViT-L-14-quickgelu.json
src/open_clip/model_configs/ViT-L-14-quickgelu.json
+18
-0
src/open_clip/model_configs/ViT-L-14.json
src/open_clip/model_configs/ViT-L-14.json
+17
-0
src/open_clip/model_configs/ViT-L-16-320.json
src/open_clip/model_configs/ViT-L-16-320.json
+17
-0
src/open_clip/model_configs/ViT-L-16-SigLIP-256.json
src/open_clip/model_configs/ViT-L-16-SigLIP-256.json
+30
-0
src/open_clip/model_configs/ViT-L-16-SigLIP-384.json
src/open_clip/model_configs/ViT-L-16-SigLIP-384.json
+30
-0
src/open_clip/model_configs/ViT-L-16.json
src/open_clip/model_configs/ViT-L-16.json
+17
-0
src/open_clip/model_configs/ViT-M-16-alt.json
src/open_clip/model_configs/ViT-M-16-alt.json
+18
-0
src/open_clip/model_configs/ViT-M-16.json
src/open_clip/model_configs/ViT-M-16.json
+17
-0
src/open_clip/model_configs/ViT-M-32-alt.json
src/open_clip/model_configs/ViT-M-32-alt.json
+17
-0
src/open_clip/model_configs/ViT-M-32.json
src/open_clip/model_configs/ViT-M-32.json
+17
-0
src/open_clip/model_configs/ViT-S-16-alt.json
src/open_clip/model_configs/ViT-S-16-alt.json
+17
-0
src/open_clip/model_configs/ViT-S-16.json
src/open_clip/model_configs/ViT-S-16.json
+17
-0
src/open_clip/model_configs/ViT-S-32-alt.json
src/open_clip/model_configs/ViT-S-32-alt.json
+17
-0
src/open_clip/model_configs/ViT-S-32.json
src/open_clip/model_configs/ViT-S-32.json
+17
-0
src/open_clip/model_configs/ViT-SO400M-14-SigLIP-384.json
src/open_clip/model_configs/ViT-SO400M-14-SigLIP-384.json
+31
-0
src/open_clip/model_configs/ViT-SO400M-14-SigLIP.json
src/open_clip/model_configs/ViT-SO400M-14-SigLIP.json
+31
-0
src/open_clip/model_configs/ViT-bigG-14-CLIPA-336.json
src/open_clip/model_configs/ViT-bigG-14-CLIPA-336.json
+28
-0
src/open_clip/model_configs/ViT-bigG-14-CLIPA.json
src/open_clip/model_configs/ViT-bigG-14-CLIPA.json
+28
-0
No files found.
src/open_clip/model_configs/ViT-L-14-CLIPA-336.json
0 → 100755
View file @
6f43e8fa
{
"embed_dim"
:
768
,
"vision_cfg"
:
{
"image_size"
:
336
,
"layers"
:
24
,
"width"
:
1024
,
"patch_size"
:
14
,
"no_ln_pre"
:
true
,
"pool_type"
:
"avg"
,
"final_ln_after_pool"
:
true
},
"text_cfg"
:
{
"context_length"
:
32
,
"vocab_size"
:
32000
,
"hf_tokenizer_name"
:
"bert-base-uncased"
,
"tokenizer_kwargs"
:
{
"strip_sep_token"
:
true
},
"width"
:
768
,
"heads"
:
12
,
"layers"
:
12
,
"pool_type"
:
"last"
,
"no_causal_mask"
:
true
}
}
\ No newline at end of file
src/open_clip/model_configs/ViT-L-14-CLIPA.json
0 → 100755
View file @
6f43e8fa
{
"embed_dim"
:
768
,
"vision_cfg"
:
{
"image_size"
:
224
,
"layers"
:
24
,
"width"
:
1024
,
"patch_size"
:
14
,
"no_ln_pre"
:
true
,
"pool_type"
:
"avg"
,
"final_ln_after_pool"
:
true
},
"text_cfg"
:
{
"context_length"
:
32
,
"vocab_size"
:
32000
,
"hf_tokenizer_name"
:
"bert-base-uncased"
,
"tokenizer_kwargs"
:
{
"strip_sep_token"
:
true
},
"width"
:
768
,
"heads"
:
12
,
"layers"
:
12
,
"pool_type"
:
"last"
,
"no_causal_mask"
:
true
}
}
\ No newline at end of file
src/open_clip/model_configs/ViT-L-14-quickgelu.json
0 → 100755
View file @
6f43e8fa
{
"embed_dim"
:
768
,
"quick_gelu"
:
true
,
"vision_cfg"
:
{
"image_size"
:
224
,
"layers"
:
24
,
"width"
:
1024
,
"patch_size"
:
14
},
"text_cfg"
:
{
"context_length"
:
77
,
"vocab_size"
:
49408
,
"width"
:
768
,
"heads"
:
12
,
"layers"
:
12
}
}
\ No newline at end of file
src/open_clip/model_configs/ViT-L-14.json
0 → 100755
View file @
6f43e8fa
{
"embed_dim"
:
768
,
"vision_cfg"
:
{
"image_size"
:
224
,
"layers"
:
24
,
"width"
:
1024
,
"patch_size"
:
14
},
"text_cfg"
:
{
"context_length"
:
77
,
"vocab_size"
:
49408
,
"width"
:
768
,
"heads"
:
12
,
"layers"
:
12
}
}
\ No newline at end of file
src/open_clip/model_configs/ViT-L-16-320.json
0 → 100755
View file @
6f43e8fa
{
"embed_dim"
:
768
,
"vision_cfg"
:
{
"image_size"
:
320
,
"layers"
:
24
,
"width"
:
1024
,
"patch_size"
:
16
},
"text_cfg"
:
{
"context_length"
:
77
,
"vocab_size"
:
49408
,
"width"
:
768
,
"heads"
:
12
,
"layers"
:
12
}
}
\ No newline at end of file
src/open_clip/model_configs/ViT-L-16-SigLIP-256.json
0 → 100755
View file @
6f43e8fa
{
"embed_dim"
:
1024
,
"init_logit_bias"
:
-10
,
"custom_text"
:
true
,
"vision_cfg"
:
{
"image_size"
:
256
,
"timm_model_name"
:
"vit_large_patch16_siglip_256"
,
"timm_model_pretrained"
:
false
,
"timm_pool"
:
"map"
,
"timm_proj"
:
"none"
},
"text_cfg"
:
{
"context_length"
:
64
,
"vocab_size"
:
32000
,
"hf_tokenizer_name"
:
"timm/ViT-B-16-SigLIP"
,
"tokenizer_kwargs"
:
{
"clean"
:
"canonicalize"
},
"width"
:
1024
,
"heads"
:
16
,
"layers"
:
24
,
"no_causal_mask"
:
true
,
"proj_bias"
:
true
,
"pool_type"
:
"last"
,
"norm_kwargs"
:{
"eps"
:
1e-6
}
}
}
\ No newline at end of file
src/open_clip/model_configs/ViT-L-16-SigLIP-384.json
0 → 100755
View file @
6f43e8fa
{
"embed_dim"
:
1024
,
"init_logit_bias"
:
-10
,
"custom_text"
:
true
,
"vision_cfg"
:
{
"image_size"
:
384
,
"timm_model_name"
:
"vit_large_patch16_siglip_384"
,
"timm_model_pretrained"
:
false
,
"timm_pool"
:
"map"
,
"timm_proj"
:
"none"
},
"text_cfg"
:
{
"context_length"
:
64
,
"vocab_size"
:
32000
,
"hf_tokenizer_name"
:
"timm/ViT-B-16-SigLIP"
,
"tokenizer_kwargs"
:
{
"clean"
:
"canonicalize"
},
"width"
:
1024
,
"heads"
:
16
,
"layers"
:
24
,
"no_causal_mask"
:
true
,
"proj_bias"
:
true
,
"pool_type"
:
"last"
,
"norm_kwargs"
:{
"eps"
:
1e-6
}
}
}
\ No newline at end of file
src/open_clip/model_configs/ViT-L-16.json
0 → 100755
View file @
6f43e8fa
{
"embed_dim"
:
768
,
"vision_cfg"
:
{
"image_size"
:
224
,
"layers"
:
24
,
"width"
:
1024
,
"patch_size"
:
16
},
"text_cfg"
:
{
"context_length"
:
77
,
"vocab_size"
:
49408
,
"width"
:
768
,
"heads"
:
12
,
"layers"
:
12
}
}
\ No newline at end of file
src/open_clip/model_configs/ViT-M-16-alt.json
0 → 100755
View file @
6f43e8fa
{
"embed_dim"
:
384
,
"vision_cfg"
:
{
"image_size"
:
224
,
"layers"
:
12
,
"width"
:
512
,
"patch_size"
:
16
,
"ls_init_value"
:
1e-4
},
"text_cfg"
:
{
"context_length"
:
77
,
"vocab_size"
:
49408
,
"width"
:
384
,
"heads"
:
6
,
"layers"
:
12
}
}
\ No newline at end of file
src/open_clip/model_configs/ViT-M-16.json
0 → 100755
View file @
6f43e8fa
{
"embed_dim"
:
512
,
"vision_cfg"
:
{
"image_size"
:
224
,
"layers"
:
12
,
"width"
:
512
,
"patch_size"
:
16
},
"text_cfg"
:
{
"context_length"
:
77
,
"vocab_size"
:
49408
,
"width"
:
512
,
"heads"
:
8
,
"layers"
:
12
}
}
\ No newline at end of file
src/open_clip/model_configs/ViT-M-32-alt.json
0 → 100755
View file @
6f43e8fa
{
"embed_dim"
:
384
,
"vision_cfg"
:
{
"image_size"
:
224
,
"layers"
:
12
,
"width"
:
512
,
"patch_size"
:
32
},
"text_cfg"
:
{
"context_length"
:
77
,
"vocab_size"
:
49408
,
"width"
:
384
,
"heads"
:
6
,
"layers"
:
12
}
}
\ No newline at end of file
src/open_clip/model_configs/ViT-M-32.json
0 → 100755
View file @
6f43e8fa
{
"embed_dim"
:
512
,
"vision_cfg"
:
{
"image_size"
:
224
,
"layers"
:
12
,
"width"
:
512
,
"patch_size"
:
32
},
"text_cfg"
:
{
"context_length"
:
77
,
"vocab_size"
:
49408
,
"width"
:
512
,
"heads"
:
8
,
"layers"
:
12
}
}
\ No newline at end of file
src/open_clip/model_configs/ViT-S-16-alt.json
0 → 100755
View file @
6f43e8fa
{
"embed_dim"
:
256
,
"vision_cfg"
:
{
"image_size"
:
224
,
"layers"
:
12
,
"width"
:
384
,
"patch_size"
:
16
},
"text_cfg"
:
{
"context_length"
:
77
,
"vocab_size"
:
49408
,
"width"
:
256
,
"heads"
:
4
,
"layers"
:
10
}
}
\ No newline at end of file
src/open_clip/model_configs/ViT-S-16.json
0 → 100755
View file @
6f43e8fa
{
"embed_dim"
:
384
,
"vision_cfg"
:
{
"image_size"
:
224
,
"layers"
:
12
,
"width"
:
384
,
"patch_size"
:
16
},
"text_cfg"
:
{
"context_length"
:
77
,
"vocab_size"
:
49408
,
"width"
:
384
,
"heads"
:
6
,
"layers"
:
12
}
}
\ No newline at end of file
src/open_clip/model_configs/ViT-S-32-alt.json
0 → 100755
View file @
6f43e8fa
{
"embed_dim"
:
256
,
"vision_cfg"
:
{
"image_size"
:
224
,
"layers"
:
12
,
"width"
:
384
,
"patch_size"
:
32
},
"text_cfg"
:
{
"context_length"
:
77
,
"vocab_size"
:
49408
,
"width"
:
256
,
"heads"
:
4
,
"layers"
:
10
}
}
\ No newline at end of file
src/open_clip/model_configs/ViT-S-32.json
0 → 100755
View file @
6f43e8fa
{
"embed_dim"
:
384
,
"vision_cfg"
:
{
"image_size"
:
224
,
"layers"
:
12
,
"width"
:
384
,
"patch_size"
:
32
},
"text_cfg"
:
{
"context_length"
:
77
,
"vocab_size"
:
49408
,
"width"
:
384
,
"heads"
:
6
,
"layers"
:
12
}
}
\ No newline at end of file
src/open_clip/model_configs/ViT-SO400M-14-SigLIP-384.json
0 → 100755
View file @
6f43e8fa
{
"embed_dim"
:
1152
,
"init_logit_bias"
:
-10
,
"custom_text"
:
true
,
"vision_cfg"
:
{
"image_size"
:
384
,
"timm_model_name"
:
"vit_so400m_patch14_siglip_384"
,
"timm_model_pretrained"
:
false
,
"timm_pool"
:
"map"
,
"timm_proj"
:
"none"
},
"text_cfg"
:
{
"context_length"
:
64
,
"vocab_size"
:
32000
,
"hf_tokenizer_name"
:
"timm/ViT-B-16-SigLIP"
,
"tokenizer_kwargs"
:
{
"clean"
:
"canonicalize"
},
"width"
:
1152
,
"heads"
:
16
,
"layers"
:
27
,
"mlp_ratio"
:
3.7362
,
"no_causal_mask"
:
true
,
"proj_bias"
:
true
,
"pool_type"
:
"last"
,
"norm_kwargs"
:{
"eps"
:
1e-6
}
}
}
\ No newline at end of file
src/open_clip/model_configs/ViT-SO400M-14-SigLIP.json
0 → 100755
View file @
6f43e8fa
{
"embed_dim"
:
1152
,
"init_logit_bias"
:
-10
,
"custom_text"
:
true
,
"vision_cfg"
:
{
"image_size"
:
224
,
"timm_model_name"
:
"vit_so400m_patch14_siglip_224"
,
"timm_model_pretrained"
:
false
,
"timm_pool"
:
"map"
,
"timm_proj"
:
"none"
},
"text_cfg"
:
{
"context_length"
:
16
,
"vocab_size"
:
32000
,
"hf_tokenizer_name"
:
"timm/ViT-B-16-SigLIP"
,
"tokenizer_kwargs"
:
{
"clean"
:
"canonicalize"
},
"width"
:
1152
,
"heads"
:
16
,
"layers"
:
27
,
"mlp_ratio"
:
3.7362
,
"no_causal_mask"
:
true
,
"proj_bias"
:
true
,
"pool_type"
:
"last"
,
"norm_kwargs"
:{
"eps"
:
1e-6
}
}
}
\ No newline at end of file
src/open_clip/model_configs/ViT-bigG-14-CLIPA-336.json
0 → 100755
View file @
6f43e8fa
{
"embed_dim"
:
1280
,
"vision_cfg"
:
{
"image_size"
:
336
,
"layers"
:
48
,
"width"
:
1664
,
"head_width"
:
104
,
"mlp_ratio"
:
4.9231
,
"patch_size"
:
14
,
"no_ln_pre"
:
true
,
"pool_type"
:
"avg"
,
"final_ln_after_pool"
:
true
},
"text_cfg"
:
{
"context_length"
:
32
,
"vocab_size"
:
32000
,
"hf_tokenizer_name"
:
"bert-base-uncased"
,
"tokenizer_kwargs"
:
{
"strip_sep_token"
:
true
},
"width"
:
1280
,
"heads"
:
20
,
"layers"
:
32
,
"pool_type"
:
"last"
,
"no_causal_mask"
:
true
}
}
\ No newline at end of file
src/open_clip/model_configs/ViT-bigG-14-CLIPA.json
0 → 100755
View file @
6f43e8fa
{
"embed_dim"
:
1280
,
"vision_cfg"
:
{
"image_size"
:
224
,
"layers"
:
48
,
"width"
:
1664
,
"head_width"
:
104
,
"mlp_ratio"
:
4.9231
,
"patch_size"
:
14
,
"no_ln_pre"
:
true
,
"pool_type"
:
"avg"
,
"final_ln_after_pool"
:
true
},
"text_cfg"
:
{
"context_length"
:
32
,
"vocab_size"
:
32000
,
"hf_tokenizer_name"
:
"bert-base-uncased"
,
"tokenizer_kwargs"
:
{
"strip_sep_token"
:
true
},
"width"
:
1280
,
"heads"
:
20
,
"layers"
:
32
,
"pool_type"
:
"last"
,
"no_causal_mask"
:
true
}
}
\ No newline at end of file
Prev
1
…
3
4
5
6
7
8
9
10
11
Next
Write
Preview
Markdown
is supported
0%
Try again
or
attach a new file
.
Attach a file
Cancel
You are about to add
0
people
to the discussion. Proceed with caution.
Finish editing this message first!
Cancel
Please
register
or
sign in
to comment