Skip to content
GitLab
Menu
Projects
Groups
Snippets
Loading...
Help
Help
Support
Community forum
Keyboard shortcuts
?
Submit feedback
Contribute to GitLab
Sign in / Register
Toggle navigation
Menu
Open sidebar
Bw-bestperf
pd-test
Commits
dd80c5ce
Commit
dd80c5ce
authored
Feb 06, 2026
by
jerrrrry
Browse files
Upload New File
parent
eb4e8683
Changes
1
Hide whitespace changes
Inline
Side-by-side
Showing
1 changed file
with
59 additions
and
0 deletions
+59
-0
bf16_2_w4a8/config-w4a8.json
bf16_2_w4a8/config-w4a8.json
+59
-0
No files found.
bf16_2_w4a8/config-w4a8.json
0 → 100644
View file @
dd80c5ce
{
"architectures"
:
[
"DeepseekV3ForCausalLM"
],
"attention_bias"
:
false
,
"attention_dropout"
:
0.0
,
"auto_map"
:
{
"AutoConfig"
:
"configuration_deepseek.DeepseekV3Config"
,
"AutoModel"
:
"modeling_deepseek.DeepseekV3Model"
,
"AutoModelForCausalLM"
:
"modeling_deepseek.DeepseekV3ForCausalLM"
},
"bos_token_id"
:
0
,
"eos_token_id"
:
1
,
"ep_size"
:
1
,
"first_k_dense_replace"
:
3
,
"hidden_act"
:
"silu"
,
"hidden_size"
:
7168
,
"initializer_range"
:
0.02
,
"intermediate_size"
:
18432
,
"kv_lora_rank"
:
512
,
"max_position_embeddings"
:
163840
,
"model_type"
:
"deepseek_v3"
,
"moe_intermediate_size"
:
2048
,
"moe_layer_freq"
:
1
,
"n_group"
:
8
,
"n_routed_experts"
:
256
,
"n_shared_experts"
:
1
,
"norm_topk_prob"
:
true
,
"num_attention_heads"
:
128
,
"num_experts_per_tok"
:
8
,
"num_hidden_layers"
:
61
,
"num_key_value_heads"
:
128
,
"num_nextn_predict_layers"
:
1
,
"q_lora_rank"
:
1536
,
"qk_nope_head_dim"
:
128
,
"qk_rope_head_dim"
:
64
,
"quantization_config"
:
{
"activation_scheme"
:
"dynamic"
,
"quant_method"
:
"slimquant_w4a8"
},
"rms_norm_eps"
:
1e-06
,
"rope_scaling"
:
{
"beta_fast"
:
32
,
"beta_slow"
:
1
,
"factor"
:
40
,
"mscale"
:
1.0
,
"mscale_all_dim"
:
1.0
,
"original_max_position_embeddings"
:
4096
,
"type"
:
"yarn"
},
"rope_theta"
:
10000
,
"routed_scaling_factor"
:
2.5
,
"scoring_func"
:
"sigmoid"
,
"tie_word_embeddings"
:
false
,
"topk_group"
:
4
,
"topk_method"
:
"noaux_tc"
,
"torch_dtype"
:
"bfloat16"
,
"transformers_version"
:
"4.46.3"
,
"use_cache"
:
true
,
"v_head_dim"
:
128
,
"vocab_size"
:
129280
}
Write
Preview
Markdown
is supported
0%
Try again
or
attach a new file
.
Attach a file
Cancel
You are about to add
0
people
to the discussion. Proceed with caution.
Finish editing this message first!
Cancel
Please
register
or
sign in
to comment