Unverified Commit 94e593ce authored by gushiqiao's avatar gushiqiao Committed by GitHub
Browse files

[Recon] remove mm_config and support load single safetensors file (#375)

parent 954df466
...@@ -14,9 +14,8 @@ ...@@ -14,9 +14,8 @@
"use_31_block": false, "use_31_block": false,
"t5_quantized": true, "t5_quantized": true,
"t5_quant_scheme": "fp8-q8f", "t5_quant_scheme": "fp8-q8f",
"mm_config": { "dit_quantized": true,
"mm_type": "W-fp8-channel-sym-A-fp8-channel-sym-dynamic-Q8F" "dit_quant_scheme": "fp8-q8f",
},
"adapter_quantized": true, "adapter_quantized": true,
"adapter_quant_scheme": "fp8", "adapter_quant_scheme": "fp8",
"cpu_offload": false, "cpu_offload": false,
......
...@@ -13,9 +13,8 @@ ...@@ -13,9 +13,8 @@
"enable_cfg": false, "enable_cfg": false,
"cpu_offload": false, "cpu_offload": false,
"use_31_block": false, "use_31_block": false,
"mm_config": { "dit_quantized": true,
"mm_type": "W-fp8-channel-sym-A-fp8-channel-sym-dynamic-Sgl" "dit_quant_scheme": "fp8-sgl",
},
"adapter_quantized": true, "adapter_quantized": true,
"adapter_quant_scheme": "fp8", "adapter_quant_scheme": "fp8",
"t5_quantized": true, "t5_quantized": true,
......
...@@ -13,9 +13,8 @@ ...@@ -13,9 +13,8 @@
"enable_cfg": false, "enable_cfg": false,
"cpu_offload": false, "cpu_offload": false,
"use_31_block": false, "use_31_block": false,
"mm_config": { "dit_quantized": true,
"mm_type": "W-fp8-channel-sym-A-fp8-channel-sym-dynamic-Sgl" "dit_quant_scheme": "fp8-sgl",
},
"adapter_quantized": true, "adapter_quantized": true,
"adapter_quant_scheme": "fp8", "adapter_quant_scheme": "fp8",
"t5_quantized": true, "t5_quantized": true,
......
...@@ -13,9 +13,10 @@ ...@@ -13,9 +13,10 @@
"enable_cfg": false, "enable_cfg": false,
"cpu_offload": false, "cpu_offload": false,
"use_31_block": false, "use_31_block": false,
"mm_config": { "clip_quantized": true,
"mm_type": "W-fp8-channel-sym-A-fp8-channel-sym-dynamic-Sgl" "clip_quant_scheme": "fp8",
}, "dit_quantized": true,
"dit_quant_scheme": "fp8-sgl",
"adapter_quantized": true, "adapter_quantized": true,
"adapter_quant_scheme": "fp8", "adapter_quant_scheme": "fp8",
"t5_quantized": true, "t5_quantized": true,
......
...@@ -17,9 +17,8 @@ ...@@ -17,9 +17,8 @@
"seq_p_size": 8, "seq_p_size": 8,
"seq_p_attn_type": "ulysses" "seq_p_attn_type": "ulysses"
}, },
"mm_config": { "dit_quantized": true,
"mm_type": "W-fp8-channel-sym-A-fp8-channel-sym-dynamic-Sgl" "dit_quant_scheme": "fp8-sgl",
},
"adapter_quantized": true, "adapter_quantized": true,
"adapter_quant_scheme": "fp8", "adapter_quant_scheme": "fp8",
"t5_quantized": true, "t5_quantized": true,
......
...@@ -27,7 +27,6 @@ ...@@ -27,7 +27,6 @@
"adapter_quant_scheme": "fp8", "adapter_quant_scheme": "fp8",
"vae_cpu_offload": false, "vae_cpu_offload": false,
"use_tiling_vae": false, "use_tiling_vae": false,
"mm_config": { "dit_quantized": true,
"mm_type": "W-fp8-channel-sym-A-fp8-channel-sym-dynamic-Q8F" "dit_quant_scheme": "fp8-sgl"
}
} }
...@@ -26,7 +26,6 @@ ...@@ -26,7 +26,6 @@
"adapter_quant_scheme": "fp8", "adapter_quant_scheme": "fp8",
"vae_cpu_offload": false, "vae_cpu_offload": false,
"use_tiling_vae": false, "use_tiling_vae": false,
"mm_config": { "dit_quantized": true,
"mm_type": "W-fp8-channel-sym-A-fp8-channel-sym-dynamic-Sgl" "dit_quant_scheme": "fp8-sgl"
}
} }
...@@ -17,9 +17,8 @@ ...@@ -17,9 +17,8 @@
"seq_p_size": 4, "seq_p_size": 4,
"seq_p_attn_type": "ulysses" "seq_p_attn_type": "ulysses"
}, },
"mm_config": { "dit_quantized": true,
"mm_type": "W-fp8-channel-sym-A-fp8-channel-sym-dynamic-Sgl" "dit_quant_scheme": "fp8-sgl",
},
"adapter_quantized": true, "adapter_quantized": true,
"adapter_quant_scheme": "fp8", "adapter_quant_scheme": "fp8",
"t5_quantized": true, "t5_quantized": true,
......
...@@ -21,9 +21,8 @@ ...@@ -21,9 +21,8 @@
"seq_p_size": 4, "seq_p_size": 4,
"seq_p_attn_type": "ulysses" "seq_p_attn_type": "ulysses"
}, },
"mm_config": { "dit_quantized": true,
"mm_type": "W-fp8-channel-sym-A-fp8-channel-sym-dynamic-Sgl" "dit_quant_scheme": "fp8-sgl",
},
"adapter_quantized": true, "adapter_quantized": true,
"adapter_quant_scheme": "fp8", "adapter_quant_scheme": "fp8",
"t5_quantized": true, "t5_quantized": true,
......
...@@ -22,9 +22,8 @@ ...@@ -22,9 +22,8 @@
"seq_p_size": 8, "seq_p_size": 8,
"seq_p_attn_type": "ulysses" "seq_p_attn_type": "ulysses"
}, },
"mm_config": { "dit_quantized": true,
"mm_type": "W-fp8-channel-sym-A-fp8-channel-sym-dynamic-Sgl" "dit_quant_scheme": "fp8-sgl",
},
"adapter_quantized": true, "adapter_quantized": true,
"adapter_quant_scheme": "fp8", "adapter_quant_scheme": "fp8",
"t5_quantized": true, "t5_quantized": true,
......
...@@ -53,9 +53,8 @@ ...@@ -53,9 +53,8 @@
"seq_p_size": 8, "seq_p_size": 8,
"seq_p_attn_type": "ulysses" "seq_p_attn_type": "ulysses"
}, },
"mm_config": { "dit_quantized": true,
"mm_type": "W-fp8-channel-sym-A-fp8-channel-sym-dynamic-Sgl" "dit_quant_scheme": "fp8-sgl",
},
"adapter_quantized": true, "adapter_quantized": true,
"adapter_quant_scheme": "fp8", "adapter_quant_scheme": "fp8",
"t5_quantized": true, "t5_quantized": true,
......
...@@ -54,9 +54,8 @@ ...@@ -54,9 +54,8 @@
"seq_p_size": 8, "seq_p_size": 8,
"seq_p_attn_type": "ulysses" "seq_p_attn_type": "ulysses"
}, },
"mm_config": { "dit_quantized": true,
"mm_type": "W-fp8-channel-sym-A-fp8-channel-sym-dynamic-Sgl" "dit_quant_scheme": "fp8-sgl",
},
"adapter_quantized": true, "adapter_quantized": true,
"adapter_quant_scheme": "fp8", "adapter_quant_scheme": "fp8",
"t5_quantized": true, "t5_quantized": true,
......
...@@ -17,9 +17,8 @@ ...@@ -17,9 +17,8 @@
"seq_p_size": 8, "seq_p_size": 8,
"seq_p_attn_type": "ulysses" "seq_p_attn_type": "ulysses"
}, },
"mm_config": { "dit_quantized": true,
"mm_type": "W-fp8-channel-sym-A-fp8-channel-sym-dynamic-Sgl" "dit_quant_scheme": "fp8-sgl",
},
"adapter_quantized": true, "adapter_quantized": true,
"adapter_quant_scheme": "fp8", "adapter_quant_scheme": "fp8",
"t5_quantized": true, "t5_quantized": true,
......
...@@ -19,9 +19,8 @@ ...@@ -19,9 +19,8 @@
"refert_num": 1, "refert_num": 1,
"replace_flag": false, "replace_flag": false,
"fps": 30, "fps": 30,
"mm_config": { "dit_quantized": true,
"mm_type": "W-fp8-channel-sym-A-fp8-channel-sym-dynamic-Q8F" "dit_quant_scheme": "fp8-sgl",
},
"t5_quantized": true, "t5_quantized": true,
"t5_quant_scheme": "fp8", "t5_quant_scheme": "fp8",
"clip_quantized": true, "clip_quantized": true,
......
...@@ -21,9 +21,8 @@ ...@@ -21,9 +21,8 @@
"refert_num": 1, "refert_num": 1,
"fps": 30, "fps": 30,
"replace_flag": true, "replace_flag": true,
"mm_config": { "dit_quantized": true,
"mm_type": "W-fp8-channel-sym-A-fp8-channel-sym-dynamic-Q8F" "dit_quant_scheme": "fp8-q8f",
},
"t5_quantized": true, "t5_quantized": true,
"t5_quant_scheme": "fp8", "t5_quant_scheme": "fp8",
"clip_quantized": true, "clip_quantized": true,
......
...@@ -25,9 +25,8 @@ ...@@ -25,9 +25,8 @@
500, 500,
250 250
], ],
"mm_config": { "dit_quantized": true,
"mm_type": "W-fp8-channel-sym-A-fp8-channel-sym-dynamic-Sgl" "dit_quant_scheme": "fp8-sgl",
},
"t5_quantized": true, "t5_quantized": true,
"t5_quant_scheme": "fp8" "t5_quant_scheme": "fp8"
} }
...@@ -25,9 +25,8 @@ ...@@ -25,9 +25,8 @@
500, 500,
250 250
], ],
"mm_config": { "dit_quantized": true,
"mm_type": "W-int8-channel-sym-A-int8-channel-sym-dynamic-Vllm" "dit_quant_scheme": "int8-vllm",
},
"t5_quantized": true, "t5_quantized": true,
"t5_quant_scheme": "int8" "t5_quant_scheme": "int8"
} }
...@@ -24,7 +24,5 @@ ...@@ -24,7 +24,5 @@
750, 750,
500, 500,
250 250
], ]
"dit_distill_ckpt_high": "Wan2.2-I2V-A14B/distill_models/high_noise_model/distill_model.safetensors",
"dit_distill_ckpt_low": "Wan2.2-I2V-A14B/distill_models/low_noise_model/distill_model.safetensors"
} }
...@@ -25,9 +25,8 @@ ...@@ -25,9 +25,8 @@
500, 500,
250 250
], ],
"mm_config": { "dit_quantized": true,
"mm_type": "W-fp8-channel-sym-A-fp8-channel-sym-dynamic-Q8F" "dit_quant_scheme": "fp8-q8f",
},
"t5_quantized": true, "t5_quantized": true,
"t5_quant_scheme": "fp8-q8f" "t5_quant_scheme": "fp8-q8f"
} }
...@@ -25,9 +25,8 @@ ...@@ -25,9 +25,8 @@
500, 500,
250 250
], ],
"mm_config": { "dit_quantized": true,
"mm_type": "W-int8-channel-sym-A-int8-channel-sym-dynamic-Vllm" "dit_quant_scheme": "fp8-sgl",
},
"t5_quantized": true, "t5_quantized": true,
"t5_quant_scheme": "int8" "t5_quant_scheme": "fp8"
} }
Markdown is supported
0% or .
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or to comment