Unverified commit 94e593ce, authored by gushiqiao, committed by GitHub
Browse files

[Recon] remove mm_config and support load single safetensors file (#375)

parent 954df466
......@@ -10,8 +10,7 @@
"sample_shift": 5,
"enable_cfg": true,
"cpu_offload": false,
"mm_config": {
"mm_type": "W-fp8-channel-sym-A-fp8-channel-sym-dynamic-Sgl-ActVllm"
},
"dit_quantized": true,
"dit_quant_scheme": "fp8-sgl",
"use_tiling_vae": true
}
......@@ -16,8 +16,7 @@
500,
250
],
"mm_config": {
"mm_type": "W-fp8-channel-sym-A-fp8-channel-sym-dynamic-Sgl-ActVllm"
},
"dit_quantized": true,
"dit_quant_scheme": "fp8-sgl",
"use_tiling_vae": true
}
......@@ -10,9 +10,8 @@
"sample_shift": 5,
"enable_cfg": true,
"cpu_offload": false,
"mm_config": {
"mm_type": "W-fp8-channel-sym-A-fp8-channel-sym-dynamic-Sgl-ActVllm"
},
"dit_quantized": true,
"dit_quant_scheme": "fp8-sgl",
"feature_caching": "Tea",
"coefficients": [
[
......
......@@ -13,8 +13,7 @@
"offload_granularity": "block",
"offload_ratio": 0.8,
"t5_cpu_offload": true,
"mm_config": {
"mm_type": "W-fp8-channel-sym-A-fp8-channel-sym-dynamic-Q8F"
},
"dit_quantized": true,
"dit_quant_scheme": "fp8-sgl",
"use_tiling_vae": true
}
......@@ -19,8 +19,7 @@
500,
250
],
"mm_config": {
"mm_type": "W-fp8-channel-sym-A-fp8-channel-sym-dynamic-Q8F"
},
"dit_quantized": true,
"dit_quant_scheme": "fp8-sgl",
"use_tiling_vae": true
}
......@@ -13,8 +13,7 @@
"offload_granularity": "block",
"offload_ratio": 0.8,
"t5_cpu_offload": true,
"mm_config": {
"mm_type": "W-fp8-channel-sym-A-fp8-channel-sym-dynamic-Q8F"
},
"dit_quantized": true,
"dit_quant_scheme": "fp8-sgl",
"use_tiling_vae": true
}
......@@ -19,8 +19,7 @@
500,
250
],
"mm_config": {
"mm_type": "W-fp8-channel-sym-A-fp8-channel-sym-dynamic-Q8F"
},
"dit_quantized": true,
"dit_quant_scheme": "fp8-sgl",
"use_tiling_vae": true
}
......@@ -15,5 +15,12 @@
750,
500,
250
]
],
"mm_config": {
"mm_type": "W-fp8-channel-sym-A-fp8-channel-sym-dynamic-Vllm"
},
"dit_quantized": true,
"dit_quant_scheme": "fp8-sgl",
"dit_quantized_ckpt": "/data/nvme0/gushiqiao/models/hf_lightx2v_models/models/wan2.1_i2v_480p_scaled_fp8_e4m3_lightx2v_4step.safetensors"
}
......@@ -16,5 +16,6 @@
750,
500,
250
]
],
"dit_original_ckpt": "/data/nvme0/gushiqiao/models/hf_lightx2v_models/models/wan2.1_t2v_14b_lightx2v_4step.safetensors"
}
......@@ -13,7 +13,6 @@
"cpu_offload": true,
"offload_granularity": "block",
"t5_cpu_offload": true,
"mm_config": {
"mm_type": "W-int8-channel-sym-A-int8-channel-sym-dynamic-Vllm"
}
"dit_quantized": true,
"dit_quant_scheme": "fp8-sgl"
}
......@@ -13,9 +13,8 @@
"offload_granularity": "phase",
"t5_offload_granularity": "block",
"dit_quantized_ckpt": "/path/to/dit_quant_model",
"mm_config": {
"mm_type": "W-fp8-channel-sym-A-fp8-channel-sym-dynamic-Vllm"
},
"dit_quantized": true,
"dit_quant_scheme": "fp8-vllm",
"t5_cpu_offload": true,
"t5_quantized": true,
"t5_quantized_ckpt": "/path/to/models_t5_umt5-xxl-enc-fp8.pth",
......
......@@ -13,9 +13,8 @@
"offload_granularity": "phase",
"t5_offload_granularity": "block",
"dit_quantized_ckpt": "/path/to/dit_quant_model",
"mm_config": {
"mm_type": "W-fp8-channel-sym-A-fp8-channel-sym-dynamic-Vllm"
},
"dit_quantized": true,
"dit_quant_scheme": "fp8-vllm",
"t5_cpu_offload": true,
"t5_quantized": true,
"t5_quantized_ckpt": "/path/to/models_t5_umt5-xxl-enc-fp8.pth",
......
......@@ -14,9 +14,8 @@
"t5_cpu_offload": true,
"offload_granularity": "phase",
"dit_quantized_ckpt": "/path/to/dit_int8",
"mm_config": {
"mm_type": "W-int8-channel-sym-A-int8-channel-sym-dynamic-Q8F"
},
"dit_quantized": true,
"dit_quant_scheme": "int8-q8f",
"use_tiny_vae": true,
"tiny_vae_path": "/x2v_models/taew2_1.pth",
"t5_offload_granularity": "block"
......
{
"infer_steps": 20,
"target_video_length": 33,
"i2v_resolution": "720p",
"attention_type": "flash_attn3",
"dit_quantized_ckpt": "/path/to/int8/model",
"mm_config": {
"mm_type": "W-int8-channel-sym-A-int8-channel-sym-dynamic-Vllm"
}
}
......@@ -11,7 +11,6 @@
"enable_cfg": true,
"cpu_offload": false,
"dit_quantized_ckpt": "/path/to/int8/model",
"mm_config": {
"mm_type": "W-int8-channel-sym-A-int8-channel-sym-dynamic-Vllm"
}
"dit_quantized": true,
"dit_quant_scheme": "int8-vllm"
}
......@@ -10,9 +10,8 @@
"sample_shift": 5,
"enable_cfg": false,
"cpu_offload": false,
"mm_config": {
"mm_type": "W-int8-channel-sym-A-int8-channel-sym-dynamic-Q8F"
},
"dit_quantized": true,
"dit_quant_scheme": "int8-q8f",
"t5_quantized": true,
"t5_quant_scheme": "int8-q8f",
"clip_quantized": true,
......
......@@ -10,9 +10,8 @@
"sample_shift": 5,
"enable_cfg": false,
"cpu_offload": false,
"mm_config": {
"mm_type": "W-int8-channel-sym-A-int8-channel-sym-dynamic-Torchao"
},
"dit_quantized": true,
"dit_quant_scheme": "int8-torchao",
"t5_quantized": true,
"t5_quant_scheme": "int8-torchao",
"clip_quantized": true,
......
......@@ -14,9 +14,8 @@
"use_31_block": false,
"t5_quantized": true,
"t5_quant_scheme": "fp8-q8f",
"mm_config": {
"mm_type": "W-fp8-channel-sym-A-fp8-channel-sym-dynamic-Q8F"
},
"dit_quantized": true,
"dit_quant_scheme": "fp8-q8f",
"adapter_quantized": true,
"adapter_quant_scheme": "fp8",
"cpu_offload": false,
......
......@@ -14,9 +14,8 @@
"use_31_block": false,
"t5_quantized": true,
"t5_quant_scheme": "fp8-q8f",
"mm_config": {
"mm_type": "W-fp8-channel-sym-A-fp8-channel-sym-dynamic-Q8F"
},
"dit_quantized": true,
"dit_quant_scheme": "fp8-q8f",
"adapter_quantized": true,
"adapter_quant_scheme": "fp8",
"cpu_offload": false,
......
......@@ -14,9 +14,8 @@
"use_31_block": false,
"t5_quantized": true,
"t5_quant_scheme": "fp8-q8f",
"mm_config": {
"mm_type": "W-fp8-channel-sym-A-fp8-channel-sym-dynamic-Q8F"
},
"dit_quantized": true,
"dit_quant_scheme": "fp8-q8f",
"adapter_quantized": true,
"adapter_quant_scheme": "fp8",
"cpu_offload": false,
......
Markdown is supported
0% Try again or attach a new file.
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or sign in to comment