{
    "infer_steps": 50,
    "target_video_length": 360,
    "num_output_frames": 360,
    "text_len": 512,
    "target_height": 352,
    "target_width": 640,
    "self_attn_1_type": "flash_attn2",
    "cross_attn_1_type": "flash_attn2",
    "cross_attn_2_type": "flash_attn2",
    "seed": 0,
    "sample_guide_scale": 6,
    "sample_shift": 8,
    "enable_cfg": false,
    "cpu_offload": false,
    "sf_config": {
        "local_attn_size": 6,
        "shift": 5.0,
        "num_frame_per_block": 3,
        "num_transformer_blocks": 30,
        "frame_seq_length": 880,
        "num_output_frames": 360,
        "num_inference_steps": 1000,
        "denoising_step_list": [1000.0000,  908.8427,  713.9794]
    },
    "sub_model_folder": "base_distilled_model",
    "sub_model_name": "base_distill.safetensors",
    "mode": "universal",
    "streaming": true,
    "action_config": {
        "blocks": [0, 1, 2, 3, 4, 5, 6, 7, 8, 9, 10, 11, 12, 13, 14],
        "enable_keyboard": true,
        "enable_mouse": true,
        "heads_num": 16,
        "hidden_size": 128,
        "img_hidden_size": 1536,
        "keyboard_dim_in": 4,
        "keyboard_hidden_dim": 1024,
        "mouse_dim_in": 2,
        "mouse_hidden_dim": 1024,
        "mouse_qk_dim_list": [
            8,
            28,
            28
        ],
        "patch_size": [
            1,
            2,
            2
        ],
        "qk_norm": true,
        "qkv_bias": false,
        "rope_dim_list": [
            8,
            28,
            28
        ],
        "rope_theta": 256,
        "vae_time_compression_ratio": 4,
        "windows_size": 3
    },
    "dim": 1536,
    "eps": 1e-06,
    "ffn_dim": 8960,
    "freq_dim": 256,
    "in_dim": 36,
    "inject_sample_info": false,
    "model_type": "i2v",
    "num_heads": 12,
    "num_layers": 30,
    "out_dim": 16
}