auto_quick_check_config.json 448 Bytes
Newer Older
liuxu3's avatar
liuxu3 committed
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
{
    "DCU": "BW1000",  
    "vllm_version": "0.11.0",    
    "pkg_version": "dtk25.04.2",
    "dst_path": "./result/",
    "items":[
        {
            "model_name": "Qwen3-32B",
            "model_path": "/data/models/Qwen3-32B/",
            "dtype": "float16",
            "tensor_parallel": [2, 4],
            "batch_size": [1, 4, 8, 16, 32, 64, 128],
            "seqlen_tuple": ["512 512", "4096 1024", "16384 1024"]  
        }
    ]
}