auto_quick_check_config.json 421 Bytes
Newer Older
liuxu3's avatar
liuxu3 committed
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
{
    "DCU": "BW1000",
    "vllm_version": "0.9.2",
    "pkg_version": "dtk25.04.1",
    "dst_path": "./result/",
    "items": [
        {
            "model_name": "Qwen3-32B",
            "model_path": "/data/models/Qwen3-32B/",
            "dtype": "float16",
            "tensor_parallel": [4],
            "batch_size": [128, 64, 32, 16],
            "seqlen_tuple": ["512 512", "1024 1024"]
        }
    ]
}