auto_quick_check_config.json 527 Bytes
Newer Older
liuxu3's avatar
liuxu3 committed
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
{
    "DCU": "BW1000",
    "vllm_version": "0.9.2",
    "pkg_version": "dtk25.04.1",
    "dst_path": "./result/",
    "items": [
        {
            "model_name": "Qwen3-32B",
            "model_path": "/data/models/Qwen3-32B/",
            "dtype": "float16",
            "tensor_parallel": [4],
            "batch_size_start": 4,
            "batch_size_interval": 4,
            "seqlen_tuple": ["512 512", "1024 1024"],
            "ttft_thres": [3000, 3000],
            "tpot_thres": [100, "inf"]
        }
    ]
}