Commit 85762c1a authored by Xiaowei.zhang's avatar Xiaowei.zhang
Browse files

Init the main branch for aiter

parent ae0b3521
Pipeline #3505 canceled with stages
arch,quant_type,indtype,token,inter_dim,model_dim,expert,topk,q_size_n,q_size_k,sol_type,sol_id,time_us
gfx936,no_quant,torch.float16,1,256,8192,256,4,0,0,ck,576,309.8021428571405
gfx936,no_quant,torch.float16,8,256,8192,256,4,0,0,ck,576,364.40785714285965
gfx936,no_quant,torch.float16,16,256,8192,256,4,0,0,ck,576,705.001571428565
gfx936,no_quant,torch.float16,24,256,8192,256,4,0,0,ck,272,1028.2664285714334
gfx936,no_quant,torch.float16,32,256,8192,256,4,0,0,ck,576,1293.2290000000055
gfx936,no_quant,torch.float16,48,256,8192,256,4,0,0,ck,272,1877.2707142857207
gfx936,no_quant,torch.float16,64,256,8192,256,4,0,0,ck,576,2193.247142857142
gfx936,no_quant,torch.float16,96,256,8192,256,4,0,0,ck,272,2471.966714285715
gfx936,no_quant,torch.float16,128,256,8192,256,4,0,0,ck,576,2724.7889999999948
gfx936,no_quant,torch.float16,256,256,8192,256,4,0,0,ck,576,3391.9192857142875
gfx936,no_quant,torch.float16,512,256,8192,256,4,0,0,ck,576,3537.358999999999
gfx936,no_quant,torch.float16,1024,256,8192,256,4,0,0,ck,272,5022.04200000001
gfx936,no_quant,torch.float16,2048,256,8192,256,4,0,0,ck,272,6217.148285714277
gfx936,no_quant,torch.float16,4096,256,8192,256,4,0,0,ck,272,8764.503571428571
gfx936,no_quant,torch.float16,8192,256,8192,256,4,0,0,ck,272,16520.489142857128
gfx936,no_quant,torch.float16,1,256,7168,256,8,0,0,ck,576,274.4422857142844
gfx936,no_quant,torch.float16,8,256,7168,256,8,0,0,ck,576,584.9560000000014
gfx936,no_quant,torch.float16,16,256,7168,256,8,0,0,ck,576,1056.360857142859
gfx936,no_quant,torch.float16,24,256,7168,256,8,0,0,ck,576,1480.196999999999
gfx936,no_quant,torch.float16,32,256,7168,256,8,0,0,ck,576,1867.970714285712
gfx936,no_quant,torch.float16,48,256,7168,256,8,0,0,ck,576,2312.378428571425
gfx936,no_quant,torch.float16,64,256,7168,256,8,0,0,ck,576,2382.001142857145
gfx936,no_quant,torch.float16,96,256,7168,256,8,0,0,ck,576,2795.691714285705
gfx936,no_quant,torch.float16,128,256,7168,256,8,0,0,ck,576,2820.2631428571426
gfx936,no_quant,torch.float16,256,256,7168,256,8,0,0,ck,576,3055.348428571423
gfx936,no_quant,torch.float16,512,256,7168,256,8,0,0,ck,272,4095.392285714287
gfx936,no_quant,torch.float16,1024,256,7168,256,8,0,0,ck,272,5514.589714285707
gfx936,no_quant,torch.float16,2048,256,7168,256,8,0,0,ck,272,7718.288428571438
gfx936,no_quant,torch.float16,4096,256,7168,256,8,0,0,ck,272,14435.327142857148
gfx936,no_quant,torch.float16,8192,256,7168,256,8,0,0,ck,272,27862.7415
arch,quant_type,indtype,token,inter_dim,model_dim,expert,topk,q_size_n,q_size_k,sol_type,sol_id,time_us
gfx936,int8_w8a8_block,torch.float16,1,256,7168,256,8,128,128,ck,1073741824,221.7238
gfx936,int8_w8a8_block,torch.float16,2,256,7168,256,8,128,128,ck,1073741824,271.6008
gfx936,int8_w8a8_block,torch.float16,3,256,7168,256,8,128,128,ck,256,347.8034
gfx936,int8_w8a8_block,torch.float16,4,256,7168,256,8,128,128,ck,256,351.302
gfx936,int8_w8a8_block,torch.float16,5,256,7168,256,8,128,128,ck,256,358.7936
gfx936,int8_w8a8_block,torch.float16,6,256,7168,256,8,128,128,ck,256,449.8388
gfx936,int8_w8a8_block,torch.float16,7,256,7168,256,8,128,128,ck,256,447.4445
gfx936,int8_w8a8_block,torch.float16,8,256,7168,256,8,128,128,ck,256,454.0529
gfx936,int8_w8a8_block,torch.float16,9,256,7168,256,8,128,128,ck,256,470.7523
gfx936,int8_w8a8_block,torch.float16,10,256,7168,256,8,128,128,ck,256,496.542
gfx936,int8_w8a8_block,torch.float16,11,256,7168,256,8,128,128,ck,256,496.3151
gfx936,int8_w8a8_block,torch.float16,12,256,7168,256,8,128,128,ck,256,517.557
gfx936,int8_w8a8_block,torch.float16,13,256,7168,256,8,128,128,ck,256,710.8428
gfx936,int8_w8a8_block,torch.float16,14,256,7168,256,8,128,128,ck,256,719.7744
gfx936,int8_w8a8_block,torch.float16,15,256,7168,256,8,128,128,ck,256,708.893
gfx936,int8_w8a8_block,torch.float16,16,256,7168,256,8,128,128,ck,256,736.713
gfx936,int8_w8a8_block,torch.float16,17,256,7168,256,8,128,128,ck,256,723.91
gfx936,int8_w8a8_block,torch.float16,18,256,7168,256,8,128,128,ck,256,731.7118
gfx936,int8_w8a8_block,torch.float16,19,256,7168,256,8,128,128,ck,256,921.5805
gfx936,int8_w8a8_block,torch.float16,20,256,7168,256,8,128,128,ck,256,931.757
gfx936,int8_w8a8_block,torch.float16,21,256,7168,256,8,128,128,ck,256,925.7805
gfx936,int8_w8a8_block,torch.float16,22,256,7168,256,8,128,128,ck,256,933.0314
gfx936,int8_w8a8_block,torch.float16,23,256,7168,256,8,128,128,ck,256,946.4677
gfx936,int8_w8a8_block,torch.float16,24,256,7168,256,8,128,128,ck,256,966.1805
gfx936,int8_w8a8_block,torch.float16,25,256,7168,256,8,128,128,ck,256,957.8053
gfx936,int8_w8a8_block,torch.float16,26,256,7168,256,8,128,128,ck,256,994.1703
gfx936,int8_w8a8_block,torch.float16,27,256,7168,256,8,128,128,ck,256,1027.6255
gfx936,int8_w8a8_block,torch.float16,28,256,7168,256,8,128,128,ck,256,986.7748
gfx936,int8_w8a8_block,torch.float16,29,256,7168,256,8,128,128,ck,256,1012.4916
gfx936,int8_w8a8_block,torch.float16,30,256,7168,256,8,128,128,ck,256,1031.3195
gfx936,int8_w8a8_block,torch.float16,31,256,7168,256,8,128,128,ck,256,1210.7522
gfx936,int8_w8a8_block,torch.float16,32,256,7168,256,8,128,128,ck,256,1213.3539
gfx936,int8_w8a8_block,torch.float16,34,256,7168,256,8,128,128,ck,256,1217.8463
gfx936,int8_w8a8_block,torch.float16,36,256,7168,256,8,128,128,ck,256,1229.2845
gfx936,int8_w8a8_block,torch.float16,40,256,7168,256,8,128,128,ck,256,1246.6734
gfx936,int8_w8a8_block,torch.float16,44,256,7168,256,8,128,128,ck,256,1268.3449
gfx936,int8_w8a8_block,torch.float16,48,256,7168,256,8,128,128,ck,256,1448.0706
gfx936,int8_w8a8_block,torch.float16,56,256,7168,256,8,128,128,ck,256,1448.6066
gfx936,int8_w8a8_block,torch.float16,64,256,7168,256,8,128,128,ck,256,1533.3137
gfx936,int8_w8a8_block,torch.float16,68,256,7168,256,8,128,128,ck,256,1533.2071
gfx936,int8_w8a8_block,torch.float16,72,256,7168,256,8,128,128,ck,256,1543.6504
gfx936,int8_w8a8_block,torch.float16,80,256,7168,256,8,128,128,ck,256,1557.7885
gfx936,int8_w8a8_block,torch.float16,88,256,7168,256,8,128,128,ck,256,1569.5416
gfx936,int8_w8a8_block,torch.float16,96,256,7168,256,8,128,128,ck,256,1748.5222
gfx936,int8_w8a8_block,torch.float16,104,256,7168,256,8,128,128,ck,256,1780.6233
gfx936,int8_w8a8_block,torch.float16,112,256,7168,256,8,128,128,ck,256,1788.6033
gfx936,int8_w8a8_block,torch.float16,128,256,7168,256,8,128,128,ck,256,1808.0838
gfx936,int8_w8a8_block,torch.float16,144,256,7168,256,8,128,128,ck,256,1837.7577
gfx936,int8_w8a8_block,torch.float16,160,256,7168,256,8,128,128,ck,256,1852.4556
gfx936,int8_w8a8_block,torch.float16,192,256,7168,256,8,128,128,ck,256,1883.3793
gfx936,int8_w8a8_block,torch.float16,224,256,7168,256,8,128,128,ck,256,1923.4614
gfx936,int8_w8a8_block,torch.float16,256,256,7168,256,8,128,128,ck,256,1958.9242
gfx936,int8_w8a8_block,torch.float16,320,256,7168,256,8,128,128,ck,256,2031.9791
gfx936,int8_w8a8_block,torch.float16,384,256,7168,256,8,128,128,ck,256,2129.4956
gfx936,int8_w8a8_block,torch.float16,448,256,7168,256,8,128,128,ck,256,2504.2611
gfx936,int8_w8a8_block,torch.float16,512,256,7168,256,8,128,128,ck,256,2790.1238
gfx936,int8_w8a8_block,torch.float16,768,256,7168,256,8,128,128,ck,1073741824,3529.9268
gfx936,int8_w8a8_block,torch.float16,1024,256,7168,256,8,128,128,ck,256,4366.3522
gfx936,int8_w8a8_block,torch.float16,1024,256,7168,256,8,128,128,ck,256,4391.4689
gfx936,int8_w8a8_block,torch.float16,1152,256,7168,256,8,128,128,ck,256,4889.4998
gfx936,int8_w8a8_block,torch.float16,1,2304,7168,256,8,128,128,ck,256,560.4577
gfx936,int8_w8a8_block,torch.float16,2,2304,7168,256,8,128,128,ck,1073741824,922.3036
gfx936,int8_w8a8_block,torch.float16,3,2304,7168,256,8,128,128,ck,256,1211.5382
gfx936,int8_w8a8_block,torch.float16,4,2304,7168,256,8,128,128,ck,256,1609.7351
gfx936,int8_w8a8_block,torch.float16,5,2304,7168,256,8,128,128,ck,256,2033.1529
gfx936,int8_w8a8_block,torch.float16,6,2304,7168,256,8,128,128,ck,256,2095.9823
gfx936,int8_w8a8_block,torch.float16,7,2304,7168,256,8,128,128,ck,256,2525.8506
gfx936,int8_w8a8_block,torch.float16,8,2304,7168,256,8,128,128,ck,256,3121.4785
gfx936,int8_w8a8_block,torch.float16,9,2304,7168,256,8,128,128,ck,256,3602.7825
gfx936,int8_w8a8_block,torch.float16,10,2304,7168,256,8,128,128,ck,256,3449.7641
gfx936,int8_w8a8_block,torch.float16,11,2304,7168,256,8,128,128,ck,256,4044.0698
gfx936,int8_w8a8_block,torch.float16,12,2304,7168,256,8,128,128,ck,256,4134.7811
gfx936,int8_w8a8_block,torch.float16,13,2304,7168,256,8,128,128,ck,256,4802.8215
gfx936,int8_w8a8_block,torch.float16,14,2304,7168,256,8,128,128,ck,256,4719.2344
gfx936,int8_w8a8_block,torch.float16,15,2304,7168,256,8,128,128,ck,256,4980.6316
gfx936,int8_w8a8_block,torch.float16,16,2304,7168,256,8,128,128,ck,256,5250.5172
gfx936,int8_w8a8_block,torch.float16,17,2304,7168,256,8,128,128,ck,256,5673.4436
gfx936,int8_w8a8_block,torch.float16,18,2304,7168,256,8,128,128,ck,256,5719.9952
gfx936,int8_w8a8_block,torch.float16,19,2304,7168,256,8,128,128,ck,256,6126.3857
gfx936,int8_w8a8_block,torch.float16,20,2304,7168,256,8,128,128,ck,256,6389.1556
gfx936,int8_w8a8_block,torch.float16,21,2304,7168,256,8,128,128,ck,256,6198.0488
gfx936,int8_w8a8_block,torch.float16,22,2304,7168,256,8,128,128,ck,256,6704.2199
gfx936,int8_w8a8_block,torch.float16,23,2304,7168,256,8,128,128,ck,256,6957.5245
gfx936,int8_w8a8_block,torch.float16,24,2304,7168,256,8,128,128,ck,256,6653.9634
gfx936,int8_w8a8_block,torch.float16,25,2304,7168,256,8,128,128,ck,256,7419.4212
gfx936,int8_w8a8_block,torch.float16,26,2304,7168,256,8,128,128,ck,256,7740.734
gfx936,int8_w8a8_block,torch.float16,27,2304,7168,256,8,128,128,ck,256,7583.9258
gfx936,int8_w8a8_block,torch.float16,28,2304,7168,256,8,128,128,ck,256,8067.6719
gfx936,int8_w8a8_block,torch.float16,29,2304,7168,256,8,128,128,ck,256,7827.3022
gfx936,int8_w8a8_block,torch.float16,30,2304,7168,256,8,128,128,ck,256,8226.0128
gfx936,int8_w8a8_block,torch.float16,31,2304,7168,256,8,128,128,ck,256,8765.0934
gfx936,int8_w8a8_block,torch.float16,32,2304,7168,256,8,128,128,ck,256,8287.4442
gfx936,int8_w8a8_block,torch.float16,34,2304,7168,256,8,128,128,ck,256,9189.8303
gfx936,int8_w8a8_block,torch.float16,36,2304,7168,256,8,128,128,ck,256,9010.0497
gfx936,int8_w8a8_block,torch.float16,40,2304,7168,256,8,128,128,ck,256,9991.6976
gfx936,int8_w8a8_block,torch.float16,44,2304,7168,256,8,128,128,ck,256,10406.3407
gfx936,int8_w8a8_block,torch.float16,48,2304,7168,256,8,128,128,ck,256,10457.3132
gfx936,int8_w8a8_block,torch.float16,56,2304,7168,256,8,128,128,ck,256,10918.0446
gfx936,int8_w8a8_block,torch.float16,64,2304,7168,256,8,128,128,ck,256,12263.38
gfx936,int8_w8a8_block,torch.float16,68,2304,7168,256,8,128,128,ck,256,12388.0282
gfx936,int8_w8a8_block,torch.float16,72,2304,7168,256,8,128,128,ck,256,12684.0274
gfx936,int8_w8a8_block,torch.float16,80,2304,7168,256,8,128,128,ck,256,12786.4017
gfx936,int8_w8a8_block,torch.float16,88,2304,7168,256,8,128,128,ck,256,12816.288
gfx936,int8_w8a8_block,torch.float16,96,2304,7168,256,8,128,128,ck,256,13388.8676
gfx936,int8_w8a8_block,torch.float16,104,2304,7168,256,8,128,128,ck,256,13664.4714
gfx936,int8_w8a8_block,torch.float16,112,2304,7168,256,8,128,128,ck,1073741824,13843.4207
gfx936,int8_w8a8_block,torch.float16,128,2304,7168,256,8,128,128,ck,1073741824,14062.0561
gfx936,int8_w8a8_block,torch.float16,144,2304,7168,256,8,128,128,ck,1073741824,13992.1954
gfx936,int8_w8a8_block,torch.float16,160,2304,7168,256,8,128,128,ck,1073741824,14250.3336
gfx936,int8_w8a8_block,torch.float16,192,2304,7168,256,8,128,128,ck,1073741824,14385.9878
gfx936,int8_w8a8_block,torch.float16,224,2304,7168,256,8,128,128,ck,1073741824,14440.0596
gfx936,int8_w8a8_block,torch.float16,256,2304,7168,256,8,128,128,ck,1073741824,14530.2234
gfx936,int8_w8a8_block,torch.float16,320,2304,7168,256,8,128,128,ck,1073741824,14700.4377
gfx936,int8_w8a8_block,torch.float16,384,2304,7168,256,8,128,128,ck,1073741824,14808.9845
gfx936,int8_w8a8_block,torch.float16,448,2304,7168,256,8,128,128,ck,1073741824,14983.8729
gfx936,int8_w8a8_block,torch.float16,512,2304,7168,256,8,128,128,ck,1073741824,15144.0743
gfx936,int8_w8a8_block,torch.float16,768,2304,7168,256,8,128,128,ck,1073741824,16370.4801
gfx936,int8_w8a8_block,torch.float16,1024,2304,7168,256,8,128,128,ck,1073741824,22165.7068
gfx936,int8_w8a8_block,torch.float16,1024,2304,7168,256,8,128,128,ck,1073741824,22200.5112
gfx936,int8_w8a8_block,torch.float16,1152,2304,7168,256,8,128,128,ck,1073741824,26188.6939
gfx936,int8_w8a8_block,torch.float16,1,1536,4096,128,8,128,128,ck,256,291.658
gfx936,int8_w8a8_block,torch.float16,2,1536,4096,128,8,128,128,ck,256,409.0957
gfx936,int8_w8a8_block,torch.float16,3,1536,4096,128,8,128,128,ck,256,545.9305
gfx936,int8_w8a8_block,torch.float16,4,1536,4096,128,8,128,128,ck,256,680.0244
gfx936,int8_w8a8_block,torch.float16,5,1536,4096,128,8,128,128,ck,256,824.0053
gfx936,int8_w8a8_block,torch.float16,6,1536,4096,128,8,128,128,ck,256,961.9745
gfx936,int8_w8a8_block,torch.float16,7,1536,4096,128,8,128,128,ck,256,993.5245
gfx936,int8_w8a8_block,torch.float16,8,1536,4096,128,8,128,128,ck,256,1152.4533
gfx936,int8_w8a8_block,torch.float16,9,1536,4096,128,8,128,128,ck,256,1160.7529
gfx936,int8_w8a8_block,torch.float16,10,1536,4096,128,8,128,128,ck,256,1266.7067
gfx936,int8_w8a8_block,torch.float16,11,1536,4096,128,8,128,128,ck,256,1295.2701
gfx936,int8_w8a8_block,torch.float16,12,1536,4096,128,8,128,128,ck,256,1440.103
gfx936,int8_w8a8_block,torch.float16,13,1536,4096,128,8,128,128,ck,256,1697.6591
gfx936,int8_w8a8_block,torch.float16,14,1536,4096,128,8,128,128,ck,256,1745.6223
gfx936,int8_w8a8_block,torch.float16,15,1536,4096,128,8,128,128,ck,256,1710.5023
gfx936,int8_w8a8_block,torch.float16,16,1536,4096,128,8,128,128,ck,256,1852.1887
gfx936,int8_w8a8_block,torch.float16,17,1536,4096,128,8,128,128,ck,256,1831.4358
gfx936,int8_w8a8_block,torch.float16,18,1536,4096,128,8,128,128,ck,256,1838.3458
gfx936,int8_w8a8_block,torch.float16,19,1536,4096,128,8,128,128,ck,256,2021.7323000000001
gfx936,int8_w8a8_block,torch.float16,20,1536,4096,128,8,128,128,ck,256,2118.7607
gfx936,int8_w8a8_block,torch.float16,21,1536,4096,128,8,128,128,ck,256,2139.1852
gfx936,int8_w8a8_block,torch.float16,22,1536,4096,128,8,128,128,ck,256,2195.0414
gfx936,int8_w8a8_block,torch.float16,23,1536,4096,128,8,128,128,ck,256,2192.328
gfx936,int8_w8a8_block,torch.float16,24,1536,4096,128,8,128,128,ck,256,2440.6246
gfx936,int8_w8a8_block,torch.float16,25,1536,4096,128,8,128,128,ck,256,2200.6248
gfx936,int8_w8a8_block,torch.float16,26,1536,4096,128,8,128,128,ck,256,2218.4566
gfx936,int8_w8a8_block,torch.float16,27,1536,4096,128,8,128,128,ck,256,2453.0879
gfx936,int8_w8a8_block,torch.float16,28,1536,4096,128,8,128,128,ck,256,2350.3684
gfx936,int8_w8a8_block,torch.float16,29,1536,4096,128,8,128,128,ck,256,2476.5557
gfx936,int8_w8a8_block,torch.float16,30,1536,4096,128,8,128,128,ck,256,2487.2788
gfx936,int8_w8a8_block,torch.float16,31,1536,4096,128,8,128,128,ck,256,2440.2945
gfx936,int8_w8a8_block,torch.float16,32,1536,4096,128,8,128,128,ck,256,2470.9654
gfx936,int8_w8a8_block,torch.float16,34,1536,4096,128,8,128,128,ck,256,2640.585
gfx936,int8_w8a8_block,torch.float16,36,1536,4096,128,8,128,128,ck,256,2472.0041
gfx936,int8_w8a8_block,torch.float16,40,1536,4096,128,8,128,128,ck,256,2689.1661
gfx936,int8_w8a8_block,torch.float16,44,1536,4096,128,8,128,128,ck,256,2760.7251
gfx936,int8_w8a8_block,torch.float16,48,1536,4096,128,8,128,128,ck,256,2789.2965
gfx936,int8_w8a8_block,torch.float16,56,1536,4096,128,8,128,128,ck,256,2911.2359
gfx936,int8_w8a8_block,torch.float16,64,1536,4096,128,8,128,128,ck,256,2866.2659
gfx936,int8_w8a8_block,torch.float16,68,1536,4096,128,8,128,128,ck,256,2932.9077
gfx936,int8_w8a8_block,torch.float16,72,1536,4096,128,8,128,128,ck,256,2849.2279
gfx936,int8_w8a8_block,torch.float16,80,1536,4096,128,8,128,128,ck,256,2902.7918
gfx936,int8_w8a8_block,torch.float16,88,1536,4096,128,8,128,128,ck,1073741824,2991.5017
gfx936,int8_w8a8_block,torch.float16,96,1536,4096,128,8,128,128,ck,1073741824,3009.2322
gfx936,int8_w8a8_block,torch.float16,104,1536,4096,128,8,128,128,ck,1073741824,3010.9726
gfx936,int8_w8a8_block,torch.float16,112,1536,4096,128,8,128,128,ck,1073741824,3021.8461
gfx936,int8_w8a8_block,torch.float16,128,1536,4096,128,8,128,128,ck,1073741824,3042.2445
gfx936,int8_w8a8_block,torch.float16,144,1536,4096,128,8,128,128,ck,1073741824,3091.5212
gfx936,int8_w8a8_block,torch.float16,160,1536,4096,128,8,128,128,ck,1073741824,3116.5366
gfx936,int8_w8a8_block,torch.float16,192,1536,4096,128,8,128,128,ck,1073741824,3152.8336
gfx936,int8_w8a8_block,torch.float16,224,1536,4096,128,8,128,128,ck,1073741824,3192.8889
gfx936,int8_w8a8_block,torch.float16,256,1536,4096,128,8,128,128,ck,1073741824,3223.7425
gfx936,int8_w8a8_block,torch.float16,320,1536,4096,128,8,128,128,ck,1073741824,3282.5084
gfx936,int8_w8a8_block,torch.float16,384,1536,4096,128,8,128,128,ck,1073741824,3431.9543
gfx936,int8_w8a8_block,torch.float16,448,1536,4096,128,8,128,128,ck,1073741824,3855.0492
gfx936,int8_w8a8_block,torch.float16,512,1536,4096,128,8,128,128,ck,1073741824,4436.9874
gfx936,int8_w8a8_block,torch.float16,768,1536,4096,128,8,128,128,ck,1073741824,5567.0914
gfx936,int8_w8a8_block,torch.float16,1024,1536,4096,128,8,128,128,ck,1073741824,6996.0452
gfx936,int8_w8a8_block,torch.float16,1024,1536,4096,128,8,128,128,ck,1073741824,6939.3137
gfx936,int8_w8a8_block,torch.float16,1152,1536,4096,128,8,128,128,ck,1073741824,7784.7617
quant_type,indtype,token,inter_dim,model_dim,expert,topk,q_size_n,q_size_k
int8_w8a8_block,torch.float16,1,256,7168,256,8,128,128
int8_w8a8_block,torch.float16,2,256,7168,256,8,128,128
int8_w8a8_block,torch.float16,3,256,7168,256,8,128,128
int8_w8a8_block,torch.float16,4,256,7168,256,8,128,128
int8_w8a8_block,torch.float16,5,256,7168,256,8,128,128
int8_w8a8_block,torch.float16,6,256,7168,256,8,128,128
int8_w8a8_block,torch.float16,7,256,7168,256,8,128,128
int8_w8a8_block,torch.float16,8,256,7168,256,8,128,128
int8_w8a8_block,torch.float16,9,256,7168,256,8,128,128
int8_w8a8_block,torch.float16,10,256,7168,256,8,128,128
int8_w8a8_block,torch.float16,11,256,7168,256,8,128,128
int8_w8a8_block,torch.float16,12,256,7168,256,8,128,128
int8_w8a8_block,torch.float16,13,256,7168,256,8,128,128
int8_w8a8_block,torch.float16,14,256,7168,256,8,128,128
int8_w8a8_block,torch.float16,15,256,7168,256,8,128,128
int8_w8a8_block,torch.float16,16,256,7168,256,8,128,128
int8_w8a8_block,torch.float16,17,256,7168,256,8,128,128
int8_w8a8_block,torch.float16,18,256,7168,256,8,128,128
int8_w8a8_block,torch.float16,19,256,7168,256,8,128,128
int8_w8a8_block,torch.float16,20,256,7168,256,8,128,128
int8_w8a8_block,torch.float16,21,256,7168,256,8,128,128
int8_w8a8_block,torch.float16,22,256,7168,256,8,128,128
int8_w8a8_block,torch.float16,23,256,7168,256,8,128,128
int8_w8a8_block,torch.float16,24,256,7168,256,8,128,128
int8_w8a8_block,torch.float16,25,256,7168,256,8,128,128
int8_w8a8_block,torch.float16,26,256,7168,256,8,128,128
int8_w8a8_block,torch.float16,27,256,7168,256,8,128,128
int8_w8a8_block,torch.float16,28,256,7168,256,8,128,128
int8_w8a8_block,torch.float16,29,256,7168,256,8,128,128
int8_w8a8_block,torch.float16,30,256,7168,256,8,128,128
int8_w8a8_block,torch.float16,31,256,7168,256,8,128,128
int8_w8a8_block,torch.float16,32,256,7168,256,8,128,128
int8_w8a8_block,torch.float16,34,256,7168,256,8,128,128
int8_w8a8_block,torch.float16,36,256,7168,256,8,128,128
int8_w8a8_block,torch.float16,40,256,7168,256,8,128,128
int8_w8a8_block,torch.float16,44,256,7168,256,8,128,128
int8_w8a8_block,torch.float16,48,256,7168,256,8,128,128
int8_w8a8_block,torch.float16,56,256,7168,256,8,128,128
int8_w8a8_block,torch.float16,64,256,7168,256,8,128,128
int8_w8a8_block,torch.float16,68,256,7168,256,8,128,128
int8_w8a8_block,torch.float16,72,256,7168,256,8,128,128
int8_w8a8_block,torch.float16,80,256,7168,256,8,128,128
int8_w8a8_block,torch.float16,88,256,7168,256,8,128,128
int8_w8a8_block,torch.float16,96,256,7168,256,8,128,128
int8_w8a8_block,torch.float16,104,256,7168,256,8,128,128
int8_w8a8_block,torch.float16,112,256,7168,256,8,128,128
int8_w8a8_block,torch.float16,128,256,7168,256,8,128,128
int8_w8a8_block,torch.float16,144,256,7168,256,8,128,128
int8_w8a8_block,torch.float16,160,256,7168,256,8,128,128
int8_w8a8_block,torch.float16,192,256,7168,256,8,128,128
int8_w8a8_block,torch.float16,224,256,7168,256,8,128,128
int8_w8a8_block,torch.float16,256,256,7168,256,8,128,128
int8_w8a8_block,torch.float16,320,256,7168,256,8,128,128
int8_w8a8_block,torch.float16,384,256,7168,256,8,128,128
int8_w8a8_block,torch.float16,448,256,7168,256,8,128,128
int8_w8a8_block,torch.float16,512,256,7168,256,8,128,128
int8_w8a8_block,torch.float16,768,256,7168,256,8,128,128
int8_w8a8_block,torch.float16,1024,256,7168,256,8,128,128
int8_w8a8_block,torch.float16,1024,256,7168,256,8,128,128
int8_w8a8_block,torch.float16,1152,256,7168,256,8,128,128
int8_w8a8_block,torch.float16,1,2304,7168,256,8,128,128
int8_w8a8_block,torch.float16,2,2304,7168,256,8,128,128
int8_w8a8_block,torch.float16,3,2304,7168,256,8,128,128
int8_w8a8_block,torch.float16,4,2304,7168,256,8,128,128
int8_w8a8_block,torch.float16,5,2304,7168,256,8,128,128
int8_w8a8_block,torch.float16,6,2304,7168,256,8,128,128
int8_w8a8_block,torch.float16,7,2304,7168,256,8,128,128
int8_w8a8_block,torch.float16,8,2304,7168,256,8,128,128
int8_w8a8_block,torch.float16,9,2304,7168,256,8,128,128
int8_w8a8_block,torch.float16,10,2304,7168,256,8,128,128
int8_w8a8_block,torch.float16,11,2304,7168,256,8,128,128
int8_w8a8_block,torch.float16,12,2304,7168,256,8,128,128
int8_w8a8_block,torch.float16,13,2304,7168,256,8,128,128
int8_w8a8_block,torch.float16,14,2304,7168,256,8,128,128
int8_w8a8_block,torch.float16,15,2304,7168,256,8,128,128
int8_w8a8_block,torch.float16,16,2304,7168,256,8,128,128
int8_w8a8_block,torch.float16,17,2304,7168,256,8,128,128
int8_w8a8_block,torch.float16,18,2304,7168,256,8,128,128
int8_w8a8_block,torch.float16,19,2304,7168,256,8,128,128
int8_w8a8_block,torch.float16,20,2304,7168,256,8,128,128
int8_w8a8_block,torch.float16,21,2304,7168,256,8,128,128
int8_w8a8_block,torch.float16,22,2304,7168,256,8,128,128
int8_w8a8_block,torch.float16,23,2304,7168,256,8,128,128
int8_w8a8_block,torch.float16,24,2304,7168,256,8,128,128
int8_w8a8_block,torch.float16,25,2304,7168,256,8,128,128
int8_w8a8_block,torch.float16,26,2304,7168,256,8,128,128
int8_w8a8_block,torch.float16,27,2304,7168,256,8,128,128
int8_w8a8_block,torch.float16,28,2304,7168,256,8,128,128
int8_w8a8_block,torch.float16,29,2304,7168,256,8,128,128
int8_w8a8_block,torch.float16,30,2304,7168,256,8,128,128
int8_w8a8_block,torch.float16,31,2304,7168,256,8,128,128
int8_w8a8_block,torch.float16,32,2304,7168,256,8,128,128
int8_w8a8_block,torch.float16,34,2304,7168,256,8,128,128
int8_w8a8_block,torch.float16,36,2304,7168,256,8,128,128
int8_w8a8_block,torch.float16,40,2304,7168,256,8,128,128
int8_w8a8_block,torch.float16,44,2304,7168,256,8,128,128
int8_w8a8_block,torch.float16,48,2304,7168,256,8,128,128
int8_w8a8_block,torch.float16,56,2304,7168,256,8,128,128
int8_w8a8_block,torch.float16,64,2304,7168,256,8,128,128
int8_w8a8_block,torch.float16,68,2304,7168,256,8,128,128
int8_w8a8_block,torch.float16,72,2304,7168,256,8,128,128
int8_w8a8_block,torch.float16,80,2304,7168,256,8,128,128
int8_w8a8_block,torch.float16,88,2304,7168,256,8,128,128
int8_w8a8_block,torch.float16,96,2304,7168,256,8,128,128
int8_w8a8_block,torch.float16,104,2304,7168,256,8,128,128
int8_w8a8_block,torch.float16,112,2304,7168,256,8,128,128
int8_w8a8_block,torch.float16,128,2304,7168,256,8,128,128
int8_w8a8_block,torch.float16,144,2304,7168,256,8,128,128
int8_w8a8_block,torch.float16,160,2304,7168,256,8,128,128
int8_w8a8_block,torch.float16,192,2304,7168,256,8,128,128
int8_w8a8_block,torch.float16,224,2304,7168,256,8,128,128
int8_w8a8_block,torch.float16,256,2304,7168,256,8,128,128
int8_w8a8_block,torch.float16,320,2304,7168,256,8,128,128
int8_w8a8_block,torch.float16,384,2304,7168,256,8,128,128
int8_w8a8_block,torch.float16,448,2304,7168,256,8,128,128
int8_w8a8_block,torch.float16,512,2304,7168,256,8,128,128
int8_w8a8_block,torch.float16,768,2304,7168,256,8,128,128
int8_w8a8_block,torch.float16,1024,2304,7168,256,8,128,128
int8_w8a8_block,torch.float16,1024,2304,7168,256,8,128,128
int8_w8a8_block,torch.float16,1152,2304,7168,256,8,128,128
int8_w8a8_block,torch.float16,1,1536,4096,128,8,128,128
int8_w8a8_block,torch.float16,2,1536,4096,128,8,128,128
int8_w8a8_block,torch.float16,3,1536,4096,128,8,128,128
int8_w8a8_block,torch.float16,4,1536,4096,128,8,128,128
int8_w8a8_block,torch.float16,5,1536,4096,128,8,128,128
int8_w8a8_block,torch.float16,6,1536,4096,128,8,128,128
int8_w8a8_block,torch.float16,7,1536,4096,128,8,128,128
int8_w8a8_block,torch.float16,8,1536,4096,128,8,128,128
int8_w8a8_block,torch.float16,9,1536,4096,128,8,128,128
int8_w8a8_block,torch.float16,10,1536,4096,128,8,128,128
int8_w8a8_block,torch.float16,11,1536,4096,128,8,128,128
int8_w8a8_block,torch.float16,12,1536,4096,128,8,128,128
int8_w8a8_block,torch.float16,13,1536,4096,128,8,128,128
int8_w8a8_block,torch.float16,14,1536,4096,128,8,128,128
int8_w8a8_block,torch.float16,15,1536,4096,128,8,128,128
int8_w8a8_block,torch.float16,16,1536,4096,128,8,128,128
int8_w8a8_block,torch.float16,17,1536,4096,128,8,128,128
int8_w8a8_block,torch.float16,18,1536,4096,128,8,128,128
int8_w8a8_block,torch.float16,19,1536,4096,128,8,128,128
int8_w8a8_block,torch.float16,20,1536,4096,128,8,128,128
int8_w8a8_block,torch.float16,21,1536,4096,128,8,128,128
int8_w8a8_block,torch.float16,22,1536,4096,128,8,128,128
int8_w8a8_block,torch.float16,23,1536,4096,128,8,128,128
int8_w8a8_block,torch.float16,24,1536,4096,128,8,128,128
int8_w8a8_block,torch.float16,25,1536,4096,128,8,128,128
int8_w8a8_block,torch.float16,26,1536,4096,128,8,128,128
int8_w8a8_block,torch.float16,27,1536,4096,128,8,128,128
int8_w8a8_block,torch.float16,28,1536,4096,128,8,128,128
int8_w8a8_block,torch.float16,29,1536,4096,128,8,128,128
int8_w8a8_block,torch.float16,30,1536,4096,128,8,128,128
int8_w8a8_block,torch.float16,31,1536,4096,128,8,128,128
int8_w8a8_block,torch.float16,32,1536,4096,128,8,128,128
int8_w8a8_block,torch.float16,34,1536,4096,128,8,128,128
int8_w8a8_block,torch.float16,36,1536,4096,128,8,128,128
int8_w8a8_block,torch.float16,40,1536,4096,128,8,128,128
int8_w8a8_block,torch.float16,44,1536,4096,128,8,128,128
int8_w8a8_block,torch.float16,48,1536,4096,128,8,128,128
int8_w8a8_block,torch.float16,56,1536,4096,128,8,128,128
int8_w8a8_block,torch.float16,64,1536,4096,128,8,128,128
int8_w8a8_block,torch.float16,68,1536,4096,128,8,128,128
int8_w8a8_block,torch.float16,72,1536,4096,128,8,128,128
int8_w8a8_block,torch.float16,80,1536,4096,128,8,128,128
int8_w8a8_block,torch.float16,88,1536,4096,128,8,128,128
int8_w8a8_block,torch.float16,96,1536,4096,128,8,128,128
int8_w8a8_block,torch.float16,104,1536,4096,128,8,128,128
int8_w8a8_block,torch.float16,112,1536,4096,128,8,128,128
int8_w8a8_block,torch.float16,128,1536,4096,128,8,128,128
int8_w8a8_block,torch.float16,144,1536,4096,128,8,128,128
int8_w8a8_block,torch.float16,160,1536,4096,128,8,128,128
int8_w8a8_block,torch.float16,192,1536,4096,128,8,128,128
int8_w8a8_block,torch.float16,224,1536,4096,128,8,128,128
int8_w8a8_block,torch.float16,256,1536,4096,128,8,128,128
int8_w8a8_block,torch.float16,320,1536,4096,128,8,128,128
int8_w8a8_block,torch.float16,384,1536,4096,128,8,128,128
int8_w8a8_block,torch.float16,448,1536,4096,128,8,128,128
int8_w8a8_block,torch.float16,512,1536,4096,128,8,128,128
int8_w8a8_block,torch.float16,768,1536,4096,128,8,128,128
int8_w8a8_block,torch.float16,1024,1536,4096,128,8,128,128
int8_w8a8_block,torch.float16,1024,1536,4096,128,8,128,128
int8_w8a8_block,torch.float16,1152,1536,4096,128,8,128,128
token,model_dim,inter_dim,expert,topk,act_type,dtype,q_dtype_a,q_dtype_w,q_type,use_g1u1,doweight_stage1,block_m,ksplit,us,tag,err
256,6144,4096,8,2,ActivationType.Silu,torch.bfloat16,torch.float8_e4m3fnuz,torch.float8_e4m3fnuz,QuantType.per_128x128,1,0,32,0,270.8542,fmoe_stage1_bf16_pertokenFp8_blockscale_g1u1_32x512_pf2,1.6%
512,6144,4096,8,2,ActivationType.Silu,torch.bfloat16,torch.int8,torch.int8,QuantType.per_Tensor,1,0,64,0,346.93691000000007,fmoe_stage1_bf16_pertokenInt8_g1u1_64x256_pf3,0.0%
512,6144,4096,8,2,ActivationType.Silu,torch.bfloat16,torch.int8,torch.int8,QuantType.per_Token,1,0,64,0,340.65007,fmoe_stage1_bf16_pertokenInt8_g1u1_64x256_pf3,0.0%
512,6144,4096,8,2,ActivationType.Silu,torch.bfloat16,torch.float8_e4m3fnuz,torch.float8_e4m3fnuz,QuantType.per_Token,1,0,64,0,336.42205,fmoe_stage1_bf16_pertokenFp8_g1u1_64x256_pf3,0.0%
512,6144,4096,8,2,ActivationType.Silu,torch.bfloat16,torch.float8_e4m3fnuz,torch.int4,QuantType.per_Tensor,1,0,128,0,699.5049699999998,ck_128,0.1%
512,6144,4096,8,2,ActivationType.Gelu,torch.bfloat16,torch.int8,torch.int8,QuantType.per_Tensor,1,0,64,0,347.0561,fmoe_stage1_bf16_pertokenInt8_g1u1_64x256_pf3,0.0%
512,6144,4096,8,2,ActivationType.Gelu,torch.bfloat16,torch.int8,torch.int8,QuantType.per_Token,1,0,64,0,334.47364,fmoe_stage1_bf16_pertokenInt8_g1u1_64x256_pf3,0.0%
512,6144,4096,8,2,ActivationType.Gelu,torch.bfloat16,torch.float8_e4m3fnuz,torch.float8_e4m3fnuz,QuantType.per_Token,1,0,64,0,357.0689999999998,fmoe_stage1_bf16_pertokenFp8_g1u1_64x128_2tg_pf3,0.0%
512,6144,4096,8,2,ActivationType.Gelu,torch.bfloat16,torch.float8_e4m3fnuz,torch.int4,QuantType.per_Tensor,1,0,128,0,837.6014699999998,ck_128,0.0%
4,2304,1536,8,2,ActivationType.Gelu,torch.bfloat16,torch.float8_e4m3fnuz,torch.float8_e4m3fnuz,QuantType.per_Token,1,0,32,0,18.364460000000005,fmoe_stage1_bf16_pertokenFp8_g1u1_32x64_4tg_pf3,0.0%
4,2304,1536,8,2,ActivationType.Gelu,torch.bfloat16,torch.float8_e4m3fnuz,torch.float8_e4m3fnuz,QuantType.per_Token,1,1,32,0,19.47728,fmoe_stage1_bf16_pertokenFp8_doweight_g1u1_32x64_4tg_pf3,0.0%
arch,quant_type,indtype,token,inter_dim,model_dim,expert,topk,q_size_n,q_size_k,sol_type,sol_id,time_us
gfx938,no_quant,torch.float16,1,352,4096,128,8,0,0,asm,10008+20000,76.1135
gfx938,no_quant,torch.float16,2,352,4096,128,8,0,0,asm,10011+20002,116.9911
gfx938,no_quant,torch.float16,4,352,4096,128,8,0,0,asm,10002+20000,190.2544
gfx938,no_quant,torch.float16,6,352,4096,128,8,0,0,asm,10011+20000,255.6735
gfx938,no_quant,torch.float16,8,352,4096,128,8,0,0,asm,10002+20000,327.9644
gfx938,no_quant,torch.float16,10,352,4096,128,8,0,0,asm,10002+20000,381.3467
gfx938,no_quant,torch.float16,12,352,4096,128,8,0,0,asm,10002+20000,425.2932
gfx938,no_quant,torch.float16,14,352,4096,128,8,0,0,asm,10002+20000,466.8067
gfx938,no_quant,torch.float16,16,352,4096,128,8,0,0,asm,10002+20000,502.9911
gfx938,no_quant,torch.float16,20,352,4096,128,8,0,0,asm,10002+20000,559.3775
gfx938,no_quant,torch.float16,24,352,4096,128,8,0,0,asm,10002+20000,579.1763
gfx938,no_quant,torch.float16,28,352,4096,128,8,0,0,asm,10002+20000,598.1905
gfx938,no_quant,torch.float16,32,352,4096,128,8,0,0,asm,10002+20000,617.1032
gfx938,no_quant,torch.float16,36,352,4096,128,8,0,0,asm,10002+20000,634.1831
gfx938,no_quant,torch.float16,40,352,4096,128,8,0,0,asm,10002+20000,650.6875
gfx938,no_quant,torch.float16,44,352,4096,128,8,0,0,asm,10002+20000,673.797
gfx938,no_quant,torch.float16,48,352,4096,128,8,0,0,asm,10002+20000,688.9969
gfx938,no_quant,torch.float16,56,352,4096,128,8,0,0,asm,10002+20000,690.6337
gfx938,no_quant,torch.float16,64,352,4096,128,8,0,0,asm,10002+20000,705.25
gfx938,no_quant,torch.float16,68,352,4096,128,8,0,0,asm,10002+20000,692.6071
gfx938,no_quant,torch.float16,72,352,4096,128,8,0,0,asm,10002+20000,693.4728
gfx938,no_quant,torch.float16,80,352,4096,128,8,0,0,asm,10002+20000,693.0667
gfx938,no_quant,torch.float16,88,352,4096,128,8,0,0,asm,10002+20000,698.6174
gfx938,no_quant,torch.float16,96,352,4096,128,8,0,0,asm,10002+20000,701.0585
gfx938,no_quant,torch.float16,104,352,4096,128,8,0,0,asm,10002+20000,700.9929
gfx938,no_quant,torch.float16,112,352,4096,128,8,0,0,asm,10002+20000,702.7078
gfx938,no_quant,torch.float16,128,352,4096,128,8,0,0,asm,10002+20000,706.9581
gfx938,no_quant,torch.float16,144,352,4096,128,8,0,0,asm,10002+20000,729.0544
gfx938,no_quant,torch.float16,160,352,4096,128,8,0,0,asm,10002+20000,722.2728
gfx938,no_quant,torch.float16,192,352,4096,128,8,0,0,asm,10011+20000,742.4902
gfx938,no_quant,torch.float16,224,352,4096,128,8,0,0,asm,11004+21001,774.5392
gfx938,no_quant,torch.float16,256,352,4096,128,8,0,0,asm,11004+21001,780.4756
gfx938,no_quant,torch.float16,320,352,4096,128,8,0,0,asm,11004+21001,796.5904
gfx938,no_quant,torch.float16,384,352,4096,128,8,0,0,asm,11005+21001,804.2211
gfx938,no_quant,torch.float16,448,352,4096,128,8,0,0,asm,12005+22001,833.0702
gfx938,no_quant,torch.float16,512,352,4096,128,8,0,0,asm,12005+22001,847.1173
gfx938,no_quant,torch.float16,576,352,4096,128,8,0,0,asm,12005+22001,857.4557
gfx938,no_quant,torch.float16,640,352,4096,128,8,0,0,asm,12005+22001,867.1542
gfx938,no_quant,torch.float16,704,352,4096,128,8,0,0,asm,12005+22001,878.2925
gfx938,no_quant,torch.float16,768,352,4096,128,8,0,0,asm,12005+22001,890.8995
gfx938,no_quant,torch.float16,832,352,4096,128,8,0,0,asm,12005+22001,900.5198
gfx938,no_quant,torch.float16,896,352,4096,128,8,0,0,asm,12001+22001,958.5009
gfx938,no_quant,torch.float16,960,352,4096,128,8,0,0,asm,12003+22001,985.6514
gfx938,no_quant,torch.float16,1024,352,4096,128,8,0,0,asm,13001+23001,1062.3093
gfx938,no_quant,torch.float16,1152,352,4096,128,8,0,0,asm,13001+23001,1079.7408
gfx938,no_quant,torch.float16,1280,352,4096,128,8,0,0,asm,13001+23001,1090.4801
gfx938,no_quant,torch.float16,1408,352,4096,128,8,0,0,asm,13001+23001,1110.9976
gfx938,no_quant,torch.float16,1536,352,4096,128,8,0,0,asm,13001+23001,1123.6784
gfx938,no_quant,torch.float16,1664,352,4096,128,8,0,0,asm,13001+23001,1141.3393
gfx938,no_quant,torch.float16,1792,352,4096,128,8,0,0,asm,13001+23001,1163.7203
gfx938,no_quant,torch.float16,1920,352,4096,128,8,0,0,asm,13001+23001,1304.7715
gfx938,no_quant,torch.float16,2048,352,4096,128,8,0,0,asm,13001+23001,1584.7923
gfx938,no_quant,torch.float16,2304,352,4096,128,8,0,0,asm,13001+23001,1943.0033
gfx938,no_quant,torch.float16,2560,352,4096,128,8,0,0,asm,13001+23001,1988.7219
gfx938,no_quant,torch.float16,2816,352,4096,128,8,0,0,asm,13001+23001,2026.4655
gfx938,no_quant,torch.float16,3072,352,4096,128,8,0,0,asm,13001+23001,2056.3481
gfx938,no_quant,torch.float16,3328,352,4096,128,8,0,0,asm,13001+23001,2081.0787
gfx938,no_quant,torch.float16,3584,352,4096,128,8,0,0,asm,13001+23001,2113.5351
gfx938,no_quant,torch.float16,3840,352,4096,128,8,0,0,asm,13001+23001,2251.9895
gfx938,no_quant,torch.float16,4096,352,4096,128,8,0,0,asm,13001+23001,2568.3675
gfx938,no_quant,torch.float16,5120,352,4096,128,8,0,0,asm,13001+23001,3066.6487
gfx938,no_quant,torch.float16,6144,352,4096,128,8,0,0,asm,13001+23001,3581.1465
gfx938,no_quant,torch.float16,7168,352,4096,128,8,0,0,asm,13001+23001,4122.1716
gfx938,no_quant,torch.float16,7680,352,4096,128,8,0,0,asm,13001+23001,4222.0785
gfx938,no_quant,torch.float16,8192,352,4096,128,8,0,0,asm,13001+23001,4607.7508
gfx938,no_quant,torch.float16,10240,352,4096,128,8,0,0,asm,13001+23001,5676.0447
gfx938,no_quant,torch.float16,12288,352,4096,128,8,0,0,asm,13001+23001,6679.6272
gfx938,no_quant,torch.float16,14336,352,4096,128,8,0,0,asm,13001+23001,7789.8272
gfx938,no_quant,torch.float16,16384,352,4096,128,8,0,0,asm,13001+23001,8726.181
gfx938,no_quant,torch.float16,17408,352,4096,128,8,0,0,asm,13001+23001,9263.6738
gfx938,no_quant,torch.float16,24576,352,4096,128,8,0,0,asm,13001+23001,12830.282
gfx938,no_quant,torch.float16,32768,352,4096,128,8,0,0,asm,13001+23001,17031.4351
gfx938,no_quant,torch.float16,40960,352,4096,128,8,0,0,asm,13001+23001,21120.0199
gfx938,no_quant,torch.float16,49152,352,4096,128,8,0,0,asm,13001+23001,25184.3324
gfx938,no_quant,torch.float16,57344,352,4096,128,8,0,0,asm,13001+23001,29341.3454
gfx938,no_quant,torch.float16,65536,352,4096,128,8,0,0,asm,13001+23001,33437.6425
gfx938,no_quant,torch.float16,1,352,4096,129,9,0,0,asm,10008+20000,79.718
gfx938,no_quant,torch.float16,2,352,4096,129,9,0,0,asm,10011+20002,118.7885
gfx938,no_quant,torch.float16,4,352,4096,129,9,0,0,asm,10002+20000,196.5523
gfx938,no_quant,torch.float16,6,352,4096,129,9,0,0,asm,10011+20000,270.1234
gfx938,no_quant,torch.float16,8,352,4096,129,9,0,0,asm,10002+20000,322.2257
gfx938,no_quant,torch.float16,10,352,4096,129,9,0,0,asm,10002+20000,379.8174
gfx938,no_quant,torch.float16,12,352,4096,129,9,0,0,asm,10002+20000,416.2644
gfx938,no_quant,torch.float16,14,352,4096,129,9,0,0,asm,10002+20000,457.8191
gfx938,no_quant,torch.float16,16,352,4096,129,9,0,0,asm,10002+20000,493.3677
gfx938,no_quant,torch.float16,20,352,4096,129,9,0,0,asm,10002+20000,562.0455
gfx938,no_quant,torch.float16,24,352,4096,129,9,0,0,asm,10002+20000,609.2494
gfx938,no_quant,torch.float16,28,352,4096,129,9,0,0,asm,10002+20000,639.2872
gfx938,no_quant,torch.float16,32,352,4096,129,9,0,0,asm,10002+20000,650.7579
gfx938,no_quant,torch.float16,36,352,4096,129,9,0,0,asm,10002+20000,680.4902
gfx938,no_quant,torch.float16,40,352,4096,129,9,0,0,asm,10002+20000,686.082
gfx938,no_quant,torch.float16,48,352,4096,129,9,0,0,asm,10002+20000,712.4491
gfx938,no_quant,torch.float16,56,352,4096,129,9,0,0,asm,10002+20000,710.9639
gfx938,no_quant,torch.float16,64,352,4096,129,9,0,0,asm,10002+20000,730.5607
gfx938,no_quant,torch.float16,72,352,4096,129,9,0,0,asm,10002+20000,718.7957
gfx938,no_quant,torch.float16,80,352,4096,129,9,0,0,asm,10002+20000,720.0142
gfx938,no_quant,torch.float16,88,352,4096,129,9,0,0,asm,10002+20000,722.9229
gfx938,no_quant,torch.float16,96,352,4096,129,9,0,0,asm,10002+20000,723.0624
gfx938,no_quant,torch.float16,104,352,4096,129,9,0,0,asm,10002+20000,724.0839
gfx938,no_quant,torch.float16,112,352,4096,129,9,0,0,asm,10002+20000,735.3413
gfx938,no_quant,torch.float16,128,352,4096,129,9,0,0,asm,10002+20000,737.2243
gfx938,no_quant,torch.float16,144,352,4096,129,9,0,0,asm,10002+20000,754.1186
gfx938,no_quant,torch.float16,160,352,4096,129,9,0,0,asm,10002+20000,753.3679
gfx938,no_quant,torch.float16,192,352,4096,129,9,0,0,asm,10002+20000,788.8426
gfx938,no_quant,torch.float16,224,352,4096,129,9,0,0,asm,11004+21001,801.5606
gfx938,no_quant,torch.float16,256,352,4096,129,9,0,0,asm,11004+21001,807.7226
gfx938,no_quant,torch.float16,320,352,4096,129,9,0,0,asm,11004+21001,826.3646
gfx938,no_quant,torch.float16,384,352,4096,129,9,0,0,asm,12005+22001,854.2537
gfx938,no_quant,torch.float16,448,352,4096,129,9,0,0,asm,12005+22001,864.8998
gfx938,no_quant,torch.float16,512,352,4096,129,9,0,0,asm,12005+22001,883.4228
gfx938,no_quant,torch.float16,576,352,4096,129,9,0,0,asm,12005+22001,895.6977
gfx938,no_quant,torch.float16,640,352,4096,129,9,0,0,asm,12001+22001,908.3787
gfx938,no_quant,torch.float16,768,352,4096,129,9,0,0,asm,12001+22001,915.4966
gfx938,no_quant,torch.float16,960,352,4096,129,9,0,0,asm,13001+23001,1079.7907
gfx938,no_quant,torch.float16,1024,352,4096,129,9,0,0,asm,13001+23001,1088.9094
gfx938,no_quant,torch.float16,1280,352,4096,129,9,0,0,asm,13001+23001,1129.3092
gfx938,no_quant,torch.float16,1536,352,4096,129,9,0,0,asm,13001+23001,1169.2723
gfx938,no_quant,torch.float16,1920,352,4096,129,9,0,0,asm,13001+23001,1764.185
gfx938,no_quant,torch.float16,2048,352,4096,129,9,0,0,asm,13001+23001,1934.3223
gfx938,no_quant,torch.float16,2304,352,4096,129,9,0,0,asm,13001+23001,2006.923
gfx938,no_quant,torch.float16,2560,352,4096,129,9,0,0,asm,13001+23001,2035.540
gfx938,no_quant,torch.float16,2816,352,4096,129,9,0,0,asm,13001+23001,2068.5062
gfx938,no_quant,torch.float16,3072,352,4096,129,9,0,0,asm,13001+23001,2102.0827
gfx938,no_quant,torch.float16,3584,352,4096,129,9,0,0,asm,13001+23001,2447.431
gfx938,no_quant,torch.float16,3840,352,4096,129,9,0,0,asm,13001+23001,2805.2093
gfx938,no_quant,torch.float16,4096,352,4096,129,9,0,0,asm,13001+23001,3007.0664
gfx938,no_quant,torch.float16,4608,352,4096,129,9,0,0,asm,13001+23001,3123.0345
gfx938,no_quant,torch.float16,5120,352,4096,129,9,0,0,asm,13001+23001,3246.8705
gfx938,no_quant,torch.float16,5632,352,4096,129,9,0,0,asm,13001+23001,3764.9074
gfx938,no_quant,torch.float16,6144,352,4096,129,9,0,0,asm,13001+23001,4092.9607
gfx938,no_quant,torch.float16,6656,352,4096,129,9,0,0,asm,13001+23001,4175.6811
gfx938,no_quant,torch.float16,7168,352,4096,129,9,0,0,asm,13001+23001,4504.6947
gfx938,no_quant,torch.float16,7680,352,4096,129,9,0,0,asm,13001+23001,5027.1321
gfx938,no_quant,torch.float16,8192,352,4096,129,9,0,0,asm,13001+23001,5169.6112
gfx938,no_quant,torch.float16,10240,352,4096,129,9,0,0,asm,13001+23001,6238.8422
gfx938,no_quant,torch.float16,12288,352,4096,129,9,0,0,asm,13001+23001,7419.1773
gfx938,no_quant,torch.float16,16384,352,4096,129,9,0,0,asm,13001+23001,9753.8878
gfx938,no_quant,torch.float16,24576,352,4096,129,9,0,0,asm,13001+23001,14398.8284
gfx938,no_quant,torch.float16,32768,352,4096,129,9,0,0,asm,13001+23001,19058.7232
gfx938,no_quant,torch.float16,40960,352,4096,129,9,0,0,asm,13001+23001,23722.1115
gfx938,no_quant,torch.float16,49152,352,4096,129,9,0,0,asm,13001+23001,28329.0767
gfx938,no_quant,torch.float16,65536,352,4096,129,9,0,0,asm,13001+23001,37562.0269
gfx936,no_quant,torch.float16,1,256,3072,256,8,0,0,asm,10002+20000,55.456
gfx936,no_quant,torch.float16,2,256,3072,256,8,0,0,asm,10002+20000,86.6223
gfx936,no_quant,torch.float16,4,256,3072,256,8,0,0,asm,10002+20000,155.6412
gfx936,no_quant,torch.float16,6,256,3072,256,8,0,0,asm,10001+20000,212.4495
gfx936,no_quant,torch.float16,8,256,3072,256,8,0,0,asm,10001+20000,258.5125
gfx936,no_quant,torch.float16,12,256,3072,256,8,0,0,asm,10001+20000,349.5272
gfx936,no_quant,torch.float16,16,256,3072,256,8,0,0,asm,10001+20000,424.9797
gfx936,no_quant,torch.float16,24,256,3072,256,8,0,0,asm,10001+20000,569.7428
gfx936,no_quant,torch.float16,32,256,3072,256,8,0,0,asm,10001+20000,698.3014
gfx936,no_quant,torch.float16,36,256,3072,256,8,0,0,asm,10001+20000,731.8899
gfx936,no_quant,torch.float16,48,256,3072,256,8,0,0,asm,10001+20000,823.0646
gfx936,no_quant,torch.float16,56,256,3072,256,8,0,0,asm,10001+20000,869.7846
gfx936,no_quant,torch.float16,64,256,3072,256,8,0,0,asm,10001+20000,902.1634
gfx936,no_quant,torch.float16,72,256,3072,256,8,0,0,asm,10001+20000,939.9486
gfx936,no_quant,torch.float16,80,256,3072,256,8,0,0,asm,10001+20000,966.9634
gfx936,no_quant,torch.float16,88,256,3072,256,8,0,0,asm,10001+20000,994.9044
gfx936,no_quant,torch.float16,96,256,3072,256,8,0,0,asm,10001+20000,1011.3254
gfx936,no_quant,torch.float16,100,256,3072,256,8,0,0,asm,10001+20000,1012.3611
gfx936,no_quant,torch.float16,112,256,3072,256,8,0,0,asm,10001+20000,1031.8055
gfx936,no_quant,torch.float16,128,256,3072,256,8,0,0,asm,10001+20000,1058.5927
gfx936,no_quant,torch.float16,144,256,3072,256,8,0,0,asm,10001+20000,1068.6726
gfx936,no_quant,torch.float16,160,256,3072,256,8,0,0,asm,10001+20000,1079.586
gfx936,no_quant,torch.float16,192,256,3072,256,8,0,0,asm,10001+20000,1096.3268
gfx936,no_quant,torch.float16,224,256,3072,256,8,0,0,asm,10001+20000,1111.8469
gfx936,no_quant,torch.float16,256,256,3072,256,8,0,0,asm,10001+20000,1125.3208
gfx936,no_quant,torch.float16,320,256,3072,256,8,0,0,asm,10001+20000,1151.3166
gfx936,no_quant,torch.float16,384,256,3072,256,8,0,0,asm,10002+20000,1176.2598
gfx936,no_quant,torch.float16,448,256,3072,256,8,0,0,asm,10002+20000,1216.6051
gfx936,no_quant,torch.float16,512,256,3072,256,8,0,0,asm,12005+22001,1234.8115
gfx936,no_quant,torch.float16,640,256,3072,256,8,0,0,asm,12005+22001,1258.5252
gfx936,no_quant,torch.float16,768,256,3072,256,8,0,0,asm,12005+22001,1282.3315
gfx936,no_quant,torch.float16,896,256,3072,256,8,0,0,asm,12005+22001,1306.7272
gfx936,no_quant,torch.float16,1024,256,3072,256,8,0,0,asm,12005+22001,1334.2219
gfx936,no_quant,torch.float16,1280,256,3072,256,8,0,0,asm,12005+22001,1376.8577
gfx936,no_quant,torch.float16,1536,256,3072,256,8,0,0,asm,12005+22001,1437.6745
gfx936,no_quant,torch.float16,2048,256,3072,256,8,0,0,asm,13001+23001,1541.6658
gfx936,no_quant,torch.float16,2304,256,3072,256,8,0,0,asm,13001+23001,1576.0315
gfx936,no_quant,torch.float16,2560,256,3072,256,8,0,0,asm,13001+23001,1624.385
gfx936,no_quant,torch.float16,3072,256,3072,256,8,0,0,asm,13001+23001,1700.9494
gfx936,no_quant,torch.float16,3584,256,3072,256,8,0,0,asm,13001+23001,1818.2295
gfx936,no_quant,torch.float16,4096,256,3072,256,8,0,0,asm,13001+23001,1965.16
gfx936,no_quant,torch.float16,5120,256,3072,256,8,0,0,asm,13001+23001,2322.7428
gfx936,no_quant,torch.float16,6144,256,3072,256,8,0,0,asm,13001+23001,2458.768
gfx936,no_quant,torch.float16,7168,256,3072,256,8,0,0,asm,13001+23001,2695.1215
gfx936,no_quant,torch.float16,8192,256,3072,256,8,0,0,asm,13001+23001,3011.6433
gfx936,no_quant,torch.float16,10240,256,3072,256,8,0,0,asm,13001+23001,3578.2532
gfx936,no_quant,torch.float16,12288,256,3072,256,8,0,0,asm,13001+23001,4153.0568
gfx936,no_quant,torch.float16,16384,256,3072,256,8,0,0,asm,13001+23001,5263.1272
gfx936,no_quant,torch.float16,24576,256,3072,256,8,0,0,asm,13001+23001,7644.2697
gfx936,no_quant,torch.float16,32768,256,3072,256,8,0,0,asm,13001+23001,10052.4186
gfx936,no_quant,torch.float16,1,128,3072,256,8,0,0,asm,10000+20000,41.3928
gfx936,no_quant,torch.float16,2,128,3072,256,8,0,0,asm,10002+20000,57.1149
gfx936,no_quant,torch.float16,4,128,3072,256,8,0,0,asm,10002+20002,89.8055
gfx936,no_quant,torch.float16,6,128,3072,256,8,0,0,asm,10002+20002,119.0938
gfx936,no_quant,torch.float16,8,128,3072,256,8,0,0,asm,10002+20000,144.6431
gfx936,no_quant,torch.float16,12,128,3072,256,8,0,0,asm,10002+20000,194.622
gfx936,no_quant,torch.float16,16,128,3072,256,8,0,0,asm,10001+20000,235.6157
gfx936,no_quant,torch.float16,24,128,3072,256,8,0,0,asm,10001+20000,306.181
gfx936,no_quant,torch.float16,32,128,3072,256,8,0,0,asm,10001+20002,378.7229
gfx936,no_quant,torch.float16,36,128,3072,256,8,0,0,asm,10001+20002,388.2777
gfx936,no_quant,torch.float16,48,128,3072,256,8,0,0,asm,10001+20000,433.7514
gfx936,no_quant,torch.float16,56,128,3072,256,8,0,0,asm,10001+20000,457.8524
gfx936,no_quant,torch.float16,64,128,3072,256,8,0,0,asm,10001+20002,475.2419
gfx936,no_quant,torch.float16,72,128,3072,256,8,0,0,asm,10001+20002,493.6672
gfx936,no_quant,torch.float16,80,128,3072,256,8,0,0,asm,10001+20002,507.8987
gfx936,no_quant,torch.float16,88,128,3072,256,8,0,0,asm,10001+20002,524.2018
gfx936,no_quant,torch.float16,96,128,3072,256,8,0,0,asm,10001+20002,531.7892
gfx936,no_quant,torch.float16,100,128,3072,256,8,0,0,asm,10001+20002,532.3534
gfx936,no_quant,torch.float16,112,128,3072,256,8,0,0,asm,10001+20002,543.4018
gfx936,no_quant,torch.float16,128,128,3072,256,8,0,0,asm,10001+20002,556.3197
gfx936,no_quant,torch.float16,144,128,3072,256,8,0,0,asm,10001+20002,562.2986
gfx936,no_quant,torch.float16,160,128,3072,256,8,0,0,asm,10001+20000,569.8103
gfx936,no_quant,torch.float16,192,128,3072,256,8,0,0,asm,10001+20002,577.9871
gfx936,no_quant,torch.float16,224,128,3072,256,8,0,0,asm,10001+20002,588.0249
gfx936,no_quant,torch.float16,256,128,3072,256,8,0,0,asm,10001+20002,595.6291
gfx936,no_quant,torch.float16,320,128,3072,256,8,0,0,asm,10001+20002,610.5007
gfx936,no_quant,torch.float16,384,128,3072,256,8,0,0,asm,10002+20002,625.9365
gfx936,no_quant,torch.float16,448,128,3072,256,8,0,0,asm,11007+21001,636.3196
gfx936,no_quant,torch.float16,512,128,3072,256,8,0,0,asm,11007+21001,649.5155
gfx936,no_quant,torch.float16,640,128,3072,256,8,0,0,asm,11004+21001,690.1469
gfx936,no_quant,torch.float16,768,128,3072,256,8,0,0,asm,11006+21001,706.9048
gfx936,no_quant,torch.float16,896,128,3072,256,8,0,0,asm,11007+21001,707.7806
gfx936,no_quant,torch.float16,1024,128,3072,256,8,0,0,asm,11005+21001,737.069
gfx936,no_quant,torch.float16,1280,128,3072,256,8,0,0,asm,12005+22001,785.271
gfx936,no_quant,torch.float16,1536,128,3072,256,8,0,0,asm,12004+22001,845.0015
gfx936,no_quant,torch.float16,2048,128,3072,256,8,0,0,asm,12001+22001,926.7277
gfx936,no_quant,torch.float16,2304,128,3072,256,8,0,0,asm,13001+23001,967.7214
gfx936,no_quant,torch.float16,2560,128,3072,256,8,0,0,asm,13001+23001,993.0266
gfx936,no_quant,torch.float16,3072,128,3072,256,8,0,0,asm,13001+23001,1061.8433
gfx936,no_quant,torch.float16,3584,128,3072,256,8,0,0,asm,13001+23001,1178.6685
gfx936,no_quant,torch.float16,4096,128,3072,256,8,0,0,asm,13001+23001,1286.8873
gfx936,no_quant,torch.float16,5120,128,3072,256,8,0,0,asm,13001+23001,1546.3902
gfx936,no_quant,torch.float16,6144,128,3072,256,8,0,0,asm,13001+23001,1648.3774
gfx936,no_quant,torch.float16,7168,128,3072,256,8,0,0,asm,13001+23001,1815.4257
gfx936,no_quant,torch.float16,8192,128,3072,256,8,0,0,asm,13001+23001,2049.7412
gfx936,no_quant,torch.float16,10240,128,3072,256,8,0,0,asm,13001+23001,2439.6861
gfx936,no_quant,torch.float16,12288,128,3072,256,8,0,0,asm,13001+23001,2854.5487
gfx936,no_quant,torch.float16,16384,128,3072,256,8,0,0,asm,13001+23001,3669.7898
gfx936,no_quant,torch.float16,24576,128,3072,256,8,0,0,asm,13001+23001,5322.7565
gfx936,no_quant,torch.float16,32768,128,3072,256,8,0,0,asm,13001+23001,7028.0263
arch,quant_type,indtype,token,inter_dim,model_dim,expert,topk,q_size_n,q_size_k,sol_type,sol_id,time_us
gfx938,no_quant,torch.float16,1,352,4096,128,8,0,0,asm,10009+20000,78.6408
gfx938,no_quant,torch.float16,2,352,4096,128,8,0,0,asm,10004+20002,117.1482
gfx938,no_quant,torch.float16,4,352,4096,128,8,0,0,asm,10006+20002,181.0486
gfx938,no_quant,torch.float16,6,352,4096,128,8,0,0,asm,10006+20000,236.5396
gfx938,no_quant,torch.float16,8,352,4096,128,8,0,0,asm,10007+20000,291.5917
gfx938,no_quant,torch.float16,10,352,4096,128,8,0,0,asm,10006+20000,336.7976
gfx938,no_quant,torch.float16,12,352,4096,128,8,0,0,asm,10006+20000,370.9924
gfx938,no_quant,torch.float16,16,352,4096,128,8,0,0,asm,10006+20000,436.4362
gfx938,no_quant,torch.float16,20,352,4096,128,8,0,0,asm,10006+20000,490.3447
gfx938,no_quant,torch.float16,24,352,4096,128,8,0,0,asm,10006+20000,508.1621
gfx938,no_quant,torch.float16,32,352,4096,128,8,0,0,asm,10007+20000,537.4327
gfx938,no_quant,torch.float16,36,352,4096,128,8,0,0,asm,10007+20000,556.2111
gfx938,no_quant,torch.float16,40,352,4096,128,8,0,0,asm,10006+20000,572.0756
gfx938,no_quant,torch.float16,48,352,4096,128,8,0,0,asm,10006+20000,606.7093
gfx938,no_quant,torch.float16,56,352,4096,128,8,0,0,asm,10006+20000,608.8057
gfx938,no_quant,torch.float16,64,352,4096,128,8,0,0,asm,10007+20000,618.06
gfx938,no_quant,torch.float16,72,352,4096,128,8,0,0,asm,10006+20000,612.0755
gfx938,no_quant,torch.float16,80,352,4096,128,8,0,0,asm,10006+20000,615.2016
gfx938,no_quant,torch.float16,88,352,4096,128,8,0,0,asm,10006+20000,620.6252
gfx938,no_quant,torch.float16,96,352,4096,128,8,0,0,asm,10006+20000,622.9226
gfx938,no_quant,torch.float16,112,352,4096,128,8,0,0,asm,10006+20000,625.9872
gfx938,no_quant,torch.float16,128,352,4096,128,8,0,0,asm,10007+20000,631.9154
gfx938,no_quant,torch.float16,144,352,4096,128,8,0,0,asm,10006+20000,648.1697
gfx938,no_quant,torch.float16,160,352,4096,128,8,0,0,asm,10006+20000,648.3789
gfx938,no_quant,torch.float16,192,352,4096,128,8,0,0,asm,10007+20000,667.0865
gfx938,no_quant,torch.float16,224,352,4096,128,8,0,0,asm,11004+21001,679.0988
gfx938,no_quant,torch.float16,256,352,4096,128,8,0,0,asm,11002+21001,691.788
gfx938,no_quant,torch.float16,320,352,4096,128,8,0,0,asm,11004+21001,704.5919
gfx938,no_quant,torch.float16,384,352,4096,128,8,0,0,asm,11004+21001,724.2637
gfx938,no_quant,torch.float16,512,352,4096,128,8,0,0,asm,12000+22001,774.9958
gfx938,no_quant,torch.float16,640,352,4096,128,8,0,0,asm,12000+22001,799.6931
gfx938,no_quant,torch.float16,768,352,4096,128,8,0,0,asm,12004+22001,822.5894
gfx938,no_quant,torch.float16,960,352,4096,128,8,0,0,asm,12005+22001,900.0783
gfx938,no_quant,torch.float16,1024,352,4096,128,8,0,0,asm,12005+22001,947.0566
gfx938,no_quant,torch.float16,1152,352,4096,128,8,0,0,asm,13001+23001,1047.4336
gfx938,no_quant,torch.float16,1280,352,4096,128,8,0,0,asm,13001+23001,1077.3083
gfx938,no_quant,torch.float16,1408,352,4096,128,8,0,0,asm,13001+23001,1088.9267
gfx938,no_quant,torch.float16,1536,352,4096,128,8,0,0,asm,13001+23001,1121.5625
gfx938,no_quant,torch.float16,2048,352,4096,128,8,0,0,asm,13001+23001,1410.5335
gfx938,no_quant,torch.float16,2304,352,4096,128,8,0,0,asm,12001+22001,1612.1491
gfx938,no_quant,torch.float16,2560,352,4096,128,8,0,0,asm,12001+22001,1651.5132
gfx938,no_quant,torch.float16,2816,352,4096,128,8,0,0,asm,12001+22001,1739.7137
gfx938,no_quant,torch.float16,3072,352,4096,128,8,0,0,asm,13001+23001,1789.1421
gfx938,no_quant,torch.float16,3840,352,4096,128,8,0,0,asm,13001+23001,1984.0983
gfx938,no_quant,torch.float16,4096,352,4096,128,8,0,0,asm,13001+23001,2248.1545
gfx938,no_quant,torch.float16,5120,352,4096,128,8,0,0,asm,13001+23001,2635.2017
gfx938,no_quant,torch.float16,6144,352,4096,128,8,0,0,asm,13001+23001,3099.4145
gfx938,no_quant,torch.float16,7168,352,4096,128,8,0,0,asm,13001+23001,3564.3297
gfx938,no_quant,torch.float16,7680,352,4096,128,8,0,0,asm,13001+23001,3648.124
gfx938,no_quant,torch.float16,8192,352,4096,128,8,0,0,asm,13001+23001,3963.4827
gfx938,no_quant,torch.float16,12288,352,4096,128,8,0,0,asm,13001+23001,5748.9863
gfx938,no_quant,torch.float16,16384,352,4096,128,8,0,0,asm,13001+23001,7546.4485
gfx938,no_quant,torch.float16,24576,352,4096,128,8,0,0,asm,13001+23001,11088.5202
gfx938,no_quant,torch.float16,32768,352,4096,128,8,0,0,asm,13001+23001,14713.3474
gfx938,no_quant,torch.float16,49152,352,4096,128,8,0,0,asm,13001+23001,21815.9769
gfx938,no_quant,torch.float16,65536,352,4096,128,8,0,0,asm,13001+23001,29012.8921
gfx938,no_quant,torch.float16,1,352,4096,129,9,0,0,asm,10004+20000,82.8296
gfx938,no_quant,torch.float16,2,352,4096,129,9,0,0,asm,10004+20002,117.517
gfx938,no_quant,torch.float16,4,352,4096,129,9,0,0,asm,10006+20002,183.4528
gfx938,no_quant,torch.float16,6,352,4096,129,9,0,0,asm,10006+20000,241.0813
gfx938,no_quant,torch.float16,8,352,4096,129,9,0,0,asm,10007+20000,279.1283
gfx938,no_quant,torch.float16,10,352,4096,129,9,0,0,asm,10006+20000,330.1271
gfx938,no_quant,torch.float16,12,352,4096,129,9,0,0,asm,10006+20000,359.8869
gfx938,no_quant,torch.float16,14,352,4096,129,9,0,0,asm,10006+20000,395.9155
gfx938,no_quant,torch.float16,16,352,4096,129,9,0,0,asm,10006+20000,424.8344
gfx938,no_quant,torch.float16,20,352,4096,129,9,0,0,asm,10007+20000,483.2763
gfx938,no_quant,torch.float16,24,352,4096,129,9,0,0,asm,10006+20000,521.8279
gfx938,no_quant,torch.float16,28,352,4096,129,9,0,0,asm,10006+20000,548.0873
gfx938,no_quant,torch.float16,32,352,4096,129,9,0,0,asm,10006+20000,558.2041
gfx938,no_quant,torch.float16,36,352,4096,129,9,0,0,asm,10006+20000,586.8205
gfx938,no_quant,torch.float16,40,352,4096,129,9,0,0,asm,10006+20000,588.6543
gfx938,no_quant,torch.float16,48,352,4096,129,9,0,0,asm,10006+20000,611.8296
gfx938,no_quant,torch.float16,56,352,4096,129,9,0,0,asm,10006+20000,614.9763
gfx938,no_quant,torch.float16,64,352,4096,129,9,0,0,asm,10006+20000,632.5423
gfx938,no_quant,torch.float16,72,352,4096,129,9,0,0,asm,10006+20000,624.0347
gfx938,no_quant,torch.float16,80,352,4096,129,9,0,0,asm,10006+20000,629.3024
gfx938,no_quant,torch.float16,88,352,4096,129,9,0,0,asm,10006+20000,631.3577
gfx938,no_quant,torch.float16,96,352,4096,129,9,0,0,asm,10006+20000,630.9926
gfx938,no_quant,torch.float16,104,352,4096,129,9,0,0,asm,10006+20000,633.9628
gfx938,no_quant,torch.float16,112,352,4096,129,9,0,0,asm,10007+20000,644.289
gfx938,no_quant,torch.float16,128,352,4096,129,9,0,0,asm,10007+20000,647.6202
gfx938,no_quant,torch.float16,144,352,4096,129,9,0,0,asm,10006+20000,659.6407
gfx938,no_quant,torch.float16,160,352,4096,129,9,0,0,asm,10006+20000,665.6427
gfx938,no_quant,torch.float16,192,352,4096,129,9,0,0,asm,11004+21001,682.6765
gfx938,no_quant,torch.float16,224,352,4096,129,9,0,0,asm,11004+21001,688.2437
gfx938,no_quant,torch.float16,256,352,4096,129,9,0,0,asm,11004+21001,694.6395
gfx938,no_quant,torch.float16,320,352,4096,129,9,0,0,asm,11002+21001,719.4435
gfx938,no_quant,torch.float16,384,352,4096,129,9,0,0,asm,11004+21001,752.6085
gfx938,no_quant,torch.float16,448,352,4096,129,9,0,0,asm,12000+22001,773.6054
gfx938,no_quant,torch.float16,512,352,4096,129,9,0,0,asm,12000+22001,791.353
gfx938,no_quant,torch.float16,576,352,4096,129,9,0,0,asm,12004+22001,804.8627
gfx938,no_quant,torch.float16,640,352,4096,129,9,0,0,asm,12004+22001,820.5673
gfx938,no_quant,torch.float16,768,352,4096,129,9,0,0,asm,12000+22001,862.1548
gfx938,no_quant,torch.float16,960,352,4096,129,9,0,0,asm,12001+22001,993.7481
gfx938,no_quant,torch.float16,1024,352,4096,129,9,0,0,asm,12001+22001,1051.5161
gfx938,no_quant,torch.float16,1280,352,4096,129,9,0,0,asm,13001+23001,1115.6184
gfx938,no_quant,torch.float16,1536,352,4096,129,9,0,0,asm,13001+23001,1145.0624
gfx938,no_quant,torch.float16,1920,352,4096,129,9,0,0,asm,12001+22001,1517.5169
gfx938,no_quant,torch.float16,2048,352,4096,129,9,0,0,asm,12001+22001,1602.4269
gfx938,no_quant,torch.float16,2304,352,4096,129,9,0,0,asm,12001+22001,1694.8448
gfx938,no_quant,torch.float16,2560,352,4096,129,9,0,0,asm,12001+22001,1768.7974
gfx938,no_quant,torch.float16,2816,352,4096,129,9,0,0,asm,13001+23001,1804.2844
gfx938,no_quant,torch.float16,3072,352,4096,129,9,0,0,asm,13001+23001,1848.514
gfx938,no_quant,torch.float16,3584,352,4096,129,9,0,0,asm,13001+23001,2137.4626
gfx938,no_quant,torch.float16,3840,352,4096,129,9,0,0,asm,13001+23001,2433.5947
gfx938,no_quant,torch.float16,4096,352,4096,129,9,0,0,asm,13001+23001,2581.0639
gfx938,no_quant,torch.float16,4608,352,4096,129,9,0,0,asm,13001+23001,2696.285
gfx938,no_quant,torch.float16,5120,352,4096,129,9,0,0,asm,13001+23001,2818.4465
gfx938,no_quant,torch.float16,5632,352,4096,129,9,0,0,asm,13001+23001,3244.0284
gfx938,no_quant,torch.float16,6144,352,4096,129,9,0,0,asm,13001+23001,3530.5874
gfx938,no_quant,torch.float16,6656,352,4096,129,9,0,0,asm,13001+23001,3601.098
gfx938,no_quant,torch.float16,7168,352,4096,129,9,0,0,asm,13001+23001,3889.9903
gfx938,no_quant,torch.float16,7680,352,4096,129,9,0,0,asm,13001+23001,4337.7228
gfx938,no_quant,torch.float16,8192,352,4096,129,9,0,0,asm,13001+23001,4443.3674
gfx938,no_quant,torch.float16,10240,352,4096,129,9,0,0,asm,13001+23001,5380.2134
gfx938,no_quant,torch.float16,12288,352,4096,129,9,0,0,asm,13001+23001,6382.2687
gfx938,no_quant,torch.float16,16384,352,4096,129,9,0,0,asm,13001+23001,8397.3437
gfx938,no_quant,torch.float16,24576,352,4096,129,9,0,0,asm,13001+23001,12379.6318
gfx938,no_quant,torch.float16,32768,352,4096,129,9,0,0,asm,13001+23001,16397.3012
gfx938,no_quant,torch.float16,40960,352,4096,129,9,0,0,asm,13001+23001,20398.5288
gfx938,no_quant,torch.float16,49152,352,4096,129,9,0,0,asm,13001+23001,24396.6972
gfx938,no_quant,torch.float16,65536,352,4096,129,9,0,0,asm,13001+23001,32435.0655
gfx936,no_quant,torch.float16,1,256,3072,256,8,0,0,asm,10006+20000,56.4327
gfx936,no_quant,torch.float16,2,256,3072,256,8,0,0,asm,10006+20000,85.2664
gfx936,no_quant,torch.float16,4,256,3072,256,8,0,0,asm,10004+20000,148.02
gfx936,no_quant,torch.float16,6,256,3072,256,8,0,0,asm,10001+20000,198.0409
gfx936,no_quant,torch.float16,8,256,3072,256,8,0,0,asm,10001+20000,237.9062
gfx936,no_quant,torch.float16,12,256,3072,256,8,0,0,asm,10001+20000,320.1882
gfx936,no_quant,torch.float16,16,256,3072,256,8,0,0,asm,10001+20000,388.3143
gfx936,no_quant,torch.float16,24,256,3072,256,8,0,0,asm,10001+20000,520.2353
gfx936,no_quant,torch.float16,32,256,3072,256,8,0,0,asm,10001+20000,634.3687
gfx936,no_quant,torch.float16,36,256,3072,256,8,0,0,asm,10001+20000,662.1298
gfx936,no_quant,torch.float16,48,256,3072,256,8,0,0,asm,10001+20000,745.2455
gfx936,no_quant,torch.float16,56,256,3072,256,8,0,0,asm,10001+20000,784.2686
gfx936,no_quant,torch.float16,64,256,3072,256,8,0,0,asm,10001+20000,822.5338
gfx936,no_quant,torch.float16,72,256,3072,256,8,0,0,asm,10001+20000,850.3484
gfx936,no_quant,torch.float16,80,256,3072,256,8,0,0,asm,10001+20000,875.1736
gfx936,no_quant,torch.float16,88,256,3072,256,8,0,0,asm,10001+20000,901.001
gfx936,no_quant,torch.float16,96,256,3072,256,8,0,0,asm,10001+20000,914.5758
gfx936,no_quant,torch.float16,100,256,3072,256,8,0,0,asm,10001+20000,917.5063
gfx936,no_quant,torch.float16,112,256,3072,256,8,0,0,asm,10001+20000,936.2515
gfx936,no_quant,torch.float16,128,256,3072,256,8,0,0,asm,10001+20000,967.6199
gfx936,no_quant,torch.float16,144,256,3072,256,8,0,0,asm,10001+20000,976.1083
gfx936,no_quant,torch.float16,160,256,3072,256,8,0,0,asm,10001+20000,987.5608
gfx936,no_quant,torch.float16,192,256,3072,256,8,0,0,asm,10001+20000,1007.7293
gfx936,no_quant,torch.float16,224,256,3072,256,8,0,0,asm,10007+20000,1009.22
gfx936,no_quant,torch.float16,256,256,3072,256,8,0,0,asm,10007+20000,1027.6957
gfx936,no_quant,torch.float16,320,256,3072,256,8,0,0,asm,10007+20000,1043.8052
gfx936,no_quant,torch.float16,384,256,3072,256,8,0,0,asm,10007+20000,1075.1736
gfx936,no_quant,torch.float16,448,256,3072,256,8,0,0,asm,10006+20000,1110.1966
gfx936,no_quant,torch.float16,512,256,3072,256,8,0,0,asm,11006+21001,1120.0746
gfx936,no_quant,torch.float16,640,256,3072,256,8,0,0,asm,12004+22001,1151.2998
gfx936,no_quant,torch.float16,768,256,3072,256,8,0,0,asm,12004+22001,1180.8324
gfx936,no_quant,torch.float16,896,256,3072,256,8,0,0,asm,12004+22001,1201.9524
gfx936,no_quant,torch.float16,1024,256,3072,256,8,0,0,asm,12004+22001,1221.1692
gfx936,no_quant,torch.float16,1280,256,3072,256,8,0,0,asm,12004+22001,1256.6892
gfx936,no_quant,torch.float16,1536,256,3072,256,8,0,0,asm,12004+22001,1313.9523
gfx936,no_quant,torch.float16,2048,256,3072,256,8,0,0,asm,13000+23001,1467.2068
gfx936,no_quant,torch.float16,2304,256,3072,256,8,0,0,asm,13000+23001,1512.9077
gfx936,no_quant,torch.float16,2560,256,3072,256,8,0,0,asm,13000+23001,1530.7098
gfx936,no_quant,torch.float16,3072,256,3072,256,8,0,0,asm,13000+23001,1615.5686
gfx936,no_quant,torch.float16,3584,256,3072,256,8,0,0,asm,13000+23001,1724.7306
gfx936,no_quant,torch.float16,4096,256,3072,256,8,0,0,asm,13001+23001,1918.8103
gfx936,no_quant,torch.float16,5120,256,3072,256,8,0,0,asm,13001+23001,2272.5277
gfx936,no_quant,torch.float16,6144,256,3072,256,8,0,0,asm,13001+23001,2343.0624
gfx936,no_quant,torch.float16,7168,256,3072,256,8,0,0,asm,13001+23001,2560.4684
gfx936,no_quant,torch.float16,8192,256,3072,256,8,0,0,asm,13001+23001,2878.8006
gfx936,no_quant,torch.float16,10240,256,3072,256,8,0,0,asm,13001+23001,3414.3448
gfx936,no_quant,torch.float16,12288,256,3072,256,8,0,0,asm,13001+23001,3988.8697
gfx936,no_quant,torch.float16,16384,256,3072,256,8,0,0,asm,13001+23001,5057.6343
gfx936,no_quant,torch.float16,24576,256,3072,256,8,0,0,asm,13001+23001,7355.5588
gfx936,no_quant,torch.float16,32768,256,3072,256,8,0,0,asm,13001+23001,9745.8034
gfx936,no_quant,torch.float16,1,128,3072,256,8,0,0,asm,10005+20000,42.0834
gfx936,no_quant,torch.float16,2,128,3072,256,8,0,0,asm,10006+20000,57.5023
gfx936,no_quant,torch.float16,4,128,3072,256,8,0,0,asm,10003+20000,89.1148
gfx936,no_quant,torch.float16,6,128,3072,256,8,0,0,asm,10004+20000,115.9274
gfx936,no_quant,torch.float16,8,128,3072,256,8,0,0,asm,10004+20000,140.0622
gfx936,no_quant,torch.float16,12,128,3072,256,8,0,0,asm,10004+20000,183.4137
gfx936,no_quant,torch.float16,16,128,3072,256,8,0,0,asm,10001+20000,217.6199
gfx936,no_quant,torch.float16,24,128,3072,256,8,0,0,asm,10001+20000,280.0841
gfx936,no_quant,torch.float16,32,128,3072,256,8,0,0,asm,10001+20000,347.9859
gfx936,no_quant,torch.float16,36,128,3072,256,8,0,0,asm,10001+20002,354.8798
gfx936,no_quant,torch.float16,48,128,3072,256,8,0,0,asm,10004+20000,397.8103
gfx936,no_quant,torch.float16,56,128,3072,256,8,0,0,asm,10001+20000,417.8355
gfx936,no_quant,torch.float16,64,128,3072,256,8,0,0,asm,10001+20000,431.9071
gfx936,no_quant,torch.float16,72,128,3072,256,8,0,0,asm,10001+20000,449.6586
gfx936,no_quant,torch.float16,80,128,3072,256,8,0,0,asm,10001+20000,466.3575
gfx936,no_quant,torch.float16,88,128,3072,256,8,0,0,asm,10001+20000,476.4375
gfx936,no_quant,torch.float16,96,128,3072,256,8,0,0,asm,10001+20000,484.1006
gfx936,no_quant,torch.float16,100,128,3072,256,8,0,0,asm,10001+20000,483.6543
gfx936,no_quant,torch.float16,112,128,3072,256,8,0,0,asm,10001+20000,496.6479
gfx936,no_quant,torch.float16,128,128,3072,256,8,0,0,asm,10001+20000,506.4332
gfx936,no_quant,torch.float16,144,128,3072,256,8,0,0,asm,10001+20000,514.7279
gfx936,no_quant,torch.float16,160,128,3072,256,8,0,0,asm,10001+20000,518.9469
gfx936,no_quant,torch.float16,192,128,3072,256,8,0,0,asm,10001+20002,528.2184
gfx936,no_quant,torch.float16,224,128,3072,256,8,0,0,asm,10001+20000,536.9594
gfx936,no_quant,torch.float16,256,128,3072,256,8,0,0,asm,10001+20002,542.1299
gfx936,no_quant,torch.float16,320,128,3072,256,8,0,0,asm,10001+20002,560.412
gfx936,no_quant,torch.float16,384,128,3072,256,8,0,0,asm,10007+20002,578.4752
gfx936,no_quant,torch.float16,448,128,3072,256,8,0,0,asm,10006+20002,595.0982
gfx936,no_quant,torch.float16,512,128,3072,256,8,0,0,asm,11006+21001,614.9719
gfx936,no_quant,torch.float16,640,128,3072,256,8,0,0,asm,11006+21001,643.1908
gfx936,no_quant,torch.float16,768,128,3072,256,8,0,0,asm,11006+21001,656.4455
gfx936,no_quant,torch.float16,896,128,3072,256,8,0,0,asm,11006+21001,669.5487
gfx936,no_quant,torch.float16,1024,128,3072,256,8,0,0,asm,11006+21001,709.4055
gfx936,no_quant,torch.float16,1280,128,3072,256,8,0,0,asm,12004+22001,751.9485
gfx936,no_quant,torch.float16,1536,128,3072,256,8,0,0,asm,12004+22001,792.2685
gfx936,no_quant,torch.float16,2048,128,3072,256,8,0,0,asm,12004+22001,896.9672
gfx936,no_quant,torch.float16,2304,128,3072,256,8,0,0,asm,13000+23001,963.6365
gfx936,no_quant,torch.float16,2560,128,3072,256,8,0,0,asm,13000+23001,1003.0975
gfx936,no_quant,torch.float16,3072,128,3072,256,8,0,0,asm,13000+23001,1068.8068
gfx936,no_quant,torch.float16,3584,128,3072,256,8,0,0,asm,13000+23001,1157.8004
gfx936,no_quant,torch.float16,4096,128,3072,256,8,0,0,asm,12001+22001,1282.457
gfx936,no_quant,torch.float16,5120,128,3072,256,8,0,0,asm,12001+22001,1514.4903
gfx936,no_quant,torch.float16,6144,128,3072,256,8,0,0,asm,13001+23001,1667.9553
gfx936,no_quant,torch.float16,7168,128,3072,256,8,0,0,asm,13001+23001,1819.8287
gfx936,no_quant,torch.float16,8192,128,3072,256,8,0,0,asm,13001+23001,2046.742
gfx936,no_quant,torch.float16,10240,128,3072,256,8,0,0,asm,13001+23001,2443.8613
gfx936,no_quant,torch.float16,12288,128,3072,256,8,0,0,asm,13001+23001,2844.9048
gfx936,no_quant,torch.float16,16384,128,3072,256,8,0,0,asm,13001+23001,3597.2571
gfx936,no_quant,torch.float16,24576,128,3072,256,8,0,0,asm,13001+23001,5205.65
gfx936,no_quant,torch.float16,32768,128,3072,256,8,0,0,asm,13001+23001,6847.9883
arch,quant_type,indtype,token,inter_dim,model_dim,expert,topk,q_size_n,q_size_k,sol_type,sol_id,time_us
gfx936,int4_w4a16,torch.float16,1,256,7168,256,8,0,0,asm,10000+20000,95.17214285714428
gfx936,int4_w4a16,torch.float16,2,256,7168,256,8,0,0,asm,10000+20000,109.64071428571371
gfx936,int4_w4a16,torch.float16,4,256,7168,256,8,0,0,asm,10000+20001,162.646428571428
gfx936,int4_w4a16,torch.float16,6,256,7168,256,8,0,0,asm,10000+20000,224.8634285714288
gfx936,int4_w4a16,torch.float16,8,256,7168,256,8,0,0,asm,10000+20000,245.8005714285721
gfx936,int4_w4a16,torch.float16,10,256,7168,256,8,0,0,asm,10000+20001,298.3948571428573
gfx936,int4_w4a16,torch.float16,12,256,7168,256,8,0,0,asm,10000+20001,304.8405714285706
gfx936,int4_w4a16,torch.float16,14,256,7168,256,8,0,0,asm,10000+20001,386.76042857142886
gfx936,int4_w4a16,torch.float16,16,256,7168,256,8,0,0,asm,10000+20001,421.7547142857137
gfx936,int4_w4a16,torch.float16,20,256,7168,256,8,0,0,asm,10000+20000,517.134571428571
gfx936,int4_w4a16,torch.float16,24,256,7168,256,8,0,0,asm,10000+20000,530.8487142857141
gfx936,int4_w4a16,torch.float16,28,256,7168,256,8,0,0,asm,10000+20001,571.7202857142856
gfx936,int4_w4a16,torch.float16,32,256,7168,256,8,0,0,asm,10000+20001,568.383142857143
gfx936,int4_w4a16,torch.float16,36,256,7168,256,8,0,0,asm,10000+20001,652.1515714285714
gfx936,int4_w4a16,torch.float16,40,256,7168,256,8,0,0,asm,10000+20001,700.4257142857138
gfx936,int4_w4a16,torch.float16,44,256,7168,256,8,0,0,asm,10000+20001,705.5685714285721
gfx936,int4_w4a16,torch.float16,48,256,7168,256,8,0,0,asm,10000+20001,696.4028571428581
gfx936,int4_w4a16,torch.float16,56,256,7168,256,8,0,0,asm,10000+20001,794.9171428571426
gfx936,int4_w4a16,torch.float16,64,256,7168,256,8,0,0,asm,10000+20001,814.9171428571414
gfx936,int4_w4a16,torch.float16,80,256,7168,256,8,0,0,asm,10000+20001,829.8885714285714
gfx936,int4_w4a16,torch.float16,96,256,7168,256,8,0,0,asm,10000+20001,911.3284285714284
gfx936,int4_w4a16,torch.float16,112,256,7168,256,8,0,0,asm,10000+20001,918.1169999999996
gfx936,int4_w4a16,torch.float16,128,256,7168,256,8,0,0,asm,10000+20001,926.8941428571424
gfx936,int4_w4a16,torch.float16,160,256,7168,256,8,0,0,asm,10000+20001,941.3170000000003
gfx936,int4_w4a16,torch.float16,192,256,7168,256,8,0,0,asm,10000+20001,958.139857142858
gfx936,int4_w4a16,torch.float16,224,256,7168,256,8,0,0,asm,10000+20001,983.6941428571432
gfx936,int4_w4a16,torch.float16,256,256,7168,256,8,0,0,asm,10000+20001,988.4255714285724
gfx936,int4_w4a16,torch.float16,320,256,7168,256,8,0,0,asm,10000+20001,1010.7332857142854
gfx936,int4_w4a16,torch.float16,384,256,7168,256,8,0,0,asm,10000+20001,1094.2761428571423
gfx936,int4_w4a16,torch.float16,448,256,7168,256,8,0,0,asm,10000+20001,1153.590142857143
gfx936,int4_w4a16,torch.float16,512,256,7168,256,8,0,0,asm,10000+20001,1306.458571428572
gfx936,int4_w4a16,torch.float16,576,256,7168,256,8,0,0,asm,11001+21001,1410.2527142857143
gfx936,int4_w4a16,torch.float16,640,256,7168,256,8,0,0,asm,11001+21001,1434.2071428571428
gfx936,int4_w4a16,torch.float16,704,256,7168,256,8,0,0,asm,11001+21001,1496.423999999999
gfx936,int4_w4a16,torch.float16,768,256,7168,256,8,0,0,asm,11001+21001,1520.1268571428573
gfx936,int4_w4a16,torch.float16,832,256,7168,256,8,0,0,asm,11001+21001,1607.280999999999
gfx936,int4_w4a16,torch.float16,896,256,7168,256,8,0,0,asm,11001+21001,1697.932285714286
gfx936,int4_w4a16,torch.float16,960,256,7168,256,8,0,0,asm,11001+21001,1793.5892857142867
gfx936,int4_w4a16,torch.float16,1024,256,7168,256,8,0,0,asm,11001+21001,1949.2920000000008
gfx936,int4_w4a16,torch.float16,1152,256,7168,256,8,0,0,asm,11001+21001,2259.9428571428566
gfx936,int4_w4a16,torch.float16,1280,256,7168,256,8,0,0,asm,11001+21001,2472.994
gfx936,int4_w4a16,torch.float16,1408,256,7168,256,8,0,0,asm,11001+21001,2536.4909999999995
gfx936,int4_w4a16,torch.float16,1536,256,7168,256,8,0,0,asm,11001+21001,2635.736571428572
gfx936,int4_w4a16,torch.float16,1664,256,7168,256,8,0,0,asm,11001+21001,2727.5991428571456
gfx936,int4_w4a16,torch.float16,1792,256,7168,256,8,0,0,asm,11001+21001,2847.301857142858
gfx936,int4_w4a16,torch.float16,1920,256,7168,256,8,0,0,asm,11001+21001,3030.9815714285733
gfx936,int4_w4a16,torch.float16,2048,256,7168,256,8,0,0,asm,11001+21001,3253.38114285714
gfx936,int4_w4a16,torch.float16,2304,256,7168,256,8,0,0,asm,11001+21001,3691.437714285715
gfx936,int4_w4a16,torch.float16,2560,256,7168,256,8,0,0,asm,11001+21001,3961.105857142853
gfx936,int4_w4a16,torch.float16,2816,256,7168,256,8,0,0,asm,11001+21001,4214.888285714294
gfx936,int4_w4a16,torch.float16,3072,256,7168,256,8,0,0,asm,11001+21001,4598.590571428569
gfx936,int4_w4a16,torch.float16,3328,256,7168,256,8,0,0,asm,11001+21001,4923.961571428568
gfx936,int4_w4a16,torch.float16,3584,256,7168,256,8,0,0,asm,11001+21001,5283.663857142858
gfx936,int4_w4a16,torch.float16,3840,256,7168,256,8,0,0,asm,11001+21001,5579.549000000005
gfx936,int4_w4a16,torch.float16,4096,256,7168,256,8,0,0,asm,11001+21001,5959.091142857148
gfx936,int4_w4a16,torch.float16,4608,256,7168,256,8,0,0,asm,11001+21001,6573.558857142861
gfx936,int4_w4a16,torch.float16,5120,256,7168,256,8,0,0,asm,11001+21001,7240.826571428568
gfx936,int4_w4a16,torch.float16,5632,256,7168,256,8,0,0,asm,11001+21001,7880.962714285714
gfx936,int4_w4a16,torch.float16,6144,256,7168,256,8,0,0,asm,11001+21001,8558.858571428571
gfx936,int4_w4a16,torch.float16,6656,256,7168,256,8,0,0,asm,11001+21001,9222.514857142862
gfx936,int4_w4a16,torch.float16,7168,256,7168,256,8,0,0,asm,11001+21001,9888.730857142857
gfx936,int4_w4a16,torch.float16,7680,256,7168,256,8,0,0,asm,11001+21001,10493.644714285716
gfx936,int4_w4a16,torch.float16,8192,256,7168,256,8,0,0,asm,11001+21001,11209.300285714282
gfx936,int4_w4a16,torch.float16,10240,256,7168,256,8,0,0,asm,11001+21001,13796.542142857152
gfx936,int4_w4a16,torch.float16,12288,256,7168,256,8,0,0,asm,11001+21001,16473.77242857143
gfx936,int4_w4a16,torch.float16,14336,256,7168,256,8,0,0,asm,11001+21001,19168.557142857146
gfx936,int4_w4a16,torch.float16,16384,256,7168,256,8,0,0,asm,11001+21001,21783.615857142864
gfx936,int4_w4a16,torch.float16,17408,256,7168,256,8,0,0,asm,11001+21001,23135.63657142856
gfx936,int4_w4a16,torch.float16,24576,256,7168,256,8,0,0,asm,11001+21001,32335.211
gfx936,int4_w4a16,torch.float16,32768,256,7168,256,8,0,0,asm,11001+21001,42933.38957142859
gfx938,int4_w4a16,torch.float16,1,256,7168,256,8,0,0,asm,10000+20000,105.43471428539071
gfx938,int4_w4a16,torch.float16,2,256,7168,256,8,0,0,asm,10000+20000,127.08042857237159
gfx938,int4_w4a16,torch.float16,4,256,7168,256,8,0,0,asm,10000+20001,192.08599999959446
gfx938,int4_w4a16,torch.float16,6,256,7168,256,8,0,0,asm,10000+20000,284.08557142796263
gfx938,int4_w4a16,torch.float16,8,256,7168,256,8,0,0,asm,10000+20002,344.4512857141838
gfx938,int4_w4a16,torch.float16,10,256,7168,256,8,0,0,asm,10000+20000,440.88528571384296
gfx938,int4_w4a16,torch.float16,12,256,7168,256,8,0,0,asm,10000+20001,501.20514285670856
gfx938,int4_w4a16,torch.float16,14,256,7168,256,8,0,0,asm,10000+20000,596.9989999990378
gfx938,int4_w4a16,torch.float16,16,256,7168,256,8,0,0,asm,10000+20002,605.4334285715928
gfx938,int4_w4a16,torch.float16,20,256,7168,256,8,0,0,asm,10000+20001,750.7557142856531
gfx938,int4_w4a16,torch.float16,24,256,7168,256,8,0,0,asm,10000+20001,756.40142857137
gfx938,int4_w4a16,torch.float16,28,256,7168,256,8,0,0,asm,10000+20001,825.547142857087
gfx938,int4_w4a16,torch.float16,32,256,7168,256,8,0,0,asm,10000+20001,836.5414285711678
gfx938,int4_w4a16,torch.float16,36,256,7168,256,8,0,0,asm,10000+20002,911.303857142904
gfx938,int4_w4a16,torch.float16,40,256,7168,256,8,0,0,asm,10000+20002,967.166571428567
gfx938,int4_w4a16,torch.float16,44,256,7168,256,8,0,0,asm,10000+20001,1061.2692857140541
gfx938,int4_w4a16,torch.float16,48,256,7168,256,8,0,0,asm,10000+20001,1066.9377142857495
gfx938,int4_w4a16,torch.float16,56,256,7168,256,8,0,0,asm,10000+20001,1116.629000000057
gfx938,int4_w4a16,torch.float16,64,256,7168,256,8,0,0,asm,10000+20002,1193.4288571427876
gfx938,int4_w4a16,torch.float16,80,256,7168,256,8,0,0,asm,10000+20002,1217.9315714285476
gfx938,int4_w4a16,torch.float16,96,256,7168,256,8,0,0,asm,10000+20002,1250.1371428567384
gfx938,int4_w4a16,torch.float16,112,256,7168,256,8,0,0,asm,10000+20002,1273.9772857142877
gfx938,int4_w4a16,torch.float16,128,256,7168,256,8,0,0,asm,10000+20002,1276.6285714285416
gfx938,int4_w4a16,torch.float16,160,256,7168,256,8,0,0,asm,10000+20002,1278.320142857198
gfx938,int4_w4a16,torch.float16,192,256,7168,256,8,0,0,asm,10000+20002,1289.4514285716493
gfx938,int4_w4a16,torch.float16,224,256,7168,256,8,0,0,asm,10000+20002,1295.0284285714984
gfx938,int4_w4a16,torch.float16,256,256,7168,256,8,0,0,asm,10000+20001,1408.8795714286555
gfx938,int4_w4a16,torch.float16,320,256,7168,256,8,0,0,asm,10000+20001,1426.959571428597
gfx938,int4_w4a16,torch.float16,384,256,7168,256,8,0,0,asm,10000+20001,1486.8908571428951
gfx938,int4_w4a16,torch.float16,448,256,7168,256,8,0,0,asm,10000+20002,1611.6447142859522
gfx938,int4_w4a16,torch.float16,512,256,7168,256,8,0,0,asm,10000+20002,1923.9182857143958
gfx938,int4_w4a16,torch.float16,576,256,7168,256,8,0,0,asm,10000+20002,2170.1348571429094
gfx938,int4_w4a16,torch.float16,640,256,7168,256,8,0,0,asm,10000+20001,2377.3797142855556
gfx938,int4_w4a16,torch.float16,704,256,7168,256,8,0,0,asm,10000+20002,2500.55657142893
gfx938,int4_w4a16,torch.float16,768,256,7168,256,8,0,0,asm,10000+20002,2559.2078571429342
gfx938,int4_w4a16,torch.float16,832,256,7168,256,8,0,0,asm,10000+20001,2760.692999999305
gfx938,int4_w4a16,torch.float16,896,256,7168,256,8,0,0,asm,10000+20002,2826.293000000263
gfx938,int4_w4a16,torch.float16,960,256,7168,256,8,0,0,asm,10000+20002,3070.77228571433
gfx938,int4_w4a16,torch.float16,1024,256,7168,256,8,0,0,asm,10000+20002,3187.7548571428715
gfx938,int4_w4a16,torch.float16,1152,256,7168,256,8,0,0,asm,10000+20002,3501.8795714285225
gfx938,int4_w4a16,torch.float16,1280,256,7168,256,8,0,0,asm,10000+20002,3815.9817142858437
gfx938,int4_w4a16,torch.float16,1408,256,7168,256,8,0,0,asm,10000+20002,4135.843714285708
gfx938,int4_w4a16,torch.float16,1536,256,7168,256,8,0,0,asm,10000+20002,4453.054285714236
gfx938,int4_w4a16,torch.float16,1664,256,7168,256,8,0,0,asm,10000+20002,4908.824428571521
gfx938,int4_w4a16,torch.float16,1792,256,7168,256,8,0,0,asm,10000+20002,5088.504000000057
gfx938,int4_w4a16,torch.float16,1920,256,7168,256,8,0,0,asm,10000+20002,5400.8005714285455
gfx938,int4_w4a16,torch.float16,2048,256,7168,256,8,0,0,asm,10000+20002,5717.8740000000025
gfx938,int4_w4a16,torch.float16,2304,256,7168,256,8,0,0,asm,10000+20002,6355.015000000048
gfx938,int4_w4a16,torch.float16,2560,256,7168,256,8,0,0,asm,10000+20002,7130.669857142909
gfx938,int4_w4a16,torch.float16,2816,256,7168,256,8,0,0,asm,10000+20002,7623.331428571405
gfx938,int4_w4a16,torch.float16,3072,256,7168,256,8,0,0,asm,10000+20002,8248.769285714088
gfx938,int4_w4a16,torch.float16,3328,256,7168,256,8,0,0,asm,10000+20002,8877.841571428573
gfx938,int4_w4a16,torch.float16,3584,256,7168,256,8,0,0,asm,10000+20002,9516.399999999574
gfx938,int4_w4a16,torch.float16,3840,256,7168,256,8,0,0,asm,10000+20002,10147.803285714293
gfx938,int4_w4a16,torch.float16,4096,256,7168,256,8,0,0,asm,10000+20002,10784.464142857187
gfx938,int4_w4a16,torch.float16,4608,256,7168,256,8,0,0,asm,10000+20002,12002.792285714431
gfx938,int4_w4a16,torch.float16,5120,256,7168,256,8,0,0,asm,10000+20002,13309.120142857179
gfx938,int4_w4a16,torch.float16,5632,256,7168,256,8,0,0,asm,10000+20002,14576.659714285517
gfx938,int4_w4a16,torch.float16,6144,256,7168,256,8,0,0,asm,10000+20002,15842.21071428606
gfx938,int4_w4a16,torch.float16,6656,256,7168,256,8,0,0,asm,10000+20002,17109.932714285194
gfx938,int4_w4a16,torch.float16,7168,256,7168,256,8,0,0,asm,10000+20002,18361.67728571487
gfx938,int4_w4a16,torch.float16,7680,256,7168,256,8,0,0,asm,10000+20002,19628.737285714065
gfx938,int4_w4a16,torch.float16,8192,256,7168,256,8,0,0,asm,10000+20002,20897.122571428772
gfx938,int4_w4a16,torch.float16,10240,256,7168,256,8,0,0,asm,10000+20002,25957.222142856703
gfx938,int4_w4a16,torch.float16,12288,256,7168,256,8,0,0,asm,10000+20002,31018.37357142857
gfx938,int4_w4a16,torch.float16,14336,256,7168,256,8,0,0,asm,10000+20002,36075.15457142866
gfx938,int4_w4a16,torch.float16,16384,256,7168,256,8,0,0,asm,10000+20002,41135.762714286466
gfx938,int4_w4a16,torch.float16,17408,256,7168,256,8,0,0,asm,10000+20002,43667.20685714267
gfx938,int4_w4a16,torch.float16,24576,256,7168,256,8,0,0,asm,10000+20002,61364.23214285701
gfx938,int4_w4a16,torch.float16,32768,256,7168,256,8,0,0,asm,10000+20002,81594.00357142859
gfx938,int4_w4a16,torch.float16,1,256,7168,384,8,0,0,asm,10000+20000,108.1967
gfx938,int4_w4a16,torch.float16,2,256,7168,384,8,0,0,asm,10000+20000,126.5040
gfx938,int4_w4a16,torch.float16,4,256,7168,384,8,0,0,asm,10000+20001,196.5924
gfx938,int4_w4a16,torch.float16,6,256,7168,384,8,0,0,asm,10000+20000,290.6636
gfx938,int4_w4a16,torch.float16,8,256,7168,384,8,0,0,asm,10000+20002,348.1119
gfx938,int4_w4a16,torch.float16,10,256,7168,384,8,0,0,asm,10000+20000,445.9054
gfx938,int4_w4a16,torch.float16,12,256,7168,384,8,0,0,asm,10000+20001,511.1852
gfx938,int4_w4a16,torch.float16,14,256,7168,384,8,0,0,asm,10000+20001,519.2441
gfx938,int4_w4a16,torch.float16,16,256,7168,384,8,0,0,asm,10000+20002,616.4397
gfx938,int4_w4a16,torch.float16,20,256,7168,384,8,0,0,asm,10000+20001,753.6237
gfx938,int4_w4a16,torch.float16,24,256,7168,384,8,0,0,asm,10000+20001,817.4551
gfx938,int4_w4a16,torch.float16,28,256,7168,384,8,0,0,asm,10000+20002,912.1243
gfx938,int4_w4a16,torch.float16,32,256,7168,384,8,0,0,asm,10000+20002,963.9222
gfx938,int4_w4a16,torch.float16,36,256,7168,384,8,0,0,asm,10000+20001,1108.6964
gfx938,int4_w4a16,torch.float16,40,256,7168,384,8,0,0,asm,10000+20002,1200.7804
gfx938,int4_w4a16,torch.float16,44,256,7168,384,8,0,0,asm,10000+20002,1252.2244
gfx938,int4_w4a16,torch.float16,48,256,7168,384,8,0,0,asm,10000+20002,1264.3423
gfx938,int4_w4a16,torch.float16,56,256,7168,384,8,0,0,asm,10000+20001,1378.8346
gfx938,int4_w4a16,torch.float16,64,256,7168,384,8,0,0,asm,10000+20002,1498.6154
gfx938,int4_w4a16,torch.float16,80,256,7168,384,8,0,0,asm,10000+20002,1581.3351
gfx938,int4_w4a16,torch.float16,96,256,7168,384,8,0,0,asm,10000+20001,1686.9685
gfx938,int4_w4a16,torch.float16,112,256,7168,384,8,0,0,asm,10000+20001,1739.7936
gfx938,int4_w4a16,torch.float16,128,256,7168,384,8,0,0,asm,10000+20002,1813.1493
gfx938,int4_w4a16,torch.float16,160,256,7168,384,8,0,0,asm,10000+20002,1869.6711
gfx938,int4_w4a16,torch.float16,192,256,7168,384,8,0,0,asm,10000+20002,1879.8691
gfx938,int4_w4a16,torch.float16,224,256,7168,384,8,0,0,asm,10000+20002,1898.5048
gfx938,int4_w4a16,torch.float16,256,256,7168,384,8,0,0,asm,10000+20002,1908.3069
gfx938,int4_w4a16,torch.float16,320,256,7168,384,8,0,0,asm,10000+20002,1914.6057
gfx938,int4_w4a16,torch.float16,384,256,7168,384,8,0,0,asm,10000+20001,2022.0243
gfx938,int4_w4a16,torch.float16,448,256,7168,384,8,0,0,asm,10000+20001,2031.7760
gfx938,int4_w4a16,torch.float16,512,256,7168,384,8,0,0,asm,10000+20001,2056.854
gfx938,int4_w4a16,torch.float16,576,256,7168,384,8,0,0,asm,10000+20002,2222.1249
gfx938,int4_w4a16,torch.float16,640,256,7168,384,8,0,0,asm,10000+20001,2354.6466
gfx938,int4_w4a16,torch.float16,768,256,7168,384,8,0,0,asm,10000+20002,2802.9235
gfx938,int4_w4a16,torch.float16,896,256,7168,384,8,0,0,asm,10000+20002,3359.1829
gfx938,int4_w4a16,torch.float16,1024,256,7168,384,8,0,0,asm,10000+20002,3622.8789
gfx938,int4_w4a16,torch.float16,1280,256,7168,384,8,0,0,asm,10000+20002,4052.1077
gfx938,int4_w4a16,torch.float16,1536,256,7168,384,8,0,0,asm,10000+20002,4672.0215
gfx938,int4_w4a16,torch.float16,2048,256,7168,384,8,0,0,asm,10000+20002,5924.0686
gfx938,int4_w4a16,torch.float16,2560,256,7168,384,8,0,0,asm,10000+20002,7228.8482
gfx938,int4_w4a16,torch.float16,3072,256,7168,384,8,0,0,asm,10000+20002,8496.5672
gfx938,int4_w4a16,torch.float16,3584,256,7168,384,8,0,0,asm,10000+20002,9699.309
gfx938,int4_w4a16,torch.float16,3840,256,7168,384,8,0,0,asm,10000+20002,10366.0861
gfx938,int4_w4a16,torch.float16,4096,256,7168,384,8,0,0,asm,10000+20002,10946.9519
gfx938,int4_w4a16,torch.float16,4608,256,7168,384,8,0,0,asm,10000+20002,12245.0451
gfx938,int4_w4a16,torch.float16,5120,256,7168,384,8,0,0,asm,10000+20002,13491.7789
gfx938,int4_w4a16,torch.float16,6144,256,7168,384,8,0,0,asm,10000+20002,15987.2496
gfx938,int4_w4a16,torch.float16,7168,256,7168,384,8,0,0,asm,10000+20002,18455.4978
gfx938,int4_w4a16,torch.float16,7680,256,7168,384,8,0,0,asm,10000+20002,19750.3316
gfx938,int4_w4a16,torch.float16,8192,256,7168,384,8,0,0,asm,10000+20002,21000.2742
gfx938,int4_w4a16,torch.float16,10240,256,7168,384,8,0,0,asm,10000+20002,26001.247
gfx938,int4_w4a16,torch.float16,12288,256,7168,384,8,0,0,asm,10000+20002,30978.9432
gfx938,int4_w4a16,torch.float16,16384,256,7168,384,8,0,0,asm,10000+20002,40987.1437
gfx938,int4_w4a16,torch.float16,24576,256,7168,384,8,0,0,asm,10000+20002,60960.2526
gfx938,int4_w4a16,torch.float16,32768,256,7168,384,8,0,0,asm,10000+20002,80978.0681
arch,quant_type,indtype,token,inter_dim,model_dim,expert,topk,q_size_n,q_size_k,sol_type,sol_id,time_us
gfx936,int4_w4a8,torch.float16,1,256,7168,256,8,0,0,asm,10001+20100,121.2912857142849
gfx936,int4_w4a8,torch.float16,2,256,7168,256,8,0,0,asm,10001+20000,137.86271428571425
gfx936,int4_w4a8,torch.float16,4,256,7168,256,8,0,0,asm,10002+20101,181.22271428571534
gfx936,int4_w4a8,torch.float16,6,256,7168,256,8,0,0,asm,10001+20100,243.78257142857066
gfx936,int4_w4a8,torch.float16,8,256,7168,256,8,0,0,asm,10001+20101,270.7997142857147
gfx936,int4_w4a8,torch.float16,10,256,7168,256,8,0,0,asm,10001+20101,305.10828571428607
gfx936,int4_w4a8,torch.float16,12,256,7168,256,8,0,0,asm,10002+20101,376.28528571428666
gfx936,int4_w4a8,torch.float16,14,256,7168,256,8,0,0,asm,10001+20101,385.5881428571429
gfx936,int4_w4a8,torch.float16,16,256,7168,256,8,0,0,asm,10002+20101,415.09671428571426
gfx936,int4_w4a8,torch.float16,20,256,7168,256,8,0,0,asm,10001+20101,496.4679999999984
gfx936,int4_w4a8,torch.float16,24,256,7168,256,8,0,0,asm,10001+20101,504.7651428571422
gfx936,int4_w4a8,torch.float16,28,256,7168,256,8,0,0,asm,10001+20101,546.5937142857139
gfx936,int4_w4a8,torch.float16,32,256,7168,256,8,0,0,asm,10001+20101,552.2165714285693
gfx936,int4_w4a8,torch.float16,36,256,7168,256,8,0,0,asm,10001+20101,629.9535714285719
gfx936,int4_w4a8,torch.float16,40,256,7168,256,8,0,0,asm,10002+20101,665.0164285714278
gfx936,int4_w4a8,torch.float16,44,256,7168,256,8,0,0,asm,10001+20101,673.3135714285709
gfx936,int4_w4a8,torch.float16,48,256,7168,256,8,0,0,asm,10001+20101,732.5589999999995
gfx936,int4_w4a8,torch.float16,56,256,7168,256,8,0,0,asm,10001+20101,769.8848571428576
gfx936,int4_w4a8,torch.float16,64,256,7168,256,8,0,0,asm,10001+20101,783.5077142857135
gfx936,int4_w4a8,torch.float16,72,256,7168,256,8,0,0,asm,10002+20101,816.6962857142868
gfx936,int4_w4a8,torch.float16,80,256,7168,256,8,0,0,asm,10001+20101,812.2162857142861
gfx936,int4_w4a8,torch.float16,96,256,7168,256,8,0,0,asm,10001+20101,834.7534285714281
gfx936,int4_w4a8,torch.float16,112,256,7168,256,8,0,0,asm,10001+20101,888.2618571428568
gfx936,int4_w4a8,torch.float16,128,256,7168,256,8,0,0,asm,10001+20101,894.7989999999998
gfx936,int4_w4a8,torch.float16,160,256,7168,256,8,0,0,asm,10002+20101,916.1018571428574
gfx936,int4_w4a8,torch.float16,192,256,7168,256,8,0,0,asm,10002+20101,937.0160000000004
gfx936,int4_w4a8,torch.float16,224,256,7168,256,8,0,0,asm,10002+20101,980.3990000000005
gfx936,int4_w4a8,torch.float16,256,256,7168,256,8,0,0,asm,10002+20101,989.221714285714
gfx936,int4_w4a8,torch.float16,320,256,7168,256,8,0,0,asm,10002+20101,1032.2160000000001
gfx936,int4_w4a8,torch.float16,384,256,7168,256,8,0,0,asm,10002+20101,1075.0731428571432
gfx936,int4_w4a8,torch.float16,448,256,7168,256,8,0,0,asm,10002+20101,1112.9245714285714
gfx936,int4_w4a8,torch.float16,512,256,7168,256,8,0,0,asm,11001+21101,1172.170142857143
gfx936,int4_w4a8,torch.float16,576,256,7168,256,8,0,0,asm,11001+21101,1200.741428571429
gfx936,int4_w4a8,torch.float16,640,256,7168,256,8,0,0,asm,11001+21101,1236.4672857142875
gfx936,int4_w4a8,torch.float16,704,256,7168,256,8,0,0,asm,11001+21101,1269.9985714285708
gfx936,int4_w4a8,torch.float16,768,256,7168,256,8,0,0,asm,11001+21101,1321.54142857143
gfx936,int4_w4a8,torch.float16,832,256,7168,256,8,0,0,asm,11001+21101,1423.6670000000001
gfx936,int4_w4a8,torch.float16,896,256,7168,256,8,0,0,asm,11001+21101,1467.1412857142861
gfx936,int4_w4a8,torch.float16,960,256,7168,256,8,0,0,asm,11001+21101,1529.1754285714298
gfx936,int4_w4a8,torch.float16,1024,256,7168,256,8,0,0,asm,11001+21101,1651.9409999999991
gfx936,int4_w4a8,torch.float16,1152,256,7168,256,8,0,0,asm,12000+22101,1841.1522857142859
gfx936,int4_w4a8,torch.float16,1280,256,7168,256,8,0,0,asm,12000+22101,1928.740714285715
gfx936,int4_w4a8,torch.float16,1408,256,7168,256,8,0,0,asm,12000+22101,2031.506428571427
gfx936,int4_w4a8,torch.float16,1536,256,7168,256,8,0,0,asm,12000+22100,2093.7921428571417
gfx936,int4_w4a8,torch.float16,1664,256,7168,256,8,0,0,asm,12000+22100,2159.643428571429
gfx936,int4_w4a8,torch.float16,1792,256,7168,256,8,0,0,asm,12000+22100,2340.2147142857125
gfx936,int4_w4a8,torch.float16,1920,256,7168,256,8,0,0,asm,12000+22101,2536.511571428572
gfx936,int4_w4a8,torch.float16,2048,256,7168,256,8,0,0,asm,12000+22101,2711.5742857142855
gfx936,int4_w4a8,torch.float16,2304,256,7168,256,8,0,0,asm,12000+22101,3163.2538571428563
gfx936,int4_w4a8,torch.float16,2560,256,7168,256,8,0,0,asm,11001+21101,3370.6592857142864
gfx936,int4_w4a8,torch.float16,2816,256,7168,256,8,0,0,asm,12000+22101,3553.2875714285706
gfx936,int4_w4a8,torch.float16,3072,256,7168,256,8,0,0,asm,12000+22101,3640.8532857142886
gfx936,int4_w4a8,torch.float16,3328,256,7168,256,8,0,0,asm,12000+22101,3754.5674285714254
gfx936,int4_w4a8,torch.float16,3584,256,7168,256,8,0,0,asm,12000+22101,4066.704285714291
gfx936,int4_w4a8,torch.float16,3840,256,7168,256,8,0,0,asm,12000+22101,4285.606857142853
gfx936,int4_w4a8,torch.float16,4096,256,7168,256,8,0,0,asm,12000+22101,4511.504
gfx936,int4_w4a8,torch.float16,4608,256,7168,256,8,0,0,asm,12000+22101,5246.771714285715
gfx936,int4_w4a8,torch.float16,5120,256,7168,256,8,0,0,asm,12000+22101,5601.42285714286
gfx936,int4_w4a8,torch.float16,5632,256,7168,256,8,0,0,asm,12000+22101,5841.239571428574
gfx936,int4_w4a8,torch.float16,6144,256,7168,256,8,0,0,asm,12000+22101,6483.31914285714
gfx936,int4_w4a8,torch.float16,6656,256,7168,256,8,0,0,asm,12000+22101,7094.564285714291
gfx936,int4_w4a8,torch.float16,7168,256,7168,256,8,0,0,asm,12000+22101,7407.546857142855
gfx936,int4_w4a8,torch.float16,7680,256,7168,256,8,0,0,asm,12000+22101,7759.112571428579
gfx936,int4_w4a8,torch.float16,8192,256,7168,256,8,0,0,asm,12000+22101,8344.666142857135
gfx936,int4_w4a8,torch.float16,10240,256,7168,256,8,0,0,asm,12000+22101,10278.127285714294
gfx936,int4_w4a8,torch.float16,12288,256,7168,256,8,0,0,asm,12000+22101,12087.954142857148
gfx936,int4_w4a8,torch.float16,14336,256,7168,256,8,0,0,asm,12000+22101,13912.912571428593
gfx936,int4_w4a8,torch.float16,16384,256,7168,256,8,0,0,asm,12000+22101,15923.08257142857
gfx936,int4_w4a8,torch.float16,17408,256,7168,256,8,0,0,asm,13000+23101,17620.064000000006
gfx936,int4_w4a8,torch.float16,24576,256,7168,256,8,0,0,asm,13000+23101,22840.699571428548
gfx936,int4_w4a8,torch.float16,32768,256,7168,256,8,0,0,asm,13000+23101,29839.300142857148
gfx936,int4_w4a8,torch.float16,1,128,7168,256,8,0,0,asm,10001+20000,118.84557142857135
gfx936,int4_w4a8,torch.float16,8,128,7168,256,8,0,0,asm,10002+20000,210.50271428571457
gfx936,int4_w4a8,torch.float16,32,128,7168,256,8,0,0,asm,10002+20000,410.98257142857136
gfx936,int4_w4a8,torch.float16,48,128,7168,256,8,0,0,asm,10001+20000,486.6395714285716
gfx936,int4_w4a8,torch.float16,64,128,7168,256,8,0,0,asm,10001+20000,507.0281428571426
gfx936,int4_w4a8,torch.float16,80,128,7168,256,8,0,0,asm,10001+20000,530.9595714285716
gfx936,int4_w4a8,torch.float16,96,128,7168,256,8,0,0,asm,10002+20000,564.7651428571434
gfx936,int4_w4a8,torch.float16,128,128,7168,256,8,0,0,asm,10002+20000,588.8794285714288
gfx936,int4_w4a8,torch.float16,256,128,7168,256,8,0,0,asm,10002+20000,651.4622857142858
gfx936,int4_w4a8,torch.float16,512,128,7168,256,8,0,0,asm,11001+21000,816.7192857142861
gfx936,int4_w4a8,torch.float16,768,128,7168,256,8,0,0,asm,11001+21000,905.7248571428562
gfx936,int4_w4a8,torch.float16,1024,128,7168,256,8,0,0,asm,11001+21000,1194.478857142858
gfx936,int4_w4a8,torch.float16,2048,128,7168,256,8,0,0,asm,11001+21000,2014.7065714285711
gfx936,int4_w4a8,torch.float16,3072,128,7168,256,8,0,0,asm,13000+23000,2794.6144285714277
gfx936,int4_w4a8,torch.float16,4096,128,7168,256,8,0,0,asm,12000+22000,3567.93942857143
gfx936,int4_w4a8,torch.float16,5120,128,7168,256,8,0,0,asm,12000+22000,4365.652857142859
gfx936,int4_w4a8,torch.float16,6144,128,7168,256,8,0,0,asm,12000+22000,5152.532285714286
gfx936,int4_w4a8,torch.float16,8192,128,7168,256,8,0,0,asm,13000+23000,6526.58800000001
gfx936,int4_w4a8,torch.float16,10240,128,7168,256,8,0,0,asm,13000+23000,8007.180714285722
gfx936,int4_w4a8,torch.float16,12288,128,7168,256,8,0,0,asm,13000+23000,9478.585142857133
gfx936,int4_w4a8,torch.float16,16384,128,7168,256,8,0,0,asm,13000+23000,12350.97114285713
gfx936,int4_w4a8,torch.float16,24576,128,7168,256,8,0,0,asm,13000+23000,17921.823142857134
gfx936,int4_w4a8,torch.float16,32768,128,7168,256,8,0,0,asm,13000+23000,23625.54328571425
arch,quant_type,indtype,token,inter_dim,model_dim,expert,topk,q_size_n,q_size_k,sol_type,sol_id,time_us
gfx936,int8_w8a8_channel,torch.float16,1,128,7168,256,8,0,0,asm,10000+20100,62.7804
gfx936,int8_w8a8_channel,torch.float16,2,128,7168,256,8,0,0,asm,10006+20102,78.3931
gfx936,int8_w8a8_channel,torch.float16,3,128,7168,256,8,0,0,asm,10009+20102,97.3237
gfx936,int8_w8a8_channel,torch.float16,4,128,7168,256,8,0,0,asm,10010+20102,117.012
gfx936,int8_w8a8_channel,torch.float16,5,128,7168,256,8,0,0,asm,10011+20102,138.9489
gfx936,int8_w8a8_channel,torch.float16,6,128,7168,256,8,0,0,asm,10001+20102,161.0289
gfx936,int8_w8a8_channel,torch.float16,7,128,7168,256,8,0,0,asm,10013+20102,177.4583
gfx936,int8_w8a8_channel,torch.float16,8,128,7168,256,8,0,0,asm,10001+20102,187.4036
gfx936,int8_w8a8_channel,torch.float16,9,128,7168,256,8,0,0,asm,10000+20102,202.8142
gfx936,int8_w8a8_channel,torch.float16,10,128,7168,256,8,0,0,asm,10001+20102,214.7384
gfx936,int8_w8a8_channel,torch.float16,11,128,7168,256,8,0,0,asm,10000+20102,231.7405
gfx936,int8_w8a8_channel,torch.float16,12,128,7168,256,8,0,0,asm,10001+20102,245.029
gfx936,int8_w8a8_channel,torch.float16,13,128,7168,256,8,0,0,asm,10001+20102,264.4648
gfx936,int8_w8a8_channel,torch.float16,14,128,7168,256,8,0,0,asm,10001+20102,276.8016
gfx936,int8_w8a8_channel,torch.float16,15,128,7168,256,8,0,0,asm,10000+20102,287.3027
gfx936,int8_w8a8_channel,torch.float16,16,128,7168,256,8,0,0,asm,10000+20102,291.2606
gfx936,int8_w8a8_channel,torch.float16,17,128,7168,256,8,0,0,asm,10001+20102,294.9376
gfx936,int8_w8a8_channel,torch.float16,18,128,7168,256,8,0,0,asm,10000+20102,310.9124
gfx936,int8_w8a8_channel,torch.float16,20,128,7168,256,8,0,0,asm,10001+20001,336.7987
gfx936,int8_w8a8_channel,torch.float16,24,128,7168,256,8,0,0,asm,10001+20001,378.6513
gfx936,int8_w8a8_channel,torch.float16,28,128,7168,256,8,0,0,asm,10001+20001,432.1786
gfx936,int8_w8a8_channel,torch.float16,32,128,7168,256,8,0,0,asm,10001+20001,459.5133
gfx936,int8_w8a8_channel,torch.float16,34,128,7168,256,8,0,0,asm,10000+20001,458.9208
gfx936,int8_w8a8_channel,torch.float16,36,128,7168,256,8,0,0,asm,10001+20001,476.6135
gfx936,int8_w8a8_channel,torch.float16,40,128,7168,256,8,0,0,asm,10001+20001,492.2177
gfx936,int8_w8a8_channel,torch.float16,44,128,7168,256,8,0,0,asm,10001+20001,516.9756
gfx936,int8_w8a8_channel,torch.float16,48,128,7168,256,8,0,0,asm,10001+20001,527.0556
gfx936,int8_w8a8_channel,torch.float16,56,128,7168,256,8,0,0,asm,10001+20001,554.8452
gfx936,int8_w8a8_channel,torch.float16,64,128,7168,256,8,0,0,asm,10001+20001,576.5378
gfx936,int8_w8a8_channel,torch.float16,68,128,7168,256,8,0,0,asm,10000+20001,581.8515
gfx936,int8_w8a8_channel,torch.float16,72,128,7168,256,8,0,0,asm,10000+20001,595.1904
gfx936,int8_w8a8_channel,torch.float16,80,128,7168,256,8,0,0,asm,10001+20001,611.2831
gfx936,int8_w8a8_channel,torch.float16,88,128,7168,256,8,0,0,asm,10001+20001,635.0894
gfx936,int8_w8a8_channel,torch.float16,96,128,7168,256,8,0,0,asm,10001+20001,644.9505
gfx936,int8_w8a8_channel,torch.float16,104,128,7168,256,8,0,0,asm,10000+20001,650.0705
gfx936,int8_w8a8_channel,torch.float16,112,128,7168,256,8,0,0,asm,10001+20001,657.5484
gfx936,int8_w8a8_channel,torch.float16,128,128,7168,256,8,0,0,asm,10001+20001,683.5779
gfx936,int8_w8a8_channel,torch.float16,144,128,7168,256,8,0,0,asm,10001+20001,686.4916
gfx936,int8_w8a8_channel,torch.float16,160,128,7168,256,8,0,0,asm,10001+20001,696.2768
gfx936,int8_w8a8_channel,torch.float16,192,128,7168,256,8,0,0,asm,10001+20001,709.7168
gfx936,int8_w8a8_channel,torch.float16,224,128,7168,256,8,0,0,asm,10001+20001,740.2179
gfx936,int8_w8a8_channel,torch.float16,256,128,7168,256,8,0,0,asm,10001+20001,745.6664
gfx936,int8_w8a8_channel,torch.float16,320,128,7168,256,8,0,0,asm,11001+21001,775.7295
gfx936,int8_w8a8_channel,torch.float16,384,128,7168,256,8,0,0,asm,11001+21001,795.1484
gfx936,int8_w8a8_channel,torch.float16,448,128,7168,256,8,0,0,asm,11001+21001,825.2537
gfx936,int8_w8a8_channel,torch.float16,512,128,7168,256,8,0,0,asm,11001+21001,846.2138
gfx936,int8_w8a8_channel,torch.float16,576,128,7168,256,8,0,0,asm,11001+21001,871.5864
gfx936,int8_w8a8_channel,torch.float16,640,128,7168,256,8,0,0,asm,11001+21001,892.3527
gfx936,int8_w8a8_channel,torch.float16,704,128,7168,256,8,0,0,asm,11006+21001,916.4117
gfx936,int8_w8a8_channel,torch.float16,768,128,7168,256,8,0,0,asm,11006+21001,938.736
gfx936,int8_w8a8_channel,torch.float16,832,128,7168,256,8,0,0,asm,11007+21001,965.1192
gfx936,int8_w8a8_channel,torch.float16,896,128,7168,256,8,0,0,asm,11007+21001,981.9782
gfx936,int8_w8a8_channel,torch.float16,960,128,7168,256,8,0,0,asm,11006+21001,1012.9761
gfx936,int8_w8a8_channel,torch.float16,1024,128,7168,256,8,0,0,asm,11007+21001,1019.0813
gfx936,int8_w8a8_channel,torch.float16,1152,128,7168,256,8,0,0,asm,11005+21001,1077.9614
gfx936,int8_w8a8_channel,torch.float16,1280,128,7168,256,8,0,0,asm,12004+22001,1130.8541
gfx936,int8_w8a8_channel,torch.float16,1408,128,7168,256,8,0,0,asm,12004+22001,1175.7888
gfx936,int8_w8a8_channel,torch.float16,1536,128,7168,256,8,0,0,asm,12004+22001,1212.8668
gfx936,int8_w8a8_channel,torch.float16,1664,128,7168,256,8,0,0,asm,12004+22001,1250.3489
gfx936,int8_w8a8_channel,torch.float16,1792,128,7168,256,8,0,0,asm,11005+21001,1300.5047
gfx936,int8_w8a8_channel,torch.float16,1920,128,7168,256,8,0,0,asm,12004+22001,1373.9701
gfx936,int8_w8a8_channel,torch.float16,2048,128,7168,256,8,0,0,asm,12005+22001,1414.9982
gfx936,int8_w8a8_channel,torch.float16,2304,128,7168,256,8,0,0,asm,12005+22001,1543.9078
gfx936,int8_w8a8_channel,torch.float16,2560,128,7168,256,8,0,0,asm,13000+23001,1663.1165
gfx936,int8_w8a8_channel,torch.float16,2816,128,7168,256,8,0,0,asm,13000+23001,1722.0387
gfx936,int8_w8a8_channel,torch.float16,3072,128,7168,256,8,0,0,asm,12005+22001,1793.9798
gfx936,int8_w8a8_channel,torch.float16,3328,128,7168,256,8,0,0,asm,12001+22001,1865.4831
gfx936,int8_w8a8_channel,torch.float16,3584,128,7168,256,8,0,0,asm,12001+22001,1932.7758
gfx936,int8_w8a8_channel,torch.float16,3840,128,7168,256,8,0,0,asm,12001+22001,2087.9508
gfx936,int8_w8a8_channel,torch.float16,4096,128,7168,256,8,0,0,asm,12001+22001,2196.8436
gfx936,int8_w8a8_channel,torch.float16,4608,128,7168,256,8,0,0,asm,12001+22001,2510.9156
gfx936,int8_w8a8_channel,torch.float16,5120,128,7168,256,8,0,0,asm,12001+22001,2654.6632
gfx936,int8_w8a8_channel,torch.float16,5632,128,7168,256,8,0,0,asm,12003+22001,2828.9119
gfx936,int8_w8a8_channel,torch.float16,6144,128,7168,256,8,0,0,asm,13001+23001,3011.9016
gfx936,int8_w8a8_channel,torch.float16,6656,128,7168,256,8,0,0,asm,13001+23001,3129.9651
gfx936,int8_w8a8_channel,torch.float16,7168,128,7168,256,8,0,0,asm,13001+23001,3264.7526
gfx936,int8_w8a8_channel,torch.float16,7680,128,7168,256,8,0,0,asm,13001+23001,3438.3445
gfx936,int8_w8a8_channel,torch.float16,8192,128,7168,256,8,0,0,asm,13001+23001,3778.766
gfx936,int8_w8a8_channel,torch.float16,10240,128,7168,256,8,0,0,asm,13001+23001,4631.5252
gfx936,int8_w8a8_channel,torch.float16,12288,128,7168,256,8,0,0,asm,13001+23001,5377.9096
gfx936,int8_w8a8_channel,torch.float16,14336,128,7168,256,8,0,0,asm,13001+23001,6130.6435
gfx936,int8_w8a8_channel,torch.float16,16384,128,7168,256,8,0,0,asm,13001+23001,7020.1861
gfx936,int8_w8a8_channel,torch.float16,17408,128,7168,256,8,0,0,asm,13001+23001,7488.0522
gfx936,int8_w8a8_channel,torch.float16,24576,128,7168,256,8,0,0,asm,13001+23001,10191.3578
gfx936,int8_w8a8_channel,torch.float16,32768,128,7168,256,8,0,0,asm,13001+23001,13416.1804
gfx936,int8_w8a8_channel,torch.float16,40960,128,7168,256,8,0,0,asm,13001+23101,15540.521
gfx936,int8_w8a8_channel,torch.float16,49152,128,7168,256,8,0,0,asm,13001+23101,19230.8184
gfx936,int8_w8a8_channel,torch.float16,57344,128,7168,256,8,0,0,asm,13001+23001,22907.4573
gfx936,int8_w8a8_channel,torch.float16,1,256,7168,256,8,0,0,asm,10001+20001,78.2921
gfx936,int8_w8a8_channel,torch.float16,2,256,7168,256,8,0,0,asm,10002+20001,118.991
gfx936,int8_w8a8_channel,torch.float16,3,256,7168,256,8,0,0,asm,10001+20001,162.9827
gfx936,int8_w8a8_channel,torch.float16,4,256,7168,256,8,0,0,asm,10001+20001,206.8144
gfx936,int8_w8a8_channel,torch.float16,5,256,7168,256,8,0,0,asm,10001+20001,237.9892
gfx936,int8_w8a8_channel,torch.float16,6,256,7168,256,8,0,0,asm,10001+20001,273.4584
gfx936,int8_w8a8_channel,torch.float16,7,256,7168,256,8,0,0,asm,10001+20001,304.4734
gfx936,int8_w8a8_channel,torch.float16,8,256,7168,256,8,0,0,asm,10001+20001,327.3113
gfx936,int8_w8a8_channel,torch.float16,9,256,7168,256,8,0,0,asm,10001+20001,361.2314
gfx936,int8_w8a8_channel,torch.float16,10,256,7168,256,8,0,0,asm,10000+20001,388.6503
gfx936,int8_w8a8_channel,torch.float16,11,256,7168,256,8,0,0,asm,10001+20001,417.4167
gfx936,int8_w8a8_channel,torch.float16,12,256,7168,256,8,0,0,asm,10001+20001,436.6167
gfx936,int8_w8a8_channel,torch.float16,13,256,7168,256,8,0,0,asm,10000+20001,459.8252
gfx936,int8_w8a8_channel,torch.float16,14,256,7168,256,8,0,0,asm,10000+20001,493.1473
gfx936,int8_w8a8_channel,torch.float16,15,256,7168,256,8,0,0,asm,10001+20001,512.6842
gfx936,int8_w8a8_channel,torch.float16,16,256,7168,256,8,0,0,asm,10000+20001,528.9031
gfx936,int8_w8a8_channel,torch.float16,17,256,7168,256,8,0,0,asm,10000+20001,544.2181
gfx936,int8_w8a8_channel,torch.float16,18,256,7168,256,8,0,0,asm,10001+20001,569.5065
gfx936,int8_w8a8_channel,torch.float16,20,256,7168,256,8,0,0,asm,10000+20001,618.4751
gfx936,int8_w8a8_channel,torch.float16,24,256,7168,256,8,0,0,asm,10000+20001,709.7258
gfx936,int8_w8a8_channel,torch.float16,28,256,7168,256,8,0,0,asm,10000+20001,809.2237
gfx936,int8_w8a8_channel,torch.float16,32,256,7168,256,8,0,0,asm,10000+20001,864.8196
gfx936,int8_w8a8_channel,torch.float16,34,256,7168,256,8,0,0,asm,10000+20001,879.0063
gfx936,int8_w8a8_channel,torch.float16,36,256,7168,256,8,0,0,asm,10010+20001,908.7073
gfx936,int8_w8a8_channel,torch.float16,40,256,7168,256,8,0,0,asm,10000+20000,952.076
gfx936,int8_w8a8_channel,torch.float16,44,256,7168,256,8,0,0,asm,11000+21000,996.2529
gfx936,int8_w8a8_channel,torch.float16,48,256,7168,256,8,0,0,asm,10000+20000,1022.4591
gfx936,int8_w8a8_channel,torch.float16,56,256,7168,256,8,0,0,asm,11000+21000,1080.8678
gfx936,int8_w8a8_channel,torch.float16,64,256,7168,256,8,0,0,asm,11000+21000,1122.788
gfx936,int8_w8a8_channel,torch.float16,68,256,7168,256,8,0,0,asm,11000+21000,1136.0427
gfx936,int8_w8a8_channel,torch.float16,72,256,7168,256,8,0,0,asm,11000+21000,1163.3776
gfx936,int8_w8a8_channel,torch.float16,80,256,7168,256,8,0,0,asm,11000+21000,1201.1039
gfx936,int8_w8a8_channel,torch.float16,88,256,7168,256,8,0,0,asm,11000+21000,1241.1966
gfx936,int8_w8a8_channel,torch.float16,96,256,7168,256,8,0,0,asm,11000+21000,1260.2618
gfx936,int8_w8a8_channel,torch.float16,104,256,7168,256,8,0,0,asm,11000+21000,1273.7944
gfx936,int8_w8a8_channel,torch.float16,112,256,7168,256,8,0,0,asm,11000+21001,1286.4258
gfx936,int8_w8a8_channel,torch.float16,128,256,7168,256,8,0,0,asm,11000+21000,1321.8448
gfx936,int8_w8a8_channel,torch.float16,144,256,7168,256,8,0,0,asm,10010+20001,1338.8132
gfx936,int8_w8a8_channel,torch.float16,160,256,7168,256,8,0,0,asm,11000+21000,1357.4742
gfx936,int8_w8a8_channel,torch.float16,192,256,7168,256,8,0,0,asm,10010+20001,1372.8173
gfx936,int8_w8a8_channel,torch.float16,224,256,7168,256,8,0,0,asm,10010+20001,1399.2174
gfx936,int8_w8a8_channel,torch.float16,256,256,7168,256,8,0,0,asm,10010+20001,1403.5626
gfx936,int8_w8a8_channel,torch.float16,320,256,7168,256,8,0,0,asm,10010+20001,1447.9416
gfx936,int8_w8a8_channel,torch.float16,384,256,7168,256,8,0,0,asm,11000+21001,1475.1079
gfx936,int8_w8a8_channel,torch.float16,448,256,7168,256,8,0,0,asm,10013+20001,1487.9921
gfx936,int8_w8a8_channel,torch.float16,512,256,7168,256,8,0,0,asm,10013+20001,1500.4553
gfx936,int8_w8a8_channel,torch.float16,576,256,7168,256,8,0,0,asm,10013+20001,1573.1711
gfx936,int8_w8a8_channel,torch.float16,640,256,7168,256,8,0,0,asm,10011+20001,1601.2554
gfx936,int8_w8a8_channel,torch.float16,704,256,7168,256,8,0,0,asm,11001+21001,1633.8197
gfx936,int8_w8a8_channel,torch.float16,768,256,7168,256,8,0,0,asm,10011+20001,1668.1186
gfx936,int8_w8a8_channel,torch.float16,832,256,7168,256,8,0,0,asm,11006+21001,1701.5249
gfx936,int8_w8a8_channel,torch.float16,896,256,7168,256,8,0,0,asm,11006+21001,1721.0365
gfx936,int8_w8a8_channel,torch.float16,960,256,7168,256,8,0,0,asm,11007+21001,1727.6049
gfx936,int8_w8a8_channel,torch.float16,1024,256,7168,256,8,0,0,asm,11007+21001,1738.0049
gfx936,int8_w8a8_channel,torch.float16,1152,256,7168,256,8,0,0,asm,12004+22001,1793.9292
gfx936,int8_w8a8_channel,torch.float16,1280,256,7168,256,8,0,0,asm,11005+21001,1868.9946
gfx936,int8_w8a8_channel,torch.float16,1408,256,7168,256,8,0,0,asm,11005+21001,1902.3756
gfx936,int8_w8a8_channel,torch.float16,1536,256,7168,256,8,0,0,asm,11005+21001,1928.0683
gfx936,int8_w8a8_channel,torch.float16,1664,256,7168,256,8,0,0,asm,11005+21001,2025.9967
gfx936,int8_w8a8_channel,torch.float16,1792,256,7168,256,8,0,0,asm,12004+22001,2038.5442
gfx936,int8_w8a8_channel,torch.float16,1920,256,7168,256,8,0,0,asm,12000+22001,2154.157
gfx936,int8_w8a8_channel,torch.float16,2048,256,7168,256,8,0,0,asm,13000+23001,2193.4244
gfx936,int8_w8a8_channel,torch.float16,2304,256,7168,256,8,0,0,asm,13000+23001,2250.4602
gfx936,int8_w8a8_channel,torch.float16,2560,256,7168,256,8,0,0,asm,13000+23001,2375.4793
gfx936,int8_w8a8_channel,torch.float16,2816,256,7168,256,8,0,0,asm,13000+23001,2459.2772
gfx936,int8_w8a8_channel,torch.float16,3072,256,7168,256,8,0,0,asm,13000+23001,2531.6057
gfx936,int8_w8a8_channel,torch.float16,3328,256,7168,256,8,0,0,asm,13000+23001,2618.5448
gfx936,int8_w8a8_channel,torch.float16,3584,256,7168,256,8,0,0,asm,13001+23001,2755.9934
gfx936,int8_w8a8_channel,torch.float16,3840,256,7168,256,8,0,0,asm,12001+22001,2926.2758
gfx936,int8_w8a8_channel,torch.float16,4096,256,7168,256,8,0,0,asm,13001+23001,3090.1328
gfx936,int8_w8a8_channel,torch.float16,4608,256,7168,256,8,0,0,asm,12001+22001,3489.0469
gfx936,int8_w8a8_channel,torch.float16,5120,256,7168,256,8,0,0,asm,13001+23001,3676.4831
gfx936,int8_w8a8_channel,torch.float16,5632,256,7168,256,8,0,0,asm,13001+23001,3816.7864
gfx936,int8_w8a8_channel,torch.float16,6144,256,7168,256,8,0,0,asm,13001+23001,3877.2412
gfx936,int8_w8a8_channel,torch.float16,6656,256,7168,256,8,0,0,asm,13001+23001,4027.0604
gfx936,int8_w8a8_channel,torch.float16,7168,256,7168,256,8,0,0,asm,13001+23001,4210.3786
gfx936,int8_w8a8_channel,torch.float16,7680,256,7168,256,8,0,0,asm,13001+23001,4462.4463
gfx936,int8_w8a8_channel,torch.float16,8192,256,7168,256,8,0,0,asm,13001+23001,4854.6321
gfx936,int8_w8a8_channel,torch.float16,10240,256,7168,256,8,0,0,asm,13001+23001,6054.3389
gfx936,int8_w8a8_channel,torch.float16,12288,256,7168,256,8,0,0,asm,13001+23001,6973.4562
gfx936,int8_w8a8_channel,torch.float16,14336,256,7168,256,8,0,0,asm,13001+23001,8029.3144
gfx936,int8_w8a8_channel,torch.float16,16384,256,7168,256,8,0,0,asm,13001+23001,8966.4444
gfx936,int8_w8a8_channel,torch.float16,17408,256,7168,256,8,0,0,asm,13001+23001,9653.696
gfx936,int8_w8a8_channel,torch.float16,24576,256,7168,256,8,0,0,asm,13001+23001,13175.2086
gfx936,int8_w8a8_channel,torch.float16,32768,256,7168,256,8,0,0,asm,13001+23001,17363.5772
gfx936,int8_w8a8_channel,torch.float16,40960,256,7168,256,8,0,0,asm,13001+23001,21369.1494
gfx936,int8_w8a8_channel,torch.float16,49152,256,7168,256,8,0,0,asm,13001+23001,25515.9519
gfx938,int8_w8a8_channel,torch.float16,1,128,7168,256,8,0,0,asm,10001+20101,63.2618
gfx938,int8_w8a8_channel,torch.float16,2,128,7168,256,8,0,0,asm,10002+20102,75.6895
gfx938,int8_w8a8_channel,torch.float16,3,128,7168,256,8,0,0,asm,10008+20102,87.3309
gfx938,int8_w8a8_channel,torch.float16,4,128,7168,256,8,0,0,asm,10008+20102,104.9443
gfx938,int8_w8a8_channel,torch.float16,5,128,7168,256,8,0,0,asm,10011+20102,131.5369
gfx938,int8_w8a8_channel,torch.float16,6,128,7168,256,8,0,0,asm,10011+20102,131.738
gfx938,int8_w8a8_channel,torch.float16,7,128,7168,256,8,0,0,asm,10011+20102,139.7052
gfx938,int8_w8a8_channel,torch.float16,8,128,7168,256,8,0,0,asm,10011+20102,147.422
gfx938,int8_w8a8_channel,torch.float16,9,128,7168,256,8,0,0,asm,10011+20102,160.4928
gfx938,int8_w8a8_channel,torch.float16,10,128,7168,256,8,0,0,asm,10013+20102,171.5614
gfx938,int8_w8a8_channel,torch.float16,11,128,7168,256,8,0,0,asm,10002+20102,201.6002
gfx938,int8_w8a8_channel,torch.float16,12,128,7168,256,8,0,0,asm,10002+20102,204.5267
gfx938,int8_w8a8_channel,torch.float16,13,128,7168,256,8,0,0,asm,10002+20102,209.5141
gfx938,int8_w8a8_channel,torch.float16,14,128,7168,256,8,0,0,asm,10008+20102,219.6596
gfx938,int8_w8a8_channel,torch.float16,15,128,7168,256,8,0,0,asm,10008+20102,222.4576
gfx938,int8_w8a8_channel,torch.float16,16,128,7168,256,8,0,0,asm,10008+20102,226.195
gfx938,int8_w8a8_channel,torch.float16,17,128,7168,256,8,0,0,asm,10009+20102,228.1325
gfx938,int8_w8a8_channel,torch.float16,18,128,7168,256,8,0,0,asm,10008+20102,236.953
gfx938,int8_w8a8_channel,torch.float16,20,128,7168,256,8,0,0,asm,10011+20102,258.4297
gfx938,int8_w8a8_channel,torch.float16,24,128,7168,256,8,0,0,asm,10012+20102,281.8882
gfx938,int8_w8a8_channel,torch.float16,28,128,7168,256,8,0,0,asm,10002+20102,335.2694
gfx938,int8_w8a8_channel,torch.float16,32,128,7168,256,8,0,0,asm,10002+20102,347.0314
gfx938,int8_w8a8_channel,torch.float16,34,128,7168,256,8,0,0,asm,10002+20102,340.4068
gfx938,int8_w8a8_channel,torch.float16,36,128,7168,256,8,0,0,asm,10002+20102,350.6017
gfx938,int8_w8a8_channel,torch.float16,40,128,7168,256,8,0,0,asm,10002+20102,371.7133
gfx938,int8_w8a8_channel,torch.float16,44,128,7168,256,8,0,0,asm,10002+20102,381.5184
gfx938,int8_w8a8_channel,torch.float16,48,128,7168,256,8,0,0,asm,10002+20102,387.3112
gfx938,int8_w8a8_channel,torch.float16,56,128,7168,256,8,0,0,asm,10013+20102,404.4723
gfx938,int8_w8a8_channel,torch.float16,64,128,7168,256,8,0,0,asm,10002+20102,426.9911
gfx938,int8_w8a8_channel,torch.float16,68,128,7168,256,8,0,0,asm,10001+20102,446.2539
gfx938,int8_w8a8_channel,torch.float16,72,128,7168,256,8,0,0,asm,10001+20102,455.8723
gfx938,int8_w8a8_channel,torch.float16,80,128,7168,256,8,0,0,asm,10002+20101,460.7386
gfx938,int8_w8a8_channel,torch.float16,88,128,7168,256,8,0,0,asm,10002+20102,462.5899
gfx938,int8_w8a8_channel,torch.float16,96,128,7168,256,8,0,0,asm,10002+20102,462.8021
gfx938,int8_w8a8_channel,torch.float16,104,128,7168,256,8,0,0,asm,10002+20102,478.4371
gfx938,int8_w8a8_channel,torch.float16,112,128,7168,256,8,0,0,asm,10002+20102,481.4893
gfx938,int8_w8a8_channel,torch.float16,128,128,7168,256,8,0,0,asm,10002+20102,487.6923
gfx938,int8_w8a8_channel,torch.float16,144,128,7168,256,8,0,0,asm,10002+20102,509.8789
gfx938,int8_w8a8_channel,torch.float16,160,128,7168,256,8,0,0,asm,10002+20102,515.3517
gfx938,int8_w8a8_channel,torch.float16,192,128,7168,256,8,0,0,asm,10002+20102,519.5833
gfx938,int8_w8a8_channel,torch.float16,224,128,7168,256,8,0,0,asm,10002+20102,527.8664
gfx938,int8_w8a8_channel,torch.float16,256,128,7168,256,8,0,0,asm,10002+20102,536.3813
gfx938,int8_w8a8_channel,torch.float16,320,128,7168,256,8,0,0,asm,10002+20102,555.8232
gfx938,int8_w8a8_channel,torch.float16,384,128,7168,256,8,0,0,asm,10012+20102,565.3493
gfx938,int8_w8a8_channel,torch.float16,448,128,7168,256,8,0,0,asm,11005+21102,610.3871
gfx938,int8_w8a8_channel,torch.float16,512,128,7168,256,8,0,0,asm,11005+21102,633.7347
gfx938,int8_w8a8_channel,torch.float16,576,128,7168,256,8,0,0,asm,11005+21102,684.5777
gfx938,int8_w8a8_channel,torch.float16,640,128,7168,256,8,0,0,asm,11005+21102,659.4904
gfx938,int8_w8a8_channel,torch.float16,704,128,7168,256,8,0,0,asm,11005+21102,667.2115
gfx938,int8_w8a8_channel,torch.float16,768,128,7168,256,8,0,0,asm,11003+21102,675.0842
gfx938,int8_w8a8_channel,torch.float16,832,128,7168,256,8,0,0,asm,11005+21102,688.4298
gfx938,int8_w8a8_channel,torch.float16,896,128,7168,256,8,0,0,asm,11005+21102,755.3507
gfx938,int8_w8a8_channel,torch.float16,960,128,7168,256,8,0,0,asm,11005+21102,763.7894
gfx938,int8_w8a8_channel,torch.float16,1024,128,7168,256,8,0,0,asm,11005+21102,841.7542
gfx938,int8_w8a8_channel,torch.float16,1152,128,7168,256,8,0,0,asm,12001+22001,977.5854
gfx938,int8_w8a8_channel,torch.float16,1280,128,7168,256,8,0,0,asm,12005+22001,969.4833
gfx938,int8_w8a8_channel,torch.float16,1408,128,7168,256,8,0,0,asm,12005+22001,1002.1966
gfx938,int8_w8a8_channel,torch.float16,1536,128,7168,256,8,0,0,asm,12003+22001,1033.5221
gfx938,int8_w8a8_channel,torch.float16,1664,128,7168,256,8,0,0,asm,12001+22001,1052.5143
gfx938,int8_w8a8_channel,torch.float16,1792,128,7168,256,8,0,0,asm,12001+22001,1151.6113
gfx938,int8_w8a8_channel,torch.float16,1920,128,7168,256,8,0,0,asm,12003+22101,1179.0246
gfx938,int8_w8a8_channel,torch.float16,2048,128,7168,256,8,0,0,asm,12001+22101,1328.5704
gfx938,int8_w8a8_channel,torch.float16,2304,128,7168,256,8,0,0,asm,13001+23001,1517.2547
gfx938,int8_w8a8_channel,torch.float16,2560,128,7168,256,8,0,0,asm,13001+23001,1572.8933
gfx938,int8_w8a8_channel,torch.float16,2816,128,7168,256,8,0,0,asm,13001+23001,1606.6615
gfx938,int8_w8a8_channel,torch.float16,3072,128,7168,256,8,0,0,asm,13001+23001,1634.9778
gfx938,int8_w8a8_channel,torch.float16,3328,128,7168,256,8,0,0,asm,13001+23001,1700.3595
gfx938,int8_w8a8_channel,torch.float16,3584,128,7168,256,8,0,0,asm,13001+23001,1774.1847
gfx938,int8_w8a8_channel,torch.float16,3840,128,7168,256,8,0,0,asm,13001+23001,1987.5334
gfx938,int8_w8a8_channel,torch.float16,4096,128,7168,256,8,0,0,asm,12001+22101,2207.8893
gfx938,int8_w8a8_channel,torch.float16,4608,128,7168,256,8,0,0,asm,12001+22101,2549.7134
gfx938,int8_w8a8_channel,torch.float16,5120,128,7168,256,8,0,0,asm,12001+22101,2702.7999
gfx938,int8_w8a8_channel,torch.float16,5632,128,7168,256,8,0,0,asm,12001+22101,2874.6924
gfx938,int8_w8a8_channel,torch.float16,6144,128,7168,256,8,0,0,asm,13001+23101,3113.1382
gfx938,int8_w8a8_channel,torch.float16,6656,128,7168,256,8,0,0,asm,13001+23100,3219.0612
gfx938,int8_w8a8_channel,torch.float16,7168,128,7168,256,8,0,0,asm,13001+23101,3310.4812
gfx938,int8_w8a8_channel,torch.float16,7680,128,7168,256,8,0,0,asm,13001+23101,3438.692
gfx938,int8_w8a8_channel,torch.float16,8192,128,7168,256,8,0,0,asm,13001+23101,3769.0124
gfx938,int8_w8a8_channel,torch.float16,10240,128,7168,256,8,0,0,asm,13001+23101,4589.1196
gfx938,int8_w8a8_channel,torch.float16,12288,128,7168,256,8,0,0,asm,13001+23101,5414.4453
gfx938,int8_w8a8_channel,torch.float16,14336,128,7168,256,8,0,0,asm,13001+23101,6272.9851
gfx938,int8_w8a8_channel,torch.float16,16384,128,7168,256,8,0,0,asm,13001+23101,6928.7073
gfx938,int8_w8a8_channel,torch.float16,17408,128,7168,256,8,0,0,asm,13001+23101,7446.1985
gfx938,int8_w8a8_channel,torch.float16,24576,128,7168,256,8,0,0,asm,13001+23101,10133.096
gfx938,int8_w8a8_channel,torch.float16,32768,128,7168,256,8,0,0,asm,13001+23101,13291.5275
gfx938,int8_w8a8_channel,torch.float16,40960,128,7168,256,8,0,0,asm,13001+23101,15668.9581
gfx938,int8_w8a8_channel,torch.float16,49152,128,7168,256,8,0,0,asm,13001+23101,18765.4355
gfx938,int8_w8a8_channel,torch.float16,57344,128,7168,256,8,0,0,asm,13001+23101,22021.7106
gfx938,int8_w8a8_channel,torch.float16,65536,128,7168,256,8,0,0,asm,13001+23101,25347.7545
gfx938,int8_w8a8_channel,torch.float16,1,256,7168,256,8,0,0,asm,10002+20001,69.8059
gfx938,int8_w8a8_channel,torch.float16,2,256,7168,256,8,0,0,asm,10008+20001,105.3216
gfx938,int8_w8a8_channel,torch.float16,3,256,7168,256,8,0,0,asm,10011+20001,137.0302
gfx938,int8_w8a8_channel,torch.float16,4,256,7168,256,8,0,0,asm,10011+20001,166.402
gfx938,int8_w8a8_channel,torch.float16,5,256,7168,256,8,0,0,asm,10002+20001,199.3649
gfx938,int8_w8a8_channel,torch.float16,6,256,7168,256,8,0,0,asm,10008+20001,216.123
gfx938,int8_w8a8_channel,torch.float16,7,256,7168,256,8,0,0,asm,10008+20001,232.9755
gfx938,int8_w8a8_channel,torch.float16,8,256,7168,256,8,0,0,asm,10011+20001,248.2603
gfx938,int8_w8a8_channel,torch.float16,9,256,7168,256,8,0,0,asm,10011+20001,265.2203
gfx938,int8_w8a8_channel,torch.float16,10,256,7168,256,8,0,0,asm,10011+20001,282.6291
gfx938,int8_w8a8_channel,torch.float16,11,256,7168,256,8,0,0,asm,10002+20001,310.1867
gfx938,int8_w8a8_channel,torch.float16,12,256,7168,256,8,0,0,asm,10002+20001,321.9316
gfx938,int8_w8a8_channel,torch.float16,13,256,7168,256,8,0,0,asm,10008+20001,338.8822
gfx938,int8_w8a8_channel,torch.float16,14,256,7168,256,8,0,0,asm,10002+20001,358.7315
gfx938,int8_w8a8_channel,torch.float16,15,256,7168,256,8,0,0,asm,10011+20001,368.3992
gfx938,int8_w8a8_channel,torch.float16,16,256,7168,256,8,0,0,asm,10011+20001,378.1179
gfx938,int8_w8a8_channel,torch.float16,17,256,7168,256,8,0,0,asm,10011+20001,381.3561
gfx938,int8_w8a8_channel,torch.float16,18,256,7168,256,8,0,0,asm,10011+20001,397.2116
gfx938,int8_w8a8_channel,torch.float16,20,256,7168,256,8,0,0,asm,10002+20001,431.1681
gfx938,int8_w8a8_channel,torch.float16,24,256,7168,256,8,0,0,asm,10011+20001,479.9186
gfx938,int8_w8a8_channel,torch.float16,28,256,7168,256,8,0,0,asm,10002+20001,552.5507
gfx938,int8_w8a8_channel,torch.float16,32,256,7168,256,8,0,0,asm,10011+20001,587.4382
gfx938,int8_w8a8_channel,torch.float16,34,256,7168,256,8,0,0,asm,10011+20001,579.5075
gfx938,int8_w8a8_channel,torch.float16,36,256,7168,256,8,0,0,asm,10011+20001,600.686
gfx938,int8_w8a8_channel,torch.float16,40,256,7168,256,8,0,0,asm,10002+20001,623.1973
gfx938,int8_w8a8_channel,torch.float16,44,256,7168,256,8,0,0,asm,10002+20001,651.7723
gfx938,int8_w8a8_channel,torch.float16,48,256,7168,256,8,0,0,asm,10002+20001,663.6823
gfx938,int8_w8a8_channel,torch.float16,56,256,7168,256,8,0,0,asm,10002+20001,699.227
gfx938,int8_w8a8_channel,torch.float16,64,256,7168,256,8,0,0,asm,10002+20001,718.8464
gfx938,int8_w8a8_channel,torch.float16,68,256,7168,256,8,0,0,asm,10002+20001,727.4162
gfx938,int8_w8a8_channel,torch.float16,72,256,7168,256,8,0,0,asm,10002+20000,752.4242
gfx938,int8_w8a8_channel,torch.float16,80,256,7168,256,8,0,0,asm,10002+20001,798.6361
gfx938,int8_w8a8_channel,torch.float16,88,256,7168,256,8,0,0,asm,10011+20001,803.9207
gfx938,int8_w8a8_channel,torch.float16,96,256,7168,256,8,0,0,asm,10011+20001,797.7572
gfx938,int8_w8a8_channel,torch.float16,104,256,7168,256,8,0,0,asm,10002+20001,817.8816
gfx938,int8_w8a8_channel,torch.float16,112,256,7168,256,8,0,0,asm,10011+20001,819.8212
gfx938,int8_w8a8_channel,torch.float16,128,256,7168,256,8,0,0,asm,10002+20001,836.1965
gfx938,int8_w8a8_channel,torch.float16,144,256,7168,256,8,0,0,asm,10002+20001,844.6419
gfx938,int8_w8a8_channel,torch.float16,160,256,7168,256,8,0,0,asm,10002+20001,861.065
gfx938,int8_w8a8_channel,torch.float16,192,256,7168,256,8,0,0,asm,10002+20001,870.0983
gfx938,int8_w8a8_channel,torch.float16,224,256,7168,256,8,0,0,asm,10002+20001,904.8108
gfx938,int8_w8a8_channel,torch.float16,256,256,7168,256,8,0,0,asm,10002+20001,900.3962
gfx938,int8_w8a8_channel,torch.float16,320,256,7168,256,8,0,0,asm,10011+20001,938.3914
gfx938,int8_w8a8_channel,torch.float16,384,256,7168,256,8,0,0,asm,10011+20001,950.1246
gfx938,int8_w8a8_channel,torch.float16,448,256,7168,256,8,0,0,asm,11005+21001,991.3086
gfx938,int8_w8a8_channel,torch.float16,512,256,7168,256,8,0,0,asm,11005+21001,1024.873
gfx938,int8_w8a8_channel,torch.float16,576,256,7168,256,8,0,0,asm,11003+21001,1085.3904
gfx938,int8_w8a8_channel,torch.float16,640,256,7168,256,8,0,0,asm,11005+21001,1064.9267
gfx938,int8_w8a8_channel,torch.float16,704,256,7168,256,8,0,0,asm,11005+21001,1082.1236
gfx938,int8_w8a8_channel,torch.float16,768,256,7168,256,8,0,0,asm,11003+21001,1086.2148
gfx938,int8_w8a8_channel,torch.float16,832,256,7168,256,8,0,0,asm,11005+21001,1118.0076
gfx938,int8_w8a8_channel,torch.float16,896,256,7168,256,8,0,0,asm,11005+21001,1177.0868
gfx938,int8_w8a8_channel,torch.float16,960,256,7168,256,8,0,0,asm,11005+21001,1261.5258
gfx938,int8_w8a8_channel,torch.float16,1024,256,7168,256,8,0,0,asm,12001+22001,1321.1087
gfx938,int8_w8a8_channel,torch.float16,1152,256,7168,256,8,0,0,asm,12001+22001,1378.0109
gfx938,int8_w8a8_channel,torch.float16,1280,256,7168,256,8,0,0,asm,12001+22001,1392.1021
gfx938,int8_w8a8_channel,torch.float16,1408,256,7168,256,8,0,0,asm,12001+22001,1430.3588
gfx938,int8_w8a8_channel,torch.float16,1536,256,7168,256,8,0,0,asm,12001+22001,1464.291
gfx938,int8_w8a8_channel,torch.float16,1664,256,7168,256,8,0,0,asm,12003+22001,1505.5708
gfx938,int8_w8a8_channel,torch.float16,1792,256,7168,256,8,0,0,asm,12001+22001,1589.9691
gfx938,int8_w8a8_channel,torch.float16,1920,256,7168,256,8,0,0,asm,12001+22001,1632.3197
gfx938,int8_w8a8_channel,torch.float16,2048,256,7168,256,8,0,0,asm,12001+22001,1866.2468
gfx938,int8_w8a8_channel,torch.float16,2304,256,7168,256,8,0,0,asm,13001+23001,2048.1579
gfx938,int8_w8a8_channel,torch.float16,2560,256,7168,256,8,0,0,asm,13001+23001,2092.4777
gfx938,int8_w8a8_channel,torch.float16,2816,256,7168,256,8,0,0,asm,13001+23001,2139.2016
gfx938,int8_w8a8_channel,torch.float16,3072,256,7168,256,8,0,0,asm,13001+23001,2186.3933
gfx938,int8_w8a8_channel,torch.float16,3328,256,7168,256,8,0,0,asm,13001+23001,2256.4647
gfx938,int8_w8a8_channel,torch.float16,3584,256,7168,256,8,0,0,asm,13001+23001,2336.6121
gfx938,int8_w8a8_channel,torch.float16,3840,256,7168,256,8,0,0,asm,13001+23001,2576.566
gfx938,int8_w8a8_channel,torch.float16,4096,256,7168,256,8,0,0,asm,13001+23001,2972.2115
gfx938,int8_w8a8_channel,torch.float16,4608,256,7168,256,8,0,0,asm,12001+22001,3615.1791
gfx938,int8_w8a8_channel,torch.float16,5120,256,7168,256,8,0,0,asm,12001+22001,3819.4244
gfx938,int8_w8a8_channel,torch.float16,5632,256,7168,256,8,0,0,asm,12001+22001,4030.1803
gfx938,int8_w8a8_channel,torch.float16,6144,256,7168,256,8,0,0,asm,13001+23001,4172.1696
gfx938,int8_w8a8_channel,torch.float16,6656,256,7168,256,8,0,0,asm,13001+23001,4255.9334
gfx938,int8_w8a8_channel,torch.float16,7168,256,7168,256,8,0,0,asm,13001+23001,4370.7083
gfx938,int8_w8a8_channel,torch.float16,7680,256,7168,256,8,0,0,asm,13001+23001,4623.5482
gfx938,int8_w8a8_channel,torch.float16,8192,256,7168,256,8,0,0,asm,13001+23001,5132.8724
gfx938,int8_w8a8_channel,torch.float16,10240,256,7168,256,8,0,0,asm,13001+23001,6291.0284
gfx938,int8_w8a8_channel,torch.float16,12288,256,7168,256,8,0,0,asm,13001+23001,7314.9996
gfx938,int8_w8a8_channel,torch.float16,14336,256,7168,256,8,0,0,asm,13001+23001,8463.126
gfx938,int8_w8a8_channel,torch.float16,16384,256,7168,256,8,0,0,asm,13001+23001,9513.7307
gfx938,int8_w8a8_channel,torch.float16,17408,256,7168,256,8,0,0,asm,13001+23001,10340.0984
gfx938,int8_w8a8_channel,torch.float16,24576,256,7168,256,8,0,0,asm,13001+23001,13947.7674
gfx938,int8_w8a8_channel,torch.float16,32768,256,7168,256,8,0,0,asm,13001+23001,18301.4314
gfx938,int8_w8a8_channel,torch.float16,40960,256,7168,256,8,0,0,asm,13001+23001,22619.4892
gfx938,int8_w8a8_channel,torch.float16,49152,256,7168,256,8,0,0,asm,13001+23001,26910.4336
gfx938,int8_w8a8_channel,torch.float16,57344,256,7168,256,8,0,0,asm,13001+23001,31283.1318
gfx938,int8_w8a8_channel,torch.float16,65536,256,7168,256,8,0,0,asm,13001+23001,35592.7466
gfx938,f8_w8a8_channel,torch.float16,1,128,7168,256,8,0,0,asm,10000+20101,61.4201
gfx938,f8_w8a8_channel,torch.float16,2,128,7168,256,8,0,0,asm,10002+20102,74.3393
gfx938,f8_w8a8_channel,torch.float16,3,128,7168,256,8,0,0,asm,10009+20102,87.5437
gfx938,f8_w8a8_channel,torch.float16,4,128,7168,256,8,0,0,asm,10009+20102,104.5218
gfx938,f8_w8a8_channel,torch.float16,5,128,7168,256,8,0,0,asm,10011+20102,131.6919
gfx938,f8_w8a8_channel,torch.float16,6,128,7168,256,8,0,0,asm,10011+20102,136.3617
gfx938,f8_w8a8_channel,torch.float16,7,128,7168,256,8,0,0,asm,10011+20102,140.4929
gfx938,f8_w8a8_channel,torch.float16,8,128,7168,256,8,0,0,asm,10011+20102,146.7534
gfx938,f8_w8a8_channel,torch.float16,9,128,7168,256,8,0,0,asm,10011+20102,162.0682
gfx938,f8_w8a8_channel,torch.float16,10,128,7168,256,8,0,0,asm,10013+20102,174.0107
gfx938,f8_w8a8_channel,torch.float16,11,128,7168,256,8,0,0,asm,10002+20102,203.5942
gfx938,f8_w8a8_channel,torch.float16,12,128,7168,256,8,0,0,asm,10002+20102,207.1347
gfx938,f8_w8a8_channel,torch.float16,13,128,7168,256,8,0,0,asm,10002+20102,209.305
gfx938,f8_w8a8_channel,torch.float16,14,128,7168,256,8,0,0,asm,10008+20102,219.6352
gfx938,f8_w8a8_channel,torch.float16,15,128,7168,256,8,0,0,asm,10008+20102,221.8342
gfx938,f8_w8a8_channel,torch.float16,16,128,7168,256,8,0,0,asm,10009+20102,226.0433
gfx938,f8_w8a8_channel,torch.float16,17,128,7168,256,8,0,0,asm,10008+20102,228.4813
gfx938,f8_w8a8_channel,torch.float16,18,128,7168,256,8,0,0,asm,10002+20102,237.708
gfx938,f8_w8a8_channel,torch.float16,20,128,7168,256,8,0,0,asm,10011+20102,259.1725
gfx938,f8_w8a8_channel,torch.float16,24,128,7168,256,8,0,0,asm,10013+20102,281.3468
gfx938,f8_w8a8_channel,torch.float16,28,128,7168,256,8,0,0,asm,10002+20102,336.0654
gfx938,f8_w8a8_channel,torch.float16,32,128,7168,256,8,0,0,asm,10002+20102,349.288
gfx938,f8_w8a8_channel,torch.float16,34,128,7168,256,8,0,0,asm,10002+20102,337.0594
gfx938,f8_w8a8_channel,torch.float16,36,128,7168,256,8,0,0,asm,10002+20102,348.8132
gfx938,f8_w8a8_channel,torch.float16,40,128,7168,256,8,0,0,asm,10002+20102,369.2685
gfx938,f8_w8a8_channel,torch.float16,44,128,7168,256,8,0,0,asm,10002+20102,383.8079
gfx938,f8_w8a8_channel,torch.float16,48,128,7168,256,8,0,0,asm,10002+20102,388.2017
gfx938,f8_w8a8_channel,torch.float16,56,128,7168,256,8,0,0,asm,10002+20102,406.815
gfx938,f8_w8a8_channel,torch.float16,64,128,7168,256,8,0,0,asm,10002+20102,431.9513
gfx938,f8_w8a8_channel,torch.float16,68,128,7168,256,8,0,0,asm,10002+20102,465.6659
gfx938,f8_w8a8_channel,torch.float16,72,128,7168,256,8,0,0,asm,10001+20001,467.1784
gfx938,f8_w8a8_channel,torch.float16,80,128,7168,256,8,0,0,asm,10002+20102,454.265
gfx938,f8_w8a8_channel,torch.float16,88,128,7168,256,8,0,0,asm,10002+20102,466.2786
gfx938,f8_w8a8_channel,torch.float16,96,128,7168,256,8,0,0,asm,10002+20102,466.5357
gfx938,f8_w8a8_channel,torch.float16,104,128,7168,256,8,0,0,asm,10002+20102,476.3777
gfx938,f8_w8a8_channel,torch.float16,112,128,7168,256,8,0,0,asm,10002+20102,478.2608
gfx938,f8_w8a8_channel,torch.float16,128,128,7168,256,8,0,0,asm,10002+20102,491.1387
gfx938,f8_w8a8_channel,torch.float16,144,128,7168,256,8,0,0,asm,10002+20102,502.7711
gfx938,f8_w8a8_channel,torch.float16,160,128,7168,256,8,0,0,asm,10002+20102,516.1437
gfx938,f8_w8a8_channel,torch.float16,192,128,7168,256,8,0,0,asm,10002+20102,519.8894
gfx938,f8_w8a8_channel,torch.float16,224,128,7168,256,8,0,0,asm,10002+20102,532.9433
gfx938,f8_w8a8_channel,torch.float16,256,128,7168,256,8,0,0,asm,10002+20102,535.2698
gfx938,f8_w8a8_channel,torch.float16,320,128,7168,256,8,0,0,asm,10002+20102,559.5246
gfx938,f8_w8a8_channel,torch.float16,384,128,7168,256,8,0,0,asm,10011+20102,571.1548
gfx938,f8_w8a8_channel,torch.float16,448,128,7168,256,8,0,0,asm,11005+21102,612.7505
gfx938,f8_w8a8_channel,torch.float16,512,128,7168,256,8,0,0,asm,11007+21102,634.4969
gfx938,f8_w8a8_channel,torch.float16,576,128,7168,256,8,0,0,asm,11007+21102,681.9113
gfx938,f8_w8a8_channel,torch.float16,640,128,7168,256,8,0,0,asm,11005+21102,662.978
gfx938,f8_w8a8_channel,torch.float16,704,128,7168,256,8,0,0,asm,11005+21102,672.4385
gfx938,f8_w8a8_channel,torch.float16,768,128,7168,256,8,0,0,asm,11007+21102,690.7955
gfx938,f8_w8a8_channel,torch.float16,832,128,7168,256,8,0,0,asm,11005+21102,695.1789
gfx938,f8_w8a8_channel,torch.float16,896,128,7168,256,8,0,0,asm,11005+21102,753.6196
gfx938,f8_w8a8_channel,torch.float16,960,128,7168,256,8,0,0,asm,11005+21102,763.1376
gfx938,f8_w8a8_channel,torch.float16,1024,128,7168,256,8,0,0,asm,11003+21102,853.5372
gfx938,f8_w8a8_channel,torch.float16,1152,128,7168,256,8,0,0,asm,12001+22001,975.9654
gfx938,f8_w8a8_channel,torch.float16,1280,128,7168,256,8,0,0,asm,12001+22001,971.1162
gfx938,f8_w8a8_channel,torch.float16,1408,128,7168,256,8,0,0,asm,12005+22001,1000.0597
gfx938,f8_w8a8_channel,torch.float16,1536,128,7168,256,8,0,0,asm,12005+22001,1020.6874000000001
gfx938,f8_w8a8_channel,torch.float16,1664,128,7168,256,8,0,0,asm,12003+22001,1054.1529
gfx938,f8_w8a8_channel,torch.float16,1792,128,7168,256,8,0,0,asm,12001+22001,1156.2478
gfx938,f8_w8a8_channel,torch.float16,1920,128,7168,256,8,0,0,asm,12001+22001,1199.8661
gfx938,f8_w8a8_channel,torch.float16,2048,128,7168,256,8,0,0,asm,12001+22101,1344.1486
gfx938,f8_w8a8_channel,torch.float16,2304,128,7168,256,8,0,0,asm,13001+23001,1508.7961
gfx938,f8_w8a8_channel,torch.float16,2560,128,7168,256,8,0,0,asm,13001+23001,1546.9773
gfx938,f8_w8a8_channel,torch.float16,2816,128,7168,256,8,0,0,asm,13001+23001,1592.0286
gfx938,f8_w8a8_channel,torch.float16,3072,128,7168,256,8,0,0,asm,13001+23001,1634.9946
gfx938,f8_w8a8_channel,torch.float16,3328,128,7168,256,8,0,0,asm,13001+23001,1695.0105
gfx938,f8_w8a8_channel,torch.float16,3584,128,7168,256,8,0,0,asm,13001+23001,1754.4279
gfx938,f8_w8a8_channel,torch.float16,3840,128,7168,256,8,0,0,asm,13001+23001,1963.7276
gfx938,f8_w8a8_channel,torch.float16,4096,128,7168,256,8,0,0,asm,12001+22101,2231.6895
gfx938,f8_w8a8_channel,torch.float16,4608,128,7168,256,8,0,0,asm,12003+22101,2601.7681
gfx938,f8_w8a8_channel,torch.float16,5120,128,7168,256,8,0,0,asm,12001+22001,2735.0065
gfx938,f8_w8a8_channel,torch.float16,5632,128,7168,256,8,0,0,asm,12001+22001,2902.2632
gfx938,f8_w8a8_channel,torch.float16,6144,128,7168,256,8,0,0,asm,13001+23001,3103.9732
gfx938,f8_w8a8_channel,torch.float16,6656,128,7168,256,8,0,0,asm,13001+23001,3204.7276
gfx938,f8_w8a8_channel,torch.float16,7168,128,7168,256,8,0,0,asm,13001+23001,3293.3468
gfx938,f8_w8a8_channel,torch.float16,7680,128,7168,256,8,0,0,asm,13001+23001,3450.7
gfx938,f8_w8a8_channel,torch.float16,8192,128,7168,256,8,0,0,asm,13001+23101,3826.76
gfx938,f8_w8a8_channel,torch.float16,10240,128,7168,256,8,0,0,asm,13001+23101,4667.9011
gfx938,f8_w8a8_channel,torch.float16,12288,128,7168,256,8,0,0,asm,13001+23101,5498.0926
gfx938,f8_w8a8_channel,torch.float16,14336,128,7168,256,8,0,0,asm,13001+23001,6370.1259
gfx938,f8_w8a8_channel,torch.float16,16384,128,7168,256,8,0,0,asm,13001+23101,7049.5697
gfx938,f8_w8a8_channel,torch.float16,17408,128,7168,256,8,0,0,asm,13001+23101,7572.7029
gfx938,f8_w8a8_channel,torch.float16,24576,128,7168,256,8,0,0,asm,13001+23101,10339.622
gfx938,f8_w8a8_channel,torch.float16,32768,128,7168,256,8,0,0,asm,13001+23101,13538.5271
gfx938,f8_w8a8_channel,torch.float16,40960,128,7168,256,8,0,0,asm,13001+23101,15969.9307
gfx938,f8_w8a8_channel,torch.float16,49152,128,7168,256,8,0,0,asm,13001+23101,19164.5979
gfx938,f8_w8a8_channel,torch.float16,57344,128,7168,256,8,0,0,asm,13001+23101,22502.1147
gfx938,f8_w8a8_channel,torch.float16,65536,128,7168,256,8,0,0,asm,13001+23101,25939.8595
gfx938,f8_w8a8_channel,torch.float16,1,256,7168,256,8,0,0,asm,10002+20001,69.9253
gfx938,f8_w8a8_channel,torch.float16,2,256,7168,256,8,0,0,asm,10008+20001,103.5412
gfx938,f8_w8a8_channel,torch.float16,3,256,7168,256,8,0,0,asm,10011+20001,138.3292
gfx938,f8_w8a8_channel,torch.float16,4,256,7168,256,8,0,0,asm,10011+20001,165.8163
gfx938,f8_w8a8_channel,torch.float16,5,256,7168,256,8,0,0,asm,10001+20001,199.2916
gfx938,f8_w8a8_channel,torch.float16,6,256,7168,256,8,0,0,asm,10008+20001,215.6812
gfx938,f8_w8a8_channel,torch.float16,7,256,7168,256,8,0,0,asm,10008+20001,232.7508
gfx938,f8_w8a8_channel,torch.float16,8,256,7168,256,8,0,0,asm,10011+20001,247.9325
gfx938,f8_w8a8_channel,torch.float16,9,256,7168,256,8,0,0,asm,10011+20001,262.6708
gfx938,f8_w8a8_channel,torch.float16,10,256,7168,256,8,0,0,asm,10011+20001,283.1306
gfx938,f8_w8a8_channel,torch.float16,11,256,7168,256,8,0,0,asm,10002+20001,309.4865
gfx938,f8_w8a8_channel,torch.float16,12,256,7168,256,8,0,0,asm,10002+20001,321.3357
gfx938,f8_w8a8_channel,torch.float16,13,256,7168,256,8,0,0,asm,10008+20001,338.1219
gfx938,f8_w8a8_channel,torch.float16,14,256,7168,256,8,0,0,asm,10002+20001,358.7315
gfx938,f8_w8a8_channel,torch.float16,15,256,7168,256,8,0,0,asm,10011+20001,368.3992
gfx938,f8_w8a8_channel,torch.float16,16,256,7168,256,8,0,0,asm,10011+20001,378.1179
gfx938,f8_w8a8_channel,torch.float16,17,256,7168,256,8,0,0,asm,10011+20001,381.3561
gfx938,f8_w8a8_channel,torch.float16,18,256,7168,256,8,0,0,asm,10011+20001,397.2116
gfx938,f8_w8a8_channel,torch.float16,20,256,7168,256,8,0,0,asm,10002+20001,431.1681
gfx938,f8_w8a8_channel,torch.float16,24,256,7168,256,8,0,0,asm,10011+20001,479.9186
gfx938,f8_w8a8_channel,torch.float16,28,256,7168,256,8,0,0,asm,10002+20001,552.5507
gfx938,f8_w8a8_channel,torch.float16,32,256,7168,256,8,0,0,asm,10011+20001,587.4382
gfx938,f8_w8a8_channel,torch.float16,34,256,7168,256,8,0,0,asm,10011+20001,579.5075
gfx938,f8_w8a8_channel,torch.float16,36,256,7168,256,8,0,0,asm,10011+20001,600.686
gfx938,f8_w8a8_channel,torch.float16,40,256,7168,256,8,0,0,asm,10002+20001,623.1973
gfx938,f8_w8a8_channel,torch.float16,44,256,7168,256,8,0,0,asm,10002+20001,651.7723
gfx938,f8_w8a8_channel,torch.float16,48,256,7168,256,8,0,0,asm,10002+20001,663.6823
gfx938,f8_w8a8_channel,torch.float16,56,256,7168,256,8,0,0,asm,10002+20001,699.227
gfx938,f8_w8a8_channel,torch.float16,64,256,7168,256,8,0,0,asm,10002+20001,718.8464
gfx938,f8_w8a8_channel,torch.float16,68,256,7168,256,8,0,0,asm,10002+20001,727.4162
gfx938,f8_w8a8_channel,torch.float16,72,256,7168,256,8,0,0,asm,10002+20000,752.4242
gfx938,f8_w8a8_channel,torch.float16,80,256,7168,256,8,0,0,asm,10002+20001,798.6361
gfx938,f8_w8a8_channel,torch.float16,88,256,7168,256,8,0,0,asm,10011+20001,803.9207
gfx938,f8_w8a8_channel,torch.float16,96,256,7168,256,8,0,0,asm,10011+20001,797.7572
gfx938,f8_w8a8_channel,torch.float16,104,256,7168,256,8,0,0,asm,10002+20001,817.8816
gfx938,f8_w8a8_channel,torch.float16,112,256,7168,256,8,0,0,asm,10011+20001,819.8212
gfx938,f8_w8a8_channel,torch.float16,128,256,7168,256,8,0,0,asm,10002+20001,836.1965
gfx938,f8_w8a8_channel,torch.float16,144,256,7168,256,8,0,0,asm,10002+20001,844.6419
gfx938,f8_w8a8_channel,torch.float16,160,256,7168,256,8,0,0,asm,10002+20001,861.065
gfx938,f8_w8a8_channel,torch.float16,192,256,7168,256,8,0,0,asm,10002+20001,870.0983
gfx938,f8_w8a8_channel,torch.float16,224,256,7168,256,8,0,0,asm,10002+20001,904.8108
gfx938,f8_w8a8_channel,torch.float16,256,256,7168,256,8,0,0,asm,10002+20001,900.3962
gfx938,f8_w8a8_channel,torch.float16,320,256,7168,256,8,0,0,asm,10011+20001,938.3914
gfx938,f8_w8a8_channel,torch.float16,384,256,7168,256,8,0,0,asm,10011+20001,950.1246
gfx938,f8_w8a8_channel,torch.float16,448,256,7168,256,8,0,0,asm,11005+21001,991.3086
gfx938,f8_w8a8_channel,torch.float16,512,256,7168,256,8,0,0,asm,11005+21001,1024.873
gfx938,f8_w8a8_channel,torch.float16,576,256,7168,256,8,0,0,asm,11003+21001,1085.3904
gfx938,f8_w8a8_channel,torch.float16,640,256,7168,256,8,0,0,asm,11005+21001,1064.9267
gfx938,f8_w8a8_channel,torch.float16,704,256,7168,256,8,0,0,asm,11005+21001,1082.1236
gfx938,f8_w8a8_channel,torch.float16,768,256,7168,256,8,0,0,asm,11003+21001,1086.2148
gfx938,f8_w8a8_channel,torch.float16,832,256,7168,256,8,0,0,asm,11005+21001,1118.0076
gfx938,f8_w8a8_channel,torch.float16,896,256,7168,256,8,0,0,asm,11005+21001,1177.0868
gfx938,f8_w8a8_channel,torch.float16,960,256,7168,256,8,0,0,asm,11005+21001,1261.5258
gfx938,f8_w8a8_channel,torch.float16,1024,256,7168,256,8,0,0,asm,12001+22001,1321.1087
gfx938,f8_w8a8_channel,torch.float16,1152,256,7168,256,8,0,0,asm,12001+22001,1378.0109
gfx938,f8_w8a8_channel,torch.float16,1280,256,7168,256,8,0,0,asm,12001+22001,1392.1021
gfx938,f8_w8a8_channel,torch.float16,1408,256,7168,256,8,0,0,asm,12001+22001,1430.3588
gfx938,f8_w8a8_channel,torch.float16,1536,256,7168,256,8,0,0,asm,12001+22001,1464.291
gfx938,f8_w8a8_channel,torch.float16,1664,256,7168,256,8,0,0,asm,12003+22001,1505.5708
gfx938,f8_w8a8_channel,torch.float16,1792,256,7168,256,8,0,0,asm,12001+22001,1589.9691
gfx938,f8_w8a8_channel,torch.float16,1920,256,7168,256,8,0,0,asm,12001+22001,1632.3197
gfx938,f8_w8a8_channel,torch.float16,2048,256,7168,256,8,0,0,asm,12001+22001,1866.2468
gfx938,f8_w8a8_channel,torch.float16,2304,256,7168,256,8,0,0,asm,13001+23001,2048.1579
gfx938,f8_w8a8_channel,torch.float16,2560,256,7168,256,8,0,0,asm,13001+23001,2092.4777
gfx938,f8_w8a8_channel,torch.float16,2816,256,7168,256,8,0,0,asm,13001+23001,2139.2016
gfx938,f8_w8a8_channel,torch.float16,3072,256,7168,256,8,0,0,asm,13001+23001,2186.3933
gfx938,f8_w8a8_channel,torch.float16,3328,256,7168,256,8,0,0,asm,13001+23001,2256.4647
gfx938,f8_w8a8_channel,torch.float16,3584,256,7168,256,8,0,0,asm,13001+23001,2336.6121
gfx938,f8_w8a8_channel,torch.float16,3840,256,7168,256,8,0,0,asm,13001+23001,2576.566
gfx938,f8_w8a8_channel,torch.float16,4096,256,7168,256,8,0,0,asm,13001+23001,2972.2115
gfx938,f8_w8a8_channel,torch.float16,4608,256,7168,256,8,0,0,asm,12001+22001,3615.1791
gfx938,f8_w8a8_channel,torch.float16,5120,256,7168,256,8,0,0,asm,12001+22001,3819.4244
gfx938,f8_w8a8_channel,torch.float16,5632,256,7168,256,8,0,0,asm,12001+22001,4030.1803
gfx938,f8_w8a8_channel,torch.float16,6144,256,7168,256,8,0,0,asm,13001+23001,4172.1696
gfx938,f8_w8a8_channel,torch.float16,6656,256,7168,256,8,0,0,asm,13001+23001,4255.9334
gfx938,f8_w8a8_channel,torch.float16,7168,256,7168,256,8,0,0,asm,13001+23001,4370.7083
gfx938,f8_w8a8_channel,torch.float16,7680,256,7168,256,8,0,0,asm,13001+23001,4623.5482
gfx938,f8_w8a8_channel,torch.float16,8192,256,7168,256,8,0,0,asm,13001+23001,5132.8724
gfx938,f8_w8a8_channel,torch.float16,10240,256,7168,256,8,0,0,asm,13001+23001,6291.0284
gfx938,f8_w8a8_channel,torch.float16,12288,256,7168,256,8,0,0,asm,13001+23001,7314.9996
gfx938,f8_w8a8_channel,torch.float16,14336,256,7168,256,8,0,0,asm,13001+23001,8463.126
gfx938,f8_w8a8_channel,torch.float16,16384,256,7168,256,8,0,0,asm,13001+23001,9513.7307
gfx938,f8_w8a8_channel,torch.float16,17408,256,7168,256,8,0,0,asm,13001+23001,10340.0984
gfx938,f8_w8a8_channel,torch.float16,24576,256,7168,256,8,0,0,asm,13001+23001,13947.7674
gfx938,f8_w8a8_channel,torch.float16,32768,256,7168,256,8,0,0,asm,13001+23001,18301.4314
gfx938,f8_w8a8_channel,torch.float16,40960,256,7168,256,8,0,0,asm,13001+23001,22619.4892
gfx938,f8_w8a8_channel,torch.float16,49152,256,7168,256,8,0,0,asm,13001+23001,26910.4336
gfx938,f8_w8a8_channel,torch.float16,57344,256,7168,256,8,0,0,asm,13001+23001,31283.1318
gfx938,f8_w8a8_channel,torch.float16,65536,256,7168,256,8,0,0,asm,13001+23001,35592.7466
gfx938,f8_w8a8_channel,torch.float16,1,352,4096,128,8,0,0,asm,10008+20001,59.0495
gfx938,f8_w8a8_channel,torch.float16,2,352,4096,128,8,0,0,asm,10011+20000,81.9294
gfx938,f8_w8a8_channel,torch.float16,4,352,4096,128,8,0,0,asm,10002+20000,130.3336
gfx938,f8_w8a8_channel,torch.float16,6,352,4096,128,8,0,0,asm,10011+20000,163.967
gfx938,f8_w8a8_channel,torch.float16,8,352,4096,128,8,0,0,asm,10008+20000,209.4489
gfx938,f8_w8a8_channel,torch.float16,12,352,4096,128,8,0,0,asm,10002+20000,275.9665
gfx938,f8_w8a8_channel,torch.float16,16,352,4096,128,8,0,0,asm,10011+20000,307.3096
gfx938,f8_w8a8_channel,torch.float16,20,352,4096,128,8,0,0,asm,10011+20000,360.1989
gfx938,f8_w8a8_channel,torch.float16,24,352,4096,128,8,0,0,asm,10011+20000,364.7463
gfx938,f8_w8a8_channel,torch.float16,28,352,4096,128,8,0,0,asm,10011+20000,372.2441
gfx938,f8_w8a8_channel,torch.float16,32,352,4096,128,8,0,0,asm,10011+20000,375.8735
gfx938,f8_w8a8_channel,torch.float16,36,352,4096,128,8,0,0,asm,10011+20000,390.2199
gfx938,f8_w8a8_channel,torch.float16,40,352,4096,128,8,0,0,asm,10011+20000,398.8093
gfx938,f8_w8a8_channel,torch.float16,44,352,4096,128,8,0,0,asm,10002+20000,422.6661
gfx938,f8_w8a8_channel,torch.float16,48,352,4096,128,8,0,0,asm,10002+20000,432.2913
gfx938,f8_w8a8_channel,torch.float16,56,352,4096,128,8,0,0,asm,10002+20000,431.5165
gfx938,f8_w8a8_channel,torch.float16,64,352,4096,128,8,0,0,asm,10002+20000,443.0479
gfx938,f8_w8a8_channel,torch.float16,72,352,4096,128,8,0,0,asm,10002+20000,437.2681
gfx938,f8_w8a8_channel,torch.float16,80,352,4096,128,8,0,0,asm,10011+20000,440.7965
gfx938,f8_w8a8_channel,torch.float16,96,352,4096,128,8,0,0,asm,10002+20000,443.7775
gfx938,f8_w8a8_channel,torch.float16,104,352,4096,128,8,0,0,asm,10002+20000,444.527
gfx938,f8_w8a8_channel,torch.float16,112,352,4096,128,8,0,0,asm,10002+20000,446.3712
gfx938,f8_w8a8_channel,torch.float16,128,352,4096,128,8,0,0,asm,10002+20000,446.9692
gfx938,f8_w8a8_channel,torch.float16,144,352,4096,128,8,0,0,asm,10011+20000,506.7920
gfx938,f8_w8a8_channel,torch.float16,160,352,4096,128,8,0,0,asm,10002+20000,459.6512
gfx938,f8_w8a8_channel,torch.float16,192,352,4096,128,8,0,0,asm,10011+20000,463.1543
gfx938,f8_w8a8_channel,torch.float16,224,352,4096,128,8,0,0,asm,11005+21000,482.8511
gfx938,f8_w8a8_channel,torch.float16,256,352,4096,128,8,0,0,asm,11005+21000,497.2088
gfx938,f8_w8a8_channel,torch.float16,320,352,4096,128,8,0,0,asm,11003+21000,509.8992
gfx938,f8_w8a8_channel,torch.float16,384,352,4096,128,8,0,0,asm,12005+22000,566.4802
gfx938,f8_w8a8_channel,torch.float16,448,352,4096,128,8,0,0,asm,11005+21000,548.4002
gfx938,f8_w8a8_channel,torch.float16,512,352,4096,128,8,0,0,asm,12001+22001,573.5201
gfx938,f8_w8a8_channel,torch.float16,768,352,4096,128,8,0,0,asm,12005+22000,661.2503
gfx938,f8_w8a8_channel,torch.float16,896,352,4096,128,8,0,0,asm,12005+22001,671.4481
gfx938,f8_w8a8_channel,torch.float16,960,352,4096,128,8,0,0,asm,12001+22001,693.4522
gfx938,f8_w8a8_channel,torch.float16,1024,352,4096,128,8,0,0,asm,12001+22001,761.8308
gfx938,f8_w8a8_channel,torch.float16,1280,352,4096,128,8,0,0,asm,13001+23001,849.0305
gfx938,f8_w8a8_channel,torch.float16,1536,352,4096,128,8,0,0,asm,13001+23001,899.2703
gfx938,f8_w8a8_channel,torch.float16,1920,352,4096,128,8,0,0,asm,13001+23001,1012.836
gfx938,f8_w8a8_channel,torch.float16,2048,352,4096,128,8,0,0,asm,13001+23001,1191.8837
gfx938,f8_w8a8_channel,torch.float16,2304,352,4096,128,8,0,0,asm,12005+22001,1445.8615
gfx938,f8_w8a8_channel,torch.float16,2560,352,4096,128,8,0,0,asm,12005+22001,1491.5539
gfx938,f8_w8a8_channel,torch.float16,3072,352,4096,128,8,0,0,asm,13001+23001,1566.3831
gfx938,f8_w8a8_channel,torch.float16,3584,352,4096,128,8,0,0,asm,13001+23001,1651.9658
gfx938,f8_w8a8_channel,torch.float16,3840,352,4096,128,8,0,0,asm,13001+23001,1747.4601
gfx938,f8_w8a8_channel,torch.float16,4096,352,4096,128,8,0,0,asm,13001+23001,1971.5349
gfx938,f8_w8a8_channel,torch.float16,4608,352,4096,128,8,0,0,asm,13001+23001,2280.3588
gfx938,f8_w8a8_channel,torch.float16,5120,352,4096,128,8,0,0,asm,13001+23001,2363.9879
gfx938,f8_w8a8_channel,torch.float16,6144,352,4096,128,8,0,0,asm,13001+23001,2770.6472
gfx938,f8_w8a8_channel,torch.float16,7168,352,4096,128,8,0,0,asm,13001+23001,3191.6222
gfx938,f8_w8a8_channel,torch.float16,8192,352,4096,128,8,0,0,asm,13001+23001,3572.9594
gfx938,f8_w8a8_channel,torch.float16,10240,352,4096,128,8,0,0,asm,13001+23001,4374.4799
gfx938,f8_w8a8_channel,torch.float16,12288,352,4096,128,8,0,0,asm,13001+23001,5152.6491
gfx938,f8_w8a8_channel,torch.float16,16384,352,4096,128,8,0,0,asm,13001+23001,6720.6083
gfx938,f8_w8a8_channel,torch.float16,24576,352,4096,128,8,0,0,asm,13001+23001,10204.6509
gfx938,f8_w8a8_channel,torch.float16,32768,352,4096,128,8,0,0,asm,13001+23001,13134.8606
gfx938,f8_w8a8_channel,torch.float16,1,352,4096,129,9,0,0,asm,10008+20000,59.1505
gfx938,f8_w8a8_channel,torch.float16,2,352,4096,129,9,0,0,asm,10011+20001,84.2789
gfx938,f8_w8a8_channel,torch.float16,4,352,4096,129,9,0,0,asm,10008+20000,133.5504
gfx938,f8_w8a8_channel,torch.float16,6,352,4096,129,9,0,0,asm,10011+20000,169.0869
gfx938,f8_w8a8_channel,torch.float16,8,352,4096,129,9,0,0,asm,10011+20000,214.6952
gfx938,f8_w8a8_channel,torch.float16,12,352,4096,129,9,0,0,asm,10011+20000,269.0782
gfx938,f8_w8a8_channel,torch.float16,16,352,4096,129,9,0,0,asm,10011+20000,304.5727
gfx938,f8_w8a8_channel,torch.float16,20,352,4096,129,9,0,0,asm,10011+20000,348.6201
gfx938,f8_w8a8_channel,torch.float16,24,352,4096,129,9,0,0,asm,10011+20000,358.1189
gfx938,f8_w8a8_channel,torch.float16,28,352,4096,129,9,0,0,asm,10011+20000,355.6209
gfx938,f8_w8a8_channel,torch.float16,32,352,4096,129,9,0,0,asm,10011+20000,375.9661
gfx938,f8_w8a8_channel,torch.float16,36,352,4096,129,9,0,0,asm,10011+20000,401.5798
gfx938,f8_w8a8_channel,torch.float16,40,352,4096,129,9,0,0,asm,10002+20000,416.6366
gfx938,f8_w8a8_channel,torch.float16,44,352,4096,129,9,0,0,asm,10002+20000,432.7375
gfx938,f8_w8a8_channel,torch.float16,48,352,4096,129,9,0,0,asm,10002+20000,436.7544
gfx938,f8_w8a8_channel,torch.float16,56,352,4096,129,9,0,0,asm,10011+20000,439.3396
gfx938,f8_w8a8_channel,torch.float16,64,352,4096,129,9,0,0,asm,10002+20000,448.3868
gfx938,f8_w8a8_channel,torch.float16,72,352,4096,129,9,0,0,asm,10011+20000,443.5838
gfx938,f8_w8a8_channel,torch.float16,80,352,4096,129,9,0,0,asm,10002+20000,446.7838
gfx938,f8_w8a8_channel,torch.float16,96,352,4096,129,9,0,0,asm,10002+20000,449.3269
gfx938,f8_w8a8_channel,torch.float16,104,352,4096,129,9,0,0,asm,10002+20000,452.3079
gfx938,f8_w8a8_channel,torch.float16,112,352,4096,129,9,0,0,asm,10002+20000,451.1291
gfx938,f8_w8a8_channel,torch.float16,128,352,4096,129,9,0,0,asm,10002+20000,454.4974
gfx938,f8_w8a8_channel,torch.float16,144,352,4096,129,9,0,0,asm,10002+20001,481.6721
gfx938,f8_w8a8_channel,torch.float16,160,352,4096,129,9,0,0,asm,10011+20000,459.5079
gfx938,f8_w8a8_channel,torch.float16,192,352,4096,129,9,0,0,asm,11005+21000,480.771
gfx938,f8_w8a8_channel,torch.float16,224,352,4096,129,9,0,0,asm,11005+21000,488.4005
gfx938,f8_w8a8_channel,torch.float16,256,352,4096,129,9,0,0,asm,11005+21000,495.8952
gfx938,f8_w8a8_channel,torch.float16,320,352,4096,129,9,0,0,asm,11005+21000,511.9877
gfx938,f8_w8a8_channel,torch.float16,384,352,4096,129,9,0,0,asm,11005+21000,551.8949
gfx938,f8_w8a8_channel,torch.float16,448,352,4096,129,9,0,0,asm,12005+22001,566.3791
gfx938,f8_w8a8_channel,torch.float16,512,352,4096,129,9,0,0,asm,12005+22001,582.6737
gfx938,f8_w8a8_channel,torch.float16,768,352,4096,129,9,0,0,asm,12001+22001,631.3219
gfx938,f8_w8a8_channel,torch.float16,896,352,4096,129,9,0,0,asm,12001+22001,741.4014
gfx938,f8_w8a8_channel,torch.float16,960,352,4096,129,9,0,0,asm,12001+22001,828.7526
gfx938,f8_w8a8_channel,torch.float16,1024,352,4096,129,9,0,0,asm,13001+23001,848.8536
gfx938,f8_w8a8_channel,torch.float16,1280,352,4096,129,9,0,0,asm,13001+23001,876.4829
gfx938,f8_w8a8_channel,torch.float16,1536,352,4096,129,9,0,0,asm,13001+23001,915.5733
gfx938,f8_w8a8_channel,torch.float16,1920,352,4096,129,9,0,0,asm,13001+23001,1321.8536
gfx938,f8_w8a8_channel,torch.float16,2048,352,4096,129,9,0,0,asm,12001+22001,1418.2911
gfx938,f8_w8a8_channel,torch.float16,2304,352,4096,129,9,0,0,asm,12001+22001,1505.9959
gfx938,f8_w8a8_channel,torch.float16,2560,352,4096,129,9,0,0,asm,13001+23001,1598.4671
gfx938,f8_w8a8_channel,torch.float16,3072,352,4096,129,9,0,0,asm,13001+23001,1680.7319
gfx938,f8_w8a8_channel,torch.float16,3584,352,4096,129,9,0,0,asm,13001+23001,1969.1433
gfx938,f8_w8a8_channel,torch.float16,3840,352,4096,129,9,0,0,asm,13001+23001,2186.6076
gfx938,f8_w8a8_channel,torch.float16,4096,352,4096,129,9,0,0,asm,13001+23001,2298.5144
gfx938,f8_w8a8_channel,torch.float16,4608,352,4096,129,9,0,0,asm,13001+23001,2375.6426
gfx938,f8_w8a8_channel,torch.float16,5120,352,4096,129,9,0,0,asm,13001+23001,2498.682
gfx938,f8_w8a8_channel,torch.float16,6144,352,4096,129,9,0,0,asm,13001+23001,3104.0772
gfx938,f8_w8a8_channel,torch.float16,7168,352,4096,129,9,0,0,asm,13001+23001,3422.5768
gfx938,f8_w8a8_channel,torch.float16,8192,352,4096,129,9,0,0,asm,13001+23001,4048.6372
gfx938,f8_w8a8_channel,torch.float16,10240,352,4096,129,9,0,0,asm,13001+23001,5000.6413
gfx938,f8_w8a8_channel,torch.float16,12288,352,4096,129,9,0,0,asm,13001+23001,5698.078
gfx938,f8_w8a8_channel,torch.float16,16384,352,4096,129,9,0,0,asm,13001+23001,7470.3985
gfx938,f8_w8a8_channel,torch.float16,24576,352,4096,129,9,0,0,asm,13001+23001,11072.2942
gfx938,f8_w8a8_channel,torch.float16,32768,352,4096,129,9,0,0,asm,13001+23001,14596.8846
gfx936,int8_w8a8_channel,torch.float16,1,384,3072,256,8,0,0,asm,10008+20000,56.8264
gfx936,int8_w8a8_channel,torch.float16,2,384,3072,256,8,0,0,asm,10013+20000,81.7951
gfx936,int8_w8a8_channel,torch.float16,4,384,3072,256,8,0,0,asm,10002+20000,132.7506
gfx936,int8_w8a8_channel,torch.float16,6,384,3072,256,8,0,0,asm,10002+20000,179.5884
gfx936,int8_w8a8_channel,torch.float16,8,384,3072,256,8,0,0,asm,10002+20000,215.5043
gfx936,int8_w8a8_channel,torch.float16,12,384,3072,256,8,0,0,asm,10002+20000,285.9295
gfx936,int8_w8a8_channel,torch.float16,16,384,3072,256,8,0,0,asm,10002+20000,345.4998
gfx936,int8_w8a8_channel,torch.float16,24,384,3072,256,8,0,0,asm,10002+20000,455.0041
gfx936,int8_w8a8_channel,torch.float16,32,384,3072,256,8,0,0,asm,10002+20000,557.1627
gfx936,int8_w8a8_channel,torch.float16,36,384,3072,256,8,0,0,asm,10002+20000,575.2362
gfx936,int8_w8a8_channel,torch.float16,48,384,3072,256,8,0,0,asm,10002+20000,648.0703
gfx936,int8_w8a8_channel,torch.float16,56,384,3072,256,8,0,0,asm,10002+20000,681.6115
gfx936,int8_w8a8_channel,torch.float16,64,384,3072,256,8,0,0,asm,10002+20000,709.3423
gfx936,int8_w8a8_channel,torch.float16,72,384,3072,256,8,0,0,asm,10002+20000,733.8225
gfx936,int8_w8a8_channel,torch.float16,80,384,3072,256,8,0,0,asm,10002+20000,762.3616
gfx936,int8_w8a8_channel,torch.float16,88,384,3072,256,8,0,0,asm,10002+20000,786.6734
gfx936,int8_w8a8_channel,torch.float16,96,384,3072,256,8,0,0,asm,10002+20000,799.2798
gfx936,int8_w8a8_channel,torch.float16,100,384,3072,256,8,0,0,asm,10002+20000,800.8546
gfx936,int8_w8a8_channel,torch.float16,112,384,3072,256,8,0,0,asm,10002+20000,818.8457
gfx936,int8_w8a8_channel,torch.float16,128,384,3072,256,8,0,0,asm,10002+20000,839.4823
gfx936,int8_w8a8_channel,torch.float16,144,384,3072,256,8,0,0,asm,10002+20000,847.5918
gfx936,int8_w8a8_channel,torch.float16,160,384,3072,256,8,0,0,asm,10002+20000,856.3665
gfx936,int8_w8a8_channel,torch.float16,192,384,3072,256,8,0,0,asm,10002+20000,871.7264
gfx936,int8_w8a8_channel,torch.float16,224,384,3072,256,8,0,0,asm,10002+20000,887.1116
gfx936,int8_w8a8_channel,torch.float16,256,384,3072,256,8,0,0,asm,10002+20000,899.8696
gfx936,int8_w8a8_channel,torch.float16,320,384,3072,256,8,0,0,asm,10002+20000,925.1746
gfx936,int8_w8a8_channel,torch.float16,384,384,3072,256,8,0,0,asm,11007+21000,950.7745
gfx936,int8_w8a8_channel,torch.float16,448,384,3072,256,8,0,0,asm,11007+21000,963.7851
gfx936,int8_w8a8_channel,torch.float16,512,384,3072,256,8,0,0,asm,11007+21000,983.2628
gfx936,int8_w8a8_channel,torch.float16,640,384,3072,256,8,0,0,asm,11007+21000,1016.4499
gfx936,int8_w8a8_channel,torch.float16,768,384,3072,256,8,0,0,asm,11007+21000,1044.2646
gfx936,int8_w8a8_channel,torch.float16,896,384,3072,256,8,0,0,asm,11007+21001,1079.5319
gfx936,int8_w8a8_channel,torch.float16,1024,384,3072,256,8,0,0,asm,12005+22001,1101.6539
gfx936,int8_w8a8_channel,torch.float16,1280,384,3072,256,8,0,0,asm,12005+22001,1150.9423
gfx936,int8_w8a8_channel,torch.float16,1536,384,3072,256,8,0,0,asm,12005+22001,1212.8369
gfx936,int8_w8a8_channel,torch.float16,2048,384,3072,256,8,0,0,asm,12001+22001,1368.7025
gfx936,int8_w8a8_channel,torch.float16,2304,384,3072,256,8,0,0,asm,13001+23001,1423.6751
gfx936,int8_w8a8_channel,torch.float16,2560,384,3072,256,8,0,0,asm,13001+23001,1469.0813
gfx936,int8_w8a8_channel,torch.float16,3072,384,3072,256,8,0,0,asm,13001+23001,1561.0895
gfx936,int8_w8a8_channel,torch.float16,3584,384,3072,256,8,0,0,asm,13001+23001,1670.9839
gfx936,int8_w8a8_channel,torch.float16,4096,384,3072,256,8,0,0,asm,13001+23001,1887.3709
gfx936,int8_w8a8_channel,torch.float16,5120,384,3072,256,8,0,0,asm,13001+23001,2325.1719
gfx936,int8_w8a8_channel,torch.float16,6144,384,3072,256,8,0,0,asm,13001+23001,2460.3279
gfx936,int8_w8a8_channel,torch.float16,7168,384,3072,256,8,0,0,asm,13001+23001,2649.5652
gfx936,int8_w8a8_channel,torch.float16,8192,384,3072,256,8,0,0,asm,13001+23001,3069.7829
gfx936,int8_w8a8_channel,torch.float16,10240,384,3072,256,8,0,0,asm,13001+23001,3692.2064
gfx936,int8_w8a8_channel,torch.float16,12288,384,3072,256,8,0,0,asm,13001+23001,4303.6906
gfx936,int8_w8a8_channel,torch.float16,16384,384,3072,256,8,0,0,asm,13001+23001,5566.5242
gfx936,int8_w8a8_channel,torch.float16,24576,384,3072,256,8,0,0,asm,13001+23001,8120.7216
gfx936,int8_w8a8_channel,torch.float16,32768,384,3072,256,8,0,0,asm,13001+23001,10670.8687
gfx936,int8_w8a8_channel,torch.float16,1,192,3072,256,8,0,0,asm,10002+20000,44.6414
gfx936,int8_w8a8_channel,torch.float16,2,192,3072,256,8,0,0,asm,10008+20000,58.1486
gfx936,int8_w8a8_channel,torch.float16,4,192,3072,256,8,0,0,asm,10002+20000,84.5319
gfx936,int8_w8a8_channel,torch.float16,6,192,3072,256,8,0,0,asm,10002+20000,111.858
gfx936,int8_w8a8_channel,torch.float16,8,192,3072,256,8,0,0,asm,10008+20001,130.1991
gfx936,int8_w8a8_channel,torch.float16,12,192,3072,256,8,0,0,asm,10002+20000,173.3315
gfx936,int8_w8a8_channel,torch.float16,16,192,3072,256,8,0,0,asm,10002+20000,204.5231
gfx936,int8_w8a8_channel,torch.float16,24,192,3072,256,8,0,0,asm,10002+20000,261.8589
gfx936,int8_w8a8_channel,torch.float16,32,192,3072,256,8,0,0,asm,10002+20001,320.0092
gfx936,int8_w8a8_channel,torch.float16,36,192,3072,256,8,0,0,asm,10002+20001,322.6504
gfx936,int8_w8a8_channel,torch.float16,48,192,3072,256,8,0,0,asm,10002+20001,361.5388
gfx936,int8_w8a8_channel,torch.float16,56,192,3072,256,8,0,0,asm,10002+20001,380.0229
gfx936,int8_w8a8_channel,torch.float16,64,192,3072,256,8,0,0,asm,10002+20001,391.8629
gfx936,int8_w8a8_channel,torch.float16,72,192,3072,256,8,0,0,asm,10002+20001,410.7261
gfx936,int8_w8a8_channel,torch.float16,80,192,3072,256,8,0,0,asm,10002+20001,423.1218
gfx936,int8_w8a8_channel,torch.float16,88,192,3072,256,8,0,0,asm,10002+20001,437.1513
gfx936,int8_w8a8_channel,torch.float16,96,192,3072,256,8,0,0,asm,10002+20001,440.9997
gfx936,int8_w8a8_channel,torch.float16,100,192,3072,256,8,0,0,asm,10002+20001,443.8797
gfx936,int8_w8a8_channel,torch.float16,112,192,3072,256,8,0,0,asm,10002+20001,451.1302
gfx936,int8_w8a8_channel,torch.float16,128,192,3072,256,8,0,0,asm,10002+20001,462.8607
gfx936,int8_w8a8_channel,torch.float16,144,192,3072,256,8,0,0,asm,10002+20001,469.9682
gfx936,int8_w8a8_channel,torch.float16,160,192,3072,256,8,0,0,asm,10002+20001,474.6839
gfx936,int8_w8a8_channel,torch.float16,192,192,3072,256,8,0,0,asm,10002+20001,485.3197
gfx936,int8_w8a8_channel,torch.float16,224,192,3072,256,8,0,0,asm,10002+20001,491.1639
gfx936,int8_w8a8_channel,torch.float16,256,192,3072,256,8,0,0,asm,10002+20001,498.7007
gfx936,int8_w8a8_channel,torch.float16,320,192,3072,256,8,0,0,asm,10002+20001,512.8228
gfx936,int8_w8a8_channel,torch.float16,384,192,3072,256,8,0,0,asm,10002+20001,533.9512
gfx936,int8_w8a8_channel,torch.float16,448,192,3072,256,8,0,0,asm,11006+21001,550.4481
gfx936,int8_w8a8_channel,torch.float16,512,192,3072,256,8,0,0,asm,11006+21001,566.9281
gfx936,int8_w8a8_channel,torch.float16,640,192,3072,256,8,0,0,asm,11004+21001,590.7595
gfx936,int8_w8a8_channel,torch.float16,768,192,3072,256,8,0,0,asm,11004+21001,620.5279
gfx936,int8_w8a8_channel,torch.float16,896,192,3072,256,8,0,0,asm,11005+21001,647.4415
gfx936,int8_w8a8_channel,torch.float16,1024,192,3072,256,8,0,0,asm,12004+22001,686.1783
gfx936,int8_w8a8_channel,torch.float16,1280,192,3072,256,8,0,0,asm,12004+22001,723.6267
gfx936,int8_w8a8_channel,torch.float16,1536,192,3072,256,8,0,0,asm,12000+22001,776.4603
gfx936,int8_w8a8_channel,torch.float16,2048,192,3072,256,8,0,0,asm,12001+22001,931.5421
gfx936,int8_w8a8_channel,torch.float16,2304,192,3072,256,8,0,0,asm,13001+23001,1029.8156
gfx936,int8_w8a8_channel,torch.float16,2560,192,3072,256,8,0,0,asm,13001+23001,1062.6493
gfx936,int8_w8a8_channel,torch.float16,3072,192,3072,256,8,0,0,asm,13001+23001,1136.1481
gfx936,int8_w8a8_channel,torch.float16,3584,192,3072,256,8,0,0,asm,13000+23001,1235.8199
gfx936,int8_w8a8_channel,torch.float16,4096,192,3072,256,8,0,0,asm,13001+23001,1479.2555
gfx936,int8_w8a8_channel,torch.float16,5120,192,3072,256,8,0,0,asm,12000+22001,1810.9182
gfx936,int8_w8a8_channel,torch.float16,6144,192,3072,256,8,0,0,asm,13001+23001,2028.7453
gfx936,int8_w8a8_channel,torch.float16,7168,192,3072,256,8,0,0,asm,13001+23001,2175.0862
gfx936,int8_w8a8_channel,torch.float16,8192,192,3072,256,8,0,0,asm,13001+23001,2538.3363
gfx936,int8_w8a8_channel,torch.float16,10240,192,3072,256,8,0,0,asm,13001+23001,3077.1904
gfx936,int8_w8a8_channel,torch.float16,12288,192,3072,256,8,0,0,asm,13001+23001,3606.2003
gfx936,int8_w8a8_channel,torch.float16,16384,192,3072,256,8,0,0,asm,13001+23001,4650.6454
gfx936,int8_w8a8_channel,torch.float16,24576,192,3072,256,8,0,0,asm,13001+23001,6805.7334
gfx936,int8_w8a8_channel,torch.float16,32768,192,3072,256,8,0,0,asm,13001+23001,8965.0994
gfx936,int8_w8a8_channel,torch.float16,1,192,5120,160,8,0,0,asm,10002+20000,51.2097
gfx936,int8_w8a8_channel,torch.float16,2,192,5120,160,8,0,0,asm,10009+20001,72.2287
gfx936,int8_w8a8_channel,torch.float16,4,192,5120,160,8,0,0,asm,10002+20000,107.8833
gfx936,int8_w8a8_channel,torch.float16,6,192,5120,160,8,0,0,asm,10001+20000,147.9592
gfx936,int8_w8a8_channel,torch.float16,8,192,5120,160,8,0,0,asm,10002+20000,183.6054
gfx936,int8_w8a8_channel,torch.float16,12,192,5120,160,8,0,0,asm,10002+20001,251.9926
gfx936,int8_w8a8_channel,torch.float16,16,192,5120,160,8,0,0,asm,10002+20001,294.4095
gfx936,int8_w8a8_channel,torch.float16,24,192,5120,160,8,0,0,asm,10002+20001,354.6758
gfx936,int8_w8a8_channel,torch.float16,32,192,5120,160,8,0,0,asm,10002+20001,398.502
gfx936,int8_w8a8_channel,torch.float16,36,192,5120,160,8,0,0,asm,10002+20001,409.6315
gfx936,int8_w8a8_channel,torch.float16,48,192,5120,160,8,0,0,asm,10002+20001,437.9347
gfx936,int8_w8a8_channel,torch.float16,56,192,5120,160,8,0,0,asm,10002+20001,454.9199
gfx936,int8_w8a8_channel,torch.float16,64,192,5120,160,8,0,0,asm,10002+20001,460.5957
gfx936,int8_w8a8_channel,torch.float16,72,192,5120,160,8,0,0,asm,10002+20001,468.8146
gfx936,int8_w8a8_channel,torch.float16,80,192,5120,160,8,0,0,asm,10002+20001,475.0883
gfx936,int8_w8a8_channel,torch.float16,88,192,5120,160,8,0,0,asm,10002+20001,478.4988
gfx936,int8_w8a8_channel,torch.float16,96,192,5120,160,8,0,0,asm,10002+20001,482.1788
gfx936,int8_w8a8_channel,torch.float16,100,192,5120,160,8,0,0,asm,10002+20001,486.3304
gfx936,int8_w8a8_channel,torch.float16,112,192,5120,160,8,0,0,asm,10002+20001,492.0398
gfx936,int8_w8a8_channel,torch.float16,128,192,5120,160,8,0,0,asm,10002+20001,496.6546
gfx936,int8_w8a8_channel,torch.float16,144,192,5120,160,8,0,0,asm,10002+20001,503.2904
gfx936,int8_w8a8_channel,torch.float16,160,192,5120,160,8,0,0,asm,10002+20001,506.4402
gfx936,int8_w8a8_channel,torch.float16,192,192,5120,160,8,0,0,asm,10002+20001,516.1665
gfx936,int8_w8a8_channel,torch.float16,224,192,5120,160,8,0,0,asm,10002+20001,529.9265
gfx936,int8_w8a8_channel,torch.float16,256,192,5120,160,8,0,0,asm,10002+20001,540.7391
gfx936,int8_w8a8_channel,torch.float16,320,192,5120,160,8,0,0,asm,11006+21001,567.9896
gfx936,int8_w8a8_channel,torch.float16,384,192,5120,160,8,0,0,asm,11006+21001,584.0148
gfx936,int8_w8a8_channel,torch.float16,448,192,5120,160,8,0,0,asm,11006+21001,599.0296
gfx936,int8_w8a8_channel,torch.float16,512,192,5120,160,8,0,0,asm,11005+21001,634.3727
gfx936,int8_w8a8_channel,torch.float16,640,192,5120,160,8,0,0,asm,12001+22001,682.2043
gfx936,int8_w8a8_channel,torch.float16,768,192,5120,160,8,0,0,asm,12001+22001,709.539
gfx936,int8_w8a8_channel,torch.float16,896,192,5120,160,8,0,0,asm,12001+22001,739.1137
gfx936,int8_w8a8_channel,torch.float16,1024,192,5120,160,8,0,0,asm,12004+22001,779.4253
gfx936,int8_w8a8_channel,torch.float16,1280,192,5120,160,8,0,0,asm,12000+22001,909.4463
gfx936,int8_w8a8_channel,torch.float16,1536,192,5120,160,8,0,0,asm,13001+23001,1025.7494
gfx936,int8_w8a8_channel,torch.float16,2048,192,5120,160,8,0,0,asm,13001+23001,1125.4882
gfx936,int8_w8a8_channel,torch.float16,2304,192,5120,160,8,0,0,asm,13001+23001,1233.5892
gfx936,int8_w8a8_channel,torch.float16,2560,192,5120,160,8,0,0,asm,12000+22001,1461.5554
gfx936,int8_w8a8_channel,torch.float16,3072,192,5120,160,8,0,0,asm,12000+22001,1716.0143
gfx936,int8_w8a8_channel,torch.float16,3584,192,5120,160,8,0,0,asm,12000+22001,1865.3784
gfx936,int8_w8a8_channel,torch.float16,4096,192,5120,160,8,0,0,asm,13001+23001,1995.8962
gfx936,int8_w8a8_channel,torch.float16,5120,192,5120,160,8,0,0,asm,13001+23001,2466.4559
gfx936,int8_w8a8_channel,torch.float16,6144,192,5120,160,8,0,0,asm,13001+23001,2914.4052
gfx936,int8_w8a8_channel,torch.float16,7168,192,5120,160,8,0,0,asm,13001+23001,3161.0576
gfx936,int8_w8a8_channel,torch.float16,8192,192,5120,160,8,0,0,asm,13001+23001,3814.2362
gfx936,int8_w8a8_channel,torch.float16,10240,192,5120,160,8,0,0,asm,13001+23001,4517.2759
gfx936,int8_w8a8_channel,torch.float16,12288,192,5120,160,8,0,0,asm,13001+23001,5242.8252
gfx936,int8_w8a8_channel,torch.float16,16384,192,5120,160,8,0,0,asm,13001+23001,7024.2813
gfx936,int8_w8a8_channel,torch.float16,24576,192,5120,160,8,0,0,asm,13001+23001,10233.6104
gfx936,int8_w8a8_channel,torch.float16,32768,192,5120,160,8,0,0,asm,13001+23001,13478.1774
gfx936,int8_w8a8_channel,torch.float16,1,96,5120,160,8,0,0,asm,10001+20000,43.2436
gfx936,int8_w8a8_channel,torch.float16,2,96,5120,160,8,0,0,asm,10002+20001,54.5699
gfx936,int8_w8a8_channel,torch.float16,4,96,5120,160,8,0,0,asm,10008+20001,75.2353
gfx936,int8_w8a8_channel,torch.float16,6,96,5120,160,8,0,0,asm,10011+20001,94.9994
gfx936,int8_w8a8_channel,torch.float16,8,96,5120,160,8,0,0,asm,10002+20001,112.7595
gfx936,int8_w8a8_channel,torch.float16,12,96,5120,160,8,0,0,asm,10002+20001,153.0122
gfx936,int8_w8a8_channel,torch.float16,16,96,5120,160,8,0,0,asm,10002+20001,173.0712
gfx936,int8_w8a8_channel,torch.float16,24,96,5120,160,8,0,0,asm,10002+20001,204.1503
gfx936,int8_w8a8_channel,torch.float16,32,96,5120,160,8,0,0,asm,10002+20001,235.4881
gfx936,int8_w8a8_channel,torch.float16,36,96,5120,160,8,0,0,asm,10002+20001,235.5018
gfx936,int8_w8a8_channel,torch.float16,48,96,5120,160,8,0,0,asm,10002+20001,249.2198
gfx936,int8_w8a8_channel,torch.float16,56,96,5120,160,8,0,0,asm,10002+20001,262.0619
gfx936,int8_w8a8_channel,torch.float16,64,96,5120,160,8,0,0,asm,10002+20001,265.0346
gfx936,int8_w8a8_channel,torch.float16,72,96,5120,160,8,0,0,asm,10008+20001,270.1714
gfx936,int8_w8a8_channel,torch.float16,80,96,5120,160,8,0,0,asm,10002+20001,271.9567
gfx936,int8_w8a8_channel,torch.float16,88,96,5120,160,8,0,0,asm,10002+20001,272.5714
gfx936,int8_w8a8_channel,torch.float16,96,96,5120,160,8,0,0,asm,10008+20001,277.5483
gfx936,int8_w8a8_channel,torch.float16,100,96,5120,160,8,0,0,asm,10002+20001,280.3778
gfx936,int8_w8a8_channel,torch.float16,112,96,5120,160,8,0,0,asm,10002+20001,281.6999
gfx936,int8_w8a8_channel,torch.float16,128,96,5120,160,8,0,0,asm,10002+20001,285.6494
gfx936,int8_w8a8_channel,torch.float16,144,96,5120,160,8,0,0,asm,10002+20001,290.7609
gfx936,int8_w8a8_channel,torch.float16,160,96,5120,160,8,0,0,asm,10001+20001,296.5799
gfx936,int8_w8a8_channel,torch.float16,192,96,5120,160,8,0,0,asm,10002+20001,300.6978
gfx936,int8_w8a8_channel,torch.float16,224,96,5120,160,8,0,0,asm,10002+20001,310.3484
gfx936,int8_w8a8_channel,torch.float16,256,96,5120,160,8,0,0,asm,10002+20001,321.8684
gfx936,int8_w8a8_channel,torch.float16,320,96,5120,160,8,0,0,asm,11004+21001,347.6705
gfx936,int8_w8a8_channel,torch.float16,384,96,5120,160,8,0,0,asm,11005+21001,361.161
gfx936,int8_w8a8_channel,torch.float16,448,96,5120,160,8,0,0,asm,11005+21001,370.062
gfx936,int8_w8a8_channel,torch.float16,512,96,5120,160,8,0,0,asm,11003+21001,392.8317
gfx936,int8_w8a8_channel,torch.float16,640,96,5120,160,8,0,0,asm,11005+21001,449.4717
gfx936,int8_w8a8_channel,torch.float16,768,96,5120,160,8,0,0,asm,12001+22001,488.2422
gfx936,int8_w8a8_channel,torch.float16,896,96,5120,160,8,0,0,asm,12001+22001,513.1684
gfx936,int8_w8a8_channel,torch.float16,1024,96,5120,160,8,0,0,asm,12001+22001,536.2168
gfx936,int8_w8a8_channel,torch.float16,1280,96,5120,160,8,0,0,asm,12001+22001,650.3052
gfx936,int8_w8a8_channel,torch.float16,1536,96,5120,160,8,0,0,asm,12001+22001,783.265
gfx936,int8_w8a8_channel,torch.float16,2048,96,5120,160,8,0,0,asm,13001+23001,866.7007
gfx936,int8_w8a8_channel,torch.float16,2304,96,5120,160,8,0,0,asm,13001+23001,931.2733
gfx936,int8_w8a8_channel,torch.float16,2560,96,5120,160,8,0,0,asm,12001+22001,1096.5869
gfx936,int8_w8a8_channel,torch.float16,3072,96,5120,160,8,0,0,asm,12001+22001,1280.1487
gfx936,int8_w8a8_channel,torch.float16,3584,96,5120,160,8,0,0,asm,12001+22001,1389.3526
gfx936,int8_w8a8_channel,torch.float16,4096,96,5120,160,8,0,0,asm,13001+23001,1541.3777
gfx936,int8_w8a8_channel,torch.float16,5120,96,5120,160,8,0,0,asm,13001+23001,1930.5899
gfx936,int8_w8a8_channel,torch.float16,6144,96,5120,160,8,0,0,asm,13001+23001,2287.2296
gfx936,int8_w8a8_channel,torch.float16,7168,96,5120,160,8,0,0,asm,13001+23001,2472.2483
gfx936,int8_w8a8_channel,torch.float16,8192,96,5120,160,8,0,0,asm,13001+23001,2966.6731
gfx936,int8_w8a8_channel,torch.float16,10240,96,5120,160,8,0,0,asm,13001+23001,3557.0135
gfx936,int8_w8a8_channel,torch.float16,12288,96,5120,160,8,0,0,asm,13001+23001,4122.2256
gfx936,int8_w8a8_channel,torch.float16,16384,96,5120,160,8,0,0,asm,13001+23001,5528.9355
gfx936,int8_w8a8_channel,torch.float16,24576,96,5120,160,8,0,0,asm,13001+23001,8067.3382
gfx936,int8_w8a8_channel,torch.float16,32768,96,5120,160,8,0,0,asm,13001+23001,10613.811
gfx936,int8_w8a8_channel,torch.float16,1,192,4096,128,8,0,0,asm,10002+20000,45.8035
gfx936,int8_w8a8_channel,torch.float16,2,192,4096,128,8,0,0,asm,10002+20000,65.0792
gfx936,int8_w8a8_channel,torch.float16,4,192,4096,128,8,0,0,asm,10002+20000,93.0033
gfx936,int8_w8a8_channel,torch.float16,6,192,4096,128,8,0,0,asm,10001+20000,123.6391
gfx936,int8_w8a8_channel,torch.float16,8,192,4096,128,8,0,0,asm,10001+20000,151.7235
gfx936,int8_w8a8_channel,torch.float16,12,192,4096,128,8,0,0,asm,10002+20000,190.6369
gfx936,int8_w8a8_channel,torch.float16,16,192,4096,128,8,0,0,asm,10001+20001,224.3127
gfx936,int8_w8a8_channel,torch.float16,24,192,4096,128,8,0,0,asm,10002+20001,261.0761
gfx936,int8_w8a8_channel,torch.float16,32,192,4096,128,8,0,0,asm,10001+20001,280.3211
gfx936,int8_w8a8_channel,torch.float16,36,192,4096,128,8,0,0,asm,10002+20001,286.1538
gfx936,int8_w8a8_channel,torch.float16,48,192,4096,128,8,0,0,asm,10001+20001,311.2739
gfx936,int8_w8a8_channel,torch.float16,56,192,4096,128,8,0,0,asm,10001+20001,315.4338
gfx936,int8_w8a8_channel,torch.float16,64,192,4096,128,8,0,0,asm,10001+20001,330.0894
gfx936,int8_w8a8_channel,torch.float16,72,192,4096,128,8,0,0,asm,10001+20001,321.1854
gfx936,int8_w8a8_channel,torch.float16,80,192,4096,128,8,0,0,asm,10001+20001,323.7706
gfx936,int8_w8a8_channel,torch.float16,88,192,4096,128,8,0,0,asm,10002+20001,327.7454
gfx936,int8_w8a8_channel,torch.float16,96,192,4096,128,8,0,0,asm,10002+20000,331.2233
gfx936,int8_w8a8_channel,torch.float16,100,192,4096,128,8,0,0,asm,10002+20001,331.0465
gfx936,int8_w8a8_channel,torch.float16,112,192,4096,128,8,0,0,asm,10002+20001,335.5349
gfx936,int8_w8a8_channel,torch.float16,128,192,4096,128,8,0,0,asm,10002+20001,340.1243
gfx936,int8_w8a8_channel,torch.float16,144,192,4096,128,8,0,0,asm,10002+20001,344.5454
gfx936,int8_w8a8_channel,torch.float16,160,192,4096,128,8,0,0,asm,10002+20001,348.3854
gfx936,int8_w8a8_channel,torch.float16,192,192,4096,128,8,0,0,asm,10002+20001,359.7033
gfx936,int8_w8a8_channel,torch.float16,224,192,4096,128,8,0,0,asm,11006+21001,371.7958
gfx936,int8_w8a8_channel,torch.float16,256,192,4096,128,8,0,0,asm,11005+21001,377.3874
gfx936,int8_w8a8_channel,torch.float16,320,192,4096,128,8,0,0,asm,11004+21001,403.1727
gfx936,int8_w8a8_channel,torch.float16,384,192,4096,128,8,0,0,asm,11004+21001,412.6969
gfx936,int8_w8a8_channel,torch.float16,448,192,4096,128,8,0,0,asm,11005+21001,427.6864
gfx936,int8_w8a8_channel,torch.float16,512,192,4096,128,8,0,0,asm,11005+21001,456.5368
gfx936,int8_w8a8_channel,torch.float16,640,192,4096,128,8,0,0,asm,12004+22001,481.2694
gfx936,int8_w8a8_channel,torch.float16,768,192,4096,128,8,0,0,asm,12001+22001,508.0230
gfx936,int8_w8a8_channel,torch.float16,896,192,4096,128,8,0,0,asm,12000+22001,552.1999
gfx936,int8_w8a8_channel,torch.float16,1024,192,4096,128,8,0,0,asm,12001+22001,606.8441
gfx936,int8_w8a8_channel,torch.float16,1280,192,4096,128,8,0,0,asm,13001+23001,697.2861
gfx936,int8_w8a8_channel,torch.float16,1536,192,4096,128,8,0,0,asm,13001+23001,738.6249
gfx936,int8_w8a8_channel,torch.float16,2048,192,4096,128,8,0,0,asm,13001+23001,959.1636
gfx936,int8_w8a8_channel,torch.float16,2304,192,4096,128,8,0,0,asm,12000+22001,1102.2878
gfx936,int8_w8a8_channel,torch.float16,2560,192,4096,128,8,0,0,asm,12000+22001,1152.1824
gfx936,int8_w8a8_channel,torch.float16,3072,192,4096,128,8,0,0,asm,13001+23001,1294.9864
gfx936,int8_w8a8_channel,torch.float16,3584,192,4096,128,8,0,0,asm,13001+23001,1403.7105
gfx936,int8_w8a8_channel,torch.float16,4096,192,4096,128,8,0,0,asm,13001+23001,1613.2093
gfx936,int8_w8a8_channel,torch.float16,5120,192,4096,128,8,0,0,asm,13001+23001,1955.6931
gfx936,int8_w8a8_channel,torch.float16,6144,192,4096,128,8,0,0,asm,13001+23001,2323.5159
gfx936,int8_w8a8_channel,torch.float16,7168,192,4096,128,8,0,0,asm,13001+23001,2635.3051
gfx936,int8_w8a8_channel,torch.float16,8192,192,4096,128,8,0,0,asm,13001+23001,2953.2079
gfx936,int8_w8a8_channel,torch.float16,10240,192,4096,128,8,0,0,asm,13001+23001,3634.3272
gfx936,int8_w8a8_channel,torch.float16,12288,192,4096,128,8,0,0,asm,13001+23001,4299.6487
gfx936,int8_w8a8_channel,torch.float16,16384,192,4096,128,8,0,0,asm,13001+23001,5648.0011
gfx936,int8_w8a8_channel,torch.float16,24576,192,4096,128,8,0,0,asm,13001+23001,8335.2828
gfx936,int8_w8a8_channel,torch.float16,32768,192,4096,128,8,0,0,asm,13001+23001,11020.2319
gfx936,int8_w8a8_channel,torch.float16,1,96,4096,128,8,0,0,asm,10003+20001,38.1151
gfx936,int8_w8a8_channel,torch.float16,2,96,4096,128,8,0,0,asm,10002+20000,47.5549
gfx936,int8_w8a8_channel,torch.float16,4,96,4096,128,8,0,0,asm,10008+20001,66.3425
gfx936,int8_w8a8_channel,torch.float16,6,96,4096,128,8,0,0,asm,10011+20001,79.4709
gfx936,int8_w8a8_channel,torch.float16,8,96,4096,128,8,0,0,asm,10011+20001,95.3781
gfx936,int8_w8a8_channel,torch.float16,12,96,4096,128,8,0,0,asm,10001+20001,120.717
gfx936,int8_w8a8_channel,torch.float16,16,96,4096,128,8,0,0,asm,10001+20001,137.7275
gfx936,int8_w8a8_channel,torch.float16,24,96,4096,128,8,0,0,asm,10002+20001,154.5499
gfx936,int8_w8a8_channel,torch.float16,32,96,4096,128,8,0,0,asm,10011+20001,169.9718
gfx936,int8_w8a8_channel,torch.float16,36,96,4096,128,8,0,0,asm,10001+20001,170.0784
gfx936,int8_w8a8_channel,torch.float16,48,96,4096,128,8,0,0,asm,10002+20001,183.2321
gfx936,int8_w8a8_channel,torch.float16,56,96,4096,128,8,0,0,asm,10002+20001,185.6151
gfx936,int8_w8a8_channel,torch.float16,64,96,4096,128,8,0,0,asm,10013+20001,200.6075
gfx936,int8_w8a8_channel,torch.float16,72,96,4096,128,8,0,0,asm,10002+20001,188.1583
gfx936,int8_w8a8_channel,torch.float16,80,96,4096,128,8,0,0,asm,10002+20001,189.2614
gfx936,int8_w8a8_channel,torch.float16,88,96,4096,128,8,0,0,asm,10013+20001,192.1668
gfx936,int8_w8a8_channel,torch.float16,96,96,4096,128,8,0,0,asm,10002+20001,193.8594
gfx936,int8_w8a8_channel,torch.float16,100,96,4096,128,8,0,0,asm,10002+20001,195.5519
gfx936,int8_w8a8_channel,torch.float16,112,96,4096,128,8,0,0,asm,10002+20001,196.9414
gfx936,int8_w8a8_channel,torch.float16,128,96,4096,128,8,0,0,asm,10001+20001,198.7267
gfx936,int8_w8a8_channel,torch.float16,144,96,4096,128,8,0,0,asm,10002+20001,204.8403
gfx936,int8_w8a8_channel,torch.float16,160,96,4096,128,8,0,0,asm,10002+20001,208.2004
gfx936,int8_w8a8_channel,torch.float16,192,96,4096,128,8,0,0,asm,10002+20001,218.5918
gfx936,int8_w8a8_channel,torch.float16,224,96,4096,128,8,0,0,asm,11007+21001,226.6593
gfx936,int8_w8a8_channel,torch.float16,256,96,4096,128,8,0,0,asm,11007+21001,230.8277
gfx936,int8_w8a8_channel,torch.float16,320,96,4096,128,8,0,0,asm,11000+21001,257.3539
gfx936,int8_w8a8_channel,torch.float16,384,96,4096,128,8,0,0,asm,11004+21001,273.194
gfx936,int8_w8a8_channel,torch.float16,448,96,4096,128,8,0,0,asm,11004+21001,283.4255
gfx936,int8_w8a8_channel,torch.float16,512,96,4096,128,8,0,0,asm,11005+21001,300.8992
gfx936,int8_w8a8_channel,torch.float16,640,96,4096,128,8,0,0,asm,12005+22001,330.1791
gfx936,int8_w8a8_channel,torch.float16,768,96,4096,128,8,0,0,asm,12005+22001,348.8991
gfx936,int8_w8a8_channel,torch.float16,896,96,4096,128,8,0,0,asm,12000+22001,395.1896
gfx936,int8_w8a8_channel,torch.float16,1024,96,4096,128,8,0,0,asm,12001+22001,431.7875
gfx936,int8_w8a8_channel,torch.float16,1280,96,4096,128,8,0,0,asm,13001+23001,521.4631
gfx936,int8_w8a8_channel,torch.float16,1536,96,4096,128,8,0,0,asm,13001+23001,554.6757
gfx936,int8_w8a8_channel,torch.float16,2048,96,4096,128,8,0,0,asm,12001+22001,704.6884
gfx936,int8_w8a8_channel,torch.float16,2304,96,4096,128,8,0,0,asm,12001+22001,816.0986
gfx936,int8_w8a8_channel,torch.float16,2560,96,4096,128,8,0,0,asm,12001+22001,853.9596
gfx936,int8_w8a8_channel,torch.float16,3072,96,4096,128,8,0,0,asm,12005+22001,990.5068
gfx936,int8_w8a8_channel,torch.float16,3584,96,4096,128,8,0,0,asm,13001+23001,1099.4415
gfx936,int8_w8a8_channel,torch.float16,4096,96,4096,128,8,0,0,asm,13001+23001,1252.3592
gfx936,int8_w8a8_channel,torch.float16,5120,96,4096,128,8,0,0,asm,13001+23001,1523.34
gfx936,int8_w8a8_channel,torch.float16,6144,96,4096,128,8,0,0,asm,13001+23001,1819.7692
gfx936,int8_w8a8_channel,torch.float16,7168,96,4096,128,8,0,0,asm,13001+23001,2057.79
gfx936,int8_w8a8_channel,torch.float16,8192,96,4096,128,8,0,0,asm,13001+23001,2314.2613
gfx936,int8_w8a8_channel,torch.float16,10240,96,4096,128,8,0,0,asm,13001+23001,2847.3472
gfx936,int8_w8a8_channel,torch.float16,12288,96,4096,128,8,0,0,asm,13001+23001,3375.0267
gfx936,int8_w8a8_channel,torch.float16,16384,96,4096,128,8,0,0,asm,13001+23001,4440.3141
gfx936,int8_w8a8_channel,torch.float16,24576,96,4096,128,8,0,0,asm,13001+23001,6558.0723
gfx936,int8_w8a8_channel,torch.float16,32768,96,4096,128,8,0,0,asm,13001+23001,8674.584
gfx936,int8_w8a8_channel,torch.float16,1,256,3072,256,8,0,0,asm,10002+20000,48.3972
gfx936,int8_w8a8_channel,torch.float16,2,256,3072,256,8,0,0,asm,10002+20000,66.0139
gfx936,int8_w8a8_channel,torch.float16,4,256,3072,256,8,0,0,asm,10013+20000,98.4014
gfx936,int8_w8a8_channel,torch.float16,6,256,3072,256,8,0,0,asm,10002+20000,129.3739
gfx936,int8_w8a8_channel,torch.float16,8,256,3072,256,8,0,0,asm,10013+20000,156.3802
gfx936,int8_w8a8_channel,torch.float16,12,256,3072,256,8,0,0,asm,10002+20000,205.3233
gfx936,int8_w8a8_channel,torch.float16,16,256,3072,256,8,0,0,asm,10002+20001,248.0685
gfx936,int8_w8a8_channel,torch.float16,24,256,3072,256,8,0,0,asm,10002+20001,320.0738
gfx936,int8_w8a8_channel,torch.float16,32,256,3072,256,8,0,0,asm,10002+20001,392.4726
gfx936,int8_w8a8_channel,torch.float16,36,256,3072,256,8,0,0,asm,10002+20001,402.2885
gfx936,int8_w8a8_channel,torch.float16,48,256,3072,256,8,0,0,asm,10002+20001,450.5242
gfx936,int8_w8a8_channel,torch.float16,56,256,3072,256,8,0,0,asm,10002+20000,474.7179
gfx936,int8_w8a8_channel,torch.float16,64,256,3072,256,8,0,0,asm,10002+20001,492.7474
gfx936,int8_w8a8_channel,torch.float16,72,256,3072,256,8,0,0,asm,10002+20000,510.5494
gfx936,int8_w8a8_channel,torch.float16,80,256,3072,256,8,0,0,asm,10002+20001,527.6442
gfx936,int8_w8a8_channel,torch.float16,88,256,3072,256,8,0,0,asm,10002+20001,544.7388
gfx936,int8_w8a8_channel,torch.float16,96,256,3072,256,8,0,0,asm,10002+20001,551.7368
gfx936,int8_w8a8_channel,torch.float16,100,256,3072,256,8,0,0,asm,10002+20000,552.4694
gfx936,int8_w8a8_channel,torch.float16,112,256,3072,256,8,0,0,asm,10002+20001,563.6272
gfx936,int8_w8a8_channel,torch.float16,128,256,3072,256,8,0,0,asm,10002+20000,578.1029
gfx936,int8_w8a8_channel,torch.float16,144,256,3072,256,8,0,0,asm,10002+20001,586.8777
gfx936,int8_w8a8_channel,torch.float16,160,256,3072,256,8,0,0,asm,10002+20001,592.4525
gfx936,int8_w8a8_channel,torch.float16,192,256,3072,256,8,0,0,asm,10002+20001,604.444
gfx936,int8_w8a8_channel,torch.float16,224,256,3072,256,8,0,0,asm,10002+20001,615.3409
gfx936,int8_w8a8_channel,torch.float16,256,256,3072,256,8,0,0,asm,10002+20001,623.1893
gfx936,int8_w8a8_channel,torch.float16,320,256,3072,256,8,0,0,asm,10002+20001,639.0377
gfx936,int8_w8a8_channel,torch.float16,384,256,3072,256,8,0,0,asm,11007+21001,657.9093
gfx936,int8_w8a8_channel,torch.float16,448,256,3072,256,8,0,0,asm,11007+21001,668.823
gfx936,int8_w8a8_channel,torch.float16,512,256,3072,256,8,0,0,asm,11007+21001,686.1451
gfx936,int8_w8a8_channel,torch.float16,640,256,3072,256,8,0,0,asm,11007+21001,719.2651
gfx936,int8_w8a8_channel,torch.float16,768,256,3072,256,8,0,0,asm,11007+21001,742.8187
gfx936,int8_w8a8_channel,torch.float16,896,256,3072,256,8,0,0,asm,11007+21001,765.7492
gfx936,int8_w8a8_channel,torch.float16,1024,256,3072,256,8,0,0,asm,11005+21001,805.9598
gfx936,int8_w8a8_channel,torch.float16,1280,256,3072,256,8,0,0,asm,12005+22001,861.6987
gfx936,int8_w8a8_channel,torch.float16,1536,256,3072,256,8,0,0,asm,12005+22001,920.4859
gfx936,int8_w8a8_channel,torch.float16,2048,256,3072,256,8,0,0,asm,12005+22001,1047.6522
gfx936,int8_w8a8_channel,torch.float16,2304,256,3072,256,8,0,0,asm,13001+23001,1113.9763
gfx936,int8_w8a8_channel,torch.float16,2560,256,3072,256,8,0,0,asm,13001+23001,1148.7468
gfx936,int8_w8a8_channel,torch.float16,3072,256,3072,256,8,0,0,asm,13001+23001,1226.7341
gfx936,int8_w8a8_channel,torch.float16,3584,256,3072,256,8,0,0,asm,13001+23001,1336.0982
gfx936,int8_w8a8_channel,torch.float16,4096,256,3072,256,8,0,0,asm,13001+23001,1522.7002
gfx936,int8_w8a8_channel,torch.float16,5120,256,3072,256,8,0,0,asm,12001+22001,1872.0472
gfx936,int8_w8a8_channel,torch.float16,6144,256,3072,256,8,0,0,asm,13001+23001,2030.5648
gfx936,int8_w8a8_channel,torch.float16,7168,256,3072,256,8,0,0,asm,13001+23001,2183.6848
gfx936,int8_w8a8_channel,torch.float16,8192,256,3072,256,8,0,0,asm,13001+23001,2521.495
gfx936,int8_w8a8_channel,torch.float16,10240,256,3072,256,8,0,0,asm,13001+23001,3044.9724
gfx936,int8_w8a8_channel,torch.float16,12288,256,3072,256,8,0,0,asm,13001+23001,3573.7635
gfx936,int8_w8a8_channel,torch.float16,16384,256,3072,256,8,0,0,asm,13001+23001,4611.2867
gfx936,int8_w8a8_channel,torch.float16,24576,256,3072,256,8,0,0,asm,13001+23001,6740.9099
gfx936,int8_w8a8_channel,torch.float16,32768,256,3072,256,8,0,0,asm,13001+23001,8835.3837
gfx936,int8_w8a8_channel,torch.float16,1,128,3072,256,8,0,0,asm,10004+20000,44.4477
gfx936,int8_w8a8_channel,torch.float16,2,128,3072,256,8,0,0,asm,10002+20100,52.7761
gfx936,int8_w8a8_channel,torch.float16,4,128,3072,256,8,0,0,asm,10002+20102,69.7361
gfx936,int8_w8a8_channel,torch.float16,6,128,3072,256,8,0,0,asm,10002+20102,87.2939
gfx936,int8_w8a8_channel,torch.float16,8,128,3072,256,8,0,0,asm,10010+20102,101.1886
gfx936,int8_w8a8_channel,torch.float16,12,128,3072,256,8,0,0,asm,10002+20001,131.2096
gfx936,int8_w8a8_channel,torch.float16,16,128,3072,256,8,0,0,asm,10002+20001,153.9296
gfx936,int8_w8a8_channel,torch.float16,24,128,3072,256,8,0,0,asm,10002+20001,187.5521
gfx936,int8_w8a8_channel,torch.float16,32,128,3072,256,8,0,0,asm,10002+20001,232.5991
gfx936,int8_w8a8_channel,torch.float16,36,128,3072,256,8,0,0,asm,10002+20001,227.4087
gfx936,int8_w8a8_channel,torch.float16,48,128,3072,256,8,0,0,asm,10002+20001,253.9349
gfx936,int8_w8a8_channel,torch.float16,56,128,3072,256,8,0,0,asm,10002+20001,266.7097
gfx936,int8_w8a8_channel,torch.float16,64,128,3072,256,8,0,0,asm,10002+20001,279.2823
gfx936,int8_w8a8_channel,torch.float16,72,128,3072,256,8,0,0,asm,10002+20001,286.6423
gfx936,int8_w8a8_channel,torch.float16,80,128,3072,256,8,0,0,asm,10002+20001,296.7054
gfx936,int8_w8a8_channel,torch.float16,88,128,3072,256,8,0,0,asm,10002+20001,303.0211
gfx936,int8_w8a8_channel,torch.float16,96,128,3072,256,8,0,0,asm,10002+20001,310.4316
gfx936,int8_w8a8_channel,torch.float16,100,128,3072,256,8,0,0,asm,10002+20001,308.5117
gfx936,int8_w8a8_channel,torch.float16,112,128,3072,256,8,0,0,asm,10002+20001,314.5159
gfx936,int8_w8a8_channel,torch.float16,128,128,3072,256,8,0,0,asm,10002+20001,323.198
gfx936,int8_w8a8_channel,torch.float16,144,128,3072,256,8,0,0,asm,10002+20001,326.8106
gfx936,int8_w8a8_channel,torch.float16,160,128,3072,256,8,0,0,asm,10002+20001,332.4781
gfx936,int8_w8a8_channel,torch.float16,192,128,3072,256,8,0,0,asm,10002+20001,333.9349
gfx936,int8_w8a8_channel,torch.float16,224,128,3072,256,8,0,0,asm,10013+20001,342.6423
gfx936,int8_w8a8_channel,torch.float16,256,128,3072,256,8,0,0,asm,10002+20001,344.8234
gfx936,int8_w8a8_channel,torch.float16,320,128,3072,256,8,0,0,asm,10002+20001,355.7706
gfx936,int8_w8a8_channel,torch.float16,384,128,3072,256,8,0,0,asm,10002+20001,372.5369
gfx936,int8_w8a8_channel,torch.float16,448,128,3072,256,8,0,0,asm,11007+21001,379.2065
gfx936,int8_w8a8_channel,torch.float16,512,128,3072,256,8,0,0,asm,11007+21001,395.7538
gfx936,int8_w8a8_channel,torch.float16,640,128,3072,256,8,0,0,asm,11004+21001,416.5117
gfx936,int8_w8a8_channel,torch.float16,768,128,3072,256,8,0,0,asm,11007+21001,439.7537
gfx936,int8_w8a8_channel,torch.float16,896,128,3072,256,8,0,0,asm,11007+21001,443.0296
gfx936,int8_w8a8_channel,torch.float16,1024,128,3072,256,8,0,0,asm,11005+21001,475.6358
gfx936,int8_w8a8_channel,torch.float16,1280,128,3072,256,8,0,0,asm,12005+22001,515.2147
gfx936,int8_w8a8_channel,torch.float16,1536,128,3072,256,8,0,0,asm,12005+22001,567.0547
gfx936,int8_w8a8_channel,torch.float16,2048,128,3072,256,8,0,0,asm,12005+22001,659.6858
gfx936,int8_w8a8_channel,torch.float16,2304,128,3072,256,8,0,0,asm,12001+21102,742.3382
gfx936,int8_w8a8_channel,torch.float16,2560,128,3072,256,8,0,0,asm,12001+21102,780.6539
gfx936,int8_w8a8_channel,torch.float16,3072,128,3072,256,8,0,0,asm,13001+23001,824.0141
gfx936,int8_w8a8_channel,torch.float16,3584,128,3072,256,8,0,0,asm,13001+23001,908.1319
gfx936,int8_w8a8_channel,torch.float16,4096,128,3072,256,8,0,0,asm,12001+22001,1038.8349
gfx936,int8_w8a8_channel,torch.float16,5120,128,3072,256,8,0,0,asm,12001+22001,1267.7605
gfx936,int8_w8a8_channel,torch.float16,6144,128,3072,256,8,0,0,asm,13001+23001,1429.2759
gfx936,int8_w8a8_channel,torch.float16,7168,128,3072,256,8,0,0,asm,13001+23001,1555.8024
gfx936,int8_w8a8_channel,torch.float16,8192,128,3072,256,8,0,0,asm,13001+23001,1789.4696
gfx936,int8_w8a8_channel,torch.float16,10240,128,3072,256,8,0,0,asm,13001+23001,2165.9155
gfx936,int8_w8a8_channel,torch.float16,12288,128,3072,256,8,0,0,asm,13001+23001,2530.2763
gfx936,int8_w8a8_channel,torch.float16,16384,128,3072,256,8,0,0,asm,13001+23001,3264.3642
gfx936,int8_w8a8_channel,torch.float16,24576,128,3072,256,8,0,0,asm,13001+23001,4759.7737
gfx936,int8_w8a8_channel,torch.float16,32768,128,3072,256,8,0,0,asm,13001+23001,6279.1322
arch,quant_type,indtype,token,inter_dim,model_dim,expert,topk,q_size_n,q_size_k,sol_type,sol_id,time_us
gfx936,int8_w8a8_channel,torch.float16,1,128,7168,256,8,0,0,asm,10003+20100,60.7153
gfx936,int8_w8a8_channel,torch.float16,2,128,7168,256,8,0,0,asm,10002+20102,77.9869
gfx936,int8_w8a8_channel,torch.float16,3,128,7168,256,8,0,0,asm,10009+20102,92.7455
gfx936,int8_w8a8_channel,torch.float16,4,128,7168,256,8,0,0,asm,10010+20102,110.4505
gfx936,int8_w8a8_channel,torch.float16,5,128,7168,256,8,0,0,asm,10006+20102,133.0372
gfx936,int8_w8a8_channel,torch.float16,6,128,7168,256,8,0,0,asm,10005+20102,155.6895
gfx936,int8_w8a8_channel,torch.float16,7,128,7168,256,8,0,0,asm,10001+20102,165.0761
gfx936,int8_w8a8_channel,torch.float16,8,128,7168,256,8,0,0,asm,10005+20102,175.591
gfx936,int8_w8a8_channel,torch.float16,9,128,7168,256,8,0,0,asm,10001+20102,188.4515
gfx936,int8_w8a8_channel,torch.float16,10,128,7168,256,8,0,0,asm,10001+20102,202.0567
gfx936,int8_w8a8_channel,torch.float16,11,128,7168,256,8,0,0,asm,10001+20102,216.0628
gfx936,int8_w8a8_channel,torch.float16,12,128,7168,256,8,0,0,asm,10001+20102,227.7442
gfx936,int8_w8a8_channel,torch.float16,13,128,7168,256,8,0,0,asm,10001+20102,241.5275
gfx936,int8_w8a8_channel,torch.float16,14,128,7168,256,8,0,0,asm,10004+20102,254.7253
gfx936,int8_w8a8_channel,torch.float16,15,128,7168,256,8,0,0,asm,10005+20102,261.3183
gfx936,int8_w8a8_channel,torch.float16,16,128,7168,256,8,0,0,asm,10001+20102,266.8521
gfx936,int8_w8a8_channel,torch.float16,17,128,7168,256,8,0,0,asm,10001+20102,268.9418
gfx936,int8_w8a8_channel,torch.float16,18,128,7168,256,8,0,0,asm,10001+20102,279.5306
gfx936,int8_w8a8_channel,torch.float16,20,128,7168,256,8,0,0,asm,10001+20102,304.5974
gfx936,int8_w8a8_channel,torch.float16,24,128,7168,256,8,0,0,asm,10001+20102,347.4364
gfx936,int8_w8a8_channel,torch.float16,28,128,7168,256,8,0,0,asm,10001+20102,394.1512
gfx936,int8_w8a8_channel,torch.float16,32,128,7168,256,8,0,0,asm,10001+20001,420.4774
gfx936,int8_w8a8_channel,torch.float16,34,128,7168,256,8,0,0,asm,10004+20001,423.2036
gfx936,int8_w8a8_channel,torch.float16,36,128,7168,256,8,0,0,asm,10001+20001,436.3232
gfx936,int8_w8a8_channel,torch.float16,40,128,7168,256,8,0,0,asm,10001+20102,452.7313
gfx936,int8_w8a8_channel,torch.float16,44,128,7168,256,8,0,0,asm,10000+20001,472.2898
gfx936,int8_w8a8_channel,torch.float16,48,128,7168,256,8,0,0,asm,10000+20001,484.0682
gfx936,int8_w8a8_channel,torch.float16,56,128,7168,256,8,0,0,asm,10001+20001,510.1813
gfx936,int8_w8a8_channel,torch.float16,64,128,7168,256,8,0,0,asm,10001+20001,530.0211
gfx936,int8_w8a8_channel,torch.float16,68,128,7168,256,8,0,0,asm,10000+20001,534.858
gfx936,int8_w8a8_channel,torch.float16,72,128,7168,256,8,0,0,asm,10000+20001,547.338
gfx936,int8_w8a8_channel,torch.float16,80,128,7168,256,8,0,0,asm,10000+20001,563.2076
gfx936,int8_w8a8_channel,torch.float16,88,128,7168,256,8,0,0,asm,10000+20001,582.2851
gfx936,int8_w8a8_channel,torch.float16,96,128,7168,256,8,0,0,asm,10000+20001,587.5819
gfx936,int8_w8a8_channel,torch.float16,104,128,7168,256,8,0,0,asm,10000+20001,593.8242
gfx936,int8_w8a8_channel,torch.float16,112,128,7168,256,8,0,0,asm,10001+20001,603.3377
gfx936,int8_w8a8_channel,torch.float16,128,128,7168,256,8,0,0,asm,10000+20001,617.634
gfx936,int8_w8a8_channel,torch.float16,144,128,7168,256,8,0,0,asm,10000+20001,630.7514
gfx936,int8_w8a8_channel,torch.float16,160,128,7168,256,8,0,0,asm,10000+20001,639.4196
gfx936,int8_w8a8_channel,torch.float16,192,128,7168,256,8,0,0,asm,10000+20001,654.4355
gfx936,int8_w8a8_channel,torch.float16,224,128,7168,256,8,0,0,asm,10000+20001,668.7697
gfx936,int8_w8a8_channel,torch.float16,256,128,7168,256,8,0,0,asm,10000+20001,679.4586
gfx936,int8_w8a8_channel,torch.float16,320,128,7168,256,8,0,0,asm,10001+20001,712.4597
gfx936,int8_w8a8_channel,torch.float16,384,128,7168,256,8,0,0,asm,10002+20001,737.9884
gfx936,int8_w8a8_channel,torch.float16,448,128,7168,256,8,0,0,asm,10002+20102,773.0358
gfx936,int8_w8a8_channel,torch.float16,512,128,7168,256,8,0,0,asm,10006+20102,791.3841
gfx936,int8_w8a8_channel,torch.float16,576,128,7168,256,8,0,0,asm,11000+21001,818.8247
gfx936,int8_w8a8_channel,torch.float16,640,128,7168,256,8,0,0,asm,11000+21001,836.441
gfx936,int8_w8a8_channel,torch.float16,704,128,7168,256,8,0,0,asm,11000+21001,862.0874
gfx936,int8_w8a8_channel,torch.float16,768,128,7168,256,8,0,0,asm,11006+21001,885.7409
gfx936,int8_w8a8_channel,torch.float16,832,128,7168,256,8,0,0,asm,11006+21001,914.526
gfx936,int8_w8a8_channel,torch.float16,896,128,7168,256,8,0,0,asm,11006+21001,933.0011
gfx936,int8_w8a8_channel,torch.float16,960,128,7168,256,8,0,0,asm,11006+21001,952.168
gfx936,int8_w8a8_channel,torch.float16,1024,128,7168,256,8,0,0,asm,11006+21001,976.3539
gfx936,int8_w8a8_channel,torch.float16,1152,128,7168,256,8,0,0,asm,11007+21001,1038.3866
gfx936,int8_w8a8_channel,torch.float16,1280,128,7168,256,8,0,0,asm,12004+22001,1072.8371
gfx936,int8_w8a8_channel,torch.float16,1408,128,7168,256,8,0,0,asm,12004+22001,1114.2061
gfx936,int8_w8a8_channel,torch.float16,1536,128,7168,256,8,0,0,asm,12004+22001,1147.3019
gfx936,int8_w8a8_channel,torch.float16,1664,128,7168,256,8,0,0,asm,12004+22001,1188.4794
gfx936,int8_w8a8_channel,torch.float16,1792,128,7168,256,8,0,0,asm,11007+21001,1272.1697
gfx936,int8_w8a8_channel,torch.float16,1920,128,7168,256,8,0,0,asm,12004+22001,1314.1846
gfx936,int8_w8a8_channel,torch.float16,2048,128,7168,256,8,0,0,asm,12004+22001,1393.276
gfx936,int8_w8a8_channel,torch.float16,2304,128,7168,256,8,0,0,asm,12005+22001,1509.9256
gfx936,int8_w8a8_channel,torch.float16,2560,128,7168,256,8,0,0,asm,12005+22001,1624.4163
gfx936,int8_w8a8_channel,torch.float16,2816,128,7168,256,8,0,0,asm,12005+22001,1691.4089
gfx936,int8_w8a8_channel,torch.float16,3072,128,7168,256,8,0,0,asm,13000+23001,1756.3363
gfx936,int8_w8a8_channel,torch.float16,3328,128,7168,256,8,0,0,asm,13000+23001,1796.1869
gfx936,int8_w8a8_channel,torch.float16,3584,128,7168,256,8,0,0,asm,12005+22001,1918.564
gfx936,int8_w8a8_channel,torch.float16,3840,128,7168,256,8,0,0,asm,12005+22001,2043.4429
gfx936,int8_w8a8_channel,torch.float16,4096,128,7168,256,8,0,0,asm,12005+22001,2154.6243
gfx936,int8_w8a8_channel,torch.float16,4608,128,7168,256,8,0,0,asm,12005+22001,2425.8021
gfx936,int8_w8a8_channel,torch.float16,5120,128,7168,256,8,0,0,asm,12001+22001,2591.2525
gfx936,int8_w8a8_channel,torch.float16,5632,128,7168,256,8,0,0,asm,12005+22001,2774.3757
gfx936,int8_w8a8_channel,torch.float16,6144,128,7168,256,8,0,0,asm,13001+23001,3007.5207
gfx936,int8_w8a8_channel,torch.float16,6656,128,7168,256,8,0,0,asm,13001+23001,3109.7569
gfx936,int8_w8a8_channel,torch.float16,7168,128,7168,256,8,0,0,asm,13001+23001,3259.6305
gfx936,int8_w8a8_channel,torch.float16,7680,128,7168,256,8,0,0,asm,13001+23001,3473.4205
gfx936,int8_w8a8_channel,torch.float16,8192,128,7168,256,8,0,0,asm,13001+23001,3792.1285
gfx936,int8_w8a8_channel,torch.float16,10240,128,7168,256,8,0,0,asm,13001+23001,4587.977
gfx936,int8_w8a8_channel,torch.float16,12288,128,7168,256,8,0,0,asm,13001+23001,5386.7393
gfx936,int8_w8a8_channel,torch.float16,14336,128,7168,256,8,0,0,asm,13001+23001,6132.057
gfx936,int8_w8a8_channel,torch.float16,16384,128,7168,256,8,0,0,asm,13001+23001,6980.8374
gfx936,int8_w8a8_channel,torch.float16,17408,128,7168,256,8,0,0,asm,13001+23001,7425.3098
gfx936,int8_w8a8_channel,torch.float16,24576,128,7168,256,8,0,0,asm,13001+23001,10095.1451
gfx936,int8_w8a8_channel,torch.float16,32768,128,7168,256,8,0,0,asm,13001+23001,13283.6878
gfx936,int8_w8a8_channel,torch.float16,40960,128,7168,256,8,0,0,asm,13001+23101,15384.0472
gfx936,int8_w8a8_channel,torch.float16,49152,128,7168,256,8,0,0,asm,13001+23101,19007.0848
gfx936,int8_w8a8_channel,torch.float16,57344,128,7168,256,8,0,0,asm,13001+23001,22780.6062
gfx936,int8_w8a8_channel,torch.float16,1,256,7168,256,8,0,0,asm,10002+20001,75.0987
gfx936,int8_w8a8_channel,torch.float16,2,256,7168,256,8,0,0,asm,10010+20001,112.2721
gfx936,int8_w8a8_channel,torch.float16,3,256,7168,256,8,0,0,asm,10007+20001,152.3008
gfx936,int8_w8a8_channel,torch.float16,4,256,7168,256,8,0,0,asm,10004+20001,192.0999
gfx936,int8_w8a8_channel,torch.float16,5,256,7168,256,8,0,0,asm,10001+20001,217.7121
gfx936,int8_w8a8_channel,torch.float16,6,256,7168,256,8,0,0,asm,10004+20001,245.6376
gfx936,int8_w8a8_channel,torch.float16,7,256,7168,256,8,0,0,asm,10001+20001,273.5973
gfx936,int8_w8a8_channel,torch.float16,8,256,7168,256,8,0,0,asm,10001+20001,294.147
gfx936,int8_w8a8_channel,torch.float16,9,256,7168,256,8,0,0,asm,10005+20001,320.9195
gfx936,int8_w8a8_channel,torch.float16,10,256,7168,256,8,0,0,asm,10001+20001,344.6414
gfx936,int8_w8a8_channel,torch.float16,11,256,7168,256,8,0,0,asm,10001+20001,367.9973
gfx936,int8_w8a8_channel,torch.float16,12,256,7168,256,8,0,0,asm,10001+20001,384.5183
gfx936,int8_w8a8_channel,torch.float16,13,256,7168,256,8,0,0,asm,10001+20001,404.5027
gfx936,int8_w8a8_channel,torch.float16,14,256,7168,256,8,0,0,asm,10001+20001,432.7809
gfx936,int8_w8a8_channel,torch.float16,15,256,7168,256,8,0,0,asm,10001+20001,449.9427
gfx936,int8_w8a8_channel,torch.float16,16,256,7168,256,8,0,0,asm,10001+20001,461.8845
gfx936,int8_w8a8_channel,torch.float16,17,256,7168,256,8,0,0,asm,10001+20001,474.664
gfx936,int8_w8a8_channel,torch.float16,18,256,7168,256,8,0,0,asm,10001+20001,494.5292
gfx936,int8_w8a8_channel,torch.float16,20,256,7168,256,8,0,0,asm,10001+20001,535.7401
gfx936,int8_w8a8_channel,torch.float16,24,256,7168,256,8,0,0,asm,10001+20001,613.1227
gfx936,int8_w8a8_channel,torch.float16,28,256,7168,256,8,0,0,asm,10001+20001,697.9555
gfx936,int8_w8a8_channel,torch.float16,32,256,7168,256,8,0,0,asm,10001+20001,745.6344
gfx936,int8_w8a8_channel,torch.float16,34,256,7168,256,8,0,0,asm,10000+20001,756.038
gfx936,int8_w8a8_channel,torch.float16,36,256,7168,256,8,0,0,asm,10001+20001,784.6725
gfx936,int8_w8a8_channel,torch.float16,40,256,7168,256,8,0,0,asm,10000+20001,815.961
gfx936,int8_w8a8_channel,torch.float16,44,256,7168,256,8,0,0,asm,10000+20001,853.4527
gfx936,int8_w8a8_channel,torch.float16,48,256,7168,256,8,0,0,asm,10000+20001,874.2259
gfx936,int8_w8a8_channel,torch.float16,56,256,7168,256,8,0,0,asm,10000+20001,920.5861
gfx936,int8_w8a8_channel,torch.float16,64,256,7168,256,8,0,0,asm,10000+20001,957.2705
gfx936,int8_w8a8_channel,torch.float16,68,256,7168,256,8,0,0,asm,10000+20001,966.4684
gfx936,int8_w8a8_channel,torch.float16,72,256,7168,256,8,0,0,asm,10000+20001,993.4945
gfx936,int8_w8a8_channel,torch.float16,80,256,7168,256,8,0,0,asm,10000+20001,1024.3243
gfx936,int8_w8a8_channel,torch.float16,88,256,7168,256,8,0,0,asm,10000+20001,1060.0685
gfx936,int8_w8a8_channel,torch.float16,96,256,7168,256,8,0,0,asm,10000+20001,1075.8352
gfx936,int8_w8a8_channel,torch.float16,104,256,7168,256,8,0,0,asm,10000+20001,1088.9588
gfx936,int8_w8a8_channel,torch.float16,112,256,7168,256,8,0,0,asm,10000+20001,1100.0135
gfx936,int8_w8a8_channel,torch.float16,128,256,7168,256,8,0,0,asm,10000+20001,1124.4242
gfx936,int8_w8a8_channel,torch.float16,144,256,7168,256,8,0,0,asm,12004+22001,1140.4953
gfx936,int8_w8a8_channel,torch.float16,160,256,7168,256,8,0,0,asm,12004+22001,1153.8942
gfx936,int8_w8a8_channel,torch.float16,192,256,7168,256,8,0,0,asm,12004+22001,1170.6655
gfx936,int8_w8a8_channel,torch.float16,224,256,7168,256,8,0,0,asm,12004+22001,1176.2023
gfx936,int8_w8a8_channel,torch.float16,256,256,7168,256,8,0,0,asm,12004+22001,1188.1461
gfx936,int8_w8a8_channel,torch.float16,320,256,7168,256,8,0,0,asm,12004+22001,1215.3141
gfx936,int8_w8a8_channel,torch.float16,384,256,7168,256,8,0,0,asm,12004+22001,1230.5589
gfx936,int8_w8a8_channel,torch.float16,448,256,7168,256,8,0,0,asm,12004+22001,1253.6801
gfx936,int8_w8a8_channel,torch.float16,512,256,7168,256,8,0,0,asm,12004+22001,1274.6525
gfx936,int8_w8a8_channel,torch.float16,576,256,7168,256,8,0,0,asm,12004+22001,1303.6342
gfx936,int8_w8a8_channel,torch.float16,640,256,7168,256,8,0,0,asm,12004+22001,1324.7529
gfx936,int8_w8a8_channel,torch.float16,704,256,7168,256,8,0,0,asm,12004+22001,1346.4485
gfx936,int8_w8a8_channel,torch.float16,768,256,7168,256,8,0,0,asm,12004+22001,1371.3286
gfx936,int8_w8a8_channel,torch.float16,832,256,7168,256,8,0,0,asm,12004+22001,1381.5703
gfx936,int8_w8a8_channel,torch.float16,896,256,7168,256,8,0,0,asm,12004+22001,1413.5563
gfx936,int8_w8a8_channel,torch.float16,960,256,7168,256,8,0,0,asm,12004+22001,1426.0749
gfx936,int8_w8a8_channel,torch.float16,1024,256,7168,256,8,0,0,asm,12004+22001,1459.5109
gfx936,int8_w8a8_channel,torch.float16,1152,256,7168,256,8,0,0,asm,12004+22001,1489.2666
gfx936,int8_w8a8_channel,torch.float16,1280,256,7168,256,8,0,0,asm,12004+22001,1551.0266
gfx936,int8_w8a8_channel,torch.float16,1408,256,7168,256,8,0,0,asm,12004+22001,1581.6204
gfx936,int8_w8a8_channel,torch.float16,1536,256,7168,256,8,0,0,asm,12004+22001,1624.9426
gfx936,int8_w8a8_channel,torch.float16,1664,256,7168,256,8,0,0,asm,12004+22001,1673.3162
gfx936,int8_w8a8_channel,torch.float16,1792,256,7168,256,8,0,0,asm,12004+22001,1750.1469
gfx936,int8_w8a8_channel,torch.float16,1920,256,7168,256,8,0,0,asm,12004+22001,1815.5911
gfx936,int8_w8a8_channel,torch.float16,2048,256,7168,256,8,0,0,asm,12004+22001,1913.0902
gfx936,int8_w8a8_channel,torch.float16,2304,256,7168,256,8,0,0,asm,12005+22001,2068.4439
gfx936,int8_w8a8_channel,torch.float16,2560,256,7168,256,8,0,0,asm,12005+22001,2179.9266
gfx936,int8_w8a8_channel,torch.float16,2816,256,7168,256,8,0,0,asm,12005+22001,2261.0226
gfx936,int8_w8a8_channel,torch.float16,3072,256,7168,256,8,0,0,asm,12005+22001,2341.2846
gfx936,int8_w8a8_channel,torch.float16,3328,256,7168,256,8,0,0,asm,12005+22001,2433.3414
gfx936,int8_w8a8_channel,torch.float16,3584,256,7168,256,8,0,0,asm,12005+22001,2551.62
gfx936,int8_w8a8_channel,torch.float16,3840,256,7168,256,8,0,0,asm,12005+22001,2685.2969
gfx936,int8_w8a8_channel,torch.float16,4096,256,7168,256,8,0,0,asm,12005+22001,2888.1218
gfx936,int8_w8a8_channel,torch.float16,4608,256,7168,256,8,0,0,asm,12005+22001,3288.5242
gfx936,int8_w8a8_channel,torch.float16,5120,256,7168,256,8,0,0,asm,12001+22001,3496.5502
gfx936,int8_w8a8_channel,torch.float16,5632,256,7168,256,8,0,0,asm,12005+22001,3709.4328
gfx936,int8_w8a8_channel,torch.float16,6144,256,7168,256,8,0,0,asm,13001+23001,3861.1458
gfx936,int8_w8a8_channel,torch.float16,6656,256,7168,256,8,0,0,asm,13001+23001,3971.802
gfx936,int8_w8a8_channel,torch.float16,7168,256,7168,256,8,0,0,asm,13001+23001,4122.667
gfx936,int8_w8a8_channel,torch.float16,7680,256,7168,256,8,0,0,asm,13001+23001,4365.1053
gfx936,int8_w8a8_channel,torch.float16,8192,256,7168,256,8,0,0,asm,13001+23001,4820.6556
gfx936,int8_w8a8_channel,torch.float16,10240,256,7168,256,8,0,0,asm,13001+23001,5935.9992
gfx936,int8_w8a8_channel,torch.float16,12288,256,7168,256,8,0,0,asm,13001+23001,6847.5073
gfx936,int8_w8a8_channel,torch.float16,14336,256,7168,256,8,0,0,asm,13001+23001,7958.7381
gfx936,int8_w8a8_channel,torch.float16,16384,256,7168,256,8,0,0,asm,13001+23001,8817.8405
gfx936,int8_w8a8_channel,torch.float16,17408,256,7168,256,8,0,0,asm,13001+23001,9465.1795
gfx936,int8_w8a8_channel,torch.float16,24576,256,7168,256,8,0,0,asm,13001+23001,12940.1163
gfx936,int8_w8a8_channel,torch.float16,32768,256,7168,256,8,0,0,asm,13001+23001,17049.7543
gfx936,int8_w8a8_channel,torch.float16,40960,256,7168,256,8,0,0,asm,13001+23001,21102.088
gfx936,int8_w8a8_channel,torch.float16,49152,256,7168,256,8,0,0,asm,13001+23001,25129.0387
gfx938,int8_w8a8_channel,torch.float16,1,128,7168,256,8,0,0,asm,10000+20101,61.5548
gfx938,int8_w8a8_channel,torch.float16,2,128,7168,256,8,0,0,asm,10006+20102,76.2512
gfx938,int8_w8a8_channel,torch.float16,3,128,7168,256,8,0,0,asm,10008+20102,83.7998
gfx938,int8_w8a8_channel,torch.float16,4,128,7168,256,8,0,0,asm,10008+20102,102.0971
gfx938,int8_w8a8_channel,torch.float16,5,128,7168,256,8,0,0,asm,10011+20102,125.0755
gfx938,int8_w8a8_channel,torch.float16,6,128,7168,256,8,0,0,asm,10011+20102,130.7657
gfx938,int8_w8a8_channel,torch.float16,7,128,7168,256,8,0,0,asm,10011+20102,138.7698
gfx938,int8_w8a8_channel,torch.float16,8,128,7168,256,8,0,0,asm,10011+20102,143.9185
gfx938,int8_w8a8_channel,torch.float16,9,128,7168,256,8,0,0,asm,10008+20102,156.7554
gfx938,int8_w8a8_channel,torch.float16,10,128,7168,256,8,0,0,asm,10008+20102,169.7235
gfx938,int8_w8a8_channel,torch.float16,11,128,7168,256,8,0,0,asm,10007+20102,196.9235
gfx938,int8_w8a8_channel,torch.float16,12,128,7168,256,8,0,0,asm,10006+20102,197.9408
gfx938,int8_w8a8_channel,torch.float16,13,128,7168,256,8,0,0,asm,10006+20102,202.0065
gfx938,int8_w8a8_channel,torch.float16,14,128,7168,256,8,0,0,asm,10008+20102,207.7829
gfx938,int8_w8a8_channel,torch.float16,15,128,7168,256,8,0,0,asm,10008+20102,211.6187
gfx938,int8_w8a8_channel,torch.float16,16,128,7168,256,8,0,0,asm,10008+20102,215.549
gfx938,int8_w8a8_channel,torch.float16,17,128,7168,256,8,0,0,asm,10008+20102,216.2229
gfx938,int8_w8a8_channel,torch.float16,18,128,7168,256,8,0,0,asm,10008+20102,225.1172
gfx938,int8_w8a8_channel,torch.float16,20,128,7168,256,8,0,0,asm,10007+20102,252.6248
gfx938,int8_w8a8_channel,torch.float16,24,128,7168,256,8,0,0,asm,10009+20102,270.0401
gfx938,int8_w8a8_channel,torch.float16,28,128,7168,256,8,0,0,asm,10006+20102,322.4983
gfx938,int8_w8a8_channel,torch.float16,32,128,7168,256,8,0,0,asm,10009+20102,333.6121
gfx938,int8_w8a8_channel,torch.float16,34,128,7168,256,8,0,0,asm,10008+20102,326.2245
gfx938,int8_w8a8_channel,torch.float16,36,128,7168,256,8,0,0,asm,10008+20102,336.0665
gfx938,int8_w8a8_channel,torch.float16,40,128,7168,256,8,0,0,asm,10006+20102,360.2305
gfx938,int8_w8a8_channel,torch.float16,44,128,7168,256,8,0,0,asm,10006+20102,370.0438
gfx938,int8_w8a8_channel,torch.float16,48,128,7168,256,8,0,0,asm,10008+20102,376.5956
gfx938,int8_w8a8_channel,torch.float16,56,128,7168,256,8,0,0,asm,10009+20102,390.4745
gfx938,int8_w8a8_channel,torch.float16,64,128,7168,256,8,0,0,asm,10006+20102,412.9934
gfx938,int8_w8a8_channel,torch.float16,68,128,7168,256,8,0,0,asm,10007+20102,438.704
gfx938,int8_w8a8_channel,torch.float16,72,128,7168,256,8,0,0,asm,10007+20102,444.9891
gfx938,int8_w8a8_channel,torch.float16,80,128,7168,256,8,0,0,asm,10006+20001,460.9659
gfx938,int8_w8a8_channel,torch.float16,88,128,7168,256,8,0,0,asm,10008+20102,447.6596
gfx938,int8_w8a8_channel,torch.float16,96,128,7168,256,8,0,0,asm,10008+20102,449.785
gfx938,int8_w8a8_channel,torch.float16,104,128,7168,256,8,0,0,asm,10008+20102,456.8659
gfx938,int8_w8a8_channel,torch.float16,112,128,7168,256,8,0,0,asm,10008+20102,459.0649
gfx938,int8_w8a8_channel,torch.float16,128,128,7168,256,8,0,0,asm,10009+20102,469.3418
gfx938,int8_w8a8_channel,torch.float16,144,128,7168,256,8,0,0,asm,10006+20102,487.4953
gfx938,int8_w8a8_channel,torch.float16,160,128,7168,256,8,0,0,asm,10007+20102,494.2935
gfx938,int8_w8a8_channel,torch.float16,192,128,7168,256,8,0,0,asm,10007+20102,503.7376
gfx938,int8_w8a8_channel,torch.float16,224,128,7168,256,8,0,0,asm,10006+20102,507.8321
gfx938,int8_w8a8_channel,torch.float16,256,128,7168,256,8,0,0,asm,10008+20102,520.7877
gfx938,int8_w8a8_channel,torch.float16,320,128,7168,256,8,0,0,asm,10008+20102,539.2761
gfx938,int8_w8a8_channel,torch.float16,384,128,7168,256,8,0,0,asm,10008+20102,544.8087
gfx938,int8_w8a8_channel,torch.float16,448,128,7168,256,8,0,0,asm,10009+20102,573.4907
gfx938,int8_w8a8_channel,torch.float16,512,128,7168,256,8,0,0,asm,10011+20102,596.1433
gfx938,int8_w8a8_channel,torch.float16,576,128,7168,256,8,0,0,asm,11005+21102,656.0282
gfx938,int8_w8a8_channel,torch.float16,640,128,7168,256,8,0,0,asm,11007+21102,635.9422
gfx938,int8_w8a8_channel,torch.float16,704,128,7168,256,8,0,0,asm,11007+21102,645.1769
gfx938,int8_w8a8_channel,torch.float16,768,128,7168,256,8,0,0,asm,11007+21102,657.2918
gfx938,int8_w8a8_channel,torch.float16,832,128,7168,256,8,0,0,asm,11007+21102,672.0241
gfx938,int8_w8a8_channel,torch.float16,896,128,7168,256,8,0,0,asm,11002+21102,704.436
gfx938,int8_w8a8_channel,torch.float16,960,128,7168,256,8,0,0,asm,11007+21102,732.9018
gfx938,int8_w8a8_channel,torch.float16,1024,128,7168,256,8,0,0,asm,11007+21102,771.3553
gfx938,int8_w8a8_channel,torch.float16,1152,128,7168,256,8,0,0,asm,11007+21102,876.3761
gfx938,int8_w8a8_channel,torch.float16,1280,128,7168,256,8,0,0,asm,11005+21102,874.5662
gfx938,int8_w8a8_channel,torch.float16,1408,128,7168,256,8,0,0,asm,11007+21102,920.0681
gfx938,int8_w8a8_channel,torch.float16,1536,128,7168,256,8,0,0,asm,11005+21102,1005.6719
gfx938,int8_w8a8_channel,torch.float16,1664,128,7168,256,8,0,0,asm,11003+21102,1021.9835
gfx938,int8_w8a8_channel,torch.float16,1792,128,7168,256,8,0,0,asm,11005+21102,1059.247
gfx938,int8_w8a8_channel,torch.float16,1920,128,7168,256,8,0,0,asm,11005+21102,1114.7504
gfx938,int8_w8a8_channel,torch.float16,2048,128,7168,256,8,0,0,asm,11005+21102,1168.9655
gfx938,int8_w8a8_channel,torch.float16,2304,128,7168,256,8,0,0,asm,11003+21102,1312.8102
gfx938,int8_w8a8_channel,torch.float16,2560,128,7168,256,8,0,0,asm,11005+21102,1403.0569
gfx938,int8_w8a8_channel,torch.float16,2816,128,7168,256,8,0,0,asm,11005+21102,1498.835
gfx938,int8_w8a8_channel,torch.float16,3072,128,7168,256,8,0,0,asm,11003+21102,1613.8125
gfx938,int8_w8a8_channel,torch.float16,3328,128,7168,256,8,0,0,asm,13001+23001,1700.2946
gfx938,int8_w8a8_channel,torch.float16,3584,128,7168,256,8,0,0,asm,13001+23001,1783.0265
gfx938,int8_w8a8_channel,torch.float16,3840,128,7168,256,8,0,0,asm,12005+22101,1873.9472
gfx938,int8_w8a8_channel,torch.float16,4096,128,7168,256,8,0,0,asm,12005+22101,2008.9948
gfx938,int8_w8a8_channel,torch.float16,4608,128,7168,256,8,0,0,asm,11005+21102,2286.6552
gfx938,int8_w8a8_channel,torch.float16,5120,128,7168,256,8,0,0,asm,12005+22101,2463.2891
gfx938,int8_w8a8_channel,torch.float16,5632,128,7168,256,8,0,0,asm,12005+22101,2637.5543
gfx938,int8_w8a8_channel,torch.float16,6144,128,7168,256,8,0,0,asm,12005+22101,2873.6969
gfx938,int8_w8a8_channel,torch.float16,6656,128,7168,256,8,0,0,asm,13001+23100,3049.9628
gfx938,int8_w8a8_channel,torch.float16,7168,128,7168,256,8,0,0,asm,13001+23101,3153.4823
gfx938,int8_w8a8_channel,torch.float16,7680,128,7168,256,8,0,0,asm,13001+23101,3301.7073
gfx938,int8_w8a8_channel,torch.float16,8192,128,7168,256,8,0,0,asm,13001+23101,3585.6404
gfx938,int8_w8a8_channel,torch.float16,10240,128,7168,256,8,0,0,asm,13001+23101,4373.7192
gfx938,int8_w8a8_channel,torch.float16,12288,128,7168,256,8,0,0,asm,13001+23101,5123.7714
gfx938,int8_w8a8_channel,torch.float16,14336,128,7168,256,8,0,0,asm,13001+23101,5923.3454
gfx938,int8_w8a8_channel,torch.float16,16384,128,7168,256,8,0,0,asm,13001+23101,6549.2382
gfx938,int8_w8a8_channel,torch.float16,17408,128,7168,256,8,0,0,asm,13001+23101,7048.0915
gfx938,int8_w8a8_channel,torch.float16,24576,128,7168,256,8,0,0,asm,13001+23101,9605.6151
gfx938,int8_w8a8_channel,torch.float16,32768,128,7168,256,8,0,0,asm,13001+23101,12610.251
gfx938,int8_w8a8_channel,torch.float16,40960,128,7168,256,8,0,0,asm,13001+23101,14891.5836
gfx938,int8_w8a8_channel,torch.float16,49152,128,7168,256,8,0,0,asm,13001+23101,17871.5385
gfx938,int8_w8a8_channel,torch.float16,57344,128,7168,256,8,0,0,asm,13001+23101,20962.4344
gfx938,int8_w8a8_channel,torch.float16,65536,128,7168,256,8,0,0,asm,13001+23101,24165.9529
gfx938,int8_w8a8_channel,torch.float16,1,256,7168,256,8,0,0,asm,10006+20001,68.5505
gfx938,int8_w8a8_channel,torch.float16,2,256,7168,256,8,0,0,asm,10008+20001,100.8147
gfx938,int8_w8a8_channel,torch.float16,3,256,7168,256,8,0,0,asm,10011+20001,133.5213
gfx938,int8_w8a8_channel,torch.float16,4,256,7168,256,8,0,0,asm,10011+20001,160.5774
gfx938,int8_w8a8_channel,torch.float16,5,256,7168,256,8,0,0,asm,10007+20001,190.2981
gfx938,int8_w8a8_channel,torch.float16,6,256,7168,256,8,0,0,asm,10008+20001,201.7628
gfx938,int8_w8a8_channel,torch.float16,7,256,7168,256,8,0,0,asm,10008+20001,221.2054
gfx938,int8_w8a8_channel,torch.float16,8,256,7168,256,8,0,0,asm,10011+20001,237.7383
gfx938,int8_w8a8_channel,torch.float16,9,256,7168,256,8,0,0,asm,10011+20001,256.8013
gfx938,int8_w8a8_channel,torch.float16,10,256,7168,256,8,0,0,asm,10008+20001,272.7689
gfx938,int8_w8a8_channel,torch.float16,11,256,7168,256,8,0,0,asm,10006+20001,300.0406
gfx938,int8_w8a8_channel,torch.float16,12,256,7168,256,8,0,0,asm,10008+20001,305.9437
gfx938,int8_w8a8_channel,torch.float16,13,256,7168,256,8,0,0,asm,10008+20001,316.1973
gfx938,int8_w8a8_channel,torch.float16,14,256,7168,256,8,0,0,asm,10011+20001,339.9413
gfx938,int8_w8a8_channel,torch.float16,15,256,7168,256,8,0,0,asm,10011+20001,351.3606
gfx938,int8_w8a8_channel,torch.float16,16,256,7168,256,8,0,0,asm,10011+20001,357.4739
gfx938,int8_w8a8_channel,torch.float16,17,256,7168,256,8,0,0,asm,10008+20001,361.1618
gfx938,int8_w8a8_channel,torch.float16,18,256,7168,256,8,0,0,asm,10008+20001,374.265
gfx938,int8_w8a8_channel,torch.float16,20,256,7168,256,8,0,0,asm,10008+20001,401.4923
gfx938,int8_w8a8_channel,torch.float16,24,256,7168,256,8,0,0,asm,10008+20001,453.172
gfx938,int8_w8a8_channel,torch.float16,28,256,7168,256,8,0,0,asm,10006+20001,517.5313
gfx938,int8_w8a8_channel,torch.float16,32,256,7168,256,8,0,0,asm,10008+20001,544.9005
gfx938,int8_w8a8_channel,torch.float16,34,256,7168,256,8,0,0,asm,10008+20001,544.9203
gfx938,int8_w8a8_channel,torch.float16,36,256,7168,256,8,0,0,asm,10008+20001,560.8699
gfx938,int8_w8a8_channel,torch.float16,40,256,7168,256,8,0,0,asm,10006+20001,585.8207
gfx938,int8_w8a8_channel,torch.float16,44,256,7168,256,8,0,0,asm,10009+20001,609.8321
gfx938,int8_w8a8_channel,torch.float16,48,256,7168,256,8,0,0,asm,10008+20001,621.0491
gfx938,int8_w8a8_channel,torch.float16,56,256,7168,256,8,0,0,asm,10008+20001,655.6489
gfx938,int8_w8a8_channel,torch.float16,64,256,7168,256,8,0,0,asm,10008+20001,678.5654
gfx938,int8_w8a8_channel,torch.float16,68,256,7168,256,8,0,0,asm,10006+20001,704.5449
gfx938,int8_w8a8_channel,torch.float16,72,256,7168,256,8,0,0,asm,10006+20001,699.4441
gfx938,int8_w8a8_channel,torch.float16,80,256,7168,256,8,0,0,asm,10008+20001,720.0905
gfx938,int8_w8a8_channel,torch.float16,88,256,7168,256,8,0,0,asm,10006+20001,750.3095
gfx938,int8_w8a8_channel,torch.float16,96,256,7168,256,8,0,0,asm,10006+20001,754.8377
gfx938,int8_w8a8_channel,torch.float16,104,256,7168,256,8,0,0,asm,10008+20001,773.6645
gfx938,int8_w8a8_channel,torch.float16,112,256,7168,256,8,0,0,asm,10008+20001,774.8759
gfx938,int8_w8a8_channel,torch.float16,128,256,7168,256,8,0,0,asm,10008+20001,789.6589
gfx938,int8_w8a8_channel,torch.float16,144,256,7168,256,8,0,0,asm,10008+20001,797.6933
gfx938,int8_w8a8_channel,torch.float16,160,256,7168,256,8,0,0,asm,10008+20001,807.9442
gfx938,int8_w8a8_channel,torch.float16,192,256,7168,256,8,0,0,asm,10008+20001,820.3015
gfx938,int8_w8a8_channel,torch.float16,224,256,7168,256,8,0,0,asm,10008+20001,830.4963
gfx938,int8_w8a8_channel,torch.float16,256,256,7168,256,8,0,0,asm,10008+20001,845.8104
gfx938,int8_w8a8_channel,torch.float16,320,256,7168,256,8,0,0,asm,10009+20001,880.0833
gfx938,int8_w8a8_channel,torch.float16,384,256,7168,256,8,0,0,asm,10011+20001,907.5741
gfx938,int8_w8a8_channel,torch.float16,448,256,7168,256,8,0,0,asm,11004+21001,925.8605
gfx938,int8_w8a8_channel,torch.float16,512,256,7168,256,8,0,0,asm,11004+21001,949.4826
gfx938,int8_w8a8_channel,torch.float16,576,256,7168,256,8,0,0,asm,11004+21001,1004.8272
gfx938,int8_w8a8_channel,torch.float16,640,256,7168,256,8,0,0,asm,11004+21001,981.5911
gfx938,int8_w8a8_channel,torch.float16,704,256,7168,256,8,0,0,asm,11004+21001,1006.4282
gfx938,int8_w8a8_channel,torch.float16,768,256,7168,256,8,0,0,asm,11007+21001,1028.9819
gfx938,int8_w8a8_channel,torch.float16,832,256,7168,256,8,0,0,asm,11007+21001,1062.8699
gfx938,int8_w8a8_channel,torch.float16,896,256,7168,256,8,0,0,asm,11005+21001,1111.3783
gfx938,int8_w8a8_channel,torch.float16,960,256,7168,256,8,0,0,asm,11005+21001,1172.5677
gfx938,int8_w8a8_channel,torch.float16,1024,256,7168,256,8,0,0,asm,11005+21001,1198.2545
gfx938,int8_w8a8_channel,torch.float16,1152,256,7168,256,8,0,0,asm,12005+22001,1312.7485
gfx938,int8_w8a8_channel,torch.float16,1280,256,7168,256,8,0,0,asm,12003+22001,1305.7395
gfx938,int8_w8a8_channel,torch.float16,1408,256,7168,256,8,0,0,asm,12005+22001,1344.1193
gfx938,int8_w8a8_channel,torch.float16,1536,256,7168,256,8,0,0,asm,12000+22001,1382.4336
gfx938,int8_w8a8_channel,torch.float16,1664,256,7168,256,8,0,0,asm,12005+22001,1410.499
gfx938,int8_w8a8_channel,torch.float16,1792,256,7168,256,8,0,0,asm,12001+22001,1492.3818
gfx938,int8_w8a8_channel,torch.float16,1920,256,7168,256,8,0,0,asm,12005+22001,1537.2226
gfx938,int8_w8a8_channel,torch.float16,2048,256,7168,256,8,0,0,asm,12005+22001,1697.7758
gfx938,int8_w8a8_channel,torch.float16,2304,256,7168,256,8,0,0,asm,12005+22001,1956.1871
gfx938,int8_w8a8_channel,torch.float16,2560,256,7168,256,8,0,0,asm,13001+23001,2038.5128
gfx938,int8_w8a8_channel,torch.float16,2816,256,7168,256,8,0,0,asm,13001+23001,2095.8748
gfx938,int8_w8a8_channel,torch.float16,3072,256,7168,256,8,0,0,asm,13001+23001,2151.5135
gfx938,int8_w8a8_channel,torch.float16,3328,256,7168,256,8,0,0,asm,13001+23001,2219.1767
gfx938,int8_w8a8_channel,torch.float16,3584,256,7168,256,8,0,0,asm,13001+23001,2287.4431
gfx938,int8_w8a8_channel,torch.float16,3840,256,7168,256,8,0,0,asm,13001+23001,2475.5367
gfx938,int8_w8a8_channel,torch.float16,4096,256,7168,256,8,0,0,asm,12005+22001,2775.478
gfx938,int8_w8a8_channel,torch.float16,4608,256,7168,256,8,0,0,asm,12001+22001,3167.0785
gfx938,int8_w8a8_channel,torch.float16,5120,256,7168,256,8,0,0,asm,12005+22001,3359.1433
gfx938,int8_w8a8_channel,torch.float16,5632,256,7168,256,8,0,0,asm,12001+22001,3549.321
gfx938,int8_w8a8_channel,torch.float16,6144,256,7168,256,8,0,0,asm,13001+23001,3848.2614
gfx938,int8_w8a8_channel,torch.float16,6656,256,7168,256,8,0,0,asm,13001+23001,3960.4866
gfx938,int8_w8a8_channel,torch.float16,7168,256,7168,256,8,0,0,asm,13001+23001,4072.7199
gfx938,int8_w8a8_channel,torch.float16,7680,256,7168,256,8,0,0,asm,13001+23001,4313.7529
gfx938,int8_w8a8_channel,torch.float16,8192,256,7168,256,8,0,0,asm,13001+23001,4792.6391
gfx938,int8_w8a8_channel,torch.float16,10240,256,7168,256,8,0,0,asm,13001+23001,5855.5025
gfx938,int8_w8a8_channel,torch.float16,12288,256,7168,256,8,0,0,asm,13001+23001,6805.8167
gfx938,int8_w8a8_channel,torch.float16,14336,256,7168,256,8,0,0,asm,13001+23001,7873.4718
gfx938,int8_w8a8_channel,torch.float16,16384,256,7168,256,8,0,0,asm,13001+23001,8847.507
gfx938,int8_w8a8_channel,torch.float16,17408,256,7168,256,8,0,0,asm,13001+23001,9618.6136
gfx938,int8_w8a8_channel,torch.float16,24576,256,7168,256,8,0,0,asm,13001+23001,12937.4104
gfx938,int8_w8a8_channel,torch.float16,32768,256,7168,256,8,0,0,asm,13001+23001,16973.6735
gfx938,int8_w8a8_channel,torch.float16,40960,256,7168,256,8,0,0,asm,13001+23001,21009.7928
gfx938,int8_w8a8_channel,torch.float16,49152,256,7168,256,8,0,0,asm,13001+23001,24983.1394
gfx938,int8_w8a8_channel,torch.float16,57344,256,7168,256,8,0,0,asm,13001+23001,29099.3916
gfx938,int8_w8a8_channel,torch.float16,65536,256,7168,256,8,0,0,asm,13001+23001,33141.3321
gfx938,f8_w8a8_channel,torch.float16,1,128,7168,256,8,0,0,asm,10000+20101,63.2993
gfx938,f8_w8a8_channel,torch.float16,2,128,7168,256,8,0,0,asm,10002+20102,75.3779
gfx938,f8_w8a8_channel,torch.float16,3,128,7168,256,8,0,0,asm,10008+20102,83.7752
gfx938,f8_w8a8_channel,torch.float16,4,128,7168,256,8,0,0,asm,10002+20102,102.3926
gfx938,f8_w8a8_channel,torch.float16,5,128,7168,256,8,0,0,asm,10011+20102,124.0745
gfx938,f8_w8a8_channel,torch.float16,6,128,7168,256,8,0,0,asm,10011+20102,132.456
gfx938,f8_w8a8_channel,torch.float16,7,128,7168,256,8,0,0,asm,10011+20102,141.4159
gfx938,f8_w8a8_channel,torch.float16,8,128,7168,256,8,0,0,asm,10008+20102,145.7236
gfx938,f8_w8a8_channel,torch.float16,9,128,7168,256,8,0,0,asm,10008+20102,155.8406
gfx938,f8_w8a8_channel,torch.float16,10,128,7168,256,8,0,0,asm,10009+20102,169.2886
gfx938,f8_w8a8_channel,torch.float16,11,128,7168,256,8,0,0,asm,10006+20102,195.3932
gfx938,f8_w8a8_channel,torch.float16,12,128,7168,256,8,0,0,asm,10006+20102,197.5265
gfx938,f8_w8a8_channel,torch.float16,13,128,7168,256,8,0,0,asm,10006+20102,202.384
gfx938,f8_w8a8_channel,torch.float16,14,128,7168,256,8,0,0,asm,10009+20102,208.2793
gfx938,f8_w8a8_channel,torch.float16,15,128,7168,256,8,0,0,asm,10008+20102,211.4998
gfx938,f8_w8a8_channel,torch.float16,16,128,7168,256,8,0,0,asm,10008+20102,216.0495
gfx938,f8_w8a8_channel,torch.float16,17,128,7168,256,8,0,0,asm,10009+20102,217.7286
gfx938,f8_w8a8_channel,torch.float16,18,128,7168,256,8,0,0,asm,10008+20102,226.1962
gfx938,f8_w8a8_channel,torch.float16,20,128,7168,256,8,0,0,asm,10011+20102,250.2782
gfx938,f8_w8a8_channel,torch.float16,24,128,7168,256,8,0,0,asm,10008+20102,269.9047
gfx938,f8_w8a8_channel,torch.float16,28,128,7168,256,8,0,0,asm,10006+20102,324.0327
gfx938,f8_w8a8_channel,torch.float16,32,128,7168,256,8,0,0,asm,10008+20102,332.3731
gfx938,f8_w8a8_channel,torch.float16,34,128,7168,256,8,0,0,asm,10008+20102,323.6891
gfx938,f8_w8a8_channel,torch.float16,36,128,7168,256,8,0,0,asm,10008+20102,335.5496
gfx938,f8_w8a8_channel,torch.float16,40,128,7168,256,8,0,0,asm,10006+20102,360.0131
gfx938,f8_w8a8_channel,torch.float16,44,128,7168,256,8,0,0,asm,10006+20102,368.4807
gfx938,f8_w8a8_channel,torch.float16,48,128,7168,256,8,0,0,asm,10006+20102,373.211
gfx938,f8_w8a8_channel,torch.float16,56,128,7168,256,8,0,0,asm,10008+20102,387.0038
gfx938,f8_w8a8_channel,torch.float16,64,128,7168,256,8,0,0,asm,10006+20102,412.3411
gfx938,f8_w8a8_channel,torch.float16,68,128,7168,256,8,0,0,asm,10009+20102,427.3523
gfx938,f8_w8a8_channel,torch.float16,72,128,7168,256,8,0,0,asm,10007+20102,429.8217
gfx938,f8_w8a8_channel,torch.float16,80,128,7168,256,8,0,0,asm,10006+20102,436.6703
gfx938,f8_w8a8_channel,torch.float16,88,128,7168,256,8,0,0,asm,10009+20102,450.7544
gfx938,f8_w8a8_channel,torch.float16,96,128,7168,256,8,0,0,asm,10008+20102,448.3286
gfx938,f8_w8a8_channel,torch.float16,104,128,7168,256,8,0,0,asm,10008+20102,455.746
gfx938,f8_w8a8_channel,torch.float16,112,128,7168,256,8,0,0,asm,10008+20102,460.9111
gfx938,f8_w8a8_channel,torch.float16,128,128,7168,256,8,0,0,asm,10008+20102,473.5223
gfx938,f8_w8a8_channel,torch.float16,144,128,7168,256,8,0,0,asm,10006+20102,489.0501
gfx938,f8_w8a8_channel,torch.float16,160,128,7168,256,8,0,0,asm,10006+20102,494.0089
gfx938,f8_w8a8_channel,torch.float16,192,128,7168,256,8,0,0,asm,10007+20102,503.0324
gfx938,f8_w8a8_channel,torch.float16,224,128,7168,256,8,0,0,asm,10007+20102,509.8447
gfx938,f8_w8a8_channel,torch.float16,256,128,7168,256,8,0,0,asm,10006+20102,519.6637
gfx938,f8_w8a8_channel,torch.float16,320,128,7168,256,8,0,0,asm,10011+20102,541.1159
gfx938,f8_w8a8_channel,torch.float16,384,128,7168,256,8,0,0,asm,10008+20102,544.4964
gfx938,f8_w8a8_channel,torch.float16,448,128,7168,256,8,0,0,asm,10008+20102,571.483
gfx938,f8_w8a8_channel,torch.float16,512,128,7168,256,8,0,0,asm,10011+20102,594.417
gfx938,f8_w8a8_channel,torch.float16,576,128,7168,256,8,0,0,asm,11007+21102,655.6798
gfx938,f8_w8a8_channel,torch.float16,640,128,7168,256,8,0,0,asm,11007+21102,642.2806
gfx938,f8_w8a8_channel,torch.float16,704,128,7168,256,8,0,0,asm,11005+21102,654.5883
gfx938,f8_w8a8_channel,torch.float16,768,128,7168,256,8,0,0,asm,11007+21102,664.4925
gfx938,f8_w8a8_channel,torch.float16,832,128,7168,256,8,0,0,asm,11002+21102,675.4143
gfx938,f8_w8a8_channel,torch.float16,896,128,7168,256,8,0,0,asm,11007+21102,724.4094
gfx938,f8_w8a8_channel,torch.float16,960,128,7168,256,8,0,0,asm,11007+21102,733.8166
gfx938,f8_w8a8_channel,torch.float16,1024,128,7168,256,8,0,0,asm,11005+21102,792.8112
gfx938,f8_w8a8_channel,torch.float16,1152,128,7168,256,8,0,0,asm,11007+21102,889.0462
gfx938,f8_w8a8_channel,torch.float16,1280,128,7168,256,8,0,0,asm,11007+21102,898.7677
gfx938,f8_w8a8_channel,torch.float16,1408,128,7168,256,8,0,0,asm,11007+21102,928.2732
gfx938,f8_w8a8_channel,torch.float16,1536,128,7168,256,8,0,0,asm,12005+22001,989.7838
gfx938,f8_w8a8_channel,torch.float16,1664,128,7168,256,8,0,0,asm,11007+21102,1037.5527
gfx938,f8_w8a8_channel,torch.float16,1792,128,7168,256,8,0,0,asm,11005+21102,1076.8675
gfx938,f8_w8a8_channel,torch.float16,1920,128,7168,256,8,0,0,asm,11005+21102,1136.2149
gfx938,f8_w8a8_channel,torch.float16,2048,128,7168,256,8,0,0,asm,11005+21102,1185.9542
gfx938,f8_w8a8_channel,torch.float16,2304,128,7168,256,8,0,0,asm,11005+21102,1348.5463
gfx938,f8_w8a8_channel,torch.float16,2560,128,7168,256,8,0,0,asm,11005+21102,1420.4804
gfx938,f8_w8a8_channel,torch.float16,2816,128,7168,256,8,0,0,asm,11005+21102,1525.0421
gfx938,f8_w8a8_channel,torch.float16,3072,128,7168,256,8,0,0,asm,13001+23001,1643.3144
gfx938,f8_w8a8_channel,torch.float16,3328,128,7168,256,8,0,0,asm,13001+23001,1692.1798
gfx938,f8_w8a8_channel,torch.float16,3584,128,7168,256,8,0,0,asm,13001+23001,1774.5672
gfx938,f8_w8a8_channel,torch.float16,3840,128,7168,256,8,0,0,asm,12005+22101,1901.4262
gfx938,f8_w8a8_channel,torch.float16,4096,128,7168,256,8,0,0,asm,12005+22101,2048.3671
gfx938,f8_w8a8_channel,torch.float16,4608,128,7168,256,8,0,0,asm,11005+21102,2313.0716
gfx938,f8_w8a8_channel,torch.float16,5120,128,7168,256,8,0,0,asm,12001+22101,2501.2432
gfx938,f8_w8a8_channel,torch.float16,5632,128,7168,256,8,0,0,asm,12005+22001,2673.3164
gfx938,f8_w8a8_channel,torch.float16,6144,128,7168,256,8,0,0,asm,12005+22101,2910.5216
gfx938,f8_w8a8_channel,torch.float16,6656,128,7168,256,8,0,0,asm,13001+23001,3051.8871
gfx938,f8_w8a8_channel,torch.float16,7168,128,7168,256,8,0,0,asm,13001+23001,3169.9625
gfx938,f8_w8a8_channel,torch.float16,7680,128,7168,256,8,0,0,asm,13001+23001,3321.1865
gfx938,f8_w8a8_channel,torch.float16,8192,128,7168,256,8,0,0,asm,13001+23101,3639.3636
gfx938,f8_w8a8_channel,torch.float16,10240,128,7168,256,8,0,0,asm,13001+23101,4414.8517
gfx938,f8_w8a8_channel,torch.float16,12288,128,7168,256,8,0,0,asm,13001+23101,5191.0948
gfx938,f8_w8a8_channel,torch.float16,14336,128,7168,256,8,0,0,asm,13001+23100,6015.8587
gfx938,f8_w8a8_channel,torch.float16,16384,128,7168,256,8,0,0,asm,13001+23101,6643.1382
gfx938,f8_w8a8_channel,torch.float16,17408,128,7168,256,8,0,0,asm,13001+23101,7147.6777
gfx938,f8_w8a8_channel,torch.float16,24576,128,7168,256,8,0,0,asm,13001+23101,9742.9246
gfx938,f8_w8a8_channel,torch.float16,32768,128,7168,256,8,0,0,asm,13001+23101,12818.7074
gfx938,f8_w8a8_channel,torch.float16,40960,128,7168,256,8,0,0,asm,13001+23101,15088.9874
gfx938,f8_w8a8_channel,torch.float16,49152,128,7168,256,8,0,0,asm,13001+23101,18123.5682
gfx938,f8_w8a8_channel,torch.float16,57344,128,7168,256,8,0,0,asm,13001+23101,21277.0495
gfx938,f8_w8a8_channel,torch.float16,65536,128,7168,256,8,0,0,asm,13001+23101,24574.4229
gfx938,f8_w8a8_channel,torch.float16,1,256,7168,256,8,0,0,asm,10002+20001,71.3773
gfx938,f8_w8a8_channel,torch.float16,2,256,7168,256,8,0,0,asm,10008+20001,103.0325
gfx938,f8_w8a8_channel,torch.float16,3,256,7168,256,8,0,0,asm,10011+20001,132.8016
gfx938,f8_w8a8_channel,torch.float16,4,256,7168,256,8,0,0,asm,10008+20001,161.5924
gfx938,f8_w8a8_channel,torch.float16,5,256,7168,256,8,0,0,asm,10006+20001,188.8424
gfx938,f8_w8a8_channel,torch.float16,6,256,7168,256,8,0,0,asm,10008+20001,203.0139
gfx938,f8_w8a8_channel,torch.float16,7,256,7168,256,8,0,0,asm,10008+20001,221.2909
gfx938,f8_w8a8_channel,torch.float16,8,256,7168,256,8,0,0,asm,10011+20001,237.7794
gfx938,f8_w8a8_channel,torch.float16,9,256,7168,256,8,0,0,asm,10011+20001,257.2902
gfx938,f8_w8a8_channel,torch.float16,10,256,7168,256,8,0,0,asm,10011+20001,272.7781
gfx938,f8_w8a8_channel,torch.float16,11,256,7168,256,8,0,0,asm,10006+20001,298.4969
gfx938,f8_w8a8_channel,torch.float16,12,256,7168,256,8,0,0,asm,10009+20001,307.2374
gfx938,f8_w8a8_channel,torch.float16,13,256,7168,256,8,0,0,asm,10008+20001,317.3495
gfx938,f8_w8a8_channel,torch.float16,14,256,7168,256,8,0,0,asm,10011+20001,339.3927
gfx938,f8_w8a8_channel,torch.float16,15,256,7168,256,8,0,0,asm,10011+20001,349.8841
gfx938,f8_w8a8_channel,torch.float16,16,256,7168,256,8,0,0,asm,10011+20001,358.5241
gfx938,f8_w8a8_channel,torch.float16,17,256,7168,256,8,0,0,asm,10009+20001,361.753
gfx938,f8_w8a8_channel,torch.float16,18,256,7168,256,8,0,0,asm,10008+20001,375.0472
gfx938,f8_w8a8_channel,torch.float16,20,256,7168,256,8,0,0,asm,10006+20001,403.993
gfx938,f8_w8a8_channel,torch.float16,24,256,7168,256,8,0,0,asm,10008+20001,453.9264
gfx938,f8_w8a8_channel,torch.float16,28,256,7168,256,8,0,0,asm,10008+20001,516.5211
gfx938,f8_w8a8_channel,torch.float16,32,256,7168,256,8,0,0,asm,10009+20001,546.433
gfx938,f8_w8a8_channel,torch.float16,34,256,7168,256,8,0,0,asm,10011+20001,547.1689
gfx938,f8_w8a8_channel,torch.float16,36,256,7168,256,8,0,0,asm,10008+20001,562.6345
gfx938,f8_w8a8_channel,torch.float16,40,256,7168,256,8,0,0,asm,10006+20001,586.7441
gfx938,f8_w8a8_channel,torch.float16,44,256,7168,256,8,0,0,asm,10008+20001,609.3898
gfx938,f8_w8a8_channel,torch.float16,48,256,7168,256,8,0,0,asm,10008+20001,623.9783
gfx938,f8_w8a8_channel,torch.float16,56,256,7168,256,8,0,0,asm,10008+20001,655.9684
gfx938,f8_w8a8_channel,torch.float16,64,256,7168,256,8,0,0,asm,10006+20001,680.2431
gfx938,f8_w8a8_channel,torch.float16,68,256,7168,256,8,0,0,asm,10006+20001,686.086
gfx938,f8_w8a8_channel,torch.float16,72,256,7168,256,8,0,0,asm,10012+20001,720.2646
gfx938,f8_w8a8_channel,torch.float16,80,256,7168,256,8,0,0,asm,10008+20001,771.0738
gfx938,f8_w8a8_channel,torch.float16,88,256,7168,256,8,0,0,asm,10008+20001,745.2486
gfx938,f8_w8a8_channel,torch.float16,96,256,7168,256,8,0,0,asm,10006+20001,755.5114
gfx938,f8_w8a8_channel,torch.float16,104,256,7168,256,8,0,0,asm,10008+20001,770.5044
gfx938,f8_w8a8_channel,torch.float16,112,256,7168,256,8,0,0,asm,10008+20001,775.8668
gfx938,f8_w8a8_channel,torch.float16,128,256,7168,256,8,0,0,asm,10008+20001,789.3307
gfx938,f8_w8a8_channel,torch.float16,144,256,7168,256,8,0,0,asm,10008+20001,801.6573
gfx938,f8_w8a8_channel,torch.float16,160,256,7168,256,8,0,0,asm,10008+20001,808.8431
gfx938,f8_w8a8_channel,torch.float16,192,256,7168,256,8,0,0,asm,10008+20001,822.915
gfx938,f8_w8a8_channel,torch.float16,224,256,7168,256,8,0,0,asm,10008+20001,833.1515
gfx938,f8_w8a8_channel,torch.float16,256,256,7168,256,8,0,0,asm,10008+20001,843.5744
gfx938,f8_w8a8_channel,torch.float16,320,256,7168,256,8,0,0,asm,10008+20001,875.8173
gfx938,f8_w8a8_channel,torch.float16,384,256,7168,256,8,0,0,asm,11002+21001,903.3123
gfx938,f8_w8a8_channel,torch.float16,448,256,7168,256,8,0,0,asm,11004+21001,923.768
gfx938,f8_w8a8_channel,torch.float16,512,256,7168,256,8,0,0,asm,11004+21001,945.9661
gfx938,f8_w8a8_channel,torch.float16,576,256,7168,256,8,0,0,asm,11004+21001,1004.9307
gfx938,f8_w8a8_channel,torch.float16,640,256,7168,256,8,0,0,asm,11004+21001,984.5559
gfx938,f8_w8a8_channel,torch.float16,704,256,7168,256,8,0,0,asm,11004+21001,1009.4000
gfx938,f8_w8a8_channel,torch.float16,768,256,7168,256,8,0,0,asm,11007+21001,1039.9012
gfx938,f8_w8a8_channel,torch.float16,832,256,7168,256,8,0,0,asm,11005+21001,1073.4592
gfx938,f8_w8a8_channel,torch.float16,896,256,7168,256,8,0,0,asm,11005+21001,1100.2193
gfx938,f8_w8a8_channel,torch.float16,960,256,7168,256,8,0,0,asm,11003+21001,1159.3657
gfx938,f8_w8a8_channel,torch.float16,1024,256,7168,256,8,0,0,asm,11005+21001,1212.9271
gfx938,f8_w8a8_channel,torch.float16,1152,256,7168,256,8,0,0,asm,12005+22001,1301.3286
gfx938,f8_w8a8_channel,torch.float16,1280,256,7168,256,8,0,0,asm,12000+22001,1317.5435
gfx938,f8_w8a8_channel,torch.float16,1408,256,7168,256,8,0,0,asm,12005+22001,1342.2792
gfx938,f8_w8a8_channel,torch.float16,1536,256,7168,256,8,0,0,asm,12005+22001,1367.209
gfx938,f8_w8a8_channel,torch.float16,1664,256,7168,256,8,0,0,asm,12005+22001,1409.4242
gfx938,f8_w8a8_channel,torch.float16,1792,256,7168,256,8,0,0,asm,12005+22001,1489.8281
gfx938,f8_w8a8_channel,torch.float16,1920,256,7168,256,8,0,0,asm,12005+22001,1528.3161
gfx938,f8_w8a8_channel,torch.float16,2048,256,7168,256,8,0,0,asm,12001+22001,1688.9472
gfx938,f8_w8a8_channel,torch.float16,2304,256,7168,256,8,0,0,asm,12005+22001,1951.8713
gfx938,f8_w8a8_channel,torch.float16,2560,256,7168,256,8,0,0,asm,13001+23001,2031.2743
gfx938,f8_w8a8_channel,torch.float16,2816,256,7168,256,8,0,0,asm,13001+23001,2085.2615
gfx938,f8_w8a8_channel,torch.float16,3072,256,7168,256,8,0,0,asm,13001+23001,2147.5381
gfx938,f8_w8a8_channel,torch.float16,3328,256,7168,256,8,0,0,asm,13001+23001,2207.5995
gfx938,f8_w8a8_channel,torch.float16,3584,256,7168,256,8,0,0,asm,13001+23001,2290.0607
gfx938,f8_w8a8_channel,torch.float16,3840,256,7168,256,8,0,0,asm,13001+23001,2455.1266
gfx938,f8_w8a8_channel,torch.float16,4096,256,7168,256,8,0,0,asm,12005+22001,2762.0217
gfx938,f8_w8a8_channel,torch.float16,4608,256,7168,256,8,0,0,asm,12001+22001,3148.4202
gfx938,f8_w8a8_channel,torch.float16,5120,256,7168,256,8,0,0,asm,12001+22001,3345.6214
gfx938,f8_w8a8_channel,torch.float16,5632,256,7168,256,8,0,0,asm,12001+22001,3531.3437
gfx938,f8_w8a8_channel,torch.float16,6144,256,7168,256,8,0,0,asm,13001+23001,3833.4307
gfx938,f8_w8a8_channel,torch.float16,6656,256,7168,256,8,0,0,asm,13001+23001,3933.061
gfx938,f8_w8a8_channel,torch.float16,7168,256,7168,256,8,0,0,asm,13001+23001,4047.1816
gfx938,f8_w8a8_channel,torch.float16,7680,256,7168,256,8,0,0,asm,13001+23001,4302.8155
gfx938,f8_w8a8_channel,torch.float16,8192,256,7168,256,8,0,0,asm,13001+23001,4770.8874
gfx938,f8_w8a8_channel,torch.float16,10240,256,7168,256,8,0,0,asm,13001+23001,5814.4894
gfx938,f8_w8a8_channel,torch.float16,12288,256,7168,256,8,0,0,asm,13001+23001,6783.9214
gfx938,f8_w8a8_channel,torch.float16,14336,256,7168,256,8,0,0,asm,13001+23001,7833.6239
gfx938,f8_w8a8_channel,torch.float16,16384,256,7168,256,8,0,0,asm,13001+23001,8799.1627
gfx938,f8_w8a8_channel,torch.float16,17408,256,7168,256,8,0,0,asm,13001+23001,9562.2695
gfx938,f8_w8a8_channel,torch.float16,24576,256,7168,256,8,0,0,asm,13001+23001,12888.3568
gfx938,f8_w8a8_channel,torch.float16,32768,256,7168,256,8,0,0,asm,13001+23001,16903.9514
gfx938,f8_w8a8_channel,torch.float16,40960,256,7168,256,8,0,0,asm,13001+23001,20904.6085
gfx938,f8_w8a8_channel,torch.float16,49152,256,7168,256,8,0,0,asm,13001+23001,24866.1601
gfx938,f8_w8a8_channel,torch.float16,57344,256,7168,256,8,0,0,asm,13001+23001,28986.4682
gfx938,f8_w8a8_channel,torch.float16,65536,256,7168,256,8,0,0,asm,13001+23001,33012.5482
gfx938,f8_w8a8_channel,torch.float16,1,352,4096,128,8,0,0,asm,10001+20000,63.0496
gfx938,f8_w8a8_channel,torch.float16,2,352,4096,128,8,0,0,asm,10001+20000,89.0958
gfx938,f8_w8a8_channel,torch.float16,4,352,4096,128,8,0,0,asm,10006+20000,128.5736
gfx938,f8_w8a8_channel,torch.float16,6,352,4096,128,8,0,0,asm,10006+20000,161.6681
gfx938,f8_w8a8_channel,torch.float16,8,352,4096,128,8,0,0,asm,10007+20000,193.1626
gfx938,f8_w8a8_channel,torch.float16,12,352,4096,128,8,0,0,asm,10006+20001,237.1877
gfx938,f8_w8a8_channel,torch.float16,16,352,4096,128,8,0,0,asm,10006+20000,271.0993
gfx938,f8_w8a8_channel,torch.float16,20,352,4096,128,8,0,0,asm,10007+20000,309.4708
gfx938,f8_w8a8_channel,torch.float16,24,352,4096,128,8,0,0,asm,10007+20000,317.0666
gfx938,f8_w8a8_channel,torch.float16,28,352,4096,128,8,0,0,asm,10006+20000,320.9012
gfx938,f8_w8a8_channel,torch.float16,32,352,4096,128,8,0,0,asm,10007+20001,333.1537
gfx938,f8_w8a8_channel,torch.float16,36,352,4096,128,8,0,0,asm,10006+20001,340.7128
gfx938,f8_w8a8_channel,torch.float16,40,352,4096,128,8,0,0,asm,10006+20000,346.6581
gfx938,f8_w8a8_channel,torch.float16,44,352,4096,128,8,0,0,asm,10006+20000,359.2222
gfx938,f8_w8a8_channel,torch.float16,48,352,4096,128,8,0,0,asm,10006+20000,367.6264
gfx938,f8_w8a8_channel,torch.float16,56,352,4096,128,8,0,0,asm,10006+20001,368.0895
gfx938,f8_w8a8_channel,torch.float16,64,352,4096,128,8,0,0,asm,10006+20001,379.8314
gfx938,f8_w8a8_channel,torch.float16,72,352,4096,128,8,0,0,asm,10006+20000,372.8558
gfx938,f8_w8a8_channel,torch.float16,80,352,4096,128,8,0,0,asm,10006+20000,371.9043
gfx938,f8_w8a8_channel,torch.float16,96,352,4096,128,8,0,0,asm,10006+20000,376.7547
gfx938,f8_w8a8_channel,torch.float16,104,352,4096,128,8,0,0,asm,10006+20000,378.9442
gfx938,f8_w8a8_channel,torch.float16,112,352,4096,128,8,0,0,asm,10006+20001,381.2263
gfx938,f8_w8a8_channel,torch.float16,128,352,4096,128,8,0,0,asm,10006+20001,385.3105
gfx938,f8_w8a8_channel,torch.float16,144,352,4096,128,8,0,0,asm,10006+20001,430.5903
gfx938,f8_w8a8_channel,torch.float16,160,352,4096,128,8,0,0,asm,10006+20000,399.4326
gfx938,f8_w8a8_channel,torch.float16,192,352,4096,128,8,0,0,asm,10006+20001,418.3883
gfx938,f8_w8a8_channel,torch.float16,224,352,4096,128,8,0,0,asm,11002+21000,434.2787
gfx938,f8_w8a8_channel,torch.float16,256,352,4096,128,8,0,0,asm,11004+21000,446.9103
gfx938,f8_w8a8_channel,torch.float16,320,352,4096,128,8,0,0,asm,11004+21001,460.9228
gfx938,f8_w8a8_channel,torch.float16,384,352,4096,128,8,0,0,asm,11004+21001,529.2931
gfx938,f8_w8a8_channel,torch.float16,448,352,4096,128,8,0,0,asm,11004+21001,508.83
gfx938,f8_w8a8_channel,torch.float16,512,352,4096,128,8,0,0,asm,11004+21001,554.5308
gfx938,f8_w8a8_channel,torch.float16,768,352,4096,128,8,0,0,asm,12002+22001,625.1664
gfx938,f8_w8a8_channel,torch.float16,896,352,4096,128,8,0,0,asm,12004+22001,665.6967
gfx938,f8_w8a8_channel,torch.float16,960,352,4096,128,8,0,0,asm,12000+22001,710.7071
gfx938,f8_w8a8_channel,torch.float16,1024,352,4096,128,8,0,0,asm,12005+22001,746.8753
gfx938,f8_w8a8_channel,torch.float16,1280,352,4096,128,8,0,0,asm,12001+22001,861.7717
gfx938,f8_w8a8_channel,torch.float16,1536,352,4096,128,8,0,0,asm,12001+22001,918.0662
gfx938,f8_w8a8_channel,torch.float16,1920,352,4096,128,8,0,0,asm,12001+22001,995.969
gfx938,f8_w8a8_channel,torch.float16,2048,352,4096,128,8,0,0,asm,12001+22001,1101.2402
gfx938,f8_w8a8_channel,torch.float16,2304,352,4096,128,8,0,0,asm,12001+22001,1248.389
gfx938,f8_w8a8_channel,torch.float16,2560,352,4096,128,8,0,0,asm,12001+22001,1272.6331
gfx938,f8_w8a8_channel,torch.float16,3072,352,4096,128,8,0,0,asm,13001+23001,1460.7586
gfx938,f8_w8a8_channel,torch.float16,3584,352,4096,128,8,0,0,asm,13001+23001,1532.7836
gfx938,f8_w8a8_channel,torch.float16,3840,352,4096,128,8,0,0,asm,13001+23001,1618.2737
gfx938,f8_w8a8_channel,torch.float16,4096,352,4096,128,8,0,0,asm,13001+23001,1813.9613
gfx938,f8_w8a8_channel,torch.float16,4608,352,4096,128,8,0,0,asm,13001+23001,2081.9939
gfx938,f8_w8a8_channel,torch.float16,5120,352,4096,128,8,0,0,asm,13001+23001,2147.0968
gfx938,f8_w8a8_channel,torch.float16,6144,352,4096,128,8,0,0,asm,13001+23001,2515.8026
gfx938,f8_w8a8_channel,torch.float16,7168,352,4096,128,8,0,0,asm,13001+23001,2873.9653
gfx938,f8_w8a8_channel,torch.float16,8192,352,4096,128,8,0,0,asm,13001+23001,3216.9279
gfx938,f8_w8a8_channel,torch.float16,10240,352,4096,128,8,0,0,asm,13001+23001,3971.7204
gfx938,f8_w8a8_channel,torch.float16,12288,352,4096,128,8,0,0,asm,13001+23001,4688.2562
gfx938,f8_w8a8_channel,torch.float16,16384,352,4096,128,8,0,0,asm,13001+23001,6226.4982
gfx938,f8_w8a8_channel,torch.float16,24576,352,4096,128,8,0,0,asm,13001+23001,8953.0047
gfx938,f8_w8a8_channel,torch.float16,32768,352,4096,128,8,0,0,asm,13001+23001,11870.9884
gfx938,f8_w8a8_channel,torch.float16,1,352,4096,129,9,0,0,asm,10004+20000,66.9906
gfx938,f8_w8a8_channel,torch.float16,2,352,4096,129,9,0,0,asm,10006+20000,93.7946
gfx938,f8_w8a8_channel,torch.float16,4,352,4096,129,9,0,0,asm,10006+20000,135.1756
gfx938,f8_w8a8_channel,torch.float16,6,352,4096,129,9,0,0,asm,10006+20000,169.0953
gfx938,f8_w8a8_channel,torch.float16,8,352,4096,129,9,0,0,asm,10006+20000,206.291
gfx938,f8_w8a8_channel,torch.float16,12,352,4096,129,9,0,0,asm,10006+20000,247.0656
gfx938,f8_w8a8_channel,torch.float16,16,352,4096,129,9,0,0,asm,10006+20000,289.8192
gfx938,f8_w8a8_channel,torch.float16,20,352,4096,129,9,0,0,asm,10007+20000,319.9213
gfx938,f8_w8a8_channel,torch.float16,24,352,4096,129,9,0,0,asm,10006+20000,338.0181
gfx938,f8_w8a8_channel,torch.float16,28,352,4096,129,9,0,0,asm,10006+20000,339.0821
gfx938,f8_w8a8_channel,torch.float16,32,352,4096,129,9,0,0,asm,10006+20000,344.3705
gfx938,f8_w8a8_channel,torch.float16,36,352,4096,129,9,0,0,asm,10006+20000,349.698
gfx938,f8_w8a8_channel,torch.float16,40,352,4096,129,9,0,0,asm,10006+20000,356.6116
gfx938,f8_w8a8_channel,torch.float16,44,352,4096,129,9,0,0,asm,10006+20000,364.4264
gfx938,f8_w8a8_channel,torch.float16,48,352,4096,129,9,0,0,asm,10006+20000,369.5632
gfx938,f8_w8a8_channel,torch.float16,56,352,4096,129,9,0,0,asm,10006+20000,374.7421
gfx938,f8_w8a8_channel,torch.float16,64,352,4096,129,9,0,0,asm,10006+20000,383.0145
gfx938,f8_w8a8_channel,torch.float16,72,352,4096,129,9,0,0,asm,10006+20000,381.8074
gfx938,f8_w8a8_channel,torch.float16,80,352,4096,129,9,0,0,asm,10007+20000,377.8916
gfx938,f8_w8a8_channel,torch.float16,96,352,4096,129,9,0,0,asm,10006+20000,385.0915
gfx938,f8_w8a8_channel,torch.float16,104,352,4096,129,9,0,0,asm,10006+20000,384.6873
gfx938,f8_w8a8_channel,torch.float16,112,352,4096,129,9,0,0,asm,10006+20000,387.6684
gfx938,f8_w8a8_channel,torch.float16,128,352,4096,129,9,0,0,asm,10006+20001,389.6473
gfx938,f8_w8a8_channel,torch.float16,144,352,4096,129,9,0,0,asm,10006+20001,403.0031
gfx938,f8_w8a8_channel,torch.float16,160,352,4096,129,9,0,0,asm,10006+20001,404.7041
gfx938,f8_w8a8_channel,torch.float16,192,352,4096,129,9,0,0,asm,11004+21000,428.0303
gfx938,f8_w8a8_channel,torch.float16,224,352,4096,129,9,0,0,asm,11004+21001,438.6576
gfx938,f8_w8a8_channel,torch.float16,256,352,4096,129,9,0,0,asm,11004+21000,446.2871
gfx938,f8_w8a8_channel,torch.float16,320,352,4096,129,9,0,0,asm,11004+21001,471.8112
gfx938,f8_w8a8_channel,torch.float16,384,352,4096,129,9,0,0,asm,11004+21000,494.91
gfx938,f8_w8a8_channel,torch.float16,448,352,4096,129,9,0,0,asm,11004+21001,535.9625
gfx938,f8_w8a8_channel,torch.float16,512,352,4096,129,9,0,0,asm,12000+22001,566.0424
gfx938,f8_w8a8_channel,torch.float16,768,352,4096,129,9,0,0,asm,12004+22001,633.3263
gfx938,f8_w8a8_channel,torch.float16,896,352,4096,129,9,0,0,asm,12001+22001,714.4207
gfx938,f8_w8a8_channel,torch.float16,960,352,4096,129,9,0,0,asm,12003+22001,785.0646
gfx938,f8_w8a8_channel,torch.float16,1024,352,4096,129,9,0,0,asm,12001+22001,842.2433
gfx938,f8_w8a8_channel,torch.float16,1280,352,4096,129,9,0,0,asm,12001+22001,895.9105
gfx938,f8_w8a8_channel,torch.float16,1536,352,4096,129,9,0,0,asm,12005+22001,955.506
gfx938,f8_w8a8_channel,torch.float16,1920,352,4096,129,9,0,0,asm,12001+22001,1193.5008
gfx938,f8_w8a8_channel,torch.float16,2048,352,4096,129,9,0,0,asm,12001+22001,1239.749
gfx938,f8_w8a8_channel,torch.float16,2304,352,4096,129,9,0,0,asm,12001+22001,1304.8266
gfx938,f8_w8a8_channel,torch.float16,2560,352,4096,129,9,0,0,asm,12001+22001,1346.1569
gfx938,f8_w8a8_channel,torch.float16,3072,352,4096,129,9,0,0,asm,13001+23001,1491.9416
gfx938,f8_w8a8_channel,torch.float16,3584,352,4096,129,9,0,0,asm,13001+23001,1740.909
gfx938,f8_w8a8_channel,torch.float16,3840,352,4096,129,9,0,0,asm,13001+23001,1995.6785
gfx938,f8_w8a8_channel,torch.float16,4096,352,4096,129,9,0,0,asm,13001+23001,2067.636
gfx938,f8_w8a8_channel,torch.float16,4608,352,4096,129,9,0,0,asm,13001+23001,2126.1537
gfx938,f8_w8a8_channel,torch.float16,5120,352,4096,129,9,0,0,asm,13001+23001,2344.7044
gfx938,f8_w8a8_channel,torch.float16,6144,352,4096,129,9,0,0,asm,13001+23001,2914.0914
gfx938,f8_w8a8_channel,torch.float16,7168,352,4096,129,9,0,0,asm,13001+23001,3109.3158
gfx938,f8_w8a8_channel,torch.float16,8192,352,4096,129,9,0,0,asm,13001+23001,3587.9411
gfx938,f8_w8a8_channel,torch.float16,10240,352,4096,129,9,0,0,asm,13001+23001,4377.0662
gfx938,f8_w8a8_channel,torch.float16,12288,352,4096,129,9,0,0,asm,13001+23001,5110.4779
gfx938,f8_w8a8_channel,torch.float16,16384,352,4096,129,9,0,0,asm,13001+23001,6757.208
gfx938,f8_w8a8_channel,torch.float16,24576,352,4096,129,9,0,0,asm,13001+23001,9975.1734
gfx938,f8_w8a8_channel,torch.float16,32768,352,4096,129,9,0,0,asm,13001+23001,13179.6065
gfx936,int8_w8a8_channel,torch.float16,1,384,3072,256,8,0,0,asm,10002+20000,57.8034
gfx936,int8_w8a8_channel,torch.float16,2,384,3072,256,8,0,0,asm,10006+20000,79.9676
gfx936,int8_w8a8_channel,torch.float16,4,384,3072,256,8,0,0,asm,10007+20000,127.3875
gfx936,int8_w8a8_channel,torch.float16,6,384,3072,256,8,0,0,asm,10007+20000,167.0003
gfx936,int8_w8a8_channel,torch.float16,8,384,3072,256,8,0,0,asm,10007+20000,202.6299
gfx936,int8_w8a8_channel,torch.float16,12,384,3072,256,8,0,0,asm,10007+20000,264.5336
gfx936,int8_w8a8_channel,torch.float16,16,384,3072,256,8,0,0,asm,10007+20000,316.8877
gfx936,int8_w8a8_channel,torch.float16,24,384,3072,256,8,0,0,asm,10007+20000,415.3612
gfx936,int8_w8a8_channel,torch.float16,32,384,3072,256,8,0,0,asm,10007+20000,503.9710
gfx936,int8_w8a8_channel,torch.float16,36,384,3072,256,8,0,0,asm,10007+20000,523.2945
gfx936,int8_w8a8_channel,torch.float16,48,384,3072,256,8,0,0,asm,10007+20000,584.4568
gfx936,int8_w8a8_channel,torch.float16,56,384,3072,256,8,0,0,asm,10007+20000,615.8508
gfx936,int8_w8a8_channel,torch.float16,64,384,3072,256,8,0,0,asm,10006+20000,640.557
gfx936,int8_w8a8_channel,torch.float16,72,384,3072,256,8,0,0,asm,10006+20000,664.3161
gfx936,int8_w8a8_channel,torch.float16,80,384,3072,256,8,0,0,asm,10006+20000,687.6761
gfx936,int8_w8a8_channel,torch.float16,88,384,3072,256,8,0,0,asm,10007+20000,708.2149
gfx936,int8_w8a8_channel,torch.float16,96,384,3072,256,8,0,0,asm,10006+20000,716.4591
gfx936,int8_w8a8_channel,torch.float16,100,384,3072,256,8,0,0,asm,10007+20000,721.7644
gfx936,int8_w8a8_channel,torch.float16,112,384,3072,256,8,0,0,asm,10007+20000,734.3622
gfx936,int8_w8a8_channel,torch.float16,128,384,3072,256,8,0,0,asm,10007+20000,751.3221
gfx936,int8_w8a8_channel,torch.float16,144,384,3072,256,8,0,0,asm,10007+20000,759.3304
gfx936,int8_w8a8_channel,torch.float16,160,384,3072,256,8,0,0,asm,10006+20000,767.7599
gfx936,int8_w8a8_channel,torch.float16,192,384,3072,256,8,0,0,asm,10007+20000,782.0504
gfx936,int8_w8a8_channel,torch.float16,224,384,3072,256,8,0,0,asm,10006+20000,795.6587
gfx936,int8_w8a8_channel,torch.float16,256,384,3072,256,8,0,0,asm,10006+20000,804.6354
gfx936,int8_w8a8_channel,torch.float16,320,384,3072,256,8,0,0,asm,10007+20000,830.3447
gfx936,int8_w8a8_channel,torch.float16,384,384,3072,256,8,0,0,asm,11006+21000,854.2437
gfx936,int8_w8a8_channel,torch.float16,448,384,3072,256,8,0,0,asm,11006+21000,872.6016
gfx936,int8_w8a8_channel,torch.float16,512,384,3072,256,8,0,0,asm,11006+21000,887.7257
gfx936,int8_w8a8_channel,torch.float16,640,384,3072,256,8,0,0,asm,11006+21000,921.6457
gfx936,int8_w8a8_channel,torch.float16,768,384,3072,256,8,0,0,asm,11006+21000,952.2567
gfx936,int8_w8a8_channel,torch.float16,896,384,3072,256,8,0,0,asm,12004+22001,1000.5934
gfx936,int8_w8a8_channel,torch.float16,1024,384,3072,256,8,0,0,asm,12004+22001,1024.0714
gfx936,int8_w8a8_channel,torch.float16,1280,384,3072,256,8,0,0,asm,12004+22001,1071.4648
gfx936,int8_w8a8_channel,torch.float16,1536,384,3072,256,8,0,0,asm,12004+22001,1123.8351
gfx936,int8_w8a8_channel,torch.float16,2048,384,3072,256,8,0,0,asm,12005+22001,1284.3736
gfx936,int8_w8a8_channel,torch.float16,2304,384,3072,256,8,0,0,asm,12005+22001,1379.2871
gfx936,int8_w8a8_channel,torch.float16,2560,384,3072,256,8,0,0,asm,13000+23001,1425.6448
gfx936,int8_w8a8_channel,torch.float16,3072,384,3072,256,8,0,0,asm,13000+23001,1514.0309
gfx936,int8_w8a8_channel,torch.float16,3584,384,3072,256,8,0,0,asm,13000+23001,1634.6032
gfx936,int8_w8a8_channel,torch.float16,4096,384,3072,256,8,0,0,asm,13001+23001,1824.514
gfx936,int8_w8a8_channel,torch.float16,5120,384,3072,256,8,0,0,asm,12001+22001,2216.8495
gfx936,int8_w8a8_channel,torch.float16,6144,384,3072,256,8,0,0,asm,13001+23001,2364.4616
gfx936,int8_w8a8_channel,torch.float16,7168,384,3072,256,8,0,0,asm,13001+23001,2538.6083
gfx936,int8_w8a8_channel,torch.float16,8192,384,3072,256,8,0,0,asm,13001+23001,2952.9812
gfx936,int8_w8a8_channel,torch.float16,10240,384,3072,256,8,0,0,asm,13001+23001,3585.1639
gfx936,int8_w8a8_channel,torch.float16,12288,384,3072,256,8,0,0,asm,13001+23001,4181.1698
gfx936,int8_w8a8_channel,torch.float16,16384,384,3072,256,8,0,0,asm,13001+23001,5377.322
gfx936,int8_w8a8_channel,torch.float16,24576,384,3072,256,8,0,0,asm,13001+23001,7906.7003
gfx936,int8_w8a8_channel,torch.float16,32768,384,3072,256,8,0,0,asm,13001+23001,10408.7744
gfx936,int8_w8a8_channel,torch.float16,1,192,3072,256,8,0,0,asm,10006+20000,44.8855
gfx936,int8_w8a8_channel,torch.float16,2,192,3072,256,8,0,0,asm,10009+20000,60.4898
gfx936,int8_w8a8_channel,torch.float16,4,192,3072,256,8,0,0,asm,10013+20000,83.9172
gfx936,int8_w8a8_channel,torch.float16,6,192,3072,256,8,0,0,asm,10006+20000,104.9866
gfx936,int8_w8a8_channel,torch.float16,8,192,3072,256,8,0,0,asm,10009+20001,125.0032
gfx936,int8_w8a8_channel,torch.float16,12,192,3072,256,8,0,0,asm,10010+20000,160.2622
gfx936,int8_w8a8_channel,torch.float16,16,192,3072,256,8,0,0,asm,10006+20000,188.6327
gfx936,int8_w8a8_channel,torch.float16,24,192,3072,256,8,0,0,asm,10007+20001,236.7812
gfx936,int8_w8a8_channel,torch.float16,32,192,3072,256,8,0,0,asm,10007+20001,292.8094
gfx936,int8_w8a8_channel,torch.float16,36,192,3072,256,8,0,0,asm,10007+20001,296.5958
gfx936,int8_w8a8_channel,torch.float16,48,192,3072,256,8,0,0,asm,10007+20000,328.3769
gfx936,int8_w8a8_channel,torch.float16,56,192,3072,256,8,0,0,asm,10007+20001,343.5516
gfx936,int8_w8a8_channel,torch.float16,64,192,3072,256,8,0,0,asm,10007+20001,356.6294
gfx936,int8_w8a8_channel,torch.float16,72,192,3072,256,8,0,0,asm,10007+20001,369.8757
gfx936,int8_w8a8_channel,torch.float16,80,192,3072,256,8,0,0,asm,10006+20001,377.9768
gfx936,int8_w8a8_channel,torch.float16,88,192,3072,256,8,0,0,asm,10006+20001,389.4547
gfx936,int8_w8a8_channel,torch.float16,96,192,3072,256,8,0,0,asm,10006+20000,396.4441
gfx936,int8_w8a8_channel,torch.float16,100,192,3072,256,8,0,0,asm,10007+20000,395.9387
gfx936,int8_w8a8_channel,torch.float16,112,192,3072,256,8,0,0,asm,10007+20001,404.8062
gfx936,int8_w8a8_channel,torch.float16,128,192,3072,256,8,0,0,asm,10006+20000,418.9955
gfx936,int8_w8a8_channel,torch.float16,144,192,3072,256,8,0,0,asm,10006+20001,422.4733
gfx936,int8_w8a8_channel,torch.float16,160,192,3072,256,8,0,0,asm,10006+20001,426.6501
gfx936,int8_w8a8_channel,torch.float16,192,192,3072,256,8,0,0,asm,10006+20001,435.0712
gfx936,int8_w8a8_channel,torch.float16,224,192,3072,256,8,0,0,asm,10006+20001,441.6734
gfx936,int8_w8a8_channel,torch.float16,256,192,3072,256,8,0,0,asm,10006+20001,449.2776
gfx936,int8_w8a8_channel,torch.float16,320,192,3072,256,8,0,0,asm,10007+20001,465.3449
gfx936,int8_w8a8_channel,torch.float16,384,192,3072,256,8,0,0,asm,10007+20001,483.1134
gfx936,int8_w8a8_channel,torch.float16,448,192,3072,256,8,0,0,asm,11006+21001,496.2418
gfx936,int8_w8a8_channel,torch.float16,512,192,3072,256,8,0,0,asm,11006+21001,511.8880
gfx936,int8_w8a8_channel,torch.float16,640,192,3072,256,8,0,0,asm,11006+21001,536.2923
gfx936,int8_w8a8_channel,torch.float16,768,192,3072,256,8,0,0,asm,11006+21001,565.488
gfx936,int8_w8a8_channel,torch.float16,896,192,3072,256,8,0,0,asm,11004+21001,592.8648
gfx936,int8_w8a8_channel,torch.float16,1024,192,3072,256,8,0,0,asm,11004+21001,632.0227
gfx936,int8_w8a8_channel,torch.float16,1280,192,3072,256,8,0,0,asm,12004+22001,678.2626
gfx936,int8_w8a8_channel,torch.float16,1536,192,3072,256,8,0,0,asm,12004+22001,721.7235
gfx936,int8_w8a8_channel,torch.float16,2048,192,3072,256,8,0,0,asm,12000+22001,866.7338
gfx936,int8_w8a8_channel,torch.float16,2304,192,3072,256,8,0,0,asm,13001+23001,968.9905
gfx936,int8_w8a8_channel,torch.float16,2560,192,3072,256,8,0,0,asm,13001+23001,1005.2935
gfx936,int8_w8a8_channel,torch.float16,3072,192,3072,256,8,0,0,asm,13000+23001,1075.8535
gfx936,int8_w8a8_channel,torch.float16,3584,192,3072,256,8,0,0,asm,13001+23001,1161.3776
gfx936,int8_w8a8_channel,torch.float16,4096,192,3072,256,8,0,0,asm,13001+23001,1384.6193
gfx936,int8_w8a8_channel,torch.float16,5120,192,3072,256,8,0,0,asm,12000+22001,1677.0231
gfx936,int8_w8a8_channel,torch.float16,6144,192,3072,256,8,0,0,asm,13001+23001,1893.4521
gfx936,int8_w8a8_channel,torch.float16,7168,192,3072,256,8,0,0,asm,13001+23001,2042.8661
gfx936,int8_w8a8_channel,torch.float16,8192,192,3072,256,8,0,0,asm,13001+23001,2372.4733
gfx936,int8_w8a8_channel,torch.float16,10240,192,3072,256,8,0,0,asm,13001+23001,2884.8177
gfx936,int8_w8a8_channel,torch.float16,12288,192,3072,256,8,0,0,asm,13001+23001,3381.5416
gfx936,int8_w8a8_channel,torch.float16,16384,192,3072,256,8,0,0,asm,13001+23001,4384.9761
gfx936,int8_w8a8_channel,torch.float16,24576,192,3072,256,8,0,0,asm,13001+23001,6428.7541
gfx936,int8_w8a8_channel,torch.float16,32768,192,3072,256,8,0,0,asm,13001+23001,8504.9194
gfx936,int8_w8a8_channel,torch.float16,1,192,5120,160,8,0,0,asm,10006+20000,52.2624
gfx936,int8_w8a8_channel,torch.float16,2,192,5120,160,8,0,0,asm,10009+20000,70.2834
gfx936,int8_w8a8_channel,torch.float16,4,192,5120,160,8,0,0,asm,10002+20000,103.8327
gfx936,int8_w8a8_channel,torch.float16,6,192,5120,160,8,0,0,asm,10007+20000,139.0834
gfx936,int8_w8a8_channel,torch.float16,8,192,5120,160,8,0,0,asm,10007+20000,171.4032
gfx936,int8_w8a8_channel,torch.float16,12,192,5120,160,8,0,0,asm,10007+20001,233.6516
gfx936,int8_w8a8_channel,torch.float16,16,192,5120,160,8,0,0,asm,10007+20000,268.1862
gfx936,int8_w8a8_channel,torch.float16,24,192,5120,160,8,0,0,asm,10007+20001,321.5474
gfx936,int8_w8a8_channel,torch.float16,32,192,5120,160,8,0,0,asm,10007+20001,362.0808
gfx936,int8_w8a8_channel,torch.float16,36,192,5120,160,8,0,0,asm,10006+20001,372.5115
gfx936,int8_w8a8_channel,torch.float16,48,192,5120,160,8,0,0,asm,10007+20000,397.1009
gfx936,int8_w8a8_channel,torch.float16,56,192,5120,160,8,0,0,asm,10007+20000,410.7262
gfx936,int8_w8a8_channel,torch.float16,64,192,5120,160,8,0,0,asm,10007+20000,416.1324
gfx936,int8_w8a8_channel,torch.float16,72,192,5120,160,8,0,0,asm,10007+20001,423.3745
gfx936,int8_w8a8_channel,torch.float16,80,192,5120,160,8,0,0,asm,10007+20000,430.4229
gfx936,int8_w8a8_channel,torch.float16,88,192,5120,160,8,0,0,asm,10007+20001,432.8483
gfx936,int8_w8a8_channel,torch.float16,96,192,5120,160,8,0,0,asm,10006+20001,437.564
gfx936,int8_w8a8_channel,torch.float16,100,192,5120,160,8,0,0,asm,10001+20001,439.9303
gfx936,int8_w8a8_channel,torch.float16,112,192,5120,160,8,0,0,asm,10006+20001,443.0629
gfx936,int8_w8a8_channel,torch.float16,128,192,5120,160,8,0,0,asm,10006+20001,446.1113
gfx936,int8_w8a8_channel,torch.float16,144,192,5120,160,8,0,0,asm,10007+20001,452.2587
gfx936,int8_w8a8_channel,torch.float16,160,192,5120,160,8,0,0,asm,10006+20001,457.2608
gfx936,int8_w8a8_channel,torch.float16,192,192,5120,160,8,0,0,asm,10006+20001,466.7092
gfx936,int8_w8a8_channel,torch.float16,224,192,5120,160,8,0,0,asm,10006+20001,476.2418
gfx936,int8_w8a8_channel,torch.float16,256,192,5120,160,8,0,0,asm,10006+20001,490.3724
gfx936,int8_w8a8_channel,torch.float16,320,192,5120,160,8,0,0,asm,11006+21001,506.7597
gfx936,int8_w8a8_channel,torch.float16,384,192,5120,160,8,0,0,asm,11006+21001,525.1344
gfx936,int8_w8a8_channel,torch.float16,448,192,5120,160,8,0,0,asm,11006+21001,540.646
gfx936,int8_w8a8_channel,torch.float16,512,192,5120,160,8,0,0,asm,11006+21001,575.2648
gfx936,int8_w8a8_channel,torch.float16,640,192,5120,160,8,0,0,asm,12004+22001,626.5237
gfx936,int8_w8a8_channel,torch.float16,768,192,5120,160,8,0,0,asm,12004+22001,656.4268
gfx936,int8_w8a8_channel,torch.float16,896,192,5120,160,8,0,0,asm,12004+22001,681.1089
gfx936,int8_w8a8_channel,torch.float16,1024,192,5120,160,8,0,0,asm,12004+22001,722.4309
gfx936,int8_w8a8_channel,torch.float16,1280,192,5120,160,8,0,0,asm,12004+22001,840.5107
gfx936,int8_w8a8_channel,torch.float16,1536,192,5120,160,8,0,0,asm,13001+23001,962.6073
gfx936,int8_w8a8_channel,torch.float16,2048,192,5120,160,8,0,0,asm,13001+23001,1058.4304
gfx936,int8_w8a8_channel,torch.float16,2304,192,5120,160,8,0,0,asm,13001+23001,1153.0744
gfx936,int8_w8a8_channel,torch.float16,2560,192,5120,160,8,0,0,asm,12001+22001,1339.7014
gfx936,int8_w8a8_channel,torch.float16,3072,192,5120,160,8,0,0,asm,12001+22001,1563.2211
gfx936,int8_w8a8_channel,torch.float16,3584,192,5120,160,8,0,0,asm,12001+22001,1709.4608
gfx936,int8_w8a8_channel,torch.float16,4096,192,5120,160,8,0,0,asm,13001+23001,1842.4543
gfx936,int8_w8a8_channel,torch.float16,5120,192,5120,160,8,0,0,asm,13001+23001,2276.4578
gfx936,int8_w8a8_channel,torch.float16,6144,192,5120,160,8,0,0,asm,13001+23001,2694.0318
gfx936,int8_w8a8_channel,torch.float16,7168,192,5120,160,8,0,0,asm,13001+23001,2929.3831
gfx936,int8_w8a8_channel,torch.float16,8192,192,5120,160,8,0,0,asm,13001+23001,3537.1883
gfx936,int8_w8a8_channel,torch.float16,10240,192,5120,160,8,0,0,asm,13001+23001,4197.0934
gfx936,int8_w8a8_channel,torch.float16,12288,192,5120,160,8,0,0,asm,13001+23001,4879.3646
gfx936,int8_w8a8_channel,torch.float16,16384,192,5120,160,8,0,0,asm,13001+23001,6534.0736
gfx936,int8_w8a8_channel,torch.float16,24576,192,5120,160,8,0,0,asm,13001+23001,9540.3264
gfx936,int8_w8a8_channel,torch.float16,32768,192,5120,160,8,0,0,asm,13001+23001,12666.0375
gfx936,int8_w8a8_channel,torch.float16,1,96,5120,160,8,0,0,asm,10001+20000,42.0897
gfx936,int8_w8a8_channel,torch.float16,2,96,5120,160,8,0,0,asm,10006+20001,51.6561
gfx936,int8_w8a8_channel,torch.float16,4,96,5120,160,8,0,0,asm,10010+20001,71.9255
gfx936,int8_w8a8_channel,torch.float16,6,96,5120,160,8,0,0,asm,10011+20001,89.837
gfx936,int8_w8a8_channel,torch.float16,8,96,5120,160,8,0,0,asm,10013+20001,105.9211
gfx936,int8_w8a8_channel,torch.float16,12,96,5120,160,8,0,0,asm,10006+20001,143.3947
gfx936,int8_w8a8_channel,torch.float16,16,96,5120,160,8,0,0,asm,10006+20001,162.0727
gfx936,int8_w8a8_channel,torch.float16,24,96,5120,160,8,0,0,asm,10006+20001,189.3033
gfx936,int8_w8a8_channel,torch.float16,32,96,5120,160,8,0,0,asm,10007+20001,215.8915
gfx936,int8_w8a8_channel,torch.float16,36,96,5120,160,8,0,0,asm,10006+20001,217.2443
gfx936,int8_w8a8_channel,torch.float16,48,96,5120,160,8,0,0,asm,10006+20001,230.3644
gfx936,int8_w8a8_channel,torch.float16,56,96,5120,160,8,0,0,asm,10008+20001,241.438
gfx936,int8_w8a8_channel,torch.float16,64,96,5120,160,8,0,0,asm,10008+20001,246.0443
gfx936,int8_w8a8_channel,torch.float16,72,96,5120,160,8,0,0,asm,10007+20001,248.8653
gfx936,int8_w8a8_channel,torch.float16,80,96,5120,160,8,0,0,asm,10007+20001,252.1325
gfx936,int8_w8a8_channel,torch.float16,88,96,5120,160,8,0,0,asm,10007+20001,253.3452
gfx936,int8_w8a8_channel,torch.float16,96,96,5120,160,8,0,0,asm,10007+20001,254.6589
gfx936,int8_w8a8_channel,torch.float16,100,96,5120,160,8,0,0,asm,10007+20001,258.5915
gfx936,int8_w8a8_channel,torch.float16,112,96,5120,160,8,0,0,asm,10010+20001,261.1095
gfx936,int8_w8a8_channel,torch.float16,128,96,5120,160,8,0,0,asm,10008+20001,265.8504
gfx936,int8_w8a8_channel,torch.float16,144,96,5120,160,8,0,0,asm,10006+20001,273.5389
gfx936,int8_w8a8_channel,torch.float16,160,96,5120,160,8,0,0,asm,10006+20001,276.6042
gfx936,int8_w8a8_channel,torch.float16,192,96,5120,160,8,0,0,asm,10006+20001,282.76
gfx936,int8_w8a8_channel,torch.float16,224,96,5120,160,8,0,0,asm,10006+20001,293.7663
gfx936,int8_w8a8_channel,torch.float16,256,96,5120,160,8,0,0,asm,10013+20001,302.4736
gfx936,int8_w8a8_channel,torch.float16,320,96,5120,160,8,0,0,asm,11004+21001,321.4126
gfx936,int8_w8a8_channel,torch.float16,384,96,5120,160,8,0,0,asm,11007+21001,337.4463
gfx936,int8_w8a8_channel,torch.float16,448,96,5120,160,8,0,0,asm,11007+21001,347.8715
gfx936,int8_w8a8_channel,torch.float16,512,96,5120,160,8,0,0,asm,11005+21001,372.8314
gfx936,int8_w8a8_channel,torch.float16,640,96,5120,160,8,0,0,asm,11005+21001,421.7914
gfx936,int8_w8a8_channel,torch.float16,768,96,5120,160,8,0,0,asm,12004+22001,469.1428
gfx936,int8_w8a8_channel,torch.float16,896,96,5120,160,8,0,0,asm,12005+22001,493.4038
gfx936,int8_w8a8_channel,torch.float16,1024,96,5120,160,8,0,0,asm,12005+22001,519.3238
gfx936,int8_w8a8_channel,torch.float16,1280,96,5120,160,8,0,0,asm,12005+22001,622.8689
gfx936,int8_w8a8_channel,torch.float16,1536,96,5120,160,8,0,0,asm,12001+22001,744.5023
gfx936,int8_w8a8_channel,torch.float16,2048,96,5120,160,8,0,0,asm,13001+23001,832.9569
gfx936,int8_w8a8_channel,torch.float16,2304,96,5120,160,8,0,0,asm,13001+23001,898.0432
gfx936,int8_w8a8_channel,torch.float16,2560,96,5120,160,8,0,0,asm,12001+22001,1039.8702
gfx936,int8_w8a8_channel,torch.float16,3072,96,5120,160,8,0,0,asm,12005+22001,1214.0004
gfx936,int8_w8a8_channel,torch.float16,3584,96,5120,160,8,0,0,asm,12005+22001,1325.1582
gfx936,int8_w8a8_channel,torch.float16,4096,96,5120,160,8,0,0,asm,13001+23001,1482.2526
gfx936,int8_w8a8_channel,torch.float16,5120,96,5120,160,8,0,0,asm,13001+23001,1854.3025
gfx936,int8_w8a8_channel,torch.float16,6144,96,5120,160,8,0,0,asm,13001+23001,2196.5587
gfx936,int8_w8a8_channel,torch.float16,7168,96,5120,160,8,0,0,asm,13001+23001,2383.1689
gfx936,int8_w8a8_channel,torch.float16,8192,96,5120,160,8,0,0,asm,13001+23001,2855.7492
gfx936,int8_w8a8_channel,torch.float16,10240,96,5120,160,8,0,0,asm,13001+23001,3437.3146
gfx936,int8_w8a8_channel,torch.float16,12288,96,5120,160,8,0,0,asm,13001+23001,3987.7221
gfx936,int8_w8a8_channel,torch.float16,16384,96,5120,160,8,0,0,asm,13001+23001,5349.7577
gfx936,int8_w8a8_channel,torch.float16,24576,96,5120,160,8,0,0,asm,13001+23001,7825.0634
gfx936,int8_w8a8_channel,torch.float16,32768,96,5120,160,8,0,0,asm,13001+23001,10289.2112
gfx936,int8_w8a8_channel,torch.float16,1,192,4096,128,8,0,0,asm,10001+20000,49.4919
gfx936,int8_w8a8_channel,torch.float16,2,192,4096,128,8,0,0,asm,10003+20000,66.0476
gfx936,int8_w8a8_channel,torch.float16,4,192,4096,128,8,0,0,asm,10001+20000,94.2496
gfx936,int8_w8a8_channel,torch.float16,6,192,4096,128,8,0,0,asm,10004+20001,120.3632
gfx936,int8_w8a8_channel,torch.float16,8,192,4096,128,8,0,0,asm,10001+20000,143.3105
gfx936,int8_w8a8_channel,torch.float16,12,192,4096,128,8,0,0,asm,10001+20000,180.2621
gfx936,int8_w8a8_channel,torch.float16,16,192,4096,128,8,0,0,asm,10004+20000,208.0346
gfx936,int8_w8a8_channel,torch.float16,24,192,4096,128,8,0,0,asm,10001+20000,239.1557
gfx936,int8_w8a8_channel,torch.float16,32,192,4096,128,8,0,0,asm,10001+20001,259.3861
gfx936,int8_w8a8_channel,torch.float16,36,192,4096,128,8,0,0,asm,10001+20000,264.5032
gfx936,int8_w8a8_channel,torch.float16,48,192,4096,128,8,0,0,asm,10001+20001,291.3578
gfx936,int8_w8a8_channel,torch.float16,56,192,4096,128,8,0,0,asm,10001+20000,291.1558
gfx936,int8_w8a8_channel,torch.float16,64,192,4096,128,8,0,0,asm,10001+20000,306.3335
gfx936,int8_w8a8_channel,torch.float16,72,192,4096,128,8,0,0,asm,10001+20000,297.4295
gfx936,int8_w8a8_channel,torch.float16,80,192,4096,128,8,0,0,asm,10001+20000,300.5621
gfx936,int8_w8a8_channel,torch.float16,88,192,4096,128,8,0,0,asm,10001+20000,303.5936
gfx936,int8_w8a8_channel,torch.float16,96,192,4096,128,8,0,0,asm,10001+20000,305.0337
gfx936,int8_w8a8_channel,torch.float16,100,192,4096,128,8,0,0,asm,10001+20000,306.1537
gfx936,int8_w8a8_channel,torch.float16,112,192,4096,128,8,0,0,asm,10001+20000,308.8231
gfx936,int8_w8a8_channel,torch.float16,128,192,4096,128,8,0,0,asm,10001+20001,313.1853
gfx936,int8_w8a8_channel,torch.float16,144,192,4096,128,8,0,0,asm,10001+20001,319.6357
gfx936,int8_w8a8_channel,torch.float16,160,192,4096,128,8,0,0,asm,10001+20001,324.4863
gfx936,int8_w8a8_channel,torch.float16,192,192,4096,128,8,0,0,asm,10006+20001,338.3978
gfx936,int8_w8a8_channel,torch.float16,224,192,4096,128,8,0,0,asm,10007+20001,351.7957
gfx936,int8_w8a8_channel,torch.float16,256,192,4096,128,8,0,0,asm,10007+20001,364.2756
gfx936,int8_w8a8_channel,torch.float16,320,192,4096,128,8,0,0,asm,11000+21001,388.1662
gfx936,int8_w8a8_channel,torch.float16,384,192,4096,128,8,0,0,asm,11000+21001,406.0188
gfx936,int8_w8a8_channel,torch.float16,448,192,4096,128,8,0,0,asm,11006+21001,425.2861
gfx936,int8_w8a8_channel,torch.float16,512,192,4096,128,8,0,0,asm,11006+21001,446.7596
gfx936,int8_w8a8_channel,torch.float16,640,192,4096,128,8,0,0,asm,11004+21001,495.1384
gfx936,int8_w8a8_channel,torch.float16,768,192,4096,128,8,0,0,asm,12004+22001,529.7151
gfx936,int8_w8a8_channel,torch.float16,896,192,4096,128,8,0,0,asm,12004+22001,549.2014
gfx936,int8_w8a8_channel,torch.float16,1024,192,4096,128,8,0,0,asm,12004+22001,599.2392
gfx936,int8_w8a8_channel,torch.float16,1280,192,4096,128,8,0,0,asm,12001+22001,711.3232
gfx936,int8_w8a8_channel,torch.float16,1536,192,4096,128,8,0,0,asm,12001+22001,757.8579
gfx936,int8_w8a8_channel,torch.float16,2048,192,4096,128,8,0,0,asm,12001+22001,912.6535
gfx936,int8_w8a8_channel,torch.float16,2304,192,4096,128,8,0,0,asm,12001+22001,1026.4976
gfx936,int8_w8a8_channel,torch.float16,2560,192,4096,128,8,0,0,asm,12001+22001,1080.5522
gfx936,int8_w8a8_channel,torch.float16,3072,192,4096,128,8,0,0,asm,13001+23001,1229.0909
gfx936,int8_w8a8_channel,torch.float16,3584,192,4096,128,8,0,0,asm,13001+23001,1326.9518
gfx936,int8_w8a8_channel,torch.float16,4096,192,4096,128,8,0,0,asm,13001+23001,1519.4988
gfx936,int8_w8a8_channel,torch.float16,5120,192,4096,128,8,0,0,asm,13001+23001,1839.1447
gfx936,int8_w8a8_channel,torch.float16,6144,192,4096,128,8,0,0,asm,13001+23001,2176.0198
gfx936,int8_w8a8_channel,torch.float16,7168,192,4096,128,8,0,0,asm,13001+23001,2477.9225
gfx936,int8_w8a8_channel,torch.float16,8192,192,4096,128,8,0,0,asm,13001+23001,2777.7368
gfx936,int8_w8a8_channel,torch.float16,10240,192,4096,128,8,0,0,asm,13001+23001,3406.7548
gfx936,int8_w8a8_channel,torch.float16,12288,192,4096,128,8,0,0,asm,13001+23001,4037.6253
gfx936,int8_w8a8_channel,torch.float16,16384,192,4096,128,8,0,0,asm,13001+23001,5310.6843
gfx936,int8_w8a8_channel,torch.float16,24576,192,4096,128,8,0,0,asm,13001+23001,7871.7663
gfx936,int8_w8a8_channel,torch.float16,32768,192,4096,128,8,0,0,asm,13001+23001,10420.6629
gfx936,int8_w8a8_channel,torch.float16,1,96,4096,128,8,0,0,asm,10000+20001,39.8919
gfx936,int8_w8a8_channel,torch.float16,2,96,4096,128,8,0,0,asm,10000+20001,51.8832
gfx936,int8_w8a8_channel,torch.float16,4,96,4096,128,8,0,0,asm,10001+20001,68.3214
gfx936,int8_w8a8_channel,torch.float16,6,96,4096,128,8,0,0,asm,10004+20001,83.2014
gfx936,int8_w8a8_channel,torch.float16,8,96,4096,128,8,0,0,asm,10001+20001,94.8645
gfx936,int8_w8a8_channel,torch.float16,12,96,4096,128,8,0,0,asm,10001+20001,118.1485
gfx936,int8_w8a8_channel,torch.float16,16,96,4096,128,8,0,0,asm,10001+20001,135.2013
gfx936,int8_w8a8_channel,torch.float16,24,96,4096,128,8,0,0,asm,10001+20001,151.198
gfx936,int8_w8a8_channel,torch.float16,32,96,4096,128,8,0,0,asm,10001+20001,163.2264
gfx936,int8_w8a8_channel,torch.float16,36,96,4096,128,8,0,0,asm,10001+20001,160.5708
gfx936,int8_w8a8_channel,torch.float16,48,96,4096,128,8,0,0,asm,10001+20001,177.8002
gfx936,int8_w8a8_channel,torch.float16,56,96,4096,128,8,0,0,asm,10001+20001,178.8275
gfx936,int8_w8a8_channel,torch.float16,64,96,4096,128,8,0,0,asm,10001+20001,193.2052
gfx936,int8_w8a8_channel,torch.float16,72,96,4096,128,8,0,0,asm,10001+20001,184.4949
gfx936,int8_w8a8_channel,torch.float16,80,96,4096,128,8,0,0,asm,10001+20001,183.1728
gfx936,int8_w8a8_channel,torch.float16,88,96,4096,128,8,0,0,asm,10001+20001,186.7517
gfx936,int8_w8a8_channel,torch.float16,96,96,4096,128,8,0,0,asm,10001+20001,190.8023
gfx936,int8_w8a8_channel,torch.float16,100,96,4096,128,8,0,0,asm,10001+20001,188.0907
gfx936,int8_w8a8_channel,torch.float16,112,96,4096,128,8,0,0,asm,10001+20001,191.3074
gfx936,int8_w8a8_channel,torch.float16,128,96,4096,128,8,0,0,asm,10001+20001,197.4464
gfx936,int8_w8a8_channel,torch.float16,144,96,4096,128,8,0,0,asm,10001+20001,198.1539
gfx936,int8_w8a8_channel,torch.float16,160,96,4096,128,8,0,0,asm,10001+20001,203.0464
gfx936,int8_w8a8_channel,torch.float16,192,96,4096,128,8,0,0,asm,10004+20001,212.4527
gfx936,int8_w8a8_channel,torch.float16,224,96,4096,128,8,0,0,asm,10006+20001,227.6695
gfx936,int8_w8a8_channel,torch.float16,256,96,4096,128,8,0,0,asm,10006+20001,235.0968
gfx936,int8_w8a8_channel,torch.float16,320,96,4096,128,8,0,0,asm,11000+21001,257.539
gfx936,int8_w8a8_channel,torch.float16,384,96,4096,128,8,0,0,asm,11000+21001,269.9684
gfx936,int8_w8a8_channel,torch.float16,448,96,4096,128,8,0,0,asm,11004+21001,284.2084
gfx936,int8_w8a8_channel,torch.float16,512,96,4096,128,8,0,0,asm,11004+21001,309.8589
gfx936,int8_w8a8_channel,torch.float16,640,96,4096,128,8,0,0,asm,12004+22001,353.4631
gfx936,int8_w8a8_channel,torch.float16,768,96,4096,128,8,0,0,asm,12004+22001,373.0925
gfx936,int8_w8a8_channel,torch.float16,896,96,4096,128,8,0,0,asm,12000+22001,399.3156
gfx936,int8_w8a8_channel,torch.float16,1024,96,4096,128,8,0,0,asm,12000+22001,445.0587
gfx936,int8_w8a8_channel,torch.float16,1280,96,4096,128,8,0,0,asm,11005+21001,529.2775
gfx936,int8_w8a8_channel,torch.float16,1536,96,4096,128,8,0,0,asm,12005+22001,581.3195
gfx936,int8_w8a8_channel,torch.float16,2048,96,4096,128,8,0,0,asm,12005+22001,703.7529
gfx936,int8_w8a8_channel,torch.float16,2304,96,4096,128,8,0,0,asm,12005+22001,797.5802
gfx936,int8_w8a8_channel,torch.float16,2560,96,4096,128,8,0,0,asm,12005+22001,838.2538
gfx936,int8_w8a8_channel,torch.float16,3072,96,4096,128,8,0,0,asm,12001+22001,962.8515
gfx936,int8_w8a8_channel,torch.float16,3584,96,4096,128,8,0,0,asm,13001+23000,1089.4702
gfx936,int8_w8a8_channel,torch.float16,4096,96,4096,128,8,0,0,asm,13001+23001,1229.4868
gfx936,int8_w8a8_channel,torch.float16,5120,96,4096,128,8,0,0,asm,13001+23001,1491.0864
gfx936,int8_w8a8_channel,torch.float16,6144,96,4096,128,8,0,0,asm,13001+23001,1771.3386
gfx936,int8_w8a8_channel,torch.float16,7168,96,4096,128,8,0,0,asm,13001+23001,1998.9508
gfx936,int8_w8a8_channel,torch.float16,8192,96,4096,128,8,0,0,asm,13001+23001,2247.9693
gfx936,int8_w8a8_channel,torch.float16,10240,96,4096,128,8,0,0,asm,13001+23001,2772.4906
gfx936,int8_w8a8_channel,torch.float16,12288,96,4096,128,8,0,0,asm,13001+23001,3282.9993
gfx936,int8_w8a8_channel,torch.float16,16384,96,4096,128,8,0,0,asm,13001+23001,4321.1449
gfx936,int8_w8a8_channel,torch.float16,24576,96,4096,128,8,0,0,asm,13001+23001,6393.1752
gfx936,int8_w8a8_channel,torch.float16,32768,96,4096,128,8,0,0,asm,13001+23001,8450.1147
gfx936,int8_w8a8_channel,torch.float16,1,256,3072,256,8,0,0,asm,10002+20000,48.5319
gfx936,int8_w8a8_channel,torch.float16,2,256,3072,256,8,0,0,asm,10009+20000,64.8519
gfx936,int8_w8a8_channel,torch.float16,4,256,3072,256,8,0,0,asm,10006+20000,97.4833
gfx936,int8_w8a8_channel,torch.float16,6,256,3072,256,8,0,0,asm,10009+20000,123.5382
gfx936,int8_w8a8_channel,torch.float16,8,256,3072,256,8,0,0,asm,10007+20000,148.1611
gfx936,int8_w8a8_channel,torch.float16,12,256,3072,256,8,0,0,asm,10007+20001,195.8077
gfx936,int8_w8a8_channel,torch.float16,16,256,3072,256,8,0,0,asm,10007+20000,230.0055
gfx936,int8_w8a8_channel,torch.float16,24,256,3072,256,8,0,0,asm,10007+20001,293.6989
gfx936,int8_w8a8_channel,torch.float16,32,256,3072,256,8,0,0,asm,10007+20001,360.8176
gfx936,int8_w8a8_channel,torch.float16,36,256,3072,256,8,0,0,asm,10007+20001,368.5452
gfx936,int8_w8a8_channel,torch.float16,48,256,3072,256,8,0,0,asm,10007+20000,410.6672
gfx936,int8_w8a8_channel,torch.float16,56,256,3072,256,8,0,0,asm,10007+20001,434.7514
gfx936,int8_w8a8_channel,torch.float16,64,256,3072,256,8,0,0,asm,10006+20000,449.4966
gfx936,int8_w8a8_channel,torch.float16,72,256,3072,256,8,0,0,asm,10007+20001,465.8249
gfx936,int8_w8a8_channel,torch.float16,80,256,3072,256,8,0,0,asm,10007+20001,480.9155
gfx936,int8_w8a8_channel,torch.float16,88,256,3072,256,8,0,0,asm,10006+20001,495.1807
gfx936,int8_w8a8_channel,torch.float16,96,256,3072,256,8,0,0,asm,10007+20001,504.3090
gfx936,int8_w8a8_channel,torch.float16,100,256,3072,256,8,0,0,asm,10006+20001,503.5680
gfx936,int8_w8a8_channel,torch.float16,112,256,3072,256,8,0,0,asm,10007+20001,513.446
gfx936,int8_w8a8_channel,torch.float16,128,256,3072,256,8,0,0,asm,10006+20001,526.3723
gfx936,int8_w8a8_channel,torch.float16,144,256,3072,256,8,0,0,asm,10006+20001,532.8817
gfx936,int8_w8a8_channel,torch.float16,160,256,3072,256,8,0,0,asm,10007+20001,539.686
gfx936,int8_w8a8_channel,torch.float16,192,256,3072,256,8,0,0,asm,10006+20001,547.0795
gfx936,int8_w8a8_channel,torch.float16,224,256,3072,256,8,0,0,asm,10006+20001,557.4037
gfx936,int8_w8a8_channel,torch.float16,256,256,3072,256,8,0,0,asm,10006+20001,565.4795
gfx936,int8_w8a8_channel,torch.float16,320,256,3072,256,8,0,0,asm,10006+20001,582.7006
gfx936,int8_w8a8_channel,torch.float16,384,256,3072,256,8,0,0,asm,11006+21001,602.8521
gfx936,int8_w8a8_channel,torch.float16,448,256,3072,256,8,0,0,asm,11006+21001,615.5257
gfx936,int8_w8a8_channel,torch.float16,512,256,3072,256,8,0,0,asm,11006+21001,632.2499
gfx936,int8_w8a8_channel,torch.float16,640,256,3072,256,8,0,0,asm,11006+21001,656.0731
gfx936,int8_w8a8_channel,torch.float16,768,256,3072,256,8,0,0,asm,11006+21001,683.6183
gfx936,int8_w8a8_channel,torch.float16,896,256,3072,256,8,0,0,asm,11007+21001,723.3656
gfx936,int8_w8a8_channel,torch.float16,1024,256,3072,256,8,0,0,asm,11007+21001,757.1508
gfx936,int8_w8a8_channel,torch.float16,1280,256,3072,256,8,0,0,asm,12004+22001,816.3592
gfx936,int8_w8a8_channel,torch.float16,1536,256,3072,256,8,0,0,asm,12004+22001,862.9191
gfx936,int8_w8a8_channel,torch.float16,2048,256,3072,256,8,0,0,asm,12005+22001,1002.9019
gfx936,int8_w8a8_channel,torch.float16,2304,256,3072,256,8,0,0,asm,12005+22001,1086.3881
gfx936,int8_w8a8_channel,torch.float16,2560,256,3072,256,8,0,0,asm,13000+23001,1128.3502
gfx936,int8_w8a8_channel,torch.float16,3072,256,3072,256,8,0,0,asm,13000+23001,1204.3164
gfx936,int8_w8a8_channel,torch.float16,3584,256,3072,256,8,0,0,asm,13000+23001,1307.5498
gfx936,int8_w8a8_channel,torch.float16,4096,256,3072,256,8,0,0,asm,13001+23001,1488.3075
gfx936,int8_w8a8_channel,torch.float16,5120,256,3072,256,8,0,0,asm,12001+22001,1775.8017
gfx936,int8_w8a8_channel,torch.float16,6144,256,3072,256,8,0,0,asm,13001+23001,1976.7277
gfx936,int8_w8a8_channel,torch.float16,7168,256,3072,256,8,0,0,asm,13001+23001,2122.9169
gfx936,int8_w8a8_channel,torch.float16,8192,256,3072,256,8,0,0,asm,13001+23001,2456.4827
gfx936,int8_w8a8_channel,torch.float16,10240,256,3072,256,8,0,0,asm,13001+23001,2976.8103
gfx936,int8_w8a8_channel,torch.float16,12288,256,3072,256,8,0,0,asm,13001+23001,3479.6053
gfx936,int8_w8a8_channel,torch.float16,16384,256,3072,256,8,0,0,asm,13001+23001,4491.6122
gfx936,int8_w8a8_channel,torch.float16,24576,256,3072,256,8,0,0,asm,13001+23001,6587.6761
gfx936,int8_w8a8_channel,torch.float16,32768,256,3072,256,8,0,0,asm,13001+23001,8660.7336
gfx936,int8_w8a8_channel,torch.float16,1,128,3072,256,8,0,0,asm,10000+20000,44.8266
gfx936,int8_w8a8_channel,torch.float16,2,128,3072,256,8,0,0,asm,10002+20100,54.0391
gfx936,int8_w8a8_channel,torch.float16,4,128,3072,256,8,0,0,asm,10002+20101,69.913
gfx936,int8_w8a8_channel,torch.float16,6,128,3072,256,8,0,0,asm,10006+20102,85.8454
gfx936,int8_w8a8_channel,torch.float16,8,128,3072,256,8,0,0,asm,10009+20102,100.2034
gfx936,int8_w8a8_channel,torch.float16,12,128,3072,256,8,0,0,asm,10006+20001,127.706
gfx936,int8_w8a8_channel,torch.float16,16,128,3072,256,8,0,0,asm,10007+20001,146.0643
gfx936,int8_w8a8_channel,torch.float16,24,128,3072,256,8,0,0,asm,10007+20001,178.3224
gfx936,int8_w8a8_channel,torch.float16,32,128,3072,256,8,0,0,asm,10006+20001,222.8306
gfx936,int8_w8a8_channel,torch.float16,36,128,3072,256,8,0,0,asm,10007+20001,218.6591
gfx936,int8_w8a8_channel,torch.float16,48,128,3072,256,8,0,0,asm,10007+20001,238.2969
gfx936,int8_w8a8_channel,torch.float16,56,128,3072,256,8,0,0,asm,10007+20001,252.3937
gfx936,int8_w8a8_channel,torch.float16,64,128,3072,256,8,0,0,asm,10007+20001,262.6758
gfx936,int8_w8a8_channel,torch.float16,72,128,3072,256,8,0,0,asm,10007+20001,271.4337
gfx936,int8_w8a8_channel,torch.float16,80,128,3072,256,8,0,0,asm,10007+20001,281.4379
gfx936,int8_w8a8_channel,torch.float16,88,128,3072,256,8,0,0,asm,10007+20001,285.7495
gfx936,int8_w8a8_channel,torch.float16,96,128,3072,256,8,0,0,asm,10006+20001,290.5159
gfx936,int8_w8a8_channel,torch.float16,100,128,3072,256,8,0,0,asm,10007+20001,290.2801
gfx936,int8_w8a8_channel,torch.float16,112,128,3072,256,8,0,0,asm,10006+20001,297.9432
gfx936,int8_w8a8_channel,torch.float16,128,128,3072,256,8,0,0,asm,10006+20001,303.0295
gfx936,int8_w8a8_channel,torch.float16,144,128,3072,256,8,0,0,asm,10007+20001,308.2674
gfx936,int8_w8a8_channel,torch.float16,160,128,3072,256,8,0,0,asm,10006+20001,312.2084
gfx936,int8_w8a8_channel,torch.float16,192,128,3072,256,8,0,0,asm,10007+20001,314.9031
gfx936,int8_w8a8_channel,torch.float16,224,128,3072,256,8,0,0,asm,10006+20001,321.6316
gfx936,int8_w8a8_channel,torch.float16,256,128,3072,256,8,0,0,asm,10006+20001,325.6231
gfx936,int8_w8a8_channel,torch.float16,320,128,3072,256,8,0,0,asm,10006+20001,337.0926
gfx936,int8_w8a8_channel,torch.float16,384,128,3072,256,8,0,0,asm,10006+20001,349.8673
gfx936,int8_w8a8_channel,torch.float16,448,128,3072,256,8,0,0,asm,11006+21001,364.8736
gfx936,int8_w8a8_channel,torch.float16,512,128,3072,256,8,0,0,asm,11006+21001,377.1262
gfx936,int8_w8a8_channel,torch.float16,640,128,3072,256,8,0,0,asm,11002+21001,394.7514
gfx936,int8_w8a8_channel,torch.float16,768,128,3072,256,8,0,0,asm,11006+21001,415.0208
gfx936,int8_w8a8_channel,torch.float16,896,128,3072,256,8,0,0,asm,11006+21001,438.9619
gfx936,int8_w8a8_channel,torch.float16,1024,128,3072,256,8,0,0,asm,11007+21001,469.1261
gfx936,int8_w8a8_channel,torch.float16,1280,128,3072,256,8,0,0,asm,12004+21102,498.0102
gfx936,int8_w8a8_channel,torch.float16,1536,128,3072,256,8,0,0,asm,12004+22001,547.5512
gfx936,int8_w8a8_channel,torch.float16,2048,128,3072,256,8,0,0,asm,12005+22001,654.5574
gfx936,int8_w8a8_channel,torch.float16,2304,128,3072,256,8,0,0,asm,12005+21102,716.8814
gfx936,int8_w8a8_channel,torch.float16,2560,128,3072,256,8,0,0,asm,12005+21102,751.2982
gfx936,int8_w8a8_channel,torch.float16,3072,128,3072,256,8,0,0,asm,12005+21102,821.4792
gfx936,int8_w8a8_channel,torch.float16,3584,128,3072,256,8,0,0,asm,12005+22001,902.3379
gfx936,int8_w8a8_channel,torch.float16,4096,128,3072,256,8,0,0,asm,12005+22001,1016.4852
gfx936,int8_w8a8_channel,torch.float16,5120,128,3072,256,8,0,0,asm,12005+22001,1233.2848
gfx936,int8_w8a8_channel,torch.float16,6144,128,3072,256,8,0,0,asm,13001+23001,1410.4297
gfx936,int8_w8a8_channel,torch.float16,7168,128,3072,256,8,0,0,asm,13001+23001,1532.0043
gfx936,int8_w8a8_channel,torch.float16,8192,128,3072,256,8,0,0,asm,13001+23001,1765.966
gfx936,int8_w8a8_channel,torch.float16,10240,128,3072,256,8,0,0,asm,13001+23001,2124.0959
gfx936,int8_w8a8_channel,torch.float16,12288,128,3072,256,8,0,0,asm,13001+23001,2490.6301
gfx936,int8_w8a8_channel,torch.float16,16384,128,3072,256,8,0,0,asm,13001+21102,3151.1006
gfx936,int8_w8a8_channel,torch.float16,24576,128,3072,256,8,0,0,asm,13001+23001,4696.4204
gfx936,int8_w8a8_channel,torch.float16,32768,128,3072,256,8,0,0,asm,13001+23001,6188.8897
arch,quant_type,indtype,token,inter_dim,model_dim,expert,topk,q_size_n,q_size_k,sol_type,sol_id,time_us
gfx936,int8_w8a8_block,torch.float16,1,128,7168,256,8,0,0,asm,10008+20000,63.7404
gfx936,int8_w8a8_block,torch.float16,2,128,7168,256,8,0,0,asm,10007+20101,79.8125
gfx936,int8_w8a8_block,torch.float16,3,128,7168,256,8,0,0,asm,10002+20101,98.4464
gfx936,int8_w8a8_block,torch.float16,4,128,7168,256,8,0,0,asm,10003+20101,116.8833
gfx936,int8_w8a8_block,torch.float16,5,128,7168,256,8,0,0,asm,10006+20101,136.7469
gfx936,int8_w8a8_block,torch.float16,6,128,7168,256,8,0,0,asm,10006+20101,163.1216
gfx936,int8_w8a8_block,torch.float16,7,128,7168,256,8,0,0,asm,10006+20101,181.9707
gfx936,int8_w8a8_block,torch.float16,8,128,7168,256,8,0,0,asm,10005+20101,195.1672
gfx936,int8_w8a8_block,torch.float16,9,128,7168,256,8,0,0,asm,10005+20101,209.4906
gfx936,int8_w8a8_block,torch.float16,10,128,7168,256,8,0,0,asm,10003+20101,225.9173
gfx936,int8_w8a8_block,torch.float16,11,128,7168,256,8,0,0,asm,10003+20101,242.8814
gfx936,int8_w8a8_block,torch.float16,12,128,7168,256,8,0,0,asm,10003+20101,255.8416
gfx936,int8_w8a8_block,torch.float16,13,128,7168,256,8,0,0,asm,10007+20101,278.0101
gfx936,int8_w8a8_block,torch.float16,14,128,7168,256,8,0,0,asm,10007+20101,289.544
gfx936,int8_w8a8_block,torch.float16,15,128,7168,256,8,0,0,asm,10007+20101,299.8415
gfx936,int8_w8a8_block,torch.float16,16,128,7168,256,8,0,0,asm,10007+20101,307.062
gfx936,int8_w8a8_block,torch.float16,17,128,7168,256,8,0,0,asm,10007+20101,313.7174
gfx936,int8_w8a8_block,torch.float16,18,128,7168,256,8,0,0,asm,10003+20101,323.5229
gfx936,int8_w8a8_block,torch.float16,20,128,7168,256,8,0,0,asm,10003+20101,349.3318
gfx936,int8_w8a8_block,torch.float16,24,128,7168,256,8,0,0,asm,10003+20000,404.6977
gfx936,int8_w8a8_block,torch.float16,28,128,7168,256,8,0,0,asm,10003+20000,446.2247
gfx936,int8_w8a8_block,torch.float16,32,128,7168,256,8,0,0,asm,10007+20000,493.6303
gfx936,int8_w8a8_block,torch.float16,34,128,7168,256,8,0,0,asm,10003+20000,489.455
gfx936,int8_w8a8_block,torch.float16,36,128,7168,256,8,0,0,asm,10003+20000,503.2231
gfx936,int8_w8a8_block,torch.float16,40,128,7168,256,8,0,0,asm,10003+20000,517.8023
gfx936,int8_w8a8_block,torch.float16,44,128,7168,256,8,0,0,asm,10003+20000,537.7135
gfx936,int8_w8a8_block,torch.float16,48,128,7168,256,8,0,0,asm,10003+20000,554.3905
gfx936,int8_w8a8_block,torch.float16,56,128,7168,256,8,0,0,asm,10003+20000,593.1802
gfx936,int8_w8a8_block,torch.float16,64,128,7168,256,8,0,0,asm,10003+20000,606.4151
gfx936,int8_w8a8_block,torch.float16,68,128,7168,256,8,0,0,asm,10003+20000,612.0233
gfx936,int8_w8a8_block,torch.float16,72,128,7168,256,8,0,0,asm,10003+20000,624.0316
gfx936,int8_w8a8_block,torch.float16,80,128,7168,256,8,0,0,asm,10003+20000,640.1463
gfx936,int8_w8a8_block,torch.float16,88,128,7168,256,8,0,0,asm,10003+20000,659.9413
gfx936,int8_w8a8_block,torch.float16,96,128,7168,256,8,0,0,asm,10003+20000,690.9444
gfx936,int8_w8a8_block,torch.float16,104,128,7168,256,8,0,0,asm,10003+20000,696.5691
gfx936,int8_w8a8_block,torch.float16,112,128,7168,256,8,0,0,asm,10003+20000,704.9834
gfx936,int8_w8a8_block,torch.float16,128,128,7168,256,8,0,0,asm,10003+20000,712.97
gfx936,int8_w8a8_block,torch.float16,144,128,7168,256,8,0,0,asm,10003+20000,722.0132
gfx936,int8_w8a8_block,torch.float16,160,128,7168,256,8,0,0,asm,10003+20000,729.5175
gfx936,int8_w8a8_block,torch.float16,192,128,7168,256,8,0,0,asm,10003+20000,740.1296
gfx936,int8_w8a8_block,torch.float16,224,128,7168,256,8,0,0,asm,10003+20000,752.1505
gfx936,int8_w8a8_block,torch.float16,256,128,7168,256,8,0,0,asm,10003+20000,768.2856
gfx936,int8_w8a8_block,torch.float16,320,128,7168,256,8,0,0,asm,10003+20000,784.1603
gfx936,int8_w8a8_block,torch.float16,384,128,7168,256,8,0,0,asm,10003+20000,830.0833
gfx936,int8_w8a8_block,torch.float16,448,128,7168,256,8,0,0,asm,10003+20101,846.3959
gfx936,int8_w8a8_block,torch.float16,512,128,7168,256,8,0,0,asm,10006+20101,865.5128
gfx936,int8_w8a8_block,torch.float16,576,128,7168,256,8,0,0,asm,10006+20101,898.4684
gfx936,int8_w8a8_block,torch.float16,640,128,7168,256,8,0,0,asm,10006+20101,893.4055
gfx936,int8_w8a8_block,torch.float16,704,128,7168,256,8,0,0,asm,10006+20101,938.4277
gfx936,int8_w8a8_block,torch.float16,768,128,7168,256,8,0,0,asm,10006+20101,953.3184
gfx936,int8_w8a8_block,torch.float16,832,128,7168,256,8,0,0,asm,10006+20101,978.7358
gfx936,int8_w8a8_block,torch.float16,896,128,7168,256,8,0,0,asm,11010+21000,1001.8931
gfx936,int8_w8a8_block,torch.float16,960,128,7168,256,8,0,0,asm,11005+21101,1042.8664
gfx936,int8_w8a8_block,torch.float16,1024,128,7168,256,8,0,0,asm,11010+21101,1034.9833
gfx936,int8_w8a8_block,torch.float16,1152,128,7168,256,8,0,0,asm,11010+21101,1114.3541
gfx936,int8_w8a8_block,torch.float16,1280,128,7168,256,8,0,0,asm,11010+21101,1184.8115
gfx936,int8_w8a8_block,torch.float16,1408,128,7168,256,8,0,0,asm,11010+21101,1225.7346
gfx936,int8_w8a8_block,torch.float16,1536,128,7168,256,8,0,0,asm,11010+21000,1249.6403
gfx936,int8_w8a8_block,torch.float16,1664,128,7168,256,8,0,0,asm,11010+21000,1287.2281
gfx936,int8_w8a8_block,torch.float16,1792,128,7168,256,8,0,0,asm,11010+21000,1338.4978
gfx936,int8_w8a8_block,torch.float16,1920,128,7168,256,8,0,0,asm,11010+21000,1430.4692
gfx936,int8_w8a8_block,torch.float16,2048,128,7168,256,8,0,0,asm,11010+21000,1474.3052
gfx936,int8_w8a8_block,torch.float16,2304,128,7168,256,8,0,0,asm,11010+21000,1650.0345
gfx936,int8_w8a8_block,torch.float16,2560,128,7168,256,8,0,0,asm,11010+21000,1784.6972
gfx936,int8_w8a8_block,torch.float16,2816,128,7168,256,8,0,0,asm,12003+22000,1881.0829
gfx936,int8_w8a8_block,torch.float16,3072,128,7168,256,8,0,0,asm,12003+22000,1954.5763
gfx936,int8_w8a8_block,torch.float16,3328,128,7168,256,8,0,0,asm,12003+22000,2018.8923
gfx936,int8_w8a8_block,torch.float16,3584,128,7168,256,8,0,0,asm,12002+22000,2090.7939
gfx936,int8_w8a8_block,torch.float16,3840,128,7168,256,8,0,0,asm,13001+23000,2233.9531
gfx936,int8_w8a8_block,torch.float16,4096,128,7168,256,8,0,0,asm,12003+22000,2389.9122
gfx936,int8_w8a8_block,torch.float16,4608,128,7168,256,8,0,0,asm,12003+22000,2796.4766
gfx936,int8_w8a8_block,torch.float16,5120,128,7168,256,8,0,0,asm,12003+22000,2925.479
gfx936,int8_w8a8_block,torch.float16,5632,128,7168,256,8,0,0,asm,12003+22000,3117.6873
gfx936,int8_w8a8_block,torch.float16,6144,128,7168,256,8,0,0,asm,13001+23000,3331.6854
gfx936,int8_w8a8_block,torch.float16,6656,128,7168,256,8,0,0,asm,13001+23000,3475.6528
gfx936,int8_w8a8_block,torch.float16,7168,128,7168,256,8,0,0,asm,13001+23000,3553.7657
gfx936,int8_w8a8_block,torch.float16,7680,128,7168,256,8,0,0,asm,13001+23000,3742.4152
gfx936,int8_w8a8_block,torch.float16,8192,128,7168,256,8,0,0,asm,13001+23000,4155.1571
gfx936,int8_w8a8_block,torch.float16,10240,128,7168,256,8,0,0,asm,13001+23000,5095.7734
gfx936,int8_w8a8_block,torch.float16,12288,128,7168,256,8,0,0,asm,13001+23000,5989.5664
gfx936,int8_w8a8_block,torch.float16,14336,128,7168,256,8,0,0,asm,13001+23000,6841.5631
gfx936,int8_w8a8_block,torch.float16,16384,128,7168,256,8,0,0,asm,13001+23000,7769.2863
gfx936,int8_w8a8_block,torch.float16,17408,128,7168,256,8,0,0,asm,13001+23000,8326.1077
gfx936,int8_w8a8_block,torch.float16,24576,128,7168,256,8,0,0,asm,13001+23000,11274.742
gfx936,int8_w8a8_block,torch.float16,32768,128,7168,256,8,0,0,asm,13001+23000,14891.7267
gfx936,int8_w8a8_block,torch.float16,40960,128,7168,256,8,0,0,asm,13001+23101,14976.8469
gfx936,int8_w8a8_block,torch.float16,1,256,7168,256,8,0,0,asm,10007+20000,80.2568
gfx936,int8_w8a8_block,torch.float16,2,256,7168,256,8,0,0,asm,10003+20000,122.6887
gfx936,int8_w8a8_block,torch.float16,3,256,7168,256,8,0,0,asm,10006+20000,172.0341
gfx936,int8_w8a8_block,torch.float16,4,256,7168,256,8,0,0,asm,10003+20000,217.8065
gfx936,int8_w8a8_block,torch.float16,5,256,7168,256,8,0,0,asm,10007+20000,248.4376
gfx936,int8_w8a8_block,torch.float16,6,256,7168,256,8,0,0,asm,10007+20000,282.8901
gfx936,int8_w8a8_block,torch.float16,7,256,7168,256,8,0,0,asm,10003+20000,317.7122
gfx936,int8_w8a8_block,torch.float16,8,256,7168,256,8,0,0,asm,10003+20000,336.703
gfx936,int8_w8a8_block,torch.float16,9,256,7168,256,8,0,0,asm,10007+20000,374.1512
gfx936,int8_w8a8_block,torch.float16,10,256,7168,256,8,0,0,asm,10003+20000,398.1841
gfx936,int8_w8a8_block,torch.float16,11,256,7168,256,8,0,0,asm,10003+20000,418.7215
gfx936,int8_w8a8_block,torch.float16,12,256,7168,256,8,0,0,asm,10003+20000,443.9523
gfx936,int8_w8a8_block,torch.float16,13,256,7168,256,8,0,0,asm,10007+20000,474.1513
gfx936,int8_w8a8_block,torch.float16,14,256,7168,256,8,0,0,asm,10003+20000,506.9882
gfx936,int8_w8a8_block,torch.float16,15,256,7168,256,8,0,0,asm,10003+20000,518.1636
gfx936,int8_w8a8_block,torch.float16,16,256,7168,256,8,0,0,asm,10003+20000,533.6549
gfx936,int8_w8a8_block,torch.float16,17,256,7168,256,8,0,0,asm,10007+20000,555.4758
gfx936,int8_w8a8_block,torch.float16,18,256,7168,256,8,0,0,asm,10007+20000,577.8488
gfx936,int8_w8a8_block,torch.float16,20,256,7168,256,8,0,0,asm,10003+20000,614.095
gfx936,int8_w8a8_block,torch.float16,24,256,7168,256,8,0,0,asm,10003+20000,700.5279
gfx936,int8_w8a8_block,torch.float16,28,256,7168,256,8,0,0,asm,10003+20000,793.3022
gfx936,int8_w8a8_block,torch.float16,32,256,7168,256,8,0,0,asm,10003+20000,863.8623
gfx936,int8_w8a8_block,torch.float16,34,256,7168,256,8,0,0,asm,10003+20000,862.3536
gfx936,int8_w8a8_block,torch.float16,36,256,7168,256,8,0,0,asm,10003+20000,889.8244
gfx936,int8_w8a8_block,torch.float16,40,256,7168,256,8,0,0,asm,10003+20000,942.5301
gfx936,int8_w8a8_block,torch.float16,44,256,7168,256,8,0,0,asm,10003+20000,974.4275
gfx936,int8_w8a8_block,torch.float16,48,256,7168,256,8,0,0,asm,10003+20000,1000.9915
gfx936,int8_w8a8_block,torch.float16,56,256,7168,256,8,0,0,asm,10003+20000,1061.9148
gfx936,int8_w8a8_block,torch.float16,64,256,7168,256,8,0,0,asm,10003+20000,1100.0501
gfx936,int8_w8a8_block,torch.float16,68,256,7168,256,8,0,0,asm,10003+20000,1111.5972
gfx936,int8_w8a8_block,torch.float16,72,256,7168,256,8,0,0,asm,10003+20000,1149.8897
gfx936,int8_w8a8_block,torch.float16,80,256,7168,256,8,0,0,asm,10003+20000,1174.1255
gfx936,int8_w8a8_block,torch.float16,88,256,7168,256,8,0,0,asm,10003+20000,1207.7073
gfx936,int8_w8a8_block,torch.float16,96,256,7168,256,8,0,0,asm,10003+20000,1241.1748
gfx936,int8_w8a8_block,torch.float16,104,256,7168,256,8,0,0,asm,10003+20000,1256.1221
gfx936,int8_w8a8_block,torch.float16,112,256,7168,256,8,0,0,asm,10003+20000,1267.3836
gfx936,int8_w8a8_block,torch.float16,128,256,7168,256,8,0,0,asm,10003+20000,1294.4442
gfx936,int8_w8a8_block,torch.float16,144,256,7168,256,8,0,0,asm,10003+20000,1309.413
gfx936,int8_w8a8_block,torch.float16,160,256,7168,256,8,0,0,asm,10003+20000,1331.2852
gfx936,int8_w8a8_block,torch.float16,192,256,7168,256,8,0,0,asm,10003+20000,1338.8944
gfx936,int8_w8a8_block,torch.float16,224,256,7168,256,8,0,0,asm,10003+20000,1367.4452
gfx936,int8_w8a8_block,torch.float16,256,256,7168,256,8,0,0,asm,10003+20000,1382.0245
gfx936,int8_w8a8_block,torch.float16,320,256,7168,256,8,0,0,asm,10003+20000,1411.4382
gfx936,int8_w8a8_block,torch.float16,384,256,7168,256,8,0,0,asm,10003+20000,1446.7848
gfx936,int8_w8a8_block,torch.float16,448,256,7168,256,8,0,0,asm,10002+20000,1488.5131
gfx936,int8_w8a8_block,torch.float16,512,256,7168,256,8,0,0,asm,10001+20000,1510.4197
gfx936,int8_w8a8_block,torch.float16,576,256,7168,256,8,0,0,asm,10001+20000,1556.0915
gfx936,int8_w8a8_block,torch.float16,640,256,7168,256,8,0,0,asm,10006+20000,1567.0515
gfx936,int8_w8a8_block,torch.float16,704,256,7168,256,8,0,0,asm,10006+20000,1610.1326
gfx936,int8_w8a8_block,torch.float16,768,256,7168,256,8,0,0,asm,10005+20000,1635.4823
gfx936,int8_w8a8_block,torch.float16,832,256,7168,256,8,0,0,asm,10006+20000,1682.6332
gfx936,int8_w8a8_block,torch.float16,896,256,7168,256,8,0,0,asm,11010+21000,1697.1069
gfx936,int8_w8a8_block,torch.float16,960,256,7168,256,8,0,0,asm,11010+21000,1700.2086
gfx936,int8_w8a8_block,torch.float16,1024,256,7168,256,8,0,0,asm,11010+21000,1720.3522
gfx936,int8_w8a8_block,torch.float16,1152,256,7168,256,8,0,0,asm,11010+21000,1778.3173
gfx936,int8_w8a8_block,torch.float16,1280,256,7168,256,8,0,0,asm,11010+21000,1827.6876
gfx936,int8_w8a8_block,torch.float16,1408,256,7168,256,8,0,0,asm,11010+21000,1872.7174
gfx936,int8_w8a8_block,torch.float16,1536,256,7168,256,8,0,0,asm,11010+21000,1895.9745
gfx936,int8_w8a8_block,torch.float16,1664,256,7168,256,8,0,0,asm,12002+22000,2006.5225
gfx936,int8_w8a8_block,torch.float16,1792,256,7168,256,8,0,0,asm,11010+21000,2046.6170
gfx936,int8_w8a8_block,torch.float16,1920,256,7168,256,8,0,0,asm,11010+21000,2121.2345
gfx936,int8_w8a8_block,torch.float16,2048,256,7168,256,8,0,0,asm,11010+21000,2219.9136
gfx936,int8_w8a8_block,torch.float16,2304,256,7168,256,8,0,0,asm,12003+22000,2360.6029
gfx936,int8_w8a8_block,torch.float16,2560,256,7168,256,8,0,0,asm,12003+22000,2489.4727
gfx936,int8_w8a8_block,torch.float16,2816,256,7168,256,8,0,0,asm,12003+22000,2548.1644
gfx936,int8_w8a8_block,torch.float16,3072,256,7168,256,8,0,0,asm,12003+22000,2617.9286
gfx936,int8_w8a8_block,torch.float16,3328,256,7168,256,8,0,0,asm,12002+22000,2725.5706
gfx936,int8_w8a8_block,torch.float16,3584,256,7168,256,8,0,0,asm,12002+22000,2857.6904
gfx936,int8_w8a8_block,torch.float16,3840,256,7168,256,8,0,0,asm,12003+22000,3012.7306
gfx936,int8_w8a8_block,torch.float16,4096,256,7168,256,8,0,0,asm,12003+22000,3240.8408
gfx936,int8_w8a8_block,torch.float16,4608,256,7168,256,8,0,0,asm,12002+22000,3771.4593
gfx936,int8_w8a8_block,torch.float16,5120,256,7168,256,8,0,0,asm,12003+22000,3994.7498
gfx936,int8_w8a8_block,torch.float16,5632,256,7168,256,8,0,0,asm,12003+22000,4164.8792
gfx936,int8_w8a8_block,torch.float16,6144,256,7168,256,8,0,0,asm,12003+22000,4594.9062
gfx936,int8_w8a8_block,torch.float16,6656,256,7168,256,8,0,0,asm,13001+23000,4701.4746
gfx936,int8_w8a8_block,torch.float16,7168,256,7168,256,8,0,0,asm,13001+23000,4834.3727
gfx936,int8_w8a8_block,torch.float16,7680,256,7168,256,8,0,0,asm,13001+23000,5090.3775
gfx936,int8_w8a8_block,torch.float16,8192,256,7168,256,8,0,0,asm,13001+23000,5702.3206
gfx936,int8_w8a8_block,torch.float16,10240,256,7168,256,8,0,0,asm,13001+23000,6923.0831
gfx936,int8_w8a8_block,torch.float16,12288,256,7168,256,8,0,0,asm,13001+23000,7896.9686
gfx936,int8_w8a8_block,torch.float16,14336,256,7168,256,8,0,0,asm,13001+23000,9011.7101
gfx936,int8_w8a8_block,torch.float16,16384,256,7168,256,8,0,0,asm,13001+23000,10138.9121
gfx936,int8_w8a8_block,torch.float16,17408,256,7168,256,8,0,0,asm,13001+23000,10933.3982
gfx936,int8_w8a8_block,torch.float16,24576,256,7168,256,8,0,0,asm,13001+23000,14921.2994
gfx936,int8_w8a8_block,torch.float16,32768,256,7168,256,8,0,0,asm,13001+23000,19669.379
gfx938,f8_w8a8_block,torch.float16,1,640,6144,160,8,0,0,asm,10004+20000,114.4839
gfx938,f8_w8a8_block,torch.float16,2,640,6144,160,8,0,0,asm,10002+20000,182.6896
gfx938,f8_w8a8_block,torch.float16,4,640,6144,160,8,0,0,asm,10002+20000,296.1749
gfx938,f8_w8a8_block,torch.float16,6,640,6144,160,8,0,0,asm,10002+20000,396.2887
gfx938,f8_w8a8_block,torch.float16,8,640,6144,160,8,0,0,asm,10006+20000,443.7173
gfx938,f8_w8a8_block,torch.float16,10,640,6144,160,8,0,0,asm,10006+20000,523.6483
gfx938,f8_w8a8_block,torch.float16,12,640,6144,160,8,0,0,asm,10006+20000,708.6077
gfx938,f8_w8a8_block,torch.float16,14,640,6144,160,8,0,0,asm,10006+20000,709.362
gfx938,f8_w8a8_block,torch.float16,16,640,6144,160,8,0,0,asm,10006+20000,753.3843
gfx938,f8_w8a8_block,torch.float16,20,640,6144,160,8,0,0,asm,10006+20000,846.0213
gfx938,f8_w8a8_block,torch.float16,24,640,6144,160,8,0,0,asm,10006+20000,924.3524
gfx938,f8_w8a8_block,torch.float16,28,640,6144,160,8,0,0,asm,10006+20000,1038.6179
gfx938,f8_w8a8_block,torch.float16,32,640,6144,160,8,0,0,asm,10006+20000,1145.2919
gfx938,f8_w8a8_block,torch.float16,36,640,6144,160,8,0,0,asm,10006+20000,1136.6487
gfx938,f8_w8a8_block,torch.float16,40,640,6144,160,8,0,0,asm,10006+20000,1221.997
gfx938,f8_w8a8_block,torch.float16,44,640,6144,160,8,0,0,asm,10006+20000,1231.3686
gfx938,f8_w8a8_block,torch.float16,48,640,6144,160,8,0,0,asm,10006+20000,1222.317
gfx938,f8_w8a8_block,torch.float16,56,640,6144,160,8,0,0,asm,10006+20000,1245.2197
gfx938,f8_w8a8_block,torch.float16,64,640,6144,160,8,0,0,asm,10006+20000,1321.0139
gfx938,f8_w8a8_block,torch.float16,72,640,6144,160,8,0,0,asm,10006+20000,1333.0137
gfx938,f8_w8a8_block,torch.float16,80,640,6144,160,8,0,0,asm,10006+20000,1342.5223
gfx938,f8_w8a8_block,torch.float16,96,640,6144,160,8,0,0,asm,10006+20000,1349.2423
gfx938,f8_w8a8_block,torch.float16,112,640,6144,160,8,0,0,asm,10006+20000,1356.7167
gfx938,f8_w8a8_block,torch.float16,128,640,6144,160,8,0,0,asm,10006+20000,1364.168
gfx938,f8_w8a8_block,torch.float16,160,640,6144,160,8,0,0,asm,10005+20000,1400.0537
gfx938,f8_w8a8_block,torch.float16,192,640,6144,160,8,0,0,asm,10006+20000,1375.208
gfx938,f8_w8a8_block,torch.float16,224,640,6144,160,8,0,0,asm,10006+20000,1382.2936
gfx938,f8_w8a8_block,torch.float16,256,640,6144,160,8,0,0,asm,11010+21000,1437.9049
gfx938,f8_w8a8_block,torch.float16,320,640,6144,160,8,0,0,asm,11010+21000,1438.979
gfx938,f8_w8a8_block,torch.float16,384,640,6144,160,8,0,0,asm,11010+21000,1464.3047
gfx938,f8_w8a8_block,torch.float16,448,640,6144,160,8,0,0,asm,11010+21000,1474.1106
gfx938,f8_w8a8_block,torch.float16,512,640,6144,160,8,0,0,asm,11010+21000,1570.43
gfx938,f8_w8a8_block,torch.float16,576,640,6144,160,8,0,0,asm,11010+21000,1654.9783
gfx938,f8_w8a8_block,torch.float16,640,640,6144,160,8,0,0,asm,12003+22000,1710.4297
gfx938,f8_w8a8_block,torch.float16,704,640,6144,160,8,0,0,asm,12003+22000,1718.4066
gfx938,f8_w8a8_block,torch.float16,768,640,6144,160,8,0,0,asm,12003+22000,1753.5607
gfx938,f8_w8a8_block,torch.float16,832,640,6144,160,8,0,0,asm,12003+22000,1732.2353
gfx938,f8_w8a8_block,torch.float16,896,640,6144,160,8,0,0,asm,12003+22000,1750.4294
gfx938,f8_w8a8_block,torch.float16,960,640,6144,160,8,0,0,asm,12003+22000,1779.0921
gfx938,f8_w8a8_block,torch.float16,1024,640,6144,160,8,0,0,asm,12003+22000,1807.4806
gfx938,f8_w8a8_block,torch.float16,1152,640,6144,160,8,0,0,asm,12003+22000,2098.5427
gfx938,f8_w8a8_block,torch.float16,1280,640,6144,160,8,0,0,asm,12003+22000,2514.1524
gfx938,f8_w8a8_block,torch.float16,1408,640,6144,160,8,0,0,asm,13001+23000,2827.8653
gfx938,f8_w8a8_block,torch.float16,1536,640,6144,160,8,0,0,asm,13001+23000,2882.8137
gfx938,f8_w8a8_block,torch.float16,1664,640,6144,160,8,0,0,asm,13001+23000,2898.928
gfx938,f8_w8a8_block,torch.float16,1792,640,6144,160,8,0,0,asm,13001+23000,2948.482
gfx938,f8_w8a8_block,torch.float16,1920,640,6144,160,8,0,0,asm,13001+23000,2973.7393
gfx938,f8_w8a8_block,torch.float16,2048,640,6144,160,8,0,0,asm,13001+23000,3015.4761
gfx938,f8_w8a8_block,torch.float16,2304,640,6144,160,8,0,0,asm,13001+23000,3273.1666
gfx938,f8_w8a8_block,torch.float16,2560,640,6144,160,8,0,0,asm,13001+23000,4072.615
gfx938,f8_w8a8_block,torch.float16,2816,640,6144,160,8,0,0,asm,12003+22000,4727.9041
gfx938,f8_w8a8_block,torch.float16,3072,640,6144,160,8,0,0,asm,12003+22000,5005.6631
gfx938,f8_w8a8_block,torch.float16,3328,640,6144,160,8,0,0,asm,12002+22000,5183.2396
gfx938,f8_w8a8_block,torch.float16,3584,640,6144,160,8,0,0,asm,12003+22000,5355.6046
gfx938,f8_w8a8_block,torch.float16,3840,640,6144,160,8,0,0,asm,13001+23000,5496.1756
gfx938,f8_w8a8_block,torch.float16,4096,640,6144,160,8,0,0,asm,13001+23000,5534.8724
gfx938,f8_w8a8_block,torch.float16,4608,640,6144,160,8,0,0,asm,13001+23000,5797.9573
gfx938,f8_w8a8_block,torch.float16,5120,640,6144,160,8,0,0,asm,13001+23000,6765.4964
gfx938,f8_w8a8_block,torch.float16,5632,640,6144,160,8,0,0,asm,13001+23000,7835.6411
gfx938,f8_w8a8_block,torch.float16,6144,640,6144,160,8,0,0,asm,13001+23000,8137.0799
gfx938,f8_w8a8_block,torch.float16,6656,640,6144,160,8,0,0,asm,13001+23000,8280.3481
gfx938,f8_w8a8_block,torch.float16,6144,640,6144,160,8,0,0,asm,13001+23000,8145.354299999999
gfx938,f8_w8a8_block,torch.float16,7680,640,6144,160,8,0,0,asm,13001+23000,9456.8466
gfx938,f8_w8a8_block,torch.float16,8192,640,6144,160,8,0,0,asm,13001+23000,10519.174
gfx938,f8_w8a8_block,torch.float16,10240,640,6144,160,8,0,0,asm,13001+23000,12172.1051
gfx938,f8_w8a8_block,torch.float16,12288,640,6144,160,8,0,0,asm,13001+23000,14116.4186
gfx938,f8_w8a8_block,torch.float16,14336,640,6144,160,8,0,0,asm,13001+23000,16463.9983
gfx938,f8_w8a8_block,torch.float16,16384,640,6144,160,8,0,0,asm,13001+23000,19025.4974
gfx938,f8_w8a8_block,torch.float16,17408,640,6144,160,8,0,0,asm,13001+23000,19739.369
gfx938,f8_w8a8_block,torch.float16,24576,640,6144,160,8,0,0,asm,14001+24000,27498.6319
gfx938,f8_w8a8_block,torch.float16,32768,640,6144,160,8,0,0,asm,13001+23000,36345.2053
gfx938,f8_w8a8_block,torch.float16,40960,640,6144,160,8,0,0,asm,14001+24000,45806.7474
gfx938,f8_w8a8_block,torch.float16,49152,640,6144,160,8,0,0,asm,13001+23000,52580.0251
gfx938,f8_w8a8_block,torch.float16,49152,640,6144,160,8,0,0,asm,13001+23000,52522.882
gfx938,f8_w8a8_block,torch.float16,57344,640,6144,160,8,0,0,asm,13001+23000,61427.7869
gfx938,f8_w8a8_block,torch.float16,65536,640,6144,160,8,0,0,asm,13001+23000,70414.4733
gfx938,int8_w8a8_block,torch.float16,1,128,7168,256,8,0,0,asm,10008+20100,65.3628
gfx938,int8_w8a8_block,torch.float16,2,128,7168,256,8,0,0,asm,10007+20101,75.4754
gfx938,int8_w8a8_block,torch.float16,3,128,7168,256,8,0,0,asm,10002+20101,87.4921
gfx938,int8_w8a8_block,torch.float16,4,128,7168,256,8,0,0,asm,10002+20101,103.5248
gfx938,int8_w8a8_block,torch.float16,5,128,7168,256,8,0,0,asm,10005+20101,132.4518
gfx938,int8_w8a8_block,torch.float16,6,128,7168,256,8,0,0,asm,10006+20101,133.4817
gfx938,int8_w8a8_block,torch.float16,7,128,7168,256,8,0,0,asm,10006+20101,140.1565
gfx938,int8_w8a8_block,torch.float16,8,128,7168,256,8,0,0,asm,10006+20101,147.0241
gfx938,int8_w8a8_block,torch.float16,9,128,7168,256,8,0,0,asm,10005+20101,162.4947
gfx938,int8_w8a8_block,torch.float16,10,128,7168,256,8,0,0,asm,10002+20101,177.8177
gfx938,int8_w8a8_block,torch.float16,11,128,7168,256,8,0,0,asm,10007+20101,212.4555
gfx938,int8_w8a8_block,torch.float16,12,128,7168,256,8,0,0,asm,10007+20101,214.556
gfx938,int8_w8a8_block,torch.float16,13,128,7168,256,8,0,0,asm,10007+20101,219.7253
gfx938,int8_w8a8_block,torch.float16,14,128,7168,256,8,0,0,asm,10002+20101,223.9386
gfx938,int8_w8a8_block,torch.float16,15,128,7168,256,8,0,0,asm,10002+20101,224.7386
gfx938,int8_w8a8_block,torch.float16,16,128,7168,256,8,0,0,asm,10002+20101,228.4719
gfx938,int8_w8a8_block,torch.float16,17,128,7168,256,8,0,0,asm,10002+20101,234.594
gfx938,int8_w8a8_block,torch.float16,18,128,7168,256,8,0,0,asm,11006+21101,243.9848
gfx938,int8_w8a8_block,torch.float16,20,128,7168,256,8,0,0,asm,10006+20101,258.721
gfx938,int8_w8a8_block,torch.float16,24,128,7168,256,8,0,0,asm,10006+20101,278.7332
gfx938,int8_w8a8_block,torch.float16,28,128,7168,256,8,0,0,asm,10002+20101,356.5123
gfx938,int8_w8a8_block,torch.float16,32,128,7168,256,8,0,0,asm,10002+20101,362.3954
gfx938,int8_w8a8_block,torch.float16,34,128,7168,256,8,0,0,asm,10002+20101,350.9258
gfx938,int8_w8a8_block,torch.float16,36,128,7168,256,8,0,0,asm,10001+20101,362.5073
gfx938,int8_w8a8_block,torch.float16,40,128,7168,256,8,0,0,asm,10006+20101,378.4456
gfx938,int8_w8a8_block,torch.float16,44,128,7168,256,8,0,0,asm,10006+20101,382.5933
gfx938,int8_w8a8_block,torch.float16,48,128,7168,256,8,0,0,asm,10006+20101,389.781
gfx938,int8_w8a8_block,torch.float16,56,128,7168,256,8,0,0,asm,10006+20101,405.1448
gfx938,int8_w8a8_block,torch.float16,64,128,7168,256,8,0,0,asm,10001+20101,450.9047
gfx938,int8_w8a8_block,torch.float16,68,128,7168,256,8,0,0,asm,10002+20101,467.5835
gfx938,int8_w8a8_block,torch.float16,72,128,7168,256,8,0,0,asm,10001+20101,487.1343
gfx938,int8_w8a8_block,torch.float16,80,128,7168,256,8,0,0,asm,10002+20101,494.9825
gfx938,int8_w8a8_block,torch.float16,88,128,7168,256,8,0,0,asm,10002+20101,485.7603
gfx938,int8_w8a8_block,torch.float16,96,128,7168,256,8,0,0,asm,10001+20101,489.641
gfx938,int8_w8a8_block,torch.float16,104,128,7168,256,8,0,0,asm,10006+20101,493.7969
gfx938,int8_w8a8_block,torch.float16,112,128,7168,256,8,0,0,asm,10006+20101,498.8307
gfx938,int8_w8a8_block,torch.float16,128,128,7168,256,8,0,0,asm,10006+20101,499.3353
gfx938,int8_w8a8_block,torch.float16,144,128,7168,256,8,0,0,asm,10006+20101,518.006
gfx938,int8_w8a8_block,torch.float16,160,128,7168,256,8,0,0,asm,10006+20101,516.6111
gfx938,int8_w8a8_block,torch.float16,192,128,7168,256,8,0,0,asm,10006+20101,526.847
gfx938,int8_w8a8_block,torch.float16,224,128,7168,256,8,0,0,asm,10006+20101,529.85
gfx938,int8_w8a8_block,torch.float16,256,128,7168,256,8,0,0,asm,10006+20101,536.2951
gfx938,int8_w8a8_block,torch.float16,320,128,7168,256,8,0,0,asm,10006+20101,550.3832
gfx938,int8_w8a8_block,torch.float16,384,128,7168,256,8,0,0,asm,10006+20101,554.535
gfx938,int8_w8a8_block,torch.float16,448,128,7168,256,8,0,0,asm,10006+20101,604.2578
gfx938,int8_w8a8_block,torch.float16,512,128,7168,256,8,0,0,asm,11010+21101,625.9029
gfx938,int8_w8a8_block,torch.float16,576,128,7168,256,8,0,0,asm,11010+21101,643.6505
gfx938,int8_w8a8_block,torch.float16,640,128,7168,256,8,0,0,asm,11010+21101,655.6136
gfx938,int8_w8a8_block,torch.float16,704,128,7168,256,8,0,0,asm,11010+21101,664.6596
gfx938,int8_w8a8_block,torch.float16,768,128,7168,256,8,0,0,asm,11010+21101,669.9929
gfx938,int8_w8a8_block,torch.float16,832,128,7168,256,8,0,0,asm,11010+21101,671.3098
gfx938,int8_w8a8_block,torch.float16,896,128,7168,256,8,0,0,asm,11010+21101,736.6869
gfx938,int8_w8a8_block,torch.float16,960,128,7168,256,8,0,0,asm,11010+21101,750.3509
gfx938,int8_w8a8_block,torch.float16,1024,128,7168,256,8,0,0,asm,11010+21101,828.613
gfx938,int8_w8a8_block,torch.float16,1152,128,7168,256,8,0,0,asm,11010+21101,947.3887
gfx938,int8_w8a8_block,torch.float16,1280,128,7168,256,8,0,0,asm,11010+21101,989.7032
gfx938,int8_w8a8_block,torch.float16,1408,128,7168,256,8,0,0,asm,11010+21101,1027.1273
gfx938,int8_w8a8_block,torch.float16,1536,128,7168,256,8,0,0,asm,12003+22000,1114.4521
gfx938,int8_w8a8_block,torch.float16,1664,128,7168,256,8,0,0,asm,11010+21101,1140.0913
gfx938,int8_w8a8_block,torch.float16,1792,128,7168,256,8,0,0,asm,11010+21101,1184.5465
gfx938,int8_w8a8_block,torch.float16,1920,128,7168,256,8,0,0,asm,11010+21101,1273.1973
gfx938,int8_w8a8_block,torch.float16,2048,128,7168,256,8,0,0,asm,11010+21101,1336.6726
gfx938,int8_w8a8_block,torch.float16,2304,128,7168,256,8,0,0,asm,11010+21101,1539.3524
gfx938,int8_w8a8_block,torch.float16,2560,128,7168,256,8,0,0,asm,11010+21101,1627.5191
gfx938,int8_w8a8_block,torch.float16,2816,128,7168,256,8,0,0,asm,11010+21101,1752.9816
gfx938,int8_w8a8_block,torch.float16,3072,128,7168,256,8,0,0,asm,13001+23000,1901.1188
gfx938,int8_w8a8_block,torch.float16,3328,128,7168,256,8,0,0,asm,13001+23000,1962.5907
gfx938,int8_w8a8_block,torch.float16,3584,128,7168,256,8,0,0,asm,13001+23000,2056.3314
gfx938,int8_w8a8_block,torch.float16,3840,128,7168,256,8,0,0,asm,11010+21101,2270.6892
gfx938,int8_w8a8_block,torch.float16,4096,128,7168,256,8,0,0,asm,11010+21101,2408.8532
gfx938,int8_w8a8_block,torch.float16,4608,128,7168,256,8,0,0,asm,11010+21101,2691.0561
gfx938,int8_w8a8_block,torch.float16,5120,128,7168,256,8,0,0,asm,11010+21101,2965.5062
gfx938,int8_w8a8_block,torch.float16,5632,128,7168,256,8,0,0,asm,11010+21101,3251.9283
gfx938,int8_w8a8_block,torch.float16,6144,128,7168,256,8,0,0,asm,11010+21101,3517.052
gfx938,int8_w8a8_block,torch.float16,6656,128,7168,256,8,0,0,asm,11010+21101,3746.5233
gfx938,int8_w8a8_block,torch.float16,7168,128,7168,256,8,0,0,asm,13001+23000,3851.4442
gfx938,int8_w8a8_block,torch.float16,7680,128,7168,256,8,0,0,asm,13001+23000,4036.2064
gfx938,int8_w8a8_block,torch.float16,8192,128,7168,256,8,0,0,asm,13001+23000,4501.6442
gfx938,int8_w8a8_block,torch.float16,10240,128,7168,256,8,0,0,asm,13001+23000,5499.8329
gfx938,int8_w8a8_block,torch.float16,12288,128,7168,256,8,0,0,asm,13001+23000,6461.2996
gfx938,int8_w8a8_block,torch.float16,14336,128,7168,256,8,0,0,asm,13001+23000,7436.1102
gfx938,int8_w8a8_block,torch.float16,16384,128,7168,256,8,0,0,asm,13001+23000,8314.3413
gfx938,int8_w8a8_block,torch.float16,17408,128,7168,256,8,0,0,asm,13001+23000,9069.6552
gfx938,int8_w8a8_block,torch.float16,24576,128,7168,256,8,0,0,asm,13001+23000,12217.4681
gfx938,int8_w8a8_block,torch.float16,32768,128,7168,256,8,0,0,asm,13001+23000,16002.2442
gfx938,int8_w8a8_block,torch.float16,40960,128,7168,256,8,0,0,asm,13001+23101,15681.4438
gfx938,int8_w8a8_block,torch.float16,49152,128,7168,256,8,0,0,asm,13001+23000,23121.5792
gfx938,int8_w8a8_block,torch.float16,57344,128,7168,256,8,0,0,asm,13001+23000,27056.9822
gfx938,int8_w8a8_block,torch.float16,65536,128,7168,256,8,0,0,asm,13001+23000,30905.7893
gfx938,int8_w8a8_block,torch.float16,1,256,7168,256,8,0,0,asm,10007+20000,77.6185
gfx938,int8_w8a8_block,torch.float16,2,256,7168,256,8,0,0,asm,10002+20000,105.9251
gfx938,int8_w8a8_block,torch.float16,3,256,7168,256,8,0,0,asm,10005+20000,140.3853
gfx938,int8_w8a8_block,torch.float16,4,256,7168,256,8,0,0,asm,10006+20000,168.6228
gfx938,int8_w8a8_block,torch.float16,5,256,7168,256,8,0,0,asm,10007+20000,214.0556
gfx938,int8_w8a8_block,torch.float16,6,256,7168,256,8,0,0,asm,10002+20000,230.3543
gfx938,int8_w8a8_block,torch.float16,7,256,7168,256,8,0,0,asm,10002+20000,238.9969
gfx938,int8_w8a8_block,torch.float16,8,256,7168,256,8,0,0,asm,10006+20000,251.8997
gfx938,int8_w8a8_block,torch.float16,9,256,7168,256,8,0,0,asm,10006+20000,267.6234
gfx938,int8_w8a8_block,torch.float16,10,256,7168,256,8,0,0,asm,10006+20000,285.4415
gfx938,int8_w8a8_block,torch.float16,11,256,7168,256,8,0,0,asm,10002+20000,333.1649
gfx938,int8_w8a8_block,torch.float16,12,256,7168,256,8,0,0,asm,10002+20000,344.0761
gfx938,int8_w8a8_block,torch.float16,13,256,7168,256,8,0,0,asm,10001+20000,349.9011
gfx938,int8_w8a8_block,torch.float16,14,256,7168,256,8,0,0,asm,10006+20000,365.0726
gfx938,int8_w8a8_block,torch.float16,15,256,7168,256,8,0,0,asm,10006+20000,368.4375
gfx938,int8_w8a8_block,torch.float16,16,256,7168,256,8,0,0,asm,10006+20000,377.921
gfx938,int8_w8a8_block,torch.float16,17,256,7168,256,8,0,0,asm,10005+20000,382.6404
gfx938,int8_w8a8_block,torch.float16,18,256,7168,256,8,0,0,asm,10005+20000,399.2173
gfx938,int8_w8a8_block,torch.float16,20,256,7168,256,8,0,0,asm,10006+20000,449.5929
gfx938,int8_w8a8_block,torch.float16,24,256,7168,256,8,0,0,asm,10006+20000,474.6303
gfx938,int8_w8a8_block,torch.float16,28,256,7168,256,8,0,0,asm,10006+20000,569.4063
gfx938,int8_w8a8_block,torch.float16,32,256,7168,256,8,0,0,asm,10006+20000,581.0038
gfx938,int8_w8a8_block,torch.float16,34,256,7168,256,8,0,0,asm,10006+20000,573.6796
gfx938,int8_w8a8_block,torch.float16,36,256,7168,256,8,0,0,asm,10006+20000,589.4773
gfx938,int8_w8a8_block,torch.float16,40,256,7168,256,8,0,0,asm,10006+20000,648.7822
gfx938,int8_w8a8_block,torch.float16,44,256,7168,256,8,0,0,asm,10006+20000,656.8404
gfx938,int8_w8a8_block,torch.float16,48,256,7168,256,8,0,0,asm,10006+20000,668.0452
gfx938,int8_w8a8_block,torch.float16,56,256,7168,256,8,0,0,asm,10006+20000,688.69
gfx938,int8_w8a8_block,torch.float16,64,256,7168,256,8,0,0,asm,10006+20000,745.0293
gfx938,int8_w8a8_block,torch.float16,68,256,7168,256,8,0,0,asm,10005+20000,796.2971
gfx938,int8_w8a8_block,torch.float16,72,256,7168,256,8,0,0,asm,10006+20000,769.4408
gfx938,int8_w8a8_block,torch.float16,80,256,7168,256,8,0,0,asm,10006+20000,793.9629
gfx938,int8_w8a8_block,torch.float16,88,256,7168,256,8,0,0,asm,10006+20000,789.2854
gfx938,int8_w8a8_block,torch.float16,96,256,7168,256,8,0,0,asm,10006+20000,784.1078
gfx938,int8_w8a8_block,torch.float16,104,256,7168,256,8,0,0,asm,10006+20000,807.4015
gfx938,int8_w8a8_block,torch.float16,112,256,7168,256,8,0,0,asm,10006+20000,808.7332
gfx938,int8_w8a8_block,torch.float16,128,256,7168,256,8,0,0,asm,10006+20000,822.8422
gfx938,int8_w8a8_block,torch.float16,144,256,7168,256,8,0,0,asm,10006+20000,864.7766
gfx938,int8_w8a8_block,torch.float16,160,256,7168,256,8,0,0,asm,10006+20000,870.1813
gfx938,int8_w8a8_block,torch.float16,192,256,7168,256,8,0,0,asm,10006+20000,880.6561
gfx938,int8_w8a8_block,torch.float16,224,256,7168,256,8,0,0,asm,10006+20000,896.0501
gfx938,int8_w8a8_block,torch.float16,256,256,7168,256,8,0,0,asm,10006+20000,903.3266
gfx938,int8_w8a8_block,torch.float16,320,256,7168,256,8,0,0,asm,10006+20000,925.3824
gfx938,int8_w8a8_block,torch.float16,384,256,7168,256,8,0,0,asm,10006+20000,944.2336
gfx938,int8_w8a8_block,torch.float16,448,256,7168,256,8,0,0,asm,11010+21000,1002.260
gfx938,int8_w8a8_block,torch.float16,512,256,7168,256,8,0,0,asm,11010+21000,1016.7371
gfx938,int8_w8a8_block,torch.float16,576,256,7168,256,8,0,0,asm,11010+21000,1038.1561
gfx938,int8_w8a8_block,torch.float16,640,256,7168,256,8,0,0,asm,11010+21000,1053.8022
gfx938,int8_w8a8_block,torch.float16,704,256,7168,256,8,0,0,asm,11010+21000,1065.2371
gfx938,int8_w8a8_block,torch.float16,768,256,7168,256,8,0,0,asm,11010+21000,1086.4834
gfx938,int8_w8a8_block,torch.float16,832,256,7168,256,8,0,0,asm,11010+21000,1097.2841
gfx938,int8_w8a8_block,torch.float16,896,256,7168,256,8,0,0,asm,11010+21000,1173.5599
gfx938,int8_w8a8_block,torch.float16,960,256,7168,256,8,0,0,asm,11010+21000,1268.5115
gfx938,int8_w8a8_block,torch.float16,1024,256,7168,256,8,0,0,asm,11010+21000,1379.5732
gfx938,int8_w8a8_block,torch.float16,1152,256,7168,256,8,0,0,asm,12003+22000,1498.5623
gfx938,int8_w8a8_block,torch.float16,1280,256,7168,256,8,0,0,asm,12003+22000,1532.3256
gfx938,int8_w8a8_block,torch.float16,1408,256,7168,256,8,0,0,asm,12003+22000,1544.3759
gfx938,int8_w8a8_block,torch.float16,1536,256,7168,256,8,0,0,asm,12003+22000,1583.7134
gfx938,int8_w8a8_block,torch.float16,1664,256,7168,256,8,0,0,asm,12003+22000,1621.6496
gfx938,int8_w8a8_block,torch.float16,1792,256,7168,256,8,0,0,asm,12003+22000,1779.0828
gfx938,int8_w8a8_block,torch.float16,1920,256,7168,256,8,0,0,asm,12003+22000,1871.3132
gfx938,int8_w8a8_block,torch.float16,2048,256,7168,256,8,0,0,asm,12003+22000,2157.311
gfx938,int8_w8a8_block,torch.float16,2304,256,7168,256,8,0,0,asm,13001+23000,2490.01
gfx938,int8_w8a8_block,torch.float16,2560,256,7168,256,8,0,0,asm,13001+23000,2534.3288
gfx938,int8_w8a8_block,torch.float16,2816,256,7168,256,8,0,0,asm,13001+23000,2579.0659
gfx938,int8_w8a8_block,torch.float16,3072,256,7168,256,8,0,0,asm,13001+23000,2653.1717
gfx938,int8_w8a8_block,torch.float16,3328,256,7168,256,8,0,0,asm,13001+23000,2745.7236
gfx938,int8_w8a8_block,torch.float16,3584,256,7168,256,8,0,0,asm,13001+23000,2851.2956
gfx938,int8_w8a8_block,torch.float16,3840,256,7168,256,8,0,0,asm,13001+23000,3127.3154
gfx938,int8_w8a8_block,torch.float16,4096,256,7168,256,8,0,0,asm,13001+23000,3611.17
gfx938,int8_w8a8_block,torch.float16,4608,256,7168,256,8,0,0,asm,12003+22000,4208.9501
gfx938,int8_w8a8_block,torch.float16,5120,256,7168,256,8,0,0,asm,12003+22000,4453.8108
gfx938,int8_w8a8_block,torch.float16,5632,256,7168,256,8,0,0,asm,12003+22000,4666.0811
gfx938,int8_w8a8_block,torch.float16,6144,256,7168,256,8,0,0,asm,13001+23000,4965.1708
gfx938,int8_w8a8_block,torch.float16,6656,256,7168,256,8,0,0,asm,13001+23000,5061.4082
gfx938,int8_w8a8_block,torch.float16,7168,256,7168,256,8,0,0,asm,13001+23000,5175.7386
gfx938,int8_w8a8_block,torch.float16,7680,256,7168,256,8,0,0,asm,13001+23000,5490.6364
gfx938,int8_w8a8_block,torch.float16,8192,256,7168,256,8,0,0,asm,13001+23000,6144.4436
gfx938,int8_w8a8_block,torch.float16,10240,256,7168,256,8,0,0,asm,13001+23000,7471.2098
gfx938,int8_w8a8_block,torch.float16,12288,256,7168,256,8,0,0,asm,13001+23000,8680.1129
gfx938,int8_w8a8_block,torch.float16,14336,256,7168,256,8,0,0,asm,13001+23000,10012.1071
gfx938,int8_w8a8_block,torch.float16,16384,256,7168,256,8,0,0,asm,13001+23000,11238.8407
gfx938,int8_w8a8_block,torch.float16,17408,256,7168,256,8,0,0,asm,13001+23000,12274.2076
gfx938,int8_w8a8_block,torch.float16,24576,256,7168,256,8,0,0,asm,13001+23000,16393.0752
gfx938,int8_w8a8_block,torch.float16,32768,256,7168,256,8,0,0,asm,13001+23000,21424.9168
gfx938,int8_w8a8_block,torch.float16,40960,256,7168,256,8,0,0,asm,13001+23000,25835.4239
gfx938,int8_w8a8_block,torch.float16,49152,256,7168,256,8,0,0,asm,13001+23000,30968.2254
gfx938,int8_w8a8_block,torch.float16,57344,256,7168,256,8,0,0,asm,13001+23000,36235.786
gfx938,int8_w8a8_block,torch.float16,65536,256,7168,256,8,0,0,asm,13001+23000,41438.8945
gfx938,f8_w8a8_block,torch.float16,1,128,7168,256,8,0,0,asm,10008+20100,66.5653
gfx938,f8_w8a8_block,torch.float16,2,128,7168,256,8,0,0,asm,10007+20101,75.3486
gfx938,f8_w8a8_block,torch.float16,3,128,7168,256,8,0,0,asm,10002+20101,87.5783
gfx938,f8_w8a8_block,torch.float16,4,128,7168,256,8,0,0,asm,10002+20101,101.6294
gfx938,f8_w8a8_block,torch.float16,5,128,7168,256,8,0,0,asm,10006+20101,130.0846
gfx938,f8_w8a8_block,torch.float16,6,128,7168,256,8,0,0,asm,10005+20101,131.9144
gfx938,f8_w8a8_block,torch.float16,7,128,7168,256,8,0,0,asm,10006+20101,139.9513
gfx938,f8_w8a8_block,torch.float16,8,128,7168,256,8,0,0,asm,10006+20101,142.8436
gfx938,f8_w8a8_block,torch.float16,9,128,7168,256,8,0,0,asm,10006+20101,160.0702
gfx938,f8_w8a8_block,torch.float16,10,128,7168,256,8,0,0,asm,10006+20101,176.2466
gfx938,f8_w8a8_block,torch.float16,11,128,7168,256,8,0,0,asm,10007+20101,212.2792
gfx938,f8_w8a8_block,torch.float16,12,128,7168,256,8,0,0,asm,10007+20101,215.5613
gfx938,f8_w8a8_block,torch.float16,13,128,7168,256,8,0,0,asm,10007+20101,218.7449
gfx938,f8_w8a8_block,torch.float16,14,128,7168,256,8,0,0,asm,10001+20101,223.9592
gfx938,f8_w8a8_block,torch.float16,15,128,7168,256,8,0,0,asm,10002+20101,225.4525
gfx938,f8_w8a8_block,torch.float16,16,128,7168,256,8,0,0,asm,10002+20101,233.5714
gfx938,f8_w8a8_block,torch.float16,17,128,7168,256,8,0,0,asm,10002+20101,228.9449
gfx938,f8_w8a8_block,torch.float16,18,128,7168,256,8,0,0,asm,11006+21101,244.153
gfx938,f8_w8a8_block,torch.float16,20,128,7168,256,8,0,0,asm,10006+20101,259.0782
gfx938,f8_w8a8_block,torch.float16,24,128,7168,256,8,0,0,asm,10006+20101,281.4083
gfx938,f8_w8a8_block,torch.float16,28,128,7168,256,8,0,0,asm,10007+20101,353.9607
gfx938,f8_w8a8_block,torch.float16,32,128,7168,256,8,0,0,asm,10002+20101,363.335
gfx938,f8_w8a8_block,torch.float16,34,128,7168,256,8,0,0,asm,10002+20101,352.4438
gfx938,f8_w8a8_block,torch.float16,36,128,7168,256,8,0,0,asm,10002+20101,360.4028
gfx938,f8_w8a8_block,torch.float16,40,128,7168,256,8,0,0,asm,10006+20101,377.2437
gfx938,f8_w8a8_block,torch.float16,44,128,7168,256,8,0,0,asm,10006+20101,381.695
gfx938,f8_w8a8_block,torch.float16,48,128,7168,256,8,0,0,asm,10006+20101,387.1144
gfx938,f8_w8a8_block,torch.float16,56,128,7168,256,8,0,0,asm,10006+20101,403.1349
gfx938,f8_w8a8_block,torch.float16,64,128,7168,256,8,0,0,asm,10001+20101,451.6721
gfx938,f8_w8a8_block,torch.float16,68,128,7168,256,8,0,0,asm,10007+20101,469.6886
gfx938,f8_w8a8_block,torch.float16,72,128,7168,256,8,0,0,asm,10007+20101,473.0217
gfx938,f8_w8a8_block,torch.float16,80,128,7168,256,8,0,0,asm,10007+20101,476.11
gfx938,f8_w8a8_block,torch.float16,88,128,7168,256,8,0,0,asm,11006+21101,488.6581
gfx938,f8_w8a8_block,torch.float16,96,128,7168,256,8,0,0,asm,10002+20101,487.6638
gfx938,f8_w8a8_block,torch.float16,104,128,7168,256,8,0,0,asm,10006+20101,493.3294
gfx938,f8_w8a8_block,torch.float16,112,128,7168,256,8,0,0,asm,10006+20101,494.3222
gfx938,f8_w8a8_block,torch.float16,128,128,7168,256,8,0,0,asm,10006+20101,498.2566
gfx938,f8_w8a8_block,torch.float16,144,128,7168,256,8,0,0,asm,10006+20101,520.7139
gfx938,f8_w8a8_block,torch.float16,160,128,7168,256,8,0,0,asm,10006+20101,517.3169
gfx938,f8_w8a8_block,torch.float16,192,128,7168,256,8,0,0,asm,10006+20101,525.3252
gfx938,f8_w8a8_block,torch.float16,224,128,7168,256,8,0,0,asm,10006+20101,531.1508
gfx938,f8_w8a8_block,torch.float16,256,128,7168,256,8,0,0,asm,10006+20101,539.0933
gfx938,f8_w8a8_block,torch.float16,320,128,7168,256,8,0,0,asm,10006+20101,546.1825
gfx938,f8_w8a8_block,torch.float16,384,128,7168,256,8,0,0,asm,10006+20101,555.8809
gfx938,f8_w8a8_block,torch.float16,448,128,7168,256,8,0,0,asm,10006+20101,604.7094
gfx938,f8_w8a8_block,torch.float16,512,128,7168,256,8,0,0,asm,11010+21101,625.7268
gfx938,f8_w8a8_block,torch.float16,576,128,7168,256,8,0,0,asm,11010+21101,636.9596
gfx938,f8_w8a8_block,torch.float16,640,128,7168,256,8,0,0,asm,11010+21101,649.7718
gfx938,f8_w8a8_block,torch.float16,704,128,7168,256,8,0,0,asm,11010+21101,657.3738
gfx938,f8_w8a8_block,torch.float16,768,128,7168,256,8,0,0,asm,11010+21101,664.6107
gfx938,f8_w8a8_block,torch.float16,832,128,7168,256,8,0,0,asm,11010+21101,670.8138
gfx938,f8_w8a8_block,torch.float16,896,128,7168,256,8,0,0,asm,11010+21101,737.3488
gfx938,f8_w8a8_block,torch.float16,960,128,7168,256,8,0,0,asm,11010+21101,748.9636
gfx938,f8_w8a8_block,torch.float16,1024,128,7168,256,8,0,0,asm,11010+21101,825.1375
gfx938,f8_w8a8_block,torch.float16,1152,128,7168,256,8,0,0,asm,11010+21101,941.7131
gfx938,f8_w8a8_block,torch.float16,1280,128,7168,256,8,0,0,asm,11010+21101,981.3457
gfx938,f8_w8a8_block,torch.float16,1408,128,7168,256,8,0,0,asm,11010+21101,1017.7776
gfx938,f8_w8a8_block,torch.float16,1536,128,7168,256,8,0,0,asm,12003+22000,1084.6548
gfx938,f8_w8a8_block,torch.float16,1664,128,7168,256,8,0,0,asm,12003+22000,1110.2295
gfx938,f8_w8a8_block,torch.float16,1792,128,7168,256,8,0,0,asm,11010+21101,1184.1491
gfx938,f8_w8a8_block,torch.float16,1920,128,7168,256,8,0,0,asm,11010+21101,1268.0833
gfx938,f8_w8a8_block,torch.float16,2048,128,7168,256,8,0,0,asm,11010+21101,1327.7161
gfx938,f8_w8a8_block,torch.float16,2304,128,7168,256,8,0,0,asm,11010+21101,1537.3458
gfx938,f8_w8a8_block,torch.float16,2560,128,7168,256,8,0,0,asm,11010+21101,1623.1556
gfx938,f8_w8a8_block,torch.float16,2816,128,7168,256,8,0,0,asm,11010+21101,1743.6874
gfx938,f8_w8a8_block,torch.float16,3072,128,7168,256,8,0,0,asm,13001+23000,1801.0634
gfx938,f8_w8a8_block,torch.float16,3328,128,7168,256,8,0,0,asm,13001+23000,1867.9686
gfx938,f8_w8a8_block,torch.float16,3584,128,7168,256,8,0,0,asm,13001+23000,1962.0926
gfx938,f8_w8a8_block,torch.float16,3840,128,7168,256,8,0,0,asm,13001+23000,2202.7211
gfx938,f8_w8a8_block,torch.float16,4096,128,7168,256,8,0,0,asm,11010+21101,2395.3579
gfx938,f8_w8a8_block,torch.float16,4608,128,7168,256,8,0,0,asm,11010+21101,2679.7118
gfx938,f8_w8a8_block,torch.float16,5120,128,7168,256,8,0,0,asm,11010+21101,2954.1683
gfx938,f8_w8a8_block,torch.float16,5632,128,7168,256,8,0,0,asm,12003+22000,3219.4688
gfx938,f8_w8a8_block,torch.float16,6144,128,7168,256,8,0,0,asm,14001+24000,3479.9218
gfx938,f8_w8a8_block,torch.float16,6656,128,7168,256,8,0,0,asm,13001+23000,3570.5668
gfx938,f8_w8a8_block,torch.float16,7168,128,7168,256,8,0,0,asm,13001+23000,3670.2289
gfx938,f8_w8a8_block,torch.float16,7680,128,7168,256,8,0,0,asm,13001+23000,3839.9203
gfx938,f8_w8a8_block,torch.float16,8192,128,7168,256,8,0,0,asm,13001+23000,4282.3809
gfx938,f8_w8a8_block,torch.float16,10240,128,7168,256,8,0,0,asm,13001+23000,5219.3544
gfx938,f8_w8a8_block,torch.float16,12288,128,7168,256,8,0,0,asm,13001+23000,6140.1191
gfx938,f8_w8a8_block,torch.float16,14336,128,7168,256,8,0,0,asm,13001+23000,7078.5975
gfx938,f8_w8a8_block,torch.float16,16384,128,7168,256,8,0,0,asm,13001+23000,7927.4133
gfx938,f8_w8a8_block,torch.float16,17408,128,7168,256,8,0,0,asm,13001+23000,8632.191
gfx938,f8_w8a8_block,torch.float16,24576,128,7168,256,8,0,0,asm,13001+23000,11640.6421
gfx938,f8_w8a8_block,torch.float16,32768,128,7168,256,8,0,0,asm,13001+23000,15245.6187
gfx938,f8_w8a8_block,torch.float16,40960,128,7168,256,8,0,0,asm,13001+23101,15088.5354
gfx938,f8_w8a8_block,torch.float16,49152,128,7168,256,8,0,0,asm,13001+23000,21967.1596
gfx938,f8_w8a8_block,torch.float16,57344,128,7168,256,8,0,0,asm,13001+23000,25747.9781
gfx938,f8_w8a8_block,torch.float16,65536,128,7168,256,8,0,0,asm,13001+23000,29469.4784
gfx938,f8_w8a8_block,torch.float16,1,256,7168,256,8,0,0,asm,10007+20200,77.7863
gfx938,f8_w8a8_block,torch.float16,2,256,7168,256,8,0,0,asm,10002+20000,108.981
gfx938,f8_w8a8_block,torch.float16,3,256,7168,256,8,0,0,asm,10006+20000,140.2978
gfx938,f8_w8a8_block,torch.float16,4,256,7168,256,8,0,0,asm,10006+20000,166.45
gfx938,f8_w8a8_block,torch.float16,5,256,7168,256,8,0,0,asm,10007+20000,212.665
gfx938,f8_w8a8_block,torch.float16,6,256,7168,256,8,0,0,asm,10002+20000,222.8202
gfx938,f8_w8a8_block,torch.float16,7,256,7168,256,8,0,0,asm,10001+20000,239.1831
gfx938,f8_w8a8_block,torch.float16,8,256,7168,256,8,0,0,asm,10006+20000,252.5874
gfx938,f8_w8a8_block,torch.float16,9,256,7168,256,8,0,0,asm,10006+20000,265.8496
gfx938,f8_w8a8_block,torch.float16,10,256,7168,256,8,0,0,asm,10006+20000,284.6495
gfx938,f8_w8a8_block,torch.float16,11,256,7168,256,8,0,0,asm,10002+20000,331.5774
gfx938,f8_w8a8_block,torch.float16,12,256,7168,256,8,0,0,asm,10002+20000,338.8226
gfx938,f8_w8a8_block,torch.float16,13,256,7168,256,8,0,0,asm,10001+20000,348.3648
gfx938,f8_w8a8_block,torch.float16,14,256,7168,256,8,0,0,asm,10006+20000,362.2937
gfx938,f8_w8a8_block,torch.float16,15,256,7168,256,8,0,0,asm,10006+20000,370.0803
gfx938,f8_w8a8_block,torch.float16,16,256,7168,256,8,0,0,asm,10006+20000,374.9336
gfx938,f8_w8a8_block,torch.float16,17,256,7168,256,8,0,0,asm,10006+20000,380.9883
gfx938,f8_w8a8_block,torch.float16,18,256,7168,256,8,0,0,asm,10006+20000,395.6061
gfx938,f8_w8a8_block,torch.float16,20,256,7168,256,8,0,0,asm,10006+20000,451.4192
gfx938,f8_w8a8_block,torch.float16,24,256,7168,256,8,0,0,asm,10006+20000,475.0546
gfx938,f8_w8a8_block,torch.float16,28,256,7168,256,8,0,0,asm,10006+20000,567.282
gfx938,f8_w8a8_block,torch.float16,32,256,7168,256,8,0,0,asm,10006+20000,578.7283
gfx938,f8_w8a8_block,torch.float16,34,256,7168,256,8,0,0,asm,10006+20000,575.8412
gfx938,f8_w8a8_block,torch.float16,36,256,7168,256,8,0,0,asm,10006+20000,589.5386
gfx938,f8_w8a8_block,torch.float16,40,256,7168,256,8,0,0,asm,10006+20000,648.6628
gfx938,f8_w8a8_block,torch.float16,44,256,7168,256,8,0,0,asm,10006+20000,658.6983
gfx938,f8_w8a8_block,torch.float16,48,256,7168,256,8,0,0,asm,10006+20000,665.4139
gfx938,f8_w8a8_block,torch.float16,56,256,7168,256,8,0,0,asm,10006+20000,684.4388
gfx938,f8_w8a8_block,torch.float16,64,256,7168,256,8,0,0,asm,10006+20000,741.6224
gfx938,f8_w8a8_block,torch.float16,68,256,7168,256,8,0,0,asm,10006+20000,751.4839
gfx938,f8_w8a8_block,torch.float16,72,256,7168,256,8,0,0,asm,10004+20000,767.0313
gfx938,f8_w8a8_block,torch.float16,80,256,7168,256,8,0,0,asm,11010+21000,811.3511
gfx938,f8_w8a8_block,torch.float16,88,256,7168,256,8,0,0,asm,10006+20000,790.4088
gfx938,f8_w8a8_block,torch.float16,96,256,7168,256,8,0,0,asm,10006+20000,783.8489
gfx938,f8_w8a8_block,torch.float16,104,256,7168,256,8,0,0,asm,10006+20000,808.2379
gfx938,f8_w8a8_block,torch.float16,112,256,7168,256,8,0,0,asm,10006+20000,811.6932
gfx938,f8_w8a8_block,torch.float16,128,256,7168,256,8,0,0,asm,10006+20000,822.2664
gfx938,f8_w8a8_block,torch.float16,144,256,7168,256,8,0,0,asm,10006+20000,864.5257
gfx938,f8_w8a8_block,torch.float16,160,256,7168,256,8,0,0,asm,10006+20000,870.8529
gfx938,f8_w8a8_block,torch.float16,192,256,7168,256,8,0,0,asm,10006+20000,882.0707
gfx938,f8_w8a8_block,torch.float16,224,256,7168,256,8,0,0,asm,10006+20000,896.5011
gfx938,f8_w8a8_block,torch.float16,256,256,7168,256,8,0,0,asm,10006+20000,905.1327
gfx938,f8_w8a8_block,torch.float16,320,256,7168,256,8,0,0,asm,10006+20000,923.0352
gfx938,f8_w8a8_block,torch.float16,384,256,7168,256,8,0,0,asm,10006+20000,943.2565
gfx938,f8_w8a8_block,torch.float16,448,256,7168,256,8,0,0,asm,11010+21000,988.6851
gfx938,f8_w8a8_block,torch.float16,512,256,7168,256,8,0,0,asm,11010+21000,1011.6567
gfx938,f8_w8a8_block,torch.float16,576,256,7168,256,8,0,0,asm,11010+21000,1028.3101
gfx938,f8_w8a8_block,torch.float16,640,256,7168,256,8,0,0,asm,11010+21000,1040.4231
gfx938,f8_w8a8_block,torch.float16,704,256,7168,256,8,0,0,asm,11010+21000,1062.4813
gfx938,f8_w8a8_block,torch.float16,768,256,7168,256,8,0,0,asm,11010+21000,1077.4394
gfx938,f8_w8a8_block,torch.float16,832,256,7168,256,8,0,0,asm,11010+21000,1089.0687
gfx938,f8_w8a8_block,torch.float16,896,256,7168,256,8,0,0,asm,11010+21000,1155.8735
gfx938,f8_w8a8_block,torch.float16,960,256,7168,256,8,0,0,asm,11010+21000,1248.7023
gfx938,f8_w8a8_block,torch.float16,1024,256,7168,256,8,0,0,asm,11010+21000,1354.4664
gfx938,f8_w8a8_block,torch.float16,1152,256,7168,256,8,0,0,asm,12003+22000,1419.539
gfx938,f8_w8a8_block,torch.float16,1280,256,7168,256,8,0,0,asm,12003+22000,1460.1541
gfx938,f8_w8a8_block,torch.float16,1408,256,7168,256,8,0,0,asm,12003+22000,1472.3131
gfx938,f8_w8a8_block,torch.float16,1536,256,7168,256,8,0,0,asm,12003+22000,1503.9613
gfx938,f8_w8a8_block,torch.float16,1664,256,7168,256,8,0,0,asm,12003+22000,1542.3411
gfx938,f8_w8a8_block,torch.float16,1792,256,7168,256,8,0,0,asm,12003+22000,1692.1873
gfx938,f8_w8a8_block,torch.float16,1920,256,7168,256,8,0,0,asm,12003+22000,1780.018
gfx938,f8_w8a8_block,torch.float16,2048,256,7168,256,8,0,0,asm,12003+22000,2044.5118
gfx938,f8_w8a8_block,torch.float16,2304,256,7168,256,8,0,0,asm,13001+23000,2335.2539
gfx938,f8_w8a8_block,torch.float16,2560,256,7168,256,8,0,0,asm,13001+23000,2437.9238
gfx938,f8_w8a8_block,torch.float16,2816,256,7168,256,8,0,0,asm,13001+23000,2511.6265
gfx938,f8_w8a8_block,torch.float16,3072,256,7168,256,8,0,0,asm,13001+23000,2562.9169
gfx938,f8_w8a8_block,torch.float16,3328,256,7168,256,8,0,0,asm,13001+23000,2649.1537
gfx938,f8_w8a8_block,torch.float16,3584,256,7168,256,8,0,0,asm,13001+23000,2733.0184
gfx938,f8_w8a8_block,torch.float16,3840,256,7168,256,8,0,0,asm,13001+23000,2959.8084
gfx938,f8_w8a8_block,torch.float16,4096,256,7168,256,8,0,0,asm,13001+23000,3382.3163
gfx938,f8_w8a8_block,torch.float16,4608,256,7168,256,8,0,0,asm,12003+22000,3998.149
gfx938,f8_w8a8_block,torch.float16,5120,256,7168,256,8,0,0,asm,12003+22000,4229.2055
gfx938,f8_w8a8_block,torch.float16,5632,256,7168,256,8,0,0,asm,12003+22000,4436.4858
gfx938,f8_w8a8_block,torch.float16,6144,256,7168,256,8,0,0,asm,13001+23000,4671.2596
gfx938,f8_w8a8_block,torch.float16,6656,256,7168,256,8,0,0,asm,13001+23000,4781.0715
gfx938,f8_w8a8_block,torch.float16,7168,256,7168,256,8,0,0,asm,13001+23000,4890.9133
gfx938,f8_w8a8_block,torch.float16,7680,256,7168,256,8,0,0,asm,13001+23000,5179.0355
gfx938,f8_w8a8_block,torch.float16,8192,256,7168,256,8,0,0,asm,13001+23000,5775.563
gfx938,f8_w8a8_block,torch.float16,10240,256,7168,256,8,0,0,asm,13001+23000,7044.6425
gfx938,f8_w8a8_block,torch.float16,12288,256,7168,256,8,0,0,asm,13001+23000,8183.457
gfx938,f8_w8a8_block,torch.float16,14336,256,7168,256,8,0,0,asm,13001+23000,9436.2243
gfx938,f8_w8a8_block,torch.float16,16384,256,7168,256,8,0,0,asm,13001+23000,10631.6376
gfx938,f8_w8a8_block,torch.float16,17408,256,7168,256,8,0,0,asm,13001+23000,11551.5316
gfx938,f8_w8a8_block,torch.float16,24576,256,7168,256,8,0,0,asm,13001+23000,15473.3602
gfx938,f8_w8a8_block,torch.float16,32768,256,7168,256,8,0,0,asm,13001+23000,20238.4598
gfx938,f8_w8a8_block,torch.float16,40960,256,7168,256,8,0,0,asm,13001+23000,24225.5718
gfx938,f8_w8a8_block,torch.float16,49152,256,7168,256,8,0,0,asm,13001+23000,29117.2928
gfx938,f8_w8a8_block,torch.float16,57344,256,7168,256,8,0,0,asm,13001+23000,34120.5525
gfx938,f8_w8a8_block,torch.float16,65536,256,7168,256,8,0,0,asm,13001+23000,39073.9223
gfx938,f8_w8a8_block,torch.float16,1,256,7168,257,9,0,0,asm,10007+20000,76.1697
gfx938,f8_w8a8_block,torch.float16,2,256,7168,257,9,0,0,asm,10002+20000,106.8558
gfx938,f8_w8a8_block,torch.float16,4,256,7168,257,9,0,0,asm,10006+20000,162.4684
gfx938,f8_w8a8_block,torch.float16,6,256,7168,257,9,0,0,asm,10002+20000,219.2933
gfx938,f8_w8a8_block,torch.float16,8,256,7168,257,9,0,0,asm,10006+20000,263.1334
gfx938,f8_w8a8_block,torch.float16,12,256,7168,257,9,0,0,asm,10001+20000,357.1709
gfx938,f8_w8a8_block,torch.float16,16,256,7168,257,9,0,0,asm,10002+20000,446.2233
gfx938,f8_w8a8_block,torch.float16,20,256,7168,257,9,0,0,asm,10006+20200,499.2896
gfx938,f8_w8a8_block,torch.float16,24,256,7168,257,9,0,0,asm,10002+20200,569.8494
gfx938,f8_w8a8_block,torch.float16,28,256,7168,257,9,0,0,asm,10002+20200,620.7912
gfx938,f8_w8a8_block,torch.float16,32,256,7168,257,9,0,0,asm,10006+20200,634.5932
gfx938,f8_w8a8_block,torch.float16,36,256,7168,257,9,0,0,asm,10002+20200,683.0027
gfx938,f8_w8a8_block,torch.float16,40,256,7168,257,9,0,0,asm,10002+20200,697.5795
gfx938,f8_w8a8_block,torch.float16,44,256,7168,257,9,0,0,asm,10002+20200,710.9268
gfx938,f8_w8a8_block,torch.float16,48,256,7168,257,9,0,0,asm,10006+20200,739.6425
gfx938,f8_w8a8_block,torch.float16,56,256,7168,257,9,0,0,asm,10002+20200,808.7286
gfx938,f8_w8a8_block,torch.float16,64,256,7168,257,9,0,0,asm,10002+20200,819.6086
gfx938,f8_w8a8_block,torch.float16,72,256,7168,257,9,0,0,asm,10006+20000,842.918
gfx938,f8_w8a8_block,torch.float16,80,256,7168,257,9,0,0,asm,10006+20000,853.7896
gfx938,f8_w8a8_block,torch.float16,96,256,7168,257,9,0,0,asm,10006+20000,883.76
gfx938,f8_w8a8_block,torch.float16,104,256,7168,257,9,0,0,asm,10006+20000,887.9284
gfx938,f8_w8a8_block,torch.float16,112,256,7168,257,9,0,0,asm,10002+20000,904.5767
gfx938,f8_w8a8_block,torch.float16,128,256,7168,257,9,0,0,asm,10002+20000,924.9725
gfx938,f8_w8a8_block,torch.float16,144,256,7168,257,9,0,0,asm,10002+20200,932.5766
gfx938,f8_w8a8_block,torch.float16,160,256,7168,257,9,0,0,asm,10002+20200,939.3472
gfx938,f8_w8a8_block,torch.float16,192,256,7168,257,9,0,0,asm,10002+20200,951.3051
gfx938,f8_w8a8_block,torch.float16,224,256,7168,257,9,0,0,asm,10002+20200,957.4777
gfx938,f8_w8a8_block,torch.float16,256,256,7168,257,9,0,0,asm,10002+20200,967.1197
gfx938,f8_w8a8_block,torch.float16,320,256,7168,257,9,0,0,asm,10006+20200,974.9429
gfx938,f8_w8a8_block,torch.float16,384,256,7168,257,9,0,0,asm,10006+20200,1016.8207
gfx938,f8_w8a8_block,torch.float16,448,256,7168,257,9,0,0,asm,11010+21200,1045.5112
gfx938,f8_w8a8_block,torch.float16,512,256,7168,257,9,0,0,asm,11010+21000,1080.2647
gfx938,f8_w8a8_block,torch.float16,768,256,7168,257,9,0,0,asm,11010+21000,1161.0055
gfx938,f8_w8a8_block,torch.float16,896,256,7168,257,9,0,0,asm,11010+21200,1271.7673
gfx938,f8_w8a8_block,torch.float16,960,256,7168,257,9,0,0,asm,12003+22000,1399.2027
gfx938,f8_w8a8_block,torch.float16,1024,256,7168,257,9,0,0,asm,12003+22000,1453.5352
gfx938,f8_w8a8_block,torch.float16,1280,256,7168,257,9,0,0,asm,12003+22000,1460.8194
gfx938,f8_w8a8_block,torch.float16,1536,256,7168,257,9,0,0,asm,12003+22000,1538.6213
gfx938,f8_w8a8_block,torch.float16,1920,256,7168,257,9,0,0,asm,12003+22000,2139.9837
gfx938,f8_w8a8_block,torch.float16,2048,256,7168,257,9,0,0,asm,12003+22000,2323.3095
gfx938,f8_w8a8_block,torch.float16,2304,256,7168,257,9,0,0,asm,13001+23000,2408.0251
gfx938,f8_w8a8_block,torch.float16,2560,256,7168,257,9,0,0,asm,13001+23000,2462.8459
gfx938,f8_w8a8_block,torch.float16,3072,256,7168,257,9,0,0,asm,13001+23000,2576.1508
gfx938,f8_w8a8_block,torch.float16,3584,256,7168,257,9,0,0,asm,13001+23000,3054.2211
gfx938,f8_w8a8_block,torch.float16,3840,256,7168,257,9,0,0,asm,12005+22000,3551.4827
gfx938,f8_w8a8_block,torch.float16,4096,256,7168,257,9,0,0,asm,12005+22000,3749.5706
gfx938,f8_w8a8_block,torch.float16,4608,256,7168,257,9,0,0,asm,12005+22000,3981.5614
gfx938,f8_w8a8_block,torch.float16,5120,256,7168,257,9,0,0,asm,12005+22000,4231.3544
gfx938,f8_w8a8_block,torch.float16,6144,256,7168,257,9,0,0,asm,13001+23000,4610.5283
gfx938,f8_w8a8_block,torch.float16,7168,256,7168,257,9,0,0,asm,13001+23000,5281.9533
gfx938,f8_w8a8_block,torch.float16,8192,256,7168,257,9,0,0,asm,13001+23000,6427.1963
gfx938,f8_w8a8_block,torch.float16,10240,256,7168,257,9,0,0,asm,13001+23000,7069.4428
gfx938,f8_w8a8_block,torch.float16,12288,256,7168,257,9,0,0,asm,14001+24000,8706.9454
gfx938,f8_w8a8_block,torch.float16,16384,256,7168,257,9,0,0,asm,13001+23000,11135.1487
gfx938,f8_w8a8_block,torch.float16,24576,256,7168,257,9,0,0,asm,13001+23000,15944.6083
gfx938,f8_w8a8_block,torch.float16,32768,256,7168,257,9,0,0,asm,13001+23000,21105.1667
gfx938,f8_w8a8_block,torch.float16,1,256,6144,256,8,0,0,asm,10007+20000,65.1802
gfx938,f8_w8a8_block,torch.float16,2,256,6144,256,8,0,0,asm,10002+20000,89.8117
gfx938,f8_w8a8_block,torch.float16,4,256,6144,256,8,0,0,asm,10006+20000,134.7546
gfx938,f8_w8a8_block,torch.float16,6,256,6144,256,8,0,0,asm,10002+20000,188.1102
gfx938,f8_w8a8_block,torch.float16,8,256,6144,256,8,0,0,asm,10006+20000,214.1985
gfx938,f8_w8a8_block,torch.float16,12,256,6144,256,8,0,0,asm,10002+20000,292.6573
gfx938,f8_w8a8_block,torch.float16,16,256,6144,256,8,0,0,asm,10006+20000,334.1645
gfx938,f8_w8a8_block,torch.float16,20,256,6144,256,8,0,0,asm,10002+20000,400.2413
gfx938,f8_w8a8_block,torch.float16,24,256,6144,256,8,0,0,asm,10006+20000,440.0895
gfx938,f8_w8a8_block,torch.float16,28,256,6144,256,8,0,0,asm,10002+20000,515.9659
gfx938,f8_w8a8_block,torch.float16,32,256,6144,256,8,0,0,asm,10006+20200,536.2101
gfx938,f8_w8a8_block,torch.float16,36,256,6144,256,8,0,0,asm,10006+20200,551.8786
gfx938,f8_w8a8_block,torch.float16,40,256,6144,256,8,0,0,asm,10002+20200,592.7795
gfx938,f8_w8a8_block,torch.float16,44,256,6144,256,8,0,0,asm,10002+20200,603.8279
gfx938,f8_w8a8_block,torch.float16,48,256,6144,256,8,0,0,asm,10006+20200,622.2699
gfx938,f8_w8a8_block,torch.float16,56,256,6144,256,8,0,0,asm,10006+20000,643.0614
gfx938,f8_w8a8_block,torch.float16,64,256,6144,256,8,0,0,asm,10002+20200,678.5897
gfx938,f8_w8a8_block,torch.float16,72,256,6144,256,8,0,0,asm,10002+20000,698.1938
gfx938,f8_w8a8_block,torch.float16,80,256,6144,256,8,0,0,asm,10002+20000,710.8506
gfx938,f8_w8a8_block,torch.float16,96,256,6144,256,8,0,0,asm,10006+20200,736.1979
gfx938,f8_w8a8_block,torch.float16,104,256,6144,256,8,0,0,asm,10006+20200,743.8105
gfx938,f8_w8a8_block,torch.float16,112,256,6144,256,8,0,0,asm,10006+20200,752.2147
gfx938,f8_w8a8_block,torch.float16,128,256,6144,256,8,0,0,asm,10002+20000,762.1599
gfx938,f8_w8a8_block,torch.float16,144,256,6144,256,8,0,0,asm,10002+20000,781.7557
gfx938,f8_w8a8_block,torch.float16,160,256,6144,256,8,0,0,asm,10002+20200,796.2398
gfx938,f8_w8a8_block,torch.float16,192,256,6144,256,8,0,0,asm,10002+20200,803.1787
gfx938,f8_w8a8_block,torch.float16,224,256,6144,256,8,0,0,asm,10002+20200,809.4272
gfx938,f8_w8a8_block,torch.float16,256,256,6144,256,8,0,0,asm,10002+20200,814.3955
gfx938,f8_w8a8_block,torch.float16,320,256,6144,256,8,0,0,asm,10002+20200,832.5007
gfx938,f8_w8a8_block,torch.float16,384,256,6144,256,8,0,0,asm,10006+20200,842.3365
gfx938,f8_w8a8_block,torch.float16,448,256,6144,256,8,0,0,asm,10006+20000,883.2795
gfx938,f8_w8a8_block,torch.float16,512,256,6144,256,8,0,0,asm,11009+21000,918.4626
gfx938,f8_w8a8_block,torch.float16,768,256,6144,256,8,0,0,asm,11010+21200,988.1044
gfx938,f8_w8a8_block,torch.float16,896,256,6144,256,8,0,0,asm,11010+21200,1011.2959
gfx938,f8_w8a8_block,torch.float16,960,256,6144,256,8,0,0,asm,11010+21200,1078.3104
gfx938,f8_w8a8_block,torch.float16,1024,256,6144,256,8,0,0,asm,11010+21000,1170.7396
gfx938,f8_w8a8_block,torch.float16,1280,256,6144,256,8,0,0,asm,12003+22000,1247.3204
gfx938,f8_w8a8_block,torch.float16,1536,256,6144,256,8,0,0,asm,12003+22000,1302.6044
gfx938,f8_w8a8_block,torch.float16,1920,256,6144,256,8,0,0,asm,12003+22000,1482.9997
gfx938,f8_w8a8_block,torch.float16,2048,256,6144,256,8,0,0,asm,12003+22000,1709.5082
gfx938,f8_w8a8_block,torch.float16,2304,256,6144,256,8,0,0,asm,12003+22000,2042.7786
gfx938,f8_w8a8_block,torch.float16,2560,256,6144,256,8,0,0,asm,13001+23000,2084.2437
gfx938,f8_w8a8_block,torch.float16,3072,256,6144,256,8,0,0,asm,13001+23000,2171.3676
gfx938,f8_w8a8_block,torch.float16,3584,256,6144,256,8,0,0,asm,13001+23000,2271.7631
gfx938,f8_w8a8_block,torch.float16,3840,256,6144,256,8,0,0,asm,13001+23000,2448.1835
gfx938,f8_w8a8_block,torch.float16,4096,256,6144,256,8,0,0,asm,13001+23000,2797.9086
gfx938,f8_w8a8_block,torch.float16,4608,256,6144,256,8,0,0,asm,12005+22000,3283.8269
gfx938,f8_w8a8_block,torch.float16,5120,256,6144,256,8,0,0,asm,12005+22000,3498.3187
gfx938,f8_w8a8_block,torch.float16,6144,256,6144,256,8,0,0,asm,13001+23000,3881.1637
gfx938,f8_w8a8_block,torch.float16,7168,256,6144,256,8,0,0,asm,13001+23000,4041.6432
gfx938,f8_w8a8_block,torch.float16,8192,256,6144,256,8,0,0,asm,13001+23000,4767.1059
gfx938,f8_w8a8_block,torch.float16,10240,256,6144,256,8,0,0,asm,13001+23000,5883.4809
gfx938,f8_w8a8_block,torch.float16,12288,256,6144,256,8,0,0,asm,13001+23000,6685.2213
gfx938,f8_w8a8_block,torch.float16,16384,256,6144,256,8,0,0,asm,13001+23000,8614.1997
gfx938,f8_w8a8_block,torch.float16,24576,256,6144,256,8,0,0,asm,13001+23000,12547.1628
gfx938,f8_w8a8_block,torch.float16,32768,256,6144,256,8,0,0,asm,13001+23000,16452.4205
gfx938,f8_w8a8_block,torch.float16,1,256,6144,257,9,0,0,asm,10007+20000,71.3526
gfx938,f8_w8a8_block,torch.float16,2,256,6144,257,9,0,0,asm,10002+20000,96.1274
gfx938,f8_w8a8_block,torch.float16,4,256,6144,257,9,0,0,asm,10006+20000,142.9145
gfx938,f8_w8a8_block,torch.float16,6,256,6144,257,9,0,0,asm,10002+20000,195.2598
gfx938,f8_w8a8_block,torch.float16,8,256,6144,257,9,0,0,asm,10006+20000,227.8996
gfx938,f8_w8a8_block,torch.float16,12,256,6144,257,9,0,0,asm,10002+20000,310.8635
gfx938,f8_w8a8_block,torch.float16,16,256,6144,257,9,0,0,asm,10002+20000,395.5621
gfx938,f8_w8a8_block,torch.float16,20,256,6144,257,9,0,0,asm,10006+20000,433.4706
gfx938,f8_w8a8_block,torch.float16,24,256,6144,257,9,0,0,asm,10002+20200,498.9272
gfx938,f8_w8a8_block,torch.float16,28,256,6144,257,9,0,0,asm,10005+20200,540.3953
gfx938,f8_w8a8_block,torch.float16,32,256,6144,257,9,0,0,asm,10006+20200,549.3553
gfx938,f8_w8a8_block,torch.float16,36,256,6144,257,9,0,0,asm,10002+20200,591.5079
gfx938,f8_w8a8_block,torch.float16,40,256,6144,257,9,0,0,asm,10002+20200,603.2889
gfx938,f8_w8a8_block,torch.float16,44,256,6144,257,9,0,0,asm,10002+20200,615.2552
gfx938,f8_w8a8_block,torch.float16,48,256,6144,257,9,0,0,asm,10006+20000,638.8088
gfx938,f8_w8a8_block,torch.float16,56,256,6144,257,9,0,0,asm,10002+20200,698.1096
gfx938,f8_w8a8_block,torch.float16,64,256,6144,257,9,0,0,asm,10002+20200,706.2865
gfx938,f8_w8a8_block,torch.float16,72,256,6144,257,9,0,0,asm,10006+20000,730.6401
gfx938,f8_w8a8_block,torch.float16,80,256,6144,257,9,0,0,asm,10006+20000,741.5369
gfx938,f8_w8a8_block,torch.float16,96,256,6144,257,9,0,0,asm,10002+20000,762.0168
gfx938,f8_w8a8_block,torch.float16,104,256,6144,257,9,0,0,asm,10002+20000,775.5578
gfx938,f8_w8a8_block,torch.float16,112,256,6144,257,9,0,0,asm,10002+20000,779.8609
gfx938,f8_w8a8_block,torch.float16,128,256,6144,257,9,0,0,asm,10002+20200,790.1009
gfx938,f8_w8a8_block,torch.float16,144,256,6144,257,9,0,0,asm,10002+20200,798.8672
gfx938,f8_w8a8_block,torch.float16,160,256,6144,257,9,0,0,asm,10002+20000,806.9093
gfx938,f8_w8a8_block,torch.float16,192,256,6144,257,9,0,0,asm,10001+20200,813.0229
gfx938,f8_w8a8_block,torch.float16,224,256,6144,257,9,0,0,asm,10002+20200,822.6313
gfx938,f8_w8a8_block,torch.float16,256,256,6144,257,9,0,0,asm,10001+20200,833.3765
gfx938,f8_w8a8_block,torch.float16,320,256,6144,257,9,0,0,asm,10006+20200,849.2081
gfx938,f8_w8a8_block,torch.float16,384,256,6144,257,9,0,0,asm,10006+20000,880.9048
gfx938,f8_w8a8_block,torch.float16,448,256,6144,257,9,0,0,asm,11010+21200,913.6289
gfx938,f8_w8a8_block,torch.float16,512,256,6144,257,9,0,0,asm,11010+21200,981.9486
gfx938,f8_w8a8_block,torch.float16,768,256,6144,257,9,0,0,asm,11010+21000,979.4476
gfx938,f8_w8a8_block,torch.float16,896,256,6144,257,9,0,0,asm,11010+21200,1150.9585
gfx938,f8_w8a8_block,torch.float16,960,256,6144,257,9,0,0,asm,12003+22000,1219.0678
gfx938,f8_w8a8_block,torch.float16,1024,256,6144,257,9,0,0,asm,12003+22000,1272.1708
gfx938,f8_w8a8_block,torch.float16,1280,256,6144,257,9,0,0,asm,12003+22000,1270.6803
gfx938,f8_w8a8_block,torch.float16,1536,256,6144,257,9,0,0,asm,12003+22000,1338.1916
gfx938,f8_w8a8_block,torch.float16,1920,256,6144,257,9,0,0,asm,12003+22000,1876.4045
gfx938,f8_w8a8_block,torch.float16,2048,256,6144,257,9,0,0,asm,12003+22000,2017.7345
gfx938,f8_w8a8_block,torch.float16,2304,256,6144,257,9,0,0,asm,13001+23000,2088.9174
gfx938,f8_w8a8_block,torch.float16,2560,256,6144,257,9,0,0,asm,13001+23000,2126.6857
gfx938,f8_w8a8_block,torch.float16,3072,256,6144,257,9,0,0,asm,13001+23000,2241.6832
gfx938,f8_w8a8_block,torch.float16,3584,256,6144,257,9,0,0,asm,13001+23000,2649.9259
gfx938,f8_w8a8_block,torch.float16,3840,256,6144,257,9,0,0,asm,12005+22000,3052.4003
gfx938,f8_w8a8_block,torch.float16,4096,256,6144,257,9,0,0,asm,12005+22000,3290.1763
gfx938,f8_w8a8_block,torch.float16,4608,256,6144,257,9,0,0,asm,12005+22000,3497.8302
gfx938,f8_w8a8_block,torch.float16,5120,256,6144,257,9,0,0,asm,12005+22000,3640.676
gfx938,f8_w8a8_block,torch.float16,6144,256,6144,257,9,0,0,asm,13001+23000,3990.1233
gfx938,f8_w8a8_block,torch.float16,7168,256,6144,257,9,0,0,asm,13001+23000,4562.9129
gfx938,f8_w8a8_block,torch.float16,8192,256,6144,257,9,0,0,asm,13001+23000,5648.3743
gfx938,f8_w8a8_block,torch.float16,10240,256,6144,257,9,0,0,asm,13001+23000,6141.1557
gfx938,f8_w8a8_block,torch.float16,12288,256,6144,257,9,0,0,asm,14001+24000,7544.4518
gfx938,f8_w8a8_block,torch.float16,16384,256,6144,257,9,0,0,asm,13001+23000,9580.1329
gfx938,f8_w8a8_block,torch.float16,24576,256,6144,257,9,0,0,asm,13001+23000,13717.7858
gfx938,f8_w8a8_block,torch.float16,32768,256,6144,257,9,0,0,asm,13001+23000,18186.7557
gfx938,f8_w8a8_block,torch.float16,1,384,3072,256,8,0,0,asm,10002+20000,68.0432
gfx938,f8_w8a8_block,torch.float16,2,384,3072,256,8,0,0,asm,10005+20000,81.6263
gfx938,f8_w8a8_block,torch.float16,4,384,3072,256,8,0,0,asm,10001+20000,126.6955
gfx938,f8_w8a8_block,torch.float16,6,384,3072,256,8,0,0,asm,10006+20000,149.3566
gfx938,f8_w8a8_block,torch.float16,8,384,3072,256,8,0,0,asm,10006+20000,187.3859
gfx938,f8_w8a8_block,torch.float16,12,384,3072,256,8,0,0,asm,10006+20000,246.4426
gfx938,f8_w8a8_block,torch.float16,16,384,3072,256,8,0,0,asm,10006+20000,297.0613
gfx938,f8_w8a8_block,torch.float16,20,384,3072,256,8,0,0,asm,10006+20000,322.1529
gfx938,f8_w8a8_block,torch.float16,24,384,3072,256,8,0,0,asm,10006+20000,369.5548
gfx938,f8_w8a8_block,torch.float16,28,384,3072,256,8,0,0,asm,10006+20000,425.1955
gfx938,f8_w8a8_block,torch.float16,32,384,3072,256,8,0,0,asm,10006+20000,440.5555
gfx938,f8_w8a8_block,torch.float16,36,384,3072,256,8,0,0,asm,10006+20000,467.4997
gfx938,f8_w8a8_block,torch.float16,40,384,3072,256,8,0,0,asm,10006+20000,475.6513
gfx938,f8_w8a8_block,torch.float16,44,384,3072,256,8,0,0,asm,10006+20000,507.3901
gfx938,f8_w8a8_block,torch.float16,48,384,3072,256,8,0,0,asm,10006+20000,517.7227
gfx938,f8_w8a8_block,torch.float16,56,384,3072,256,8,0,0,asm,10006+20000,531.4405
gfx938,f8_w8a8_block,torch.float16,64,384,3072,256,8,0,0,asm,10006+20000,562.2109
gfx938,f8_w8a8_block,torch.float16,72,384,3072,256,8,0,0,asm,10006+20000,571.7014
gfx938,f8_w8a8_block,torch.float16,80,384,3072,256,8,0,0,asm,10006+20000,585.0571
gfx938,f8_w8a8_block,torch.float16,96,384,3072,256,8,0,0,asm,10006+20000,617.6802
gfx938,f8_w8a8_block,torch.float16,104,384,3072,256,8,0,0,asm,10006+20000,630.278
gfx938,f8_w8a8_block,torch.float16,112,384,3072,256,8,0,0,asm,10006+20000,629.1917
gfx938,f8_w8a8_block,torch.float16,128,384,3072,256,8,0,0,asm,10006+20000,632.2991
gfx938,f8_w8a8_block,torch.float16,144,384,3072,256,8,0,0,asm,10006+20000,635.5074
gfx938,f8_w8a8_block,torch.float16,160,384,3072,256,8,0,0,asm,10006+20000,640.2232
gfx938,f8_w8a8_block,torch.float16,192,384,3072,256,8,0,0,asm,10006+20000,645.8653
gfx938,f8_w8a8_block,torch.float16,224,384,3072,256,8,0,0,asm,10006+20000,646.1769
gfx938,f8_w8a8_block,torch.float16,256,384,3072,256,8,0,0,asm,10006+20000,650.0422
gfx938,f8_w8a8_block,torch.float16,320,384,3072,256,8,0,0,asm,10006+20000,661.3263
gfx938,f8_w8a8_block,torch.float16,384,384,3072,256,8,0,0,asm,10006+20000,677.3178
gfx938,f8_w8a8_block,torch.float16,448,384,3072,256,8,0,0,asm,11010+21000,687.4904
gfx938,f8_w8a8_block,torch.float16,512,384,3072,256,8,0,0,asm,11010+21000,700.4841
gfx938,f8_w8a8_block,torch.float16,768,384,3072,256,8,0,0,asm,11010+21000,779.8101
gfx938,f8_w8a8_block,torch.float16,896,384,3072,256,8,0,0,asm,11010+21000,778.1343
gfx938,f8_w8a8_block,torch.float16,960,384,3072,256,8,0,0,asm,11010+21000,830.3867
gfx938,f8_w8a8_block,torch.float16,1024,384,3072,256,8,0,0,asm,12003+22000,844.1972
gfx938,f8_w8a8_block,torch.float16,1280,384,3072,256,8,0,0,asm,12003+22000,868.9634
gfx938,f8_w8a8_block,torch.float16,1536,384,3072,256,8,0,0,asm,12003+22000,966.8914
gfx938,f8_w8a8_block,torch.float16,1920,384,3072,256,8,0,0,asm,12003+22000,1074.9331
gfx938,f8_w8a8_block,torch.float16,2048,384,3072,256,8,0,0,asm,12003+22000,1186.2758
gfx938,f8_w8a8_block,torch.float16,2304,384,3072,256,8,0,0,asm,13001+22000,1380.894
gfx938,f8_w8a8_block,torch.float16,2560,384,3072,256,8,0,0,asm,13001+22000,1404.4476
gfx938,f8_w8a8_block,torch.float16,3072,384,3072,256,8,0,0,asm,13001+22000,1453.7779
gfx938,f8_w8a8_block,torch.float16,3584,384,3072,256,8,0,0,asm,13001+22000,1557.5754
gfx938,f8_w8a8_block,torch.float16,3840,384,3072,256,8,0,0,asm,13001+23000,1709.8021
gfx938,f8_w8a8_block,torch.float16,4096,384,3072,256,8,0,0,asm,12005+22000,1977.001
gfx938,f8_w8a8_block,torch.float16,4608,384,3072,256,8,0,0,asm,12005+22000,2227.3243
gfx938,f8_w8a8_block,torch.float16,5120,384,3072,256,8,0,0,asm,12005+22000,2342.4227
gfx938,f8_w8a8_block,torch.float16,6144,384,3072,256,8,0,0,asm,13001+23000,2614.8596
gfx938,f8_w8a8_block,torch.float16,7168,384,3072,256,8,0,0,asm,13001+23000,2704.6866
gfx938,f8_w8a8_block,torch.float16,8192,384,3072,256,8,0,0,asm,13001+23000,3214.4025
gfx938,f8_w8a8_block,torch.float16,10240,384,3072,256,8,0,0,asm,13001+23000,3899.8566
gfx938,f8_w8a8_block,torch.float16,12288,384,3072,256,8,0,0,asm,13001+23000,4531.551
gfx938,f8_w8a8_block,torch.float16,16384,384,3072,256,8,0,0,asm,13001+23000,5840.8341
gfx938,f8_w8a8_block,torch.float16,24576,384,3072,256,8,0,0,asm,13001+23000,8385.0091
gfx938,f8_w8a8_block,torch.float16,32768,384,3072,256,8,0,0,asm,13001+23000,11024.1562
gfx938,f8_w8a8_block,torch.float16,1,1536,3072,64,8,0,0,asm,10006+20000,124.9272
gfx938,f8_w8a8_block,torch.float16,2,1536,3072,64,8,0,0,asm,10002+20000,184.5058
gfx938,f8_w8a8_block,torch.float16,4,1536,3072,64,8,0,0,asm,10006+20000,315.4275
gfx938,f8_w8a8_block,torch.float16,6,1536,3072,64,8,0,0,asm,10006+20000,423.3682
gfx938,f8_w8a8_block,torch.float16,8,1536,3072,64,8,0,0,asm,10006+20000,440.0586
gfx938,f8_w8a8_block,torch.float16,12,1536,3072,64,8,0,0,asm,10006+20000,540.1087
gfx938,f8_w8a8_block,torch.float16,16,1536,3072,64,8,0,0,asm,10006+20000,596.9254
gfx938,f8_w8a8_block,torch.float16,20,1536,3072,64,8,0,0,asm,10006+20000,613.5538
gfx938,f8_w8a8_block,torch.float16,24,1536,3072,64,8,0,0,asm,10006+20000,628.8296
gfx938,f8_w8a8_block,torch.float16,28,1536,3072,64,8,0,0,asm,10006+20000,670.7272
gfx938,f8_w8a8_block,torch.float16,32,1536,3072,64,8,0,0,asm,10006+20000,663.1146
gfx938,f8_w8a8_block,torch.float16,36,1536,3072,64,8,0,0,asm,10006+20000,676.0126
gfx938,f8_w8a8_block,torch.float16,40,1536,3072,64,8,0,0,asm,10006+20000,675.2884
gfx938,f8_w8a8_block,torch.float16,44,1536,3072,64,8,0,0,asm,10006+20000,681.5031
gfx938,f8_w8a8_block,torch.float16,48,1536,3072,64,8,0,0,asm,12003+22001,688.4757
gfx938,f8_w8a8_block,torch.float16,56,1536,3072,64,8,0,0,asm,10006+20000,691.5746
gfx938,f8_w8a8_block,torch.float16,64,1536,3072,64,8,0,0,asm,10006+20000,692.2429
gfx938,f8_w8a8_block,torch.float16,72,1536,3072,64,8,0,0,asm,12003+22001,688.442
gfx938,f8_w8a8_block,torch.float16,80,1536,3072,64,8,0,0,asm,10006+20000,690.0083
gfx938,f8_w8a8_block,torch.float16,96,1536,3072,64,8,0,0,asm,12003+22002,711.1282
gfx938,f8_w8a8_block,torch.float16,104,1536,3072,64,8,0,0,asm,12003+22001,696.5683
gfx938,f8_w8a8_block,torch.float16,112,1536,3072,64,8,0,0,asm,12003+22001,698.0841
gfx938,f8_w8a8_block,torch.float16,128,1536,3072,64,8,0,0,asm,12003+22001,720.4196
gfx938,f8_w8a8_block,torch.float16,144,1536,3072,64,8,0,0,asm,12003+22001,702.7156
gfx938,f8_w8a8_block,torch.float16,160,1536,3072,64,8,0,0,asm,12003+22001,711.6082
gfx938,f8_w8a8_block,torch.float16,192,1536,3072,64,8,0,0,asm,12003+22001,761.4944
gfx938,f8_w8a8_block,torch.float16,224,1536,3072,64,8,0,0,asm,12003+22001,720.0124
gfx938,f8_w8a8_block,torch.float16,256,1536,3072,64,8,0,0,asm,12003+22001,723.625
gfx938,f8_w8a8_block,torch.float16,320,1536,3072,64,8,0,0,asm,12003+22001,742.8671
gfx938,f8_w8a8_block,torch.float16,384,1536,3072,64,8,0,0,asm,12003+22001,813.1488
gfx938,f8_w8a8_block,torch.float16,448,1536,3072,64,8,0,0,asm,12003+22001,811.6667
gfx938,f8_w8a8_block,torch.float16,512,1536,3072,64,8,0,0,asm,12003+22000,1008.7775
gfx938,f8_w8a8_block,torch.float16,768,1536,3072,64,8,0,0,asm,13001+22000,1064.011
gfx938,f8_w8a8_block,torch.float16,896,1536,3072,64,8,0,0,asm,13001+22000,1084.3057
gfx938,f8_w8a8_block,torch.float16,960,1536,3072,64,8,0,0,asm,13001+22000,1237.1219
gfx938,f8_w8a8_block,torch.float16,1024,1536,3072,64,8,0,0,asm,13001+22000,1476.5315
gfx938,f8_w8a8_block,torch.float16,1280,1536,3072,64,8,0,0,asm,12005+22000,1796.6397
gfx938,f8_w8a8_block,torch.float16,1536,1536,3072,64,8,0,0,asm,13001+22000,2017.7420
gfx938,f8_w8a8_block,torch.float16,1920,1536,3072,64,8,0,0,asm,13001+22000,2136.5373
gfx938,f8_w8a8_block,torch.float16,2048,1536,3072,64,8,0,0,asm,13001+22000,2407.4415
gfx938,f8_w8a8_block,torch.float16,2304,1536,3072,64,8,0,0,asm,13001+23000,2837.9661
gfx938,f8_w8a8_block,torch.float16,2560,1536,3072,64,8,0,0,asm,13001+23000,2906.9257
gfx938,f8_w8a8_block,torch.float16,3072,1536,3072,64,8,0,0,asm,13001+22000,3408.5995
gfx938,f8_w8a8_block,torch.float16,3584,1536,3072,64,8,0,0,asm,13001+23000,3882.9218
gfx938,f8_w8a8_block,torch.float16,3840,1536,3072,64,8,0,0,asm,13001+23000,3938.888
gfx938,f8_w8a8_block,torch.float16,4096,1536,3072,64,8,0,0,asm,13001+23000,4351.1558
gfx938,f8_w8a8_block,torch.float16,4608,1536,3072,64,8,0,0,asm,13001+23000,4852.0379
gfx938,f8_w8a8_block,torch.float16,5120,1536,3072,64,8,0,0,asm,13001+23000,5303.8594
gfx938,f8_w8a8_block,torch.float16,6144,1536,3072,64,8,0,0,asm,13001+23000,6242.0787
gfx938,f8_w8a8_block,torch.float16,7168,1536,3072,64,8,0,0,asm,13001+23000,7198.6896
gfx938,f8_w8a8_block,torch.float16,8192,1536,3072,64,8,0,0,asm,13001+23000,8159.23309
gfx938,f8_w8a8_block,torch.float16,10240,1536,3072,64,8,0,0,asm,13001+23000,10081.0697
gfx938,f8_w8a8_block,torch.float16,12288,1536,3072,64,8,0,0,asm,13001+23000,11951.0998
gfx938,f8_w8a8_block,torch.float16,16384,1536,3072,64,8,0,0,asm,13001+23000,15692.1712
gfx938,f8_w8a8_block,torch.float16,24576,1536,3072,64,8,0,0,asm,13001+23000,23308.5444
gfx938,f8_w8a8_block,torch.float16,32768,1536,3072,64,8,0,0,asm,13001+23000,30796.3452
arch,quant_type,indtype,token,inter_dim,model_dim,expert,topk,q_size_n,q_size_k,sol_type,sol_id,time_us
gfx936,int8_w8a8_block,torch.float16,1,128,7168,256,8,0,0,asm,10008+20000,62.7606
gfx936,int8_w8a8_block,torch.float16,2,128,7168,256,8,0,0,asm,10007+20101,77.572
gfx936,int8_w8a8_block,torch.float16,3,128,7168,256,8,0,0,asm,10001+20101,94.0854
gfx936,int8_w8a8_block,torch.float16,4,128,7168,256,8,0,0,asm,10003+20101,111.1195
gfx936,int8_w8a8_block,torch.float16,5,128,7168,256,8,0,0,asm,10007+20101,132.7017
gfx936,int8_w8a8_block,torch.float16,6,128,7168,256,8,0,0,asm,10007+20101,155.4288
gfx936,int8_w8a8_block,torch.float16,7,128,7168,256,8,0,0,asm,10007+20101,169.909
gfx936,int8_w8a8_block,torch.float16,8,128,7168,256,8,0,0,asm,10007+20101,176.9162
gfx936,int8_w8a8_block,torch.float16,9,128,7168,256,8,0,0,asm,10007+20101,192.9285
gfx936,int8_w8a8_block,torch.float16,10,128,7168,256,8,0,0,asm,10007+20101,204.7479
gfx936,int8_w8a8_block,torch.float16,11,128,7168,256,8,0,0,asm,10007+20101,217.0006
gfx936,int8_w8a8_block,torch.float16,12,128,7168,256,8,0,0,asm,10007+20101,228.7678
gfx936,int8_w8a8_block,torch.float16,13,128,7168,256,8,0,0,asm,10007+20101,248.1068
gfx936,int8_w8a8_block,torch.float16,14,128,7168,256,8,0,0,asm,10007+20101,257.9829
gfx936,int8_w8a8_block,torch.float16,15,128,7168,256,8,0,0,asm,10007+20101,266.59
gfx936,int8_w8a8_block,torch.float16,16,128,7168,256,8,0,0,asm,10007+20101,273.1376
gfx936,int8_w8a8_block,torch.float16,17,128,7168,256,8,0,0,asm,10007+20101,278.4476
gfx936,int8_w8a8_block,torch.float16,18,128,7168,256,8,0,0,asm,10007+20101,287.6112
gfx936,int8_w8a8_block,torch.float16,20,128,7168,256,8,0,0,asm,10007+20101,309.1361
gfx936,int8_w8a8_block,torch.float16,24,128,7168,256,8,0,0,asm,10007+20101,353.1594
gfx936,int8_w8a8_block,torch.float16,28,128,7168,256,8,0,0,asm,10007+20101,402.2906
gfx936,int8_w8a8_block,torch.float16,32,128,7168,256,8,0,0,asm,10007+20000,432.625
gfx936,int8_w8a8_block,torch.float16,34,128,7168,256,8,0,0,asm,10007+20000,429.6559
gfx936,int8_w8a8_block,torch.float16,36,128,7168,256,8,0,0,asm,10007+20101,443.3995
gfx936,int8_w8a8_block,torch.float16,40,128,7168,256,8,0,0,asm,10007+20101,461.6817
gfx936,int8_w8a8_block,torch.float16,44,128,7168,256,8,0,0,asm,10007+20100,482.5334
gfx936,int8_w8a8_block,torch.float16,48,128,7168,256,8,0,0,asm,10007+20100,494.1135
gfx936,int8_w8a8_block,torch.float16,56,128,7168,256,8,0,0,asm,10007+20100,522.4518
gfx936,int8_w8a8_block,torch.float16,64,128,7168,256,8,0,0,asm,10007+20100,541.7977
gfx936,int8_w8a8_block,torch.float16,68,128,7168,256,8,0,0,asm,10007+20100,544.4355
gfx936,int8_w8a8_block,torch.float16,72,128,7168,256,8,0,0,asm,10007+20100,559.8259
gfx936,int8_w8a8_block,torch.float16,80,128,7168,256,8,0,0,asm,10007+20100,579.9696
gfx936,int8_w8a8_block,torch.float16,88,128,7168,256,8,0,0,asm,10007+20100,595.2271
gfx936,int8_w8a8_block,torch.float16,96,128,7168,256,8,0,0,asm,10007+20100,604.7679
gfx936,int8_w8a8_block,torch.float16,104,128,7168,256,8,0,0,asm,10007+20100,611.5854
gfx936,int8_w8a8_block,torch.float16,112,128,7168,256,8,0,0,asm,10007+20100,619.1943
gfx936,int8_w8a8_block,torch.float16,128,128,7168,256,8,0,0,asm,10007+20100,632.2913
gfx936,int8_w8a8_block,torch.float16,144,128,7168,256,8,0,0,asm,10007+20100,646.3492
gfx936,int8_w8a8_block,torch.float16,160,128,7168,256,8,0,0,asm,10007+20100,653.7156
gfx936,int8_w8a8_block,torch.float16,192,128,7168,256,8,0,0,asm,10007+20100,665.4176
gfx936,int8_w8a8_block,torch.float16,224,128,7168,256,8,0,0,asm,10007+20100,686.6979
gfx936,int8_w8a8_block,torch.float16,256,128,7168,256,8,0,0,asm,10007+20100,691.297
gfx936,int8_w8a8_block,torch.float16,320,128,7168,256,8,0,0,asm,10007+20100,714.5745
gfx936,int8_w8a8_block,torch.float16,384,128,7168,256,8,0,0,asm,10007+20000,744.3677
gfx936,int8_w8a8_block,torch.float16,448,128,7168,256,8,0,0,asm,10007+20101,758.6653
gfx936,int8_w8a8_block,torch.float16,512,128,7168,256,8,0,0,asm,10007+20101,786.8785
gfx936,int8_w8a8_block,torch.float16,576,128,7168,256,8,0,0,asm,10002+20101,828.8703
gfx936,int8_w8a8_block,torch.float16,640,128,7168,256,8,0,0,asm,10006+20101,843.8174
gfx936,int8_w8a8_block,torch.float16,704,128,7168,256,8,0,0,asm,11007+21000,867.3545
gfx936,int8_w8a8_block,torch.float16,768,128,7168,256,8,0,0,asm,11007+21000,893.5371
gfx936,int8_w8a8_block,torch.float16,832,128,7168,256,8,0,0,asm,10004+20101,924.2304
gfx936,int8_w8a8_block,torch.float16,896,128,7168,256,8,0,0,asm,10004+20101,949.6127
gfx936,int8_w8a8_block,torch.float16,960,128,7168,256,8,0,0,asm,11007+21101,962.014
gfx936,int8_w8a8_block,torch.float16,1024,128,7168,256,8,0,0,asm,11007+21101,982.5596
gfx936,int8_w8a8_block,torch.float16,1152,128,7168,256,8,0,0,asm,11007+21101,1066.0459
gfx936,int8_w8a8_block,torch.float16,1280,128,7168,256,8,0,0,asm,11007+21101,1116.8621
gfx936,int8_w8a8_block,torch.float16,1408,128,7168,256,8,0,0,asm,12000+22000,1178.6121
gfx936,int8_w8a8_block,torch.float16,1536,128,7168,256,8,0,0,asm,12001+22000,1193.2156
gfx936,int8_w8a8_block,torch.float16,1664,128,7168,256,8,0,0,asm,11010+21000,1250.1117
gfx936,int8_w8a8_block,torch.float16,1792,128,7168,256,8,0,0,asm,11010+21000,1293.8122
gfx936,int8_w8a8_block,torch.float16,1920,128,7168,256,8,0,0,asm,11010+21000,1369.8287
gfx936,int8_w8a8_block,torch.float16,2048,128,7168,256,8,0,0,asm,11010+21100,1422.1323
gfx936,int8_w8a8_block,torch.float16,2304,128,7168,256,8,0,0,asm,11010+21000,1572.7088
gfx936,int8_w8a8_block,torch.float16,2560,128,7168,256,8,0,0,asm,11009+21100,1688.1345
gfx936,int8_w8a8_block,torch.float16,2816,128,7168,256,8,0,0,asm,11010+21100,1802.7783
gfx936,int8_w8a8_block,torch.float16,3072,128,7168,256,8,0,0,asm,12003+22000,1897.6074
gfx936,int8_w8a8_block,torch.float16,3328,128,7168,256,8,0,0,asm,12003+22000,1979.2772
gfx936,int8_w8a8_block,torch.float16,3584,128,7168,256,8,0,0,asm,12003+22000,2043.1447
gfx936,int8_w8a8_block,torch.float16,3840,128,7168,256,8,0,0,asm,12003+22000,2184.6107
gfx936,int8_w8a8_block,torch.float16,4096,128,7168,256,8,0,0,asm,12003+22000,2334.7564
gfx936,int8_w8a8_block,torch.float16,4608,128,7168,256,8,0,0,asm,12003+22000,2659.1505
gfx936,int8_w8a8_block,torch.float16,5120,128,7168,256,8,0,0,asm,12003+22000,2817.7639
gfx936,int8_w8a8_block,torch.float16,5632,128,7168,256,8,0,0,asm,12003+22000,2967.6633
gfx936,int8_w8a8_block,torch.float16,6144,128,7168,256,8,0,0,asm,12003+22000,3291.914
gfx936,int8_w8a8_block,torch.float16,6656,128,7168,256,8,0,0,asm,13001+23000,3421.6085
gfx936,int8_w8a8_block,torch.float16,7168,128,7168,256,8,0,0,asm,13001+23000,3532.8742
gfx936,int8_w8a8_block,torch.float16,7680,128,7168,256,8,0,0,asm,13001+23000,3724.739
gfx936,int8_w8a8_block,torch.float16,8192,128,7168,256,8,0,0,asm,13001+23000,4133.3506
gfx936,int8_w8a8_block,torch.float16,10240,128,7168,256,8,0,0,asm,13001+23000,5080.0063
gfx936,int8_w8a8_block,torch.float16,12288,128,7168,256,8,0,0,asm,13001+23000,5935.4214
gfx936,int8_w8a8_block,torch.float16,14336,128,7168,256,8,0,0,asm,13001+23000,6797.3674
gfx936,int8_w8a8_block,torch.float16,16384,128,7168,256,8,0,0,asm,13001+23000,7704.9349
gfx936,int8_w8a8_block,torch.float16,17408,128,7168,256,8,0,0,asm,13001+23000,8254.6709
gfx936,int8_w8a8_block,torch.float16,24576,128,7168,256,8,0,0,asm,13001+23000,11162.5584
gfx936,int8_w8a8_block,torch.float16,32768,128,7168,256,8,0,0,asm,13001+23000,14747.3124
gfx936,int8_w8a8_block,torch.float16,40960,128,7168,256,8,0,0,asm,13001+23101,14859.3376
gfx936,int8_w8a8_block,torch.float16,49152,128,7168,256,8,0,0,asm,13001+23000,21041.0904
gfx936,int8_w8a8_block,torch.float16,57344,128,7168,256,8,0,0,asm,13001+23000,24838.7834
gfx936,int8_w8a8_block,torch.float16,1,256,7168,256,8,0,0,asm,10008+20000,80.7245
gfx936,int8_w8a8_block,torch.float16,2,256,7168,256,8,0,0,asm,10007+20000,118.7213
gfx936,int8_w8a8_block,torch.float16,3,256,7168,256,8,0,0,asm,10007+20000,156.7637
gfx936,int8_w8a8_block,torch.float16,4,256,7168,256,8,0,0,asm,10003+20000,200.2542
gfx936,int8_w8a8_block,torch.float16,5,256,7168,256,8,0,0,asm,10007+20000,224.9911
gfx936,int8_w8a8_block,torch.float16,6,256,7168,256,8,0,0,asm,10007+20000,253.4003
gfx936,int8_w8a8_block,torch.float16,7,256,7168,256,8,0,0,asm,10007+20000,285.5153
gfx936,int8_w8a8_block,torch.float16,8,256,7168,256,8,0,0,asm,10007+20000,302.3235
gfx936,int8_w8a8_block,torch.float16,9,256,7168,256,8,0,0,asm,10007+20000,332.5963
gfx936,int8_w8a8_block,torch.float16,10,256,7168,256,8,0,0,asm,10007+20000,356.543
gfx936,int8_w8a8_block,torch.float16,11,256,7168,256,8,0,0,asm,10007+20000,379.9048
gfx936,int8_w8a8_block,torch.float16,12,256,7168,256,8,0,0,asm,10007+20000,396.6579
gfx936,int8_w8a8_block,torch.float16,13,256,7168,256,8,0,0,asm,10007+20000,421.5194
gfx936,int8_w8a8_block,torch.float16,14,256,7168,256,8,0,0,asm,10007+20000,449.1545
gfx936,int8_w8a8_block,torch.float16,15,256,7168,256,8,0,0,asm,10007+20000,464.3584
gfx936,int8_w8a8_block,torch.float16,16,256,7168,256,8,0,0,asm,10007+20000,476.141
gfx936,int8_w8a8_block,torch.float16,17,256,7168,256,8,0,0,asm,10007+20000,487.9287
gfx936,int8_w8a8_block,torch.float16,18,256,7168,256,8,0,0,asm,10007+20000,510.899
gfx936,int8_w8a8_block,torch.float16,20,256,7168,256,8,0,0,asm,10007+20000,549.3483
gfx936,int8_w8a8_block,torch.float16,24,256,7168,256,8,0,0,asm,10007+20000,629.1473
gfx936,int8_w8a8_block,torch.float16,28,256,7168,256,8,0,0,asm,10007+20000,707.0826
gfx936,int8_w8a8_block,torch.float16,32,256,7168,256,8,0,0,asm,10007+20000,759.8868
gfx936,int8_w8a8_block,torch.float16,34,256,7168,256,8,0,0,asm,10007+20000,764.212
gfx936,int8_w8a8_block,torch.float16,36,256,7168,256,8,0,0,asm,10007+20000,794.3741
gfx936,int8_w8a8_block,torch.float16,40,256,7168,256,8,0,0,asm,10007+20000,826.9443
gfx936,int8_w8a8_block,torch.float16,44,256,7168,256,8,0,0,asm,10007+20000,865.1451
gfx936,int8_w8a8_block,torch.float16,48,256,7168,256,8,0,0,asm,10007+20000,888.0602
gfx936,int8_w8a8_block,torch.float16,56,256,7168,256,8,0,0,asm,10007+20000,934.0327
gfx936,int8_w8a8_block,torch.float16,64,256,7168,256,8,0,0,asm,10007+20000,969.9721
gfx936,int8_w8a8_block,torch.float16,68,256,7168,256,8,0,0,asm,10007+20000,979.8173
gfx936,int8_w8a8_block,torch.float16,72,256,7168,256,8,0,0,asm,10007+20000,1006.7779
gfx936,int8_w8a8_block,torch.float16,80,256,7168,256,8,0,0,asm,10007+20000,1042.8624
gfx936,int8_w8a8_block,torch.float16,88,256,7168,256,8,0,0,asm,10007+20000,1074.5793
gfx936,int8_w8a8_block,torch.float16,96,256,7168,256,8,0,0,asm,10007+20000,1093.5004
gfx936,int8_w8a8_block,torch.float16,104,256,7168,256,8,0,0,asm,10007+20000,1102.8706
gfx936,int8_w8a8_block,torch.float16,112,256,7168,256,8,0,0,asm,10007+20000,1120.0809
gfx936,int8_w8a8_block,torch.float16,128,256,7168,256,8,0,0,asm,10007+20000,1151.5798
gfx936,int8_w8a8_block,torch.float16,144,256,7168,256,8,0,0,asm,10007+20000,1163.1415
gfx936,int8_w8a8_block,torch.float16,160,256,7168,256,8,0,0,asm,10007+20000,1176.8686
gfx936,int8_w8a8_block,torch.float16,192,256,7168,256,8,0,0,asm,10007+20000,1193.123
gfx936,int8_w8a8_block,torch.float16,224,256,7168,256,8,0,0,asm,10007+20000,1219.1989
gfx936,int8_w8a8_block,torch.float16,256,256,7168,256,8,0,0,asm,10007+20000,1234.1733
gfx936,int8_w8a8_block,torch.float16,320,256,7168,256,8,0,0,asm,10007+20000,1247.3027
gfx936,int8_w8a8_block,torch.float16,384,256,7168,256,8,0,0,asm,10007+20000,1274.2434
gfx936,int8_w8a8_block,torch.float16,448,256,7168,256,8,0,0,asm,10007+20000,1308.2962
gfx936,int8_w8a8_block,torch.float16,512,256,7168,256,8,0,0,asm,11005+21000,1362.198
gfx936,int8_w8a8_block,torch.float16,576,256,7168,256,8,0,0,asm,11007+21000,1392.7605
gfx936,int8_w8a8_block,torch.float16,640,256,7168,256,8,0,0,asm,11007+21000,1412.2071
gfx936,int8_w8a8_block,torch.float16,704,256,7168,256,8,0,0,asm,11007+21000,1444.9837
gfx936,int8_w8a8_block,torch.float16,768,256,7168,256,8,0,0,asm,11007+21000,1470.1744
gfx936,int8_w8a8_block,torch.float16,832,256,7168,256,8,0,0,asm,11007+21000,1497.4842
gfx936,int8_w8a8_block,torch.float16,896,256,7168,256,8,0,0,asm,11007+21000,1518.252
gfx936,int8_w8a8_block,torch.float16,960,256,7168,256,8,0,0,asm,11007+21000,1528.7868
gfx936,int8_w8a8_block,torch.float16,1024,256,7168,256,8,0,0,asm,11007+21000,1552.9606
gfx936,int8_w8a8_block,torch.float16,1152,256,7168,256,8,0,0,asm,12000+22000,1637.8453
gfx936,int8_w8a8_block,torch.float16,1280,256,7168,256,8,0,0,asm,12000+22000,1670.9866
gfx936,int8_w8a8_block,torch.float16,1408,256,7168,256,8,0,0,asm,12000+22000,1735.3633
gfx936,int8_w8a8_block,torch.float16,1536,256,7168,256,8,0,0,asm,11010+21000,1778.5593
gfx936,int8_w8a8_block,torch.float16,1664,256,7168,256,8,0,0,asm,12000+22000,1833.8578
gfx936,int8_w8a8_block,torch.float16,1792,256,7168,256,8,0,0,asm,12001+22000,1910.7194
gfx936,int8_w8a8_block,torch.float16,1920,256,7168,256,8,0,0,asm,12001+22000,1972.2045
gfx936,int8_w8a8_block,torch.float16,2048,256,7168,256,8,0,0,asm,12001+22000,2084.3359
gfx936,int8_w8a8_block,torch.float16,2304,256,7168,256,8,0,0,asm,12003+22000,2256.3812
gfx936,int8_w8a8_block,torch.float16,2560,256,7168,256,8,0,0,asm,12003+22000,2383.4745
gfx936,int8_w8a8_block,torch.float16,2816,256,7168,256,8,0,0,asm,12003+22000,2460.2104
gfx936,int8_w8a8_block,torch.float16,3072,256,7168,256,8,0,0,asm,12003+22000,2541.0377
gfx936,int8_w8a8_block,torch.float16,3328,256,7168,256,8,0,0,asm,12002+22000,2635.4526
gfx936,int8_w8a8_block,torch.float16,3584,256,7168,256,8,0,0,asm,12003+22000,2742.33
gfx936,int8_w8a8_block,torch.float16,3840,256,7168,256,8,0,0,asm,12003+22000,2879.9588
gfx936,int8_w8a8_block,torch.float16,4096,256,7168,256,8,0,0,asm,12003+22000,3101.3169
gfx936,int8_w8a8_block,torch.float16,4608,256,7168,256,8,0,0,asm,12003+22000,3600.3408
gfx936,int8_w8a8_block,torch.float16,5120,256,7168,256,8,0,0,asm,12003+22000,3814.8517
gfx936,int8_w8a8_block,torch.float16,5632,256,7168,256,8,0,0,asm,12003+22000,3988.5398
gfx936,int8_w8a8_block,torch.float16,6144,256,7168,256,8,0,0,asm,12002+22000,4396.1157
gfx936,int8_w8a8_block,torch.float16,6656,256,7168,256,8,0,0,asm,13001+23000,4648.7067
gfx936,int8_w8a8_block,torch.float16,7168,256,7168,256,8,0,0,asm,13001+23000,4818.7636
gfx936,int8_w8a8_block,torch.float16,7680,256,7168,256,8,0,0,asm,13001+23000,5024.0016
gfx936,int8_w8a8_block,torch.float16,8192,256,7168,256,8,0,0,asm,13001+23000,5549.7372
gfx936,int8_w8a8_block,torch.float16,10240,256,7168,256,8,0,0,asm,13001+23000,6802.854
gfx936,int8_w8a8_block,torch.float16,12288,256,7168,256,8,0,0,asm,13001+23000,7901.7596
gfx936,int8_w8a8_block,torch.float16,14336,256,7168,256,8,0,0,asm,13001+23000,9098.0764
gfx936,int8_w8a8_block,torch.float16,16384,256,7168,256,8,0,0,asm,13001+23000,10190.1389
gfx936,int8_w8a8_block,torch.float16,17408,256,7168,256,8,0,0,asm,13001+23000,10946.5745
gfx936,int8_w8a8_block,torch.float16,24576,256,7168,256,8,0,0,asm,13001+23000,14740.2802
gfx936,int8_w8a8_block,torch.float16,32768,256,7168,256,8,0,0,asm,13001+23000,19489.3806
gfx936,int8_w8a8_block,torch.float16,40960,256,7168,256,8,0,0,asm,13001+23000,22699.7344
gfx936,int8_w8a8_block,torch.float16,49152,256,7168,256,8,0,0,asm,13001+23000,27492.7934
gfx938,int8_w8a8_block,torch.float16,1,128,7168,256,8,0,0,asm,10008+20100,64.3619
gfx938,int8_w8a8_block,torch.float16,2,128,7168,256,8,0,0,asm,10007+20101,74.3393
gfx938,int8_w8a8_block,torch.float16,3,128,7168,256,8,0,0,asm,10002+20101,85.2683
gfx938,int8_w8a8_block,torch.float16,4,128,7168,256,8,0,0,asm,10007+20101,102.7658
gfx938,int8_w8a8_block,torch.float16,5,128,7168,256,8,0,0,asm,10006+20101,126.6177
gfx938,int8_w8a8_block,torch.float16,6,128,7168,256,8,0,0,asm,10006+20101,131.0115
gfx938,int8_w8a8_block,torch.float16,7,128,7168,256,8,0,0,asm,10005+20101,137.7564
gfx938,int8_w8a8_block,torch.float16,8,128,7168,256,8,0,0,asm,10006+20101,143.7584
gfx938,int8_w8a8_block,torch.float16,9,128,7168,256,8,0,0,asm,10002+20101,157.2804
gfx938,int8_w8a8_block,torch.float16,10,128,7168,256,8,0,0,asm,10002+20101,170.1256
gfx938,int8_w8a8_block,torch.float16,11,128,7168,256,8,0,0,asm,10007+20101,202.2689
gfx938,int8_w8a8_block,torch.float16,12,128,7168,256,8,0,0,asm,10002+20101,200.4762
gfx938,int8_w8a8_block,torch.float16,13,128,7168,256,8,0,0,asm,10002+20101,204.1725
gfx938,int8_w8a8_block,torch.float16,14,128,7168,256,8,0,0,asm,10002+20101,209.0177
gfx938,int8_w8a8_block,torch.float16,15,128,7168,256,8,0,0,asm,10001+20101,214.7243
gfx938,int8_w8a8_block,torch.float16,16,128,7168,256,8,0,0,asm,10002+20101,218.2157
gfx938,int8_w8a8_block,torch.float16,17,128,7168,256,8,0,0,asm,10003+20101,222.0033
gfx938,int8_w8a8_block,torch.float16,18,128,7168,256,8,0,0,asm,10002+20101,226.8935
gfx938,int8_w8a8_block,torch.float16,20,128,7168,256,8,0,0,asm,10006+20101,253.5108
gfx938,int8_w8a8_block,torch.float16,24,128,7168,256,8,0,0,asm,10002+20101,277.08
gfx938,int8_w8a8_block,torch.float16,28,128,7168,256,8,0,0,asm,10002+20101,327.7822
gfx938,int8_w8a8_block,torch.float16,32,128,7168,256,8,0,0,asm,10002+20101,338.7196
gfx938,int8_w8a8_block,torch.float16,34,128,7168,256,8,0,0,asm,10002+20101,323.1064
gfx938,int8_w8a8_block,torch.float16,36,128,7168,256,8,0,0,asm,10001+20101,336.2674
gfx938,int8_w8a8_block,torch.float16,40,128,7168,256,8,0,0,asm,10005+20101,361.1001
gfx938,int8_w8a8_block,torch.float16,44,128,7168,256,8,0,0,asm,10006+20101,371.578
gfx938,int8_w8a8_block,torch.float16,48,128,7168,256,8,0,0,asm,10002+20101,376.6324
gfx938,int8_w8a8_block,torch.float16,56,128,7168,256,8,0,0,asm,10002+20101,390.3019
gfx938,int8_w8a8_block,torch.float16,64,128,7168,256,8,0,0,asm,10002+20101,415.6762
gfx938,int8_w8a8_block,torch.float16,68,128,7168,256,8,0,0,asm,10002+20101,429.6441
gfx938,int8_w8a8_block,torch.float16,72,128,7168,256,8,0,0,asm,10002+20101,430.7736
gfx938,int8_w8a8_block,torch.float16,80,128,7168,256,8,0,0,asm,10007+20101,452.7017
gfx938,int8_w8a8_block,torch.float16,88,128,7168,256,8,0,0,asm,10002+20101,447.3998
gfx938,int8_w8a8_block,torch.float16,96,128,7168,256,8,0,0,asm,10002+20101,447.6351
gfx938,int8_w8a8_block,torch.float16,104,128,7168,256,8,0,0,asm,10001+20101,460.7016
gfx938,int8_w8a8_block,torch.float16,112,128,7168,256,8,0,0,asm,10002+20101,460.3201
gfx938,int8_w8a8_block,torch.float16,128,128,7168,256,8,0,0,asm,10002+20101,463.9509
gfx938,int8_w8a8_block,torch.float16,144,128,7168,256,8,0,0,asm,10002+20101,489.5343
gfx938,int8_w8a8_block,torch.float16,160,128,7168,256,8,0,0,asm,10002+20101,494.0718
gfx938,int8_w8a8_block,torch.float16,192,128,7168,256,8,0,0,asm,10002+20101,503.7496
gfx938,int8_w8a8_block,torch.float16,224,128,7168,256,8,0,0,asm,10001+20101,509.2415
gfx938,int8_w8a8_block,torch.float16,256,128,7168,256,8,0,0,asm,10005+20101,514.1414
gfx938,int8_w8a8_block,torch.float16,320,128,7168,256,8,0,0,asm,10006+20101,533.5136
gfx938,int8_w8a8_block,torch.float16,384,128,7168,256,8,0,0,asm,10002+20101,538.608
gfx938,int8_w8a8_block,torch.float16,448,128,7168,256,8,0,0,asm,10002+20101,563.3719
gfx938,int8_w8a8_block,torch.float16,512,128,7168,256,8,0,0,asm,10005+20101,587.4498
gfx938,int8_w8a8_block,torch.float16,576,128,7168,256,8,0,0,asm,11010+21101,608.6394
gfx938,int8_w8a8_block,torch.float16,640,128,7168,256,8,0,0,asm,11010+21101,632.7871
gfx938,int8_w8a8_block,torch.float16,704,128,7168,256,8,0,0,asm,11010+21101,641.8249
gfx938,int8_w8a8_block,torch.float16,768,128,7168,256,8,0,0,asm,11010+21101,654.0136
gfx938,int8_w8a8_block,torch.float16,832,128,7168,256,8,0,0,asm,11009+21101,663.6258
gfx938,int8_w8a8_block,torch.float16,896,128,7168,256,8,0,0,asm,11006+21101,696.7302
gfx938,int8_w8a8_block,torch.float16,960,128,7168,256,8,0,0,asm,11010+21101,711.3972
gfx938,int8_w8a8_block,torch.float16,1024,128,7168,256,8,0,0,asm,11009+21101,761.4979
gfx938,int8_w8a8_block,torch.float16,1152,128,7168,256,8,0,0,asm,11010+21101,829.2662
gfx938,int8_w8a8_block,torch.float16,1280,128,7168,256,8,0,0,asm,11010+21101,870.6156
gfx938,int8_w8a8_block,torch.float16,1408,128,7168,256,8,0,0,asm,11010+21101,897.6952
gfx938,int8_w8a8_block,torch.float16,1536,128,7168,256,8,0,0,asm,11010+21101,981.7316
gfx938,int8_w8a8_block,torch.float16,1664,128,7168,256,8,0,0,asm,11010+21101,997.8185
gfx938,int8_w8a8_block,torch.float16,1792,128,7168,256,8,0,0,asm,11010+21101,1033.4067
gfx938,int8_w8a8_block,torch.float16,1920,128,7168,256,8,0,0,asm,11010+21101,1108.3387
gfx938,int8_w8a8_block,torch.float16,2048,128,7168,256,8,0,0,asm,11010+21101,1145.0203
gfx938,int8_w8a8_block,torch.float16,2304,128,7168,256,8,0,0,asm,11010+21101,1316.086
gfx938,int8_w8a8_block,torch.float16,2560,128,7168,256,8,0,0,asm,11010+21101,1387.9345
gfx938,int8_w8a8_block,torch.float16,2816,128,7168,256,8,0,0,asm,11010+21101,1488.2435
gfx938,int8_w8a8_block,torch.float16,3072,128,7168,256,8,0,0,asm,11010+21101,1620.1726
gfx938,int8_w8a8_block,torch.float16,3328,128,7168,256,8,0,0,asm,11010+21101,1742.2218
gfx938,int8_w8a8_block,torch.float16,3584,128,7168,256,8,0,0,asm,11010+21101,1862.3263
gfx938,int8_w8a8_block,torch.float16,3840,128,7168,256,8,0,0,asm,11010+21101,1934.8699
gfx938,int8_w8a8_block,torch.float16,4096,128,7168,256,8,0,0,asm,11010+21101,2045.1929
gfx938,int8_w8a8_block,torch.float16,4608,128,7168,256,8,0,0,asm,11010+21101,2279.0466
gfx938,int8_w8a8_block,torch.float16,5120,128,7168,256,8,0,0,asm,11010+21101,2509.8803
gfx938,int8_w8a8_block,torch.float16,5632,128,7168,256,8,0,0,asm,11010+21101,2757.2319
gfx938,int8_w8a8_block,torch.float16,6144,128,7168,256,8,0,0,asm,11010+21101,2985.8396
gfx938,int8_w8a8_block,torch.float16,6656,128,7168,256,8,0,0,asm,11010+21101,3184.1954
gfx938,int8_w8a8_block,torch.float16,7168,128,7168,256,8,0,0,asm,11010+21101,3425.8325
gfx938,int8_w8a8_block,torch.float16,7680,128,7168,256,8,0,0,asm,11010+21101,3647.3802
gfx938,int8_w8a8_block,torch.float16,8192,128,7168,256,8,0,0,asm,11010+21101,3867.3574
gfx938,int8_w8a8_block,torch.float16,10240,128,7168,256,8,0,0,asm,11010+21101,4765.7119
gfx938,int8_w8a8_block,torch.float16,12288,128,7168,256,8,0,0,asm,11010+21101,5724.0817
gfx938,int8_w8a8_block,torch.float16,14336,128,7168,256,8,0,0,asm,11010+21101,6569.5353
gfx938,int8_w8a8_block,torch.float16,16384,128,7168,256,8,0,0,asm,11010+21101,7444.7413
gfx938,int8_w8a8_block,torch.float16,17408,128,7168,256,8,0,0,asm,11010+21101,7919.0884
gfx938,int8_w8a8_block,torch.float16,24576,128,7168,256,8,0,0,asm,11010+21101,11183.5046
gfx938,int8_w8a8_block,torch.float16,32768,128,7168,256,8,0,0,asm,11010+21101,14692.1092
gfx938,int8_w8a8_block,torch.float16,40960,128,7168,256,8,0,0,asm,13001+23101,15532.3525
gfx938,int8_w8a8_block,torch.float16,49152,128,7168,256,8,0,0,asm,11010+21101,21012.5975
gfx938,int8_w8a8_block,torch.float16,57344,128,7168,256,8,0,0,asm,11010+21101,24817.8367
gfx938,int8_w8a8_block,torch.float16,65536,128,7168,256,8,0,0,asm,11010+21101,28757.9419
gfx938,int8_w8a8_block,torch.float16,1,256,7168,256,8,0,0,asm,10007+20000,74.0639
gfx938,int8_w8a8_block,torch.float16,2,256,7168,256,8,0,0,asm,10002+20000,102.3192
gfx938,int8_w8a8_block,torch.float16,3,256,7168,256,8,0,0,asm,10006+20000,135.7052
gfx938,int8_w8a8_block,torch.float16,4,256,7168,256,8,0,0,asm,10002+20000,169.3255
gfx938,int8_w8a8_block,torch.float16,5,256,7168,256,8,0,0,asm,10002+20000,197.5692
gfx938,int8_w8a8_block,torch.float16,6,256,7168,256,8,0,0,asm,10002+20000,206.6023
gfx938,int8_w8a8_block,torch.float16,7,256,7168,256,8,0,0,asm,10003+20000,229.8469
gfx938,int8_w8a8_block,torch.float16,8,256,7168,256,8,0,0,asm,10006+20000,243.5164
gfx938,int8_w8a8_block,torch.float16,9,256,7168,256,8,0,0,asm,10006+20000,260.1334
gfx938,int8_w8a8_block,torch.float16,10,256,7168,256,8,0,0,asm,10005+20000,280.0511
gfx938,int8_w8a8_block,torch.float16,11,256,7168,256,8,0,0,asm,10002+20000,305.6738
gfx938,int8_w8a8_block,torch.float16,12,256,7168,256,8,0,0,asm,10002+20000,310.3367
gfx938,int8_w8a8_block,torch.float16,13,256,7168,256,8,0,0,asm,10001+20000,323.612
gfx938,int8_w8a8_block,torch.float16,14,256,7168,256,8,0,0,asm,10006+20000,341.7984
gfx938,int8_w8a8_block,torch.float16,15,256,7168,256,8,0,0,asm,10005+20000,359.621
gfx938,int8_w8a8_block,torch.float16,16,256,7168,256,8,0,0,asm,10006+20000,361.7879
gfx938,int8_w8a8_block,torch.float16,17,256,7168,256,8,0,0,asm,10006+20000,365.4648
gfx938,int8_w8a8_block,torch.float16,18,256,7168,256,8,0,0,asm,10005+20000,379.5129
gfx938,int8_w8a8_block,torch.float16,20,256,7168,256,8,0,0,asm,10001+20000,410.4977
gfx938,int8_w8a8_block,torch.float16,24,256,7168,256,8,0,0,asm,10006+20000,460.7313
gfx938,int8_w8a8_block,torch.float16,28,256,7168,256,8,0,0,asm,10002+20000,523.8077
gfx938,int8_w8a8_block,torch.float16,32,256,7168,256,8,0,0,asm,10006+20000,555.1036
gfx938,int8_w8a8_block,torch.float16,34,256,7168,256,8,0,0,asm,10006+20000,554.0263
gfx938,int8_w8a8_block,torch.float16,36,256,7168,256,8,0,0,asm,10002+20000,572.3591
gfx938,int8_w8a8_block,torch.float16,40,256,7168,256,8,0,0,asm,10001+20000,593.9758
gfx938,int8_w8a8_block,torch.float16,44,256,7168,256,8,0,0,asm,10001+20000,617.3905
gfx938,int8_w8a8_block,torch.float16,48,256,7168,256,8,0,0,asm,10001+20000,633.2489
gfx938,int8_w8a8_block,torch.float16,56,256,7168,256,8,0,0,asm,10002+20000,662.2223
gfx938,int8_w8a8_block,torch.float16,64,256,7168,256,8,0,0,asm,10002+20000,685.0154
gfx938,int8_w8a8_block,torch.float16,68,256,7168,256,8,0,0,asm,10001+20000,695.8222
gfx938,int8_w8a8_block,torch.float16,72,256,7168,256,8,0,0,asm,10001+20000,709.9707
gfx938,int8_w8a8_block,torch.float16,80,256,7168,256,8,0,0,asm,10001+20000,774.6035
gfx938,int8_w8a8_block,torch.float16,88,256,7168,256,8,0,0,asm,10002+20000,757.6815
gfx938,int8_w8a8_block,torch.float16,96,256,7168,256,8,0,0,asm,10002+20000,760.8093
gfx938,int8_w8a8_block,torch.float16,104,256,7168,256,8,0,0,asm,10002+20000,779.7121
gfx938,int8_w8a8_block,torch.float16,112,256,7168,256,8,0,0,asm,10002+20000,776.0946
gfx938,int8_w8a8_block,torch.float16,128,256,7168,256,8,0,0,asm,10002+20000,792.7909
gfx938,int8_w8a8_block,torch.float16,144,256,7168,256,8,0,0,asm,10002+20000,800.8822
gfx938,int8_w8a8_block,torch.float16,160,256,7168,256,8,0,0,asm,10002+20000,812.1142
gfx938,int8_w8a8_block,torch.float16,192,256,7168,256,8,0,0,asm,10002+20000,825.0625
gfx938,int8_w8a8_block,torch.float16,224,256,7168,256,8,0,0,asm,10002+20000,833.9061
gfx938,int8_w8a8_block,torch.float16,256,256,7168,256,8,0,0,asm,10002+20000,844.1267
gfx938,int8_w8a8_block,torch.float16,320,256,7168,256,8,0,0,asm,10002+20000,872.8442
gfx938,int8_w8a8_block,torch.float16,384,256,7168,256,8,0,0,asm,10005+20000,903.3915
gfx938,int8_w8a8_block,torch.float16,448,256,7168,256,8,0,0,asm,10006+20000,945.5806
gfx938,int8_w8a8_block,torch.float16,512,256,7168,256,8,0,0,asm,11006+21000,960.4355
gfx938,int8_w8a8_block,torch.float16,576,256,7168,256,8,0,0,asm,11006+21000,975.8254
gfx938,int8_w8a8_block,torch.float16,640,256,7168,256,8,0,0,asm,11006+21000,997.3548
gfx938,int8_w8a8_block,torch.float16,704,256,7168,256,8,0,0,asm,11006+21000,1015.4870000000001
gfx938,int8_w8a8_block,torch.float16,768,256,7168,256,8,0,0,asm,11010+21000,1032.7099
gfx938,int8_w8a8_block,torch.float16,832,256,7168,256,8,0,0,asm,11010+21000,1051.2385
gfx938,int8_w8a8_block,torch.float16,896,256,7168,256,8,0,0,asm,11010+21000,1096.4795
gfx938,int8_w8a8_block,torch.float16,960,256,7168,256,8,0,0,asm,11010+21000,1153.3346
gfx938,int8_w8a8_block,torch.float16,1024,256,7168,256,8,0,0,asm,11010+21000,1210.1494
gfx938,int8_w8a8_block,torch.float16,1152,256,7168,256,8,0,0,asm,11010+21000,1356.8225
gfx938,int8_w8a8_block,torch.float16,1280,256,7168,256,8,0,0,asm,12003+22000,1430.5484
gfx938,int8_w8a8_block,torch.float16,1408,256,7168,256,8,0,0,asm,12003+22000,1462.7597
gfx938,int8_w8a8_block,torch.float16,1536,256,7168,256,8,0,0,asm,12003+22000,1491.0231
gfx938,int8_w8a8_block,torch.float16,1664,256,7168,256,8,0,0,asm,12003+22000,1532.0672
gfx938,int8_w8a8_block,torch.float16,1792,256,7168,256,8,0,0,asm,12003+22000,1634.4874
gfx938,int8_w8a8_block,torch.float16,1920,256,7168,256,8,0,0,asm,12003+22000,1704.1272
gfx938,int8_w8a8_block,torch.float16,2048,256,7168,256,8,0,0,asm,11010+21000,1906.7057
gfx938,int8_w8a8_block,torch.float16,2304,256,7168,256,8,0,0,asm,11010+21000,2163.0306
gfx938,int8_w8a8_block,torch.float16,2560,256,7168,256,8,0,0,asm,11010+21000,2300.1239
gfx938,int8_w8a8_block,torch.float16,2816,256,7168,256,8,0,0,asm,11010+21000,2437.1261
gfx938,int8_w8a8_block,torch.float16,3072,256,7168,256,8,0,0,asm,13001+23000,2637.9526
gfx938,int8_w8a8_block,torch.float16,3328,256,7168,256,8,0,0,asm,12003+22000,2726.2909
gfx938,int8_w8a8_block,torch.float16,3584,256,7168,256,8,0,0,asm,12003+22000,2809.1701
gfx938,int8_w8a8_block,torch.float16,3840,256,7168,256,8,0,0,asm,12003+22000,2992.6435
gfx938,int8_w8a8_block,torch.float16,4096,256,7168,256,8,0,0,asm,12003+22000,3289.1543
gfx938,int8_w8a8_block,torch.float16,4608,256,7168,256,8,0,0,asm,11010+21000,3804.5302
gfx938,int8_w8a8_block,torch.float16,5120,256,7168,256,8,0,0,asm,12003+22000,4015.5876
gfx938,int8_w8a8_block,torch.float16,5632,256,7168,256,8,0,0,asm,12003+22000,4216.9662
gfx938,int8_w8a8_block,torch.float16,6144,256,7168,256,8,0,0,asm,12003+22000,4648.8637
gfx938,int8_w8a8_block,torch.float16,6656,256,7168,256,8,0,0,asm,13001+23000,4987.557
gfx938,int8_w8a8_block,torch.float16,7168,256,7168,256,8,0,0,asm,13001+23000,5097.7043
gfx938,int8_w8a8_block,torch.float16,7680,256,7168,256,8,0,0,asm,13001+23000,5418.374
gfx938,int8_w8a8_block,torch.float16,8192,256,7168,256,8,0,0,asm,12003+22000,5973.1091
gfx938,int8_w8a8_block,torch.float16,10240,256,7168,256,8,0,0,asm,12003+22000,7325.1873
gfx938,int8_w8a8_block,torch.float16,12288,256,7168,256,8,0,0,asm,13001+23000,8555.6002
gfx938,int8_w8a8_block,torch.float16,14336,256,7168,256,8,0,0,asm,13001+23000,9886.2731
gfx938,int8_w8a8_block,torch.float16,16384,256,7168,256,8,0,0,asm,13001+23000,11056.8632
gfx938,int8_w8a8_block,torch.float16,17408,256,7168,256,8,0,0,asm,12003+22000,12029.4321
gfx938,int8_w8a8_block,torch.float16,24576,256,7168,256,8,0,0,asm,13001+23000,16199.1447
gfx938,int8_w8a8_block,torch.float16,32768,256,7168,256,8,0,0,asm,13001+23000,21211.1206
gfx938,int8_w8a8_block,torch.float16,40960,256,7168,256,8,0,0,asm,13001+23000,25292.6729
gfx938,int8_w8a8_block,torch.float16,49152,256,7168,256,8,0,0,asm,13001+23000,30310.2679
gfx938,int8_w8a8_block,torch.float16,57344,256,7168,256,8,0,0,asm,13001+23000,35514.6339
gfx938,int8_w8a8_block,torch.float16,65536,256,7168,256,8,0,0,asm,13001+23000,40549.9911
gfx938,f8_w8a8_block,torch.float16,1,128,7168,256,8,0,0,asm,10008+20000,64.5697
gfx938,f8_w8a8_block,torch.float16,2,128,7168,256,8,0,0,asm,10007+20101,75.7958
gfx938,f8_w8a8_block,torch.float16,3,128,7168,256,8,0,0,asm,10002+20101,88.1569
gfx938,f8_w8a8_block,torch.float16,4,128,7168,256,8,0,0,asm,10002+20101,101.3875
gfx938,f8_w8a8_block,torch.float16,5,128,7168,256,8,0,0,asm,10004+20101,124.3946
gfx938,f8_w8a8_block,torch.float16,6,128,7168,256,8,0,0,asm,10006+20101,130.9464
gfx938,f8_w8a8_block,torch.float16,7,128,7168,256,8,0,0,asm,10006+20101,137.4365
gfx938,f8_w8a8_block,torch.float16,8,128,7168,256,8,0,0,asm,10006+20101,143.0817
gfx938,f8_w8a8_block,torch.float16,9,128,7168,256,8,0,0,asm,10002+20101,157.5882
gfx938,f8_w8a8_block,torch.float16,10,128,7168,256,8,0,0,asm,10002+20101,168.0538
gfx938,f8_w8a8_block,torch.float16,11,128,7168,256,8,0,0,asm,10002+20101,198.4332
gfx938,f8_w8a8_block,torch.float16,12,128,7168,256,8,0,0,asm,10007+20101,200.4189
gfx938,f8_w8a8_block,torch.float16,13,128,7168,256,8,0,0,asm,10002+20101,203.4917
gfx938,f8_w8a8_block,torch.float16,14,128,7168,256,8,0,0,asm,10002+20101,206.6752
gfx938,f8_w8a8_block,torch.float16,15,128,7168,256,8,0,0,asm,10002+20101,211.3234
gfx938,f8_w8a8_block,torch.float16,16,128,7168,256,8,0,0,asm,10002+20101,215.7665
gfx938,f8_w8a8_block,torch.float16,17,128,7168,256,8,0,0,asm,10002+20101,218.0528
gfx938,f8_w8a8_block,torch.float16,18,128,7168,256,8,0,0,asm,10001+20101,226.9306
gfx938,f8_w8a8_block,torch.float16,20,128,7168,256,8,0,0,asm,10006+20101,249.3592
gfx938,f8_w8a8_block,torch.float16,24,128,7168,256,8,0,0,asm,10006+20101,273.2813
gfx938,f8_w8a8_block,torch.float16,28,128,7168,256,8,0,0,asm,10002+20101,326.4696
gfx938,f8_w8a8_block,torch.float16,32,128,7168,256,8,0,0,asm,10001+20101,334.1086
gfx938,f8_w8a8_block,torch.float16,34,128,7168,256,8,0,0,asm,10002+20101,322.4625
gfx938,f8_w8a8_block,torch.float16,36,128,7168,256,8,0,0,asm,10002+20101,332.4153
gfx938,f8_w8a8_block,torch.float16,40,128,7168,256,8,0,0,asm,10005+20101,359.0573
gfx938,f8_w8a8_block,torch.float16,44,128,7168,256,8,0,0,asm,10005+20101,371.3075
gfx938,f8_w8a8_block,torch.float16,48,128,7168,256,8,0,0,asm,10006+20101,377.0101
gfx938,f8_w8a8_block,torch.float16,56,128,7168,256,8,0,0,asm,10002+20101,386.4541
gfx938,f8_w8a8_block,torch.float16,64,128,7168,256,8,0,0,asm,10002+20101,414.1463
gfx938,f8_w8a8_block,torch.float16,68,128,7168,256,8,0,0,asm,10002+20101,423.1842
gfx938,f8_w8a8_block,torch.float16,72,128,7168,256,8,0,0,asm,10002+20100,456.7184
gfx938,f8_w8a8_block,torch.float16,80,128,7168,256,8,0,0,asm,10007+20101,448.1646
gfx938,f8_w8a8_block,torch.float16,88,128,7168,256,8,0,0,asm,10002+20101,448.0963
gfx938,f8_w8a8_block,torch.float16,96,128,7168,256,8,0,0,asm,10002+20101,447.221
gfx938,f8_w8a8_block,torch.float16,104,128,7168,256,8,0,0,asm,10001+20101,459.5944
gfx938,f8_w8a8_block,torch.float16,112,128,7168,256,8,0,0,asm,10001+20101,457.5964
gfx938,f8_w8a8_block,torch.float16,128,128,7168,256,8,0,0,asm,10002+20101,465.9861
gfx938,f8_w8a8_block,torch.float16,144,128,7168,256,8,0,0,asm,10002+20101,487.6434
gfx938,f8_w8a8_block,torch.float16,160,128,7168,256,8,0,0,asm,10002+20101,493.5511
gfx938,f8_w8a8_block,torch.float16,192,128,7168,256,8,0,0,asm,10001+20101,501.9257
gfx938,f8_w8a8_block,torch.float16,224,128,7168,256,8,0,0,asm,10005+20101,507.8977
gfx938,f8_w8a8_block,torch.float16,256,128,7168,256,8,0,0,asm,10002+20101,511.9018
gfx938,f8_w8a8_block,torch.float16,320,128,7168,256,8,0,0,asm,10005+20101,532.5335
gfx938,f8_w8a8_block,torch.float16,384,128,7168,256,8,0,0,asm,10002+20101,538.9704
gfx938,f8_w8a8_block,torch.float16,448,128,7168,256,8,0,0,asm,10002+20101,565.112
gfx938,f8_w8a8_block,torch.float16,512,128,7168,256,8,0,0,asm,10006+20101,588.5628
gfx938,f8_w8a8_block,torch.float16,576,128,7168,256,8,0,0,asm,11010+21101,614.6829
gfx938,f8_w8a8_block,torch.float16,640,128,7168,256,8,0,0,asm,11010+21101,628.6065
gfx938,f8_w8a8_block,torch.float16,704,128,7168,256,8,0,0,asm,11010+21101,634.5557
gfx938,f8_w8a8_block,torch.float16,768,128,7168,256,8,0,0,asm,11010+21101,650.5685
gfx938,f8_w8a8_block,torch.float16,832,128,7168,256,8,0,0,asm,11010+21101,657.2756
gfx938,f8_w8a8_block,torch.float16,896,128,7168,256,8,0,0,asm,11006+21101,696.1905
gfx938,f8_w8a8_block,torch.float16,960,128,7168,256,8,0,0,asm,11010+21101,708.2019
gfx938,f8_w8a8_block,torch.float16,1024,128,7168,256,8,0,0,asm,11010+21101,757.7168
gfx938,f8_w8a8_block,torch.float16,1152,128,7168,256,8,0,0,asm,11010+21101,829.2878
gfx938,f8_w8a8_block,torch.float16,1280,128,7168,256,8,0,0,asm,11010+21101,868.635
gfx938,f8_w8a8_block,torch.float16,1408,128,7168,256,8,0,0,asm,11010+21101,899.1951
gfx938,f8_w8a8_block,torch.float16,1536,128,7168,256,8,0,0,asm,11010+21101,975.7805
gfx938,f8_w8a8_block,torch.float16,1664,128,7168,256,8,0,0,asm,11010+21101,996.4617
gfx938,f8_w8a8_block,torch.float16,1792,128,7168,256,8,0,0,asm,11010+21101,1030.6891
gfx938,f8_w8a8_block,torch.float16,1920,128,7168,256,8,0,0,asm,11010+21101,1101.5501
gfx938,f8_w8a8_block,torch.float16,2048,128,7168,256,8,0,0,asm,11010+21101,1145.2352
gfx938,f8_w8a8_block,torch.float16,2304,128,7168,256,8,0,0,asm,11010+21101,1308.0337
gfx938,f8_w8a8_block,torch.float16,2560,128,7168,256,8,0,0,asm,11010+21101,1375.4024
gfx938,f8_w8a8_block,torch.float16,2816,128,7168,256,8,0,0,asm,11010+21101,1478.738
gfx938,f8_w8a8_block,torch.float16,3072,128,7168,256,8,0,0,asm,11010+21101,1602.2884
gfx938,f8_w8a8_block,torch.float16,3328,128,7168,256,8,0,0,asm,11010+21101,1727.6481
gfx938,f8_w8a8_block,torch.float16,3584,128,7168,256,8,0,0,asm,11010+21101,1849.196
gfx938,f8_w8a8_block,torch.float16,3840,128,7168,256,8,0,0,asm,11010+21101,1911.3202
gfx938,f8_w8a8_block,torch.float16,4096,128,7168,256,8,0,0,asm,11010+21101,2019.8641
gfx938,f8_w8a8_block,torch.float16,4608,128,7168,256,8,0,0,asm,11010+21101,2259.4566
gfx938,f8_w8a8_block,torch.float16,5120,128,7168,256,8,0,0,asm,11010+21101,2484.118
gfx938,f8_w8a8_block,torch.float16,5632,128,7168,256,8,0,0,asm,11010+21101,2722.4067
gfx938,f8_w8a8_block,torch.float16,6144,128,7168,256,8,0,0,asm,11010+21101,2944.3125
gfx938,f8_w8a8_block,torch.float16,6656,128,7168,256,8,0,0,asm,11010+21101,3141.9019
gfx938,f8_w8a8_block,torch.float16,7168,128,7168,256,8,0,0,asm,11010+21101,3375.1217
gfx938,f8_w8a8_block,torch.float16,7680,128,7168,256,8,0,0,asm,11010+21101,3597.4721
gfx938,f8_w8a8_block,torch.float16,8192,128,7168,256,8,0,0,asm,11010+21101,3816.3838
gfx938,f8_w8a8_block,torch.float16,10240,128,7168,256,8,0,0,asm,11010+21101,4706.2116
gfx938,f8_w8a8_block,torch.float16,12288,128,7168,256,8,0,0,asm,11010+21101,5647.2745
gfx938,f8_w8a8_block,torch.float16,14336,128,7168,256,8,0,0,asm,11010+21101,6490.2357
gfx938,f8_w8a8_block,torch.float16,16384,128,7168,256,8,0,0,asm,11010+21101,7346.2153
gfx938,f8_w8a8_block,torch.float16,17408,128,7168,256,8,0,0,asm,11010+21101,7819.7326
gfx938,f8_w8a8_block,torch.float16,24576,128,7168,256,8,0,0,asm,11010+21101,11024.8311
gfx938,f8_w8a8_block,torch.float16,32768,128,7168,256,8,0,0,asm,11010+21101,14518.6201
gfx938,f8_w8a8_block,torch.float16,40960,128,7168,256,8,0,0,asm,13001+23101,14697.0981
gfx938,f8_w8a8_block,torch.float16,49152,128,7168,256,8,0,0,asm,11010+21101,20838.8615
gfx938,f8_w8a8_block,torch.float16,57344,128,7168,256,8,0,0,asm,11010+21101,24568.6648
gfx938,f8_w8a8_block,torch.float16,65536,128,7168,256,8,0,0,asm,13001+23000,28256.1414
gfx938,f8_w8a8_block,torch.float16,1,256,7168,256,8,0,0,asm,10007+20000,72.6803
gfx938,f8_w8a8_block,torch.float16,2,256,7168,256,8,0,0,asm,10002+20000,103.4148
gfx938,f8_w8a8_block,torch.float16,3,256,7168,256,8,0,0,asm,10005+20000,134.748
gfx938,f8_w8a8_block,torch.float16,4,256,7168,256,8,0,0,asm,10006+20000,166.8146
gfx938,f8_w8a8_block,torch.float16,5,256,7168,256,8,0,0,asm,10001+20000,199.2455
gfx938,f8_w8a8_block,torch.float16,6,256,7168,256,8,0,0,asm,10002+20000,209.641
gfx938,f8_w8a8_block,torch.float16,7,256,7168,256,8,0,0,asm,10002+20000,225.1832
gfx938,f8_w8a8_block,torch.float16,8,256,7168,256,8,0,0,asm,10006+20000,240.6587
gfx938,f8_w8a8_block,torch.float16,9,256,7168,256,8,0,0,asm,10005+20000,259.4617
gfx938,f8_w8a8_block,torch.float16,10,256,7168,256,8,0,0,asm,10006+20000,275.2421
gfx938,f8_w8a8_block,torch.float16,11,256,7168,256,8,0,0,asm,10002+20000,312.0341
gfx938,f8_w8a8_block,torch.float16,12,256,7168,256,8,0,0,asm,10002+20000,309.8362
gfx938,f8_w8a8_block,torch.float16,13,256,7168,256,8,0,0,asm,10002+20000,321.2168
gfx938,f8_w8a8_block,torch.float16,14,256,7168,256,8,0,0,asm,10006+20000,342.3694
gfx938,f8_w8a8_block,torch.float16,15,256,7168,256,8,0,0,asm,10006+20000,352.1916
gfx938,f8_w8a8_block,torch.float16,16,256,7168,256,8,0,0,asm,10006+20000,359.8449
gfx938,f8_w8a8_block,torch.float16,17,256,7168,256,8,0,0,asm,10006+20000,365.372
gfx938,f8_w8a8_block,torch.float16,18,256,7168,256,8,0,0,asm,10006+20000,378.5073
gfx938,f8_w8a8_block,torch.float16,20,256,7168,256,8,0,0,asm,10002+20000,408.3221
gfx938,f8_w8a8_block,torch.float16,24,256,7168,256,8,0,0,asm,10006+20000,459.4637
gfx938,f8_w8a8_block,torch.float16,28,256,7168,256,8,0,0,asm,10002+20000,521.102
gfx938,f8_w8a8_block,torch.float16,32,256,7168,256,8,0,0,asm,10006+20000,554.6966
gfx938,f8_w8a8_block,torch.float16,34,256,7168,256,8,0,0,asm,10006+20000,551.9878
gfx938,f8_w8a8_block,torch.float16,36,256,7168,256,8,0,0,asm,10002+20000,564.9833
gfx938,f8_w8a8_block,torch.float16,40,256,7168,256,8,0,0,asm,10002+20000,595.1432
gfx938,f8_w8a8_block,torch.float16,44,256,7168,256,8,0,0,asm,10002+20000,619.5608
gfx938,f8_w8a8_block,torch.float16,48,256,7168,256,8,0,0,asm,10002+20000,628.6184
gfx938,f8_w8a8_block,torch.float16,56,256,7168,256,8,0,0,asm,10002+20000,662.9176
gfx938,f8_w8a8_block,torch.float16,64,256,7168,256,8,0,0,asm,10002+20000,687.9598
gfx938,f8_w8a8_block,torch.float16,68,256,7168,256,8,0,0,asm,10002+20000,689.9695
gfx938,f8_w8a8_block,torch.float16,72,256,7168,256,8,0,0,asm,10002+20000,711.1765
gfx938,f8_w8a8_block,torch.float16,80,256,7168,256,8,0,0,asm,10002+20000,726.5693
gfx938,f8_w8a8_block,torch.float16,88,256,7168,256,8,0,0,asm,10002+20000,754.9446
gfx938,f8_w8a8_block,torch.float16,96,256,7168,256,8,0,0,asm,10002+20000,757.3035
gfx938,f8_w8a8_block,torch.float16,104,256,7168,256,8,0,0,asm,10002+20000,776.5309
gfx938,f8_w8a8_block,torch.float16,112,256,7168,256,8,0,0,asm,10002+20000,779.1336
gfx938,f8_w8a8_block,torch.float16,128,256,7168,256,8,0,0,asm,10002+20000,794.9824
gfx938,f8_w8a8_block,torch.float16,144,256,7168,256,8,0,0,asm,10002+20000,802.5377
gfx938,f8_w8a8_block,torch.float16,160,256,7168,256,8,0,0,asm,10002+20000,810.6245
gfx938,f8_w8a8_block,torch.float16,192,256,7168,256,8,0,0,asm,10001+20000,822.7867
gfx938,f8_w8a8_block,torch.float16,224,256,7168,256,8,0,0,asm,10002+20000,831.9725
gfx938,f8_w8a8_block,torch.float16,256,256,7168,256,8,0,0,asm,10002+20000,842.2666
gfx938,f8_w8a8_block,torch.float16,320,256,7168,256,8,0,0,asm,10002+20000,873.6665
gfx938,f8_w8a8_block,torch.float16,384,256,7168,256,8,0,0,asm,10006+20000,905.6093
gfx938,f8_w8a8_block,torch.float16,448,256,7168,256,8,0,0,asm,11006+21000,940.6409
gfx938,f8_w8a8_block,torch.float16,512,256,7168,256,8,0,0,asm,11006+21000,955.3874
gfx938,f8_w8a8_block,torch.float16,576,256,7168,256,8,0,0,asm,11006+21000,970.2529
gfx938,f8_w8a8_block,torch.float16,640,256,7168,256,8,0,0,asm,11006+21000,985.9352
gfx938,f8_w8a8_block,torch.float16,704,256,7168,256,8,0,0,asm,11006+21000,1008.4660
gfx938,f8_w8a8_block,torch.float16,768,256,7168,256,8,0,0,asm,11010+21000,1026.7544
gfx938,f8_w8a8_block,torch.float16,832,256,7168,256,8,0,0,asm,11010+21000,1039.0986
gfx938,f8_w8a8_block,torch.float16,896,256,7168,256,8,0,0,asm,11010+21000,1083.3307
gfx938,f8_w8a8_block,torch.float16,960,256,7168,256,8,0,0,asm,11010+21000,1143.5322
gfx938,f8_w8a8_block,torch.float16,1024,256,7168,256,8,0,0,asm,11010+21000,1199.3986
gfx938,f8_w8a8_block,torch.float16,1152,256,7168,256,8,0,0,asm,11010+21000,1338.1607
gfx938,f8_w8a8_block,torch.float16,1280,256,7168,256,8,0,0,asm,12003+22000,1385.7713
gfx938,f8_w8a8_block,torch.float16,1408,256,7168,256,8,0,0,asm,12003+22000,1423.7195
gfx938,f8_w8a8_block,torch.float16,1536,256,7168,256,8,0,0,asm,12003+22000,1453.7754
gfx938,f8_w8a8_block,torch.float16,1664,256,7168,256,8,0,0,asm,12003+22000,1476.8312
gfx938,f8_w8a8_block,torch.float16,1792,256,7168,256,8,0,0,asm,12003+22000,1577.4284
gfx938,f8_w8a8_block,torch.float16,1920,256,7168,256,8,0,0,asm,12003+22000,1625.2879
gfx938,f8_w8a8_block,torch.float16,2048,256,7168,256,8,0,0,asm,12003+22000,1835.2787
gfx938,f8_w8a8_block,torch.float16,2304,256,7168,256,8,0,0,asm,11010+21000,2116.7298
gfx938,f8_w8a8_block,torch.float16,2560,256,7168,256,8,0,0,asm,11010+21000,2245.6297
gfx938,f8_w8a8_block,torch.float16,2816,256,7168,256,8,0,0,asm,11010+21000,2377.2784
gfx938,f8_w8a8_block,torch.float16,3072,256,7168,256,8,0,0,asm,13001+23000,2465.8043
gfx938,f8_w8a8_block,torch.float16,3328,256,7168,256,8,0,0,asm,13001+23000,2540.153
gfx938,f8_w8a8_block,torch.float16,3584,256,7168,256,8,0,0,asm,13001+23000,2627.0902
gfx938,f8_w8a8_block,torch.float16,3840,256,7168,256,8,0,0,asm,12003+22000,2800.8796
gfx938,f8_w8a8_block,torch.float16,4096,256,7168,256,8,0,0,asm,12003+22000,3084.2312
gfx938,f8_w8a8_block,torch.float16,4608,256,7168,256,8,0,0,asm,12003+22000,3563.8115
gfx938,f8_w8a8_block,torch.float16,5120,256,7168,256,8,0,0,asm,12003+22000,3755.4826
gfx938,f8_w8a8_block,torch.float16,5632,256,7168,256,8,0,0,asm,12003+22000,3950.6285
gfx938,f8_w8a8_block,torch.float16,6144,256,7168,256,8,0,0,asm,12003+22000,4354.9376
gfx938,f8_w8a8_block,torch.float16,6656,256,7168,256,8,0,0,asm,13001+23000,4595.7098
gfx938,f8_w8a8_block,torch.float16,7168,256,7168,256,8,0,0,asm,13001+23000,4714.1942
gfx938,f8_w8a8_block,torch.float16,7680,256,7168,256,8,0,0,asm,13001+23000,5001.5109
gfx938,f8_w8a8_block,torch.float16,8192,256,7168,256,8,0,0,asm,13001+23000,5565.8363
gfx938,f8_w8a8_block,torch.float16,10240,256,7168,256,8,0,0,asm,13001+23000,6804.4078
gfx938,f8_w8a8_block,torch.float16,12288,256,7168,256,8,0,0,asm,13001+23000,7889.1483
gfx938,f8_w8a8_block,torch.float16,14336,256,7168,256,8,0,0,asm,13001+23000,9148.5336
gfx938,f8_w8a8_block,torch.float16,16384,256,7168,256,8,0,0,asm,13001+23000,10246.3196
gfx938,f8_w8a8_block,torch.float16,17408,256,7168,256,8,0,0,asm,13001+23000,11124.6754
gfx938,f8_w8a8_block,torch.float16,24576,256,7168,256,8,0,0,asm,13001+23000,14963.2569
gfx938,f8_w8a8_block,torch.float16,32768,256,7168,256,8,0,0,asm,13001+23000,19704.3071
gfx938,f8_w8a8_block,torch.float16,40960,256,7168,256,8,0,0,asm,13001+23000,23143.0651
gfx938,f8_w8a8_block,torch.float16,49152,256,7168,256,8,0,0,asm,13001+23000,27894.5593
gfx938,f8_w8a8_block,torch.float16,57344,256,7168,256,8,0,0,asm,13001+23000,32751.0668
gfx938,f8_w8a8_block,torch.float16,65536,256,7168,256,8,0,0,asm,13001+23000,37602.0424
gfx938,f8_w8a8_block,torch.float16,1,512,7168,256,8,0,0,asm,10001+20000,98.9608
gfx938,f8_w8a8_block,torch.float16,2,512,7168,256,8,0,0,asm,10005+20000,148.7373
gfx938,f8_w8a8_block,torch.float16,4,512,7168,256,8,0,0,asm,10002+20000,255.7451
gfx938,f8_w8a8_block,torch.float16,6,512,7168,256,8,0,0,asm,10006+20000,331.7556
gfx938,f8_w8a8_block,torch.float16,8,512,7168,256,8,0,0,asm,10001+20000,402.7571
gfx938,f8_w8a8_block,torch.float16,16,512,7168,256,8,0,0,asm,10002+20000,620.9451
gfx938,f8_w8a8_block,torch.float16,24,512,7168,256,8,0,0,asm,10002+20000,813.7066
gfx938,f8_w8a8_block,torch.float16,32,512,7168,256,8,0,0,asm,10001+20000,977.7223
gfx938,f8_w8a8_block,torch.float16,48,512,7168,256,8,0,0,asm,10002+20000,1144.5069
gfx938,f8_w8a8_block,torch.float16,56,512,7168,256,8,0,0,asm,10001+20000,1205.4824
gfx938,f8_w8a8_block,torch.float16,64,512,7168,256,8,0,0,asm,10002+20000,1248.6146
gfx938,f8_w8a8_block,torch.float16,68,512,7168,256,8,0,0,asm,10002+20000,1261.4766
gfx938,f8_w8a8_block,torch.float16,72,512,7168,256,8,0,0,asm,10001+20000,1295.1417
gfx938,f8_w8a8_block,torch.float16,80,512,7168,256,8,0,0,asm,10002+20000,1328.6098
gfx938,f8_w8a8_block,torch.float16,88,512,7168,256,8,0,0,asm,10002+20000,1374.6385
gfx938,f8_w8a8_block,torch.float16,90,512,7168,256,8,0,0,asm,11006+21000,1422.9087
gfx938,f8_w8a8_block,torch.float16,96,512,7168,256,8,0,0,asm,10002+20000,1393.8895
gfx938,f8_w8a8_block,torch.float16,100,512,7168,256,8,0,0,asm,10002+20000,1392.3682
gfx938,f8_w8a8_block,torch.float16,112,512,7168,256,8,0,0,asm,10002+20000,1428.6178
gfx938,f8_w8a8_block,torch.float16,128,512,7168,256,8,0,0,asm,10002+20000,1454.5895
gfx938,f8_w8a8_block,torch.float16,160,512,7168,256,8,0,0,asm,10002+20000,1480.1684
gfx938,f8_w8a8_block,torch.float16,224,512,7168,256,8,0,0,asm,10002+20000,1509.5907
gfx938,f8_w8a8_block,torch.float16,256,512,7168,256,8,0,0,asm,10002+20000,1523.7349
gfx938,f8_w8a8_block,torch.float16,384,512,7168,256,8,0,0,asm,11005+21000,1591.8786
gfx938,f8_w8a8_block,torch.float16,512,512,7168,256,8,0,0,asm,11006+21000,1629.0737
gfx938,f8_w8a8_block,torch.float16,640,512,7168,256,8,0,0,asm,11006+21000,1673.5754
gfx938,f8_w8a8_block,torch.float16,768,512,7168,256,8,0,0,asm,11010+21000,1724.7656
gfx938,f8_w8a8_block,torch.float16,1024,512,7168,256,8,0,0,asm,11010+21000,1932.1925
gfx938,f8_w8a8_block,torch.float16,1536,512,7168,256,8,0,0,asm,12003+22000,2149.6496
gfx938,f8_w8a8_block,torch.float16,2048,512,7168,256,8,0,0,asm,12003+22000,2760.8171
gfx938,f8_w8a8_block,torch.float16,3072,512,7168,256,8,0,0,asm,13001+23000,3618.1797
gfx938,f8_w8a8_block,torch.float16,4096,512,7168,256,8,0,0,asm,12003+22000,4654.0263
gfx938,f8_w8a8_block,torch.float16,6144,512,7168,256,8,0,0,asm,12003+22000,6558.0078
gfx938,f8_w8a8_block,torch.float16,7168,512,7168,256,8,0,0,asm,13001+23000,7055.2258
gfx938,f8_w8a8_block,torch.float16,7680,512,7168,256,8,0,0,asm,13001+23000,7456.4795
gfx938,f8_w8a8_block,torch.float16,8192,512,7168,256,8,0,0,asm,13001+23000,8370.6686
gfx938,f8_w8a8_block,torch.float16,12288,512,7168,256,8,0,0,asm,13001+23000,11901.9833
gfx938,f8_w8a8_block,torch.float16,16384,512,7168,256,8,0,0,asm,13001+23000,15240.726
gfx938,f8_w8a8_block,torch.float16,1,1024,7168,256,8,0,0,asm,10006+20000,151.2889
gfx938,f8_w8a8_block,torch.float16,2,1024,7168,256,8,0,0,asm,10006+20000,237.6805
gfx938,f8_w8a8_block,torch.float16,4,1024,7168,256,8,0,0,asm,10006+20000,429.1105
gfx938,f8_w8a8_block,torch.float16,6,1024,7168,256,8,0,0,asm,10001+20000,578.6652
gfx938,f8_w8a8_block,torch.float16,8,1024,7168,256,8,0,0,asm,10002+20000,704.0545
gfx938,f8_w8a8_block,torch.float16,16,1024,7168,256,8,0,0,asm,10001+20000,1138.7775
gfx938,f8_w8a8_block,torch.float16,24,1024,7168,256,8,0,0,asm,10001+20000,1531.4521
gfx938,f8_w8a8_block,torch.float16,32,1024,7168,256,8,0,0,asm,10002+20000,1861.577
gfx938,f8_w8a8_block,torch.float16,48,1024,7168,256,8,0,0,asm,10002+20000,2205.7991
gfx938,f8_w8a8_block,torch.float16,56,1024,7168,256,8,0,0,asm,10002+20000,2319.8525
gfx938,f8_w8a8_block,torch.float16,64,1024,7168,256,8,0,0,asm,10001+20000,2411.5447
gfx938,f8_w8a8_block,torch.float16,68,1024,7168,256,8,0,0,asm,10002+20000,2432.3937
gfx938,f8_w8a8_block,torch.float16,72,1024,7168,256,8,0,0,asm,10002+20000,2542.6718
gfx938,f8_w8a8_block,torch.float16,80,1024,7168,256,8,0,0,asm,11005+21000,2595.5271
gfx938,f8_w8a8_block,torch.float16,88,1024,7168,256,8,0,0,asm,10001+20000,2651.8934
gfx938,f8_w8a8_block,torch.float16,90,1024,7168,256,8,0,0,asm,10002+20000,2716.6178
gfx938,f8_w8a8_block,torch.float16,96,1024,7168,256,8,0,0,asm,10002+20000,2688.2667
gfx938,f8_w8a8_block,torch.float16,100,1024,7168,256,8,0,0,asm,10002+20000,2684.4469
gfx938,f8_w8a8_block,torch.float16,112,1024,7168,256,8,0,0,asm,10002+20000,2754.0411
gfx938,f8_w8a8_block,torch.float16,128,1024,7168,256,8,0,0,asm,10002+20000,2795.1093
gfx938,f8_w8a8_block,torch.float16,160,1024,7168,256,8,0,0,asm,10001+20000,2857.7264
gfx938,f8_w8a8_block,torch.float16,224,1024,7168,256,8,0,0,asm,10001+20000,2896.1117
gfx938,f8_w8a8_block,torch.float16,256,1024,7168,256,8,0,0,asm,10002+20000,2914.3146
gfx938,f8_w8a8_block,torch.float16,384,1024,7168,256,8,0,0,asm,11005+21000,2997.6185
gfx938,f8_w8a8_block,torch.float16,512,1024,7168,256,8,0,0,asm,11010+21000,3053.1762
gfx938,f8_w8a8_block,torch.float16,640,1024,7168,256,8,0,0,asm,11010+21000,3092.1409
gfx938,f8_w8a8_block,torch.float16,768,1024,7168,256,8,0,0,asm,11010+21000,3186.2115
gfx938,f8_w8a8_block,torch.float16,1024,1024,7168,256,8,0,0,asm,12003+22000,3407.8668
gfx938,f8_w8a8_block,torch.float16,1536,1024,7168,256,8,0,0,asm,12003+22000,3576.4024
gfx938,f8_w8a8_block,torch.float16,2048,1024,7168,256,8,0,0,asm,12003+22000,4605.3776
gfx938,f8_w8a8_block,torch.float16,3072,1024,7168,256,8,0,0,asm,13001+23000,5888.471
gfx938,f8_w8a8_block,torch.float16,4096,1024,7168,256,8,0,0,asm,12003+22000,7722.4229
gfx938,f8_w8a8_block,torch.float16,6144,1024,7168,256,8,0,0,asm,12003+22000,10916.0147
gfx938,f8_w8a8_block,torch.float16,7168,1024,7168,256,8,0,0,asm,13001+23000,11507.4329
gfx938,f8_w8a8_block,torch.float16,7680,1024,7168,256,8,0,0,asm,13001+23000,12128.7707
gfx938,f8_w8a8_block,torch.float16,8192,1024,7168,256,8,0,0,asm,13001+23000,13783.3974
gfx938,f8_w8a8_block,torch.float16,12288,1024,7168,256,8,0,0,asm,13001+23000,19406.7175
gfx938,f8_w8a8_block,torch.float16,16384,1024,7168,256,8,0,0,asm,13001+23000,25044.1644
gfx938,f8_w8a8_block,torch.float16,1,2048,7168,256,8,0,0,asm,10002+20000,251.9628
gfx938,f8_w8a8_block,torch.float16,2,2048,7168,256,8,0,0,asm,10006+20000,427.6089
gfx938,f8_w8a8_block,torch.float16,4,2048,7168,256,8,0,0,asm,10001+20000,771.2179
gfx938,f8_w8a8_block,torch.float16,6,2048,7168,256,8,0,0,asm,10001+20000,1070.6738
gfx938,f8_w8a8_block,torch.float16,8,2048,7168,256,8,0,0,asm,10001+20000,1326.8262
gfx938,f8_w8a8_block,torch.float16,16,2048,7168,256,8,0,0,asm,10001+20000,2202.1582
gfx938,f8_w8a8_block,torch.float16,24,2048,7168,256,8,0,0,asm,10001+20000,3013.2885
gfx938,f8_w8a8_block,torch.float16,32,2048,7168,256,8,0,0,asm,10001+20000,3641.0618
gfx938,f8_w8a8_block,torch.float16,48,2048,7168,256,8,0,0,asm,10001+20000,4355.4914
gfx938,f8_w8a8_block,torch.float16,56,2048,7168,256,8,0,0,asm,10001+20000,4593.266
gfx938,f8_w8a8_block,torch.float16,64,2048,7168,256,8,0,0,asm,10001+20000,4767.8612
gfx938,f8_w8a8_block,torch.float16,68,2048,7168,256,8,0,0,asm,10001+20000,4860.9942
gfx938,f8_w8a8_block,torch.float16,72,2048,7168,256,8,0,0,asm,10001+20000,4949.9584
gfx938,f8_w8a8_block,torch.float16,80,2048,7168,256,8,0,0,asm,10001+20000,5088.8829
gfx938,f8_w8a8_block,torch.float16,88,2048,7168,256,8,0,0,asm,11006+21000,5266.996
gfx938,f8_w8a8_block,torch.float16,90,2048,7168,256,8,0,0,asm,10001+20000,5320.5549
gfx938,f8_w8a8_block,torch.float16,96,2048,7168,256,8,0,0,asm,10001+20000,5308.1328
gfx938,f8_w8a8_block,torch.float16,100,2048,7168,256,8,0,0,asm,10001+20000,5316.2476
gfx938,f8_w8a8_block,torch.float16,112,2048,7168,256,8,0,0,asm,10001+20000,5450.785
gfx938,f8_w8a8_block,torch.float16,128,2048,7168,256,8,0,0,asm,10001+20000,5529.5102
gfx938,f8_w8a8_block,torch.float16,160,2048,7168,256,8,0,0,asm,10001+20000,5638.9213
gfx938,f8_w8a8_block,torch.float16,224,2048,7168,256,8,0,0,asm,10001+20000,5691.9585
gfx938,f8_w8a8_block,torch.float16,256,2048,7168,256,8,0,0,asm,10001+20000,5716.8708
gfx938,f8_w8a8_block,torch.float16,384,2048,7168,256,8,0,0,asm,11010+21000,5836.1793
gfx938,f8_w8a8_block,torch.float16,512,2048,7168,256,8,0,0,asm,11010+21000,5915.5616
gfx938,f8_w8a8_block,torch.float16,640,2048,7168,256,8,0,0,asm,11010+21000,5985.1953
gfx938,f8_w8a8_block,torch.float16,768,2048,7168,256,8,0,0,asm,12003+22000,6111.1721
gfx938,f8_w8a8_block,torch.float16,1024,2048,7168,256,8,0,0,asm,12003+22000,6233.1449
gfx938,f8_w8a8_block,torch.float16,1536,2048,7168,256,8,0,0,asm,12003+22000,6516.6345
gfx938,f8_w8a8_block,torch.float16,2048,2048,7168,256,8,0,0,asm,12003+22000,8578.0631
gfx938,f8_w8a8_block,torch.float16,3072,2048,7168,256,8,0,0,asm,13001+23000,10717.5206
gfx938,f8_w8a8_block,torch.float16,4096,2048,7168,256,8,0,0,asm,12003+22000,14547.0352
gfx938,f8_w8a8_block,torch.float16,6144,2048,7168,256,8,0,0,asm,12003+22000,19927.8669
gfx938,f8_w8a8_block,torch.float16,7168,2048,7168,256,8,0,0,asm,13001+23000,21524.7389
gfx938,f8_w8a8_block,torch.float16,7680,2048,7168,256,8,0,0,asm,13001+23000,22661.5994
gfx938,f8_w8a8_block,torch.float16,8192,2048,7168,256,8,0,0,asm,13001+23000,25611.2774
gfx938,f8_w8a8_block,torch.float16,12288,2048,7168,256,8,0,0,asm,13001+23000,36065.8213
gfx938,f8_w8a8_block,torch.float16,16384,2048,7168,256,8,0,0,asm,13001+23000,46297.6444
gfx938,f8_w8a8_block,torch.float16,1,2048,7168,288,8,0,0,asm,10006+20000,252.0489
gfx938,f8_w8a8_block,torch.float16,2,2048,7168,288,8,0,0,asm,10006+20000,430.5957
gfx938,f8_w8a8_block,torch.float16,4,2048,7168,288,8,0,0,asm,10002+20000,756.1026
gfx938,f8_w8a8_block,torch.float16,6,2048,7168,288,8,0,0,asm,10001+20000,1069.1647
gfx938,f8_w8a8_block,torch.float16,8,2048,7168,288,8,0,0,asm,10001+20000,1306.9971
gfx938,f8_w8a8_block,torch.float16,16,2048,7168,288,8,0,0,asm,10001+20000,2284.3784
gfx938,f8_w8a8_block,torch.float16,24,2048,7168,288,8,0,0,asm,10001+20000,3099.9363
gfx938,f8_w8a8_block,torch.float16,32,2048,7168,288,8,0,0,asm,10001+20000,3767.9718
gfx938,f8_w8a8_block,torch.float16,48,2048,7168,288,8,0,0,asm,10001+20000,4620.3121
gfx938,f8_w8a8_block,torch.float16,56,2048,7168,288,8,0,0,asm,10001+20000,4939.5057
gfx938,f8_w8a8_block,torch.float16,64,2048,7168,288,8,0,0,asm,10001+20000,5129.1815
gfx938,f8_w8a8_block,torch.float16,68,2048,7168,288,8,0,0,asm,10002+20000,5164.4877
gfx938,f8_w8a8_block,torch.float16,72,2048,7168,288,8,0,0,asm,10001+20000,5308.4833
gfx938,f8_w8a8_block,torch.float16,80,2048,7168,288,8,0,0,asm,10001+20000,5387.8599
gfx938,f8_w8a8_block,torch.float16,88,2048,7168,288,8,0,0,asm,10001+20000,5502.0268
gfx938,f8_w8a8_block,torch.float16,90,2048,7168,288,8,0,0,asm,10001+20000,5595.4265
gfx938,f8_w8a8_block,torch.float16,96,2048,7168,288,8,0,0,asm,10001+20000,5631.7624
gfx938,f8_w8a8_block,torch.float16,100,2048,7168,288,8,0,0,asm,10001+20000,5679.1349
gfx938,f8_w8a8_block,torch.float16,112,2048,7168,288,8,0,0,asm,10001+20000,5931.2481
gfx938,f8_w8a8_block,torch.float16,128,2048,7168,288,8,0,0,asm,10001+20000,6013.378
gfx938,f8_w8a8_block,torch.float16,160,2048,7168,288,8,0,0,asm,10001+20000,6180.9942
gfx938,f8_w8a8_block,torch.float16,224,2048,7168,288,8,0,0,asm,10001+20000,6371.7133
gfx938,f8_w8a8_block,torch.float16,256,2048,7168,288,8,0,0,asm,10001+20000,6398.0948
gfx938,f8_w8a8_block,torch.float16,384,2048,7168,288,8,0,0,asm,11010+21000,6508.5766
gfx938,f8_w8a8_block,torch.float16,512,2048,7168,288,8,0,0,asm,11010+21000,6613.3309
gfx938,f8_w8a8_block,torch.float16,640,2048,7168,288,8,0,0,asm,11010+21000,6681.1973
gfx938,f8_w8a8_block,torch.float16,768,2048,7168,288,8,0,0,asm,12003+22000,6787.456
gfx938,f8_w8a8_block,torch.float16,1024,2048,7168,288,8,0,0,asm,12003+22000,6932.4909
gfx938,f8_w8a8_block,torch.float16,1536,2048,7168,288,8,0,0,asm,12002+22000,7172.1113
gfx938,f8_w8a8_block,torch.float16,2048,2048,7168,288,8,0,0,asm,12003+22000,8085.1632
gfx938,f8_w8a8_block,torch.float16,3072,2048,7168,288,8,0,0,asm,13001+23000,11887.6732
gfx938,f8_w8a8_block,torch.float16,4096,2048,7168,288,8,0,0,asm,13001+23000,13355.7484
gfx938,f8_w8a8_block,torch.float16,6144,2048,7168,288,8,0,0,asm,12003+22000,19758.7502
gfx938,f8_w8a8_block,torch.float16,7168,2048,7168,288,8,0,0,asm,12003+22000,23482.3928
gfx938,f8_w8a8_block,torch.float16,7680,2048,7168,288,8,0,0,asm,13001+23000,23931.7054
gfx938,f8_w8a8_block,torch.float16,8192,2048,7168,288,8,0,0,asm,13001+23000,24374.1711
gfx938,f8_w8a8_block,torch.float16,12288,2048,7168,288,8,0,0,asm,13001+23000,34948.4318
gfx938,f8_w8a8_block,torch.float16,16384,2048,7168,288,8,0,0,asm,13001+23000,46757.3991
gfx938,f8_w8a8_block,torch.float16,1,2048,7168,36,8,0,0,asm,10006+20000,242.5053
gfx938,f8_w8a8_block,torch.float16,2,2048,7168,36,8,0,0,asm,10002+20000,379.8434
gfx938,f8_w8a8_block,torch.float16,4,2048,7168,36,8,0,0,asm,10002+20000,568.874
gfx938,f8_w8a8_block,torch.float16,6,2048,7168,36,8,0,0,asm,10002+20000,717.4164
gfx938,f8_w8a8_block,torch.float16,8,2048,7168,36,8,0,0,asm,10002+20000,759.7488
gfx938,f8_w8a8_block,torch.float16,16,2048,7168,36,8,0,0,asm,10002+20000,831.6938
gfx938,f8_w8a8_block,torch.float16,24,2048,7168,36,8,0,0,asm,10001+20000,865.2568
gfx938,f8_w8a8_block,torch.float16,32,2048,7168,36,8,0,0,asm,10002+20000,866.5272
gfx938,f8_w8a8_block,torch.float16,48,2048,7168,36,8,0,0,asm,11010+21000,892.3441
gfx938,f8_w8a8_block,torch.float16,56,2048,7168,36,8,0,0,asm,11010+21000,899.0294
gfx938,f8_w8a8_block,torch.float16,64,2048,7168,36,8,0,0,asm,11010+21000,909.4108
gfx938,f8_w8a8_block,torch.float16,68,2048,7168,36,8,0,0,asm,11010+21000,907.7949
gfx938,f8_w8a8_block,torch.float16,72,2048,7168,36,8,0,0,asm,11009+21000,984.5952
gfx938,f8_w8a8_block,torch.float16,80,2048,7168,36,8,0,0,asm,11010+21000,906.8205
gfx938,f8_w8a8_block,torch.float16,88,2048,7168,36,8,0,0,asm,11010+21000,913.0271
gfx938,f8_w8a8_block,torch.float16,90,2048,7168,36,8,0,0,asm,11010+21000,910.8481
gfx938,f8_w8a8_block,torch.float16,96,2048,7168,36,8,0,0,asm,11010+21000,914.0648
gfx938,f8_w8a8_block,torch.float16,100,2048,7168,36,8,0,0,asm,11010+21000,916.0669
gfx938,f8_w8a8_block,torch.float16,112,2048,7168,36,8,0,0,asm,11010+21000,944.7542
gfx938,f8_w8a8_block,torch.float16,128,2048,7168,36,8,0,0,asm,12003+22000,981.2716
gfx938,f8_w8a8_block,torch.float16,160,2048,7168,36,8,0,0,asm,12003+22000,976.5842
gfx938,f8_w8a8_block,torch.float16,224,2048,7168,36,8,0,0,asm,12003+22000,1046.3545
gfx938,f8_w8a8_block,torch.float16,256,2048,7168,36,8,0,0,asm,12003+22000,1117.3637
gfx938,f8_w8a8_block,torch.float16,384,2048,7168,36,8,0,0,asm,13001+23000,1584.1359
gfx938,f8_w8a8_block,torch.float16,512,2048,7168,36,8,0,0,asm,12003+22000,1730.4226
gfx938,f8_w8a8_block,torch.float16,640,2048,7168,36,8,0,0,asm,12003+22000,2364.2128
gfx938,f8_w8a8_block,torch.float16,768,2048,7168,36,8,0,0,asm,12003+22000,2495.0365
gfx938,f8_w8a8_block,torch.float16,1024,2048,7168,36,8,0,0,asm,13001+23000,2967.159
gfx938,f8_w8a8_block,torch.float16,1536,2048,7168,36,8,0,0,asm,13001+23000,4397.4882
gfx938,f8_w8a8_block,torch.float16,2048,2048,7168,36,8,0,0,asm,13001+23000,5729.3881
gfx938,f8_w8a8_block,torch.float16,3072,2048,7168,36,8,0,0,asm,13001+23000,8545.7815
gfx938,f8_w8a8_block,torch.float16,4096,2048,7168,36,8,0,0,asm,13001+23000,11050.4888
gfx938,f8_w8a8_block,torch.float16,6144,2048,7168,36,8,0,0,asm,13001+23000,15905.5158
gfx938,f8_w8a8_block,torch.float16,7168,2048,7168,36,8,0,0,asm,13001+23000,18483.3557
gfx938,f8_w8a8_block,torch.float16,7680,2048,7168,36,8,0,0,asm,13001+23000,19818.6245
gfx938,f8_w8a8_block,torch.float16,8192,2048,7168,36,8,0,0,asm,13001+23000,21101.9132
gfx938,f8_w8a8_block,torch.float16,12288,2048,7168,36,8,0,0,asm,13001+23000,31240.5371
gfx938,f8_w8a8_block,torch.float16,16384,2048,7168,36,8,0,0,asm,13001+23000,41174.3595
gfx938,f8_w8a8_block,torch.float16,1,2048,7168,18,8,0,0,asm,10006+20000,253.2057
gfx938,f8_w8a8_block,torch.float16,2,2048,7168,18,8,0,0,asm,10006+20000,340.1796
gfx938,f8_w8a8_block,torch.float16,4,2048,7168,18,8,0,0,asm,10001+20000,450.665
gfx938,f8_w8a8_block,torch.float16,6,2048,7168,18,8,0,0,asm,10002+20000,451.4404
gfx938,f8_w8a8_block,torch.float16,8,2048,7168,18,8,0,0,asm,10002+20000,471.0792
gfx938,f8_w8a8_block,torch.float16,16,2048,7168,18,8,0,0,asm,10001+20000,478.6772
gfx938,f8_w8a8_block,torch.float16,24,2048,7168,18,8,0,0,asm,11010+21000,501.0289
gfx938,f8_w8a8_block,torch.float16,32,2048,7168,18,8,0,0,asm,11010+21000,498.9725
gfx938,f8_w8a8_block,torch.float16,48,2048,7168,18,8,0,0,asm,11007+21000,517.3899
gfx938,f8_w8a8_block,torch.float16,56,2048,7168,18,8,0,0,asm,11010+21000,520.8237
gfx938,f8_w8a8_block,torch.float16,64,2048,7168,18,8,0,0,asm,12003+22000,542.7262
gfx938,f8_w8a8_block,torch.float16,68,2048,7168,18,8,0,0,asm,12003+22000,596.5075
gfx938,f8_w8a8_block,torch.float16,72,2048,7168,18,8,0,0,asm,12001+22000,612.4255
gfx938,f8_w8a8_block,torch.float16,80,2048,7168,18,8,0,0,asm,12003+22000,551.5192
gfx938,f8_w8a8_block,torch.float16,88,2048,7168,18,8,0,0,asm,12003+22000,552.1879
gfx938,f8_w8a8_block,torch.float16,90,2048,7168,18,8,0,0,asm,12003+22000,560.6104
gfx938,f8_w8a8_block,torch.float16,96,2048,7168,18,8,0,0,asm,12003+22000,556.0361
gfx938,f8_w8a8_block,torch.float16,100,2048,7168,18,8,0,0,asm,12003+22000,572.2411
gfx938,f8_w8a8_block,torch.float16,112,2048,7168,18,8,0,0,asm,12003+22000,563.2689
gfx938,f8_w8a8_block,torch.float16,128,2048,7168,18,8,0,0,asm,12003+22000,624.3464
gfx938,f8_w8a8_block,torch.float16,160,2048,7168,18,8,0,0,asm,12003+22000,824.3752
gfx938,f8_w8a8_block,torch.float16,224,2048,7168,18,8,0,0,asm,12003+22000,860.9125
gfx938,f8_w8a8_block,torch.float16,256,2048,7168,18,8,0,0,asm,12003+22000,893.8342
gfx938,f8_w8a8_block,torch.float16,384,2048,7168,18,8,0,0,asm,12003+22000,1281.9552
gfx938,f8_w8a8_block,torch.float16,512,2048,7168,18,8,0,0,asm,13001+23000,1540.5314
gfx938,f8_w8a8_block,torch.float16,640,2048,7168,18,8,0,0,asm,12003+22000,2034.2148
gfx938,f8_w8a8_block,torch.float16,768,2048,7168,18,8,0,0,asm,13001+23000,2212.7575
gfx938,f8_w8a8_block,torch.float16,1024,2048,7168,18,8,0,0,asm,13001+23000,2898.641
gfx938,f8_w8a8_block,torch.float16,1536,2048,7168,18,8,0,0,asm,13001+23000,4266.8676
gfx938,f8_w8a8_block,torch.float16,2048,2048,7168,18,8,0,0,asm,13001+23000,5588.6124
gfx938,f8_w8a8_block,torch.float16,3072,2048,7168,18,8,0,0,asm,13001+23000,7867.0413
gfx938,f8_w8a8_block,torch.float16,4096,2048,7168,18,8,0,0,asm,13001+23000,10511.3056
gfx938,f8_w8a8_block,torch.float16,6144,2048,7168,18,8,0,0,asm,13001+23000,15436.545
gfx938,f8_w8a8_block,torch.float16,7168,2048,7168,18,8,0,0,asm,13001+23000,17827.8971
gfx938,f8_w8a8_block,torch.float16,7680,2048,7168,18,8,0,0,asm,13001+23000,18981.7078
gfx938,f8_w8a8_block,torch.float16,8192,2048,7168,18,8,0,0,asm,13001+23000,20322.7869
gfx938,f8_w8a8_block,torch.float16,12288,2048,7168,18,8,0,0,asm,13001+23000,30253.3927
gfx938,f8_w8a8_block,torch.float16,16384,2048,7168,18,8,0,0,asm,13001+23000,40252.3459
gfx938,f8_w8a8_block,torch.float16,1,2048,7168,12,8,0,0,asm,10002+20000,265.6776
gfx938,f8_w8a8_block,torch.float16,2,2048,7168,12,8,0,0,asm,10001+20000,356.1058
gfx938,f8_w8a8_block,torch.float16,4,2048,7168,12,8,0,0,asm,10002+20000,353.7674
gfx938,f8_w8a8_block,torch.float16,6,2048,7168,12,8,0,0,asm,10006+20000,356.3274
gfx938,f8_w8a8_block,torch.float16,8,2048,7168,12,8,0,0,asm,10001+20000,359.7653
gfx938,f8_w8a8_block,torch.float16,16,2048,7168,12,8,0,0,asm,10001+20000,359.5027
gfx938,f8_w8a8_block,torch.float16,24,2048,7168,12,8,0,0,asm,11009+21000,384.1683
gfx938,f8_w8a8_block,torch.float16,32,2048,7168,12,8,0,0,asm,11010+21000,378.8381
gfx938,f8_w8a8_block,torch.float16,48,2048,7168,12,8,0,0,asm,12003+22000,429.3415
gfx938,f8_w8a8_block,torch.float16,56,2048,7168,12,8,0,0,asm,12003+22000,437.1896
gfx938,f8_w8a8_block,torch.float16,64,2048,7168,12,8,0,0,asm,12003+22000,441.2582
gfx938,f8_w8a8_block,torch.float16,68,2048,7168,12,8,0,0,asm,12003+22000,486.6129
gfx938,f8_w8a8_block,torch.float16,72,2048,7168,12,8,0,0,asm,12000+22000,498.7031
gfx938,f8_w8a8_block,torch.float16,80,2048,7168,12,8,0,0,asm,12003+22000,449.5136
gfx938,f8_w8a8_block,torch.float16,88,2048,7168,12,8,0,0,asm,12003+22000,450.486
gfx938,f8_w8a8_block,torch.float16,90,2048,7168,12,8,0,0,asm,12003+22000,480.373
gfx938,f8_w8a8_block,torch.float16,96,2048,7168,12,8,0,0,asm,12003+22000,486.3176
gfx938,f8_w8a8_block,torch.float16,100,2048,7168,12,8,0,0,asm,12003+22000,583.1007
gfx938,f8_w8a8_block,torch.float16,112,2048,7168,12,8,0,0,asm,12003+22000,625.4102
gfx938,f8_w8a8_block,torch.float16,128,2048,7168,12,8,0,0,asm,12003+22000,643.3043
gfx938,f8_w8a8_block,torch.float16,160,2048,7168,12,8,0,0,asm,12003+22000,649.7136
gfx938,f8_w8a8_block,torch.float16,224,2048,7168,12,8,0,0,asm,12003+22000,861.5113
gfx938,f8_w8a8_block,torch.float16,256,2048,7168,12,8,0,0,asm,12003+22000,879.8491
gfx938,f8_w8a8_block,torch.float16,384,2048,7168,12,8,0,0,asm,12003+22000,1276.9704
gfx938,f8_w8a8_block,torch.float16,512,2048,7168,12,8,0,0,asm,13001+23000,1580.5419
gfx938,f8_w8a8_block,torch.float16,640,2048,7168,12,8,0,0,asm,12003+22000,1933.2875
gfx938,f8_w8a8_block,torch.float16,768,2048,7168,12,8,0,0,asm,13001+23000,2321.9867
gfx938,f8_w8a8_block,torch.float16,1024,2048,7168,12,8,0,0,asm,13001+23000,2891.5873
gfx938,f8_w8a8_block,torch.float16,1536,2048,7168,12,8,0,0,asm,13001+23000,4088.2241
gfx938,f8_w8a8_block,torch.float16,2048,2048,7168,12,8,0,0,asm,13001+23000,5294.1901
gfx938,f8_w8a8_block,torch.float16,3072,2048,7168,12,8,0,0,asm,13001+23000,7754.2657
gfx938,f8_w8a8_block,torch.float16,4096,2048,7168,12,8,0,0,asm,13001+23000,10316.9177
gfx938,f8_w8a8_block,torch.float16,6144,2048,7168,12,8,0,0,asm,13001+23000,15092.8758
gfx938,f8_w8a8_block,torch.float16,7168,2048,7168,12,8,0,0,asm,13001+23000,17581.5223
gfx938,f8_w8a8_block,torch.float16,7680,2048,7168,12,8,0,0,asm,13001+23000,18825.2402
gfx938,f8_w8a8_block,torch.float16,8192,2048,7168,12,8,0,0,asm,13001+23000,20077.4043
gfx938,f8_w8a8_block,torch.float16,12288,2048,7168,12,8,0,0,asm,13001+23000,29951.1569
gfx938,f8_w8a8_block,torch.float16,16384,2048,7168,12,8,0,0,asm,13001+23000,39756.4384
gfx938,f8_w8a8_block,torch.float16,1,2048,7168,32,8,0,0,asm,10002+20000,260.7162
gfx938,f8_w8a8_block,torch.float16,2,2048,7168,32,8,0,0,asm,10002+20000,409.1621
gfx938,f8_w8a8_block,torch.float16,4,2048,7168,32,8,0,0,asm,10006+20000,556.5805
gfx938,f8_w8a8_block,torch.float16,6,2048,7168,32,8,0,0,asm,10002+20000,717.0262
gfx938,f8_w8a8_block,torch.float16,8,2048,7168,32,8,0,0,asm,10002+20000,718.2809
gfx938,f8_w8a8_block,torch.float16,16,2048,7168,32,8,0,0,asm,10002+20000,788.2175
gfx938,f8_w8a8_block,torch.float16,24,2048,7168,32,8,0,0,asm,10002+20000,836.5512
gfx938,f8_w8a8_block,torch.float16,32,2048,7168,32,8,0,0,asm,10002+20000,829.7501
gfx938,f8_w8a8_block,torch.float16,36,2048,7168,32,8,0,0,asm,10002+20000,844.2227
gfx938,f8_w8a8_block,torch.float16,48,2048,7168,32,8,0,0,asm,10006+20000,875.3385
gfx938,f8_w8a8_block,torch.float16,56,2048,7168,32,8,0,0,asm,11007+21000,890.21
gfx938,f8_w8a8_block,torch.float16,64,2048,7168,32,8,0,0,asm,11007+21000,891.0467
gfx938,f8_w8a8_block,torch.float16,72,2048,7168,32,8,0,0,asm,11010+21000,906.4289
gfx938,f8_w8a8_block,torch.float16,80,2048,7168,32,8,0,0,asm,11007+21000,891.9616
gfx938,f8_w8a8_block,torch.float16,88,2048,7168,32,8,0,0,asm,11010+21000,897.7047
gfx938,f8_w8a8_block,torch.float16,90,2048,7168,32,8,0,0,asm,11010+21000,895.4226
gfx938,f8_w8a8_block,torch.float16,96,2048,7168,32,8,0,0,asm,11010+21000,900.5763
gfx938,f8_w8a8_block,torch.float16,100,2048,7168,32,8,0,0,asm,11010+21000,905.6794
gfx938,f8_w8a8_block,torch.float16,112,2048,7168,32,8,0,0,asm,11010+21000,912.9299
gfx938,f8_w8a8_block,torch.float16,128,2048,7168,32,8,0,0,asm,12002+22000,971.4591
gfx938,f8_w8a8_block,torch.float16,160,2048,7168,32,8,0,0,asm,12003+22000,968.2561
gfx938,f8_w8a8_block,torch.float16,224,2048,7168,32,8,0,0,asm,12003+22000,1065.4767
gfx938,f8_w8a8_block,torch.float16,256,2048,7168,32,8,0,0,asm,12003+22000,1180.9711
gfx938,f8_w8a8_block,torch.float16,384,2048,7168,32,8,0,0,asm,13001+22000,1378.7978
gfx938,f8_w8a8_block,torch.float16,512,2048,7168,32,8,0,0,asm,12005+22000,1771.5964
gfx938,f8_w8a8_block,torch.float16,768,2048,7168,32,8,0,0,asm,12005+22000,2489.4297
gfx938,f8_w8a8_block,torch.float16,1024,2048,7168,32,8,0,0,asm,13001+23000,2843.6769
gfx938,f8_w8a8_block,torch.float16,1536,2048,7168,32,8,0,0,asm,13001+23000,4129.2134
gfx938,f8_w8a8_block,torch.float16,2048,2048,7168,32,8,0,0,asm,13001+23000,5286.1524
gfx938,f8_w8a8_block,torch.float16,3072,2048,7168,32,8,0,0,asm,13001+23000,7599.4159
gfx938,f8_w8a8_block,torch.float16,3584,2048,7168,32,8,0,0,asm,13001+23000,8879.8913
gfx938,f8_w8a8_block,torch.float16,3840,2048,7168,32,8,0,0,asm,13001+23000,9373.7589
gfx938,f8_w8a8_block,torch.float16,4096,2048,7168,32,8,0,0,asm,13001+23000,9922.2875
gfx938,f8_w8a8_block,torch.float16,5120,2048,7168,32,8,0,0,asm,13001+23000,12321.6558
gfx938,f8_w8a8_block,torch.float16,6144,2048,7168,32,8,0,0,asm,13001+23000,14637.0245
gfx938,f8_w8a8_block,torch.float16,7168,2048,7168,32,8,0,0,asm,13001+23000,17064.6537
gfx938,f8_w8a8_block,torch.float16,8192,2048,7168,32,8,0,0,asm,13001+23000,19372.8049
gfx938,f8_w8a8_block,torch.float16,12288,2048,7168,32,8,0,0,asm,13001+23000,28622.759
gfx938,f8_w8a8_block,torch.float16,16384,2048,7168,32,8,0,0,asm,13001+23000,37843.5938
gfx938,f8_w8a8_block,torch.float16,24576,2048,7168,32,8,0,0,asm,13001+23000,56428.1749
gfx938,f8_w8a8_block,torch.float16,32768,2048,7168,32,8,0,0,asm,13001+23000,75020.0322
gfx938,f8_w8a8_block,torch.float16,1,2048,7168,16,8,0,0,asm,10002+20000,283.4024
gfx938,f8_w8a8_block,torch.float16,2,2048,7168,16,8,0,0,asm,10002+20000,386.6779
gfx938,f8_w8a8_block,torch.float16,4,2048,7168,16,8,0,0,asm,10002+20000,431.1746
gfx938,f8_w8a8_block,torch.float16,6,2048,7168,16,8,0,0,asm,10002+20000,450.8883
gfx938,f8_w8a8_block,torch.float16,8,2048,7168,16,8,0,0,asm,10002+20000,468.6651
gfx938,f8_w8a8_block,torch.float16,16,2048,7168,16,8,0,0,asm,10006+20000,468.2018
gfx938,f8_w8a8_block,torch.float16,24,2048,7168,16,8,0,0,asm,10002+20000,511.6092
gfx938,f8_w8a8_block,torch.float16,32,2048,7168,16,8,0,0,asm,11010+21000,490.2902
gfx938,f8_w8a8_block,torch.float16,36,2048,7168,16,8,0,0,asm,11010+21000,500.5356
gfx938,f8_w8a8_block,torch.float16,48,2048,7168,16,8,0,0,asm,11010+21000,516.4766
gfx938,f8_w8a8_block,torch.float16,56,2048,7168,16,8,0,0,asm,11010+21000,518.5145
gfx938,f8_w8a8_block,torch.float16,64,2048,7168,16,8,0,0,asm,12003+22001,568.0836
gfx938,f8_w8a8_block,torch.float16,72,2048,7168,16,8,0,0,asm,12003+22002,599.7184
gfx938,f8_w8a8_block,torch.float16,80,2048,7168,16,8,0,0,asm,12003+22000,545.9923
gfx938,f8_w8a8_block,torch.float16,88,2048,7168,16,8,0,0,asm,12003+22000,577.1248
gfx938,f8_w8a8_block,torch.float16,90,2048,7168,16,8,0,0,asm,12003+22000,548.5186
gfx938,f8_w8a8_block,torch.float16,96,2048,7168,16,8,0,0,asm,12003+22000,582.6574
gfx938,f8_w8a8_block,torch.float16,100,2048,7168,16,8,0,0,asm,12003+22000,554.8091
gfx938,f8_w8a8_block,torch.float16,112,2048,7168,16,8,0,0,asm,12003+22000,588.729
gfx938,f8_w8a8_block,torch.float16,128,2048,7168,16,8,0,0,asm,12003+22000,618.3487
gfx938,f8_w8a8_block,torch.float16,160,2048,7168,16,8,0,0,asm,13001+22000,733.4864
gfx938,f8_w8a8_block,torch.float16,224,2048,7168,16,8,0,0,asm,13001+22000,769.9915
gfx938,f8_w8a8_block,torch.float16,256,2048,7168,16,8,0,0,asm,12005+22000,1012.8147
gfx938,f8_w8a8_block,torch.float16,384,2048,7168,16,8,0,0,asm,12005+22000,1266.6075
gfx938,f8_w8a8_block,torch.float16,512,2048,7168,16,8,0,0,asm,12005+22000,1651.9
gfx938,f8_w8a8_block,torch.float16,768,2048,7168,16,8,0,0,asm,13001+22000,2209.8097
gfx938,f8_w8a8_block,torch.float16,1024,2048,7168,16,8,0,0,asm,13001+23000,2721.6816
gfx938,f8_w8a8_block,torch.float16,1536,2048,7168,16,8,0,0,asm,13001+23000,3930.9237
gfx938,f8_w8a8_block,torch.float16,2048,2048,7168,16,8,0,0,asm,13001+23000,5010.0442
gfx938,f8_w8a8_block,torch.float16,3072,2048,7168,16,8,0,0,asm,13001+23000,7328.1415
gfx938,f8_w8a8_block,torch.float16,3584,2048,7168,16,8,0,0,asm,13001+23000,8457.5269
gfx938,f8_w8a8_block,torch.float16,3840,2048,7168,16,8,0,0,asm,13001+23000,9092.6067
gfx938,f8_w8a8_block,torch.float16,4096,2048,7168,16,8,0,0,asm,13001+23000,9647.2743
gfx938,f8_w8a8_block,torch.float16,5120,2048,7168,16,8,0,0,asm,13001+23000,11924.7904
gfx938,f8_w8a8_block,torch.float16,6144,2048,7168,16,8,0,0,asm,13001+23000,14222.8628
gfx938,f8_w8a8_block,torch.float16,7168,2048,7168,16,8,0,0,asm,13001+23000,16384.8763
gfx938,f8_w8a8_block,torch.float16,8192,2048,7168,16,8,0,0,asm,13001+23000,18712.2948
gfx938,f8_w8a8_block,torch.float16,12288,2048,7168,16,8,0,0,asm,13001+23000,27952.4493
gfx938,f8_w8a8_block,torch.float16,16384,2048,7168,16,8,0,0,asm,13001+23000,36869.1837
gfx938,f8_w8a8_block,torch.float16,24576,2048,7168,16,8,0,0,asm,13001+23000,54914.6881
gfx938,f8_w8a8_block,torch.float16,32768,2048,7168,16,8,0,0,asm,13001+23000,72948.9094
gfx938,f8_w8a8_block,torch.float16,1,2048,7168,8,8,0,0,asm,10001+20000,267.6383
gfx938,f8_w8a8_block,torch.float16,2,2048,7168,8,8,0,0,asm,10006+20000,270.9898
gfx938,f8_w8a8_block,torch.float16,4,2048,7168,8,8,0,0,asm,10002+20000,270.8719
gfx938,f8_w8a8_block,torch.float16,6,2048,7168,8,8,0,0,asm,10002+20000,280.5899
gfx938,f8_w8a8_block,torch.float16,8,2048,7168,8,8,0,0,asm,10002+20000,283.0992
gfx938,f8_w8a8_block,torch.float16,16,2048,7168,8,8,0,0,asm,10002+20000,286.2066
gfx938,f8_w8a8_block,torch.float16,24,2048,7168,8,8,0,0,asm,11010+21000,303.6942
gfx938,f8_w8a8_block,torch.float16,32,2048,7168,8,8,0,0,asm,11010+21000,312.3455
gfx938,f8_w8a8_block,torch.float16,36,2048,7168,8,8,0,0,asm,12003+22000,317.6479
gfx938,f8_w8a8_block,torch.float16,48,2048,7168,8,8,0,0,asm,12003+22002,328.1404
gfx938,f8_w8a8_block,torch.float16,56,2048,7168,8,8,0,0,asm,12003+22000,353.4456
gfx938,f8_w8a8_block,torch.float16,64,2048,7168,8,8,0,0,asm,12003+22000,331.7981
gfx938,f8_w8a8_block,torch.float16,72,2048,7168,8,8,0,0,asm,13001+22000,456.1231
gfx938,f8_w8a8_block,torch.float16,80,2048,7168,8,8,0,0,asm,13001+22000,424.8726
gfx938,f8_w8a8_block,torch.float16,88,2048,7168,8,8,0,0,asm,13001+22000,431.4494
gfx938,f8_w8a8_block,torch.float16,90,2048,7168,8,8,0,0,asm,13001+22000,435.4494
gfx938,f8_w8a8_block,torch.float16,96,2048,7168,8,8,0,0,asm,13001+22000,441.8662
gfx938,f8_w8a8_block,torch.float16,100,2048,7168,8,8,0,0,asm,13001+22000,430.2873
gfx938,f8_w8a8_block,torch.float16,112,2048,7168,8,8,0,0,asm,13001+22000,446.6915
gfx938,f8_w8a8_block,torch.float16,128,2048,7168,8,8,0,0,asm,13001+22000,438.5177
gfx938,f8_w8a8_block,torch.float16,160,2048,7168,8,8,0,0,asm,12005+22000,614.5056
gfx938,f8_w8a8_block,torch.float16,224,2048,7168,8,8,0,0,asm,13001+22000,739.8105
gfx938,f8_w8a8_block,torch.float16,256,2048,7168,8,8,0,0,asm,13001+22000,744.9672
gfx938,f8_w8a8_block,torch.float16,384,2048,7168,8,8,0,0,asm,13001+22000,1087.3912
gfx938,f8_w8a8_block,torch.float16,512,2048,7168,8,8,0,0,asm,13001+22000,1391.6428
gfx938,f8_w8a8_block,torch.float16,768,2048,7168,8,8,0,0,asm,13001+23000,1964.0364
gfx938,f8_w8a8_block,torch.float16,1024,2048,7168,8,8,0,0,asm,13001+23000,2507.9386
gfx938,f8_w8a8_block,torch.float16,1536,2048,7168,8,8,0,0,asm,13001+23000,3636.7677
gfx938,f8_w8a8_block,torch.float16,2048,2048,7168,8,8,0,0,asm,13001+23000,4742.7426
gfx938,f8_w8a8_block,torch.float16,3072,2048,7168,8,8,0,0,asm,13001+23000,6988.6465
gfx938,f8_w8a8_block,torch.float16,3584,2048,7168,8,8,0,0,asm,13001+23000,8090.6961
gfx938,f8_w8a8_block,torch.float16,3840,2048,7168,8,8,0,0,asm,13001+23000,8696.184
gfx938,f8_w8a8_block,torch.float16,4096,2048,7168,8,8,0,0,asm,13001+23000,9192.0232
gfx938,f8_w8a8_block,torch.float16,5120,2048,7168,8,8,0,0,asm,13001+23000,11496.301
gfx938,f8_w8a8_block,torch.float16,6144,2048,7168,8,8,0,0,asm,13001+23000,13715.0042
gfx938,f8_w8a8_block,torch.float16,7168,2048,7168,8,8,0,0,asm,13001+23000,16126.7491
gfx938,f8_w8a8_block,torch.float16,8192,2048,7168,8,8,0,0,asm,13001+23000,18519.7223
gfx938,f8_w8a8_block,torch.float16,12288,2048,7168,8,8,0,0,asm,13001+23000,27498.3048
gfx938,f8_w8a8_block,torch.float16,16384,2048,7168,8,8,0,0,asm,13001+23000,36258.1284
gfx938,f8_w8a8_block,torch.float16,24576,2048,7168,8,8,0,0,asm,13001+23000,53518.8203
gfx938,f8_w8a8_block,torch.float16,32768,2048,7168,8,8,0,0,asm,13001+23000,71472.2139
gfx938,f8_w8a8_block,torch.float16,1,256,7168,257,9,0,0,asm,10007+20000,73.9463
gfx938,f8_w8a8_block,torch.float16,2,256,7168,257,9,0,0,asm,10002+20000,103.0494
gfx938,f8_w8a8_block,torch.float16,4,256,7168,257,9,0,0,asm,10002+20000,157.7439
gfx938,f8_w8a8_block,torch.float16,6,256,7168,257,9,0,0,asm,10002+20000,211.7985
gfx938,f8_w8a8_block,torch.float16,8,256,7168,257,9,0,0,asm,10006+20000,253.7856
gfx938,f8_w8a8_block,torch.float16,12,256,7168,257,9,0,0,asm,10002+20000,331.7222
gfx938,f8_w8a8_block,torch.float16,16,256,7168,257,9,0,0,asm,10002+20000,407.5114
gfx938,f8_w8a8_block,torch.float16,20,256,7168,257,9,0,0,asm,10005+20000,465.2345
gfx938,f8_w8a8_block,torch.float16,24,256,7168,257,9,0,0,asm,10002+20000,519.9458
gfx938,f8_w8a8_block,torch.float16,28,256,7168,257,9,0,0,asm,10002+20000,565.4308
gfx938,f8_w8a8_block,torch.float16,32,256,7168,257,9,0,0,asm,10006+20000,592.3696
gfx938,f8_w8a8_block,torch.float16,36,256,7168,257,9,0,0,asm,10001+20000,620.1476
gfx938,f8_w8a8_block,torch.float16,40,256,7168,257,9,0,0,asm,10002+20000,642.4296
gfx938,f8_w8a8_block,torch.float16,44,256,7168,257,9,0,0,asm,10002+20000,651.9706
gfx938,f8_w8a8_block,torch.float16,48,256,7168,257,9,0,0,asm,10002+20000,686.421
gfx938,f8_w8a8_block,torch.float16,56,256,7168,257,9,0,0,asm,10002+20000,736.5008
gfx938,f8_w8a8_block,torch.float16,64,256,7168,257,9,0,0,asm,10002+20000,745.9071
gfx938,f8_w8a8_block,torch.float16,72,256,7168,257,9,0,0,asm,10002+20000,776.5091
gfx938,f8_w8a8_block,torch.float16,80,256,7168,257,9,0,0,asm,10002+20000,793.5026
gfx938,f8_w8a8_block,torch.float16,96,256,7168,257,9,0,0,asm,10002+20000,817.8563
gfx938,f8_w8a8_block,torch.float16,104,256,7168,257,9,0,0,asm,10002+20000,822.9004
gfx938,f8_w8a8_block,torch.float16,112,256,7168,257,9,0,0,asm,10002+20000,826.3278
gfx938,f8_w8a8_block,torch.float16,128,256,7168,257,9,0,0,asm,10002+20000,835.1446
gfx938,f8_w8a8_block,torch.float16,144,256,7168,257,9,0,0,asm,10002+20000,848.1887
gfx938,f8_w8a8_block,torch.float16,160,256,7168,257,9,0,0,asm,10001+20000,853.1572
gfx938,f8_w8a8_block,torch.float16,192,256,7168,257,9,0,0,asm,10001+20000,864.9213
gfx938,f8_w8a8_block,torch.float16,224,256,7168,257,9,0,0,asm,10002+20000,872.4666
gfx938,f8_w8a8_block,torch.float16,256,256,7168,257,9,0,0,asm,10002+20000,891.0096
gfx938,f8_w8a8_block,torch.float16,320,256,7168,257,9,0,0,asm,10005+20000,922.6053
gfx938,f8_w8a8_block,torch.float16,384,256,7168,257,9,0,0,asm,10006+20000,963.8683
gfx938,f8_w8a8_block,torch.float16,448,256,7168,257,9,0,0,asm,11010+21000,981.4514
gfx938,f8_w8a8_block,torch.float16,512,256,7168,257,9,0,0,asm,11009+21000,1019.9692
gfx938,f8_w8a8_block,torch.float16,768,256,7168,257,9,0,0,asm,11010+21000,1092.5163
gfx938,f8_w8a8_block,torch.float16,896,256,7168,257,9,0,0,asm,11010+21000,1171.3539
gfx938,f8_w8a8_block,torch.float16,960,256,7168,257,9,0,0,asm,11010+21000,1275.7745
gfx938,f8_w8a8_block,torch.float16,1024,256,7168,257,9,0,0,asm,11010+21000,1363.8584
gfx938,f8_w8a8_block,torch.float16,1280,256,7168,257,9,0,0,asm,12003+22000,1408.9024
gfx938,f8_w8a8_block,torch.float16,1536,256,7168,257,9,0,0,asm,12003+22000,1494.5274
gfx938,f8_w8a8_block,torch.float16,1920,256,7168,257,9,0,0,asm,12005+22000,1886.1974
gfx938,f8_w8a8_block,torch.float16,2048,256,7168,257,9,0,0,asm,12006+22000,2027.5611
gfx938,f8_w8a8_block,torch.float16,2304,256,7168,257,9,0,0,asm,13001+23000,2184.8658
gfx938,f8_w8a8_block,torch.float16,2560,256,7168,257,9,0,0,asm,13001+23000,2272.7138
gfx938,f8_w8a8_block,torch.float16,3072,256,7168,257,9,0,0,asm,13001+23000,2400.5871
gfx938,f8_w8a8_block,torch.float16,3584,256,7168,257,9,0,0,asm,12005+22000,2762.3288
gfx938,f8_w8a8_block,torch.float16,3840,256,7168,257,9,0,0,asm,12005+22000,3116.4495
gfx938,f8_w8a8_block,torch.float16,4096,256,7168,257,9,0,0,asm,12005+22000,3296.3478
gfx938,f8_w8a8_block,torch.float16,4608,256,7168,257,9,0,0,asm,12005+22000,3493.6523
gfx938,f8_w8a8_block,torch.float16,5120,256,7168,257,9,0,0,asm,12005+22000,3704.4556
gfx938,f8_w8a8_block,torch.float16,6144,256,7168,257,9,0,0,asm,13001+23000,4279.6198
gfx938,f8_w8a8_block,torch.float16,7168,256,7168,257,9,0,0,asm,13001+23000,4927.3562
gfx938,f8_w8a8_block,torch.float16,8192,256,7168,257,9,0,0,asm,12005+22000,5789.3569
gfx938,f8_w8a8_block,torch.float16,10240,256,7168,257,9,0,0,asm,13001+23000,6638.1284
gfx938,f8_w8a8_block,torch.float16,12288,256,7168,257,9,0,0,asm,13001+23000,8305.4483
gfx938,f8_w8a8_block,torch.float16,16384,256,7168,257,9,0,0,asm,13001+23000,10449.6253
gfx938,f8_w8a8_block,torch.float16,24576,256,7168,257,9,0,0,asm,13001+23000,15201.8004
gfx938,f8_w8a8_block,torch.float16,32768,256,7168,257,9,0,0,asm,13001+23000,20098.0089
gfx938,f8_w8a8_block,torch.float16,1,256,6144,256,8,0,0,asm,10007+20000,67.6813
gfx938,f8_w8a8_block,torch.float16,2,256,6144,256,8,0,0,asm,10007+20000,93.7608
gfx938,f8_w8a8_block,torch.float16,4,256,6144,256,8,0,0,asm,10002+20000,138.3419
gfx938,f8_w8a8_block,torch.float16,6,256,6144,256,8,0,0,asm,10002+20000,179.6723
gfx938,f8_w8a8_block,torch.float16,8,256,6144,256,8,0,0,asm,10002+20000,217.9458
gfx938,f8_w8a8_block,torch.float16,12,256,6144,256,8,0,0,asm,10002+20000,275.4782
gfx938,f8_w8a8_block,torch.float16,16,256,6144,256,8,0,0,asm,10002+20000,321.9033
gfx938,f8_w8a8_block,torch.float16,20,256,6144,256,8,0,0,asm,10002+20000,370.4559
gfx938,f8_w8a8_block,torch.float16,24,256,6144,256,8,0,0,asm,10002+20000,413.7231
gfx938,f8_w8a8_block,torch.float16,28,256,6144,256,8,0,0,asm,10002+20000,470.2396
gfx938,f8_w8a8_block,torch.float16,32,256,6144,256,8,0,0,asm,10002+20000,494.3489
gfx938,f8_w8a8_block,torch.float16,36,256,6144,256,8,0,0,asm,10002+20000,514.7164
gfx938,f8_w8a8_block,torch.float16,40,256,6144,256,8,0,0,asm,10002+20000,535.8532
gfx938,f8_w8a8_block,torch.float16,44,256,6144,256,8,0,0,asm,10002+20000,549.3352
gfx938,f8_w8a8_block,torch.float16,48,256,6144,256,8,0,0,asm,10002+20000,566.0256
gfx938,f8_w8a8_block,torch.float16,56,256,6144,256,8,0,0,asm,10001+20000,595.3224
gfx938,f8_w8a8_block,torch.float16,64,256,6144,256,8,0,0,asm,10002+20000,617.7644
gfx938,f8_w8a8_block,torch.float16,72,256,6144,256,8,0,0,asm,10002+20000,634.5306
gfx938,f8_w8a8_block,torch.float16,80,256,6144,256,8,0,0,asm,10002+20000,651.9285
gfx938,f8_w8a8_block,torch.float16,96,256,6144,256,8,0,0,asm,10002+20000,682.6315
gfx938,f8_w8a8_block,torch.float16,104,256,6144,256,8,0,0,asm,10002+20000,688.2567
gfx938,f8_w8a8_block,torch.float16,112,256,6144,256,8,0,0,asm,10002+20000,698.4546
gfx938,f8_w8a8_block,torch.float16,128,256,6144,256,8,0,0,asm,10002+20000,712.0882
gfx938,f8_w8a8_block,torch.float16,144,256,6144,256,8,0,0,asm,10002+20000,718.6482
gfx938,f8_w8a8_block,torch.float16,160,256,6144,256,8,0,0,asm,10002+20000,730.6565
gfx938,f8_w8a8_block,torch.float16,192,256,6144,256,8,0,0,asm,10002+20000,739.8271
gfx938,f8_w8a8_block,torch.float16,224,256,6144,256,8,0,0,asm,10002+20000,741.7386
gfx938,f8_w8a8_block,torch.float16,256,256,6144,256,8,0,0,asm,10001+20000,754.8923
gfx938,f8_w8a8_block,torch.float16,320,256,6144,256,8,0,0,asm,10002+20000,770.9764
gfx938,f8_w8a8_block,torch.float16,384,256,6144,256,8,0,0,asm,10002+20000,800.1889
gfx938,f8_w8a8_block,torch.float16,448,256,6144,256,8,0,0,asm,11007+21000,836.1298
gfx938,f8_w8a8_block,torch.float16,512,256,6144,256,8,0,0,asm,11007+21000,857.3255
gfx938,f8_w8a8_block,torch.float16,768,256,6144,256,8,0,0,asm,11007+21000,932.2726
gfx938,f8_w8a8_block,torch.float16,896,256,6144,256,8,0,0,asm,11010+21000,956.6094
gfx938,f8_w8a8_block,torch.float16,960,256,6144,256,8,0,0,asm,11010+21000,1000.4997
gfx938,f8_w8a8_block,torch.float16,1024,256,6144,256,8,0,0,asm,11010+21000,1056.4489
gfx938,f8_w8a8_block,torch.float16,1280,256,6144,256,8,0,0,asm,12003+22000,1205.4336
gfx938,f8_w8a8_block,torch.float16,1536,256,6144,256,8,0,0,asm,12003+22000,1248.1451
gfx938,f8_w8a8_block,torch.float16,1920,256,6144,256,8,0,0,asm,12003+22000,1397.3318
gfx938,f8_w8a8_block,torch.float16,2048,256,6144,256,8,0,0,asm,12005+22000,1552.9186
gfx938,f8_w8a8_block,torch.float16,2304,256,6144,256,8,0,0,asm,12005+22000,1788.5303
gfx938,f8_w8a8_block,torch.float16,2560,256,6144,256,8,0,0,asm,12005+22000,1912.6982
gfx938,f8_w8a8_block,torch.float16,3072,256,6144,256,8,0,0,asm,13001+23000,2027.8051
gfx938,f8_w8a8_block,torch.float16,3584,256,6144,256,8,0,0,asm,12005+22000,2141.1773
gfx938,f8_w8a8_block,torch.float16,3840,256,6144,256,8,0,0,asm,12005+22000,2282.5494
gfx938,f8_w8a8_block,torch.float16,4096,256,6144,256,8,0,0,asm,12005+22000,2508.3084
gfx938,f8_w8a8_block,torch.float16,4608,256,6144,256,8,0,0,asm,12005+22000,2875.9616
gfx938,f8_w8a8_block,torch.float16,5120,256,6144,256,8,0,0,asm,12005+22000,3084.045
gfx938,f8_w8a8_block,torch.float16,6144,256,6144,256,8,0,0,asm,12005+22000,3509.3738
gfx938,f8_w8a8_block,torch.float16,7168,256,6144,256,8,0,0,asm,13001+23000,3791.5959
gfx938,f8_w8a8_block,torch.float16,8192,256,6144,256,8,0,0,asm,13001+23000,4491.9889
gfx938,f8_w8a8_block,torch.float16,10240,256,6144,256,8,0,0,asm,13001+23000,5509.2227
gfx938,f8_w8a8_block,torch.float16,12288,256,6144,256,8,0,0,asm,13001+23000,6313.4469
gfx938,f8_w8a8_block,torch.float16,16384,256,6144,256,8,0,0,asm,13001+23000,8165.8268
gfx938,f8_w8a8_block,torch.float16,24576,256,6144,256,8,0,0,asm,13001+23000,11880.1362
gfx938,f8_w8a8_block,torch.float16,32768,256,6144,256,8,0,0,asm,13001+23000,15682.8069
gfx938,f8_w8a8_block,torch.float16,1,256,6144,257,9,0,0,asm,10007+20000,70.5191
gfx938,f8_w8a8_block,torch.float16,2,256,6144,257,9,0,0,asm,10007+20000,98.4684
gfx938,f8_w8a8_block,torch.float16,4,256,6144,257,9,0,0,asm,10002+20000,148.6071
gfx938,f8_w8a8_block,torch.float16,6,256,6144,257,9,0,0,asm,10002+20000,191.8575
gfx938,f8_w8a8_block,torch.float16,8,256,6144,257,9,0,0,asm,10002+20000,232.4299
gfx938,f8_w8a8_block,torch.float16,12,256,6144,257,9,0,0,asm,10001+20000,301.6255
gfx938,f8_w8a8_block,torch.float16,16,256,6144,257,9,0,0,asm,10002+20000,361.3053
gfx938,f8_w8a8_block,torch.float16,20,256,6144,257,9,0,0,asm,10002+20000,407.3989
gfx938,f8_w8a8_block,torch.float16,24,256,6144,257,9,0,0,asm,10002+20000,454.4134
gfx938,f8_w8a8_block,torch.float16,28,256,6144,257,9,0,0,asm,10002+20000,497.0436
gfx938,f8_w8a8_block,torch.float16,32,256,6144,257,9,0,0,asm,10002+20000,519.1488
gfx938,f8_w8a8_block,torch.float16,36,256,6144,257,9,0,0,asm,10002+20000,533.7563
gfx938,f8_w8a8_block,torch.float16,40,256,6144,257,9,0,0,asm,10002+20000,555.2046
gfx938,f8_w8a8_block,torch.float16,44,256,6144,257,9,0,0,asm,10002+20000,563.3562
gfx938,f8_w8a8_block,torch.float16,48,256,6144,257,9,0,0,asm,10002+20000,592.3582
gfx938,f8_w8a8_block,torch.float16,56,256,6144,257,9,0,0,asm,10002+20000,634.9769
gfx938,f8_w8a8_block,torch.float16,64,256,6144,257,9,0,0,asm,10002+20000,648.5771
gfx938,f8_w8a8_block,torch.float16,72,256,6144,257,9,0,0,asm,10002+20000,663.4401
gfx938,f8_w8a8_block,torch.float16,80,256,6144,257,9,0,0,asm,10002+20000,680.9811
gfx938,f8_w8a8_block,torch.float16,96,256,6144,257,9,0,0,asm,10001+20000,700.9809
gfx938,f8_w8a8_block,torch.float16,104,256,6144,257,9,0,0,asm,10002+20000,713.1156
gfx938,f8_w8a8_block,torch.float16,112,256,6144,257,9,0,0,asm,10002+20000,717.2166
gfx938,f8_w8a8_block,torch.float16,128,256,6144,257,9,0,0,asm,10001+20000,723.4987
gfx938,f8_w8a8_block,torch.float16,144,256,6144,257,9,0,0,asm,10002+20000,724.9219
gfx938,f8_w8a8_block,torch.float16,160,256,6144,257,9,0,0,asm,10002+20000,737.0734
gfx938,f8_w8a8_block,torch.float16,192,256,6144,257,9,0,0,asm,10001+20000,742.9428
gfx938,f8_w8a8_block,torch.float16,224,256,6144,257,9,0,0,asm,10001+20000,754.3533
gfx938,f8_w8a8_block,torch.float16,256,256,6144,257,9,0,0,asm,10002+20000,768.6522
gfx938,f8_w8a8_block,torch.float16,320,256,6144,257,9,0,0,asm,10002+20000,791.4058
gfx938,f8_w8a8_block,torch.float16,384,256,6144,257,9,0,0,asm,10006+20000,832.4583
gfx938,f8_w8a8_block,torch.float16,448,256,6144,257,9,0,0,asm,11007+21000,848.6097
gfx938,f8_w8a8_block,torch.float16,512,256,6144,257,9,0,0,asm,11010+21000,878.3359
gfx938,f8_w8a8_block,torch.float16,768,256,6144,257,9,0,0,asm,11010+21000,943.6241
gfx938,f8_w8a8_block,torch.float16,896,256,6144,257,9,0,0,asm,11009+21000,1048.4237
gfx938,f8_w8a8_block,torch.float16,960,256,6144,257,9,0,0,asm,11010+21000,1100.1456
gfx938,f8_w8a8_block,torch.float16,1024,256,6144,257,9,0,0,asm,11010+21000,1152.9031
gfx938,f8_w8a8_block,torch.float16,1280,256,6144,257,9,0,0,asm,12003+22000,1223.6062
gfx938,f8_w8a8_block,torch.float16,1536,256,6144,257,9,0,0,asm,12002+22000,1305.5679
gfx938,f8_w8a8_block,torch.float16,1920,256,6144,257,9,0,0,asm,12005+22000,1656.2444
gfx938,f8_w8a8_block,torch.float16,2048,256,6144,257,9,0,0,asm,12005+22000,1770.1303
gfx938,f8_w8a8_block,torch.float16,2304,256,6144,257,9,0,0,asm,13001+23000,1911.9824
gfx938,f8_w8a8_block,torch.float16,2560,256,6144,257,9,0,0,asm,13001+23000,1980.1926
gfx938,f8_w8a8_block,torch.float16,3072,256,6144,257,9,0,0,asm,13001+23000,2101.4216
gfx938,f8_w8a8_block,torch.float16,3584,256,6144,257,9,0,0,asm,12005+22000,2446.9782
gfx938,f8_w8a8_block,torch.float16,3840,256,6144,257,9,0,0,asm,12005+22000,2696.7961
gfx938,f8_w8a8_block,torch.float16,4096,256,6144,257,9,0,0,asm,12005+22000,2876.2059
gfx938,f8_w8a8_block,torch.float16,4608,256,6144,257,9,0,0,asm,12005+22000,3061.4851
gfx938,f8_w8a8_block,torch.float16,5120,256,6144,257,9,0,0,asm,12005+22000,3218.2929
gfx938,f8_w8a8_block,torch.float16,6144,256,6144,257,9,0,0,asm,13001+23000,3724.1098
gfx938,f8_w8a8_block,torch.float16,7168,256,6144,257,9,0,0,asm,13001+23000,4285.598
gfx938,f8_w8a8_block,torch.float16,8192,256,6144,257,9,0,0,asm,12005+22000,5012.2561
gfx938,f8_w8a8_block,torch.float16,10240,256,6144,257,9,0,0,asm,13001+23000,5764.6995
gfx938,f8_w8a8_block,torch.float16,12288,256,6144,257,9,0,0,asm,13001+23000,7196.6686
gfx938,f8_w8a8_block,torch.float16,16384,256,6144,257,9,0,0,asm,13001+23000,9152.8711
gfx938,f8_w8a8_block,torch.float16,24576,256,6144,257,9,0,0,asm,13001+23000,13116.0298
gfx938,f8_w8a8_block,torch.float16,32768,256,6144,257,9,0,0,asm,13001+23000,17301.5285
gfx938,f8_w8a8_block,torch.float16,1,384,3072,256,8,0,0,asm,10001+20000,65.795
gfx938,f8_w8a8_block,torch.float16,2,384,3072,256,8,0,0,asm,10006+20000,83.7907
gfx938,f8_w8a8_block,torch.float16,4,384,3072,256,8,0,0,asm,10002+20000,125.6179
gfx938,f8_w8a8_block,torch.float16,6,384,3072,256,8,0,0,asm,10006+20000,149.9967
gfx938,f8_w8a8_block,torch.float16,8,384,3072,256,8,0,0,asm,10002+20000,176.7839
gfx938,f8_w8a8_block,torch.float16,12,384,3072,256,8,0,0,asm,10002+20000,227.4028
gfx938,f8_w8a8_block,torch.float16,16,384,3072,256,8,0,0,asm,10002+20000,264.9185
gfx938,f8_w8a8_block,torch.float16,20,384,3072,256,8,0,0,asm,10002+20000,300.1154
gfx938,f8_w8a8_block,torch.float16,24,384,3072,256,8,0,0,asm,10002+20000,335.7783
gfx938,f8_w8a8_block,torch.float16,28,384,3072,256,8,0,0,asm,10002+20000,378.2906
gfx938,f8_w8a8_block,torch.float16,32,384,3072,256,8,0,0,asm,10002+20000,399.1411
gfx938,f8_w8a8_block,torch.float16,36,384,3072,256,8,0,0,asm,10002+20000,410.4643
gfx938,f8_w8a8_block,torch.float16,40,384,3072,256,8,0,0,asm,10002+20000,426.2791
gfx938,f8_w8a8_block,torch.float16,44,384,3072,256,8,0,0,asm,10002+20000,445.6137
gfx938,f8_w8a8_block,torch.float16,48,384,3072,256,8,0,0,asm,10002+20000,451.6853
gfx938,f8_w8a8_block,torch.float16,56,384,3072,256,8,0,0,asm,10001+20000,474.1946
gfx938,f8_w8a8_block,torch.float16,64,384,3072,256,8,0,0,asm,10002+20000,492.3841
gfx938,f8_w8a8_block,torch.float16,72,384,3072,256,8,0,0,asm,10002+20000,506.1860
gfx938,f8_w8a8_block,torch.float16,80,384,3072,256,8,0,0,asm,10002+20000,516.9145
gfx938,f8_w8a8_block,torch.float16,96,384,3072,256,8,0,0,asm,10002+20000,535.4744
gfx938,f8_w8a8_block,torch.float16,104,384,3072,256,8,0,0,asm,10002+20000,542.3038
gfx938,f8_w8a8_block,torch.float16,112,384,3072,256,8,0,0,asm,10002+20000,545.5796
gfx938,f8_w8a8_block,torch.float16,128,384,3072,256,8,0,0,asm,10001+20000,558.7754
gfx938,f8_w8a8_block,torch.float16,144,384,3072,256,8,0,0,asm,10002+20000,564.8554
gfx938,f8_w8a8_block,torch.float16,160,384,3072,256,8,0,0,asm,10002+20000,564.2491
gfx938,f8_w8a8_block,torch.float16,192,384,3072,256,8,0,0,asm,10001+20000,573.4617
gfx938,f8_w8a8_block,torch.float16,224,384,3072,256,8,0,0,asm,10002+20000,579.6174
gfx938,f8_w8a8_block,torch.float16,256,384,3072,256,8,0,0,asm,10002+20000,583.6848
gfx938,f8_w8a8_block,torch.float16,320,384,3072,256,8,0,0,asm,10002+20000,595.5837
gfx938,f8_w8a8_block,torch.float16,384,384,3072,256,8,0,0,asm,10006+20000,619.592
gfx938,f8_w8a8_block,torch.float16,448,384,3072,256,8,0,0,asm,11010+21000,628.4425
gfx938,f8_w8a8_block,torch.float16,512,384,3072,256,8,0,0,asm,11010+21000,641.6214
gfx938,f8_w8a8_block,torch.float16,768,384,3072,256,8,0,0,asm,11010+21000,721.0822
gfx938,f8_w8a8_block,torch.float16,896,384,3072,256,8,0,0,asm,11010+21000,708.9475
gfx938,f8_w8a8_block,torch.float16,960,384,3072,256,8,0,0,asm,11010+21000,746.0674
gfx938,f8_w8a8_block,torch.float16,1024,384,3072,256,8,0,0,asm,11010+21000,774.5641
gfx938,f8_w8a8_block,torch.float16,1280,384,3072,256,8,0,0,asm,12003+22000,845.0818
gfx938,f8_w8a8_block,torch.float16,1536,384,3072,256,8,0,0,asm,12003+22000,916.7026
gfx938,f8_w8a8_block,torch.float16,1920,384,3072,256,8,0,0,asm,12003+22000,998.3023
gfx938,f8_w8a8_block,torch.float16,2048,384,3072,256,8,0,0,asm,12005+22000,1088.9209
gfx938,f8_w8a8_block,torch.float16,2304,384,3072,256,8,0,0,asm,12005+22000,1274.0655
gfx938,f8_w8a8_block,torch.float16,2560,384,3072,256,8,0,0,asm,13001+22000,1351.3958
gfx938,f8_w8a8_block,torch.float16,3072,384,3072,256,8,0,0,asm,13001+22000,1402.7135
gfx938,f8_w8a8_block,torch.float16,3584,384,3072,256,8,0,0,asm,12005+22000,1488.7932
gfx938,f8_w8a8_block,torch.float16,3840,384,3072,256,8,0,0,asm,12005+22000,1584.9023
gfx938,f8_w8a8_block,torch.float16,4096,384,3072,256,8,0,0,asm,12005+22000,1764.2532
gfx938,f8_w8a8_block,torch.float16,4608,384,3072,256,8,0,0,asm,12005+22000,1992.3282
gfx938,f8_w8a8_block,torch.float16,5120,384,3072,256,8,0,0,asm,12005+22000,2099.8142
gfx938,f8_w8a8_block,torch.float16,6144,384,3072,256,8,0,0,asm,12005+22000,2443.4087
gfx938,f8_w8a8_block,torch.float16,7168,384,3072,256,8,0,0,asm,13001+23000,2574.2547
gfx938,f8_w8a8_block,torch.float16,8192,384,3072,256,8,0,0,asm,13001+23000,3029.9331
gfx938,f8_w8a8_block,torch.float16,10240,384,3072,256,8,0,0,asm,13001+23000,3706.9581
gfx938,f8_w8a8_block,torch.float16,12288,384,3072,256,8,0,0,asm,13001+23000,4301.5159
gfx938,f8_w8a8_block,torch.float16,16384,384,3072,256,8,0,0,asm,13001+23000,5563.0188
gfx938,f8_w8a8_block,torch.float16,24576,384,3072,256,8,0,0,asm,13001+23000,7960.9725
gfx938,f8_w8a8_block,torch.float16,32768,384,3072,256,8,0,0,asm,13001+23000,10497.4939
gfx938,f8_w8a8_block,torch.float16,1,1536,3072,64,8,0,0,asm,10002+20000,118.2831
gfx938,f8_w8a8_block,torch.float16,2,1536,3072,64,8,0,0,asm,10002+20000,172.9438
gfx938,f8_w8a8_block,torch.float16,4,1536,3072,64,8,0,0,asm,10006+20000,280.0004
gfx938,f8_w8a8_block,torch.float16,6,1536,3072,64,8,0,0,asm,10002+20000,357.1707
gfx938,f8_w8a8_block,torch.float16,8,1536,3072,64,8,0,0,asm,10001+20000,381.2043
gfx938,f8_w8a8_block,torch.float16,12,1536,3072,64,8,0,0,asm,10002+20000,445.6251
gfx938,f8_w8a8_block,torch.float16,16,1536,3072,64,8,0,0,asm,10002+20000,485.1029
gfx938,f8_w8a8_block,torch.float16,20,1536,3072,64,8,0,0,asm,10002+20000,520.2745
gfx938,f8_w8a8_block,torch.float16,24,1536,3072,64,8,0,0,asm,10002+20000,528.2071
gfx938,f8_w8a8_block,torch.float16,28,1536,3072,64,8,0,0,asm,10002+20000,544.5385
gfx938,f8_w8a8_block,torch.float16,32,1536,3072,64,8,0,0,asm,10002+20000,549.3889
gfx938,f8_w8a8_block,torch.float16,36,1536,3072,64,8,0,0,asm,10002+20000,557.2091
gfx938,f8_w8a8_block,torch.float16,40,1536,3072,64,8,0,0,asm,10002+20000,559.5248
gfx938,f8_w8a8_block,torch.float16,44,1536,3072,64,8,0,0,asm,10002+20000,568.5774
gfx938,f8_w8a8_block,torch.float16,48,1536,3072,64,8,0,0,asm,10002+20000,576.7458
gfx938,f8_w8a8_block,torch.float16,56,1536,3072,64,8,0,0,asm,10002+20000,580.5437
gfx938,f8_w8a8_block,torch.float16,64,1536,3072,64,8,0,0,asm,10002+20000,581.052
gfx938,f8_w8a8_block,torch.float16,72,1536,3072,64,8,0,0,asm,10002+20000,576.6869
gfx938,f8_w8a8_block,torch.float16,80,1536,3072,64,8,0,0,asm,10001+20000,583.9037
gfx938,f8_w8a8_block,torch.float16,96,1536,3072,64,8,0,0,asm,11008+21000,643.0025
gfx938,f8_w8a8_block,torch.float16,104,1536,3072,64,8,0,0,asm,11010+21000,603.3142
gfx938,f8_w8a8_block,torch.float16,112,1536,3072,64,8,0,0,asm,11010+21000,604.4005
gfx938,f8_w8a8_block,torch.float16,128,1536,3072,64,8,0,0,asm,11010+21000,621.9529
gfx938,f8_w8a8_block,torch.float16,144,1536,3072,64,8,0,0,asm,11010+21000,617.4194
gfx938,f8_w8a8_block,torch.float16,160,1536,3072,64,8,0,0,asm,11010+21000,619.9457
gfx938,f8_w8a8_block,torch.float16,192,1536,3072,64,8,0,0,asm,11009+21000,677.4613
gfx938,f8_w8a8_block,torch.float16,224,1536,3072,64,8,0,0,asm,11010+21000,660.3666
gfx938,f8_w8a8_block,torch.float16,256,1536,3072,64,8,0,0,asm,12003+22000,682.2528
gfx938,f8_w8a8_block,torch.float16,320,1536,3072,64,8,0,0,asm,12003+22000,685.7728
gfx938,f8_w8a8_block,torch.float16,384,1536,3072,64,8,0,0,asm,12002+22000,710.6569
gfx938,f8_w8a8_block,torch.float16,448,1536,3072,64,8,0,0,asm,12003+22000,729.0737
gfx938,f8_w8a8_block,torch.float16,512,1536,3072,64,8,0,0,asm,12003+22000,880.7616
gfx938,f8_w8a8_block,torch.float16,768,1536,3072,64,8,0,0,asm,13001+22000,996.9717
gfx938,f8_w8a8_block,torch.float16,896,1536,3072,64,8,0,0,asm,13001+22000,1021.9148
gfx938,f8_w8a8_block,torch.float16,960,1536,3072,64,8,0,0,asm,13001+22000,1146.7902
gfx938,f8_w8a8_block,torch.float16,1024,1536,3072,64,8,0,0,asm,12005+22000,1338.7137
gfx938,f8_w8a8_block,torch.float16,1280,1536,3072,64,8,0,0,asm,12005+22000,1541.1298
gfx938,f8_w8a8_block,torch.float16,1536,1536,3072,64,8,0,0,asm,12005+22000,1845.1709
gfx938,f8_w8a8_block,torch.float16,1920,1536,3072,64,8,0,0,asm,13001+22000,1981.4062
gfx938,f8_w8a8_block,torch.float16,2048,1536,3072,64,8,0,0,asm,13001+23000,2225.9443
gfx938,f8_w8a8_block,torch.float16,2304,1536,3072,64,8,0,0,asm,12005+22000,2547.0715
gfx938,f8_w8a8_block,torch.float16,2560,1536,3072,64,8,0,0,asm,13001+23000,2643.6354
gfx938,f8_w8a8_block,torch.float16,3072,1536,3072,64,8,0,0,asm,13001+23000,3097.7981
gfx938,f8_w8a8_block,torch.float16,3584,1536,3072,64,8,0,0,asm,13001+23000,3522.9755
gfx938,f8_w8a8_block,torch.float16,3840,1536,3072,64,8,0,0,asm,13001+23000,3585.7374
gfx938,f8_w8a8_block,torch.float16,4096,1536,3072,64,8,0,0,asm,13001+23000,3955.6814
gfx938,f8_w8a8_block,torch.float16,4608,1536,3072,64,8,0,0,asm,13001+23000,4386.8714
gfx938,f8_w8a8_block,torch.float16,5120,1536,3072,64,8,0,0,asm,13001+23000,4794.1458
gfx938,f8_w8a8_block,torch.float16,6144,1536,3072,64,8,0,0,asm,13001+23000,5649.5617
gfx938,f8_w8a8_block,torch.float16,7168,1536,3072,64,8,0,0,asm,13001+23000,6510.7629
gfx938,f8_w8a8_block,torch.float16,8192,1536,3072,64,8,0,0,asm,13001+23000,7415.2649
gfx938,f8_w8a8_block,torch.float16,10240,1536,3072,64,8,0,0,asm,13001+23000,9181.1704
gfx938,f8_w8a8_block,torch.float16,12288,1536,3072,64,8,0,0,asm,13001+23000,10876.1201
gfx938,f8_w8a8_block,torch.float16,16384,1536,3072,64,8,0,0,asm,13001+23000,14314.7352
gfx938,f8_w8a8_block,torch.float16,24576,1536,3072,64,8,0,0,asm,13001+23000,21336.6809
gfx938,f8_w8a8_block,torch.float16,32768,1536,3072,64,8,0,0,asm,13001+23000,28266.1463
quant_type,indtype,token,inter_dim,model_dim,expert,topk,q_size_n,q_size_k,sol_type,sol_id,time_us
no_quant,torch.float16,1,256,8192,256,4,0,0,ck,576,309.8021428571405
no_quant,torch.float16,8,256,8192,256,4,0,0,ck,576,364.40785714285965
no_quant,torch.float16,16,256,8192,256,4,0,0,ck,576,705.001571428565
no_quant,torch.float16,24,256,8192,256,4,0,0,ck,272,1028.2664285714334
no_quant,torch.float16,32,256,8192,256,4,0,0,ck,576,1293.2290000000055
no_quant,torch.float16,48,256,8192,256,4,0,0,ck,272,1877.2707142857207
no_quant,torch.float16,64,256,8192,256,4,0,0,ck,576,2193.247142857142
no_quant,torch.float16,96,256,8192,256,4,0,0,ck,272,2471.966714285715
no_quant,torch.float16,128,256,8192,256,4,0,0,ck,576,2724.7889999999948
no_quant,torch.float16,256,256,8192,256,4,0,0,ck,576,3391.9192857142875
no_quant,torch.float16,512,256,8192,256,4,0,0,ck,576,3537.358999999999
no_quant,torch.float16,1024,256,8192,256,4,0,0,ck,272,5022.04200000001
no_quant,torch.float16,2048,256,8192,256,4,0,0,ck,272,6217.148285714277
no_quant,torch.float16,4096,256,8192,256,4,0,0,ck,272,8764.503571428571
no_quant,torch.float16,8192,256,8192,256,4,0,0,ck,272,16520.489142857128
no_quant,torch.float16,1,256,7168,256,8,0,0,ck,576,274.4422857142844
no_quant,torch.float16,8,256,7168,256,8,0,0,ck,576,584.9560000000014
no_quant,torch.float16,16,256,7168,256,8,0,0,ck,576,1056.360857142859
no_quant,torch.float16,24,256,7168,256,8,0,0,ck,576,1480.196999999999
no_quant,torch.float16,32,256,7168,256,8,0,0,ck,576,1867.970714285712
no_quant,torch.float16,48,256,7168,256,8,0,0,ck,576,2312.378428571425
no_quant,torch.float16,64,256,7168,256,8,0,0,ck,576,2382.001142857145
no_quant,torch.float16,96,256,7168,256,8,0,0,ck,576,2795.691714285705
no_quant,torch.float16,128,256,7168,256,8,0,0,ck,576,2820.2631428571426
no_quant,torch.float16,256,256,7168,256,8,0,0,ck,576,3055.348428571423
no_quant,torch.float16,512,256,7168,256,8,0,0,ck,272,4095.392285714287
no_quant,torch.float16,1024,256,7168,256,8,0,0,ck,272,5514.589714285707
no_quant,torch.float16,2048,256,7168,256,8,0,0,ck,272,7718.288428571438
no_quant,torch.float16,4096,256,7168,256,8,0,0,ck,272,14435.327142857148
no_quant,torch.float16,8192,256,7168,256,8,0,0,ck,272,27850.411142857163
M,N,K,bias,dtype,outdtype,scaleAB,libtype,solidx,soltimes,kernelName
token,model_dim,inter_dim,expert,topk,act_type,dtype,q_dtype_a,q_dtype_w,q_type,use_g1u1,doweight_stage1
256,6144,4096,8,2,ActivationType.Silu,torch.bfloat16,torch.float8_e4m3fnuz,torch.float8_e4m3fnuz,QuantType.per_128x128,1,0
512,6144,4096,8,2,ActivationType.Silu,torch.bfloat16,torch.int8,torch.int8,QuantType.per_Tensor,1,0
512,6144,4096,8,2,ActivationType.Silu,torch.bfloat16,torch.int8,torch.int8,QuantType.per_Token,1,0
512,6144,4096,8,2,ActivationType.Silu,torch.bfloat16,torch.float8_e4m3fnuz,torch.float8_e4m3fnuz,QuantType.per_Token,1,0
512,6144,4096,8,2,ActivationType.Silu,torch.bfloat16,torch.float8_e4m3fnuz,torch.int4,QuantType.per_Tensor,1,0
512,6144,4096,8,2,ActivationType.Gelu,torch.bfloat16,torch.int8,torch.int8,QuantType.per_Tensor,1,0
512,6144,4096,8,2,ActivationType.Gelu,torch.bfloat16,torch.int8,torch.int8,QuantType.per_Token,1,0
512,6144,4096,8,2,ActivationType.Gelu,torch.bfloat16,torch.float8_e4m3fnuz,torch.float8_e4m3fnuz,QuantType.per_Token,1,0
512,6144,4096,8,2,ActivationType.Gelu,torch.bfloat16,torch.float8_e4m3fnuz,torch.int4,QuantType.per_Tensor,1,0
4,2304,1536,8,2,ActivationType.Gelu,torch.bfloat16,torch.float8_e4m3fnuz,torch.float8_e4m3fnuz,QuantType.per_Token,1,0
4,2304,1536,8,2,ActivationType.Gelu,torch.bfloat16,torch.float8_e4m3fnuz,torch.float8_e4m3fnuz,QuantType.per_Token,1,1
\ No newline at end of file
quant_type,indtype,token,inter_dim,model_dim,expert,topk,q_size_n,q_size_k
int4_w4a16,torch.float16,1,256,7168,256,8,0,0
int4_w4a16,torch.float16,2,256,7168,256,8,0,0
int4_w4a16,torch.float16,4,256,7168,256,8,0,0
int4_w4a16,torch.float16,6,256,7168,256,8,0,0
int4_w4a16,torch.float16,8,256,7168,256,8,0,0
int4_w4a16,torch.float16,10,256,7168,256,8,0,0
int4_w4a16,torch.float16,12,256,7168,256,8,0,0
int4_w4a16,torch.float16,14,256,7168,256,8,0,0
int4_w4a16,torch.float16,16,256,7168,256,8,0,0
int4_w4a16,torch.float16,20,256,7168,256,8,0,0
int4_w4a16,torch.float16,24,256,7168,256,8,0,0
int4_w4a16,torch.float16,28,256,7168,256,8,0,0
int4_w4a16,torch.float16,32,256,7168,256,8,0,0
int4_w4a16,torch.float16,36,256,7168,256,8,0,0
int4_w4a16,torch.float16,40,256,7168,256,8,0,0
int4_w4a16,torch.float16,44,256,7168,256,8,0,0
int4_w4a16,torch.float16,48,256,7168,256,8,0,0
int4_w4a16,torch.float16,56,256,7168,256,8,0,0
int4_w4a16,torch.float16,64,256,7168,256,8,0,0
int4_w4a16,torch.float16,80,256,7168,256,8,0,0
int4_w4a16,torch.float16,96,256,7168,256,8,0,0
int4_w4a16,torch.float16,112,256,7168,256,8,0,0
int4_w4a16,torch.float16,128,256,7168,256,8,0,0
int4_w4a16,torch.float16,160,256,7168,256,8,0,0
int4_w4a16,torch.float16,192,256,7168,256,8,0,0
int4_w4a16,torch.float16,224,256,7168,256,8,0,0
int4_w4a16,torch.float16,256,256,7168,256,8,0,0
int4_w4a16,torch.float16,320,256,7168,256,8,0,0
int4_w4a16,torch.float16,384,256,7168,256,8,0,0
int4_w4a16,torch.float16,448,256,7168,256,8,0,0
int4_w4a16,torch.float16,512,256,7168,256,8,0,0
int4_w4a16,torch.float16,576,256,7168,256,8,0,0
int4_w4a16,torch.float16,640,256,7168,256,8,0,0
int4_w4a16,torch.float16,704,256,7168,256,8,0,0
int4_w4a16,torch.float16,768,256,7168,256,8,0,0
int4_w4a16,torch.float16,832,256,7168,256,8,0,0
int4_w4a16,torch.float16,896,256,7168,256,8,0,0
int4_w4a16,torch.float16,960,256,7168,256,8,0,0
int4_w4a16,torch.float16,1024,256,7168,256,8,0,0
int4_w4a16,torch.float16,1152,256,7168,256,8,0,0
int4_w4a16,torch.float16,1280,256,7168,256,8,0,0
int4_w4a16,torch.float16,1408,256,7168,256,8,0,0
int4_w4a16,torch.float16,1536,256,7168,256,8,0,0
int4_w4a16,torch.float16,1664,256,7168,256,8,0,0
int4_w4a16,torch.float16,1792,256,7168,256,8,0,0
int4_w4a16,torch.float16,1920,256,7168,256,8,0,0
int4_w4a16,torch.float16,2048,256,7168,256,8,0,0
int4_w4a16,torch.float16,2304,256,7168,256,8,0,0
int4_w4a16,torch.float16,2560,256,7168,256,8,0,0
int4_w4a16,torch.float16,2816,256,7168,256,8,0,0
int4_w4a16,torch.float16,3072,256,7168,256,8,0,0
int4_w4a16,torch.float16,3328,256,7168,256,8,0,0
int4_w4a16,torch.float16,3584,256,7168,256,8,0,0
int4_w4a16,torch.float16,3840,256,7168,256,8,0,0
int4_w4a16,torch.float16,4096,256,7168,256,8,0,0
int4_w4a16,torch.float16,4608,256,7168,256,8,0,0
int4_w4a16,torch.float16,5120,256,7168,256,8,0,0
int4_w4a16,torch.float16,5632,256,7168,256,8,0,0
int4_w4a16,torch.float16,6144,256,7168,256,8,0,0
int4_w4a16,torch.float16,6656,256,7168,256,8,0,0
int4_w4a16,torch.float16,7168,256,7168,256,8,0,0
int4_w4a16,torch.float16,7680,256,7168,256,8,0,0
int4_w4a16,torch.float16,8192,256,7168,256,8,0,0
int4_w4a16,torch.float16,10240,256,7168,256,8,0,0
int4_w4a16,torch.float16,12288,256,7168,256,8,0,0
int4_w4a16,torch.float16,14336,256,7168,256,8,0,0
int4_w4a16,torch.float16,16384,256,7168,256,8,0,0
int4_w4a16,torch.float16,17408,256,7168,256,8,0,0
int4_w4a16,torch.float16,24576,256,7168,256,8,0,0
int4_w4a16,torch.float16,32768,256,7168,256,8,0,0
\ No newline at end of file
quant_type,indtype,token,inter_dim,model_dim,expert,topk,q_size_n,q_size_k
int4_w4a8,torch.float16,1,256,7168,256,8,0,0
int4_w4a8,torch.float16,2,256,7168,256,8,0,0
int4_w4a8,torch.float16,4,256,7168,256,8,0,0
int4_w4a8,torch.float16,6,256,7168,256,8,0,0
int4_w4a8,torch.float16,8,256,7168,256,8,0,0
int4_w4a8,torch.float16,10,256,7168,256,8,0,0
int4_w4a8,torch.float16,12,256,7168,256,8,0,0
int4_w4a8,torch.float16,14,256,7168,256,8,0,0
int4_w4a8,torch.float16,16,256,7168,256,8,0,0
int4_w4a8,torch.float16,20,256,7168,256,8,0,0
int4_w4a8,torch.float16,24,256,7168,256,8,0,0
int4_w4a8,torch.float16,28,256,7168,256,8,0,0
int4_w4a8,torch.float16,32,256,7168,256,8,0,0
int4_w4a8,torch.float16,36,256,7168,256,8,0,0
int4_w4a8,torch.float16,40,256,7168,256,8,0,0
int4_w4a8,torch.float16,44,256,7168,256,8,0,0
int4_w4a8,torch.float16,48,256,7168,256,8,0,0
int4_w4a8,torch.float16,56,256,7168,256,8,0,0
int4_w4a8,torch.float16,64,256,7168,256,8,0,0
int4_w4a8,torch.float16,72,256,7168,256,8,0,0
int4_w4a8,torch.float16,80,256,7168,256,8,0,0
int4_w4a8,torch.float16,96,256,7168,256,8,0,0
int4_w4a8,torch.float16,112,256,7168,256,8,0,0
int4_w4a8,torch.float16,128,256,7168,256,8,0,0
int4_w4a8,torch.float16,160,256,7168,256,8,0,0
int4_w4a8,torch.float16,192,256,7168,256,8,0,0
int4_w4a8,torch.float16,224,256,7168,256,8,0,0
int4_w4a8,torch.float16,256,256,7168,256,8,0,0
int4_w4a8,torch.float16,320,256,7168,256,8,0,0
int4_w4a8,torch.float16,384,256,7168,256,8,0,0
int4_w4a8,torch.float16,448,256,7168,256,8,0,0
int4_w4a8,torch.float16,512,256,7168,256,8,0,0
int4_w4a8,torch.float16,576,256,7168,256,8,0,0
int4_w4a8,torch.float16,640,256,7168,256,8,0,0
int4_w4a8,torch.float16,704,256,7168,256,8,0,0
int4_w4a8,torch.float16,768,256,7168,256,8,0,0
int4_w4a8,torch.float16,832,256,7168,256,8,0,0
int4_w4a8,torch.float16,896,256,7168,256,8,0,0
int4_w4a8,torch.float16,960,256,7168,256,8,0,0
int4_w4a8,torch.float16,1024,256,7168,256,8,0,0
int4_w4a8,torch.float16,1152,256,7168,256,8,0,0
int4_w4a8,torch.float16,1280,256,7168,256,8,0,0
int4_w4a8,torch.float16,1408,256,7168,256,8,0,0
int4_w4a8,torch.float16,1536,256,7168,256,8,0,0
int4_w4a8,torch.float16,1664,256,7168,256,8,0,0
int4_w4a8,torch.float16,1792,256,7168,256,8,0,0
int4_w4a8,torch.float16,1920,256,7168,256,8,0,0
int4_w4a8,torch.float16,2048,256,7168,256,8,0,0
int4_w4a8,torch.float16,2304,256,7168,256,8,0,0
int4_w4a8,torch.float16,2560,256,7168,256,8,0,0
int4_w4a8,torch.float16,2816,256,7168,256,8,0,0
int4_w4a8,torch.float16,3072,256,7168,256,8,0,0
int4_w4a8,torch.float16,3328,256,7168,256,8,0,0
int4_w4a8,torch.float16,3584,256,7168,256,8,0,0
int4_w4a8,torch.float16,3840,256,7168,256,8,0,0
int4_w4a8,torch.float16,4096,256,7168,256,8,0,0
int4_w4a8,torch.float16,4608,256,7168,256,8,0,0
int4_w4a8,torch.float16,5120,256,7168,256,8,0,0
int4_w4a8,torch.float16,5632,256,7168,256,8,0,0
int4_w4a8,torch.float16,6144,256,7168,256,8,0,0
int4_w4a8,torch.float16,6656,256,7168,256,8,0,0
int4_w4a8,torch.float16,7168,256,7168,256,8,0,0
int4_w4a8,torch.float16,7680,256,7168,256,8,0,0
int4_w4a8,torch.float16,8192,256,7168,256,8,0,0
int4_w4a8,torch.float16,10240,256,7168,256,8,0,0
int4_w4a8,torch.float16,12288,256,7168,256,8,0,0
int4_w4a8,torch.float16,14336,256,7168,256,8,0,0
int4_w4a8,torch.float16,16384,256,7168,256,8,0,0
int4_w4a8,torch.float16,17408,256,7168,256,8,0,0
int4_w4a8,torch.float16,24576,256,7168,256,8,0,0
int4_w4a8,torch.float16,32768,256,7168,256,8,0,0
int4_w4a8,torch.float16,1,128,7168,256,8,0,0
int4_w4a8,torch.float16,8,128,7168,256,8,0,0
int4_w4a8,torch.float16,32,128,7168,256,8,0,0
int4_w4a8,torch.float16,48,128,7168,256,8,0,0
int4_w4a8,torch.float16,64,128,7168,256,8,0,0
int4_w4a8,torch.float16,80,128,7168,256,8,0,0
int4_w4a8,torch.float16,96,128,7168,256,8,0,0
int4_w4a8,torch.float16,128,128,7168,256,8,0,0
int4_w4a8,torch.float16,256,128,7168,256,8,0,0
int4_w4a8,torch.float16,512,128,7168,256,8,0,0
int4_w4a8,torch.float16,768,128,7168,256,8,0,0
int4_w4a8,torch.float16,1024,128,7168,256,8,0,0
int4_w4a8,torch.float16,2048,128,7168,256,8,0,0
int4_w4a8,torch.float16,3072,128,7168,256,8,0,0
int4_w4a8,torch.float16,4096,128,7168,256,8,0,0
int4_w4a8,torch.float16,5120,128,7168,256,8,0,0
int4_w4a8,torch.float16,6144,128,7168,256,8,0,0
int4_w4a8,torch.float16,8192,128,7168,256,8,0,0
int4_w4a8,torch.float16,10240,128,7168,256,8,0,0
int4_w4a8,torch.float16,12288,128,7168,256,8,0,0
int4_w4a8,torch.float16,16384,128,7168,256,8,0,0
int4_w4a8,torch.float16,24576,128,7168,256,8,0,0
int4_w4a8,torch.float16,32768,128,7168,256,8,0,0
\ No newline at end of file
quant_type,indtype,token,inter_dim,model_dim,expert,topk,q_size_n,q_size_k
f8_w8a8_channel,torch.float16,1,128,7168,256,8,0,0
f8_w8a8_channel,torch.float16,2,128,7168,256,8,0,0
f8_w8a8_channel,torch.float16,3,128,7168,256,8,0,0
f8_w8a8_channel,torch.float16,4,128,7168,256,8,0,0
f8_w8a8_channel,torch.float16,5,128,7168,256,8,0,0
f8_w8a8_channel,torch.float16,6,128,7168,256,8,0,0
f8_w8a8_channel,torch.float16,7,128,7168,256,8,0,0
f8_w8a8_channel,torch.float16,8,128,7168,256,8,0,0
f8_w8a8_channel,torch.float16,9,128,7168,256,8,0,0
f8_w8a8_channel,torch.float16,10,128,7168,256,8,0,0
f8_w8a8_channel,torch.float16,11,128,7168,256,8,0,0
f8_w8a8_channel,torch.float16,12,128,7168,256,8,0,0
f8_w8a8_channel,torch.float16,13,128,7168,256,8,0,0
f8_w8a8_channel,torch.float16,14,128,7168,256,8,0,0
f8_w8a8_channel,torch.float16,15,128,7168,256,8,0,0
f8_w8a8_channel,torch.float16,16,128,7168,256,8,0,0
f8_w8a8_channel,torch.float16,17,128,7168,256,8,0,0
f8_w8a8_channel,torch.float16,18,128,7168,256,8,0,0
f8_w8a8_channel,torch.float16,20,128,7168,256,8,0,0
f8_w8a8_channel,torch.float16,24,128,7168,256,8,0,0
f8_w8a8_channel,torch.float16,28,128,7168,256,8,0,0
f8_w8a8_channel,torch.float16,32,128,7168,256,8,0,0
f8_w8a8_channel,torch.float16,34,128,7168,256,8,0,0
f8_w8a8_channel,torch.float16,36,128,7168,256,8,0,0
f8_w8a8_channel,torch.float16,40,128,7168,256,8,0,0
f8_w8a8_channel,torch.float16,44,128,7168,256,8,0,0
f8_w8a8_channel,torch.float16,48,128,7168,256,8,0,0
f8_w8a8_channel,torch.float16,56,128,7168,256,8,0,0
f8_w8a8_channel,torch.float16,64,128,7168,256,8,0,0
f8_w8a8_channel,torch.float16,68,128,7168,256,8,0,0
f8_w8a8_channel,torch.float16,72,128,7168,256,8,0,0
f8_w8a8_channel,torch.float16,80,128,7168,256,8,0,0
f8_w8a8_channel,torch.float16,88,128,7168,256,8,0,0
f8_w8a8_channel,torch.float16,96,128,7168,256,8,0,0
f8_w8a8_channel,torch.float16,104,128,7168,256,8,0,0
f8_w8a8_channel,torch.float16,112,128,7168,256,8,0,0
f8_w8a8_channel,torch.float16,128,128,7168,256,8,0,0
f8_w8a8_channel,torch.float16,144,128,7168,256,8,0,0
f8_w8a8_channel,torch.float16,160,128,7168,256,8,0,0
f8_w8a8_channel,torch.float16,192,128,7168,256,8,0,0
f8_w8a8_channel,torch.float16,224,128,7168,256,8,0,0
f8_w8a8_channel,torch.float16,256,128,7168,256,8,0,0
f8_w8a8_channel,torch.float16,320,128,7168,256,8,0,0
f8_w8a8_channel,torch.float16,384,128,7168,256,8,0,0
f8_w8a8_channel,torch.float16,448,128,7168,256,8,0,0
f8_w8a8_channel,torch.float16,512,128,7168,256,8,0,0
f8_w8a8_channel,torch.float16,576,128,7168,256,8,0,0
f8_w8a8_channel,torch.float16,640,128,7168,256,8,0,0
f8_w8a8_channel,torch.float16,704,128,7168,256,8,0,0
f8_w8a8_channel,torch.float16,768,128,7168,256,8,0,0
f8_w8a8_channel,torch.float16,832,128,7168,256,8,0,0
f8_w8a8_channel,torch.float16,896,128,7168,256,8,0,0
f8_w8a8_channel,torch.float16,960,128,7168,256,8,0,0
f8_w8a8_channel,torch.float16,1024,128,7168,256,8,0,0
f8_w8a8_channel,torch.float16,1152,128,7168,256,8,0,0
f8_w8a8_channel,torch.float16,1280,128,7168,256,8,0,0
f8_w8a8_channel,torch.float16,1408,128,7168,256,8,0,0
f8_w8a8_channel,torch.float16,1536,128,7168,256,8,0,0
f8_w8a8_channel,torch.float16,1664,128,7168,256,8,0,0
f8_w8a8_channel,torch.float16,1792,128,7168,256,8,0,0
f8_w8a8_channel,torch.float16,1920,128,7168,256,8,0,0
f8_w8a8_channel,torch.float16,2048,128,7168,256,8,0,0
f8_w8a8_channel,torch.float16,2304,128,7168,256,8,0,0
f8_w8a8_channel,torch.float16,2560,128,7168,256,8,0,0
f8_w8a8_channel,torch.float16,2816,128,7168,256,8,0,0
f8_w8a8_channel,torch.float16,3072,128,7168,256,8,0,0
f8_w8a8_channel,torch.float16,3328,128,7168,256,8,0,0
f8_w8a8_channel,torch.float16,3584,128,7168,256,8,0,0
f8_w8a8_channel,torch.float16,3840,128,7168,256,8,0,0
f8_w8a8_channel,torch.float16,4096,128,7168,256,8,0,0
f8_w8a8_channel,torch.float16,4608,128,7168,256,8,0,0
f8_w8a8_channel,torch.float16,5120,128,7168,256,8,0,0
f8_w8a8_channel,torch.float16,5632,128,7168,256,8,0,0
f8_w8a8_channel,torch.float16,6144,128,7168,256,8,0,0
f8_w8a8_channel,torch.float16,6656,128,7168,256,8,0,0
f8_w8a8_channel,torch.float16,7168,128,7168,256,8,0,0
f8_w8a8_channel,torch.float16,7680,128,7168,256,8,0,0
f8_w8a8_channel,torch.float16,8192,128,7168,256,8,0,0
f8_w8a8_channel,torch.float16,10240,128,7168,256,8,0,0
f8_w8a8_channel,torch.float16,12288,128,7168,256,8,0,0
f8_w8a8_channel,torch.float16,14336,128,7168,256,8,0,0
f8_w8a8_channel,torch.float16,16384,128,7168,256,8,0,0
f8_w8a8_channel,torch.float16,17408,128,7168,256,8,0,0
f8_w8a8_channel,torch.float16,24576,128,7168,256,8,0,0
f8_w8a8_channel,torch.float16,32768,128,7168,256,8,0,0
f8_w8a8_channel,torch.float16,40960,128,7168,256,8,0,0
f8_w8a8_channel,torch.float16,49152,128,7168,256,8,0,0
f8_w8a8_channel,torch.float16,57344,128,7168,256,8,0,0
f8_w8a8_channel,torch.float16,65536,128,7168,256,8,0,0
f8_w8a8_channel,torch.float16,1,256,7168,256,8,0,0
f8_w8a8_channel,torch.float16,2,256,7168,256,8,0,0
f8_w8a8_channel,torch.float16,3,256,7168,256,8,0,0
f8_w8a8_channel,torch.float16,4,256,7168,256,8,0,0
f8_w8a8_channel,torch.float16,5,256,7168,256,8,0,0
f8_w8a8_channel,torch.float16,6,256,7168,256,8,0,0
f8_w8a8_channel,torch.float16,7,256,7168,256,8,0,0
f8_w8a8_channel,torch.float16,8,256,7168,256,8,0,0
f8_w8a8_channel,torch.float16,9,256,7168,256,8,0,0
f8_w8a8_channel,torch.float16,10,256,7168,256,8,0,0
f8_w8a8_channel,torch.float16,11,256,7168,256,8,0,0
f8_w8a8_channel,torch.float16,12,256,7168,256,8,0,0
f8_w8a8_channel,torch.float16,13,256,7168,256,8,0,0
f8_w8a8_channel,torch.float16,14,256,7168,256,8,0,0
f8_w8a8_channel,torch.float16,15,256,7168,256,8,0,0
f8_w8a8_channel,torch.float16,16,256,7168,256,8,0,0
f8_w8a8_channel,torch.float16,17,256,7168,256,8,0,0
f8_w8a8_channel,torch.float16,18,256,7168,256,8,0,0
f8_w8a8_channel,torch.float16,20,256,7168,256,8,0,0
f8_w8a8_channel,torch.float16,24,256,7168,256,8,0,0
f8_w8a8_channel,torch.float16,28,256,7168,256,8,0,0
f8_w8a8_channel,torch.float16,32,256,7168,256,8,0,0
f8_w8a8_channel,torch.float16,34,256,7168,256,8,0,0
f8_w8a8_channel,torch.float16,36,256,7168,256,8,0,0
f8_w8a8_channel,torch.float16,40,256,7168,256,8,0,0
f8_w8a8_channel,torch.float16,44,256,7168,256,8,0,0
f8_w8a8_channel,torch.float16,48,256,7168,256,8,0,0
f8_w8a8_channel,torch.float16,56,256,7168,256,8,0,0
f8_w8a8_channel,torch.float16,64,256,7168,256,8,0,0
f8_w8a8_channel,torch.float16,68,256,7168,256,8,0,0
f8_w8a8_channel,torch.float16,72,256,7168,256,8,0,0
f8_w8a8_channel,torch.float16,80,256,7168,256,8,0,0
f8_w8a8_channel,torch.float16,88,256,7168,256,8,0,0
f8_w8a8_channel,torch.float16,96,256,7168,256,8,0,0
f8_w8a8_channel,torch.float16,104,256,7168,256,8,0,0
f8_w8a8_channel,torch.float16,112,256,7168,256,8,0,0
f8_w8a8_channel,torch.float16,128,256,7168,256,8,0,0
f8_w8a8_channel,torch.float16,144,256,7168,256,8,0,0
f8_w8a8_channel,torch.float16,160,256,7168,256,8,0,0
f8_w8a8_channel,torch.float16,192,256,7168,256,8,0,0
f8_w8a8_channel,torch.float16,224,256,7168,256,8,0,0
f8_w8a8_channel,torch.float16,256,256,7168,256,8,0,0
f8_w8a8_channel,torch.float16,320,256,7168,256,8,0,0
f8_w8a8_channel,torch.float16,384,256,7168,256,8,0,0
f8_w8a8_channel,torch.float16,448,256,7168,256,8,0,0
f8_w8a8_channel,torch.float16,512,256,7168,256,8,0,0
f8_w8a8_channel,torch.float16,576,256,7168,256,8,0,0
f8_w8a8_channel,torch.float16,640,256,7168,256,8,0,0
f8_w8a8_channel,torch.float16,704,256,7168,256,8,0,0
f8_w8a8_channel,torch.float16,768,256,7168,256,8,0,0
f8_w8a8_channel,torch.float16,832,256,7168,256,8,0,0
f8_w8a8_channel,torch.float16,896,256,7168,256,8,0,0
f8_w8a8_channel,torch.float16,960,256,7168,256,8,0,0
f8_w8a8_channel,torch.float16,1024,256,7168,256,8,0,0
f8_w8a8_channel,torch.float16,1152,256,7168,256,8,0,0
f8_w8a8_channel,torch.float16,1280,256,7168,256,8,0,0
f8_w8a8_channel,torch.float16,1408,256,7168,256,8,0,0
f8_w8a8_channel,torch.float16,1536,256,7168,256,8,0,0
f8_w8a8_channel,torch.float16,1664,256,7168,256,8,0,0
f8_w8a8_channel,torch.float16,1792,256,7168,256,8,0,0
f8_w8a8_channel,torch.float16,1920,256,7168,256,8,0,0
f8_w8a8_channel,torch.float16,2048,256,7168,256,8,0,0
f8_w8a8_channel,torch.float16,2304,256,7168,256,8,0,0
f8_w8a8_channel,torch.float16,2560,256,7168,256,8,0,0
f8_w8a8_channel,torch.float16,2816,256,7168,256,8,0,0
f8_w8a8_channel,torch.float16,3072,256,7168,256,8,0,0
f8_w8a8_channel,torch.float16,3328,256,7168,256,8,0,0
f8_w8a8_channel,torch.float16,3584,256,7168,256,8,0,0
f8_w8a8_channel,torch.float16,3840,256,7168,256,8,0,0
f8_w8a8_channel,torch.float16,4096,256,7168,256,8,0,0
f8_w8a8_channel,torch.float16,4608,256,7168,256,8,0,0
f8_w8a8_channel,torch.float16,5120,256,7168,256,8,0,0
f8_w8a8_channel,torch.float16,5632,256,7168,256,8,0,0
f8_w8a8_channel,torch.float16,6144,256,7168,256,8,0,0
f8_w8a8_channel,torch.float16,6656,256,7168,256,8,0,0
f8_w8a8_channel,torch.float16,7168,256,7168,256,8,0,0
f8_w8a8_channel,torch.float16,7680,256,7168,256,8,0,0
f8_w8a8_channel,torch.float16,8192,256,7168,256,8,0,0
f8_w8a8_channel,torch.float16,10240,256,7168,256,8,0,0
f8_w8a8_channel,torch.float16,12288,256,7168,256,8,0,0
f8_w8a8_channel,torch.float16,14336,256,7168,256,8,0,0
f8_w8a8_channel,torch.float16,16384,256,7168,256,8,0,0
f8_w8a8_channel,torch.float16,17408,256,7168,256,8,0,0
f8_w8a8_channel,torch.float16,24576,256,7168,256,8,0,0
f8_w8a8_channel,torch.float16,32768,256,7168,256,8,0,0
f8_w8a8_channel,torch.float16,40960,256,7168,256,8,0,0
f8_w8a8_channel,torch.float16,49152,256,7168,256,8,0,0
f8_w8a8_channel,torch.float16,57344,256,7168,256,8,0,0
f8_w8a8_channel,torch.float16,65536,256,7168,256,8,0,0
\ No newline at end of file
quant_type,indtype,token,inter_dim,model_dim,expert,topk,q_size_n,q_size_k
f8_w8a8_block,torch.float16,1,128,7168,256,8,0,0
f8_w8a8_block,torch.float16,2,128,7168,256,8,0,0
f8_w8a8_block,torch.float16,3,128,7168,256,8,0,0
f8_w8a8_block,torch.float16,4,128,7168,256,8,0,0
f8_w8a8_block,torch.float16,5,128,7168,256,8,0,0
f8_w8a8_block,torch.float16,6,128,7168,256,8,0,0
f8_w8a8_block,torch.float16,7,128,7168,256,8,0,0
f8_w8a8_block,torch.float16,8,128,7168,256,8,0,0
f8_w8a8_block,torch.float16,9,128,7168,256,8,0,0
f8_w8a8_block,torch.float16,10,128,7168,256,8,0,0
f8_w8a8_block,torch.float16,11,128,7168,256,8,0,0
f8_w8a8_block,torch.float16,12,128,7168,256,8,0,0
f8_w8a8_block,torch.float16,13,128,7168,256,8,0,0
f8_w8a8_block,torch.float16,14,128,7168,256,8,0,0
f8_w8a8_block,torch.float16,15,128,7168,256,8,0,0
f8_w8a8_block,torch.float16,16,128,7168,256,8,0,0
f8_w8a8_block,torch.float16,17,128,7168,256,8,0,0
f8_w8a8_block,torch.float16,18,128,7168,256,8,0,0
f8_w8a8_block,torch.float16,20,128,7168,256,8,0,0
f8_w8a8_block,torch.float16,24,128,7168,256,8,0,0
f8_w8a8_block,torch.float16,28,128,7168,256,8,0,0
f8_w8a8_block,torch.float16,32,128,7168,256,8,0,0
f8_w8a8_block,torch.float16,34,128,7168,256,8,0,0
f8_w8a8_block,torch.float16,36,128,7168,256,8,0,0
f8_w8a8_block,torch.float16,40,128,7168,256,8,0,0
f8_w8a8_block,torch.float16,44,128,7168,256,8,0,0
f8_w8a8_block,torch.float16,48,128,7168,256,8,0,0
f8_w8a8_block,torch.float16,56,128,7168,256,8,0,0
f8_w8a8_block,torch.float16,64,128,7168,256,8,0,0
f8_w8a8_block,torch.float16,68,128,7168,256,8,0,0
f8_w8a8_block,torch.float16,72,128,7168,256,8,0,0
f8_w8a8_block,torch.float16,80,128,7168,256,8,0,0
f8_w8a8_block,torch.float16,88,128,7168,256,8,0,0
f8_w8a8_block,torch.float16,96,128,7168,256,8,0,0
f8_w8a8_block,torch.float16,104,128,7168,256,8,0,0
f8_w8a8_block,torch.float16,112,128,7168,256,8,0,0
f8_w8a8_block,torch.float16,128,128,7168,256,8,0,0
f8_w8a8_block,torch.float16,144,128,7168,256,8,0,0
f8_w8a8_block,torch.float16,160,128,7168,256,8,0,0
f8_w8a8_block,torch.float16,192,128,7168,256,8,0,0
f8_w8a8_block,torch.float16,224,128,7168,256,8,0,0
f8_w8a8_block,torch.float16,256,128,7168,256,8,0,0
f8_w8a8_block,torch.float16,320,128,7168,256,8,0,0
f8_w8a8_block,torch.float16,384,128,7168,256,8,0,0
f8_w8a8_block,torch.float16,448,128,7168,256,8,0,0
f8_w8a8_block,torch.float16,512,128,7168,256,8,0,0
f8_w8a8_block,torch.float16,576,128,7168,256,8,0,0
f8_w8a8_block,torch.float16,640,128,7168,256,8,0,0
f8_w8a8_block,torch.float16,704,128,7168,256,8,0,0
f8_w8a8_block,torch.float16,768,128,7168,256,8,0,0
f8_w8a8_block,torch.float16,832,128,7168,256,8,0,0
f8_w8a8_block,torch.float16,896,128,7168,256,8,0,0
f8_w8a8_block,torch.float16,960,128,7168,256,8,0,0
f8_w8a8_block,torch.float16,1024,128,7168,256,8,0,0
f8_w8a8_block,torch.float16,1152,128,7168,256,8,0,0
f8_w8a8_block,torch.float16,1280,128,7168,256,8,0,0
f8_w8a8_block,torch.float16,1408,128,7168,256,8,0,0
f8_w8a8_block,torch.float16,1536,128,7168,256,8,0,0
f8_w8a8_block,torch.float16,1664,128,7168,256,8,0,0
f8_w8a8_block,torch.float16,1792,128,7168,256,8,0,0
f8_w8a8_block,torch.float16,1920,128,7168,256,8,0,0
f8_w8a8_block,torch.float16,2048,128,7168,256,8,0,0
f8_w8a8_block,torch.float16,2304,128,7168,256,8,0,0
f8_w8a8_block,torch.float16,2560,128,7168,256,8,0,0
f8_w8a8_block,torch.float16,2816,128,7168,256,8,0,0
f8_w8a8_block,torch.float16,3072,128,7168,256,8,0,0
f8_w8a8_block,torch.float16,3328,128,7168,256,8,0,0
f8_w8a8_block,torch.float16,3584,128,7168,256,8,0,0
f8_w8a8_block,torch.float16,3840,128,7168,256,8,0,0
f8_w8a8_block,torch.float16,4096,128,7168,256,8,0,0
f8_w8a8_block,torch.float16,4608,128,7168,256,8,0,0
f8_w8a8_block,torch.float16,5120,128,7168,256,8,0,0
f8_w8a8_block,torch.float16,5632,128,7168,256,8,0,0
f8_w8a8_block,torch.float16,6144,128,7168,256,8,0,0
f8_w8a8_block,torch.float16,6656,128,7168,256,8,0,0
f8_w8a8_block,torch.float16,7168,128,7168,256,8,0,0
f8_w8a8_block,torch.float16,7680,128,7168,256,8,0,0
f8_w8a8_block,torch.float16,8192,128,7168,256,8,0,0
f8_w8a8_block,torch.float16,10240,128,7168,256,8,0,0
f8_w8a8_block,torch.float16,12288,128,7168,256,8,0,0
f8_w8a8_block,torch.float16,14336,128,7168,256,8,0,0
f8_w8a8_block,torch.float16,16384,128,7168,256,8,0,0
f8_w8a8_block,torch.float16,17408,128,7168,256,8,0,0
f8_w8a8_block,torch.float16,24576,128,7168,256,8,0,0
f8_w8a8_block,torch.float16,32768,128,7168,256,8,0,0
f8_w8a8_block,torch.float16,40960,128,7168,256,8,0,0
f8_w8a8_block,torch.float16,49152,128,7168,256,8,0,0
f8_w8a8_block,torch.float16,57344,128,7168,256,8,0,0
f8_w8a8_block,torch.float16,65536,128,7168,256,8,0,0
f8_w8a8_block,torch.float16,1,256,7168,256,8,0,0
f8_w8a8_block,torch.float16,2,256,7168,256,8,0,0
f8_w8a8_block,torch.float16,3,256,7168,256,8,0,0
f8_w8a8_block,torch.float16,4,256,7168,256,8,0,0
f8_w8a8_block,torch.float16,5,256,7168,256,8,0,0
f8_w8a8_block,torch.float16,6,256,7168,256,8,0,0
f8_w8a8_block,torch.float16,7,256,7168,256,8,0,0
f8_w8a8_block,torch.float16,8,256,7168,256,8,0,0
f8_w8a8_block,torch.float16,9,256,7168,256,8,0,0
f8_w8a8_block,torch.float16,10,256,7168,256,8,0,0
f8_w8a8_block,torch.float16,11,256,7168,256,8,0,0
f8_w8a8_block,torch.float16,12,256,7168,256,8,0,0
f8_w8a8_block,torch.float16,13,256,7168,256,8,0,0
f8_w8a8_block,torch.float16,14,256,7168,256,8,0,0
f8_w8a8_block,torch.float16,15,256,7168,256,8,0,0
f8_w8a8_block,torch.float16,16,256,7168,256,8,0,0
f8_w8a8_block,torch.float16,17,256,7168,256,8,0,0
f8_w8a8_block,torch.float16,18,256,7168,256,8,0,0
f8_w8a8_block,torch.float16,20,256,7168,256,8,0,0
f8_w8a8_block,torch.float16,24,256,7168,256,8,0,0
f8_w8a8_block,torch.float16,28,256,7168,256,8,0,0
f8_w8a8_block,torch.float16,32,256,7168,256,8,0,0
f8_w8a8_block,torch.float16,34,256,7168,256,8,0,0
f8_w8a8_block,torch.float16,36,256,7168,256,8,0,0
f8_w8a8_block,torch.float16,40,256,7168,256,8,0,0
f8_w8a8_block,torch.float16,44,256,7168,256,8,0,0
f8_w8a8_block,torch.float16,48,256,7168,256,8,0,0
f8_w8a8_block,torch.float16,56,256,7168,256,8,0,0
f8_w8a8_block,torch.float16,64,256,7168,256,8,0,0
f8_w8a8_block,torch.float16,68,256,7168,256,8,0,0
f8_w8a8_block,torch.float16,72,256,7168,256,8,0,0
f8_w8a8_block,torch.float16,80,256,7168,256,8,0,0
f8_w8a8_block,torch.float16,88,256,7168,256,8,0,0
f8_w8a8_block,torch.float16,96,256,7168,256,8,0,0
f8_w8a8_block,torch.float16,104,256,7168,256,8,0,0
f8_w8a8_block,torch.float16,112,256,7168,256,8,0,0
f8_w8a8_block,torch.float16,128,256,7168,256,8,0,0
f8_w8a8_block,torch.float16,144,256,7168,256,8,0,0
f8_w8a8_block,torch.float16,160,256,7168,256,8,0,0
f8_w8a8_block,torch.float16,192,256,7168,256,8,0,0
f8_w8a8_block,torch.float16,224,256,7168,256,8,0,0
f8_w8a8_block,torch.float16,256,256,7168,256,8,0,0
f8_w8a8_block,torch.float16,320,256,7168,256,8,0,0
f8_w8a8_block,torch.float16,384,256,7168,256,8,0,0
f8_w8a8_block,torch.float16,448,256,7168,256,8,0,0
f8_w8a8_block,torch.float16,512,256,7168,256,8,0,0
f8_w8a8_block,torch.float16,576,256,7168,256,8,0,0
f8_w8a8_block,torch.float16,640,256,7168,256,8,0,0
f8_w8a8_block,torch.float16,704,256,7168,256,8,0,0
f8_w8a8_block,torch.float16,768,256,7168,256,8,0,0
f8_w8a8_block,torch.float16,832,256,7168,256,8,0,0
f8_w8a8_block,torch.float16,896,256,7168,256,8,0,0
f8_w8a8_block,torch.float16,960,256,7168,256,8,0,0
f8_w8a8_block,torch.float16,1024,256,7168,256,8,0,0
f8_w8a8_block,torch.float16,1152,256,7168,256,8,0,0
f8_w8a8_block,torch.float16,1280,256,7168,256,8,0,0
f8_w8a8_block,torch.float16,1408,256,7168,256,8,0,0
f8_w8a8_block,torch.float16,1536,256,7168,256,8,0,0
f8_w8a8_block,torch.float16,1664,256,7168,256,8,0,0
f8_w8a8_block,torch.float16,1792,256,7168,256,8,0,0
f8_w8a8_block,torch.float16,1920,256,7168,256,8,0,0
f8_w8a8_block,torch.float16,2048,256,7168,256,8,0,0
f8_w8a8_block,torch.float16,2304,256,7168,256,8,0,0
f8_w8a8_block,torch.float16,2560,256,7168,256,8,0,0
f8_w8a8_block,torch.float16,2816,256,7168,256,8,0,0
f8_w8a8_block,torch.float16,3072,256,7168,256,8,0,0
f8_w8a8_block,torch.float16,3328,256,7168,256,8,0,0
f8_w8a8_block,torch.float16,3584,256,7168,256,8,0,0
f8_w8a8_block,torch.float16,3840,256,7168,256,8,0,0
f8_w8a8_block,torch.float16,4096,256,7168,256,8,0,0
f8_w8a8_block,torch.float16,4608,256,7168,256,8,0,0
f8_w8a8_block,torch.float16,5120,256,7168,256,8,0,0
f8_w8a8_block,torch.float16,5632,256,7168,256,8,0,0
f8_w8a8_block,torch.float16,6144,256,7168,256,8,0,0
f8_w8a8_block,torch.float16,6656,256,7168,256,8,0,0
f8_w8a8_block,torch.float16,7168,256,7168,256,8,0,0
f8_w8a8_block,torch.float16,7680,256,7168,256,8,0,0
f8_w8a8_block,torch.float16,8192,256,7168,256,8,0,0
f8_w8a8_block,torch.float16,10240,256,7168,256,8,0,0
f8_w8a8_block,torch.float16,12288,256,7168,256,8,0,0
f8_w8a8_block,torch.float16,14336,256,7168,256,8,0,0
f8_w8a8_block,torch.float16,16384,256,7168,256,8,0,0
f8_w8a8_block,torch.float16,17408,256,7168,256,8,0,0
f8_w8a8_block,torch.float16,24576,256,7168,256,8,0,0
f8_w8a8_block,torch.float16,32768,256,7168,256,8,0,0
f8_w8a8_block,torch.float16,40960,256,7168,256,8,0,0
f8_w8a8_block,torch.float16,49152,256,7168,256,8,0,0
f8_w8a8_block,torch.float16,57344,256,7168,256,8,0,0
f8_w8a8_block,torch.float16,65536,256,7168,256,8,0,0
\ No newline at end of file
quant_type,indtype,token,inter_dim,model_dim,expert,topk,q_size_n,q_size_k
no_quant,torch.float16,1,256,8192,256,4,0,0
no_quant,torch.float16,8,256,8192,256,4,0,0
no_quant,torch.float16,16,256,8192,256,4,0,0
no_quant,torch.float16,24,256,8192,256,4,0,0
no_quant,torch.float16,32,256,8192,256,4,0,0
no_quant,torch.float16,48,256,8192,256,4,0,0
no_quant,torch.float16,64,256,8192,256,4,0,0
no_quant,torch.float16,96,256,8192,256,4,0,0
no_quant,torch.float16,128,256,8192,256,4,0,0
no_quant,torch.float16,256,256,8192,256,4,0,0
no_quant,torch.float16,512,256,8192,256,4,0,0
no_quant,torch.float16,1024,256,8192,256,4,0,0
no_quant,torch.float16,2048,256,8192,256,4,0,0
no_quant,torch.float16,4096,256,8192,256,4,0,0
no_quant,torch.float16,8192,256,8192,256,4,0,0
no_quant,torch.float16,1,256,7168,256,8,0,0
no_quant,torch.float16,8,256,7168,256,8,0,0
no_quant,torch.float16,16,256,7168,256,8,0,0
no_quant,torch.float16,24,256,7168,256,8,0,0
no_quant,torch.float16,32,256,7168,256,8,0,0
no_quant,torch.float16,48,256,7168,256,8,0,0
no_quant,torch.float16,64,256,7168,256,8,0,0
no_quant,torch.float16,96,256,7168,256,8,0,0
no_quant,torch.float16,128,256,7168,256,8,0,0
no_quant,torch.float16,256,256,7168,256,8,0,0
no_quant,torch.float16,512,256,7168,256,8,0,0
no_quant,torch.float16,1024,256,7168,256,8,0,0
no_quant,torch.float16,2048,256,7168,256,8,0,0
no_quant,torch.float16,4096,256,7168,256,8,0,0
no_quant,torch.float16,8192,256,7168,256,8,0,0
Markdown is supported
0% or .
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or to comment