hipblaslt.config 4.42 KB
Newer Older
sunzhq2's avatar
sunzhq2 committed
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
Git Version: 4bd05bb5-dirty
    transA,transB,grouped_gemm,batch_count,m,n,k,alpha,lda,stride_a,beta,ldb,stride_b,ldc,stride_c,ldd,stride_d,a_type,b_type,c_type,d_type,compute_type,scaleA,scaleB,scaleC,scaleD,amaxD,activation_type,bias_vector,bias_type,hipblaslt-Gflops,us,solution_index,gcnArchName,CUs
    T,N,0,1,128,128,128,1,128,16384,0,128,16384,128,16384,128,16384,i8_r,i8_r,i32_r,f16_r,i32_r,2,2,0,0,0,,1,f16_r,624.226,6.71921,4452,gfx936:sramecc+:xnack-,80
    transA,transB,grouped_gemm,batch_count,m,n,k,alpha,lda,stride_a,beta,ldb,stride_b,ldc,stride_c,ldd,stride_d,a_type,b_type,c_type,d_type,compute_type,scaleA,scaleB,scaleC,scaleD,amaxD,activation_type,bias_vector,bias_type,hipblaslt-Gflops,us,solution_index,gcnArchName,CUs
    T,N,0,1,256,256,256,1,256,65536,0,256,65536,256,65536,256,65536,i8_r,i8_r,i32_r,f16_r,i32_r,2,2,0,0,0,,1,f16_r,4403.76,7.6195,4452,gfx936:sramecc+:xnack-,80
    transA,transB,grouped_gemm,batch_count,m,n,k,alpha,lda,stride_a,beta,ldb,stride_b,ldc,stride_c,ldd,stride_d,a_type,b_type,c_type,d_type,compute_type,scaleA,scaleB,scaleC,scaleD,amaxD,activation_type,bias_vector,bias_type,hipblaslt-Gflops,us,solution_index,gcnArchName,CUs
    T,N,0,1,512,512,512,1,512,262144,0,512,262144,512,262144,512,262144,i8_r,i8_r,i32_r,f16_r,i32_r,2,2,0,0,0,,1,f16_r,26791.3,10.0195,4500,gfx936:sramecc+:xnack-,80
    transA,transB,grouped_gemm,batch_count,m,n,k,alpha,lda,stride_a,beta,ldb,stride_b,ldc,stride_c,ldd,stride_d,a_type,b_type,c_type,d_type,compute_type,scaleA,scaleB,scaleC,scaleD,amaxD,activation_type,bias_vector,bias_type,hipblaslt-Gflops,us,solution_index,gcnArchName,CUs
    T,N,0,1,1024,1024,1024,1,1024,1048576,0,1024,1048576,1024,1048576,1024,1048576,i8_r,i8_r,i32_r,f16_r,i32_r,2,2,0,0,0,,1,f16_r,108893,19.721,4456,gfx936:sramecc+:xnack-,80
    transA,transB,grouped_gemm,batch_count,m,n,k,alpha,lda,stride_a,beta,ldb,stride_b,ldc,stride_c,ldd,stride_d,a_type,b_type,c_type,d_type,compute_type,scaleA,scaleB,scaleC,scaleD,amaxD,activation_type,bias_vector,bias_type,hipblaslt-Gflops,us,solution_index,gcnArchName,CUs
    T,N,0,1,2048,2048,2048,1,2048,4194304,0,2048,4194304,2048,4194304,2048,4194304,i8_r,i8_r,i32_r,f16_r,i32_r,2,2,0,0,0,,1,f16_r,315119,54.5186,4477,gfx936:sramecc+:xnack-,80
    transA,transB,grouped_gemm,batch_count,m,n,k,alpha,lda,stride_a,beta,ldb,stride_b,ldc,stride_c,ldd,stride_d,a_type,b_type,c_type,d_type,compute_type,scaleA,scaleB,scaleC,scaleD,amaxD,activation_type,bias_vector,bias_type,hipblaslt-Gflops,us,solution_index,gcnArchName,CUs
    T,N,0,1,4096,4096,4096,1,4096,16777216,0,4096,16777216,4096,16777216,4096,16777216,i8_r,i8_r,i32_r,f16_r,i32_r,2,2,0,0,0,,1,f16_r,475043,289.319,4478,gfx936:sramecc+:xnack-,80
    transA,transB,grouped_gemm,batch_count,m,n,k,alpha,lda,stride_a,beta,ldb,stride_b,ldc,stride_c,ldd,stride_d,a_type,b_type,c_type,d_type,compute_type,scaleA,scaleB,scaleC,scaleD,amaxD,activation_type,bias_vector,bias_type,hipblaslt-Gflops,us,solution_index,gcnArchName,CUs
    T,N,0,1,8192,8192,8192,1,8192,67108864,0,8192,67108864,8192,67108864,8192,67108864,i8_r,i8_r,i32_r,f16_r,i32_r,2,2,0,0,0,,1,f16_r,674829,1629.32,4479,gfx936:sramecc+:xnack-,80
    transA,transB,grouped_gemm,batch_count,m,n,k,alpha,lda,stride_a,beta,ldb,stride_b,ldc,stride_c,ldd,stride_d,a_type,b_type,c_type,d_type,compute_type,scaleA,scaleB,scaleC,scaleD,amaxD,activation_type,bias_vector,bias_type,hipblaslt-Gflops,us,solution_index,gcnArchName,CUs
    T,N,0,1,4098,4098,4098,1,4098,16793604,0,4098,16793604,4098,16793604,4098,16793604,i8_r,i8_r,i32_r,f16_r,i32_r,2,2,0,0,0,,1,f16_r,209556,656.819,4478,gfx936:sramecc+:xnack-,80
    transA,transB,grouped_gemm,batch_count,m,n,k,alpha,lda,stride_a,beta,ldb,stride_b,ldc,stride_c,ldd,stride_d,a_type,b_type,c_type,d_type,compute_type,scaleA,scaleB,scaleC,scaleD,amaxD,activation_type,bias_vector,bias_type,hipblaslt-Gflops,us,solution_index,gcnArchName,CUs
    T,N,0,1,8190,8190,8190,1,8190,67076100,0,8190,67076100,8190,67076100,8190,67076100,i8_r,i8_r,i32_r,f16_r,i32_r,2,2,0,0,0,,1,f16_r,266242,4126.72,4479,gfx936:sramecc+:xnack-,80
    transA,transB,grouped_gemm,batch_count,m,n,k,alpha,lda,stride_a,beta,ldb,stride_b,ldc,stride_c,ldd,stride_d,a_type,b_type,c_type,d_type,compute_type,scaleA,scaleB,scaleC,scaleD,amaxD,activation_type,bias_vector,bias_type,hipblaslt-Gflops,us,solution_index,gcnArchName,CUs
    T,N,0,1,8192,8192,768,1,8192,67108864,0,768,6291456,8192,67108864,8192,67108864,i8_r,i8_r,i32_r,f16_r,i32_r,2,2,0,0,0,,1,f16_r,277453,371.519,4484,gfx936:sramecc+:xnack-,80