group_gemm.json 338 Bytes
Newer Older
sunzhq2's avatar
init  
sunzhq2 committed
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
{
  "operator": "group_gemm",
  "iterations": 100,
  "input_shape_groups": {
    "gemm_group": [
      1, 2, 3, 4, 5, 6, 7, 8
    ],
    "batch": [
      1, 2, 4, 8, 16, 32, 64, 128,
      256, 512, 1024, 2048, 4096, 8192
    ],
    "KN": [
      [32, 16384],
      [16384, 32],
      [16384, 16384]
    ]
  },
  "dtype": ["float32", "bfloat16", "float16", "int8"]
}