optKernelManifest.json 1.46 KB
Newer Older
Xiaowei.zhang's avatar
Xiaowei.zhang committed
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
{
  "w4a16": {
    "NN": {
      "kernel_name": "Cijk_Ailk_Bljk_HHS_BH_UserArgs_MT128x32x32_SN_K1_PGR6_SB1_TT8_2_WG16_16_2",
      "co_file": "Cijk_Ailk_Bljk_HHS_BH_UserArgs_MT128x32x32_SN_K1_PGR6_SB1_TT8_2_stru_debug.co",
      "Kconfigs": {
        "mt0": 128,
        "mt1": 32,
        "numThreads": 512,
        "wgm": 1
      }
    },
    "TN": {
      "kernel_name": "Cijk_Alik_Bljk_HHS_BH_UserArgs_MT32x32x128_SN_K1_PGR4_TT2_2_WG16_16_2",
      "co_file": "Cijk_Alik_Bljk_HHS_BH_UserArgs_MT32x32x128_SN_K1_PGR4_TT2_2_awqGemm.co",
      "Kconfigs": {
        "mt0": 32,
        "mt1": 32,
        "numThreads": 512,
        "wgm": 1
      }
    }
  },
  "fused_w4a16": {
    "TN": {
      "kernel_name": "Cijk_Alik_Bljk_HHS_BH_UserArgs_MT32x32x128_SN_K1_PGR4_TT2_2_WG16_16_2",
      "co_file": "Cijk_Alik_Bljk_HHS_BH_UserArgs_MT32x32x128_SN_K1_PGR4_TT2_2_vllm_awqGemm_fused.co",
      "Kconfigs": {
        "mt0": 32,
        "mt1": 32,
        "numThreads": 512,
        "wgm": 1
      }
    },
    "modify_to_TN_if_needed": {
      "kernel_name": "Cijk_Alik_Bljk_HHS_BH_UserArgs_MT32x1024x16_SN_K1_TT2_64_WG16_16_3_WGM1",
      "co_file": "Cijk_Alik_Bljk_HHS_BH_UserArgs_MT32x1024x16_SN_K1_TT2_16_WG16_16_3_WGM1_vllm_awqGemm.co",
      "Kconfigs": {
        "mt0": 32,
        "mt1": 1024,
        "numThreads": 768,
        "wgm": 1
      }
    },
    "NN": {
      "kernel_name": "Cijk_Ailk_Bljk_HHS_BH_UserArgs_MT64x32x32_SN_K1_PGR6_SB1_TT2_2_WG16_16_2",
      "co_file": "Cijk_Ailk_Bljk_HHS_BH_UserArgs_MT64x32x32_SN_K1_PGR6_SB1_TT4_2_w4a16.co",
      "Kconfigs": {
        "mt0": 64,
        "mt1": 32,
        "numThreads": 512,
        "wgm": 1
      }
    }
  }
}