Unverified commit 1d09b111, authored by Hongtao Zhang and committed by GitHub
Browse files

Microbenchmark - Add arch support for 10.0 in gemm-flops (#680)

**Description**
Add support for compute capability 10.0 to the gemm-flops microbenchmark.
parent 424f7b5b
...@@ -24,7 +24,8 @@ def __init__(self, name, parameters=''): ...@@ -24,7 +24,8 @@ def __init__(self, name, parameters=''):
self._bin_name = 'cutlass_profiler' self._bin_name = 'cutlass_profiler'
# TODO - To support more architecutres, currently only support compute capability = 7.0, 7.5, 8.0, 8.6 # TODO - To support more architectures
# Currently only support compute capability = 7.0, 7.5, 8.0, 8.6, 8.9, 9.0, 10.0
self.__kernel_map = { self.__kernel_map = {
7.0: { 7.0: {
'fp64': 'cutlass_simt_dgemm_128x128_8x2_*', 'fp64': 'cutlass_simt_dgemm_128x128_8x2_*',
...@@ -51,6 +52,7 @@ def __init__(self, name, parameters=''): ...@@ -51,6 +52,7 @@ def __init__(self, name, parameters=''):
self.__kernel_map[8.9] = {k: self.__kernel_map[8.0][k] for k in self.__kernel_map[8.0] if 'fp64' not in k} self.__kernel_map[8.9] = {k: self.__kernel_map[8.0][k] for k in self.__kernel_map[8.0] if 'fp64' not in k}
# Skip INT4 for Hopper due to no native CUDA/Tensor Cores # Skip INT4 for Hopper due to no native CUDA/Tensor Cores
self.__kernel_map[9.0] = {k: self.__kernel_map[8.0][k] for k in self.__kernel_map[8.0] if 'int4_tc' not in k} self.__kernel_map[9.0] = {k: self.__kernel_map[8.0][k] for k in self.__kernel_map[8.0] if 'int4_tc' not in k}
self.__kernel_map[10.0] = {k: self.__kernel_map[8.0][k] for k in self.__kernel_map[8.0] if 'int4_tc' not in k}
self.__parse_logline = [ self.__parse_logline = [
'gemm,cutlass_simt_dgemm_128x128_8x2', 'gemm,cutlass_simt_sgemm_128x128_8x2', 'gemm,cutlass_simt_dgemm_128x128_8x2', 'gemm,cutlass_simt_sgemm_128x128_8x2',
'gemm,cutlass_simt_hgemm_256x128_8x2', 'gemm,cutlass_tensorop_d884gemm_128x128_16x3', 'gemm,cutlass_simt_hgemm_256x128_8x2', 'gemm,cutlass_tensorop_d884gemm_128x128_16x3',
......
Markdown is supported
0% or .
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or sign in to comment