# Copyright (c) Microsoft Corporation.
# Licensed under the MIT License.

"""A module containing all the micro-benchmarks."""

from superbench.benchmarks.micro_benchmarks.micro_base import MicroBenchmark, MicroBenchmarkWithInvoke
from superbench.benchmarks.micro_benchmarks.gemm_flops_performance_base import GemmFlopsBenchmark
from superbench.benchmarks.micro_benchmarks.memory_bw_performance_base import MemBwBenchmark
from superbench.benchmarks.micro_benchmarks.gpu_hpcg_performance_base import GpuHpcgBenchmark
from superbench.benchmarks.micro_benchmarks.gpu_hpl_performance_base import GpuHplBenchmark

from superbench.benchmarks.micro_benchmarks.computation_communication_overlap import ComputationCommunicationOverlap
from superbench.benchmarks.micro_benchmarks.cublas_function import CublasBenchmark
from superbench.benchmarks.micro_benchmarks.blaslt_function_base import BlasLtBaseBenchmark
from superbench.benchmarks.micro_benchmarks.cublaslt_function import CublasLtBenchmark
from superbench.benchmarks.micro_benchmarks.rocm_hipblaslt_function import RocmHipBlasLtBenchmark
from superbench.benchmarks.micro_benchmarks.dtk_hipblaslt_function import DtkHipBlasLtBenchmark
from superbench.benchmarks.micro_benchmarks.dtk_memory_bw_performance import DtkMemBwBenchmark
from superbench.benchmarks.micro_benchmarks.dtk_gemm_flops_performance import DtkGemmFlopsBenchmark
from superbench.benchmarks.micro_benchmarks.dtk_hpcg_performance import DtkHpcgBenchmark
from superbench.benchmarks.micro_benchmarks.dtk_hpl_performance import DtkHplBenchmark
from superbench.benchmarks.micro_benchmarks.dtk_hpl_mxp_performance import DtkHplMxpBenchmark
from superbench.benchmarks.micro_benchmarks.cuda_gemm_flops_performance import CudaGemmFlopsBenchmark
from superbench.benchmarks.micro_benchmarks.cuda_memory_bw_performance import CudaMemBwBenchmark
from superbench.benchmarks.micro_benchmarks.cuda_nccl_bw_performance import CudaNcclBwBenchmark
from superbench.benchmarks.micro_benchmarks.cudnn_function import CudnnBenchmark
from superbench.benchmarks.micro_benchmarks.disk_performance import DiskBenchmark
from superbench.benchmarks.micro_benchmarks.dist_inference import DistInference
from superbench.benchmarks.micro_benchmarks.cpu_memory_bw_latency_performance import CpuMemBwLatencyBenchmark
from superbench.benchmarks.micro_benchmarks.cpu_stream_performance import CpuStreamBenchmark
from superbench.benchmarks.micro_benchmarks.cpu_hpl_performance import CpuHplBenchmark
from superbench.benchmarks.micro_benchmarks.gpcnet_performance import GPCNetBenchmark
from superbench.benchmarks.micro_benchmarks.gpu_copy_bw_performance import GpuCopyBwBenchmark
from superbench.benchmarks.micro_benchmarks.gpu_stream import GpuStreamBenchmark
from superbench.benchmarks.micro_benchmarks.gpu_burn_test import GpuBurnBenchmark
from superbench.benchmarks.micro_benchmarks.ib_loopback_performance import IBLoopbackBenchmark
from superbench.benchmarks.micro_benchmarks.ib_validation_performance import IBBenchmark
from superbench.benchmarks.micro_benchmarks.kernel_launch_overhead import KernelLaunch
from superbench.benchmarks.micro_benchmarks.ort_inference_performance import ORTInferenceBenchmark
from superbench.benchmarks.micro_benchmarks.rocm_gemm_flops_performance import RocmGemmFlopsBenchmark
from superbench.benchmarks.micro_benchmarks.rocm_memory_bw_performance import RocmMemBwBenchmark
from superbench.benchmarks.micro_benchmarks.sharding_matmul import ShardingMatmul
from superbench.benchmarks.micro_benchmarks.tcp_connectivity import TCPConnectivityBenchmark
from superbench.benchmarks.micro_benchmarks.tensorrt_inference_performance import TensorRTInferenceBenchmark
from superbench.benchmarks.micro_benchmarks.directx_gpu_encoding_latency import DirectXGPUEncodingLatency
from superbench.benchmarks.micro_benchmarks.directx_gpu_copy_performance import DirectXGPUCopyBw
from superbench.benchmarks.micro_benchmarks.directx_mem_bw_performance import DirectXGPUMemBw
from superbench.benchmarks.micro_benchmarks.directx_gemm_flops_performance import DirectXGPUCoreFlops
from superbench.benchmarks.micro_benchmarks.nvbandwidth import NvBandwidthBenchmark

# Names exported by a star-import of this package. Every entry is the name of
# a class bound by one of the `from ... import ...` statements in this file;
# the entries and their order are kept exactly as in the original list.
__all__ = [
    'BlasLtBaseBenchmark',
    'ComputationCommunicationOverlap',
    'CpuMemBwLatencyBenchmark',
    'CpuHplBenchmark',
    'CpuStreamBenchmark',
    'CublasBenchmark',
    'CublasLtBenchmark',
    'CudaGemmFlopsBenchmark',
    'CudaMemBwBenchmark',
    'CudaNcclBwBenchmark',
    'CudnnBenchmark',
    'DiskBenchmark',
    'DistInference',
    'DtkGemmFlopsBenchmark',
    'DtkHplBenchmark',
    'DtkHplMxpBenchmark',
    'RocmHipBlasLtBenchmark',
    'DtkHipBlasLtBenchmark',
    'DtkMemBwBenchmark',
    'GPCNetBenchmark',
    'GemmFlopsBenchmark',
    'GpuBurnBenchmark',
    'GpuCopyBwBenchmark',
    'GpuHpcgBenchmark',
    'GpuHplBenchmark',
    'GpuStreamBenchmark',
    'IBBenchmark',
    'IBLoopbackBenchmark',
    'KernelLaunch',
    'MemBwBenchmark',
    'MicroBenchmark',
    'MicroBenchmarkWithInvoke',
    'ORTInferenceBenchmark',
    'RocmGemmFlopsBenchmark',
    'RocmMemBwBenchmark',
    'ShardingMatmul',
    'TCPConnectivityBenchmark',
    'TensorRTInferenceBenchmark',
    'DirectXGPUEncodingLatency',
    'DirectXGPUCopyBw',
    'DirectXGPUMemBw',
    'DirectXGPUCoreFlops',
    'DtkHpcgBenchmark',
    'NvBandwidthBenchmark',
]