# Copyright (c) Microsoft Corporation.
# Licensed under the MIT License.

"""A module containing all the micro-benchmarks."""

# NOTE(review): the three modules below are imported ahead of the others and
# look like shared base classes (going by their names) -- keep this ordering
# unless the dependency between modules has been confirmed.
from superbench.benchmarks.micro_benchmarks.micro_base import MicroBenchmark, MicroBenchmarkWithInvoke
from superbench.benchmarks.micro_benchmarks.gemm_flops_performance_base import GemmFlopsBenchmark
from superbench.benchmarks.micro_benchmarks.memory_bw_performance_base import MemBwBenchmark

from superbench.benchmarks.micro_benchmarks.computation_communication_overlap import ComputationCommunicationOverlap
from superbench.benchmarks.micro_benchmarks.cublas_function import CublasBenchmark
from superbench.benchmarks.micro_benchmarks.cublaslt_function import CublasLtBenchmark
from superbench.benchmarks.micro_benchmarks.cuda_gemm_flops_performance import CudaGemmFlopsBenchmark
from superbench.benchmarks.micro_benchmarks.cuda_memory_bw_performance import CudaMemBwBenchmark
from superbench.benchmarks.micro_benchmarks.cuda_nccl_bw_performance import CudaNcclBwBenchmark
from superbench.benchmarks.micro_benchmarks.cudnn_function import CudnnBenchmark
from superbench.benchmarks.micro_benchmarks.disk_performance import DiskBenchmark
from superbench.benchmarks.micro_benchmarks.cpu_memory_bw_latency_performance import CpuMemBwLatencyBenchmark
from superbench.benchmarks.micro_benchmarks.cpu_stream_performance import CpuStreamBenchmark
from superbench.benchmarks.micro_benchmarks.cpu_hpl_performance import CpuHplBenchmark
from superbench.benchmarks.micro_benchmarks.gpcnet_performance import GPCNetBenchmark
from superbench.benchmarks.micro_benchmarks.gpu_copy_bw_performance import GpuCopyBwBenchmark
from superbench.benchmarks.micro_benchmarks.gpu_burn_test import GpuBurnBenchmark
from superbench.benchmarks.micro_benchmarks.ib_loopback_performance import IBLoopbackBenchmark
from superbench.benchmarks.micro_benchmarks.ib_validation_performance import IBBenchmark
from superbench.benchmarks.micro_benchmarks.kernel_launch_overhead import KernelLaunch
from superbench.benchmarks.micro_benchmarks.ort_inference_performance import ORTInferenceBenchmark
from superbench.benchmarks.micro_benchmarks.rocm_gemm_flops_performance import RocmGemmFlopsBenchmark
from superbench.benchmarks.micro_benchmarks.rocm_memory_bw_performance import RocmMemBwBenchmark
from superbench.benchmarks.micro_benchmarks.sharding_matmul import ShardingMatmul
from superbench.benchmarks.micro_benchmarks.tcp_connectivity import TCPConnectivityBenchmark
from superbench.benchmarks.micro_benchmarks.tensorrt_inference_performance import TensorRTInferenceBenchmark

# Names re-exported by this package; every entry corresponds to a class
# imported above.
__all__ = [
    'ComputationCommunicationOverlap',
    'CpuMemBwLatencyBenchmark',
    'CpuHplBenchmark',
    'CpuStreamBenchmark',
    'CublasBenchmark',
    'CublasLtBenchmark',
    'CudaGemmFlopsBenchmark',
    'CudaMemBwBenchmark',
    'CudaNcclBwBenchmark',
    'CudnnBenchmark',
    'DiskBenchmark',
    'GPCNetBenchmark',
    'GemmFlopsBenchmark',
    'GpuBurnBenchmark',
    'GpuCopyBwBenchmark',
    'IBBenchmark',
    'IBLoopbackBenchmark',
    'KernelLaunch',
    'MemBwBenchmark',
    'MicroBenchmark',
    'MicroBenchmarkWithInvoke',
    'ORTInferenceBenchmark',
    'RocmGemmFlopsBenchmark',
    'RocmMemBwBenchmark',
    'ShardingMatmul',
    'TCPConnectivityBenchmark',
    'TensorRTInferenceBenchmark',
]