# Copyright (c) Microsoft Corporation.
# Licensed under the MIT license.

"""Micro benchmark example for NCCL/RCCL Bus bandwidth performance.

Commands to run:
  python3 examples/benchmarks/nccl_bw_performance.py
"""

from superbench.benchmarks import BenchmarkRegistry, Platform
from superbench.common.utils import logger

if __name__ == '__main__':
    # Build the context for the 'nccl-bw' benchmark on the CUDA platform,
    # passing '--operations allreduce' as the benchmark parameters.
    context = BenchmarkRegistry.create_benchmark_context(
        'nccl-bw', platform=Platform.CUDA, parameters='--operations allreduce'
    )
    # For ROCM environment, please specify the benchmark name and the platform as the following.
    # context = BenchmarkRegistry.create_benchmark_context(
    #     'rccl-bw', platform=Platform.ROCM, parameters='--operations allreduce --maxbytes 128M'
    # )

    # Launch the benchmark described by the context; the summary below is
    # logged only when launch_benchmark returns a truthy benchmark object.
    benchmark = BenchmarkRegistry.launch_benchmark(context)
    if benchmark:
        logger.info(
            'benchmark: {}, return code: {}, result: {}'.format(
                benchmark.name, benchmark.return_code, benchmark.result
            )
        )