# SuperBench Config
#
# Layout: `superbench.benchmarks` maps a benchmark name to its settings.
# Each benchmark below carries an `enable` flag, a list of run `modes`,
# the `frameworks` to use, and a `parameters` mapping.
superbench:
  # NOTE(review): top-level `enable` is explicitly null; presumably this means
  # "no top-level override" and the per-benchmark flags apply -- confirm
  # against the config loader.
  enable: null
  benchmarks:
    matmul:
      enable: true
      modes:
        - name: local
          proc_num: 8
          # NOTE(review): `{proc_rank}` looks like a placeholder substituted
          # per process by the runner -- confirm.
          prefix: CUDA_VISIBLE_DEVICES={proc_rank}
          # Canonical boolean. The YAML 1.1 spelling `no` is read as the
          # string "no" by YAML 1.2 parsers, so `false` is used instead.
          parallel: false
      frameworks:
        - pytorch
      parameters:
        num_steps: 2048
    bert_models:
      enable: true
      modes:
        - name: torch.distributed
          proc_num: 8
          # Plain string `all`, not a number.
          node_num: all
      frameworks:
        - pytorch
      models:
        - bert-base
        - bert-large
      parameters:
        duration: 0
        num_warmup: 64
        num_steps: 2048
        batch_size: 16
        precision:
          - float32
          - float16
        model_action:
          - train
          - inference