deepspeed_config.json 526 Bytes
Newer Older
{
  "optimizer": {
    "type": "Adam",
    "params": {
      "lr": 0.001,
      "eps": 1e-05
    }
  },
  "fp16": {
    "enabled": true,
    "min_loss_scale": 1
  },
  "amp": {
    "enabled": false,
    "opt_level": "O2"
  },
  "bfloat16": {
    "enabled": false
  },
  "zero_optimization": {
    "stage": 2,
    "cpu_offload": true,
    "contiguous_gradients": true
  },
  "activation_checkpointing": {
    "partition_activations": true,
    "cpu_checkpointing": false,
    "profile": false
  },
  "gradient_clipping": 0.1
}