{
  "fp16": {
    "enabled": false,
    "min_loss_scale": 1
  },
  "amp": {
    "enabled": false,
    "opt_level": "O2"
  },
  "bfloat16": {
    "enabled": true
  },
  "zero_optimization": {
    "stage": 2,
    "cpu_offload": true,
    "contiguous_gradients": true
  },
  "activation_checkpointing": {
    "partition_activations": true,
    "cpu_checkpointing": false,
    "profile": false
  },
  "gradient_clipping": 0.1
}