# File: gpt3l-flash-8k.yaml (committed by Tri Dao)
# @package _global_
# Variant of the gpt3l-flash experiment with max_length raised to 8192
# (the "8k" in this file's name). It pulls in the base experiment through
# `defaults` and sets three values of its own.
# NOTE(review): the `@package _global_` line above looks like a Hydra package
# directive rather than an ordinary comment - leave it untouched; confirm.
# NOTE(review): assumes the values in this file take precedence over the base
# config; that depends on the composition order in use (`_self_`) - confirm.
defaults:
  # Base experiment config this file builds on.
  - /experiment/pile/gpt3l-flash.yaml

datamodule:
  # Maximum sequence length (presumably counted in tokens - confirm in the
  # datamodule implementation).
  max_length: 8192
  # Batch size derived from train.gpu_mem: 1 when it is below 40, 2 when it is
  # below 80, otherwise 4.
  # NOTE(review): train.gpu_mem is not defined in this file; presumably GPU
  # memory in GB supplied by the base config - confirm. `eval` is presumably a
  # custom resolver registered by the project - confirm it is available.
  batch_size: ${eval:"1 if ${train.gpu_mem} < 40 else (2 if ${train.gpu_mem} < 80 else 4)"}

train:
  # NOTE(review): presumably the effective batch size summed over all devices
  # and accumulation steps - confirm against the training code.
  global_batch_size: 64