# sft_dataset.yaml (342 bytes) — committed by wangsen
---
# Dataset blend definition for supervised fine-tuning (SFT).
# NOTE(review): `__module__` / `__class__` presumably tell the loader which
# Python class this document configures (megatron.energon.Metadataset) —
# confirm against the Megatron-Energon metadataset documentation.
__module__: megatron.energon
__class__: Metadataset

# One entry per split; each split lists the datasets it draws from.
splits:
  # Training split: a single dataset.
  train:
    datasets:
      - path: /workspace/data/sft/train/dataset
        # NOTE(review): presumably a relative sampling weight; with only one
        # dataset in the list its exact value should not matter — confirm.
        weight: 1.0
        # NOTE(review): subflavors look like free-form tags attached to this
        # dataset's samples; verify how `augmentation` is consumed downstream.
        subflavors:
          augmentation: false

  # Validation split: a single dataset, configured like the training one.
  val:
    datasets:
      - path: /workspace/data/sft/validation/dataset
        weight: 1.0
        subflavors:
          augmentation: false