# sft_dataset.yaml
# Metadataset definition (class `Metadataset` from `megatron.energon`).
# Declares two splits, `train` and `val`, each with a single dataset entry.
__module__: megatron.energon
__class__: Metadataset
splits:
  # Training split.
  train:
    datasets:
      # Replace the placeholder below with the actual dataset location.
      - path: <path_to_sft_dataset_in_energon_format>
        # NOTE(review): presumably the relative sampling weight among the
        # entries of this list - confirm against the Energon documentation.
        weight: 1.0
        # NOTE(review): presumably free-form tags attached to samples from
        # this dataset - confirm how the consumer reads `augmentation`.
        subflavors:
          augmentation: false
  # Validation split. It uses the same placeholder as `train`; substitute
  # whichever path is appropriate for validation.
  val:
    datasets:
      - path: <path_to_sft_dataset_in_energon_format>
        weight: 1.0
        subflavors:
          augmentation: false