# run_sweep.yaml
# Command line launched for each run of the sweep. The flags listed here are
# fixed for every run.
command:
  - python3
  # Placeholder; presumably replaced by the top-level `program` value.
  - ${program}
  - --load_best_model_at_end
  - --fp16
  - --fp16_full_eval
  - --do_train
  - --do_eval
  - --trust_remote_code
  - --overwrite_output_dir
  - --ignore_mismatched_sizes
  - --gradient_checkpointing
  # Placeholder; presumably expanded by the sweep agent into one command-line
  # flag per `parameters` entry.
  - ${args}
# Search strategy used to pick parameter combinations.
method: grid
# Objective tracked for the sweep: maximize the logged `eval/accuracy`.
metric:
  goal: maximize
  name: eval/accuracy
# Sweep parameters. An entry with `value` is pinned to that single setting;
# an entry with `values` lists the settings to try.
parameters:
  # Model checkpoint.
  model_name_or_path:
    value: facebook/mms-lid-126
  # Training data: `train` split, labels read from the `labels` column.
  train_dataset_name:
    value: stable-speech/concatenated-accent-dataset
  train_dataset_config_name:
    value: default
  train_split_name:
    value: train
  train_label_column_name:
    value: labels
  # Evaluation data: same dataset and label column, `test` split.
  eval_dataset_name:
    value: stable-speech/concatenated-accent-dataset
  eval_dataset_config_name:
    value: default
  eval_split_name:
    value: test
  eval_label_column_name:
    value: labels
  # Output location and column handling.
  output_dir:
    value: ./
  remove_unused_columns:
    value: false
  # Optimisation schedule.
  learning_rate:
    # Written with an explicit decimal point: YAML 1.1 loaders (e.g. PyYAML)
    # resolve a bare `1e-4` as the string "1e-4" rather than a float.
    value: 1.0e-4
  lr_scheduler_type:
    value: constant_with_warmup
  # Audio length bounds, in seconds.
  max_length_seconds:
    value: 20  # give some data diversity for longer audio samples
  min_length_seconds:
    value: 7
  attention_mask:
    value: true
  warmup_steps:
    value: 100
  max_steps:
    value: 2000
  # Batch sizes and worker counts.
  per_device_train_batch_size:
    value: 32
  per_device_eval_batch_size:
    value: 16
  preprocessing_num_workers:
    value: 4
  dataloader_num_workers:
    value: 4
  # Logging cadence.
  logging_strategy:
    value: steps
  logging_steps:
    value: 10
  # Evaluation and checkpoint cadence; `save_steps` is a multiple of
  # `eval_steps`.
  evaluation_strategy:
    value: steps
  eval_steps:
    value: 1000
  save_strategy:
    value: steps
  save_steps:
    value: 2000
  metric_for_best_model:
    value: accuracy
  # Swept setting (`values`, not `value`): both options are listed.
  freeze_base_model:
    values:
      - false
      - true
  group_by_length:
    value: false  # TODO(SG): batch by length
  push_to_hub:
    value: false
# Training script; presumably what `${program}` in `command` resolves to.
program: run_audio_classification.py
# Project name for this sweep (presumably where its runs are grouped).
project: mms-lid-accent-classification