# run_sweep.yaml
# Sweep configuration that launches run_audio_classification.py.
# Command line launched for every run of the sweep. `${program}` and `${args}`
# are sweep macros: the first expands to the `program` entry of this file, the
# second to the run's hyperparameters rendered as command-line flags.
command:
  - python3
  - ${program}
  # Fixed flags, identical for every run.
  - --load_best_model_at_end
  - --fp16
  - --fp16_full_eval
  - --do_train
  - --do_eval
  - --trust_remote_code
  - --overwrite_output_dir
  - --ignore_mismatched_sizes
  - --gradient_checkpointing
  # Per-run hyperparameters taken from `parameters`.
  - ${args}
# Grid search: one run per combination of the `values` lists declared under
# `parameters`.
method: grid
# Metric the sweep tracks; larger values are better.
metric:
  goal: maximize
  name: eval/accuracy
# Hyperparameters handed to the training script. A `values` list is swept
# over; a single `value` is held constant across all runs.
parameters:
  # The only swept parameter: one run per checkpoint.
  model_name_or_path:
    values:
      - facebook/mms-lid-126
      - openai/whisper-large-v3

  # Training data. The entries are `+`-separated; the i-th item of each field
  # presumably describes the i-th training dataset — confirm against
  # run_audio_classification.py.
  train_dataset_name:
    value: sanchit-gandhi/vctk+facebook/voxpopuli+sanchit-gandhi/edacc
  train_dataset_config_name:
    value: default+en_accented+default
  train_split_name:
    value: train+test+validation
  train_label_column_name:
    value: accent+accent+accent

  # Evaluation data.
  eval_dataset_name:
    value: sanchit-gandhi/edacc
  eval_dataset_config_name:
    value: default
  eval_split_name:
    value: test
  eval_label_column_name:
    value: accent

  output_dir:
    value: ./
  remove_unused_columns:
    value: false

  # Optimisation schedule. The learning rate is written with an explicit
  # mantissa dot so that YAML 1.1 loaders (e.g. PyYAML) read it as a float
  # rather than as the string "1e-4".
  learning_rate:
    value: 1.0e-4
  lr_scheduler_type:
    value: constant_with_warmup
  max_length_seconds:
    value: 10  # give some data diversity for longer audio samples
  min_length_seconds:
    value: 5
  attention_mask:
    value: false
  warmup_steps:
    value: 50
  max_steps:
    value: 2000

  # Batch sizes and worker counts.
  per_device_train_batch_size:
    value: 32
  per_device_eval_batch_size:
    value: 16
  preprocessing_num_workers:
    value: 16
  dataloader_num_workers:
    value: 4

  # Logging, evaluation and checkpointing. `eval_steps` and `save_steps` both
  # equal `max_steps`, so each presumably fires once, at the final step.
  logging_strategy:
    value: steps
  logging_steps:
    value: 10
  evaluation_strategy:
    value: steps
  eval_steps:
    value: 2000
  save_strategy:
    value: steps
  save_steps:
    value: 2000
  metric_for_best_model:
    value: accuracy

  freeze_base_model:
    value: false
  push_to_hub:
    value: false
# Script that is substituted for `${program}` in `command`.
program: run_audio_classification.py
# Project name under which the sweep and its runs are grouped.
project: mms-lid-accent-classification