# run_sweep.yaml
# Sweep configuration (W&B-style) for the accent-classification training script.
# Command line launched for every run of the sweep.
# `${program}` and `${args}` are placeholders filled in by the sweep agent:
# the former with the `program` key of this file, the latter with the
# per-run parameter values.
command:
  - python3
  - ${program}
  # Flags that are fixed for every run (not swept).
  - --load_best_model_at_end
  - --fp16
  - --do_train
  - --do_eval
  - --trust_remote_code
  - --overwrite_output_dir
  - --ignore_mismatched_sizes
  # Swept / constant parameters from the `parameters` section go last.
  - ${args}
# Search strategy: `grid` tries every combination of the parameters that
# declare a `values` list.
method: grid
# Metric the sweep tracks, and the direction that counts as better.
metric:
  goal: maximize
  name: eval/accuracy
# Arguments forwarded to the training script.
# `values` (plural) marks a swept parameter; `value` (singular) pins a constant.
parameters:
  # --- Swept: base checkpoint -------------------------------------------
  model_name_or_path:
    values:
      - facebook/mms-lid-126
      - openai/whisper-large-v3
      - facebook/w2v-bert-2.0

  # --- Training data ----------------------------------------------------
  # Three datasets joined with `+`; the config, split and label-column
  # entries below each list three `+`-separated items in the same order.
  # NOTE(review): presumably the script splits on `+` and pairs the entries
  # positionally — confirm against run_audio_classification.py.
  train_dataset_name:
    value: sanchit-gandhi/vctk+facebook/voxpopuli+sanchit-gandhi/edacc
  train_dataset_config_name:
    value: default+en_accented+default
  train_split_name:
    value: train+test+validation
  train_label_column_name:
    value: accent+accent+accent

  # --- Evaluation data --------------------------------------------------
  eval_dataset_name:
    value: sanchit-gandhi/edacc
  eval_dataset_config_name:
    value: default
  eval_split_name:
    value: test
  eval_label_column_name:
    value: accent

  # --- Output / data handling -------------------------------------------
  output_dir:
    value: ./
  remove_unused_columns:
    value: false

  # --- Optimisation -----------------------------------------------------
  # Written with a decimal point on purpose: YAML 1.1 loaders (e.g. PyYAML)
  # resolve a bare `1e-4` as the string '1e-4', not as a float.
  learning_rate:
    value: 1.0e-4
  lr_scheduler_type:
    value: constant_with_warmup
  # NOTE(review): presumably lower/upper bounds on audio clip duration, in
  # seconds — confirm how the script applies them.
  max_length_seconds:
    value: 20
  min_length_seconds:
    value: 5
  attention_mask:
    value: false
  warmup_steps:
    value: 50
  max_steps:
    value: 1000

  # --- Batching / workers -----------------------------------------------
  per_device_train_batch_size:
    value: 32
  per_device_eval_batch_size:
    value: 32
  preprocessing_num_workers:
    value: 16
  dataloader_num_workers:
    value: 8

  # --- Logging, evaluation, checkpointing -------------------------------
  logging_strategy:
    value: steps
  logging_steps:
    value: 10
  # eval_steps and save_steps both equal max_steps (1000), so each run
  # evaluates and checkpoints once, at the final step.
  evaluation_strategy:
    value: steps
  eval_steps:
    value: 1000
  save_strategy:
    value: steps
  save_steps:
    value: 1000
  metric_for_best_model:
    value: accuracy

  # --- Swept: freeze the base model or not ------------------------------
  freeze_base_model:
    values:
      - true
      - false

  push_to_hub:
    value: false
# Project name under which the sweep's runs are grouped.
project: mms-lid-accent-classification
# Script substituted for `${program}` in the `command` list.
program: run_audio_classification.py