"...composable_kernel.git" did not exist on "0a8087248b09e88cb3799b88cce10fd4c5c9a7da"
Commit 64cfa64e authored by Yoach Lacombe's avatar Yoach Lacombe
Browse files

update audio classification script

parent 10ef6f6c
#!/usr/bin/env bash #!/usr/bin/env bash
python run_audio_classification.py \ CUDA_VISIBLE_DEVICES=2 python run_audio_classification_one_layer.py \
--model_name_or_path "facebook/mms-lid-126" \ --model_name_or_path "facebook/mms-lid-4017" \
--train_dataset_name "stable-speech/concatenated-normalized-accent-dataset" \ --train_dataset_name "stable-speech/concatenated-normalized-accent-dataset" \
--train_dataset_config_name "default" \ --train_dataset_config_name "default" \
--train_split_name "train" \ --train_split_name "train" \
...@@ -10,11 +10,11 @@ python run_audio_classification.py \ ...@@ -10,11 +10,11 @@ python run_audio_classification.py \
--eval_dataset_config_name "default" \ --eval_dataset_config_name "default" \
--eval_split_name "test" \ --eval_split_name "test" \
--eval_label_column_name "labels" \ --eval_label_column_name "labels" \
--output_dir "./" \ --output_dir "./tmp/" \
--do_train \ --do_train \
--do_eval \ --do_eval \
--overwrite_output_dir \ --overwrite_output_dir \
--remove_unused_columns False \ --remove_unused_columns false \
--fp16 \ --fp16 \
--fp16_full_eval \ --fp16_full_eval \
--learning_rate 1e-4 \ --learning_rate 1e-4 \
...@@ -30,9 +30,11 @@ python run_audio_classification.py \ ...@@ -30,9 +30,11 @@ python run_audio_classification.py \
--logging_strategy "steps" \ --logging_strategy "steps" \
--logging_steps 10 \ --logging_steps 10 \
--evaluation_strategy "steps" \ --evaluation_strategy "steps" \
--eval_steps 500 \ --eval_steps 300 \
--save_strategy "no" \ --save_strategy "no" \
--save_steps 2000 \ --save_steps 2000 \
--freeze_base_model True \ --freeze_base_model true \
--push_to_hub False \ --freeze_feature_encoder true \
--trust_remote_code --push_to_hub false \
--trust_remote_code \
--use_weighted_layer_sum true \
command: command:
- python3 - python3
- ${program} - ${program}
- --load_best_model_at_end
- --fp16 - --fp16
- --fp16_full_eval - --fp16_full_eval
- --do_train - --do_train
- --do_eval - --do_eval
- --trust_remote_code - --trust_remote_code
- --overwrite_output_dir - --overwrite_output_dir
- --ignore_mismatched_sizes
- --gradient_checkpointing
- ${args} - ${args}
method: grid method: random
metric: metric:
goal: maximize goal: maximize
name: eval/accuracy name: eval/accuracy
parameters: parameters:
model_name_or_path: model_name_or_path:
value: facebook/mms-lid-126 value: facebook/mms-lid-4017
train_dataset_name: train_dataset_name:
value: stable-speech/concatenated-accent-dataset value: "stable-speech/concatenated-normalized-accent-dataset+stable-speech/concatenated-common-voice-15-accented"
train_dataset_config_name: train_dataset_config_name:
value: default value: "default+default"
train_split_name: train_split_name:
value: train value: "train+train"
train_label_column_name: train_label_column_name:
value: labels value: "labels+labels"
eval_dataset_name: eval_dataset_name:
value: stable-speech/concatenated-accent-dataset value: stable-speech/concatenated-normalized-accent-dataset
eval_dataset_config_name: eval_dataset_config_name:
value: default value: default
eval_split_name: eval_split_name:
...@@ -35,31 +32,38 @@ parameters: ...@@ -35,31 +32,38 @@ parameters:
eval_label_column_name: eval_label_column_name:
value: labels value: labels
output_dir: output_dir:
value: ./ value: "/raid/yoach/tmp/"
remove_unused_columns: remove_unused_columns:
value: false value: false
learning_rate: learning_rate:
value: 1e-4 distribution: log_uniform_values
min: 3e-6
max: 0.01
lr_scheduler_type: lr_scheduler_type:
value: constant_with_warmup value: constant
max_length_seconds: max_length_seconds:
value: 20 # give some data diversity for longer audio samples value: 20 # give some data diversity for longer audio samples
min_length_seconds: min_length_seconds:
value: 7 value: 5
attention_mask: attention_mask:
value: true values:
warmup_steps: - true
value: 100 num_train_epochs:
max_steps: values:
value: 2000 - 2
- 5
- 10
- 20
- 40
- 60
per_device_train_batch_size: per_device_train_batch_size:
value: 32 value: 32
per_device_eval_batch_size: per_device_eval_batch_size:
value: 16 value: 32
preprocessing_num_workers: preprocessing_num_workers:
value: 4 value: 8
dataloader_num_workers: dataloader_num_workers:
value: 4 value: 8
logging_strategy: logging_strategy:
value: steps value: steps
logging_steps: logging_steps:
...@@ -67,20 +71,28 @@ parameters: ...@@ -67,20 +71,28 @@ parameters:
evaluation_strategy: evaluation_strategy:
value: steps value: steps
eval_steps: eval_steps:
value: 1000 value: 2000
save_strategy: save_strategy:
value: steps value: "no"
save_steps: save_steps:
value: 2000 value: 2000
metric_for_best_model: metric_for_best_model:
value: accuracy value: accuracy
freeze_base_model:
values:
- false
- true
group_by_length:
value: false # TODO(SG): batch by length
push_to_hub: push_to_hub:
value: false value: false
use_weighted_layer_sum:
value: false
freeze_base_model:
value: true
max_samples_per_label:
value: 10000
save_to_disk:
value: "/raid/yoach/tmp_dataset_accents/"
temporary_save_to_disk:
value: "/raid/yoach/tmp_hidden_states/"
use_last_embedding_layer:
value: true
filter_threshold:
value: "0.001"
program: run_audio_classification.py program: run_audio_classification.py
project: mms-lid-accent-classification project: mms-lid-accent-classification-v2
\ No newline at end of file
This diff is collapsed.
Markdown is supported
0% or .
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or to comment