#!/usr/bin/env bash
#
# run_mms_lid.sh
#
# Launches run_audio_classification.py in train + eval mode (--do_train,
# --do_eval) starting from the "facebook/mms-lid-126" checkpoint, using the
# "train" and "test" splits of "stable-speech/concatenated-accent-dataset".
#
# Usage:
#   bash run_mms_lid.sh
#
# Notes:
#   * run_audio_classification.py is referenced by a relative path, so the
#     script must be started from the directory that contains it.
#   * Outputs are written to the current directory ("./") and
#     --overwrite_output_dir is set.
#   * The options live in an array (rather than one backslash-continued
#     command) so that each group can be commented; the resulting argv passed
#     to python is unchanged.

set -euo pipefail

args=(
  # Model checkpoint to start from.
  --model_name_or_path "facebook/mms-lid-126"

  # Training data.
  --train_dataset_name "stable-speech/concatenated-accent-dataset"
  --train_dataset_config_name "default"
  --train_split_name "train"
  --train_label_column_name "labels"

  # Evaluation data (same dataset, "test" split).
  --eval_dataset_name "stable-speech/concatenated-accent-dataset"
  --eval_dataset_config_name "default"
  --eval_split_name "test"
  --eval_label_column_name "labels"

  # Output location and run mode.
  --output_dir "./"
  --do_train
  --do_eval
  --overwrite_output_dir
  --remove_unused_columns False

  # Half-precision for training and for evaluation.
  --fp16
  --fp16_full_eval

  # Optimisation schedule and audio length bounds (in seconds).
  --learning_rate 1e-4
  --max_length_seconds 20
  --min_length_seconds 5
  --attention_mask
  --warmup_steps 100
  --max_steps 1000

  # Batch sizes and worker counts.
  --per_device_train_batch_size 32
  --per_device_eval_batch_size 32
  --preprocessing_num_workers 4
  --dataloader_num_workers 4

  # Logging / evaluation / checkpoint cadence, all step-based.
  --logging_strategy "steps"
  --logging_steps 10
  --evaluation_strategy "steps"
  --eval_steps 500
  --save_strategy "steps"
  --save_steps 1000

  # Remaining switches; semantics are defined by run_audio_classification.py.
  --freeze_base_model False
  --push_to_hub False
  --trust_remote_code
)

python run_audio_classification.py "${args[@]}"