Skip to content
GitLab
Menu
Projects
Groups
Snippets
Loading...
Help
Help
Support
Community forum
Keyboard shortcuts
?
Submit feedback
Contribute to GitLab
Sign in / Register
Toggle navigation
Menu
Open sidebar
chenpangpang
parler-tts
Commits
b6341055
Commit
b6341055
authored
Feb 21, 2024
by
Yoach Lacombe
Browse files
write first version of training script + example config
parent
813df4d2
Changes
2
Expand all
Hide whitespace changes
Inline
Side-by-side
Showing
2 changed files
with
1077 additions
and
0 deletions
+1077
-0
example_configs/librispeech_tts_r.json
example_configs/librispeech_tts_r.json
+63
-0
run_stable_speech_training.py
run_stable_speech_training.py
+1014
-0
No files found.
example_configs/librispeech_tts_r.json
0 → 100644
View file @
b6341055
{
"model_name_or_path"
:
"ylacombe/musicgen-melody"
,
"push_to_hub"
:
false
,
"hub_model_id"
:
"stable-speech-mini"
,
"report_to"
:
[
"wandb"
],
"overwrite_output_dir"
:
true
,
"output_dir"
:
"/home/yoach/dataspeech/artefacts/training/"
,
"train_dataset_name"
:
"blabble-io/libritts_r+blabble-io/libritts_r+blabble-io/libritts_r"
,
"train_metadata_dataset_name"
:
"stable-speech/libritts-r-tags-and-text-generated+stable-speech/libritts-r-tags-and-text-generated+stable-speech/libritts-r-tags-and-text-generated"
,
"train_dataset_config_name"
:
"clean+clean+other"
,
"train_split_name"
:
"train.clean.360+train.clean.100+train.other.500"
,
"eval_dataset_name"
:
"blabble-io/libritts_r+blabble-io/libritts_r"
,
"eval_metadata_dataset_name"
:
"stable-speech/libritts-r-tags-and-text-generated+stable-speech/libritts-r-tags-and-text-generated"
,
"eval_dataset_config_name"
:
"clean+other"
,
"eval_split_name"
:
"test.clean+test.other"
,
"target_audio_column_name"
:
"audio"
,
"description_column_name"
:
"text"
,
"prompt_column_name"
:
"text_description"
,
"max_train_samples"
:
1000
,
"max_eval_samples"
:
200
,
"max_duration_in_seconds"
:
20
,
"min_duration_in_seconds"
:
1.0
,
"add_audio_samples_to_wandb"
:
true
,
"id_column_name"
:
"id"
,
"preprocessing_num_workers"
:
24
,
"pad_token_id"
:
2048
,
"decoder_start_token_id"
:
2048
,
"do_train"
:
true
,
"num_train_epochs"
:
20
,
"gradient_accumulation_steps"
:
1
,
"gradient_checkpointing"
:
true
,
"per_device_train_batch_size"
:
2
,
"learning_rate"
:
1e-6
,
"adam_beta1"
:
0.9
,
"adam_beta2"
:
0.95
,
"weight_decay"
:
0.1
,
"logging_steps"
:
25
,
"do_eval"
:
true
,
"predict_with_generate"
:
true
,
"include_inputs_for_metrics"
:
true
,
"evaluation_strategy"
:
"epoch"
,
"per_device_eval_batch_size"
:
2
,
"generation_max_length"
:
400
,
"fp16"
:
true
,
"seed"
:
456
,
"dataloader_num_workers"
:
8
}
run_stable_speech_training.py
0 → 100644
View file @
b6341055
This diff is collapsed.
Click to expand it.
Write
Preview
Markdown
is supported
0%
Try again
or
attach a new file
.
Attach a file
Cancel
You are about to add
0
people
to the discussion. Proceed with caution.
Finish editing this message first!
Cancel
Please
register
or
sign in
to comment