update

51782715 · liugh5 · 8b4e9acd · 8b4e9acd · 8b4e9acd · 8b4e9acd
Commit 51782715 authored Feb 23, 2024 by liugh5
20 changed files
--- a/kantts/configs/sambert_se_nsf_global_16k.yaml
+++ b/kantts/configs/sambert_se_nsf_global_16k.yaml
-model_type: sambert
-Model:
-#########################################################
-#         SAMBERT NETWORK ARCHITECTURE SETTING          #
-#########################################################
-  KanTtsSAMBERT:
-    params:
-        max_len: 800
-
-        embedding_dim: 512 
-        encoder_num_layers: 8
-        encoder_num_heads: 8
-        encoder_num_units: 128
-        encoder_ffn_inner_dim: 1024
-        encoder_dropout: 0.1
-        encoder_attention_dropout: 0.1
-        encoder_relu_dropout: 0.1
-        encoder_projection_units: 32
-
-        speaker_units: 192
-        emotion_units: 32
-
-        predictor_filter_size: 41
-        predictor_fsmn_num_layers: 3
-        predictor_num_memory_units: 128
-        predictor_ffn_inner_dim: 256
-        predictor_dropout: 0.1
-        predictor_shift: 0
-        predictor_lstm_units: 128
-        dur_pred_prenet_units: [128, 128]
-        dur_pred_lstm_units: 128
-
-        decoder_prenet_units: [256, 256]
-        decoder_num_layers: 12
-        decoder_num_heads: 8
-        decoder_num_units: 128
-        decoder_ffn_inner_dim: 1024
-        decoder_dropout: 0.1
-        decoder_attention_dropout: 0.1
-        decoder_relu_dropout: 0.1
-
-        outputs_per_step: 3
-        num_mels: 82
-
-        postnet_filter_size: 41
-        postnet_fsmn_num_layers: 4
-        postnet_num_memory_units: 256
-        postnet_ffn_inner_dim: 512
-        postnet_dropout: 0.1
-        postnet_shift: 17
-        postnet_lstm_units: 128
-        MAS: False
-        NSF: True
-        nsf_norm_type: global 
-        nsf_f0_global_minimum: 30.0
-        nsf_f0_global_maximum: 730.0            
-        SE: True
-
-
-    optimizer:
-      type: Adam
-      params:
-        lr: 0.001
-        betas: [0.9, 0.98]
-        eps: 1.0e-9
-        weight_decay: 0.0
-    scheduler:
-      type: NoamLR
-      params:
-        warmup_steps: 4000
-
-linguistic_unit: 
-  cleaners: english_cleaners
-  lfeat_type_list: sy,tone,syllable_flag,word_segment,emo_category,speaker_category
-  speaker_list: F7
-####################################################
-#                   LOSS SETTING                   #
-####################################################
-Loss:
-  MelReconLoss:
-    enable: True
-    params:
-      loss_type: mae
-
-  ProsodyReconLoss:
-    enable: True
-    params:
-      loss_type: mae
-
-###########################################################
-#                  DATA LOADER SETTING                    #
-###########################################################
-batch_size: 32              
-pin_memory: False            
-num_workers: 4 # FIXME: set > 0 may stuck on macos              
-remove_short_samples: False 
-allow_cache: False           
-grad_norm: 1.0
-
-###########################################################
-#                    INTERVAL SETTING                     #
-###########################################################
-train_max_steps: 1760101           # Number of training steps.
-save_interval_steps: 100        # Interval steps to save checkpoint.
-eval_interval_steps: 1000000000000          # Interval steps to evaluate the network. 
-log_interval_steps: 10           # Interval steps to record the training log.
-
-###########################################################
-#                     OTHER SETTING                       #
-###########################################################
-num_save_intermediate_results: 4  # Number of results to be saved as intermediate results.
--- a/kantts/configs/sambert_se_nsf_global_24k.yaml
+++ b/kantts/configs/sambert_se_nsf_global_24k.yaml
--- a/kantts/configs/sambert_sichuan_16k.yaml
+++ b/kantts/configs/sambert_sichuan_16k.yaml
--- a/kantts/configs/sybert.yaml
+++ b/kantts/configs/sybert.yaml
-model_type: sybert
-Model:
-#########################################################
-#         TextsyBERT NETWORK ARCHITECTURE SETTING          #
-#########################################################
-  KanTtsTextsyBERT:
-    params:
-        max_len: 800
-
-        embedding_dim: 512
-        encoder_num_layers: 8
-        encoder_num_heads: 8
-        encoder_num_units: 128
-        encoder_ffn_inner_dim: 1024
-        encoder_dropout: 0.1
-        encoder_attention_dropout: 0.1
-        encoder_relu_dropout: 0.1
-        encoder_projection_units: 32
-        
-        mask_ratio: 0.3
-
-    optimizer:
-      type: Adam
-      params:
-        lr: 0.0001
-        betas: [0.9, 0.98]
-        eps: 1.0e-9
-        weight_decay: 0.0
-    scheduler:
-      type: NoamLR
-      params:
-        warmup_steps: 10000
-
-linguistic_unit:
-  cleaners: english_cleaners
-  lfeat_type_list: sy,tone,syllable_flag,word_segment,emo_category,speaker_category
-  speaker_list: F7
-####################################################
-#                   LOSS SETTING                   #
-####################################################
-Loss:
-  SeqCELoss:
-    enable: True
-    params:
-      loss_type: ce
-
-###########################################################
-#                  DATA LOADER SETTING                    #
-###########################################################
-batch_size: 32
-pin_memory: False
-num_workers: 4 # FIXME: set > 0 may stuck on macos
-remove_short_samples: False
-allow_cache: True
-
-grad_norm: 1.0
-
-###########################################################
-#                    INTERVAL SETTING                     #
-###########################################################
-train_max_steps: 1000000           # Number of training steps.
-save_interval_steps: 20000         # Interval steps to save checkpoint.
-eval_interval_steps: 10000          # Interval steps to evaluate the network.
-log_interval_steps: 1000            # Interval steps to record the training log.
-
-###########################################################
-#                     OTHER SETTING                       #
-###########################################################
-num_save_intermediate_results: 4  # Number of results to be saved as intermediate results.
--- a/kantts/datasets/__init__.py
+++ b/kantts/datasets/__init__.py
--- a/kantts/datasets/__pycache__/__init__.cpython-38.pyc
+++ b/kantts/datasets/__pycache__/__init__.cpython-38.pyc
--- a/kantts/datasets/__pycache__/dataset.cpython-38.pyc
+++ b/kantts/datasets/__pycache__/dataset.cpython-38.pyc
--- a/kantts/datasets/data_types.py
+++ b/kantts/datasets/data_types.py
--- a/kantts/datasets/dataset.py
+++ b/kantts/datasets/dataset.py
--- a/kantts/models/__init__.py
+++ b/kantts/models/__init__.py
--- a/kantts/models/__pycache__/__init__.cpython-38.pyc
+++ b/kantts/models/__pycache__/__init__.cpython-38.pyc
--- a/kantts/models/__pycache__/pqmf.cpython-38.pyc
+++ b/kantts/models/__pycache__/pqmf.cpython-38.pyc
--- a/kantts/models/__pycache__/utils.cpython-38.pyc
+++ b/kantts/models/__pycache__/utils.cpython-38.pyc
--- a/kantts/models/hifigan/__pycache__/hifigan.cpython-38.pyc
+++ b/kantts/models/hifigan/__pycache__/hifigan.cpython-38.pyc
--- a/kantts/models/hifigan/__pycache__/layers.cpython-38.pyc
+++ b/kantts/models/hifigan/__pycache__/layers.cpython-38.pyc
--- a/kantts/models/hifigan/hifigan.py
+++ b/kantts/models/hifigan/hifigan.py
--- a/kantts/models/hifigan/layers.py
+++ b/kantts/models/hifigan/layers.py
--- a/kantts/models/pqmf.py
+++ b/kantts/models/pqmf.py
--- a/kantts/models/sambert/__init__.py
+++ b/kantts/models/sambert/__init__.py
--- a/kantts/models/sambert/__pycache__/__init__.cpython-38.pyc
+++ b/kantts/models/sambert/__pycache__/__init__.cpython-38.pyc