# audio_config_8k.yaml (last committed by liugh5)
# Audio processing configs

# Settings for the 8000 Hz audio pipeline, grouped by stage: preprocessing,
# feature extraction, normalization, and parallelism.
# Booleans use the canonical lowercase `true`/`false` spelling so that every
# YAML 1.1 / 1.2 loader resolves them to the same type.
audio_config:
  # Preprocess
  wav_normalize: true
  trim_silence: true
  # NOTE(review): written as a positive number while the other *_db keys below
  # use negative/reference levels — confirm the sign convention the consumer
  # expects before changing it.
  trim_silence_threshold_db: 60
  preemphasize: false

  # Feature extraction
  sampling_rate: 8000
  # Presumably measured in samples (TODO confirm); if so, at 8000 Hz this is
  # 100 / 8000 = 12.5 ms per hop.
  hop_length: 100
  # Presumably measured in samples (TODO confirm); if so, 600 / 8000 = 75 ms.
  win_length: 600
  # Larger than win_length (2048 > 600).
  n_fft: 2048
  n_mels: 80
  fmin: 0.0
  # Equals sampling_rate / 2 (8000 / 2 = 4000); keep the two in sync if
  # sampling_rate is changed.
  fmax: 4000.0
  phone_level_feature: true

  # Normalization
  norm_type: "mean_std"  # "mean_std" or "global"
  # NOTE(review): max_norm / symmetric / min_level_db / ref_level_db may only
  # be consulted for one of the norm_type choices — verify against the
  # consumer.
  max_norm: 1.0
  symmetric: false
  min_level_db: -100.0
  ref_level_db: 20

  # Parallelism — presumably the number of worker processes/threads used by
  # the consumer (TODO confirm); tune to the host's core count.
  num_workers: 16