# jsut_preprocess.yaml
# Forked from TensorSpeech/TensorFlowTTS.
# ---------------------------------------------------------
#  Feature extraction settings
# ---------------------------------------------------------

# Audio / STFT analysis parameters.
sampling_rate: 24000        # Sampling rate of the audio.
fft_size: 2048              # Size of the FFT.
hop_size: 300               # Hop size; fixed value, do not change.
# Window length; when set to null, fft_size is used instead.
win_length: 1200
window: 'hann'              # Name of the window function.

# Mel basis parameters.
num_mels: 80                # Number of mel basis.
fmin: 80                    # Lowest frequency used to build the mel basis.
fmax: 7600                  # Highest frequency used to build the mel basis.

# Waveform scaling.
global_gain_scale: 1.0      # Factor every waveform is multiplied by.

# Silence trimming.
trim_silence: true          # Trim silence at the start and end when true.
trim_threshold_in_db: 60    # Tune carefully when recording quality is poor.
trim_frame_size: 2048       # Frame size used while trimming.
trim_hop_size: 512          # Hop size used while trimming.

# Output.
format: 'npy'               # Feature file format; only "npy" is supported.