Spaces:

vishred18
/

Comparative-Analysis-of-Speech-Synthesis-Models

Build error

Upload 364 files

d5ee97c about 2 years ago

1.08 kB

	###########################################################
	# FEATURE EXTRACTION SETTING #
	###########################################################
	sampling_rate: 44100 # Sampling rate.
	fft_size: 2048 # FFT size.
	hop_size: 512 # Hop size. (fixed value, don't change)
	win_length: 2048 # Window length.
	# If set to null, it will be the same as fft_size.
	window: "hann" # Window function.
	num_mels: 80 # Number of mel basis.
	fmin: 20 # Minimum freq in mel basis calculation.
	fmax: 11025 # Maximum frequency in mel basis calculation.
	global_gain_scale: 1.0 # Will be multiplied to all of waveform.
	trim_silence: false # Whether to trim the start and end of silence
	trim_threshold_in_db: 60 # Need to tune carefully if the recording is not good.
	trim_frame_size: 2048 # Frame size in trimming.
	trim_hop_size: 512 # Hop size in trimming.
	format: "npy" # Feature file format. Only "npy" is supported.
	trim_mfa: false