-
Notifications
You must be signed in to change notification settings - Fork 3
/
config.yml
50 lines (44 loc) · 1.06 KB
/
config.yml
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
# Contains model configs.
# `mel_channels` is anchored here so that other entries in this file can
# alias it (`*mel_channels`) instead of repeating the literal value.
mel_channels: &mel_channels 80
# Trainer-level settings. The child keys are indented under `trainer:`;
# without indentation `trainer` parses as null and its keys become
# top-level entries.
# NOTE(review): the flattened source does not show whether the model
# sections that follow were also nested under `trainer` - confirm against
# the code that loads this file.
trainer:
  # Anchored so other entries can reuse the same value via `*sampling_rate`.
  sampling_rate: &sampling_rate 22050
  mu_law: true
# Audio generator settings. Keys are nested under `audio_generator:` so
# that `_target_` and `kernel_size` are scoped to this section instead of
# being duplicate top-level keys (where most parsers keep only the last).
# NOTE(review): `_target_` presumably names the class the loader
# instantiates with the remaining keys as arguments - confirm.
audio_generator:
  _target_: models.AudioGenerator
  align_gamma: 10.0
  encoder_layers: 12
  encoder_channels: 256
  decoder_scales: [1, 1, 2, 3, 3, 5]
  decoder_channels: 512
  latent_channels: 128
  kernel_size: 3
# Audio discriminator settings. Keys are nested under
# `audio_discriminator:` so that `_target_`, `n_layers`, `base_channels`
# and `kernel_size` are scoped to this section instead of being duplicate
# top-level keys.
# NOTE(review): `_target_` presumably names the class the loader
# instantiates with the remaining keys as arguments - confirm.
audio_discriminator:
  _target_: models.AudioDiscriminator
  windows: [200, 400, 800, 1600, 3200]
  n_layers: 3
  base_channels: 64
  kernel_size: 3
# Spectrogram discriminator settings. Keys are nested under
# `spect_discriminator:`; left at the top level, the `mel_channels` entry
# here would duplicate (and typically override) the anchored top-level
# `mel_channels` key.
# NOTE(review): `_target_` presumably names the class the loader
# instantiates with the remaining keys as arguments - confirm.
spect_discriminator:
  _target_: models.SpectrogramDiscriminator
  n_discs: 3
  n_layers: 3
  # Alias of the `&mel_channels` anchor defined earlier in this file.
  mel_channels: *mel_channels
  base_channels: 64
  kernel_size: 3
# Mel-spectrogram function settings. Keys are nested under `spect_fn:` so
# that `_target_` and `sampling_rate` are scoped to this section instead of
# being duplicate top-level keys.
# NOTE(review): `_target_` presumably names the class the loader
# instantiates with the remaining keys as arguments - confirm.
spect_fn:
  _target_: modules.mel.MelSpectrogram
  filter_length: 1024
  hop_length: 256
  win_length: 1024
  # Aliases of the `&mel_channels` / `&sampling_rate` anchors defined
  # earlier in this file, so the values stay in sync.
  n_mels: *mel_channels
  sampling_rate: *sampling_rate
  # Floats written with an explicit fractional digit (same values as the
  # bare `0.` / `8000.` forms).
  mel_fmin: 0.0
  mel_fmax: 8000.0
  window: hann
# Soft dynamic time warping settings. Keys are nested under `sdtw_fn:` so
# that `_target_` is scoped to this section instead of being a duplicate
# top-level key.
# NOTE(review): `_target_` presumably names the class the loader
# instantiates with the remaining keys as arguments - confirm.
sdtw_fn:
  _target_: modules.sdtw.SoftDynamicTimeWarping
  gamma: 0.01
  penalty: 1.0
  normalize: false
  # Explicit null rather than an empty value.
  bandwidth: null
  dist_func: manhattan