Dongchao committed on
Commit
ac13e2e
1 Parent(s): 14c4be6

Upload config.yaml

Browse files
Files changed (1) hide show
  1. config.yaml +172 -0
config.yaml ADDED
@@ -0,0 +1,172 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ generator:
2
+ name: ScalarModel
3
+ config:
4
+ num_bands: 1
5
+ sample_rate: 48000
6
+ causal: true
7
+ num_samples: 2
8
+ downsample_factors:
9
+ - 4
10
+ - 5
11
+ - 5
12
+ - 5
13
+ downsample_kernel_sizes:
14
+ - 8
15
+ - 10
16
+ - 10
17
+ - 10
18
+ upsample_factors:
19
+ - 5
20
+ - 5
21
+ - 5
22
+ - 4
23
+ upsample_kernel_sizes:
24
+ - 10
25
+ - 10
26
+ - 10
27
+ - 8
28
+ latent_hidden_dim: 32
29
+ default_kernel_size: 7
30
+ delay_kernel_size: 5
31
+ init_channel: 64
32
+ res_kernel_size: 7
33
+ d_list:
34
+ - mfd
35
+ mfd:
36
+ name: MultiFrequencyDiscriminator
37
+ config:
38
+ hop_lengths:
39
+ - 32
40
+ - 64
41
+ - 128
42
+ - 256
43
+ - 512
44
+ - 1024
45
+ hidden_channels:
46
+ - 64
47
+ - 128
48
+ - 256
49
+ - 512
50
+ - 512
51
+ - 512
52
+ domain: double
53
+ mel_scale: true
54
+ sample_rate: 48000
55
+ mpd:
56
+ name: MultiPeriodDiscriminator
57
+ config:
58
+ period_sizes:
59
+ - 2
60
+ - 3
61
+ - 5
62
+ - 7
63
+ - 11
64
+ period_kernel_size: 5
65
+ msd:
66
+ name: MultiScaleDiscriminator
67
+ config:
68
+ num_scales: 3
69
+ pool_kernel_size: 4
70
+ pool_stride: 2
71
+ optimizer:
72
+ g:
73
+ name: AdamW
74
+ config:
75
+ lr: 0.0002
76
+ betas:
77
+ - 0.8
78
+ - 0.99
79
+ eps: 1.0e-06
80
+ d:
81
+ name: AdamW
82
+ config:
83
+ lr: 0.0002
84
+ betas:
85
+ - 0.8
86
+ - 0.99
87
+ eps: 1.0e-06
88
+ lr_scheduler:
89
+ g:
90
+ name: ExponentialLR
91
+ config:
92
+ gamma: 0.999
93
+ d:
94
+ name: ExponentialLR
95
+ config:
96
+ gamma: 0.999
97
+ criterion:
98
+ g_criterion:
99
+ name: losses.generator_loss.GeneratorSTFTLoss
100
+ config:
101
+ use_mel_loss: false
102
+ adv_criterion: MSEGLoss
103
+ mel_loss_weight: 45
104
+ use_feature_match: true
105
+ feat_match_loss_weight: 20
106
+ use_full_stft_loss: true
107
+ use_sub_stft_loss: true
108
+ full_stft_loss_weight: 1
109
+ sub_stft_loss_weight: 1
110
+ mel_scale_loss:
111
+ sampling_rate: 48000
112
+ n_fft: 1024
113
+ num_mels: 80
114
+ hop_size: 160
115
+ win_size: 800
116
+ fmin: 0
117
+ full_multi_scale_stft_loss:
118
+ fft_sizes:
119
+ - 512
120
+ - 1024
121
+ - 2048
122
+ win_sizes:
123
+ - 480
124
+ - 960
125
+ - 1200
126
+ hop_sizes:
127
+ - 120
128
+ - 240
129
+ - 300
130
+ sub_multi_scale_stft_loss:
131
+ num_bands: 6
132
+ fft_sizes:
133
+ - 128
134
+ - 256
135
+ - 256
136
+ win_sizes:
137
+ - 80
138
+ - 120
139
+ - 200
140
+ hop_sizes:
141
+ - 20
142
+ - 40
143
+ - 50
144
+ d_criterion:
145
+ name: losses.discriminator_loss.MSEDiscriminatorLoss
146
+ config: null
147
+ commit_loss_weight: 1.0
148
+ training_file: train.scp
149
+ validation_file: val.scp
150
+ seed: 2333
151
+ cudnn_deterministic: false
152
+ tensorboard: true
153
+ checkpoint_interval: 5000
154
+ summary_interval: 100
155
+ validation_interval: 5000
156
+ num_epoches: 500
157
+ print_freq: 10
158
+ discriminator_iter_start: 0
159
+ num_ckpt_keep: 10
160
+ segment_size: 48000
161
+ audio_norm_scale: 0.95
162
+ batch_size: 12
163
+ num_workers: 8
164
+ num_plots: 8
165
+ local_rank: -1
166
+ basic_model_config: config/scalar48k.yaml
167
+ exp_model_config: null
168
+ log_dir: /apdcephfs/share_1316500/lavenywang/exp_data/codec/48k
169
+ hop_length: 2000
170
+ ngpus_per_node: 8
171
+ sample_rate: 48000
172
+ model_ckpt_dir: /apdcephfs/share_1316500/lavenywang/exp_data/codec/48k/model_ckpts