Upload ljspeech_transformer_tts_aept/config.yml with huggingface_hub
Browse files
ljspeech_transformer_tts_aept/config.yml
ADDED
@@ -0,0 +1,151 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
additional_config: conf/tts_aept.v1.yaml
|
2 |
+
allow_cache: true
|
3 |
+
batch_size: 100
|
4 |
+
cleaner: tacotron
|
5 |
+
config: exp/tts_aept_phn_tacotron_lr8e-04_wu4k_r2_eos_bs128_checkpoint-86000steps/original_config.yaml
|
6 |
+
dev_dumpdir: dump/dev/norm
|
7 |
+
dev_text: data/dev/text
|
8 |
+
distributed: false
|
9 |
+
eval_interval_steps: 100
|
10 |
+
fft_size: 1024
|
11 |
+
fmax: 7600
|
12 |
+
fmin: 80
|
13 |
+
format: hdf5
|
14 |
+
freeze-mods:
|
15 |
+
- decoder
|
16 |
+
- feat_out
|
17 |
+
- prob_out
|
18 |
+
- postnet
|
19 |
+
g2p: g2p_en
|
20 |
+
global_gain_scale: 0.95
|
21 |
+
grad_norm: 1.0
|
22 |
+
hop_size: 256
|
23 |
+
inference:
|
24 |
+
maxlenratio: 2.0
|
25 |
+
minlenratio: 0.0
|
26 |
+
threshold: 0.5
|
27 |
+
init-mods:
|
28 |
+
- decoder
|
29 |
+
- feat_out
|
30 |
+
- prob_out
|
31 |
+
- postnet
|
32 |
+
init_checkpoint: exp/tts_aept_phn_tacotron_lr8e-04_wu4k_r2_eos_bs128_checkpoint-86000steps/original_checkpoint-86000steps.pkl
|
33 |
+
log_interval_steps: 10
|
34 |
+
model_params:
|
35 |
+
adim: 384
|
36 |
+
aheads: 4
|
37 |
+
decoder_concat_after: false
|
38 |
+
decoder_normalize_before: false
|
39 |
+
decoder_reduction_factor: 2
|
40 |
+
dlayers: 6
|
41 |
+
dprenet_layers: 2
|
42 |
+
dprenet_units: 256
|
43 |
+
dunits: 1536
|
44 |
+
elayers: 6
|
45 |
+
encoder_concat_after: false
|
46 |
+
encoder_normalize_before: true
|
47 |
+
eunits: 1536
|
48 |
+
idim: 80
|
49 |
+
odim: 80
|
50 |
+
postnet_chans: 256
|
51 |
+
postnet_filts: 5
|
52 |
+
postnet_layers: 5
|
53 |
+
use_batch_norm: true
|
54 |
+
model_type: VTN
|
55 |
+
non_linguistic_symbols: none
|
56 |
+
num_mels: 80
|
57 |
+
num_save_intermediate_results: 4
|
58 |
+
num_workers: 2
|
59 |
+
optimizer_params:
|
60 |
+
lr: 0.0008
|
61 |
+
optimizer_type: Adam
|
62 |
+
outdir: exp/tts_aept_phn_tacotron_lr8e-04_wu4k_r2_eos_bs128_checkpoint-86000steps
|
63 |
+
pin_memory: true
|
64 |
+
pretrain: ''
|
65 |
+
rank: 0
|
66 |
+
resume: ''
|
67 |
+
sampling_rate: 16000
|
68 |
+
save_interval_steps: 1000
|
69 |
+
scheduler: warmuplr
|
70 |
+
scheduler_params:
|
71 |
+
warmup_steps: 4000
|
72 |
+
seq2seq_loss_params:
|
73 |
+
bce_pos_weight: 10.0
|
74 |
+
src_dev_dumpdir: dump/dev/norm
|
75 |
+
src_feat_type: mel
|
76 |
+
src_train_dumpdir: dump/train_no_dev/norm
|
77 |
+
stats:
|
78 |
+
mean: !!python/object/apply:numpy.core.multiarray._reconstruct
|
79 |
+
args:
|
80 |
+
- &id001 !!python/name:numpy.ndarray ''
|
81 |
+
- !!python/tuple
|
82 |
+
- 0
|
83 |
+
- !!binary |
|
84 |
+
Yg==
|
85 |
+
state: !!python/tuple
|
86 |
+
- 1
|
87 |
+
- !!python/tuple
|
88 |
+
- 80
|
89 |
+
- &id002 !!python/object/apply:numpy.dtype
|
90 |
+
args:
|
91 |
+
- f4
|
92 |
+
- false
|
93 |
+
- true
|
94 |
+
state: !!python/tuple
|
95 |
+
- 3
|
96 |
+
- <
|
97 |
+
- null
|
98 |
+
- null
|
99 |
+
- null
|
100 |
+
- -1
|
101 |
+
- -1
|
102 |
+
- 0
|
103 |
+
- false
|
104 |
+
- !!binary |
|
105 |
+
uCcJwJgR6b8mW8i/AqbEvxauxr+NKse/N6jHvytBx7/vdse/HKm6vwDiu79Uqb2/p0TDvxdgy78k
|
106 |
+
kte/Xd7dv+GN4L/PK+e/Mejvv2Uc+b8aqgHAqXwGwPwDCMCsKQnAc2UKwMtPDMCAfQzAZw0RwABs
|
107 |
+
EsDMIhXA8fgXwJSCGsAm8xvAlWAdwDikHcBZyRrA8G0YwAXmFcCKGhXA9iYUwCbUEsBLwxHA3QcU
|
108 |
+
wJIXF8C7+BrAKSQewBa5IMARwyHAJAwhwB6dIMDxHh/AvbUdwM1mG8CfQRnAvOUYwFuOGsD58hzA
|
109 |
+
43sewA1aH8CKqx7Aw8sdwJYFHsCw9x7A8SAhwOs6I8Bf7CTAx5UmwBgVKMAZYCnABEMtwMzxM8BD
|
110 |
+
qTvAJm9BwOxVRcAt2EXA1eJEwKxhQcCR7jvAbdQ4wE6NRMA=
|
111 |
+
scale: !!python/object/apply:numpy.core.multiarray._reconstruct
|
112 |
+
args:
|
113 |
+
- *id001
|
114 |
+
- !!python/tuple
|
115 |
+
- 0
|
116 |
+
- !!binary |
|
117 |
+
Yg==
|
118 |
+
state: !!python/tuple
|
119 |
+
- 1
|
120 |
+
- !!python/tuple
|
121 |
+
- 80
|
122 |
+
- *id002
|
123 |
+
- false
|
124 |
+
- !!binary |
|
125 |
+
DP3YPtefJj/bkUY/XPhDP5TSNz+WMjY/rUpGP3CyTD9GiE0/VthAPzDZQj8p0EI/5f1EP764QD94
|
126 |
+
ZEA/ReZCPwz8Qz95UUI/NkNAPzNtPz9gUUU/bHZEP0JDQz/oekU/+XtFP+rMQz8MWkA/Vo1AP5eL
|
127 |
+
Pz/urDs/lF4+PzP4QD8Of0E/dX5AP9byPj/JPzw/8Iw8P2qIPj+1tD8/o6BAP/UWQT9askA/13k+
|
128 |
+
P9vaOj9uMjg/Nws3P9FUNz+lWjg/a+c7P7LtQD8AIkM/ED1FP91FRT9RiEc/N5NKP9GBRz8qz0E/
|
129 |
+
0lo8Pz+DOT9Kzzo//qo8PwrzPT/e8EA/4PtEP74YSD+z00g/MLlIP++vSj/ZnE4/nvVSPzduVz+G
|
130 |
+
VF4/q8llP9/lbT+d4HE/+wxvPz0JbT+6Um0/kXJuP580bz8=
|
131 |
+
token_list: exp/phn_tacotron_lr8e-04_wu4k_r2_eos_bs128/tokens.txt
|
132 |
+
token_type: phn
|
133 |
+
train_dumpdir: dump/train_no_dev/norm
|
134 |
+
train_max_steps: 50000
|
135 |
+
train_text: data/train_no_dev/text
|
136 |
+
trg_dev_dumpdir: dump/dev/norm
|
137 |
+
trg_feat_type: mel
|
138 |
+
trg_stats: exp/tts_aept_phn_tacotron_lr8e-04_wu4k_r2_eos_bs128_checkpoint-86000steps/stats.h5
|
139 |
+
trg_train_dumpdir: dump/train_no_dev/norm
|
140 |
+
trim_frame_size: 2048
|
141 |
+
trim_hop_size: 512
|
142 |
+
trim_silence: false
|
143 |
+
trim_threshold_in_db: 60
|
144 |
+
verbose: 1
|
145 |
+
version: 0.1.0
|
146 |
+
vocoder: null
|
147 |
+
win_length: null
|
148 |
+
window: hann
|
149 |
+
feat_list:
|
150 |
+
mel: {}
|
151 |
+
trg_feat: "mel"
|