File size: 5,521 Bytes
885eaab
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
147
148
149
150
151
152
153
154
155
156
157
158
159
160
161
162
163
164
165
166
167
168
169
170
171
172
173
# Top-level run settings. Keys in this file are listed alphabetically, not grouped by purpose.
# NOTE(review): `additional_config` and `config` are relative paths; presumably they are resolved
# against the directory the job is launched from - confirm with the consumer.
additional_config: conf/vtn.tts_pt.v1.ppg_sxliu.yaml
allow_cache: true
batch_size: 16
cleaner: tacotron
collater_type: ARVCCollater
# Lives in the same experiment directory that `outdir` names (exp/TXHC_bdl_1032_debug).
config: exp/TXHC_bdl_1032_debug/original_config.yml
# Loss settings; presumably keyed by criterion name (here only `Seq2SeqLoss`) - TODO confirm.
# NOTE(review): `bce_pos_weight: 10.0` also appears under the top-level `seq2seq_loss_params`
# key. Check which of the two the trainer actually reads and keep both values in sync.
criterions:
  Seq2SeqLoss:
    bce_pos_weight: 10.0
# Development-set inputs. `dev_dp_input_dir` and `dev_duration_dir` are explicit YAML nulls.
dev_dp_input_dir: null
dev_dumpdir: dump/dev/ppg_sxliu_norm
dev_duration_dir: null
dev_text: data/dev/text
distributed: false
eval_interval_steps: 500
# Same value as `src_feat_type` and `trg_feat_type` elsewhere in this file.
feat_type: ppg_sxliu
# NOTE(review): fft_size / fmax / fmin (and hop_size below) look like spectral-analysis
# settings. Units are not stated in this file - presumably samples and Hz; confirm against
# the feature extractor.
fft_size: 1024
fmax: 7600
fmin: 80
format: hdf5
# Kebab-case key (like `init-mods`), unlike the snake_case keys around it. Renaming it would
# change the key the consumer sees, so leave it as is unless the reader is updated too.
freeze-mods: null
g2p: g2p_en
global_gain_scale: 1.0
grad_norm: 1.0
hop_size: 256
# Settings grouped under `inference`; all three values are floats.
# NOTE(review): the names suggest output-length bounds expressed as ratios of the input length
# plus a stop-decision cut-off - presumably; verify against the decoding code.
inference:
  maxlenratio: 6.0
  minlenratio: 0.0
  threshold: 0.5
# List of five module names. NOTE(review): presumably these are the sub-modules whose weights
# are taken from `init_checkpoint` below - TODO confirm in the trainer.
# The list uses the flush (`- item` at the key's own indent) sequence style, the same style
# used by the sequences under `stats`; keep new entries consistent with it.
init-mods:
- encoder
- decoder
- feat_out
- prob_out
- postnet
# Checkpoint file inside the experiment directory named by `outdir`.
init_checkpoint: exp/TXHC_bdl_1032_debug/original_checkpoint-50000steps.pkl
log_interval_steps: 10
# Hyper-parameters, presumably for the model selected by `model_type` (VTN) - TODO confirm.
# `idim` and `odim` are both 144, which matches the 144-element shape recorded for the
# `stats.mean` and `stats.scale` arrays in this file; change them together.
model_params:
  adim: 384
  aheads: 4
  decoder_concat_after: false
  decoder_normalize_before: false
  decoder_reduction_factor: 2
  dlayers: 6
  dprenet_layers: 2
  dprenet_units: 256
  dunits: 1536
  elayers: 6
  encoder_concat_after: false
  # Note the asymmetry: the encoder has normalize_before enabled, the decoder does not.
  encoder_normalize_before: true
  eunits: 1536
  idim: 144
  odim: 144
  postnet_chans: 256
  postnet_filts: 5
  postnet_layers: 5
  use_batch_norm: true
model_type: VTN
# `none` is a plain string here, NOT a YAML null (nulls in this file are spelled `null`).
# NOTE(review): confirm the consumer really expects the string "none".
non_linguistic_symbols: none
num_mels: 80
num_save_intermediate_results: 4
num_workers: 2
optimizer_params:
  # Written with a decimal point and a signed exponent, so YAML 1.1 parsers such as PyYAML
  # read it as a float rather than a string.
  lr: 8.0e-05
optimizer_type: Adam
# Same experiment directory that `config`, `init_checkpoint` and `trg_stats` point into.
outdir: exp/TXHC_bdl_1032_debug
pin_memory: true
# `pretrain` and `resume` are empty strings, not nulls.
pretrain: ''
rank: 0
resume: ''
sampling_rate: 16000
save_interval_steps: 1000
# NOTE(review): presumably configured by `scheduler_params` (the next top-level key).
scheduler: warmuplr
# NOTE(review): presumably the arguments for the scheduler named by `scheduler` - TODO confirm.
scheduler_params:
  warmup_steps: 4000
# Carries the same `bce_pos_weight: 10.0` as `criterions.Seq2SeqLoss`; keep the two in sync
# until it is clear which one the trainer reads.
seq2seq_loss_params:
  bce_pos_weight: 10.0
# Source-side dump directories and feature type; the `trg_*` keys further down are the
# target-side counterparts and use the same `ppg_sxliu/norm_ljspeech` sub-path.
src_dev_dumpdir: dump/TXHC_dev/ppg_sxliu/norm_ljspeech
src_feat_type: ppg_sxliu
src_train_dumpdir: dump/TXHC_train_1032/ppg_sxliu/norm_ljspeech
# Two serialized NumPy arrays, `mean` and `scale`, stored with Python-specific YAML tags
# (`!!python/object/apply:numpy.core.multiarray._reconstruct`, `!!python/name:numpy.ndarray`,
# `!!python/object/apply:numpy.dtype`).
# - Safe YAML loaders do not construct `!!python/...` tags, so this file needs a loader that
#   can build arbitrary Python objects. Such loaders can execute code: only load this file
#   from a trusted source.
# - Each array's state records shape (144,) and dtype `f4` with byte order `<`; the array
#   contents are the base64 `!!binary` block scalars. Do not reflow, re-indent or add comments
#   inside those blocks - every character in them is data.
# - `scale` reuses the anchors `&id001` / `&id002` defined under `mean` via `*id001` /
#   `*id002`, so `mean` must stay before `scale`.
# NOTE(review): `numpy.core` is an internal NumPy module path; confirm it still resolves with
# the NumPy version in use. Presumably these are feature normalisation statistics - verify.
stats:
  mean: !!python/object/apply:numpy.core.multiarray._reconstruct
    args:
    - &id001 !!python/name:numpy.ndarray ''
    - !!python/tuple
      - 0
    - !!binary |
      Yg==
    state: !!python/tuple
    - 1
    - !!python/tuple
      - 144
    - &id002 !!python/object/apply:numpy.dtype
      args:
      - f4
      - false
      - true
      state: !!python/tuple
      - 3
      - <
      - null
      - null
      - null
      - -1
      - -1
      - 0
    - false
    - !!binary |
      6RzTPXVNQb7seW+/uWClPQCf5DwPGXQ9G1WePo3UFz6KNp4+FW29PKUMYb5cODu+UbHTPWSOQL53
      uc48guEYPn4qgT6KxCO/ER4aPgElyT4BsV6+jpz4valJYj54Z4q+di9MvkSt3z2KlVi/lI+kPVRf
      DD+rzu8+CC1svkHG2ruaX9I9tog+vniP5j2YLva8L589vhSeSL/l4PE9s+6VPJZ2szsyuQi+1Opi
      PU7OzbxdUNc/RtTqPfLVnL5ASu0+fp6mPuvjLryKgqU9p4hVu2In9T2D1ri+vAz5PHVzzz3ac+G9
      Ecu9PZx+Hj6Mrx49kWyAPfqRNj6s4WW+BjmJPlp7+L0eN1g+UzhKPMuUkr7yhl29DwY8viWowbyS
      iUe9igiJPX+YgT5CNy++JExQvirydT1kAdA9V3TjvcHclz2aklg+QtSYPahhl75+c9U9yzjjvHAm
      973nkJm9KkJEPvg9dL2KZYE+GmnxvGzyk75R9c8+KuMGvqXd6r3sxZg9Nv0jPmTSS76EHfe90mGq
      Pd2alb0BxbW+HNUcPxoIwD16mQ++PkZCvhh8jT5I6Kg/HT1pPUMkWj4dO4I9dePAu3qRqb1s/Zo+
      G+Mrvf4WIz+DW7o+yHIePsTqRry9aGk+HVjvPRnqc7xE9S495SlKvOMueD9qdKG+kabJvaV17z3B
      Q5g8VVjYuvwZbz22gwi+B98XPSBKIz8+dVc+Gq+FPcAYlr301Vw9L0y2vQj5pL36o9Q+sgqHPs++
      3z1xMCQ/
  scale: !!python/object/apply:numpy.core.multiarray._reconstruct
    args:
    - *id001
    - !!python/tuple
      - 0
    - !!binary |
      Yg==
    state: !!python/tuple
    - 1
    - !!python/tuple
      - 144
    - *id002
    - false
    - !!binary |
      OanzPqWL3T4RC9M+kg0VP0g2ED8rY/E+UDTvPrfl2T7xOOA+C97MPp688D4/LvE+r3rbPgGi5z47
      MNI+VOHEPgbm2D5gJs0+higRP8sS5z7TvQY/y8rXPnlO1j42lvg++sr0PocB5D5JMtU+2mj0PkBu
      HD8joiU/1ibePq5jyD4ReO4+CE7YPgbv6j79B7s+euHxPobUxz7c8vc+DhicP9qf6z4SVQA/UpHx
      Pu6tzD7MChM/1wj3Po76xz4WyEY/wtvdPkRM6T7xdfg+YGXfPnrHAj984tQ+EFTqPqSQCz+O3RI/
      Osq/PsgW1j4aDts+Obr9Ppw45z7nNOU+J9DyPt4D+T468Ao/jzEaP9Fq5j7Gb+U+NALCPrPy3j7U
      BA8/Nl73PiCq0T5qr+Y+FaQVP8+d5j5Ave0+jx7oPlKI6j4q5+U+f//IPqW6DD+UWSE/3WPJPix+
      2D4+kgU/TnYWP7GX1z55iOo+qHP1PgIh3D6zgD4/MHEJP7zp1z5Aqtw+k1X2Pvynyj5PJ88+lhjX
      PrSi2j5F9fk+du3ZPggsyD6yNNE+lmrDPujPNz8Kscc+mx/0Ppaw/T5UoOk+pjHpPgpgxz5flAI/
      MnjSPo190j7X2t8+gmvpPlgnFD9q0CY/u8oQP4ER+D536dc+9LfJPnkQAD/rKMI+i4YIP7xyBz+B
      nf0+VcTKPqbVAT/ck+I+9uTePhdvAz/UGuo+ahfTPt0/9D7shcQ++VnSPphNzz4Ewvk+DlAoP+91
      9j4qV/4+
token_list: exp/phn_tacotron_transformer_tts.v1.ppg_sxliu/tokens.txt
token_type: phn
# Training-set inputs; as with the `dev_*` keys, the two `*_dir` entries are explicit nulls.
train_dp_input_dir: null
train_dumpdir: dump/train_no_dev/ppg_sxliu_norm
train_duration_dir: null
# Equal to the step count in the `init_checkpoint` file name (checkpoint-50000steps).
# NOTE(review): confirm whether the step counter restarts when initialising from it.
train_max_steps: 50000
train_text: data/train_no_dev/text
trainer_type: ARVCTrainer
# Target-side counterparts of the `src_*` keys. `trg_stats` is an HDF5 file inside `outdir`.
trg_dev_dumpdir: dump/bdl_dev/ppg_sxliu/norm_ljspeech
trg_feat_type: ppg_sxliu
trg_stats: exp/TXHC_bdl_1032_debug/stats.h5
trg_train_dumpdir: dump/bdl_train_1032/ppg_sxliu/norm_ljspeech
# Trimming parameters; `trim_silence` is false. NOTE(review): presumably the other trim_*
# values are unused while it is false - confirm.
trim_frame_size: 2048
trim_hop_size: 512
trim_silence: false
trim_threshold_in_db: 60
verbose: 1
# Two dots, so this parses as the string "0.1.0", not a number.
version: 0.1.0
# Vocoder assets. All three paths are absolute and machine-specific (/data/group1/...), so
# they must be edited before this config is used on another machine.
vocoder:
  # Disabled alternative: the same three keys pointing at an s3prl-vc experiment directory.
  # Kept for reference; swap with the active keys below to use it.
  # checkpoint: /data/group1/z44476r/Experiments/s3prl-vc/egs/l2-arctic/a2o_vc/exp/TXHC_ppg_sxliu_taco2_ar/checkpoint-10000steps.pkl
  # config: /data/group1/z44476r/Experiments/s3prl-vc/egs/l2-arctic/a2o_vc/exp/TXHC_ppg_sxliu_taco2_ar/config.yml
  # stats: /data/group1/z44476r/Experiments/s3prl-vc/egs/l2-arctic/a2o_vc/exp/TXHC_ppg_sxliu_taco2_ar/stats.h5
  # Active entries: checkpoint, config and stats all come from one download directory.
  checkpoint: /data/group1/z44476r/Experiments/seq2seq-vc/egs/l2-arctic/lsc/downloads/ppg_sxliu_decoder_plus_pwg_THXC/checkpoint-10000steps.pkl
  config: /data/group1/z44476r/Experiments/seq2seq-vc/egs/l2-arctic/lsc/downloads/ppg_sxliu_decoder_plus_pwg_THXC/config.yml
  stats: /data/group1/z44476r/Experiments/seq2seq-vc/egs/l2-arctic/lsc/downloads/ppg_sxliu_decoder_plus_pwg_THXC/stats.h5
  vocoder_type: s3prl_vc
# Explicit null. NOTE(review): presumably the consumer falls back to another value (e.g.
# `fft_size`) when this is unset - confirm.
win_length: null
window: hann