|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
# Seed for this run; the same number is passed to torch.manual_seed and appears in every results/RNN/2995 path in this file. |
seed: 2995 |
|
# HyperPyYAML `!apply` tag: torch.manual_seed is called with the argument list [2995] while this file is loaded. |
__set_seed: !apply:torch.manual_seed [2995] |
|
# Presumably the root directory for this run's outputs; save_folder and train_log are both located under it. |
output_folder: results/RNN/2995 |
|
# Same path as the Checkpointer's checkpoints_dir and the Pretrainer's collect_in. |
save_folder: results/RNN/2995/save |
|
# Same path as the FileTrainLogger's save_file. |
train_log: results/RNN/2995/train_log.txt |
|
|
|
|
|
|
|
|
|
# Relative path; not referenced by any other entry in this file — presumably read by the training script. TODO confirm what it is resolved against. |
data_folder: ../cv_de_acc/ |
|
|
|
|
|
|
|
|
|
# Text corpus path; not referenced by any other entry in this file. |
# NOTE(review): "orignal_data" looks like a misspelling of "original_data". This is a filesystem path, so only rename it together with the directory on disk. |
lm_corpus_path: lm_corpus/orignal_data/de_lm_normalized.txt |
|
|
|
|
|
|
|
# Same path as the `tokenizer` entry under the Pretrainer's `paths`. |
tokenizer_file: ../Tokenizer/results/unigram/1000_unigram.model |
|
|
|
|
|
# Same value as the `limit: 20` entry of the EpochCounter. |
number_of_epochs: 20 |
|
# Same value as the batch_size under train_dataloader_opts. |
batch_size: 128 |
|
# Same value as the NewBobScheduler's initial_value and the Adam optimizer's lr. |
lr: 0.001 |
|
# Not referenced elsewhere in this file — presumably a gradient-accumulation step count read by the training script; confirm. |
accu_steps: 1 |
|
# Not referenced elsewhere in this file — presumably the checkpoint-saving interval in minutes read by the training script; confirm. |
ckpt_interval_minutes: 15 |
|
|
|
|
|
# Options for the training dataloader. NOTE(review): indentation was lost in this copy; the entries up to the next *_dataloader_opts key are presumably nested under this one. |
train_dataloader_opts: |
|
# Same value as the top-level batch_size. |
batch_size: 128 |
|
shuffle: true |
|
|
|
# Options for the validation dataloader; uses a batch size of 1, unlike training (128). |
valid_dataloader_opts: |
|
batch_size: 1 |
|
|
|
# Options for the test dataloader; same batch size of 1 as validation. |
test_dataloader_opts: |
|
batch_size: 1 |
|
|
|
|
|
# Model hyperparameters. Each value here is repeated literally in the arguments listed after the RNNLM `model` entry. |
# Same value as the model's embedding_dim. |
emb_size: 128 |
|
# HyperPyYAML `!name` tag: refers to torch.nn.LeakyReLU without instantiating it; anchored as &id001 and reused by the model via *id001. |
activation: &id001 !name:torch.nn.LeakyReLU |
|
dropout: 0.0 |
|
rnn_layers: 2 |
|
rnn_neurons: 2048 |
|
dnn_blocks: 1 |
|
dnn_neurons: 512 |
|
|
|
|
|
# The tokenizer file name (1000_unigram.model) carries the same number — presumably this is the vocabulary size; confirm. |
output_neurons: 1000 |
|
|
|
# NOTE(review): bos_index and eos_index are both 0 — confirm that sharing one index for both markers is intended. |
bos_index: 0 |
|
eos_index: 0 |
|
|
|
|
|
|
|
# HyperPyYAML `!new` tag: instantiates speechbrain.lobes.models.RNNLM.RNNLM; anchored as &id002 and reused under `modules` and the checkpointer's `recoverables`. |
# NOTE(review): indentation was lost in this copy; the entries that follow are presumably the constructor keyword arguments. |
model: &id002 !new:speechbrain.lobes.models.RNNLM.RNNLM |
|
|
|
# Same value as the top-level output_neurons. |
output_neurons: 1000 |
|
# Same value as the top-level emb_size. |
embedding_dim: 128 |
|
# Alias of the &id001 anchor (torch.nn.LeakyReLU). |
activation: *id001 |
|
dropout: 0.0 |
|
rnn_layers: 2 |
|
rnn_neurons: 2048 |
|
dnn_blocks: 1 |
|
dnn_neurons: 512 |
|
|
|
# Mapping that exposes the RNNLM instance (alias *id002) under the key `model`. |
modules: |
|
model: *id002 |
|
# Instantiates speechbrain.utils.checkpoints.Checkpointer. NOTE(review): indentation was lost in this copy; checkpoints_dir and recoverables are presumably its arguments. |
checkpointer: !new:speechbrain.utils.checkpoints.Checkpointer |
|
# Same path as the top-level save_folder. |
checkpoints_dir: results/RNN/2995/save |
|
# Objects registered with the checkpointer: presumably model, scheduler and counter (nesting to be confirmed). |
recoverables: |
|
model: *id002 |
|
# Instantiates NewBobScheduler; anchored as &id003 and reused by the top-level lr_annealing entry. |
scheduler: &id003 !new:speechbrain.nnet.schedulers.NewBobScheduler |
|
# Same value as the top-level lr and the optimizer's lr. |
initial_value: 0.001 |
|
improvement_threshold: 0.0025 |
|
annealing_factor: 0.8 |
|
# `patient` is the keyword exactly as written here; confirm against the NewBobScheduler signature before renaming. |
patient: 0 |
|
|
|
# Instantiates EpochCounter; anchored as &id004 and reused by the top-level epoch_counter entry. |
counter: &id004 !new:speechbrain.utils.epoch_loop.EpochCounter |
|
|
|
# Same value as the top-level number_of_epochs. |
limit: 20 |
|
|
|
# Instantiates speechbrain.nnet.activations.Softmax with apply_log set to true. |
log_softmax: !new:speechbrain.nnet.activations.Softmax |
|
apply_log: true |
|
|
|
# HyperPyYAML `!name` tag: refers to torch.optim.Adam without instantiating it; the entries that follow are presumably its preset keyword arguments (nesting lost in this copy). |
optimizer: !name:torch.optim.Adam |
|
# Same value as the top-level lr and the scheduler's initial_value. |
lr: 0.001 |
|
betas: (0.9, 0.98) |
|
eps: 0.000000001 |
|
|
|
# Alias of the &id003 anchor (the NewBobScheduler listed under the checkpointer's recoverables). |
lr_annealing: *id003 |
|
# Alias of the &id004 anchor (the EpochCounter listed under the checkpointer's recoverables). |
epoch_counter: *id004 |
|
# `!name` reference to speechbrain.nnet.losses.nll_loss; no arguments are preset here. |
compute_cost: !name:speechbrain.nnet.losses.nll_loss |
|
|
|
# Instantiates speechbrain.utils.train_logger.FileTrainLogger. |
train_logger: !new:speechbrain.utils.train_logger.FileTrainLogger |
|
# Same path as the top-level train_log. |
save_file: results/RNN/2995/train_log.txt |
|
|
|
# Instantiates sentencepiece.SentencePieceProcessor with no arguments listed; anchored as &id005 and reused under the Pretrainer's loadables. |
tokenizer: &id005 !new:sentencepiece.SentencePieceProcessor |
|
|
|
# Instantiates speechbrain.utils.parameter_transfer.Pretrainer. NOTE(review): indentation was lost in this copy; collect_in, loadables and paths are presumably its arguments. |
pretrainer: !new:speechbrain.utils.parameter_transfer.Pretrainer |
|
# Same path as the top-level save_folder. |
collect_in: results/RNN/2995/save |
|
# Maps the name `tokenizer` to the SentencePieceProcessor instance (alias *id005). |
loadables: |
|
tokenizer: *id005 |
|
# Maps the same name `tokenizer` to the file to load; same path as the top-level tokenizer_file. |
paths: |
|
tokenizer: ../Tokenizer/results/unigram/1000_unigram.model |
|
|