distilbert-fa-pos-lscp-500k / train / train_config.yaml
pooya-mohammadi's picture
Hezar: Upload training files
d2015ef
raw
history blame
393 Bytes
# Trainer configuration for a run initialised from hezarai/distilbert-base-fa.
# Nested mappings use 2-space indentation; keeping `name` and `config_type`
# inside their parent sections prevents them from colliding with (and
# overriding) the top-level `config_type: trainer`.
config_type: trainer
device: cuda
# Identifier of the weights to start from (presumably a Hub model id — confirm
# against the consuming trainer).
init_weights_from: hezarai/distilbert-base-fa
num_dataloader_workers: 4
seed: 42

# Optimizer section; the LR scheduler is configured as a child of the optimizer.
optimizer:
  name: adam
  config_type: OPTIMIZER
  lr: 2.0e-05
  weight_decay: 0.0
  scheduler:
    name: reduce_on_plateau
    config_type: LR_SCHEDULER
    verbose: true

batch_size: 64
# Mixed precision is disabled (assuming `use_amp` means automatic mixed
# precision — TODO confirm with the trainer implementation).
use_amp: false
# Evaluation metrics, referenced by name.
metrics:
- seqeval
num_epochs: 3
# NOTE(review): unit of save_freq (epochs vs. steps) is not visible here —
# verify against the trainer.
save_freq: 1
checkpoints_dir: checkpoints/