{
  "class_token_index": 128002,
  "dropout": 0.1,
  "encoder_config": null,
  "ent_token": "<<ENT>>",
  "eval_every": 2500,
  "fine_tune": true,
  "freeze_token_rep": false,
  "gpu": "pds@a100",
  "has_rnn": true,
  "hidden_size": 768,
  "log_dir": "/gpfsdswork/projects/rech/bwq/upa43yu/gliner-pip/train_gliner/token_gliner_ft_logs/deberta-v3-base_0",
  "loss_alpha": -1,
  "loss_gamma": 0,
  "loss_reduction": "sum",
  "lr_encoder": "1e-6",
  "lr_others": "1e-6",
  "max_len": 384,
  "max_neg_type_ratio": 1,
  "max_types": 25,
  "max_width": 100,
  "model_name": "microsoft/deberta-v3-base",
  "model_type": "gliner",
  "name": "token level gliner",
  "num_steps": 30000,
  "prev_path": "/gpfswork/rech/bwq/upa43yu/gliner-pip/train_gliner/token_gliner_logs/deberta-v3-base_4/model_30000",
  "random_drop": true,
  "root_dir": "token_gliner_ft_logs",
  "run_time": "3:30:00",
  "scheduler_type": "cosine",
  "sep_token": "<<SEP>>",
  "shuffle_types": true,
  "size_sup": -1,
  "span_mode": "token_level",
  "subtoken_pooling": "first",
  "train_batch_size": 8,
  "train_data": "/gpfswork/rech/bwq/upa43yu/gliner-pip/train_gliner/train_new.json",
  "transformers_version": "4.38.2",
  "val_data_dir": "/gpfswork/rech/ohy/upa43yu/NER_datasets",
  "vocab_size": 128004,
  "warmup_ratio": 0.1,
  "weight_decay_encoder": 0.01,
  "weight_decay_other": 0.01,
  "words_splitter_type": "whitespace"
}