|
{ |
|
"best_metric": null, |
|
"best_model_checkpoint": null, |
|
"epoch": 3.0, |
|
"eval_steps": 500, |
|
"global_step": 243, |
|
"is_hyper_param_search": false, |
|
"is_local_process_zero": true, |
|
"is_world_process_zero": true, |
|
"log_history": [ |
|
{ |
|
"epoch": 1.0, |
|
"eval_B-Claim": { |
|
"f1-score": 0.17153996101364524, |
|
"precision": 0.25287356321839083, |
|
"recall": 0.12979351032448377, |
|
"support": 339.0 |
|
}, |
|
"eval_B-MajorClaim": { |
|
"f1-score": 0.08383233532934131, |
|
"precision": 1.0, |
|
"recall": 0.04375, |
|
"support": 160.0 |
|
}, |
|
"eval_B-Premise": { |
|
"f1-score": 0.8469620831429876, |
|
"precision": 0.7427884615384616, |
|
"recall": 0.9851222104144527, |
|
"support": 941.0 |
|
}, |
|
"eval_I-Claim": { |
|
"f1-score": 0.5420081967213116, |
|
"precision": 0.6803858520900321, |
|
"recall": 0.4504044274159217, |
|
"support": 4698.0 |
|
}, |
|
"eval_I-MajorClaim": { |
|
"f1-score": 0.8343351767251743, |
|
"precision": 0.8141717503519474, |
|
"recall": 0.8555226824457594, |
|
"support": 2028.0 |
|
}, |
|
"eval_I-Premise": { |
|
"f1-score": 0.9004323458767015, |
|
"precision": 0.8590809093131264, |
|
"recall": 0.9459659511472983, |
|
"support": 14861.0 |
|
}, |
|
"eval_O": { |
|
"f1-score": 0.9988389078242631, |
|
"precision": 0.9991008541885209, |
|
"recall": 0.9985770987793006, |
|
"support": 13353.0 |
|
}, |
|
"eval_accuracy": 0.8856789444749863, |
|
"eval_loss": 0.28347474336624146, |
|
"eval_macro avg": { |
|
"f1-score": 0.6254212866619178, |
|
"precision": 0.76405734152864, |
|
"recall": 0.629876554361031, |
|
"support": 36380.0 |
|
}, |
|
"eval_runtime": 5.0448, |
|
"eval_samples_per_second": 16.056, |
|
"eval_steps_per_second": 2.18, |
|
"eval_weighted avg": { |
|
"f1-score": 0.8748148382495958, |
|
"precision": 0.8768575102351055, |
|
"recall": 0.8856789444749863, |
|
"support": 36380.0 |
|
}, |
|
"step": 81 |
|
}, |
|
{ |
|
"epoch": 2.0, |
|
"eval_B-Claim": { |
|
"f1-score": 0.5137931034482759, |
|
"precision": 0.6182572614107884, |
|
"recall": 0.43952802359882004, |
|
"support": 339.0 |
|
}, |
|
"eval_B-MajorClaim": { |
|
"f1-score": 0.7622641509433963, |
|
"precision": 0.9619047619047619, |
|
"recall": 0.63125, |
|
"support": 160.0 |
|
}, |
|
"eval_B-Premise": { |
|
"f1-score": 0.8853910477127397, |
|
"precision": 0.8241758241758241, |
|
"recall": 0.9564293304994687, |
|
"support": 941.0 |
|
}, |
|
"eval_I-Claim": { |
|
"f1-score": 0.5413588470388762, |
|
"precision": 0.6279853891542568, |
|
"recall": 0.47573435504469985, |
|
"support": 4698.0 |
|
}, |
|
"eval_I-MajorClaim": { |
|
"f1-score": 0.7949260042283298, |
|
"precision": 0.856492027334852, |
|
"recall": 0.7416173570019724, |
|
"support": 2028.0 |
|
}, |
|
"eval_I-Premise": { |
|
"f1-score": 0.9007064868336545, |
|
"precision": 0.8614779777627618, |
|
"recall": 0.9436780835744566, |
|
"support": 14861.0 |
|
}, |
|
"eval_O": { |
|
"f1-score": 0.9988389947942025, |
|
"precision": 0.9990260713215463, |
|
"recall": 0.9986519883172321, |
|
"support": 13353.0 |
|
}, |
|
"eval_accuracy": 0.8864211105002748, |
|
"eval_loss": 0.2809496521949768, |
|
"eval_macro avg": { |
|
"f1-score": 0.7710398049999251, |
|
"precision": 0.8213313304378275, |
|
"recall": 0.7409841625766643, |
|
"support": 36380.0 |
|
}, |
|
"eval_runtime": 5.0579, |
|
"eval_samples_per_second": 16.014, |
|
"eval_steps_per_second": 2.175, |
|
"eval_weighted avg": { |
|
"f1-score": 0.8798131143596267, |
|
"precision": 0.8787439244541853, |
|
"recall": 0.8864211105002748, |
|
"support": 36380.0 |
|
}, |
|
"step": 162 |
|
}, |
|
{ |
|
"epoch": 3.0, |
|
"eval_B-Claim": { |
|
"f1-score": 0.6401137980085349, |
|
"precision": 0.6181318681318682, |
|
"recall": 0.6637168141592921, |
|
"support": 339.0 |
|
}, |
|
"eval_B-MajorClaim": { |
|
"f1-score": 0.7918781725888324, |
|
"precision": 0.6666666666666666, |
|
"recall": 0.975, |
|
"support": 160.0 |
|
}, |
|
"eval_B-Premise": { |
|
"f1-score": 0.8866442199775534, |
|
"precision": 0.93935790725327, |
|
"recall": 0.8395324123273114, |
|
"support": 941.0 |
|
}, |
|
"eval_I-Claim": { |
|
"f1-score": 0.6254390633315594, |
|
"precision": 0.6255056418990845, |
|
"recall": 0.6253724989357173, |
|
"support": 4698.0 |
|
}, |
|
"eval_I-MajorClaim": { |
|
"f1-score": 0.76480605487228, |
|
"precision": 0.6205096714768191, |
|
"recall": 0.9965483234714004, |
|
"support": 2028.0 |
|
}, |
|
"eval_I-Premise": { |
|
"f1-score": 0.9049205625504156, |
|
"precision": 0.9449897450922942, |
|
"recall": 0.868111163447951, |
|
"support": 14861.0 |
|
}, |
|
"eval_O": { |
|
"f1-score": 0.9988758992805756, |
|
"precision": 0.9995500562429697, |
|
"recall": 0.9982026510896428, |
|
"support": 13353.0 |
|
}, |
|
"eval_accuracy": 0.8894997251236944, |
|
"eval_loss": 0.318760484457016, |
|
"eval_macro avg": { |
|
"f1-score": 0.8018111100871074, |
|
"precision": 0.7735302223947104, |
|
"recall": 0.852354837633045, |
|
"support": 36380.0 |
|
}, |
|
"eval_runtime": 5.0862, |
|
"eval_samples_per_second": 15.925, |
|
"eval_steps_per_second": 2.163, |
|
"eval_weighted avg": { |
|
"f1-score": 0.8920666591013163, |
|
"precision": 0.9012548868310761, |
|
"recall": 0.8894997251236944, |
|
"support": 36380.0 |
|
}, |
|
"step": 243 |
|
} |
|
], |
|
"logging_steps": 500, |
|
"max_steps": 4050, |
|
"num_input_tokens_seen": 0, |
|
"num_train_epochs": 50, |
|
"save_steps": 500, |
|
"total_flos": 430032772197000.0, |
|
"train_batch_size": 4, |
|
"trial_name": null, |
|
"trial_params": null |
|
} |
|
|