Theoreticallyhugo's picture
Training in progress, epoch 4, checkpoint
b8fd02d verified
raw
history blame
7.89 kB
{
"best_metric": null,
"best_model_checkpoint": null,
"epoch": 4.0,
"eval_steps": 500,
"global_step": 324,
"is_hyper_param_search": false,
"is_local_process_zero": true,
"is_world_process_zero": true,
"log_history": [
{
"epoch": 1.0,
"eval_B-Claim": {
"f1-score": 0.18764302059496568,
"precision": 0.3416666666666667,
"recall": 0.12933753943217666,
"support": 317.0
},
"eval_B-MajorClaim": {
"f1-score": 0.19540229885057472,
"precision": 0.8947368421052632,
"recall": 0.10967741935483871,
"support": 155.0
},
"eval_B-Premise": {
"f1-score": 0.8476339053562143,
"precision": 0.740909090909091,
"recall": 0.9902794653705954,
"support": 823.0
},
"eval_I-Claim": {
"f1-score": 0.4315998169894769,
"precision": 0.6394035246272028,
"recall": 0.3257366482504604,
"support": 4344.0
},
"eval_I-MajorClaim": {
"f1-score": 0.7779799818016379,
"precision": 0.7493426818580193,
"recall": 0.8088930936613056,
"support": 2114.0
},
"eval_I-Premise": {
"f1-score": 0.8948683715038855,
"precision": 0.8376057421174058,
"recall": 0.9605350187403542,
"support": 13607.0
},
"eval_O": {
"f1-score": 0.9980147987727848,
"precision": 0.9970251509961237,
"recall": 0.9990064131514769,
"support": 11071.0
},
"eval_accuracy": 0.8673183065585397,
"eval_loss": 0.3193369209766388,
"eval_macro avg": {
"f1-score": 0.6190203134099342,
"precision": 0.7429556713256817,
"recall": 0.6176379425658869,
"support": 32431.0
},
"eval_runtime": 4.9083,
"eval_samples_per_second": 16.299,
"eval_steps_per_second": 2.037,
"eval_weighted avg": {
"f1-score": 0.8489527906249091,
"precision": 0.8526967051825685,
"recall": 0.8673183065585397,
"support": 32431.0
},
"step": 81
},
{
"epoch": 2.0,
"eval_B-Claim": {
"f1-score": 0.583941605839416,
"precision": 0.6926406926406926,
"recall": 0.5047318611987381,
"support": 317.0
},
"eval_B-MajorClaim": {
"f1-score": 0.8117647058823529,
"precision": 0.745945945945946,
"recall": 0.8903225806451613,
"support": 155.0
},
"eval_B-Premise": {
"f1-score": 0.8943661971830986,
"precision": 0.8649262202043133,
"recall": 0.9258809234507898,
"support": 823.0
},
"eval_I-Claim": {
"f1-score": 0.6197740770932805,
"precision": 0.6271506009898656,
"recall": 0.6125690607734806,
"support": 4344.0
},
"eval_I-MajorClaim": {
"f1-score": 0.8298737427776589,
"precision": 0.7577178585384916,
"recall": 0.9172185430463576,
"support": 2114.0
},
"eval_I-Premise": {
"f1-score": 0.9013697613125952,
"precision": 0.9106660666066607,
"recall": 0.8922613360770192,
"support": 13607.0
},
"eval_O": {
"f1-score": 0.9961487925331883,
"precision": 0.9993636363636363,
"recall": 0.9929545659831993,
"support": 11071.0
},
"eval_accuracy": 0.887854213561099,
"eval_loss": 0.26407390832901,
"eval_macro avg": {
"f1-score": 0.8053198403745129,
"precision": 0.7997730030413723,
"recall": 0.8194198387392494,
"support": 32431.0
},
"eval_runtime": 4.9329,
"eval_samples_per_second": 16.218,
"eval_steps_per_second": 2.027,
"eval_weighted avg": {
"f1-score": 0.8876368199002541,
"precision": 0.8889201304482091,
"recall": 0.887854213561099,
"support": 32431.0
},
"step": 162
},
{
"epoch": 3.0,
"eval_B-Claim": {
"f1-score": 0.5895522388059701,
"precision": 0.7214611872146118,
"recall": 0.49842271293375395,
"support": 317.0
},
"eval_B-MajorClaim": {
"f1-score": 0.8668941979522183,
"precision": 0.9202898550724637,
"recall": 0.8193548387096774,
"support": 155.0
},
"eval_B-Premise": {
"f1-score": 0.8929178470254956,
"precision": 0.8365180467091295,
"recall": 0.9574726609963548,
"support": 823.0
},
"eval_I-Claim": {
"f1-score": 0.6548140728684112,
"precision": 0.7178149876475433,
"recall": 0.6019797421731123,
"support": 4344.0
},
"eval_I-MajorClaim": {
"f1-score": 0.8815622622368754,
"precision": 0.9502460360852925,
"recall": 0.8221381267738883,
"support": 2114.0
},
"eval_I-Premise": {
"f1-score": 0.9169943670953343,
"precision": 0.8852257181942544,
"recall": 0.9511280958330272,
"support": 13607.0
},
"eval_O": {
"f1-score": 0.9984170774727511,
"precision": 0.9998188405797102,
"recall": 0.9970192394544305,
"support": 11071.0
},
"eval_accuracy": 0.9067250470229101,
"eval_loss": 0.25323203206062317,
"eval_macro avg": {
"f1-score": 0.8287360090652937,
"precision": 0.8616249530718579,
"recall": 0.8067879166963207,
"support": 32431.0
},
"eval_runtime": 4.9025,
"eval_samples_per_second": 16.318,
"eval_steps_per_second": 2.04,
"eval_weighted avg": {
"f1-score": 0.9033110548907601,
"precision": 0.9034896128542845,
"recall": 0.9067250470229101,
"support": 32431.0
},
"step": 243
},
{
"epoch": 4.0,
"eval_B-Claim": {
"f1-score": 0.6806136680613668,
"precision": 0.61,
"recall": 0.7697160883280757,
"support": 317.0
},
"eval_B-MajorClaim": {
"f1-score": 0.8861538461538462,
"precision": 0.8470588235294118,
"recall": 0.9290322580645162,
"support": 155.0
},
"eval_B-Premise": {
"f1-score": 0.8687258687258688,
"precision": 0.9233926128590971,
"recall": 0.8201701093560145,
"support": 823.0
},
"eval_I-Claim": {
"f1-score": 0.656155854589275,
"precision": 0.5819380121125757,
"recall": 0.7520718232044199,
"support": 4344.0
},
"eval_I-MajorClaim": {
"f1-score": 0.8818897637795275,
"precision": 0.8408408408408409,
"recall": 0.9271523178807947,
"support": 2114.0
},
"eval_I-Premise": {
"f1-score": 0.8829758349171871,
"precision": 0.9349433218334154,
"recall": 0.836481222899978,
"support": 13607.0
},
"eval_O": {
"f1-score": 0.9971017118014671,
"precision": 0.9998183634547271,
"recall": 0.9943997832174148,
"support": 11071.0
},
"eval_accuracy": 0.8843698930036077,
"eval_loss": 0.2791365385055542,
"eval_macro avg": {
"f1-score": 0.8362309354326484,
"precision": 0.8197131392328668,
"recall": 0.8612890861358877,
"support": 32431.0
},
"eval_runtime": 4.9234,
"eval_samples_per_second": 16.249,
"eval_steps_per_second": 2.031,
"eval_weighted avg": {
"f1-score": 0.889158243622726,
"precision": 0.8997827813567029,
"recall": 0.8843698930036077,
"support": 32431.0
},
"step": 324
}
],
"logging_steps": 500,
"max_steps": 4050,
"num_input_tokens_seen": 0,
"num_train_epochs": 50,
"save_steps": 500,
"total_flos": 575163250872000.0,
"train_batch_size": 4,
"trial_name": null,
"trial_params": null
}