nerugm-pt-pl20-2 / trainer_state.json
apwic's picture
End of training
f076397 verified
{
"best_metric": null,
"best_model_checkpoint": null,
"epoch": 100.0,
"eval_steps": 500,
"global_step": 10600,
"is_hyper_param_search": false,
"is_local_process_zero": true,
"is_world_process_zero": true,
"log_history": [
{
"epoch": 1.0,
"grad_norm": 1.6106630563735962,
"learning_rate": 4.9500000000000004e-05,
"loss": 0.9915,
"step": 106
},
{
"epoch": 1.0,
"eval_LOCATION_f1": 0.0,
"eval_LOCATION_number": 72,
"eval_LOCATION_precision": 0.0,
"eval_LOCATION_recall": 0.0,
"eval_ORGANIZATION_f1": 0.0,
"eval_ORGANIZATION_number": 75,
"eval_ORGANIZATION_precision": 0.0,
"eval_ORGANIZATION_recall": 0.0,
"eval_PERSON_f1": 0.025157232704402517,
"eval_PERSON_number": 143,
"eval_PERSON_precision": 0.125,
"eval_PERSON_recall": 0.013986013986013986,
"eval_QUANTITY_f1": 0.0,
"eval_QUANTITY_number": 23,
"eval_QUANTITY_precision": 0.0,
"eval_QUANTITY_recall": 0.0,
"eval_TIME_f1": 0.0,
"eval_TIME_number": 26,
"eval_TIME_precision": 0.0,
"eval_TIME_recall": 0.0,
"eval_loss": 0.5523906946182251,
"eval_overall_accuracy": 0.8478859144358268,
"eval_overall_f1": 0.010869565217391304,
"eval_overall_precision": 0.06896551724137931,
"eval_overall_recall": 0.0058997050147492625,
"eval_runtime": 0.3759,
"eval_samples_per_second": 497.497,
"eval_steps_per_second": 7.981,
"step": 106
},
{
"epoch": 2.0,
"grad_norm": 1.0314005613327026,
"learning_rate": 4.9e-05,
"loss": 0.5062,
"step": 212
},
{
"epoch": 2.0,
"eval_LOCATION_f1": 0.05063291139240506,
"eval_LOCATION_number": 72,
"eval_LOCATION_precision": 0.2857142857142857,
"eval_LOCATION_recall": 0.027777777777777776,
"eval_ORGANIZATION_f1": 0.0196078431372549,
"eval_ORGANIZATION_number": 75,
"eval_ORGANIZATION_precision": 0.037037037037037035,
"eval_ORGANIZATION_recall": 0.013333333333333334,
"eval_PERSON_f1": 0.5257142857142857,
"eval_PERSON_number": 143,
"eval_PERSON_precision": 0.4444444444444444,
"eval_PERSON_recall": 0.6433566433566433,
"eval_QUANTITY_f1": 0.0,
"eval_QUANTITY_number": 23,
"eval_QUANTITY_precision": 0.0,
"eval_QUANTITY_recall": 0.0,
"eval_TIME_f1": 0.5306122448979592,
"eval_TIME_number": 26,
"eval_TIME_precision": 0.5652173913043478,
"eval_TIME_recall": 0.5,
"eval_loss": 0.3515785038471222,
"eval_overall_accuracy": 0.8919189392044033,
"eval_overall_f1": 0.3517915309446254,
"eval_overall_precision": 0.3927272727272727,
"eval_overall_recall": 0.3185840707964602,
"eval_runtime": 0.3751,
"eval_samples_per_second": 498.534,
"eval_steps_per_second": 7.998,
"step": 212
},
{
"epoch": 3.0,
"grad_norm": 1.118065595626831,
"learning_rate": 4.85e-05,
"loss": 0.325,
"step": 318
},
{
"epoch": 3.0,
"eval_LOCATION_f1": 0.5935483870967742,
"eval_LOCATION_number": 72,
"eval_LOCATION_precision": 0.5542168674698795,
"eval_LOCATION_recall": 0.6388888888888888,
"eval_ORGANIZATION_f1": 0.5517241379310344,
"eval_ORGANIZATION_number": 75,
"eval_ORGANIZATION_precision": 0.48484848484848486,
"eval_ORGANIZATION_recall": 0.64,
"eval_PERSON_f1": 0.8269230769230769,
"eval_PERSON_number": 143,
"eval_PERSON_precision": 0.7633136094674556,
"eval_PERSON_recall": 0.9020979020979021,
"eval_QUANTITY_f1": 0.41791044776119407,
"eval_QUANTITY_number": 23,
"eval_QUANTITY_precision": 0.3181818181818182,
"eval_QUANTITY_recall": 0.6086956521739131,
"eval_TIME_f1": 0.7272727272727274,
"eval_TIME_number": 26,
"eval_TIME_precision": 0.6896551724137931,
"eval_TIME_recall": 0.7692307692307693,
"eval_loss": 0.2219165712594986,
"eval_overall_accuracy": 0.9271953965474106,
"eval_overall_f1": 0.673656618610747,
"eval_overall_precision": 0.6061320754716981,
"eval_overall_recall": 0.7581120943952803,
"eval_runtime": 0.3771,
"eval_samples_per_second": 495.952,
"eval_steps_per_second": 7.956,
"step": 318
},
{
"epoch": 4.0,
"grad_norm": 1.4435498714447021,
"learning_rate": 4.8e-05,
"loss": 0.2281,
"step": 424
},
{
"epoch": 4.0,
"eval_LOCATION_f1": 0.7096774193548386,
"eval_LOCATION_number": 72,
"eval_LOCATION_precision": 0.6626506024096386,
"eval_LOCATION_recall": 0.7638888888888888,
"eval_ORGANIZATION_f1": 0.6022727272727274,
"eval_ORGANIZATION_number": 75,
"eval_ORGANIZATION_precision": 0.5247524752475248,
"eval_ORGANIZATION_recall": 0.7066666666666667,
"eval_PERSON_f1": 0.8525641025641025,
"eval_PERSON_number": 143,
"eval_PERSON_precision": 0.7869822485207101,
"eval_PERSON_recall": 0.9300699300699301,
"eval_QUANTITY_f1": 0.3287671232876712,
"eval_QUANTITY_number": 23,
"eval_QUANTITY_precision": 0.24,
"eval_QUANTITY_recall": 0.5217391304347826,
"eval_TIME_f1": 0.6885245901639345,
"eval_TIME_number": 26,
"eval_TIME_precision": 0.6,
"eval_TIME_recall": 0.8076923076923077,
"eval_loss": 0.20335395634174347,
"eval_overall_accuracy": 0.9342006504878659,
"eval_overall_f1": 0.7052767052767053,
"eval_overall_precision": 0.6255707762557078,
"eval_overall_recall": 0.8082595870206489,
"eval_runtime": 0.3755,
"eval_samples_per_second": 497.982,
"eval_steps_per_second": 7.989,
"step": 424
},
{
"epoch": 5.0,
"grad_norm": 0.9061490297317505,
"learning_rate": 4.75e-05,
"loss": 0.1893,
"step": 530
},
{
"epoch": 5.0,
"eval_LOCATION_f1": 0.7662337662337662,
"eval_LOCATION_number": 72,
"eval_LOCATION_precision": 0.7195121951219512,
"eval_LOCATION_recall": 0.8194444444444444,
"eval_ORGANIZATION_f1": 0.625,
"eval_ORGANIZATION_number": 75,
"eval_ORGANIZATION_precision": 0.5445544554455446,
"eval_ORGANIZATION_recall": 0.7333333333333333,
"eval_PERSON_f1": 0.8692810457516339,
"eval_PERSON_number": 143,
"eval_PERSON_precision": 0.8159509202453987,
"eval_PERSON_recall": 0.9300699300699301,
"eval_QUANTITY_f1": 0.4838709677419355,
"eval_QUANTITY_number": 23,
"eval_QUANTITY_precision": 0.38461538461538464,
"eval_QUANTITY_recall": 0.6521739130434783,
"eval_TIME_f1": 0.7777777777777779,
"eval_TIME_number": 26,
"eval_TIME_precision": 0.75,
"eval_TIME_recall": 0.8076923076923077,
"eval_loss": 0.16108748316764832,
"eval_overall_accuracy": 0.9442081561170879,
"eval_overall_f1": 0.7526595744680852,
"eval_overall_precision": 0.6852300242130751,
"eval_overall_recall": 0.8348082595870207,
"eval_runtime": 0.3765,
"eval_samples_per_second": 496.646,
"eval_steps_per_second": 7.968,
"step": 530
},
{
"epoch": 6.0,
"grad_norm": 1.0410338640213013,
"learning_rate": 4.7e-05,
"loss": 0.1709,
"step": 636
},
{
"epoch": 6.0,
"eval_LOCATION_f1": 0.7228915662650603,
"eval_LOCATION_number": 72,
"eval_LOCATION_precision": 0.6382978723404256,
"eval_LOCATION_recall": 0.8333333333333334,
"eval_ORGANIZATION_f1": 0.6739130434782608,
"eval_ORGANIZATION_number": 75,
"eval_ORGANIZATION_precision": 0.5688073394495413,
"eval_ORGANIZATION_recall": 0.8266666666666667,
"eval_PERSON_f1": 0.8910891089108911,
"eval_PERSON_number": 143,
"eval_PERSON_precision": 0.84375,
"eval_PERSON_recall": 0.9440559440559441,
"eval_QUANTITY_f1": 0.5517241379310345,
"eval_QUANTITY_number": 23,
"eval_QUANTITY_precision": 0.45714285714285713,
"eval_QUANTITY_recall": 0.6956521739130435,
"eval_TIME_f1": 0.7857142857142856,
"eval_TIME_number": 26,
"eval_TIME_precision": 0.7333333333333333,
"eval_TIME_recall": 0.8461538461538461,
"eval_loss": 0.15253682434558868,
"eval_overall_accuracy": 0.9482111583687766,
"eval_overall_f1": 0.7692307692307694,
"eval_overall_precision": 0.6892523364485982,
"eval_overall_recall": 0.8702064896755162,
"eval_runtime": 0.3747,
"eval_samples_per_second": 499.072,
"eval_steps_per_second": 8.007,
"step": 636
},
{
"epoch": 7.0,
"grad_norm": 0.6735289692878723,
"learning_rate": 4.6500000000000005e-05,
"loss": 0.1574,
"step": 742
},
{
"epoch": 7.0,
"eval_LOCATION_f1": 0.7564102564102564,
"eval_LOCATION_number": 72,
"eval_LOCATION_precision": 0.7023809523809523,
"eval_LOCATION_recall": 0.8194444444444444,
"eval_ORGANIZATION_f1": 0.7052023121387283,
"eval_ORGANIZATION_number": 75,
"eval_ORGANIZATION_precision": 0.6224489795918368,
"eval_ORGANIZATION_recall": 0.8133333333333334,
"eval_PERSON_f1": 0.8852459016393444,
"eval_PERSON_number": 143,
"eval_PERSON_precision": 0.8333333333333334,
"eval_PERSON_recall": 0.9440559440559441,
"eval_QUANTITY_f1": 0.59375,
"eval_QUANTITY_number": 23,
"eval_QUANTITY_precision": 0.4634146341463415,
"eval_QUANTITY_recall": 0.8260869565217391,
"eval_TIME_f1": 0.7777777777777779,
"eval_TIME_number": 26,
"eval_TIME_precision": 0.75,
"eval_TIME_recall": 0.8076923076923077,
"eval_loss": 0.15402045845985413,
"eval_overall_accuracy": 0.9489617212909682,
"eval_overall_f1": 0.7845744680851063,
"eval_overall_precision": 0.7142857142857143,
"eval_overall_recall": 0.8702064896755162,
"eval_runtime": 0.3759,
"eval_samples_per_second": 497.519,
"eval_steps_per_second": 7.982,
"step": 742
},
{
"epoch": 8.0,
"grad_norm": 0.6694019436836243,
"learning_rate": 4.600000000000001e-05,
"loss": 0.1455,
"step": 848
},
{
"epoch": 8.0,
"eval_LOCATION_f1": 0.7272727272727273,
"eval_LOCATION_number": 72,
"eval_LOCATION_precision": 0.6829268292682927,
"eval_LOCATION_recall": 0.7777777777777778,
"eval_ORGANIZATION_f1": 0.7078651685393258,
"eval_ORGANIZATION_number": 75,
"eval_ORGANIZATION_precision": 0.6116504854368932,
"eval_ORGANIZATION_recall": 0.84,
"eval_PERSON_f1": 0.8881578947368421,
"eval_PERSON_number": 143,
"eval_PERSON_precision": 0.8385093167701864,
"eval_PERSON_recall": 0.9440559440559441,
"eval_QUANTITY_f1": 0.6785714285714286,
"eval_QUANTITY_number": 23,
"eval_QUANTITY_precision": 0.5757575757575758,
"eval_QUANTITY_recall": 0.8260869565217391,
"eval_TIME_f1": 0.6666666666666667,
"eval_TIME_number": 26,
"eval_TIME_precision": 0.5882352941176471,
"eval_TIME_recall": 0.7692307692307693,
"eval_loss": 0.14883330464363098,
"eval_overall_accuracy": 0.9479609707280461,
"eval_overall_f1": 0.7792553191489361,
"eval_overall_precision": 0.7094430992736077,
"eval_overall_recall": 0.8643067846607669,
"eval_runtime": 0.3757,
"eval_samples_per_second": 497.723,
"eval_steps_per_second": 7.985,
"step": 848
},
{
"epoch": 9.0,
"grad_norm": 1.2299126386642456,
"learning_rate": 4.55e-05,
"loss": 0.1415,
"step": 954
},
{
"epoch": 9.0,
"eval_LOCATION_f1": 0.7843137254901961,
"eval_LOCATION_number": 72,
"eval_LOCATION_precision": 0.7407407407407407,
"eval_LOCATION_recall": 0.8333333333333334,
"eval_ORGANIZATION_f1": 0.7071823204419889,
"eval_ORGANIZATION_number": 75,
"eval_ORGANIZATION_precision": 0.6037735849056604,
"eval_ORGANIZATION_recall": 0.8533333333333334,
"eval_PERSON_f1": 0.8874172185430464,
"eval_PERSON_number": 143,
"eval_PERSON_precision": 0.8427672955974843,
"eval_PERSON_recall": 0.9370629370629371,
"eval_QUANTITY_f1": 0.7037037037037037,
"eval_QUANTITY_number": 23,
"eval_QUANTITY_precision": 0.6129032258064516,
"eval_QUANTITY_recall": 0.8260869565217391,
"eval_TIME_f1": 0.7017543859649122,
"eval_TIME_number": 26,
"eval_TIME_precision": 0.6451612903225806,
"eval_TIME_recall": 0.7692307692307693,
"eval_loss": 0.15283024311065674,
"eval_overall_accuracy": 0.9472104078058544,
"eval_overall_f1": 0.7951807228915664,
"eval_overall_precision": 0.7279411764705882,
"eval_overall_recall": 0.8761061946902655,
"eval_runtime": 0.3787,
"eval_samples_per_second": 493.807,
"eval_steps_per_second": 7.922,
"step": 954
},
{
"epoch": 10.0,
"grad_norm": 2.041289806365967,
"learning_rate": 4.5e-05,
"loss": 0.1317,
"step": 1060
},
{
"epoch": 10.0,
"eval_LOCATION_f1": 0.7702702702702704,
"eval_LOCATION_number": 72,
"eval_LOCATION_precision": 0.75,
"eval_LOCATION_recall": 0.7916666666666666,
"eval_ORGANIZATION_f1": 0.6779661016949153,
"eval_ORGANIZATION_number": 75,
"eval_ORGANIZATION_precision": 0.5882352941176471,
"eval_ORGANIZATION_recall": 0.8,
"eval_PERSON_f1": 0.9006622516556291,
"eval_PERSON_number": 143,
"eval_PERSON_precision": 0.8553459119496856,
"eval_PERSON_recall": 0.951048951048951,
"eval_QUANTITY_f1": 0.631578947368421,
"eval_QUANTITY_number": 23,
"eval_QUANTITY_precision": 0.5294117647058824,
"eval_QUANTITY_recall": 0.782608695652174,
"eval_TIME_f1": 0.75,
"eval_TIME_number": 26,
"eval_TIME_precision": 0.7,
"eval_TIME_recall": 0.8076923076923077,
"eval_loss": 0.13493530452251434,
"eval_overall_accuracy": 0.9527145359019265,
"eval_overall_f1": 0.7891891891891892,
"eval_overall_precision": 0.7281795511221946,
"eval_overall_recall": 0.8613569321533924,
"eval_runtime": 0.3818,
"eval_samples_per_second": 489.779,
"eval_steps_per_second": 7.857,
"step": 1060
},
{
"epoch": 11.0,
"grad_norm": 0.6205049753189087,
"learning_rate": 4.4500000000000004e-05,
"loss": 0.1258,
"step": 1166
},
{
"epoch": 11.0,
"eval_LOCATION_f1": 0.7843137254901961,
"eval_LOCATION_number": 72,
"eval_LOCATION_precision": 0.7407407407407407,
"eval_LOCATION_recall": 0.8333333333333334,
"eval_ORGANIZATION_f1": 0.7484662576687117,
"eval_ORGANIZATION_number": 75,
"eval_ORGANIZATION_precision": 0.6931818181818182,
"eval_ORGANIZATION_recall": 0.8133333333333334,
"eval_PERSON_f1": 0.8866666666666668,
"eval_PERSON_number": 143,
"eval_PERSON_precision": 0.8471337579617835,
"eval_PERSON_recall": 0.9300699300699301,
"eval_QUANTITY_f1": 0.6785714285714286,
"eval_QUANTITY_number": 23,
"eval_QUANTITY_precision": 0.5757575757575758,
"eval_QUANTITY_recall": 0.8260869565217391,
"eval_TIME_f1": 0.7857142857142856,
"eval_TIME_number": 26,
"eval_TIME_precision": 0.7333333333333333,
"eval_TIME_recall": 0.8461538461538461,
"eval_loss": 0.13175755739212036,
"eval_overall_accuracy": 0.9572179134350763,
"eval_overall_f1": 0.8104395604395604,
"eval_overall_precision": 0.7583547557840618,
"eval_overall_recall": 0.8702064896755162,
"eval_runtime": 0.3776,
"eval_samples_per_second": 495.218,
"eval_steps_per_second": 7.945,
"step": 1166
},
{
"epoch": 12.0,
"grad_norm": 1.5989289283752441,
"learning_rate": 4.4000000000000006e-05,
"loss": 0.1198,
"step": 1272
},
{
"epoch": 12.0,
"eval_LOCATION_f1": 0.7651006711409396,
"eval_LOCATION_number": 72,
"eval_LOCATION_precision": 0.7402597402597403,
"eval_LOCATION_recall": 0.7916666666666666,
"eval_ORGANIZATION_f1": 0.7500000000000001,
"eval_ORGANIZATION_number": 75,
"eval_ORGANIZATION_precision": 0.7058823529411765,
"eval_ORGANIZATION_recall": 0.8,
"eval_PERSON_f1": 0.8933333333333333,
"eval_PERSON_number": 143,
"eval_PERSON_precision": 0.8535031847133758,
"eval_PERSON_recall": 0.9370629370629371,
"eval_QUANTITY_f1": 0.7547169811320754,
"eval_QUANTITY_number": 23,
"eval_QUANTITY_precision": 0.6666666666666666,
"eval_QUANTITY_recall": 0.8695652173913043,
"eval_TIME_f1": 0.830188679245283,
"eval_TIME_number": 26,
"eval_TIME_precision": 0.8148148148148148,
"eval_TIME_recall": 0.8461538461538461,
"eval_loss": 0.136313334107399,
"eval_overall_accuracy": 0.957968476357268,
"eval_overall_f1": 0.8195804195804196,
"eval_overall_precision": 0.7792553191489362,
"eval_overall_recall": 0.8643067846607669,
"eval_runtime": 0.3791,
"eval_samples_per_second": 493.255,
"eval_steps_per_second": 7.913,
"step": 1272
},
{
"epoch": 13.0,
"grad_norm": 0.6925050020217896,
"learning_rate": 4.35e-05,
"loss": 0.1144,
"step": 1378
},
{
"epoch": 13.0,
"eval_LOCATION_f1": 0.75,
"eval_LOCATION_number": 72,
"eval_LOCATION_precision": 0.7125,
"eval_LOCATION_recall": 0.7916666666666666,
"eval_ORGANIZATION_f1": 0.7403314917127072,
"eval_ORGANIZATION_number": 75,
"eval_ORGANIZATION_precision": 0.6320754716981132,
"eval_ORGANIZATION_recall": 0.8933333333333333,
"eval_PERSON_f1": 0.903654485049834,
"eval_PERSON_number": 143,
"eval_PERSON_precision": 0.8607594936708861,
"eval_PERSON_recall": 0.951048951048951,
"eval_QUANTITY_f1": 0.76,
"eval_QUANTITY_number": 23,
"eval_QUANTITY_precision": 0.7037037037037037,
"eval_QUANTITY_recall": 0.8260869565217391,
"eval_TIME_f1": 0.8148148148148148,
"eval_TIME_number": 26,
"eval_TIME_precision": 0.7857142857142857,
"eval_TIME_recall": 0.8461538461538461,
"eval_loss": 0.1362464725971222,
"eval_overall_accuracy": 0.9569677257943457,
"eval_overall_f1": 0.8157181571815718,
"eval_overall_precision": 0.7543859649122807,
"eval_overall_recall": 0.887905604719764,
"eval_runtime": 0.3733,
"eval_samples_per_second": 500.964,
"eval_steps_per_second": 8.037,
"step": 1378
},
{
"epoch": 14.0,
"grad_norm": 1.0199106931686401,
"learning_rate": 4.3e-05,
"loss": 0.1142,
"step": 1484
},
{
"epoch": 14.0,
"eval_LOCATION_f1": 0.7837837837837838,
"eval_LOCATION_number": 72,
"eval_LOCATION_precision": 0.7631578947368421,
"eval_LOCATION_recall": 0.8055555555555556,
"eval_ORGANIZATION_f1": 0.7831325301204819,
"eval_ORGANIZATION_number": 75,
"eval_ORGANIZATION_precision": 0.7142857142857143,
"eval_ORGANIZATION_recall": 0.8666666666666667,
"eval_PERSON_f1": 0.9066666666666667,
"eval_PERSON_number": 143,
"eval_PERSON_precision": 0.8662420382165605,
"eval_PERSON_recall": 0.951048951048951,
"eval_QUANTITY_f1": 0.6440677966101694,
"eval_QUANTITY_number": 23,
"eval_QUANTITY_precision": 0.5277777777777778,
"eval_QUANTITY_recall": 0.8260869565217391,
"eval_TIME_f1": 0.8214285714285715,
"eval_TIME_number": 26,
"eval_TIME_precision": 0.7666666666666667,
"eval_TIME_recall": 0.8846153846153846,
"eval_loss": 0.13535019755363464,
"eval_overall_accuracy": 0.9587190392794596,
"eval_overall_f1": 0.8257887517146778,
"eval_overall_precision": 0.7717948717948718,
"eval_overall_recall": 0.887905604719764,
"eval_runtime": 0.3744,
"eval_samples_per_second": 499.47,
"eval_steps_per_second": 8.013,
"step": 1484
},
{
"epoch": 15.0,
"grad_norm": 0.6930171847343445,
"learning_rate": 4.25e-05,
"loss": 0.1079,
"step": 1590
},
{
"epoch": 15.0,
"eval_LOCATION_f1": 0.7671232876712328,
"eval_LOCATION_number": 72,
"eval_LOCATION_precision": 0.7567567567567568,
"eval_LOCATION_recall": 0.7777777777777778,
"eval_ORGANIZATION_f1": 0.785276073619632,
"eval_ORGANIZATION_number": 75,
"eval_ORGANIZATION_precision": 0.7272727272727273,
"eval_ORGANIZATION_recall": 0.8533333333333334,
"eval_PERSON_f1": 0.9066666666666667,
"eval_PERSON_number": 143,
"eval_PERSON_precision": 0.8662420382165605,
"eval_PERSON_recall": 0.951048951048951,
"eval_QUANTITY_f1": 0.7169811320754716,
"eval_QUANTITY_number": 23,
"eval_QUANTITY_precision": 0.6333333333333333,
"eval_QUANTITY_recall": 0.8260869565217391,
"eval_TIME_f1": 0.8148148148148148,
"eval_TIME_number": 26,
"eval_TIME_precision": 0.7857142857142857,
"eval_TIME_recall": 0.8461538461538461,
"eval_loss": 0.12985557317733765,
"eval_overall_accuracy": 0.9594696022016512,
"eval_overall_f1": 0.8296089385474861,
"eval_overall_precision": 0.7877984084880637,
"eval_overall_recall": 0.8761061946902655,
"eval_runtime": 0.3768,
"eval_samples_per_second": 496.275,
"eval_steps_per_second": 7.962,
"step": 1590
},
{
"epoch": 16.0,
"grad_norm": 0.7586736679077148,
"learning_rate": 4.2e-05,
"loss": 0.1044,
"step": 1696
},
{
"epoch": 16.0,
"eval_LOCATION_f1": 0.7947019867549668,
"eval_LOCATION_number": 72,
"eval_LOCATION_precision": 0.759493670886076,
"eval_LOCATION_recall": 0.8333333333333334,
"eval_ORGANIZATION_f1": 0.7683615819209039,
"eval_ORGANIZATION_number": 75,
"eval_ORGANIZATION_precision": 0.6666666666666666,
"eval_ORGANIZATION_recall": 0.9066666666666666,
"eval_PERSON_f1": 0.8970099667774087,
"eval_PERSON_number": 143,
"eval_PERSON_precision": 0.8544303797468354,
"eval_PERSON_recall": 0.9440559440559441,
"eval_QUANTITY_f1": 0.6923076923076923,
"eval_QUANTITY_number": 23,
"eval_QUANTITY_precision": 0.6206896551724138,
"eval_QUANTITY_recall": 0.782608695652174,
"eval_TIME_f1": 0.8461538461538461,
"eval_TIME_number": 26,
"eval_TIME_precision": 0.8461538461538461,
"eval_TIME_recall": 0.8461538461538461,
"eval_loss": 0.14694638550281525,
"eval_overall_accuracy": 0.9547160370277709,
"eval_overall_f1": 0.8267394270122784,
"eval_overall_precision": 0.7690355329949239,
"eval_overall_recall": 0.8938053097345132,
"eval_runtime": 0.3758,
"eval_samples_per_second": 497.662,
"eval_steps_per_second": 7.984,
"step": 1696
},
{
"epoch": 17.0,
"grad_norm": 0.3470544219017029,
"learning_rate": 4.15e-05,
"loss": 0.099,
"step": 1802
},
{
"epoch": 17.0,
"eval_LOCATION_f1": 0.7837837837837838,
"eval_LOCATION_number": 72,
"eval_LOCATION_precision": 0.7631578947368421,
"eval_LOCATION_recall": 0.8055555555555556,
"eval_ORGANIZATION_f1": 0.7730061349693251,
"eval_ORGANIZATION_number": 75,
"eval_ORGANIZATION_precision": 0.7159090909090909,
"eval_ORGANIZATION_recall": 0.84,
"eval_PERSON_f1": 0.8896321070234114,
"eval_PERSON_number": 143,
"eval_PERSON_precision": 0.8525641025641025,
"eval_PERSON_recall": 0.9300699300699301,
"eval_QUANTITY_f1": 0.6545454545454547,
"eval_QUANTITY_number": 23,
"eval_QUANTITY_precision": 0.5625,
"eval_QUANTITY_recall": 0.782608695652174,
"eval_TIME_f1": 0.8461538461538461,
"eval_TIME_number": 26,
"eval_TIME_precision": 0.8461538461538461,
"eval_TIME_recall": 0.8461538461538461,
"eval_loss": 0.1366996318101883,
"eval_overall_accuracy": 0.9569677257943457,
"eval_overall_f1": 0.8200836820083682,
"eval_overall_precision": 0.7777777777777778,
"eval_overall_recall": 0.8672566371681416,
"eval_runtime": 0.373,
"eval_samples_per_second": 501.281,
"eval_steps_per_second": 8.042,
"step": 1802
},
{
"epoch": 18.0,
"grad_norm": 1.08118736743927,
"learning_rate": 4.1e-05,
"loss": 0.095,
"step": 1908
},
{
"epoch": 18.0,
"eval_LOCATION_f1": 0.802721088435374,
"eval_LOCATION_number": 72,
"eval_LOCATION_precision": 0.7866666666666666,
"eval_LOCATION_recall": 0.8194444444444444,
"eval_ORGANIZATION_f1": 0.7904191616766466,
"eval_ORGANIZATION_number": 75,
"eval_ORGANIZATION_precision": 0.717391304347826,
"eval_ORGANIZATION_recall": 0.88,
"eval_PERSON_f1": 0.8859060402684563,
"eval_PERSON_number": 143,
"eval_PERSON_precision": 0.8516129032258064,
"eval_PERSON_recall": 0.9230769230769231,
"eval_QUANTITY_f1": 0.6666666666666667,
"eval_QUANTITY_number": 23,
"eval_QUANTITY_precision": 0.5806451612903226,
"eval_QUANTITY_recall": 0.782608695652174,
"eval_TIME_f1": 0.8148148148148148,
"eval_TIME_number": 26,
"eval_TIME_precision": 0.7857142857142857,
"eval_TIME_recall": 0.8461538461538461,
"eval_loss": 0.1454007923603058,
"eval_overall_accuracy": 0.9574681010758068,
"eval_overall_f1": 0.825,
"eval_overall_precision": 0.7795275590551181,
"eval_overall_recall": 0.8761061946902655,
"eval_runtime": 0.375,
"eval_samples_per_second": 498.648,
"eval_steps_per_second": 8.0,
"step": 1908
},
{
"epoch": 19.0,
"grad_norm": 0.5193635821342468,
"learning_rate": 4.05e-05,
"loss": 0.0926,
"step": 2014
},
{
"epoch": 19.0,
"eval_LOCATION_f1": 0.8108108108108109,
"eval_LOCATION_number": 72,
"eval_LOCATION_precision": 0.7894736842105263,
"eval_LOCATION_recall": 0.8333333333333334,
"eval_ORGANIZATION_f1": 0.7738095238095238,
"eval_ORGANIZATION_number": 75,
"eval_ORGANIZATION_precision": 0.6989247311827957,
"eval_ORGANIZATION_recall": 0.8666666666666667,
"eval_PERSON_f1": 0.8956228956228957,
"eval_PERSON_number": 143,
"eval_PERSON_precision": 0.8636363636363636,
"eval_PERSON_recall": 0.9300699300699301,
"eval_QUANTITY_f1": 0.6545454545454547,
"eval_QUANTITY_number": 23,
"eval_QUANTITY_precision": 0.5625,
"eval_QUANTITY_recall": 0.782608695652174,
"eval_TIME_f1": 0.8461538461538461,
"eval_TIME_number": 26,
"eval_TIME_precision": 0.8461538461538461,
"eval_TIME_recall": 0.8461538461538461,
"eval_loss": 0.13837505877017975,
"eval_overall_accuracy": 0.9582186639979985,
"eval_overall_f1": 0.8277777777777778,
"eval_overall_precision": 0.7821522309711286,
"eval_overall_recall": 0.8790560471976401,
"eval_runtime": 0.3771,
"eval_samples_per_second": 495.921,
"eval_steps_per_second": 7.956,
"step": 2014
},
{
"epoch": 20.0,
"grad_norm": 0.9454425573348999,
"learning_rate": 4e-05,
"loss": 0.088,
"step": 2120
},
{
"epoch": 20.0,
"eval_LOCATION_f1": 0.8133333333333332,
"eval_LOCATION_number": 72,
"eval_LOCATION_precision": 0.782051282051282,
"eval_LOCATION_recall": 0.8472222222222222,
"eval_ORGANIZATION_f1": 0.7674418604651163,
"eval_ORGANIZATION_number": 75,
"eval_ORGANIZATION_precision": 0.6804123711340206,
"eval_ORGANIZATION_recall": 0.88,
"eval_PERSON_f1": 0.9060402684563759,
"eval_PERSON_number": 143,
"eval_PERSON_precision": 0.8709677419354839,
"eval_PERSON_recall": 0.9440559440559441,
"eval_QUANTITY_f1": 0.6666666666666667,
"eval_QUANTITY_number": 23,
"eval_QUANTITY_precision": 0.5588235294117647,
"eval_QUANTITY_recall": 0.8260869565217391,
"eval_TIME_f1": 0.8076923076923077,
"eval_TIME_number": 26,
"eval_TIME_precision": 0.8076923076923077,
"eval_TIME_recall": 0.8076923076923077,
"eval_loss": 0.16045436263084412,
"eval_overall_accuracy": 0.9542156617463098,
"eval_overall_f1": 0.8285322359396433,
"eval_overall_precision": 0.7743589743589744,
"eval_overall_recall": 0.8908554572271387,
"eval_runtime": 0.378,
"eval_samples_per_second": 494.772,
"eval_steps_per_second": 7.938,
"step": 2120
},
{
"epoch": 21.0,
"grad_norm": 0.5755162239074707,
"learning_rate": 3.9500000000000005e-05,
"loss": 0.0878,
"step": 2226
},
{
"epoch": 21.0,
"eval_LOCATION_f1": 0.7972972972972973,
"eval_LOCATION_number": 72,
"eval_LOCATION_precision": 0.7763157894736842,
"eval_LOCATION_recall": 0.8194444444444444,
"eval_ORGANIZATION_f1": 0.7555555555555555,
"eval_ORGANIZATION_number": 75,
"eval_ORGANIZATION_precision": 0.6476190476190476,
"eval_ORGANIZATION_recall": 0.9066666666666666,
"eval_PERSON_f1": 0.9060402684563759,
"eval_PERSON_number": 143,
"eval_PERSON_precision": 0.8709677419354839,
"eval_PERSON_recall": 0.9440559440559441,
"eval_QUANTITY_f1": 0.7037037037037037,
"eval_QUANTITY_number": 23,
"eval_QUANTITY_precision": 0.6129032258064516,
"eval_QUANTITY_recall": 0.8260869565217391,
"eval_TIME_f1": 0.8627450980392156,
"eval_TIME_number": 26,
"eval_TIME_precision": 0.88,
"eval_TIME_recall": 0.8461538461538461,
"eval_loss": 0.14829762279987335,
"eval_overall_accuracy": 0.9562171628721541,
"eval_overall_f1": 0.8290013679890561,
"eval_overall_precision": 0.7729591836734694,
"eval_overall_recall": 0.8938053097345132,
"eval_runtime": 0.375,
"eval_samples_per_second": 498.697,
"eval_steps_per_second": 8.0,
"step": 2226
},
{
"epoch": 22.0,
"grad_norm": 0.5230295658111572,
"learning_rate": 3.9000000000000006e-05,
"loss": 0.089,
"step": 2332
},
{
"epoch": 22.0,
"eval_LOCATION_f1": 0.802721088435374,
"eval_LOCATION_number": 72,
"eval_LOCATION_precision": 0.7866666666666666,
"eval_LOCATION_recall": 0.8194444444444444,
"eval_ORGANIZATION_f1": 0.7608695652173914,
"eval_ORGANIZATION_number": 75,
"eval_ORGANIZATION_precision": 0.6422018348623854,
"eval_ORGANIZATION_recall": 0.9333333333333333,
"eval_PERSON_f1": 0.9072847682119206,
"eval_PERSON_number": 143,
"eval_PERSON_precision": 0.8616352201257862,
"eval_PERSON_recall": 0.958041958041958,
"eval_QUANTITY_f1": 0.6440677966101694,
"eval_QUANTITY_number": 23,
"eval_QUANTITY_precision": 0.5277777777777778,
"eval_QUANTITY_recall": 0.8260869565217391,
"eval_TIME_f1": 0.7924528301886792,
"eval_TIME_number": 26,
"eval_TIME_precision": 0.7777777777777778,
"eval_TIME_recall": 0.8076923076923077,
"eval_loss": 0.15434490144252777,
"eval_overall_accuracy": 0.9534650988241181,
"eval_overall_f1": 0.8214765100671141,
"eval_overall_precision": 0.7536945812807881,
"eval_overall_recall": 0.9026548672566371,
"eval_runtime": 0.3743,
"eval_samples_per_second": 499.582,
"eval_steps_per_second": 8.015,
"step": 2332
},
{
"epoch": 23.0,
"grad_norm": 0.4608692526817322,
"learning_rate": 3.85e-05,
"loss": 0.0835,
"step": 2438
},
{
"epoch": 23.0,
"eval_LOCATION_f1": 0.816326530612245,
"eval_LOCATION_number": 72,
"eval_LOCATION_precision": 0.8,
"eval_LOCATION_recall": 0.8333333333333334,
"eval_ORGANIZATION_f1": 0.7529411764705883,
"eval_ORGANIZATION_number": 75,
"eval_ORGANIZATION_precision": 0.6736842105263158,
"eval_ORGANIZATION_recall": 0.8533333333333334,
"eval_PERSON_f1": 0.9054054054054055,
"eval_PERSON_number": 143,
"eval_PERSON_precision": 0.8758169934640523,
"eval_PERSON_recall": 0.9370629370629371,
"eval_QUANTITY_f1": 0.6428571428571429,
"eval_QUANTITY_number": 23,
"eval_QUANTITY_precision": 0.5454545454545454,
"eval_QUANTITY_recall": 0.782608695652174,
"eval_TIME_f1": 0.8076923076923077,
"eval_TIME_number": 26,
"eval_TIME_precision": 0.8076923076923077,
"eval_TIME_recall": 0.8076923076923077,
"eval_loss": 0.14608316123485565,
"eval_overall_accuracy": 0.955716787590693,
"eval_overall_f1": 0.8238557558945908,
"eval_overall_precision": 0.7774869109947644,
"eval_overall_recall": 0.8761061946902655,
"eval_runtime": 0.3748,
"eval_samples_per_second": 498.876,
"eval_steps_per_second": 8.003,
"step": 2438
},
{
"epoch": 24.0,
"grad_norm": 0.6337035298347473,
"learning_rate": 3.8e-05,
"loss": 0.0789,
"step": 2544
},
{
"epoch": 24.0,
"eval_LOCATION_f1": 0.8513513513513513,
"eval_LOCATION_number": 72,
"eval_LOCATION_precision": 0.8289473684210527,
"eval_LOCATION_recall": 0.875,
"eval_ORGANIZATION_f1": 0.7607361963190183,
"eval_ORGANIZATION_number": 75,
"eval_ORGANIZATION_precision": 0.7045454545454546,
"eval_ORGANIZATION_recall": 0.8266666666666667,
"eval_PERSON_f1": 0.912751677852349,
"eval_PERSON_number": 143,
"eval_PERSON_precision": 0.8774193548387097,
"eval_PERSON_recall": 0.951048951048951,
"eval_QUANTITY_f1": 0.6428571428571429,
"eval_QUANTITY_number": 23,
"eval_QUANTITY_precision": 0.5454545454545454,
"eval_QUANTITY_recall": 0.782608695652174,
"eval_TIME_f1": 0.8235294117647058,
"eval_TIME_number": 26,
"eval_TIME_precision": 0.84,
"eval_TIME_recall": 0.8076923076923077,
"eval_loss": 0.1453711837530136,
"eval_overall_accuracy": 0.9567175381536153,
"eval_overall_f1": 0.8379888268156425,
"eval_overall_precision": 0.7957559681697612,
"eval_overall_recall": 0.8849557522123894,
"eval_runtime": 0.3753,
"eval_samples_per_second": 498.308,
"eval_steps_per_second": 7.994,
"step": 2544
},
{
"epoch": 25.0,
"grad_norm": 0.5838052034378052,
"learning_rate": 3.7500000000000003e-05,
"loss": 0.0773,
"step": 2650
},
{
"epoch": 25.0,
"eval_LOCATION_f1": 0.8571428571428572,
"eval_LOCATION_number": 72,
"eval_LOCATION_precision": 0.84,
"eval_LOCATION_recall": 0.875,
"eval_ORGANIZATION_f1": 0.7757575757575759,
"eval_ORGANIZATION_number": 75,
"eval_ORGANIZATION_precision": 0.7111111111111111,
"eval_ORGANIZATION_recall": 0.8533333333333334,
"eval_PERSON_f1": 0.9023569023569024,
"eval_PERSON_number": 143,
"eval_PERSON_precision": 0.8701298701298701,
"eval_PERSON_recall": 0.9370629370629371,
"eval_QUANTITY_f1": 0.6666666666666667,
"eval_QUANTITY_number": 23,
"eval_QUANTITY_precision": 0.5806451612903226,
"eval_QUANTITY_recall": 0.782608695652174,
"eval_TIME_f1": 0.7857142857142856,
"eval_TIME_number": 26,
"eval_TIME_precision": 0.7333333333333333,
"eval_TIME_recall": 0.8461538461538461,
"eval_loss": 0.13762633502483368,
"eval_overall_accuracy": 0.9589692269201902,
"eval_overall_f1": 0.8372739916550764,
"eval_overall_precision": 0.7921052631578948,
"eval_overall_recall": 0.887905604719764,
"eval_runtime": 0.3758,
"eval_samples_per_second": 497.612,
"eval_steps_per_second": 7.983,
"step": 2650
},
{
"epoch": 26.0,
"grad_norm": 0.6994030475616455,
"learning_rate": 3.7e-05,
"loss": 0.0779,
"step": 2756
},
{
"epoch": 26.0,
"eval_LOCATION_f1": 0.8356164383561645,
"eval_LOCATION_number": 72,
"eval_LOCATION_precision": 0.8243243243243243,
"eval_LOCATION_recall": 0.8472222222222222,
"eval_ORGANIZATION_f1": 0.7455621301775148,
"eval_ORGANIZATION_number": 75,
"eval_ORGANIZATION_precision": 0.6702127659574468,
"eval_ORGANIZATION_recall": 0.84,
"eval_PERSON_f1": 0.9066666666666667,
"eval_PERSON_number": 143,
"eval_PERSON_precision": 0.8662420382165605,
"eval_PERSON_recall": 0.951048951048951,
"eval_QUANTITY_f1": 0.6923076923076923,
"eval_QUANTITY_number": 23,
"eval_QUANTITY_precision": 0.6206896551724138,
"eval_QUANTITY_recall": 0.782608695652174,
"eval_TIME_f1": 0.7777777777777779,
"eval_TIME_number": 26,
"eval_TIME_precision": 0.75,
"eval_TIME_recall": 0.8076923076923077,
"eval_loss": 0.1366981565952301,
"eval_overall_accuracy": 0.9599699774831123,
"eval_overall_f1": 0.8294036061026352,
"eval_overall_precision": 0.7827225130890052,
"eval_overall_recall": 0.8820058997050148,
"eval_runtime": 0.3759,
"eval_samples_per_second": 497.412,
"eval_steps_per_second": 7.98,
"step": 2756
},
{
"epoch": 27.0,
"grad_norm": 0.5041149258613586,
"learning_rate": 3.65e-05,
"loss": 0.0735,
"step": 2862
},
{
"epoch": 27.0,
"eval_LOCATION_f1": 0.8493150684931507,
"eval_LOCATION_number": 72,
"eval_LOCATION_precision": 0.8378378378378378,
"eval_LOCATION_recall": 0.8611111111111112,
"eval_ORGANIZATION_f1": 0.759493670886076,
"eval_ORGANIZATION_number": 75,
"eval_ORGANIZATION_precision": 0.7228915662650602,
"eval_ORGANIZATION_recall": 0.8,
"eval_PERSON_f1": 0.9158249158249158,
"eval_PERSON_number": 143,
"eval_PERSON_precision": 0.8831168831168831,
"eval_PERSON_recall": 0.951048951048951,
"eval_QUANTITY_f1": 0.6923076923076923,
"eval_QUANTITY_number": 23,
"eval_QUANTITY_precision": 0.6206896551724138,
"eval_QUANTITY_recall": 0.782608695652174,
"eval_TIME_f1": 0.8679245283018868,
"eval_TIME_number": 26,
"eval_TIME_precision": 0.8518518518518519,
"eval_TIME_recall": 0.8846153846153846,
"eval_loss": 0.1394449919462204,
"eval_overall_accuracy": 0.9629722291718789,
"eval_overall_f1": 0.8470254957507082,
"eval_overall_precision": 0.8147138964577657,
"eval_overall_recall": 0.8820058997050148,
"eval_runtime": 0.3746,
"eval_samples_per_second": 499.149,
"eval_steps_per_second": 8.008,
"step": 2862
},
{
"epoch": 28.0,
"grad_norm": 1.0946162939071655,
"learning_rate": 3.6e-05,
"loss": 0.0718,
"step": 2968
},
{
"epoch": 28.0,
"eval_LOCATION_f1": 0.8219178082191781,
"eval_LOCATION_number": 72,
"eval_LOCATION_precision": 0.8108108108108109,
"eval_LOCATION_recall": 0.8333333333333334,
"eval_ORGANIZATION_f1": 0.7682926829268292,
"eval_ORGANIZATION_number": 75,
"eval_ORGANIZATION_precision": 0.7078651685393258,
"eval_ORGANIZATION_recall": 0.84,
"eval_PERSON_f1": 0.91156462585034,
"eval_PERSON_number": 143,
"eval_PERSON_precision": 0.8874172185430463,
"eval_PERSON_recall": 0.9370629370629371,
"eval_QUANTITY_f1": 0.6792452830188679,
"eval_QUANTITY_number": 23,
"eval_QUANTITY_precision": 0.6,
"eval_QUANTITY_recall": 0.782608695652174,
"eval_TIME_f1": 0.7857142857142856,
"eval_TIME_number": 26,
"eval_TIME_precision": 0.7333333333333333,
"eval_TIME_recall": 0.8461538461538461,
"eval_loss": 0.13758285343647003,
"eval_overall_accuracy": 0.9604703527645734,
"eval_overall_f1": 0.8330995792426367,
"eval_overall_precision": 0.7941176470588235,
"eval_overall_recall": 0.8761061946902655,
"eval_runtime": 0.3762,
"eval_samples_per_second": 497.123,
"eval_steps_per_second": 7.975,
"step": 2968
},
{
"epoch": 29.0,
"grad_norm": 0.6572793126106262,
"learning_rate": 3.55e-05,
"loss": 0.071,
"step": 3074
},
{
"epoch": 29.0,
"eval_LOCATION_f1": 0.8108108108108109,
"eval_LOCATION_number": 72,
"eval_LOCATION_precision": 0.7894736842105263,
"eval_LOCATION_recall": 0.8333333333333334,
"eval_ORGANIZATION_f1": 0.7558139534883721,
"eval_ORGANIZATION_number": 75,
"eval_ORGANIZATION_precision": 0.6701030927835051,
"eval_ORGANIZATION_recall": 0.8666666666666667,
"eval_PERSON_f1": 0.912751677852349,
"eval_PERSON_number": 143,
"eval_PERSON_precision": 0.8774193548387097,
"eval_PERSON_recall": 0.951048951048951,
"eval_QUANTITY_f1": 0.6428571428571429,
"eval_QUANTITY_number": 23,
"eval_QUANTITY_precision": 0.5454545454545454,
"eval_QUANTITY_recall": 0.782608695652174,
"eval_TIME_f1": 0.7857142857142856,
"eval_TIME_number": 26,
"eval_TIME_precision": 0.7333333333333333,
"eval_TIME_recall": 0.8461538461538461,
"eval_loss": 0.1548575758934021,
"eval_overall_accuracy": 0.9572179134350763,
"eval_overall_f1": 0.8246575342465754,
"eval_overall_precision": 0.7698209718670077,
"eval_overall_recall": 0.887905604719764,
"eval_runtime": 0.376,
"eval_samples_per_second": 497.4,
"eval_steps_per_second": 7.98,
"step": 3074
},
{
"epoch": 30.0,
"grad_norm": 0.7155618071556091,
"learning_rate": 3.5e-05,
"loss": 0.0717,
"step": 3180
},
{
"epoch": 30.0,
"eval_LOCATION_f1": 0.7945205479452055,
"eval_LOCATION_number": 72,
"eval_LOCATION_precision": 0.7837837837837838,
"eval_LOCATION_recall": 0.8055555555555556,
"eval_ORGANIZATION_f1": 0.7664670658682634,
"eval_ORGANIZATION_number": 75,
"eval_ORGANIZATION_precision": 0.6956521739130435,
"eval_ORGANIZATION_recall": 0.8533333333333334,
"eval_PERSON_f1": 0.9225589225589226,
"eval_PERSON_number": 143,
"eval_PERSON_precision": 0.8896103896103896,
"eval_PERSON_recall": 0.958041958041958,
"eval_QUANTITY_f1": 0.6792452830188679,
"eval_QUANTITY_number": 23,
"eval_QUANTITY_precision": 0.6,
"eval_QUANTITY_recall": 0.782608695652174,
"eval_TIME_f1": 0.7924528301886792,
"eval_TIME_number": 26,
"eval_TIME_precision": 0.7777777777777778,
"eval_TIME_recall": 0.8076923076923077,
"eval_loss": 0.14325742423534393,
"eval_overall_accuracy": 0.9604703527645734,
"eval_overall_f1": 0.8324022346368715,
"eval_overall_precision": 0.7904509283819628,
"eval_overall_recall": 0.8790560471976401,
"eval_runtime": 0.3762,
"eval_samples_per_second": 497.023,
"eval_steps_per_second": 7.974,
"step": 3180
},
{
"epoch": 31.0,
"grad_norm": 0.44705238938331604,
"learning_rate": 3.45e-05,
"loss": 0.071,
"step": 3286
},
{
"epoch": 31.0,
"eval_LOCATION_f1": 0.8435374149659863,
"eval_LOCATION_number": 72,
"eval_LOCATION_precision": 0.8266666666666667,
"eval_LOCATION_recall": 0.8611111111111112,
"eval_ORGANIZATION_f1": 0.7951807228915663,
"eval_ORGANIZATION_number": 75,
"eval_ORGANIZATION_precision": 0.7252747252747253,
"eval_ORGANIZATION_recall": 0.88,
"eval_PERSON_f1": 0.9158249158249158,
"eval_PERSON_number": 143,
"eval_PERSON_precision": 0.8831168831168831,
"eval_PERSON_recall": 0.951048951048951,
"eval_QUANTITY_f1": 0.72,
"eval_QUANTITY_number": 23,
"eval_QUANTITY_precision": 0.6666666666666666,
"eval_QUANTITY_recall": 0.782608695652174,
"eval_TIME_f1": 0.8076923076923077,
"eval_TIME_number": 26,
"eval_TIME_precision": 0.8076923076923077,
"eval_TIME_recall": 0.8076923076923077,
"eval_loss": 0.14365795254707336,
"eval_overall_accuracy": 0.9619714786089567,
"eval_overall_f1": 0.8511235955056179,
"eval_overall_precision": 0.8123324396782842,
"eval_overall_recall": 0.8938053097345132,
"eval_runtime": 0.3777,
"eval_samples_per_second": 495.054,
"eval_steps_per_second": 7.942,
"step": 3286
},
{
"epoch": 32.0,
"grad_norm": 2.0400214195251465,
"learning_rate": 3.4000000000000007e-05,
"loss": 0.0652,
"step": 3392
},
{
"epoch": 32.0,
"eval_LOCATION_f1": 0.8219178082191781,
"eval_LOCATION_number": 72,
"eval_LOCATION_precision": 0.8108108108108109,
"eval_LOCATION_recall": 0.8333333333333334,
"eval_ORGANIZATION_f1": 0.785276073619632,
"eval_ORGANIZATION_number": 75,
"eval_ORGANIZATION_precision": 0.7272727272727273,
"eval_ORGANIZATION_recall": 0.8533333333333334,
"eval_PERSON_f1": 0.8986486486486487,
"eval_PERSON_number": 143,
"eval_PERSON_precision": 0.869281045751634,
"eval_PERSON_recall": 0.9300699300699301,
"eval_QUANTITY_f1": 0.7058823529411765,
"eval_QUANTITY_number": 23,
"eval_QUANTITY_precision": 0.6428571428571429,
"eval_QUANTITY_recall": 0.782608695652174,
"eval_TIME_f1": 0.7924528301886792,
"eval_TIME_number": 26,
"eval_TIME_precision": 0.7777777777777778,
"eval_TIME_recall": 0.8076923076923077,
"eval_loss": 0.142520010471344,
"eval_overall_accuracy": 0.9604703527645734,
"eval_overall_f1": 0.8349788434414668,
"eval_overall_precision": 0.8,
"eval_overall_recall": 0.8731563421828908,
"eval_runtime": 0.3737,
"eval_samples_per_second": 500.336,
"eval_steps_per_second": 8.027,
"step": 3392
},
{
"epoch": 33.0,
"grad_norm": 1.2415409088134766,
"learning_rate": 3.35e-05,
"loss": 0.0664,
"step": 3498
},
{
"epoch": 33.0,
"eval_LOCATION_f1": 0.8378378378378377,
"eval_LOCATION_number": 72,
"eval_LOCATION_precision": 0.8157894736842105,
"eval_LOCATION_recall": 0.8611111111111112,
"eval_ORGANIZATION_f1": 0.7831325301204819,
"eval_ORGANIZATION_number": 75,
"eval_ORGANIZATION_precision": 0.7142857142857143,
"eval_ORGANIZATION_recall": 0.8666666666666667,
"eval_PERSON_f1": 0.9054054054054055,
"eval_PERSON_number": 143,
"eval_PERSON_precision": 0.8758169934640523,
"eval_PERSON_recall": 0.9370629370629371,
"eval_QUANTITY_f1": 0.7058823529411765,
"eval_QUANTITY_number": 23,
"eval_QUANTITY_precision": 0.6428571428571429,
"eval_QUANTITY_recall": 0.782608695652174,
"eval_TIME_f1": 0.8461538461538461,
"eval_TIME_number": 26,
"eval_TIME_precision": 0.8461538461538461,
"eval_TIME_recall": 0.8461538461538461,
"eval_loss": 0.1492750197649002,
"eval_overall_accuracy": 0.961220915686765,
"eval_overall_f1": 0.8443197755960731,
"eval_overall_precision": 0.8048128342245989,
"eval_overall_recall": 0.887905604719764,
"eval_runtime": 0.3741,
"eval_samples_per_second": 499.878,
"eval_steps_per_second": 8.019,
"step": 3498
},
{
"epoch": 34.0,
"grad_norm": 1.1798769235610962,
"learning_rate": 3.3e-05,
"loss": 0.0623,
"step": 3604
},
{
"epoch": 34.0,
"eval_LOCATION_f1": 0.8157894736842106,
"eval_LOCATION_number": 72,
"eval_LOCATION_precision": 0.775,
"eval_LOCATION_recall": 0.8611111111111112,
"eval_ORGANIZATION_f1": 0.7790697674418604,
"eval_ORGANIZATION_number": 75,
"eval_ORGANIZATION_precision": 0.6907216494845361,
"eval_ORGANIZATION_recall": 0.8933333333333333,
"eval_PERSON_f1": 0.9096989966555185,
"eval_PERSON_number": 143,
"eval_PERSON_precision": 0.8717948717948718,
"eval_PERSON_recall": 0.951048951048951,
"eval_QUANTITY_f1": 0.6666666666666667,
"eval_QUANTITY_number": 23,
"eval_QUANTITY_precision": 0.5806451612903226,
"eval_QUANTITY_recall": 0.782608695652174,
"eval_TIME_f1": 0.75,
"eval_TIME_number": 26,
"eval_TIME_precision": 0.7,
"eval_TIME_recall": 0.8076923076923077,
"eval_loss": 0.1654369980096817,
"eval_overall_accuracy": 0.9572179134350763,
"eval_overall_f1": 0.829467939972715,
"eval_overall_precision": 0.7715736040609137,
"eval_overall_recall": 0.8967551622418879,
"eval_runtime": 0.3791,
"eval_samples_per_second": 493.243,
"eval_steps_per_second": 7.913,
"step": 3604
},
{
"epoch": 35.0,
"grad_norm": 1.1484782695770264,
"learning_rate": 3.2500000000000004e-05,
"loss": 0.0615,
"step": 3710
},
{
"epoch": 35.0,
"eval_LOCATION_f1": 0.8108108108108109,
"eval_LOCATION_number": 72,
"eval_LOCATION_precision": 0.7894736842105263,
"eval_LOCATION_recall": 0.8333333333333334,
"eval_ORGANIZATION_f1": 0.7757575757575759,
"eval_ORGANIZATION_number": 75,
"eval_ORGANIZATION_precision": 0.7111111111111111,
"eval_ORGANIZATION_recall": 0.8533333333333334,
"eval_PERSON_f1": 0.8986486486486487,
"eval_PERSON_number": 143,
"eval_PERSON_precision": 0.869281045751634,
"eval_PERSON_recall": 0.9300699300699301,
"eval_QUANTITY_f1": 0.6923076923076923,
"eval_QUANTITY_number": 23,
"eval_QUANTITY_precision": 0.6206896551724138,
"eval_QUANTITY_recall": 0.782608695652174,
"eval_TIME_f1": 0.7777777777777779,
"eval_TIME_number": 26,
"eval_TIME_precision": 0.75,
"eval_TIME_recall": 0.8076923076923077,
"eval_loss": 0.1493893563747406,
"eval_overall_accuracy": 0.9594696022016512,
"eval_overall_f1": 0.827972027972028,
"eval_overall_precision": 0.7872340425531915,
"eval_overall_recall": 0.8731563421828908,
"eval_runtime": 0.379,
"eval_samples_per_second": 493.425,
"eval_steps_per_second": 7.916,
"step": 3710
},
{
"epoch": 36.0,
"grad_norm": 1.2095956802368164,
"learning_rate": 3.2000000000000005e-05,
"loss": 0.0589,
"step": 3816
},
{
"epoch": 36.0,
"eval_LOCATION_f1": 0.8322147651006712,
"eval_LOCATION_number": 72,
"eval_LOCATION_precision": 0.8051948051948052,
"eval_LOCATION_recall": 0.8611111111111112,
"eval_ORGANIZATION_f1": 0.7738095238095238,
"eval_ORGANIZATION_number": 75,
"eval_ORGANIZATION_precision": 0.6989247311827957,
"eval_ORGANIZATION_recall": 0.8666666666666667,
"eval_PERSON_f1": 0.9090909090909092,
"eval_PERSON_number": 143,
"eval_PERSON_precision": 0.8766233766233766,
"eval_PERSON_recall": 0.9440559440559441,
"eval_QUANTITY_f1": 0.7058823529411765,
"eval_QUANTITY_number": 23,
"eval_QUANTITY_precision": 0.6428571428571429,
"eval_QUANTITY_recall": 0.782608695652174,
"eval_TIME_f1": 0.8461538461538461,
"eval_TIME_number": 26,
"eval_TIME_precision": 0.8461538461538461,
"eval_TIME_recall": 0.8461538461538461,
"eval_loss": 0.14943872392177582,
"eval_overall_accuracy": 0.961220915686765,
"eval_overall_f1": 0.8423988842398884,
"eval_overall_precision": 0.798941798941799,
"eval_overall_recall": 0.8908554572271387,
"eval_runtime": 0.3796,
"eval_samples_per_second": 492.653,
"eval_steps_per_second": 7.904,
"step": 3816
},
{
"epoch": 37.0,
"grad_norm": 0.9618573784828186,
"learning_rate": 3.15e-05,
"loss": 0.0576,
"step": 3922
},
{
"epoch": 37.0,
"eval_LOCATION_f1": 0.781456953642384,
"eval_LOCATION_number": 72,
"eval_LOCATION_precision": 0.7468354430379747,
"eval_LOCATION_recall": 0.8194444444444444,
"eval_ORGANIZATION_f1": 0.7764705882352942,
"eval_ORGANIZATION_number": 75,
"eval_ORGANIZATION_precision": 0.6947368421052632,
"eval_ORGANIZATION_recall": 0.88,
"eval_PERSON_f1": 0.9096989966555185,
"eval_PERSON_number": 143,
"eval_PERSON_precision": 0.8717948717948718,
"eval_PERSON_recall": 0.951048951048951,
"eval_QUANTITY_f1": 0.7058823529411765,
"eval_QUANTITY_number": 23,
"eval_QUANTITY_precision": 0.6428571428571429,
"eval_QUANTITY_recall": 0.782608695652174,
"eval_TIME_f1": 0.8461538461538461,
"eval_TIME_number": 26,
"eval_TIME_precision": 0.8461538461538461,
"eval_TIME_recall": 0.8461538461538461,
"eval_loss": 0.15785393118858337,
"eval_overall_accuracy": 0.9592194145609206,
"eval_overall_f1": 0.8326417704011065,
"eval_overall_precision": 0.7838541666666666,
"eval_overall_recall": 0.887905604719764,
"eval_runtime": 0.3772,
"eval_samples_per_second": 495.804,
"eval_steps_per_second": 7.954,
"step": 3922
},
{
"epoch": 38.0,
"grad_norm": 0.4735202491283417,
"learning_rate": 3.1e-05,
"loss": 0.0586,
"step": 4028
},
{
"epoch": 38.0,
"eval_LOCATION_f1": 0.8082191780821918,
"eval_LOCATION_number": 72,
"eval_LOCATION_precision": 0.7972972972972973,
"eval_LOCATION_recall": 0.8194444444444444,
"eval_ORGANIZATION_f1": 0.7950310559006211,
"eval_ORGANIZATION_number": 75,
"eval_ORGANIZATION_precision": 0.7441860465116279,
"eval_ORGANIZATION_recall": 0.8533333333333334,
"eval_PERSON_f1": 0.903654485049834,
"eval_PERSON_number": 143,
"eval_PERSON_precision": 0.8607594936708861,
"eval_PERSON_recall": 0.951048951048951,
"eval_QUANTITY_f1": 0.6792452830188679,
"eval_QUANTITY_number": 23,
"eval_QUANTITY_precision": 0.6,
"eval_QUANTITY_recall": 0.782608695652174,
"eval_TIME_f1": 0.7924528301886792,
"eval_TIME_number": 26,
"eval_TIME_precision": 0.7777777777777778,
"eval_TIME_recall": 0.8076923076923077,
"eval_loss": 0.15275536477565765,
"eval_overall_accuracy": 0.9589692269201902,
"eval_overall_f1": 0.8347338935574229,
"eval_overall_precision": 0.7946666666666666,
"eval_overall_recall": 0.8790560471976401,
"eval_runtime": 0.3775,
"eval_samples_per_second": 495.303,
"eval_steps_per_second": 7.946,
"step": 4028
},
{
"epoch": 39.0,
"grad_norm": 0.5576403141021729,
"learning_rate": 3.05e-05,
"loss": 0.0577,
"step": 4134
},
{
"epoch": 39.0,
"eval_LOCATION_f1": 0.8378378378378377,
"eval_LOCATION_number": 72,
"eval_LOCATION_precision": 0.8157894736842105,
"eval_LOCATION_recall": 0.8611111111111112,
"eval_ORGANIZATION_f1": 0.7738095238095238,
"eval_ORGANIZATION_number": 75,
"eval_ORGANIZATION_precision": 0.6989247311827957,
"eval_ORGANIZATION_recall": 0.8666666666666667,
"eval_PERSON_f1": 0.9261744966442954,
"eval_PERSON_number": 143,
"eval_PERSON_precision": 0.8903225806451613,
"eval_PERSON_recall": 0.965034965034965,
"eval_QUANTITY_f1": 0.7058823529411765,
"eval_QUANTITY_number": 23,
"eval_QUANTITY_precision": 0.6428571428571429,
"eval_QUANTITY_recall": 0.782608695652174,
"eval_TIME_f1": 0.8461538461538461,
"eval_TIME_number": 26,
"eval_TIME_precision": 0.8461538461538461,
"eval_TIME_recall": 0.8461538461538461,
"eval_loss": 0.16170634329319,
"eval_overall_accuracy": 0.9599699774831123,
"eval_overall_f1": 0.8507670850767085,
"eval_overall_precision": 0.8068783068783069,
"eval_overall_recall": 0.8997050147492626,
"eval_runtime": 0.3771,
"eval_samples_per_second": 495.837,
"eval_steps_per_second": 7.955,
"step": 4134
},
{
"epoch": 40.0,
"grad_norm": 0.4916011393070221,
"learning_rate": 3e-05,
"loss": 0.0536,
"step": 4240
},
{
"epoch": 40.0,
"eval_LOCATION_f1": 0.8421052631578948,
"eval_LOCATION_number": 72,
"eval_LOCATION_precision": 0.8,
"eval_LOCATION_recall": 0.8888888888888888,
"eval_ORGANIZATION_f1": 0.7607361963190183,
"eval_ORGANIZATION_number": 75,
"eval_ORGANIZATION_precision": 0.7045454545454546,
"eval_ORGANIZATION_recall": 0.8266666666666667,
"eval_PERSON_f1": 0.9090909090909092,
"eval_PERSON_number": 143,
"eval_PERSON_precision": 0.8766233766233766,
"eval_PERSON_recall": 0.9440559440559441,
"eval_QUANTITY_f1": 0.6792452830188679,
"eval_QUANTITY_number": 23,
"eval_QUANTITY_precision": 0.6,
"eval_QUANTITY_recall": 0.782608695652174,
"eval_TIME_f1": 0.7777777777777779,
"eval_TIME_number": 26,
"eval_TIME_precision": 0.75,
"eval_TIME_recall": 0.8076923076923077,
"eval_loss": 0.15796098113059998,
"eval_overall_accuracy": 0.9602201651238429,
"eval_overall_f1": 0.8344923504867873,
"eval_overall_precision": 0.7894736842105263,
"eval_overall_recall": 0.8849557522123894,
"eval_runtime": 0.3745,
"eval_samples_per_second": 499.28,
"eval_steps_per_second": 8.01,
"step": 4240
},
{
"epoch": 41.0,
"grad_norm": 0.9400687217712402,
"learning_rate": 2.95e-05,
"loss": 0.0572,
"step": 4346
},
{
"epoch": 41.0,
"eval_LOCATION_f1": 0.8322147651006712,
"eval_LOCATION_number": 72,
"eval_LOCATION_precision": 0.8051948051948052,
"eval_LOCATION_recall": 0.8611111111111112,
"eval_ORGANIZATION_f1": 0.7664670658682634,
"eval_ORGANIZATION_number": 75,
"eval_ORGANIZATION_precision": 0.6956521739130435,
"eval_ORGANIZATION_recall": 0.8533333333333334,
"eval_PERSON_f1": 0.9169435215946844,
"eval_PERSON_number": 143,
"eval_PERSON_precision": 0.8734177215189873,
"eval_PERSON_recall": 0.965034965034965,
"eval_QUANTITY_f1": 0.7058823529411765,
"eval_QUANTITY_number": 23,
"eval_QUANTITY_precision": 0.6428571428571429,
"eval_QUANTITY_recall": 0.782608695652174,
"eval_TIME_f1": 0.8846153846153846,
"eval_TIME_number": 26,
"eval_TIME_precision": 0.8846153846153846,
"eval_TIME_recall": 0.8846153846153846,
"eval_loss": 0.1550283432006836,
"eval_overall_accuracy": 0.9597197898423818,
"eval_overall_f1": 0.8472222222222222,
"eval_overall_precision": 0.800524934383202,
"eval_overall_recall": 0.8997050147492626,
"eval_runtime": 0.3774,
"eval_samples_per_second": 495.49,
"eval_steps_per_second": 7.949,
"step": 4346
},
{
"epoch": 42.0,
"grad_norm": 1.621040940284729,
"learning_rate": 2.9e-05,
"loss": 0.0524,
"step": 4452
},
{
"epoch": 42.0,
"eval_LOCATION_f1": 0.8079470198675496,
"eval_LOCATION_number": 72,
"eval_LOCATION_precision": 0.7721518987341772,
"eval_LOCATION_recall": 0.8472222222222222,
"eval_ORGANIZATION_f1": 0.7831325301204819,
"eval_ORGANIZATION_number": 75,
"eval_ORGANIZATION_precision": 0.7142857142857143,
"eval_ORGANIZATION_recall": 0.8666666666666667,
"eval_PERSON_f1": 0.9,
"eval_PERSON_number": 143,
"eval_PERSON_precision": 0.8598726114649682,
"eval_PERSON_recall": 0.9440559440559441,
"eval_QUANTITY_f1": 0.7037037037037037,
"eval_QUANTITY_number": 23,
"eval_QUANTITY_precision": 0.6129032258064516,
"eval_QUANTITY_recall": 0.8260869565217391,
"eval_TIME_f1": 0.8,
"eval_TIME_number": 26,
"eval_TIME_precision": 0.7586206896551724,
"eval_TIME_recall": 0.8461538461538461,
"eval_loss": 0.1589338332414627,
"eval_overall_accuracy": 0.9589692269201902,
"eval_overall_f1": 0.8319559228650136,
"eval_overall_precision": 0.7803617571059431,
"eval_overall_recall": 0.8908554572271387,
"eval_runtime": 0.3778,
"eval_samples_per_second": 495.011,
"eval_steps_per_second": 7.941,
"step": 4452
},
{
"epoch": 43.0,
"grad_norm": 0.5988844037055969,
"learning_rate": 2.8499999999999998e-05,
"loss": 0.052,
"step": 4558
},
{
"epoch": 43.0,
"eval_LOCATION_f1": 0.8108108108108109,
"eval_LOCATION_number": 72,
"eval_LOCATION_precision": 0.7894736842105263,
"eval_LOCATION_recall": 0.8333333333333334,
"eval_ORGANIZATION_f1": 0.779874213836478,
"eval_ORGANIZATION_number": 75,
"eval_ORGANIZATION_precision": 0.7380952380952381,
"eval_ORGANIZATION_recall": 0.8266666666666667,
"eval_PERSON_f1": 0.9090909090909092,
"eval_PERSON_number": 143,
"eval_PERSON_precision": 0.8766233766233766,
"eval_PERSON_recall": 0.9440559440559441,
"eval_QUANTITY_f1": 0.7058823529411765,
"eval_QUANTITY_number": 23,
"eval_QUANTITY_precision": 0.6428571428571429,
"eval_QUANTITY_recall": 0.782608695652174,
"eval_TIME_f1": 0.8461538461538461,
"eval_TIME_number": 26,
"eval_TIME_precision": 0.8461538461538461,
"eval_TIME_recall": 0.8461538461538461,
"eval_loss": 0.15005570650100708,
"eval_overall_accuracy": 0.9609707280460346,
"eval_overall_f1": 0.8401697312588402,
"eval_overall_precision": 0.8070652173913043,
"eval_overall_recall": 0.8761061946902655,
"eval_runtime": 0.3737,
"eval_samples_per_second": 500.434,
"eval_steps_per_second": 8.028,
"step": 4558
},
{
"epoch": 44.0,
"grad_norm": 0.9367622137069702,
"learning_rate": 2.8000000000000003e-05,
"loss": 0.0509,
"step": 4664
},
{
"epoch": 44.0,
"eval_LOCATION_f1": 0.8053691275167787,
"eval_LOCATION_number": 72,
"eval_LOCATION_precision": 0.7792207792207793,
"eval_LOCATION_recall": 0.8333333333333334,
"eval_ORGANIZATION_f1": 0.7875000000000001,
"eval_ORGANIZATION_number": 75,
"eval_ORGANIZATION_precision": 0.7411764705882353,
"eval_ORGANIZATION_recall": 0.84,
"eval_PERSON_f1": 0.9163879598662208,
"eval_PERSON_number": 143,
"eval_PERSON_precision": 0.8782051282051282,
"eval_PERSON_recall": 0.958041958041958,
"eval_QUANTITY_f1": 0.6923076923076923,
"eval_QUANTITY_number": 23,
"eval_QUANTITY_precision": 0.6206896551724138,
"eval_QUANTITY_recall": 0.782608695652174,
"eval_TIME_f1": 0.7924528301886792,
"eval_TIME_number": 26,
"eval_TIME_precision": 0.7777777777777778,
"eval_TIME_recall": 0.8076923076923077,
"eval_loss": 0.15873059630393982,
"eval_overall_accuracy": 0.9597197898423818,
"eval_overall_f1": 0.8387096774193548,
"eval_overall_precision": 0.7994652406417112,
"eval_overall_recall": 0.8820058997050148,
"eval_runtime": 0.3736,
"eval_samples_per_second": 500.546,
"eval_steps_per_second": 8.03,
"step": 4664
},
{
"epoch": 45.0,
"grad_norm": 0.6508892178535461,
"learning_rate": 2.7500000000000004e-05,
"loss": 0.049,
"step": 4770
},
{
"epoch": 45.0,
"eval_LOCATION_f1": 0.8079470198675496,
"eval_LOCATION_number": 72,
"eval_LOCATION_precision": 0.7721518987341772,
"eval_LOCATION_recall": 0.8472222222222222,
"eval_ORGANIZATION_f1": 0.7749999999999999,
"eval_ORGANIZATION_number": 75,
"eval_ORGANIZATION_precision": 0.7294117647058823,
"eval_ORGANIZATION_recall": 0.8266666666666667,
"eval_PERSON_f1": 0.903654485049834,
"eval_PERSON_number": 143,
"eval_PERSON_precision": 0.8607594936708861,
"eval_PERSON_recall": 0.951048951048951,
"eval_QUANTITY_f1": 0.7307692307692308,
"eval_QUANTITY_number": 23,
"eval_QUANTITY_precision": 0.6551724137931034,
"eval_QUANTITY_recall": 0.8260869565217391,
"eval_TIME_f1": 0.7777777777777779,
"eval_TIME_number": 26,
"eval_TIME_precision": 0.75,
"eval_TIME_recall": 0.8076923076923077,
"eval_loss": 0.15799470245838165,
"eval_overall_accuracy": 0.960720540405304,
"eval_overall_f1": 0.8328690807799444,
"eval_overall_precision": 0.7889182058047494,
"eval_overall_recall": 0.8820058997050148,
"eval_runtime": 0.375,
"eval_samples_per_second": 498.627,
"eval_steps_per_second": 7.999,
"step": 4770
},
{
"epoch": 46.0,
"grad_norm": 0.3828009068965912,
"learning_rate": 2.7000000000000002e-05,
"loss": 0.0479,
"step": 4876
},
{
"epoch": 46.0,
"eval_LOCATION_f1": 0.8513513513513513,
"eval_LOCATION_number": 72,
"eval_LOCATION_precision": 0.8289473684210527,
"eval_LOCATION_recall": 0.875,
"eval_ORGANIZATION_f1": 0.779874213836478,
"eval_ORGANIZATION_number": 75,
"eval_ORGANIZATION_precision": 0.7380952380952381,
"eval_ORGANIZATION_recall": 0.8266666666666667,
"eval_PERSON_f1": 0.9096989966555185,
"eval_PERSON_number": 143,
"eval_PERSON_precision": 0.8717948717948718,
"eval_PERSON_recall": 0.951048951048951,
"eval_QUANTITY_f1": 0.7307692307692308,
"eval_QUANTITY_number": 23,
"eval_QUANTITY_precision": 0.6551724137931034,
"eval_QUANTITY_recall": 0.8260869565217391,
"eval_TIME_f1": 0.8148148148148148,
"eval_TIME_number": 26,
"eval_TIME_precision": 0.7857142857142857,
"eval_TIME_recall": 0.8461538461538461,
"eval_loss": 0.1539916843175888,
"eval_overall_accuracy": 0.9627220415311484,
"eval_overall_f1": 0.848314606741573,
"eval_overall_precision": 0.8096514745308311,
"eval_overall_recall": 0.8908554572271387,
"eval_runtime": 0.3768,
"eval_samples_per_second": 496.259,
"eval_steps_per_second": 7.961,
"step": 4876
},
{
"epoch": 47.0,
"grad_norm": 1.15745210647583,
"learning_rate": 2.6500000000000004e-05,
"loss": 0.0488,
"step": 4982
},
{
"epoch": 47.0,
"eval_LOCATION_f1": 0.8378378378378377,
"eval_LOCATION_number": 72,
"eval_LOCATION_precision": 0.8157894736842105,
"eval_LOCATION_recall": 0.8611111111111112,
"eval_ORGANIZATION_f1": 0.7484662576687117,
"eval_ORGANIZATION_number": 75,
"eval_ORGANIZATION_precision": 0.6931818181818182,
"eval_ORGANIZATION_recall": 0.8133333333333334,
"eval_PERSON_f1": 0.8786885245901639,
"eval_PERSON_number": 143,
"eval_PERSON_precision": 0.8271604938271605,
"eval_PERSON_recall": 0.9370629370629371,
"eval_QUANTITY_f1": 0.7058823529411765,
"eval_QUANTITY_number": 23,
"eval_QUANTITY_precision": 0.6428571428571429,
"eval_QUANTITY_recall": 0.782608695652174,
"eval_TIME_f1": 0.830188679245283,
"eval_TIME_number": 26,
"eval_TIME_precision": 0.8148148148148148,
"eval_TIME_recall": 0.8461538461538461,
"eval_loss": 0.1685992181301117,
"eval_overall_accuracy": 0.9564673505128847,
"eval_overall_f1": 0.825,
"eval_overall_precision": 0.7795275590551181,
"eval_overall_recall": 0.8761061946902655,
"eval_runtime": 0.3766,
"eval_samples_per_second": 496.508,
"eval_steps_per_second": 7.965,
"step": 4982
},
{
"epoch": 48.0,
"grad_norm": 0.9865849614143372,
"learning_rate": 2.6000000000000002e-05,
"loss": 0.0468,
"step": 5088
},
{
"epoch": 48.0,
"eval_LOCATION_f1": 0.8571428571428572,
"eval_LOCATION_number": 72,
"eval_LOCATION_precision": 0.84,
"eval_LOCATION_recall": 0.875,
"eval_ORGANIZATION_f1": 0.7500000000000001,
"eval_ORGANIZATION_number": 75,
"eval_ORGANIZATION_precision": 0.7058823529411765,
"eval_ORGANIZATION_recall": 0.8,
"eval_PERSON_f1": 0.8993288590604027,
"eval_PERSON_number": 143,
"eval_PERSON_precision": 0.864516129032258,
"eval_PERSON_recall": 0.9370629370629371,
"eval_QUANTITY_f1": 0.7058823529411765,
"eval_QUANTITY_number": 23,
"eval_QUANTITY_precision": 0.6428571428571429,
"eval_QUANTITY_recall": 0.782608695652174,
"eval_TIME_f1": 0.8679245283018868,
"eval_TIME_number": 26,
"eval_TIME_precision": 0.8518518518518519,
"eval_TIME_recall": 0.8846153846153846,
"eval_loss": 0.15260353684425354,
"eval_overall_accuracy": 0.9632224168126094,
"eval_overall_f1": 0.840620592383639,
"eval_overall_precision": 0.8054054054054054,
"eval_overall_recall": 0.8790560471976401,
"eval_runtime": 0.3789,
"eval_samples_per_second": 493.563,
"eval_steps_per_second": 7.918,
"step": 5088
},
{
"epoch": 49.0,
"grad_norm": 0.6459212303161621,
"learning_rate": 2.5500000000000003e-05,
"loss": 0.0474,
"step": 5194
},
{
"epoch": 49.0,
"eval_LOCATION_f1": 0.8187919463087249,
"eval_LOCATION_number": 72,
"eval_LOCATION_precision": 0.7922077922077922,
"eval_LOCATION_recall": 0.8472222222222222,
"eval_ORGANIZATION_f1": 0.7607361963190183,
"eval_ORGANIZATION_number": 75,
"eval_ORGANIZATION_precision": 0.7045454545454546,
"eval_ORGANIZATION_recall": 0.8266666666666667,
"eval_PERSON_f1": 0.9169435215946844,
"eval_PERSON_number": 143,
"eval_PERSON_precision": 0.8734177215189873,
"eval_PERSON_recall": 0.965034965034965,
"eval_QUANTITY_f1": 0.6923076923076923,
"eval_QUANTITY_number": 23,
"eval_QUANTITY_precision": 0.6206896551724138,
"eval_QUANTITY_recall": 0.782608695652174,
"eval_TIME_f1": 0.8461538461538461,
"eval_TIME_number": 26,
"eval_TIME_precision": 0.8461538461538461,
"eval_TIME_recall": 0.8461538461538461,
"eval_loss": 0.16667716205120087,
"eval_overall_accuracy": 0.9604703527645734,
"eval_overall_f1": 0.8396094839609484,
"eval_overall_precision": 0.7962962962962963,
"eval_overall_recall": 0.887905604719764,
"eval_runtime": 0.3755,
"eval_samples_per_second": 498.016,
"eval_steps_per_second": 7.99,
"step": 5194
},
{
"epoch": 50.0,
"grad_norm": 0.7612103223800659,
"learning_rate": 2.5e-05,
"loss": 0.0485,
"step": 5300
},
{
"epoch": 50.0,
"eval_LOCATION_f1": 0.8356164383561645,
"eval_LOCATION_number": 72,
"eval_LOCATION_precision": 0.8243243243243243,
"eval_LOCATION_recall": 0.8472222222222222,
"eval_ORGANIZATION_f1": 0.782051282051282,
"eval_ORGANIZATION_number": 75,
"eval_ORGANIZATION_precision": 0.7530864197530864,
"eval_ORGANIZATION_recall": 0.8133333333333334,
"eval_PERSON_f1": 0.912751677852349,
"eval_PERSON_number": 143,
"eval_PERSON_precision": 0.8774193548387097,
"eval_PERSON_recall": 0.951048951048951,
"eval_QUANTITY_f1": 0.76,
"eval_QUANTITY_number": 23,
"eval_QUANTITY_precision": 0.7037037037037037,
"eval_QUANTITY_recall": 0.8260869565217391,
"eval_TIME_f1": 0.8627450980392156,
"eval_TIME_number": 26,
"eval_TIME_precision": 0.88,
"eval_TIME_recall": 0.8461538461538461,
"eval_loss": 0.15263156592845917,
"eval_overall_accuracy": 0.96347260445334,
"eval_overall_f1": 0.8530670470756063,
"eval_overall_precision": 0.8259668508287292,
"eval_overall_recall": 0.8820058997050148,
"eval_runtime": 0.377,
"eval_samples_per_second": 496.057,
"eval_steps_per_second": 7.958,
"step": 5300
},
{
"epoch": 51.0,
"grad_norm": 0.8503948450088501,
"learning_rate": 2.45e-05,
"loss": 0.0443,
"step": 5406
},
{
"epoch": 51.0,
"eval_LOCATION_f1": 0.8435374149659863,
"eval_LOCATION_number": 72,
"eval_LOCATION_precision": 0.8266666666666667,
"eval_LOCATION_recall": 0.8611111111111112,
"eval_ORGANIZATION_f1": 0.7784431137724551,
"eval_ORGANIZATION_number": 75,
"eval_ORGANIZATION_precision": 0.7065217391304348,
"eval_ORGANIZATION_recall": 0.8666666666666667,
"eval_PERSON_f1": 0.9266666666666666,
"eval_PERSON_number": 143,
"eval_PERSON_precision": 0.8853503184713376,
"eval_PERSON_recall": 0.972027972027972,
"eval_QUANTITY_f1": 0.7169811320754716,
"eval_QUANTITY_number": 23,
"eval_QUANTITY_precision": 0.6333333333333333,
"eval_QUANTITY_recall": 0.8260869565217391,
"eval_TIME_f1": 0.8461538461538461,
"eval_TIME_number": 26,
"eval_TIME_precision": 0.8461538461538461,
"eval_TIME_recall": 0.8461538461538461,
"eval_loss": 0.16938814520835876,
"eval_overall_accuracy": 0.961220915686765,
"eval_overall_f1": 0.8539638386648123,
"eval_overall_precision": 0.8078947368421052,
"eval_overall_recall": 0.9056047197640118,
"eval_runtime": 0.3781,
"eval_samples_per_second": 494.577,
"eval_steps_per_second": 7.934,
"step": 5406
},
{
"epoch": 52.0,
"grad_norm": 0.4882877767086029,
"learning_rate": 2.4e-05,
"loss": 0.0468,
"step": 5512
},
{
"epoch": 52.0,
"eval_LOCATION_f1": 0.8299319727891157,
"eval_LOCATION_number": 72,
"eval_LOCATION_precision": 0.8133333333333334,
"eval_LOCATION_recall": 0.8472222222222222,
"eval_ORGANIZATION_f1": 0.7701863354037267,
"eval_ORGANIZATION_number": 75,
"eval_ORGANIZATION_precision": 0.7209302325581395,
"eval_ORGANIZATION_recall": 0.8266666666666667,
"eval_PERSON_f1": 0.9,
"eval_PERSON_number": 143,
"eval_PERSON_precision": 0.8598726114649682,
"eval_PERSON_recall": 0.9440559440559441,
"eval_QUANTITY_f1": 0.6538461538461539,
"eval_QUANTITY_number": 23,
"eval_QUANTITY_precision": 0.5862068965517241,
"eval_QUANTITY_recall": 0.7391304347826086,
"eval_TIME_f1": 0.7636363636363636,
"eval_TIME_number": 26,
"eval_TIME_precision": 0.7241379310344828,
"eval_TIME_recall": 0.8076923076923077,
"eval_loss": 0.1636158525943756,
"eval_overall_accuracy": 0.9584688516387291,
"eval_overall_f1": 0.827972027972028,
"eval_overall_precision": 0.7872340425531915,
"eval_overall_recall": 0.8731563421828908,
"eval_runtime": 0.3764,
"eval_samples_per_second": 496.803,
"eval_steps_per_second": 7.97,
"step": 5512
},
{
"epoch": 53.0,
"grad_norm": 1.0076719522476196,
"learning_rate": 2.35e-05,
"loss": 0.0439,
"step": 5618
},
{
"epoch": 53.0,
"eval_LOCATION_f1": 0.8137931034482759,
"eval_LOCATION_number": 72,
"eval_LOCATION_precision": 0.8082191780821918,
"eval_LOCATION_recall": 0.8194444444444444,
"eval_ORGANIZATION_f1": 0.785276073619632,
"eval_ORGANIZATION_number": 75,
"eval_ORGANIZATION_precision": 0.7272727272727273,
"eval_ORGANIZATION_recall": 0.8533333333333334,
"eval_PERSON_f1": 0.923076923076923,
"eval_PERSON_number": 143,
"eval_PERSON_precision": 0.8846153846153846,
"eval_PERSON_recall": 0.965034965034965,
"eval_QUANTITY_f1": 0.6785714285714286,
"eval_QUANTITY_number": 23,
"eval_QUANTITY_precision": 0.5757575757575758,
"eval_QUANTITY_recall": 0.8260869565217391,
"eval_TIME_f1": 0.8461538461538461,
"eval_TIME_number": 26,
"eval_TIME_precision": 0.8461538461538461,
"eval_TIME_recall": 0.8461538461538461,
"eval_loss": 0.16856712102890015,
"eval_overall_accuracy": 0.9597197898423818,
"eval_overall_f1": 0.8447552447552448,
"eval_overall_precision": 0.8031914893617021,
"eval_overall_recall": 0.8908554572271387,
"eval_runtime": 0.3772,
"eval_samples_per_second": 495.818,
"eval_steps_per_second": 7.954,
"step": 5618
},
{
"epoch": 54.0,
"grad_norm": 0.4930567443370819,
"learning_rate": 2.3000000000000003e-05,
"loss": 0.0449,
"step": 5724
},
{
"epoch": 54.0,
"eval_LOCATION_f1": 0.8400000000000001,
"eval_LOCATION_number": 72,
"eval_LOCATION_precision": 0.8076923076923077,
"eval_LOCATION_recall": 0.875,
"eval_ORGANIZATION_f1": 0.7826086956521738,
"eval_ORGANIZATION_number": 75,
"eval_ORGANIZATION_precision": 0.7325581395348837,
"eval_ORGANIZATION_recall": 0.84,
"eval_PERSON_f1": 0.9169435215946844,
"eval_PERSON_number": 143,
"eval_PERSON_precision": 0.8734177215189873,
"eval_PERSON_recall": 0.965034965034965,
"eval_QUANTITY_f1": 0.6666666666666667,
"eval_QUANTITY_number": 23,
"eval_QUANTITY_precision": 0.5806451612903226,
"eval_QUANTITY_recall": 0.782608695652174,
"eval_TIME_f1": 0.830188679245283,
"eval_TIME_number": 26,
"eval_TIME_precision": 0.8148148148148148,
"eval_TIME_recall": 0.8461538461538461,
"eval_loss": 0.16776379942893982,
"eval_overall_accuracy": 0.9602201651238429,
"eval_overall_f1": 0.8456189151599444,
"eval_overall_precision": 0.8,
"eval_overall_recall": 0.8967551622418879,
"eval_runtime": 0.3777,
"eval_samples_per_second": 495.066,
"eval_steps_per_second": 7.942,
"step": 5724
},
{
"epoch": 55.0,
"grad_norm": 1.5758038759231567,
"learning_rate": 2.25e-05,
"loss": 0.0428,
"step": 5830
},
{
"epoch": 55.0,
"eval_LOCATION_f1": 0.8187919463087249,
"eval_LOCATION_number": 72,
"eval_LOCATION_precision": 0.7922077922077922,
"eval_LOCATION_recall": 0.8472222222222222,
"eval_ORGANIZATION_f1": 0.7831325301204819,
"eval_ORGANIZATION_number": 75,
"eval_ORGANIZATION_precision": 0.7142857142857143,
"eval_ORGANIZATION_recall": 0.8666666666666667,
"eval_PERSON_f1": 0.92,
"eval_PERSON_number": 143,
"eval_PERSON_precision": 0.8789808917197452,
"eval_PERSON_recall": 0.965034965034965,
"eval_QUANTITY_f1": 0.7058823529411765,
"eval_QUANTITY_number": 23,
"eval_QUANTITY_precision": 0.6428571428571429,
"eval_QUANTITY_recall": 0.782608695652174,
"eval_TIME_f1": 0.7931034482758621,
"eval_TIME_number": 26,
"eval_TIME_precision": 0.71875,
"eval_TIME_recall": 0.8846153846153846,
"eval_loss": 0.17032887041568756,
"eval_overall_accuracy": 0.9602201651238429,
"eval_overall_f1": 0.8425414364640885,
"eval_overall_precision": 0.7922077922077922,
"eval_overall_recall": 0.8997050147492626,
"eval_runtime": 0.3758,
"eval_samples_per_second": 497.571,
"eval_steps_per_second": 7.982,
"step": 5830
},
{
"epoch": 56.0,
"grad_norm": 0.7785055637359619,
"learning_rate": 2.2000000000000003e-05,
"loss": 0.043,
"step": 5936
},
{
"epoch": 56.0,
"eval_LOCATION_f1": 0.8211920529801324,
"eval_LOCATION_number": 72,
"eval_LOCATION_precision": 0.7848101265822784,
"eval_LOCATION_recall": 0.8611111111111112,
"eval_ORGANIZATION_f1": 0.7710843373493976,
"eval_ORGANIZATION_number": 75,
"eval_ORGANIZATION_precision": 0.7032967032967034,
"eval_ORGANIZATION_recall": 0.8533333333333334,
"eval_PERSON_f1": 0.9328859060402686,
"eval_PERSON_number": 143,
"eval_PERSON_precision": 0.896774193548387,
"eval_PERSON_recall": 0.972027972027972,
"eval_QUANTITY_f1": 0.6923076923076923,
"eval_QUANTITY_number": 23,
"eval_QUANTITY_precision": 0.6206896551724138,
"eval_QUANTITY_recall": 0.782608695652174,
"eval_TIME_f1": 0.830188679245283,
"eval_TIME_number": 26,
"eval_TIME_precision": 0.8148148148148148,
"eval_TIME_recall": 0.8461538461538461,
"eval_loss": 0.1670546680688858,
"eval_overall_accuracy": 0.960720540405304,
"eval_overall_f1": 0.8472222222222222,
"eval_overall_precision": 0.800524934383202,
"eval_overall_recall": 0.8997050147492626,
"eval_runtime": 0.3758,
"eval_samples_per_second": 497.561,
"eval_steps_per_second": 7.982,
"step": 5936
},
{
"epoch": 57.0,
"grad_norm": 0.49103009700775146,
"learning_rate": 2.15e-05,
"loss": 0.0405,
"step": 6042
},
{
"epoch": 57.0,
"eval_LOCATION_f1": 0.8219178082191781,
"eval_LOCATION_number": 72,
"eval_LOCATION_precision": 0.8108108108108109,
"eval_LOCATION_recall": 0.8333333333333334,
"eval_ORGANIZATION_f1": 0.7848101265822784,
"eval_ORGANIZATION_number": 75,
"eval_ORGANIZATION_precision": 0.7469879518072289,
"eval_ORGANIZATION_recall": 0.8266666666666667,
"eval_PERSON_f1": 0.9225589225589226,
"eval_PERSON_number": 143,
"eval_PERSON_precision": 0.8896103896103896,
"eval_PERSON_recall": 0.958041958041958,
"eval_QUANTITY_f1": 0.7307692307692308,
"eval_QUANTITY_number": 23,
"eval_QUANTITY_precision": 0.6551724137931034,
"eval_QUANTITY_recall": 0.8260869565217391,
"eval_TIME_f1": 0.8461538461538461,
"eval_TIME_number": 26,
"eval_TIME_precision": 0.8461538461538461,
"eval_TIME_recall": 0.8461538461538461,
"eval_loss": 0.15890353918075562,
"eval_overall_accuracy": 0.9624718538904178,
"eval_overall_f1": 0.851063829787234,
"eval_overall_precision": 0.819672131147541,
"eval_overall_recall": 0.8849557522123894,
"eval_runtime": 0.3783,
"eval_samples_per_second": 494.38,
"eval_steps_per_second": 7.931,
"step": 6042
},
{
"epoch": 58.0,
"grad_norm": 0.5003204345703125,
"learning_rate": 2.1e-05,
"loss": 0.0402,
"step": 6148
},
{
"epoch": 58.0,
"eval_LOCATION_f1": 0.8243243243243243,
"eval_LOCATION_number": 72,
"eval_LOCATION_precision": 0.8026315789473685,
"eval_LOCATION_recall": 0.8472222222222222,
"eval_ORGANIZATION_f1": 0.7654320987654321,
"eval_ORGANIZATION_number": 75,
"eval_ORGANIZATION_precision": 0.7126436781609196,
"eval_ORGANIZATION_recall": 0.8266666666666667,
"eval_PERSON_f1": 0.9133333333333333,
"eval_PERSON_number": 143,
"eval_PERSON_precision": 0.8726114649681529,
"eval_PERSON_recall": 0.958041958041958,
"eval_QUANTITY_f1": 0.6792452830188679,
"eval_QUANTITY_number": 23,
"eval_QUANTITY_precision": 0.6,
"eval_QUANTITY_recall": 0.782608695652174,
"eval_TIME_f1": 0.8148148148148148,
"eval_TIME_number": 26,
"eval_TIME_precision": 0.7857142857142857,
"eval_TIME_recall": 0.8461538461538461,
"eval_loss": 0.16718268394470215,
"eval_overall_accuracy": 0.9609707280460346,
"eval_overall_f1": 0.8368200836820084,
"eval_overall_precision": 0.7936507936507936,
"eval_overall_recall": 0.8849557522123894,
"eval_runtime": 0.378,
"eval_samples_per_second": 494.745,
"eval_steps_per_second": 7.937,
"step": 6148
},
{
"epoch": 59.0,
"grad_norm": 0.12552323937416077,
"learning_rate": 2.05e-05,
"loss": 0.0408,
"step": 6254
},
{
"epoch": 59.0,
"eval_LOCATION_f1": 0.8243243243243243,
"eval_LOCATION_number": 72,
"eval_LOCATION_precision": 0.8026315789473685,
"eval_LOCATION_recall": 0.8472222222222222,
"eval_ORGANIZATION_f1": 0.7721518987341773,
"eval_ORGANIZATION_number": 75,
"eval_ORGANIZATION_precision": 0.7349397590361446,
"eval_ORGANIZATION_recall": 0.8133333333333334,
"eval_PERSON_f1": 0.9133333333333333,
"eval_PERSON_number": 143,
"eval_PERSON_precision": 0.8726114649681529,
"eval_PERSON_recall": 0.958041958041958,
"eval_QUANTITY_f1": 0.6923076923076923,
"eval_QUANTITY_number": 23,
"eval_QUANTITY_precision": 0.6206896551724138,
"eval_QUANTITY_recall": 0.782608695652174,
"eval_TIME_f1": 0.8363636363636363,
"eval_TIME_number": 26,
"eval_TIME_precision": 0.7931034482758621,
"eval_TIME_recall": 0.8846153846153846,
"eval_loss": 0.16901348531246185,
"eval_overall_accuracy": 0.9627220415311484,
"eval_overall_f1": 0.8415147265077138,
"eval_overall_precision": 0.8021390374331551,
"eval_overall_recall": 0.8849557522123894,
"eval_runtime": 0.3776,
"eval_samples_per_second": 495.25,
"eval_steps_per_second": 7.945,
"step": 6254
},
{
"epoch": 60.0,
"grad_norm": 0.5769420266151428,
"learning_rate": 2e-05,
"loss": 0.0384,
"step": 6360
},
{
"epoch": 60.0,
"eval_LOCATION_f1": 0.8133333333333332,
"eval_LOCATION_number": 72,
"eval_LOCATION_precision": 0.782051282051282,
"eval_LOCATION_recall": 0.8472222222222222,
"eval_ORGANIZATION_f1": 0.7619047619047621,
"eval_ORGANIZATION_number": 75,
"eval_ORGANIZATION_precision": 0.6881720430107527,
"eval_ORGANIZATION_recall": 0.8533333333333334,
"eval_PERSON_f1": 0.92,
"eval_PERSON_number": 143,
"eval_PERSON_precision": 0.8789808917197452,
"eval_PERSON_recall": 0.965034965034965,
"eval_QUANTITY_f1": 0.7307692307692308,
"eval_QUANTITY_number": 23,
"eval_QUANTITY_precision": 0.6551724137931034,
"eval_QUANTITY_recall": 0.8260869565217391,
"eval_TIME_f1": 0.7586206896551724,
"eval_TIME_number": 26,
"eval_TIME_precision": 0.6875,
"eval_TIME_recall": 0.8461538461538461,
"eval_loss": 0.1785995215177536,
"eval_overall_accuracy": 0.9599699774831123,
"eval_overall_f1": 0.8351648351648351,
"eval_overall_precision": 0.781491002570694,
"eval_overall_recall": 0.8967551622418879,
"eval_runtime": 0.377,
"eval_samples_per_second": 496.039,
"eval_steps_per_second": 7.958,
"step": 6360
},
{
"epoch": 61.0,
"grad_norm": 0.23254899680614471,
"learning_rate": 1.9500000000000003e-05,
"loss": 0.0381,
"step": 6466
},
{
"epoch": 61.0,
"eval_LOCATION_f1": 0.8226950354609929,
"eval_LOCATION_number": 72,
"eval_LOCATION_precision": 0.8405797101449275,
"eval_LOCATION_recall": 0.8055555555555556,
"eval_ORGANIZATION_f1": 0.763157894736842,
"eval_ORGANIZATION_number": 75,
"eval_ORGANIZATION_precision": 0.7532467532467533,
"eval_ORGANIZATION_recall": 0.7733333333333333,
"eval_PERSON_f1": 0.9023569023569024,
"eval_PERSON_number": 143,
"eval_PERSON_precision": 0.8701298701298701,
"eval_PERSON_recall": 0.9370629370629371,
"eval_QUANTITY_f1": 0.7169811320754716,
"eval_QUANTITY_number": 23,
"eval_QUANTITY_precision": 0.6333333333333333,
"eval_QUANTITY_recall": 0.8260869565217391,
"eval_TIME_f1": 0.8461538461538461,
"eval_TIME_number": 26,
"eval_TIME_precision": 0.8461538461538461,
"eval_TIME_recall": 0.8461538461538461,
"eval_loss": 0.1716317981481552,
"eval_overall_accuracy": 0.9617212909682261,
"eval_overall_f1": 0.8374100719424461,
"eval_overall_precision": 0.8174157303370787,
"eval_overall_recall": 0.8584070796460177,
"eval_runtime": 0.3772,
"eval_samples_per_second": 495.814,
"eval_steps_per_second": 7.954,
"step": 6466
},
{
"epoch": 62.0,
"grad_norm": 0.6055287718772888,
"learning_rate": 1.9e-05,
"loss": 0.0393,
"step": 6572
},
{
"epoch": 62.0,
"eval_LOCATION_f1": 0.8299319727891157,
"eval_LOCATION_number": 72,
"eval_LOCATION_precision": 0.8133333333333334,
"eval_LOCATION_recall": 0.8472222222222222,
"eval_ORGANIZATION_f1": 0.7662337662337663,
"eval_ORGANIZATION_number": 75,
"eval_ORGANIZATION_precision": 0.7468354430379747,
"eval_ORGANIZATION_recall": 0.7866666666666666,
"eval_PERSON_f1": 0.9163879598662208,
"eval_PERSON_number": 143,
"eval_PERSON_precision": 0.8782051282051282,
"eval_PERSON_recall": 0.958041958041958,
"eval_QUANTITY_f1": 0.7058823529411765,
"eval_QUANTITY_number": 23,
"eval_QUANTITY_precision": 0.6428571428571429,
"eval_QUANTITY_recall": 0.782608695652174,
"eval_TIME_f1": 0.8461538461538461,
"eval_TIME_number": 26,
"eval_TIME_precision": 0.8461538461538461,
"eval_TIME_recall": 0.8461538461538461,
"eval_loss": 0.16724902391433716,
"eval_overall_accuracy": 0.9632224168126094,
"eval_overall_f1": 0.844950213371266,
"eval_overall_precision": 0.8159340659340659,
"eval_overall_recall": 0.8761061946902655,
"eval_runtime": 0.3757,
"eval_samples_per_second": 497.776,
"eval_steps_per_second": 7.986,
"step": 6572
},
{
"epoch": 63.0,
"grad_norm": 0.6947082877159119,
"learning_rate": 1.85e-05,
"loss": 0.037,
"step": 6678
},
{
"epoch": 63.0,
"eval_LOCATION_f1": 0.8356164383561645,
"eval_LOCATION_number": 72,
"eval_LOCATION_precision": 0.8243243243243243,
"eval_LOCATION_recall": 0.8472222222222222,
"eval_ORGANIZATION_f1": 0.7435897435897435,
"eval_ORGANIZATION_number": 75,
"eval_ORGANIZATION_precision": 0.7160493827160493,
"eval_ORGANIZATION_recall": 0.7733333333333333,
"eval_PERSON_f1": 0.9163879598662208,
"eval_PERSON_number": 143,
"eval_PERSON_precision": 0.8782051282051282,
"eval_PERSON_recall": 0.958041958041958,
"eval_QUANTITY_f1": 0.6923076923076923,
"eval_QUANTITY_number": 23,
"eval_QUANTITY_precision": 0.6206896551724138,
"eval_QUANTITY_recall": 0.782608695652174,
"eval_TIME_f1": 0.8679245283018868,
"eval_TIME_number": 26,
"eval_TIME_precision": 0.8518518518518519,
"eval_TIME_recall": 0.8846153846153846,
"eval_loss": 0.16370835900306702,
"eval_overall_accuracy": 0.9627220415311484,
"eval_overall_f1": 0.8413597733711049,
"eval_overall_precision": 0.8092643051771117,
"eval_overall_recall": 0.8761061946902655,
"eval_runtime": 0.376,
"eval_samples_per_second": 497.373,
"eval_steps_per_second": 7.979,
"step": 6678
},
{
"epoch": 64.0,
"grad_norm": 0.9311719536781311,
"learning_rate": 1.8e-05,
"loss": 0.0357,
"step": 6784
},
{
"epoch": 64.0,
"eval_LOCATION_f1": 0.8456375838926175,
"eval_LOCATION_number": 72,
"eval_LOCATION_precision": 0.8181818181818182,
"eval_LOCATION_recall": 0.875,
"eval_ORGANIZATION_f1": 0.7530864197530864,
"eval_ORGANIZATION_number": 75,
"eval_ORGANIZATION_precision": 0.7011494252873564,
"eval_ORGANIZATION_recall": 0.8133333333333334,
"eval_PERSON_f1": 0.9139072847682119,
"eval_PERSON_number": 143,
"eval_PERSON_precision": 0.8679245283018868,
"eval_PERSON_recall": 0.965034965034965,
"eval_QUANTITY_f1": 0.6923076923076923,
"eval_QUANTITY_number": 23,
"eval_QUANTITY_precision": 0.6206896551724138,
"eval_QUANTITY_recall": 0.782608695652174,
"eval_TIME_f1": 0.8148148148148148,
"eval_TIME_number": 26,
"eval_TIME_precision": 0.7857142857142857,
"eval_TIME_recall": 0.8461538461538461,
"eval_loss": 0.1763332337141037,
"eval_overall_accuracy": 0.9617212909682261,
"eval_overall_f1": 0.8400556328233658,
"eval_overall_precision": 0.7947368421052632,
"eval_overall_recall": 0.8908554572271387,
"eval_runtime": 0.375,
"eval_samples_per_second": 498.678,
"eval_steps_per_second": 8.0,
"step": 6784
},
{
"epoch": 65.0,
"grad_norm": 0.061806291341781616,
"learning_rate": 1.75e-05,
"loss": 0.0374,
"step": 6890
},
{
"epoch": 65.0,
"eval_LOCATION_f1": 0.8378378378378377,
"eval_LOCATION_number": 72,
"eval_LOCATION_precision": 0.8157894736842105,
"eval_LOCATION_recall": 0.8611111111111112,
"eval_ORGANIZATION_f1": 0.7848101265822784,
"eval_ORGANIZATION_number": 75,
"eval_ORGANIZATION_precision": 0.7469879518072289,
"eval_ORGANIZATION_recall": 0.8266666666666667,
"eval_PERSON_f1": 0.9261744966442954,
"eval_PERSON_number": 143,
"eval_PERSON_precision": 0.8903225806451613,
"eval_PERSON_recall": 0.965034965034965,
"eval_QUANTITY_f1": 0.6792452830188679,
"eval_QUANTITY_number": 23,
"eval_QUANTITY_precision": 0.6,
"eval_QUANTITY_recall": 0.782608695652174,
"eval_TIME_f1": 0.8518518518518519,
"eval_TIME_number": 26,
"eval_TIME_precision": 0.8214285714285714,
"eval_TIME_recall": 0.8846153846153846,
"eval_loss": 0.17243608832359314,
"eval_overall_accuracy": 0.9622216662496873,
"eval_overall_f1": 0.8523206751054851,
"eval_overall_precision": 0.8145161290322581,
"eval_overall_recall": 0.8938053097345132,
"eval_runtime": 0.375,
"eval_samples_per_second": 498.652,
"eval_steps_per_second": 8.0,
"step": 6890
},
{
"epoch": 66.0,
"grad_norm": 1.068263053894043,
"learning_rate": 1.7000000000000003e-05,
"loss": 0.0368,
"step": 6996
},
{
"epoch": 66.0,
"eval_LOCATION_f1": 0.8513513513513513,
"eval_LOCATION_number": 72,
"eval_LOCATION_precision": 0.8289473684210527,
"eval_LOCATION_recall": 0.875,
"eval_ORGANIZATION_f1": 0.7749999999999999,
"eval_ORGANIZATION_number": 75,
"eval_ORGANIZATION_precision": 0.7294117647058823,
"eval_ORGANIZATION_recall": 0.8266666666666667,
"eval_PERSON_f1": 0.9133333333333333,
"eval_PERSON_number": 143,
"eval_PERSON_precision": 0.8726114649681529,
"eval_PERSON_recall": 0.958041958041958,
"eval_QUANTITY_f1": 0.7307692307692308,
"eval_QUANTITY_number": 23,
"eval_QUANTITY_precision": 0.6551724137931034,
"eval_QUANTITY_recall": 0.8260869565217391,
"eval_TIME_f1": 0.8363636363636363,
"eval_TIME_number": 26,
"eval_TIME_precision": 0.7931034482758621,
"eval_TIME_recall": 0.8846153846153846,
"eval_loss": 0.17702345550060272,
"eval_overall_accuracy": 0.9617212909682261,
"eval_overall_f1": 0.8503496503496504,
"eval_overall_precision": 0.8085106382978723,
"eval_overall_recall": 0.8967551622418879,
"eval_runtime": 0.3762,
"eval_samples_per_second": 497.023,
"eval_steps_per_second": 7.974,
"step": 6996
},
{
"epoch": 67.0,
"grad_norm": 0.35486891865730286,
"learning_rate": 1.65e-05,
"loss": 0.0374,
"step": 7102
},
{
"epoch": 67.0,
"eval_LOCATION_f1": 0.8219178082191781,
"eval_LOCATION_number": 72,
"eval_LOCATION_precision": 0.8108108108108109,
"eval_LOCATION_recall": 0.8333333333333334,
"eval_ORGANIZATION_f1": 0.7607361963190183,
"eval_ORGANIZATION_number": 75,
"eval_ORGANIZATION_precision": 0.7045454545454546,
"eval_ORGANIZATION_recall": 0.8266666666666667,
"eval_PERSON_f1": 0.9133333333333333,
"eval_PERSON_number": 143,
"eval_PERSON_precision": 0.8726114649681529,
"eval_PERSON_recall": 0.958041958041958,
"eval_QUANTITY_f1": 0.7058823529411765,
"eval_QUANTITY_number": 23,
"eval_QUANTITY_precision": 0.6428571428571429,
"eval_QUANTITY_recall": 0.782608695652174,
"eval_TIME_f1": 0.8461538461538461,
"eval_TIME_number": 26,
"eval_TIME_precision": 0.8461538461538461,
"eval_TIME_recall": 0.8461538461538461,
"eval_loss": 0.17916804552078247,
"eval_overall_accuracy": 0.9619714786089567,
"eval_overall_f1": 0.8398876404494382,
"eval_overall_precision": 0.8016085790884718,
"eval_overall_recall": 0.8820058997050148,
"eval_runtime": 0.3755,
"eval_samples_per_second": 497.996,
"eval_steps_per_second": 7.989,
"step": 7102
},
{
"epoch": 68.0,
"grad_norm": 0.5311190485954285,
"learning_rate": 1.6000000000000003e-05,
"loss": 0.034,
"step": 7208
},
{
"epoch": 68.0,
"eval_LOCATION_f1": 0.8243243243243243,
"eval_LOCATION_number": 72,
"eval_LOCATION_precision": 0.8026315789473685,
"eval_LOCATION_recall": 0.8472222222222222,
"eval_ORGANIZATION_f1": 0.7421383647798742,
"eval_ORGANIZATION_number": 75,
"eval_ORGANIZATION_precision": 0.7023809523809523,
"eval_ORGANIZATION_recall": 0.7866666666666666,
"eval_PERSON_f1": 0.9139072847682119,
"eval_PERSON_number": 143,
"eval_PERSON_precision": 0.8679245283018868,
"eval_PERSON_recall": 0.965034965034965,
"eval_QUANTITY_f1": 0.6792452830188679,
"eval_QUANTITY_number": 23,
"eval_QUANTITY_precision": 0.6,
"eval_QUANTITY_recall": 0.782608695652174,
"eval_TIME_f1": 0.8148148148148148,
"eval_TIME_number": 26,
"eval_TIME_precision": 0.7857142857142857,
"eval_TIME_recall": 0.8461538461538461,
"eval_loss": 0.18868251144886017,
"eval_overall_accuracy": 0.9594696022016512,
"eval_overall_f1": 0.8324022346368715,
"eval_overall_precision": 0.7904509283819628,
"eval_overall_recall": 0.8790560471976401,
"eval_runtime": 0.3757,
"eval_samples_per_second": 497.677,
"eval_steps_per_second": 7.984,
"step": 7208
},
{
"epoch": 69.0,
"grad_norm": 1.173794150352478,
"learning_rate": 1.55e-05,
"loss": 0.0339,
"step": 7314
},
{
"epoch": 69.0,
"eval_LOCATION_f1": 0.8219178082191781,
"eval_LOCATION_number": 72,
"eval_LOCATION_precision": 0.8108108108108109,
"eval_LOCATION_recall": 0.8333333333333334,
"eval_ORGANIZATION_f1": 0.7672955974842767,
"eval_ORGANIZATION_number": 75,
"eval_ORGANIZATION_precision": 0.7261904761904762,
"eval_ORGANIZATION_recall": 0.8133333333333334,
"eval_PERSON_f1": 0.9133333333333333,
"eval_PERSON_number": 143,
"eval_PERSON_precision": 0.8726114649681529,
"eval_PERSON_recall": 0.958041958041958,
"eval_QUANTITY_f1": 0.7058823529411765,
"eval_QUANTITY_number": 23,
"eval_QUANTITY_precision": 0.6428571428571429,
"eval_QUANTITY_recall": 0.782608695652174,
"eval_TIME_f1": 0.8461538461538461,
"eval_TIME_number": 26,
"eval_TIME_precision": 0.8461538461538461,
"eval_TIME_recall": 0.8461538461538461,
"eval_loss": 0.17915134131908417,
"eval_overall_accuracy": 0.9614711033274956,
"eval_overall_f1": 0.8418079096045198,
"eval_overall_precision": 0.8075880758807588,
"eval_overall_recall": 0.8790560471976401,
"eval_runtime": 0.3795,
"eval_samples_per_second": 492.724,
"eval_steps_per_second": 7.905,
"step": 7314
},
{
"epoch": 70.0,
"grad_norm": 1.2395267486572266,
"learning_rate": 1.5e-05,
"loss": 0.0346,
"step": 7420
},
{
"epoch": 70.0,
"eval_LOCATION_f1": 0.816326530612245,
"eval_LOCATION_number": 72,
"eval_LOCATION_precision": 0.8,
"eval_LOCATION_recall": 0.8333333333333334,
"eval_ORGANIZATION_f1": 0.7721518987341773,
"eval_ORGANIZATION_number": 75,
"eval_ORGANIZATION_precision": 0.7349397590361446,
"eval_ORGANIZATION_recall": 0.8133333333333334,
"eval_PERSON_f1": 0.9163879598662208,
"eval_PERSON_number": 143,
"eval_PERSON_precision": 0.8782051282051282,
"eval_PERSON_recall": 0.958041958041958,
"eval_QUANTITY_f1": 0.6538461538461539,
"eval_QUANTITY_number": 23,
"eval_QUANTITY_precision": 0.5862068965517241,
"eval_QUANTITY_recall": 0.7391304347826086,
"eval_TIME_f1": 0.7924528301886792,
"eval_TIME_number": 26,
"eval_TIME_precision": 0.7777777777777778,
"eval_TIME_recall": 0.8076923076923077,
"eval_loss": 0.17411379516124725,
"eval_overall_accuracy": 0.961220915686765,
"eval_overall_f1": 0.8349788434414668,
"eval_overall_precision": 0.8,
"eval_overall_recall": 0.8731563421828908,
"eval_runtime": 0.3754,
"eval_samples_per_second": 498.124,
"eval_steps_per_second": 7.991,
"step": 7420
},
{
"epoch": 71.0,
"grad_norm": 0.5333613157272339,
"learning_rate": 1.45e-05,
"loss": 0.0345,
"step": 7526
},
{
"epoch": 71.0,
"eval_LOCATION_f1": 0.8266666666666667,
"eval_LOCATION_number": 72,
"eval_LOCATION_precision": 0.7948717948717948,
"eval_LOCATION_recall": 0.8611111111111112,
"eval_ORGANIZATION_f1": 0.7749999999999999,
"eval_ORGANIZATION_number": 75,
"eval_ORGANIZATION_precision": 0.7294117647058823,
"eval_ORGANIZATION_recall": 0.8266666666666667,
"eval_PERSON_f1": 0.9163879598662208,
"eval_PERSON_number": 143,
"eval_PERSON_precision": 0.8782051282051282,
"eval_PERSON_recall": 0.958041958041958,
"eval_QUANTITY_f1": 0.7307692307692308,
"eval_QUANTITY_number": 23,
"eval_QUANTITY_precision": 0.6551724137931034,
"eval_QUANTITY_recall": 0.8260869565217391,
"eval_TIME_f1": 0.8363636363636363,
"eval_TIME_number": 26,
"eval_TIME_precision": 0.7931034482758621,
"eval_TIME_recall": 0.8846153846153846,
"eval_loss": 0.17888005077838898,
"eval_overall_accuracy": 0.9627220415311484,
"eval_overall_f1": 0.8463687150837987,
"eval_overall_precision": 0.8037135278514589,
"eval_overall_recall": 0.8938053097345132,
"eval_runtime": 0.3785,
"eval_samples_per_second": 494.008,
"eval_steps_per_second": 7.925,
"step": 7526
},
{
"epoch": 72.0,
"grad_norm": 0.4179161787033081,
"learning_rate": 1.4000000000000001e-05,
"loss": 0.0339,
"step": 7632
},
{
"epoch": 72.0,
"eval_LOCATION_f1": 0.8243243243243243,
"eval_LOCATION_number": 72,
"eval_LOCATION_precision": 0.8026315789473685,
"eval_LOCATION_recall": 0.8472222222222222,
"eval_ORGANIZATION_f1": 0.7721518987341773,
"eval_ORGANIZATION_number": 75,
"eval_ORGANIZATION_precision": 0.7349397590361446,
"eval_ORGANIZATION_recall": 0.8133333333333334,
"eval_PERSON_f1": 0.9096989966555185,
"eval_PERSON_number": 143,
"eval_PERSON_precision": 0.8717948717948718,
"eval_PERSON_recall": 0.951048951048951,
"eval_QUANTITY_f1": 0.6666666666666667,
"eval_QUANTITY_number": 23,
"eval_QUANTITY_precision": 0.5806451612903226,
"eval_QUANTITY_recall": 0.782608695652174,
"eval_TIME_f1": 0.8518518518518519,
"eval_TIME_number": 26,
"eval_TIME_precision": 0.8214285714285714,
"eval_TIME_recall": 0.8846153846153846,
"eval_loss": 0.17914946377277374,
"eval_overall_accuracy": 0.9609707280460346,
"eval_overall_f1": 0.8387096774193548,
"eval_overall_precision": 0.7994652406417112,
"eval_overall_recall": 0.8820058997050148,
"eval_runtime": 0.38,
"eval_samples_per_second": 492.065,
"eval_steps_per_second": 7.894,
"step": 7632
},
{
"epoch": 73.0,
"grad_norm": 1.2512534856796265,
"learning_rate": 1.3500000000000001e-05,
"loss": 0.0363,
"step": 7738
},
{
"epoch": 73.0,
"eval_LOCATION_f1": 0.8456375838926175,
"eval_LOCATION_number": 72,
"eval_LOCATION_precision": 0.8181818181818182,
"eval_LOCATION_recall": 0.875,
"eval_ORGANIZATION_f1": 0.7777777777777777,
"eval_ORGANIZATION_number": 75,
"eval_ORGANIZATION_precision": 0.7241379310344828,
"eval_ORGANIZATION_recall": 0.84,
"eval_PERSON_f1": 0.9163879598662208,
"eval_PERSON_number": 143,
"eval_PERSON_precision": 0.8782051282051282,
"eval_PERSON_recall": 0.958041958041958,
"eval_QUANTITY_f1": 0.6666666666666666,
"eval_QUANTITY_number": 23,
"eval_QUANTITY_precision": 0.6071428571428571,
"eval_QUANTITY_recall": 0.7391304347826086,
"eval_TIME_f1": 0.8461538461538461,
"eval_TIME_number": 26,
"eval_TIME_precision": 0.8461538461538461,
"eval_TIME_recall": 0.8461538461538461,
"eval_loss": 0.17584359645843506,
"eval_overall_accuracy": 0.9619714786089567,
"eval_overall_f1": 0.847124824684432,
"eval_overall_precision": 0.8074866310160428,
"eval_overall_recall": 0.8908554572271387,
"eval_runtime": 0.3782,
"eval_samples_per_second": 494.451,
"eval_steps_per_second": 7.932,
"step": 7738
},
{
"epoch": 74.0,
"grad_norm": 0.7962180972099304,
"learning_rate": 1.3000000000000001e-05,
"loss": 0.0309,
"step": 7844
},
{
"epoch": 74.0,
"eval_LOCATION_f1": 0.8533333333333333,
"eval_LOCATION_number": 72,
"eval_LOCATION_precision": 0.8205128205128205,
"eval_LOCATION_recall": 0.8888888888888888,
"eval_ORGANIZATION_f1": 0.7577639751552795,
"eval_ORGANIZATION_number": 75,
"eval_ORGANIZATION_precision": 0.7093023255813954,
"eval_ORGANIZATION_recall": 0.8133333333333334,
"eval_PERSON_f1": 0.9139072847682119,
"eval_PERSON_number": 143,
"eval_PERSON_precision": 0.8679245283018868,
"eval_PERSON_recall": 0.965034965034965,
"eval_QUANTITY_f1": 0.7307692307692308,
"eval_QUANTITY_number": 23,
"eval_QUANTITY_precision": 0.6551724137931034,
"eval_QUANTITY_recall": 0.8260869565217391,
"eval_TIME_f1": 0.8363636363636363,
"eval_TIME_number": 26,
"eval_TIME_precision": 0.7931034482758621,
"eval_TIME_recall": 0.8846153846153846,
"eval_loss": 0.1865181177854538,
"eval_overall_accuracy": 0.9599699774831123,
"eval_overall_f1": 0.8472222222222222,
"eval_overall_precision": 0.800524934383202,
"eval_overall_recall": 0.8997050147492626,
"eval_runtime": 0.3776,
"eval_samples_per_second": 495.244,
"eval_steps_per_second": 7.945,
"step": 7844
},
{
"epoch": 75.0,
"grad_norm": 0.6063715219497681,
"learning_rate": 1.25e-05,
"loss": 0.0337,
"step": 7950
},
{
"epoch": 75.0,
"eval_LOCATION_f1": 0.8456375838926175,
"eval_LOCATION_number": 72,
"eval_LOCATION_precision": 0.8181818181818182,
"eval_LOCATION_recall": 0.875,
"eval_ORGANIZATION_f1": 0.7625,
"eval_ORGANIZATION_number": 75,
"eval_ORGANIZATION_precision": 0.7176470588235294,
"eval_ORGANIZATION_recall": 0.8133333333333334,
"eval_PERSON_f1": 0.9169435215946844,
"eval_PERSON_number": 143,
"eval_PERSON_precision": 0.8734177215189873,
"eval_PERSON_recall": 0.965034965034965,
"eval_QUANTITY_f1": 0.7450980392156864,
"eval_QUANTITY_number": 23,
"eval_QUANTITY_precision": 0.6785714285714286,
"eval_QUANTITY_recall": 0.8260869565217391,
"eval_TIME_f1": 0.7857142857142856,
"eval_TIME_number": 26,
"eval_TIME_precision": 0.7333333333333333,
"eval_TIME_recall": 0.8461538461538461,
"eval_loss": 0.1806030422449112,
"eval_overall_accuracy": 0.9609707280460346,
"eval_overall_f1": 0.8451882845188284,
"eval_overall_precision": 0.8015873015873016,
"eval_overall_recall": 0.8938053097345132,
"eval_runtime": 0.3799,
"eval_samples_per_second": 492.235,
"eval_steps_per_second": 7.897,
"step": 7950
},
{
"epoch": 76.0,
"grad_norm": 0.17701131105422974,
"learning_rate": 1.2e-05,
"loss": 0.0329,
"step": 8056
},
{
"epoch": 76.0,
"eval_LOCATION_f1": 0.8322147651006712,
"eval_LOCATION_number": 72,
"eval_LOCATION_precision": 0.8051948051948052,
"eval_LOCATION_recall": 0.8611111111111112,
"eval_ORGANIZATION_f1": 0.7544910179640718,
"eval_ORGANIZATION_number": 75,
"eval_ORGANIZATION_precision": 0.6847826086956522,
"eval_ORGANIZATION_recall": 0.84,
"eval_PERSON_f1": 0.9096989966555185,
"eval_PERSON_number": 143,
"eval_PERSON_precision": 0.8717948717948718,
"eval_PERSON_recall": 0.951048951048951,
"eval_QUANTITY_f1": 0.7450980392156864,
"eval_QUANTITY_number": 23,
"eval_QUANTITY_precision": 0.6785714285714286,
"eval_QUANTITY_recall": 0.8260869565217391,
"eval_TIME_f1": 0.888888888888889,
"eval_TIME_number": 26,
"eval_TIME_precision": 0.8571428571428571,
"eval_TIME_recall": 0.9230769230769231,
"eval_loss": 0.1809851974248886,
"eval_overall_accuracy": 0.961220915686765,
"eval_overall_f1": 0.8444444444444444,
"eval_overall_precision": 0.7979002624671916,
"eval_overall_recall": 0.8967551622418879,
"eval_runtime": 0.3779,
"eval_samples_per_second": 494.873,
"eval_steps_per_second": 7.939,
"step": 8056
},
{
"epoch": 77.0,
"grad_norm": 2.978839874267578,
"learning_rate": 1.1500000000000002e-05,
"loss": 0.0325,
"step": 8162
},
{
"epoch": 77.0,
"eval_LOCATION_f1": 0.8243243243243243,
"eval_LOCATION_number": 72,
"eval_LOCATION_precision": 0.8026315789473685,
"eval_LOCATION_recall": 0.8472222222222222,
"eval_ORGANIZATION_f1": 0.7407407407407408,
"eval_ORGANIZATION_number": 75,
"eval_ORGANIZATION_precision": 0.6896551724137931,
"eval_ORGANIZATION_recall": 0.8,
"eval_PERSON_f1": 0.9169435215946844,
"eval_PERSON_number": 143,
"eval_PERSON_precision": 0.8734177215189873,
"eval_PERSON_recall": 0.965034965034965,
"eval_QUANTITY_f1": 0.7058823529411765,
"eval_QUANTITY_number": 23,
"eval_QUANTITY_precision": 0.6428571428571429,
"eval_QUANTITY_recall": 0.782608695652174,
"eval_TIME_f1": 0.8679245283018868,
"eval_TIME_number": 26,
"eval_TIME_precision": 0.8518518518518519,
"eval_TIME_recall": 0.8846153846153846,
"eval_loss": 0.17838534712791443,
"eval_overall_accuracy": 0.960720540405304,
"eval_overall_f1": 0.8391608391608392,
"eval_overall_precision": 0.7978723404255319,
"eval_overall_recall": 0.8849557522123894,
"eval_runtime": 0.3777,
"eval_samples_per_second": 495.055,
"eval_steps_per_second": 7.942,
"step": 8162
},
{
"epoch": 78.0,
"grad_norm": 0.9092636704444885,
"learning_rate": 1.1000000000000001e-05,
"loss": 0.0313,
"step": 8268
},
{
"epoch": 78.0,
"eval_LOCATION_f1": 0.8513513513513513,
"eval_LOCATION_number": 72,
"eval_LOCATION_precision": 0.8289473684210527,
"eval_LOCATION_recall": 0.875,
"eval_ORGANIZATION_f1": 0.7721518987341773,
"eval_ORGANIZATION_number": 75,
"eval_ORGANIZATION_precision": 0.7349397590361446,
"eval_ORGANIZATION_recall": 0.8133333333333334,
"eval_PERSON_f1": 0.9066666666666667,
"eval_PERSON_number": 143,
"eval_PERSON_precision": 0.8662420382165605,
"eval_PERSON_recall": 0.951048951048951,
"eval_QUANTITY_f1": 0.7058823529411765,
"eval_QUANTITY_number": 23,
"eval_QUANTITY_precision": 0.6428571428571429,
"eval_QUANTITY_recall": 0.782608695652174,
"eval_TIME_f1": 0.8679245283018868,
"eval_TIME_number": 26,
"eval_TIME_precision": 0.8518518518518519,
"eval_TIME_recall": 0.8846153846153846,
"eval_loss": 0.17731936275959015,
"eval_overall_accuracy": 0.9619714786089567,
"eval_overall_f1": 0.8478873239436621,
"eval_overall_precision": 0.8113207547169812,
"eval_overall_recall": 0.887905604719764,
"eval_runtime": 0.38,
"eval_samples_per_second": 492.167,
"eval_steps_per_second": 7.896,
"step": 8268
},
{
"epoch": 79.0,
"grad_norm": 1.61823570728302,
"learning_rate": 1.05e-05,
"loss": 0.0313,
"step": 8374
},
{
"epoch": 79.0,
"eval_LOCATION_f1": 0.8243243243243243,
"eval_LOCATION_number": 72,
"eval_LOCATION_precision": 0.8026315789473685,
"eval_LOCATION_recall": 0.8472222222222222,
"eval_ORGANIZATION_f1": 0.779874213836478,
"eval_ORGANIZATION_number": 75,
"eval_ORGANIZATION_precision": 0.7380952380952381,
"eval_ORGANIZATION_recall": 0.8266666666666667,
"eval_PERSON_f1": 0.9169435215946844,
"eval_PERSON_number": 143,
"eval_PERSON_precision": 0.8734177215189873,
"eval_PERSON_recall": 0.965034965034965,
"eval_QUANTITY_f1": 0.6923076923076923,
"eval_QUANTITY_number": 23,
"eval_QUANTITY_precision": 0.6206896551724138,
"eval_QUANTITY_recall": 0.782608695652174,
"eval_TIME_f1": 0.8363636363636363,
"eval_TIME_number": 26,
"eval_TIME_precision": 0.7931034482758621,
"eval_TIME_recall": 0.8846153846153846,
"eval_loss": 0.17817345261573792,
"eval_overall_accuracy": 0.9617212909682261,
"eval_overall_f1": 0.8447552447552448,
"eval_overall_precision": 0.8031914893617021,
"eval_overall_recall": 0.8908554572271387,
"eval_runtime": 0.3792,
"eval_samples_per_second": 493.2,
"eval_steps_per_second": 7.912,
"step": 8374
},
{
"epoch": 80.0,
"grad_norm": 0.3510795831680298,
"learning_rate": 1e-05,
"loss": 0.0302,
"step": 8480
},
{
"epoch": 80.0,
"eval_LOCATION_f1": 0.8322147651006712,
"eval_LOCATION_number": 72,
"eval_LOCATION_precision": 0.8051948051948052,
"eval_LOCATION_recall": 0.8611111111111112,
"eval_ORGANIZATION_f1": 0.7407407407407408,
"eval_ORGANIZATION_number": 75,
"eval_ORGANIZATION_precision": 0.6896551724137931,
"eval_ORGANIZATION_recall": 0.8,
"eval_PERSON_f1": 0.9169435215946844,
"eval_PERSON_number": 143,
"eval_PERSON_precision": 0.8734177215189873,
"eval_PERSON_recall": 0.965034965034965,
"eval_QUANTITY_f1": 0.7307692307692308,
"eval_QUANTITY_number": 23,
"eval_QUANTITY_precision": 0.6551724137931034,
"eval_QUANTITY_recall": 0.8260869565217391,
"eval_TIME_f1": 0.8148148148148148,
"eval_TIME_number": 26,
"eval_TIME_precision": 0.7857142857142857,
"eval_TIME_recall": 0.8461538461538461,
"eval_loss": 0.1888643205165863,
"eval_overall_accuracy": 0.9599699774831123,
"eval_overall_f1": 0.8384401114206128,
"eval_overall_precision": 0.7941952506596306,
"eval_overall_recall": 0.887905604719764,
"eval_runtime": 0.3798,
"eval_samples_per_second": 492.423,
"eval_steps_per_second": 7.9,
"step": 8480
},
{
"epoch": 81.0,
"grad_norm": 0.5158957242965698,
"learning_rate": 9.5e-06,
"loss": 0.0307,
"step": 8586
},
{
"epoch": 81.0,
"eval_LOCATION_f1": 0.8266666666666667,
"eval_LOCATION_number": 72,
"eval_LOCATION_precision": 0.7948717948717948,
"eval_LOCATION_recall": 0.8611111111111112,
"eval_ORGANIZATION_f1": 0.7672955974842767,
"eval_ORGANIZATION_number": 75,
"eval_ORGANIZATION_precision": 0.7261904761904762,
"eval_ORGANIZATION_recall": 0.8133333333333334,
"eval_PERSON_f1": 0.910299003322259,
"eval_PERSON_number": 143,
"eval_PERSON_precision": 0.8670886075949367,
"eval_PERSON_recall": 0.958041958041958,
"eval_QUANTITY_f1": 0.7169811320754716,
"eval_QUANTITY_number": 23,
"eval_QUANTITY_precision": 0.6333333333333333,
"eval_QUANTITY_recall": 0.8260869565217391,
"eval_TIME_f1": 0.8679245283018868,
"eval_TIME_number": 26,
"eval_TIME_precision": 0.8518518518518519,
"eval_TIME_recall": 0.8846153846153846,
"eval_loss": 0.1804436296224594,
"eval_overall_accuracy": 0.9617212909682261,
"eval_overall_f1": 0.8435754189944135,
"eval_overall_precision": 0.8010610079575596,
"eval_overall_recall": 0.8908554572271387,
"eval_runtime": 0.3773,
"eval_samples_per_second": 495.674,
"eval_steps_per_second": 7.952,
"step": 8586
},
{
"epoch": 82.0,
"grad_norm": 0.9088582396507263,
"learning_rate": 9e-06,
"loss": 0.0289,
"step": 8692
},
{
"epoch": 82.0,
"eval_LOCATION_f1": 0.8243243243243243,
"eval_LOCATION_number": 72,
"eval_LOCATION_precision": 0.8026315789473685,
"eval_LOCATION_recall": 0.8472222222222222,
"eval_ORGANIZATION_f1": 0.7672955974842767,
"eval_ORGANIZATION_number": 75,
"eval_ORGANIZATION_precision": 0.7261904761904762,
"eval_ORGANIZATION_recall": 0.8133333333333334,
"eval_PERSON_f1": 0.9066666666666667,
"eval_PERSON_number": 143,
"eval_PERSON_precision": 0.8662420382165605,
"eval_PERSON_recall": 0.951048951048951,
"eval_QUANTITY_f1": 0.7307692307692308,
"eval_QUANTITY_number": 23,
"eval_QUANTITY_precision": 0.6551724137931034,
"eval_QUANTITY_recall": 0.8260869565217391,
"eval_TIME_f1": 0.8,
"eval_TIME_number": 26,
"eval_TIME_precision": 0.7586206896551724,
"eval_TIME_recall": 0.8461538461538461,
"eval_loss": 0.18571802973747253,
"eval_overall_accuracy": 0.9609707280460346,
"eval_overall_f1": 0.8375350140056023,
"eval_overall_precision": 0.7973333333333333,
"eval_overall_recall": 0.8820058997050148,
"eval_runtime": 0.3888,
"eval_samples_per_second": 480.946,
"eval_steps_per_second": 7.716,
"step": 8692
},
{
"epoch": 83.0,
"grad_norm": 0.08597920835018158,
"learning_rate": 8.500000000000002e-06,
"loss": 0.0312,
"step": 8798
},
{
"epoch": 83.0,
"eval_LOCATION_f1": 0.8266666666666667,
"eval_LOCATION_number": 72,
"eval_LOCATION_precision": 0.7948717948717948,
"eval_LOCATION_recall": 0.8611111111111112,
"eval_ORGANIZATION_f1": 0.7749999999999999,
"eval_ORGANIZATION_number": 75,
"eval_ORGANIZATION_precision": 0.7294117647058823,
"eval_ORGANIZATION_recall": 0.8266666666666667,
"eval_PERSON_f1": 0.92,
"eval_PERSON_number": 143,
"eval_PERSON_precision": 0.8789808917197452,
"eval_PERSON_recall": 0.965034965034965,
"eval_QUANTITY_f1": 0.7037037037037037,
"eval_QUANTITY_number": 23,
"eval_QUANTITY_precision": 0.6129032258064516,
"eval_QUANTITY_recall": 0.8260869565217391,
"eval_TIME_f1": 0.830188679245283,
"eval_TIME_number": 26,
"eval_TIME_precision": 0.8148148148148148,
"eval_TIME_recall": 0.8461538461538461,
"eval_loss": 0.19167569279670715,
"eval_overall_accuracy": 0.961220915686765,
"eval_overall_f1": 0.8451882845188284,
"eval_overall_precision": 0.8015873015873016,
"eval_overall_recall": 0.8938053097345132,
"eval_runtime": 0.3776,
"eval_samples_per_second": 495.221,
"eval_steps_per_second": 7.945,
"step": 8798
},
{
"epoch": 84.0,
"grad_norm": 0.6576730608940125,
"learning_rate": 8.000000000000001e-06,
"loss": 0.0286,
"step": 8904
},
{
"epoch": 84.0,
"eval_LOCATION_f1": 0.8378378378378377,
"eval_LOCATION_number": 72,
"eval_LOCATION_precision": 0.8157894736842105,
"eval_LOCATION_recall": 0.8611111111111112,
"eval_ORGANIZATION_f1": 0.7672955974842767,
"eval_ORGANIZATION_number": 75,
"eval_ORGANIZATION_precision": 0.7261904761904762,
"eval_ORGANIZATION_recall": 0.8133333333333334,
"eval_PERSON_f1": 0.903010033444816,
"eval_PERSON_number": 143,
"eval_PERSON_precision": 0.8653846153846154,
"eval_PERSON_recall": 0.9440559440559441,
"eval_QUANTITY_f1": 0.6792452830188679,
"eval_QUANTITY_number": 23,
"eval_QUANTITY_precision": 0.6,
"eval_QUANTITY_recall": 0.782608695652174,
"eval_TIME_f1": 0.8679245283018868,
"eval_TIME_number": 26,
"eval_TIME_precision": 0.8518518518518519,
"eval_TIME_recall": 0.8846153846153846,
"eval_loss": 0.18320870399475098,
"eval_overall_accuracy": 0.960720540405304,
"eval_overall_f1": 0.8398876404494382,
"eval_overall_precision": 0.8016085790884718,
"eval_overall_recall": 0.8820058997050148,
"eval_runtime": 0.3788,
"eval_samples_per_second": 493.702,
"eval_steps_per_second": 7.92,
"step": 8904
},
{
"epoch": 85.0,
"grad_norm": 2.442254066467285,
"learning_rate": 7.5e-06,
"loss": 0.0295,
"step": 9010
},
{
"epoch": 85.0,
"eval_LOCATION_f1": 0.8299319727891157,
"eval_LOCATION_number": 72,
"eval_LOCATION_precision": 0.8133333333333334,
"eval_LOCATION_recall": 0.8472222222222222,
"eval_ORGANIZATION_f1": 0.779874213836478,
"eval_ORGANIZATION_number": 75,
"eval_ORGANIZATION_precision": 0.7380952380952381,
"eval_ORGANIZATION_recall": 0.8266666666666667,
"eval_PERSON_f1": 0.9139072847682119,
"eval_PERSON_number": 143,
"eval_PERSON_precision": 0.8679245283018868,
"eval_PERSON_recall": 0.965034965034965,
"eval_QUANTITY_f1": 0.6792452830188679,
"eval_QUANTITY_number": 23,
"eval_QUANTITY_precision": 0.6,
"eval_QUANTITY_recall": 0.782608695652174,
"eval_TIME_f1": 0.8679245283018868,
"eval_TIME_number": 26,
"eval_TIME_precision": 0.8518518518518519,
"eval_TIME_recall": 0.8846153846153846,
"eval_loss": 0.18816226720809937,
"eval_overall_accuracy": 0.960720540405304,
"eval_overall_f1": 0.84593837535014,
"eval_overall_precision": 0.8053333333333333,
"eval_overall_recall": 0.8908554572271387,
"eval_runtime": 0.3842,
"eval_samples_per_second": 486.686,
"eval_steps_per_second": 7.808,
"step": 9010
},
{
"epoch": 86.0,
"grad_norm": 1.4039467573165894,
"learning_rate": 7.000000000000001e-06,
"loss": 0.0285,
"step": 9116
},
{
"epoch": 86.0,
"eval_LOCATION_f1": 0.8400000000000001,
"eval_LOCATION_number": 72,
"eval_LOCATION_precision": 0.8076923076923077,
"eval_LOCATION_recall": 0.875,
"eval_ORGANIZATION_f1": 0.7770700636942677,
"eval_ORGANIZATION_number": 75,
"eval_ORGANIZATION_precision": 0.7439024390243902,
"eval_ORGANIZATION_recall": 0.8133333333333334,
"eval_PERSON_f1": 0.903654485049834,
"eval_PERSON_number": 143,
"eval_PERSON_precision": 0.8607594936708861,
"eval_PERSON_recall": 0.951048951048951,
"eval_QUANTITY_f1": 0.6415094339622641,
"eval_QUANTITY_number": 23,
"eval_QUANTITY_precision": 0.5666666666666667,
"eval_QUANTITY_recall": 0.7391304347826086,
"eval_TIME_f1": 0.8518518518518519,
"eval_TIME_number": 26,
"eval_TIME_precision": 0.8214285714285714,
"eval_TIME_recall": 0.8846153846153846,
"eval_loss": 0.18358004093170166,
"eval_overall_accuracy": 0.9617212909682261,
"eval_overall_f1": 0.8391608391608392,
"eval_overall_precision": 0.7978723404255319,
"eval_overall_recall": 0.8849557522123894,
"eval_runtime": 0.3818,
"eval_samples_per_second": 489.834,
"eval_steps_per_second": 7.858,
"step": 9116
},
{
"epoch": 87.0,
"grad_norm": 0.6832211017608643,
"learning_rate": 6.5000000000000004e-06,
"loss": 0.0264,
"step": 9222
},
{
"epoch": 87.0,
"eval_LOCATION_f1": 0.8344370860927153,
"eval_LOCATION_number": 72,
"eval_LOCATION_precision": 0.7974683544303798,
"eval_LOCATION_recall": 0.875,
"eval_ORGANIZATION_f1": 0.7721518987341773,
"eval_ORGANIZATION_number": 75,
"eval_ORGANIZATION_precision": 0.7349397590361446,
"eval_ORGANIZATION_recall": 0.8133333333333334,
"eval_PERSON_f1": 0.9,
"eval_PERSON_number": 143,
"eval_PERSON_precision": 0.8598726114649682,
"eval_PERSON_recall": 0.9440559440559441,
"eval_QUANTITY_f1": 0.6923076923076923,
"eval_QUANTITY_number": 23,
"eval_QUANTITY_precision": 0.6206896551724138,
"eval_QUANTITY_recall": 0.782608695652174,
"eval_TIME_f1": 0.8679245283018868,
"eval_TIME_number": 26,
"eval_TIME_precision": 0.8518518518518519,
"eval_TIME_recall": 0.8846153846153846,
"eval_loss": 0.1859363615512848,
"eval_overall_accuracy": 0.9617212909682261,
"eval_overall_f1": 0.8403361344537816,
"eval_overall_precision": 0.8,
"eval_overall_recall": 0.8849557522123894,
"eval_runtime": 0.379,
"eval_samples_per_second": 493.376,
"eval_steps_per_second": 7.915,
"step": 9222
},
{
"epoch": 88.0,
"grad_norm": 0.2647896111011505,
"learning_rate": 6e-06,
"loss": 0.0278,
"step": 9328
},
{
"epoch": 88.0,
"eval_LOCATION_f1": 0.8266666666666667,
"eval_LOCATION_number": 72,
"eval_LOCATION_precision": 0.7948717948717948,
"eval_LOCATION_recall": 0.8611111111111112,
"eval_ORGANIZATION_f1": 0.7721518987341773,
"eval_ORGANIZATION_number": 75,
"eval_ORGANIZATION_precision": 0.7349397590361446,
"eval_ORGANIZATION_recall": 0.8133333333333334,
"eval_PERSON_f1": 0.8970099667774087,
"eval_PERSON_number": 143,
"eval_PERSON_precision": 0.8544303797468354,
"eval_PERSON_recall": 0.9440559440559441,
"eval_QUANTITY_f1": 0.6666666666666666,
"eval_QUANTITY_number": 23,
"eval_QUANTITY_precision": 0.6071428571428571,
"eval_QUANTITY_recall": 0.7391304347826086,
"eval_TIME_f1": 0.8679245283018868,
"eval_TIME_number": 26,
"eval_TIME_precision": 0.8518518518518519,
"eval_TIME_recall": 0.8846153846153846,
"eval_loss": 0.18457496166229248,
"eval_overall_accuracy": 0.9609707280460346,
"eval_overall_f1": 0.8359046283309959,
"eval_overall_precision": 0.7967914438502673,
"eval_overall_recall": 0.8790560471976401,
"eval_runtime": 0.3779,
"eval_samples_per_second": 494.799,
"eval_steps_per_second": 7.938,
"step": 9328
},
{
"epoch": 89.0,
"grad_norm": 0.7398730516433716,
"learning_rate": 5.500000000000001e-06,
"loss": 0.0275,
"step": 9434
},
{
"epoch": 89.0,
"eval_LOCATION_f1": 0.8133333333333332,
"eval_LOCATION_number": 72,
"eval_LOCATION_precision": 0.782051282051282,
"eval_LOCATION_recall": 0.8472222222222222,
"eval_ORGANIZATION_f1": 0.7848101265822784,
"eval_ORGANIZATION_number": 75,
"eval_ORGANIZATION_precision": 0.7469879518072289,
"eval_ORGANIZATION_recall": 0.8266666666666667,
"eval_PERSON_f1": 0.8970099667774087,
"eval_PERSON_number": 143,
"eval_PERSON_precision": 0.8544303797468354,
"eval_PERSON_recall": 0.9440559440559441,
"eval_QUANTITY_f1": 0.7307692307692308,
"eval_QUANTITY_number": 23,
"eval_QUANTITY_precision": 0.6551724137931034,
"eval_QUANTITY_recall": 0.8260869565217391,
"eval_TIME_f1": 0.8679245283018868,
"eval_TIME_number": 26,
"eval_TIME_precision": 0.8518518518518519,
"eval_TIME_recall": 0.8846153846153846,
"eval_loss": 0.18726153671741486,
"eval_overall_accuracy": 0.9614711033274956,
"eval_overall_f1": 0.8403361344537816,
"eval_overall_precision": 0.8,
"eval_overall_recall": 0.8849557522123894,
"eval_runtime": 0.3782,
"eval_samples_per_second": 494.432,
"eval_steps_per_second": 7.932,
"step": 9434
},
{
"epoch": 90.0,
"grad_norm": 0.7052929401397705,
"learning_rate": 5e-06,
"loss": 0.0274,
"step": 9540
},
{
"epoch": 90.0,
"eval_LOCATION_f1": 0.8266666666666667,
"eval_LOCATION_number": 72,
"eval_LOCATION_precision": 0.7948717948717948,
"eval_LOCATION_recall": 0.8611111111111112,
"eval_ORGANIZATION_f1": 0.779874213836478,
"eval_ORGANIZATION_number": 75,
"eval_ORGANIZATION_precision": 0.7380952380952381,
"eval_ORGANIZATION_recall": 0.8266666666666667,
"eval_PERSON_f1": 0.9072847682119206,
"eval_PERSON_number": 143,
"eval_PERSON_precision": 0.8616352201257862,
"eval_PERSON_recall": 0.958041958041958,
"eval_QUANTITY_f1": 0.7169811320754716,
"eval_QUANTITY_number": 23,
"eval_QUANTITY_precision": 0.6333333333333333,
"eval_QUANTITY_recall": 0.8260869565217391,
"eval_TIME_f1": 0.8679245283018868,
"eval_TIME_number": 26,
"eval_TIME_precision": 0.8518518518518519,
"eval_TIME_recall": 0.8846153846153846,
"eval_loss": 0.18936219811439514,
"eval_overall_accuracy": 0.9609707280460346,
"eval_overall_f1": 0.8451882845188284,
"eval_overall_precision": 0.8015873015873016,
"eval_overall_recall": 0.8938053097345132,
"eval_runtime": 0.3816,
"eval_samples_per_second": 489.992,
"eval_steps_per_second": 7.861,
"step": 9540
},
{
"epoch": 91.0,
"grad_norm": 0.5388996005058289,
"learning_rate": 4.5e-06,
"loss": 0.0276,
"step": 9646
},
{
"epoch": 91.0,
"eval_LOCATION_f1": 0.8266666666666667,
"eval_LOCATION_number": 72,
"eval_LOCATION_precision": 0.7948717948717948,
"eval_LOCATION_recall": 0.8611111111111112,
"eval_ORGANIZATION_f1": 0.7721518987341773,
"eval_ORGANIZATION_number": 75,
"eval_ORGANIZATION_precision": 0.7349397590361446,
"eval_ORGANIZATION_recall": 0.8133333333333334,
"eval_PERSON_f1": 0.903654485049834,
"eval_PERSON_number": 143,
"eval_PERSON_precision": 0.8607594936708861,
"eval_PERSON_recall": 0.951048951048951,
"eval_QUANTITY_f1": 0.6538461538461539,
"eval_QUANTITY_number": 23,
"eval_QUANTITY_precision": 0.5862068965517241,
"eval_QUANTITY_recall": 0.7391304347826086,
"eval_TIME_f1": 0.8679245283018868,
"eval_TIME_number": 26,
"eval_TIME_precision": 0.8518518518518519,
"eval_TIME_recall": 0.8846153846153846,
"eval_loss": 0.1843438744544983,
"eval_overall_accuracy": 0.9617212909682261,
"eval_overall_f1": 0.8375350140056023,
"eval_overall_precision": 0.7973333333333333,
"eval_overall_recall": 0.8820058997050148,
"eval_runtime": 0.3778,
"eval_samples_per_second": 494.978,
"eval_steps_per_second": 7.941,
"step": 9646
},
{
"epoch": 92.0,
"grad_norm": 1.5319263935089111,
"learning_rate": 4.000000000000001e-06,
"loss": 0.029,
"step": 9752
},
{
"epoch": 92.0,
"eval_LOCATION_f1": 0.8400000000000001,
"eval_LOCATION_number": 72,
"eval_LOCATION_precision": 0.8076923076923077,
"eval_LOCATION_recall": 0.875,
"eval_ORGANIZATION_f1": 0.7672955974842767,
"eval_ORGANIZATION_number": 75,
"eval_ORGANIZATION_precision": 0.7261904761904762,
"eval_ORGANIZATION_recall": 0.8133333333333334,
"eval_PERSON_f1": 0.9066666666666667,
"eval_PERSON_number": 143,
"eval_PERSON_precision": 0.8662420382165605,
"eval_PERSON_recall": 0.951048951048951,
"eval_QUANTITY_f1": 0.7169811320754716,
"eval_QUANTITY_number": 23,
"eval_QUANTITY_precision": 0.6333333333333333,
"eval_QUANTITY_recall": 0.8260869565217391,
"eval_TIME_f1": 0.8679245283018868,
"eval_TIME_number": 26,
"eval_TIME_precision": 0.8518518518518519,
"eval_TIME_recall": 0.8846153846153846,
"eval_loss": 0.19099955260753632,
"eval_overall_accuracy": 0.9604703527645734,
"eval_overall_f1": 0.8447552447552448,
"eval_overall_precision": 0.8031914893617021,
"eval_overall_recall": 0.8908554572271387,
"eval_runtime": 0.376,
"eval_samples_per_second": 497.396,
"eval_steps_per_second": 7.98,
"step": 9752
},
{
"epoch": 93.0,
"grad_norm": 0.5256904363632202,
"learning_rate": 3.5000000000000004e-06,
"loss": 0.0272,
"step": 9858
},
{
"epoch": 93.0,
"eval_LOCATION_f1": 0.8266666666666667,
"eval_LOCATION_number": 72,
"eval_LOCATION_precision": 0.7948717948717948,
"eval_LOCATION_recall": 0.8611111111111112,
"eval_ORGANIZATION_f1": 0.7530864197530864,
"eval_ORGANIZATION_number": 75,
"eval_ORGANIZATION_precision": 0.7011494252873564,
"eval_ORGANIZATION_recall": 0.8133333333333334,
"eval_PERSON_f1": 0.9066666666666667,
"eval_PERSON_number": 143,
"eval_PERSON_precision": 0.8662420382165605,
"eval_PERSON_recall": 0.951048951048951,
"eval_QUANTITY_f1": 0.6792452830188679,
"eval_QUANTITY_number": 23,
"eval_QUANTITY_precision": 0.6,
"eval_QUANTITY_recall": 0.782608695652174,
"eval_TIME_f1": 0.8679245283018868,
"eval_TIME_number": 26,
"eval_TIME_precision": 0.8518518518518519,
"eval_TIME_recall": 0.8846153846153846,
"eval_loss": 0.18842431902885437,
"eval_overall_accuracy": 0.9597197898423818,
"eval_overall_f1": 0.8356545961002785,
"eval_overall_precision": 0.7915567282321899,
"eval_overall_recall": 0.8849557522123894,
"eval_runtime": 0.3768,
"eval_samples_per_second": 496.302,
"eval_steps_per_second": 7.962,
"step": 9858
},
{
"epoch": 94.0,
"grad_norm": 1.0590431690216064,
"learning_rate": 3e-06,
"loss": 0.0282,
"step": 9964
},
{
"epoch": 94.0,
"eval_LOCATION_f1": 0.8266666666666667,
"eval_LOCATION_number": 72,
"eval_LOCATION_precision": 0.7948717948717948,
"eval_LOCATION_recall": 0.8611111111111112,
"eval_ORGANIZATION_f1": 0.7749999999999999,
"eval_ORGANIZATION_number": 75,
"eval_ORGANIZATION_precision": 0.7294117647058823,
"eval_ORGANIZATION_recall": 0.8266666666666667,
"eval_PERSON_f1": 0.9169435215946844,
"eval_PERSON_number": 143,
"eval_PERSON_precision": 0.8734177215189873,
"eval_PERSON_recall": 0.965034965034965,
"eval_QUANTITY_f1": 0.6415094339622641,
"eval_QUANTITY_number": 23,
"eval_QUANTITY_precision": 0.5666666666666667,
"eval_QUANTITY_recall": 0.7391304347826086,
"eval_TIME_f1": 0.8679245283018868,
"eval_TIME_number": 26,
"eval_TIME_precision": 0.8518518518518519,
"eval_TIME_recall": 0.8846153846153846,
"eval_loss": 0.1881646066904068,
"eval_overall_accuracy": 0.9609707280460346,
"eval_overall_f1": 0.8423988842398884,
"eval_overall_precision": 0.798941798941799,
"eval_overall_recall": 0.8908554572271387,
"eval_runtime": 0.3781,
"eval_samples_per_second": 494.612,
"eval_steps_per_second": 7.935,
"step": 9964
},
{
"epoch": 95.0,
"grad_norm": 0.05212884396314621,
"learning_rate": 2.5e-06,
"loss": 0.0288,
"step": 10070
},
{
"epoch": 95.0,
"eval_LOCATION_f1": 0.8266666666666667,
"eval_LOCATION_number": 72,
"eval_LOCATION_precision": 0.7948717948717948,
"eval_LOCATION_recall": 0.8611111111111112,
"eval_ORGANIZATION_f1": 0.7625,
"eval_ORGANIZATION_number": 75,
"eval_ORGANIZATION_precision": 0.7176470588235294,
"eval_ORGANIZATION_recall": 0.8133333333333334,
"eval_PERSON_f1": 0.903654485049834,
"eval_PERSON_number": 143,
"eval_PERSON_precision": 0.8607594936708861,
"eval_PERSON_recall": 0.951048951048951,
"eval_QUANTITY_f1": 0.6792452830188679,
"eval_QUANTITY_number": 23,
"eval_QUANTITY_precision": 0.6,
"eval_QUANTITY_recall": 0.782608695652174,
"eval_TIME_f1": 0.8679245283018868,
"eval_TIME_number": 26,
"eval_TIME_precision": 0.8518518518518519,
"eval_TIME_recall": 0.8846153846153846,
"eval_loss": 0.18959392607212067,
"eval_overall_accuracy": 0.9599699774831123,
"eval_overall_f1": 0.8368200836820084,
"eval_overall_precision": 0.7936507936507936,
"eval_overall_recall": 0.8849557522123894,
"eval_runtime": 0.3776,
"eval_samples_per_second": 495.273,
"eval_steps_per_second": 7.946,
"step": 10070
},
{
"epoch": 96.0,
"grad_norm": 0.0768834576010704,
"learning_rate": 2.0000000000000003e-06,
"loss": 0.028,
"step": 10176
},
{
"epoch": 96.0,
"eval_LOCATION_f1": 0.8266666666666667,
"eval_LOCATION_number": 72,
"eval_LOCATION_precision": 0.7948717948717948,
"eval_LOCATION_recall": 0.8611111111111112,
"eval_ORGANIZATION_f1": 0.7749999999999999,
"eval_ORGANIZATION_number": 75,
"eval_ORGANIZATION_precision": 0.7294117647058823,
"eval_ORGANIZATION_recall": 0.8266666666666667,
"eval_PERSON_f1": 0.910299003322259,
"eval_PERSON_number": 143,
"eval_PERSON_precision": 0.8670886075949367,
"eval_PERSON_recall": 0.958041958041958,
"eval_QUANTITY_f1": 0.6792452830188679,
"eval_QUANTITY_number": 23,
"eval_QUANTITY_precision": 0.6,
"eval_QUANTITY_recall": 0.782608695652174,
"eval_TIME_f1": 0.8679245283018868,
"eval_TIME_number": 26,
"eval_TIME_precision": 0.8518518518518519,
"eval_TIME_recall": 0.8846153846153846,
"eval_loss": 0.1877508908510208,
"eval_overall_accuracy": 0.9609707280460346,
"eval_overall_f1": 0.8423988842398884,
"eval_overall_precision": 0.798941798941799,
"eval_overall_recall": 0.8908554572271387,
"eval_runtime": 0.3767,
"eval_samples_per_second": 496.397,
"eval_steps_per_second": 7.964,
"step": 10176
},
{
"epoch": 97.0,
"grad_norm": 0.8987697958946228,
"learning_rate": 1.5e-06,
"loss": 0.028,
"step": 10282
},
{
"epoch": 97.0,
"eval_LOCATION_f1": 0.8266666666666667,
"eval_LOCATION_number": 72,
"eval_LOCATION_precision": 0.7948717948717948,
"eval_LOCATION_recall": 0.8611111111111112,
"eval_ORGANIZATION_f1": 0.7749999999999999,
"eval_ORGANIZATION_number": 75,
"eval_ORGANIZATION_precision": 0.7294117647058823,
"eval_ORGANIZATION_recall": 0.8266666666666667,
"eval_PERSON_f1": 0.910299003322259,
"eval_PERSON_number": 143,
"eval_PERSON_precision": 0.8670886075949367,
"eval_PERSON_recall": 0.958041958041958,
"eval_QUANTITY_f1": 0.6792452830188679,
"eval_QUANTITY_number": 23,
"eval_QUANTITY_precision": 0.6,
"eval_QUANTITY_recall": 0.782608695652174,
"eval_TIME_f1": 0.8679245283018868,
"eval_TIME_number": 26,
"eval_TIME_precision": 0.8518518518518519,
"eval_TIME_recall": 0.8846153846153846,
"eval_loss": 0.1894301176071167,
"eval_overall_accuracy": 0.9604703527645734,
"eval_overall_f1": 0.8423988842398884,
"eval_overall_precision": 0.798941798941799,
"eval_overall_recall": 0.8908554572271387,
"eval_runtime": 0.378,
"eval_samples_per_second": 494.727,
"eval_steps_per_second": 7.937,
"step": 10282
},
{
"epoch": 98.0,
"grad_norm": 0.4777444303035736,
"learning_rate": 1.0000000000000002e-06,
"loss": 0.0275,
"step": 10388
},
{
"epoch": 98.0,
"eval_LOCATION_f1": 0.8322147651006712,
"eval_LOCATION_number": 72,
"eval_LOCATION_precision": 0.8051948051948052,
"eval_LOCATION_recall": 0.8611111111111112,
"eval_ORGANIZATION_f1": 0.7749999999999999,
"eval_ORGANIZATION_number": 75,
"eval_ORGANIZATION_precision": 0.7294117647058823,
"eval_ORGANIZATION_recall": 0.8266666666666667,
"eval_PERSON_f1": 0.910299003322259,
"eval_PERSON_number": 143,
"eval_PERSON_precision": 0.8670886075949367,
"eval_PERSON_recall": 0.958041958041958,
"eval_QUANTITY_f1": 0.6792452830188679,
"eval_QUANTITY_number": 23,
"eval_QUANTITY_precision": 0.6,
"eval_QUANTITY_recall": 0.782608695652174,
"eval_TIME_f1": 0.8679245283018868,
"eval_TIME_number": 26,
"eval_TIME_precision": 0.8518518518518519,
"eval_TIME_recall": 0.8846153846153846,
"eval_loss": 0.18901941180229187,
"eval_overall_accuracy": 0.9604703527645734,
"eval_overall_f1": 0.8435754189944135,
"eval_overall_precision": 0.8010610079575596,
"eval_overall_recall": 0.8908554572271387,
"eval_runtime": 0.3785,
"eval_samples_per_second": 494.002,
"eval_steps_per_second": 7.925,
"step": 10388
},
{
"epoch": 99.0,
"grad_norm": 1.2922275066375732,
"learning_rate": 5.000000000000001e-07,
"loss": 0.0269,
"step": 10494
},
{
"epoch": 99.0,
"eval_LOCATION_f1": 0.8322147651006712,
"eval_LOCATION_number": 72,
"eval_LOCATION_precision": 0.8051948051948052,
"eval_LOCATION_recall": 0.8611111111111112,
"eval_ORGANIZATION_f1": 0.7749999999999999,
"eval_ORGANIZATION_number": 75,
"eval_ORGANIZATION_precision": 0.7294117647058823,
"eval_ORGANIZATION_recall": 0.8266666666666667,
"eval_PERSON_f1": 0.910299003322259,
"eval_PERSON_number": 143,
"eval_PERSON_precision": 0.8670886075949367,
"eval_PERSON_recall": 0.958041958041958,
"eval_QUANTITY_f1": 0.6792452830188679,
"eval_QUANTITY_number": 23,
"eval_QUANTITY_precision": 0.6,
"eval_QUANTITY_recall": 0.782608695652174,
"eval_TIME_f1": 0.8679245283018868,
"eval_TIME_number": 26,
"eval_TIME_precision": 0.8518518518518519,
"eval_TIME_recall": 0.8846153846153846,
"eval_loss": 0.19013750553131104,
"eval_overall_accuracy": 0.9604703527645734,
"eval_overall_f1": 0.8435754189944135,
"eval_overall_precision": 0.8010610079575596,
"eval_overall_recall": 0.8908554572271387,
"eval_runtime": 0.3764,
"eval_samples_per_second": 496.756,
"eval_steps_per_second": 7.969,
"step": 10494
},
{
"epoch": 100.0,
"grad_norm": 0.2882828414440155,
"learning_rate": 0.0,
"loss": 0.0282,
"step": 10600
},
{
"epoch": 100.0,
"eval_LOCATION_f1": 0.8322147651006712,
"eval_LOCATION_number": 72,
"eval_LOCATION_precision": 0.8051948051948052,
"eval_LOCATION_recall": 0.8611111111111112,
"eval_ORGANIZATION_f1": 0.7749999999999999,
"eval_ORGANIZATION_number": 75,
"eval_ORGANIZATION_precision": 0.7294117647058823,
"eval_ORGANIZATION_recall": 0.8266666666666667,
"eval_PERSON_f1": 0.910299003322259,
"eval_PERSON_number": 143,
"eval_PERSON_precision": 0.8670886075949367,
"eval_PERSON_recall": 0.958041958041958,
"eval_QUANTITY_f1": 0.6792452830188679,
"eval_QUANTITY_number": 23,
"eval_QUANTITY_precision": 0.6,
"eval_QUANTITY_recall": 0.782608695652174,
"eval_TIME_f1": 0.8679245283018868,
"eval_TIME_number": 26,
"eval_TIME_precision": 0.8518518518518519,
"eval_TIME_recall": 0.8846153846153846,
"eval_loss": 0.18969494104385376,
"eval_overall_accuracy": 0.9604703527645734,
"eval_overall_f1": 0.8435754189944135,
"eval_overall_precision": 0.8010610079575596,
"eval_overall_recall": 0.8908554572271387,
"eval_runtime": 0.3757,
"eval_samples_per_second": 497.683,
"eval_steps_per_second": 7.984,
"step": 10600
},
{
"epoch": 100.0,
"step": 10600,
"total_flos": 5023623771566022.0,
"train_loss": 0.076274028116802,
"train_runtime": 617.4793,
"train_samples_per_second": 273.208,
"train_steps_per_second": 17.167
}
],
"logging_steps": 500,
"max_steps": 10600,
"num_input_tokens_seen": 0,
"num_train_epochs": 100,
"save_steps": 500,
"total_flos": 5023623771566022.0,
"train_batch_size": 16,
"trial_name": null,
"trial_params": null
}