nerugm-lora-r8-4 / trainer_state.json
apwic's picture
End of training
b63d8cb verified
{
"best_metric": null,
"best_model_checkpoint": null,
"epoch": 100.0,
"eval_steps": 500,
"global_step": 10600,
"is_hyper_param_search": false,
"is_local_process_zero": true,
"is_world_process_zero": true,
"log_history": [
{
"epoch": 1.0,
"grad_norm": 1.6370744705200195,
"learning_rate": 4.9500000000000004e-05,
"loss": 1.2587,
"step": 106
},
{
"epoch": 1.0,
"eval_LOCATION_f1": 0.0,
"eval_LOCATION_number": 73,
"eval_LOCATION_precision": 0.0,
"eval_LOCATION_recall": 0.0,
"eval_ORGANIZATION_f1": 0.0,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.0,
"eval_ORGANIZATION_recall": 0.0,
"eval_PERSON_f1": 0.0,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.0,
"eval_PERSON_recall": 0.0,
"eval_QUANTITY_f1": 0.0,
"eval_QUANTITY_number": 29,
"eval_QUANTITY_precision": 0.0,
"eval_QUANTITY_recall": 0.0,
"eval_TIME_f1": 0.0,
"eval_TIME_number": 34,
"eval_TIME_precision": 0.0,
"eval_TIME_recall": 0.0,
"eval_loss": 0.7307424545288086,
"eval_overall_accuracy": 0.8365739601279842,
"eval_overall_f1": 0.0,
"eval_overall_precision": 0.0,
"eval_overall_recall": 0.0,
"eval_runtime": 0.3763,
"eval_samples_per_second": 496.93,
"eval_steps_per_second": 7.972,
"step": 106
},
{
"epoch": 2.0,
"grad_norm": 6.390524864196777,
"learning_rate": 4.9e-05,
"loss": 0.7063,
"step": 212
},
{
"epoch": 2.0,
"eval_LOCATION_f1": 0.0,
"eval_LOCATION_number": 73,
"eval_LOCATION_precision": 0.0,
"eval_LOCATION_recall": 0.0,
"eval_ORGANIZATION_f1": 0.0,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.0,
"eval_ORGANIZATION_recall": 0.0,
"eval_PERSON_f1": 0.012820512820512822,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.16666666666666666,
"eval_PERSON_recall": 0.006666666666666667,
"eval_QUANTITY_f1": 0.0,
"eval_QUANTITY_number": 29,
"eval_QUANTITY_precision": 0.0,
"eval_QUANTITY_recall": 0.0,
"eval_TIME_f1": 0.0,
"eval_TIME_number": 34,
"eval_TIME_precision": 0.0,
"eval_TIME_recall": 0.0,
"eval_loss": 0.6230493783950806,
"eval_overall_accuracy": 0.8375584543440807,
"eval_overall_f1": 0.005586592178770949,
"eval_overall_precision": 0.14285714285714285,
"eval_overall_recall": 0.002849002849002849,
"eval_runtime": 0.373,
"eval_samples_per_second": 501.355,
"eval_steps_per_second": 8.043,
"step": 212
},
{
"epoch": 3.0,
"grad_norm": 1.1493935585021973,
"learning_rate": 4.85e-05,
"loss": 0.612,
"step": 318
},
{
"epoch": 3.0,
"eval_LOCATION_f1": 0.02631578947368421,
"eval_LOCATION_number": 73,
"eval_LOCATION_precision": 0.3333333333333333,
"eval_LOCATION_recall": 0.0136986301369863,
"eval_ORGANIZATION_f1": 0.0,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.0,
"eval_ORGANIZATION_recall": 0.0,
"eval_PERSON_f1": 0.07100591715976332,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.3157894736842105,
"eval_PERSON_recall": 0.04,
"eval_QUANTITY_f1": 0.0,
"eval_QUANTITY_number": 29,
"eval_QUANTITY_precision": 0.0,
"eval_QUANTITY_recall": 0.0,
"eval_TIME_f1": 0.0,
"eval_TIME_number": 34,
"eval_TIME_precision": 0.0,
"eval_TIME_recall": 0.0,
"eval_loss": 0.5286092758178711,
"eval_overall_accuracy": 0.8437115431946838,
"eval_overall_f1": 0.036458333333333336,
"eval_overall_precision": 0.21212121212121213,
"eval_overall_recall": 0.019943019943019943,
"eval_runtime": 0.3703,
"eval_samples_per_second": 504.935,
"eval_steps_per_second": 8.101,
"step": 318
},
{
"epoch": 4.0,
"grad_norm": 1.3580924272537231,
"learning_rate": 4.8e-05,
"loss": 0.5187,
"step": 424
},
{
"epoch": 4.0,
"eval_LOCATION_f1": 0.16470588235294117,
"eval_LOCATION_number": 73,
"eval_LOCATION_precision": 0.5833333333333334,
"eval_LOCATION_recall": 0.0958904109589041,
"eval_ORGANIZATION_f1": 0.025641025641025644,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.07692307692307693,
"eval_ORGANIZATION_recall": 0.015384615384615385,
"eval_PERSON_f1": 0.2764227642276423,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.3541666666666667,
"eval_PERSON_recall": 0.22666666666666666,
"eval_QUANTITY_f1": 0.0,
"eval_QUANTITY_number": 29,
"eval_QUANTITY_precision": 0.0,
"eval_QUANTITY_recall": 0.0,
"eval_TIME_f1": 0.2692307692307692,
"eval_TIME_number": 34,
"eval_TIME_precision": 0.3888888888888889,
"eval_TIME_recall": 0.20588235294117646,
"eval_loss": 0.42886805534362793,
"eval_overall_accuracy": 0.8700467634752646,
"eval_overall_f1": 0.2,
"eval_overall_precision": 0.35251798561151076,
"eval_overall_recall": 0.1396011396011396,
"eval_runtime": 0.3714,
"eval_samples_per_second": 503.492,
"eval_steps_per_second": 8.077,
"step": 424
},
{
"epoch": 5.0,
"grad_norm": 1.2623740434646606,
"learning_rate": 4.75e-05,
"loss": 0.4206,
"step": 530
},
{
"epoch": 5.0,
"eval_LOCATION_f1": 0.40650406504065034,
"eval_LOCATION_number": 73,
"eval_LOCATION_precision": 0.5,
"eval_LOCATION_recall": 0.3424657534246575,
"eval_ORGANIZATION_f1": 0.2692307692307693,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.358974358974359,
"eval_ORGANIZATION_recall": 0.2153846153846154,
"eval_PERSON_f1": 0.6900958466453674,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.6625766871165644,
"eval_PERSON_recall": 0.72,
"eval_QUANTITY_f1": 0.05405405405405405,
"eval_QUANTITY_number": 29,
"eval_QUANTITY_precision": 0.125,
"eval_QUANTITY_recall": 0.034482758620689655,
"eval_TIME_f1": 0.5970149253731343,
"eval_TIME_number": 34,
"eval_TIME_precision": 0.6060606060606061,
"eval_TIME_recall": 0.5882352941176471,
"eval_loss": 0.34271273016929626,
"eval_overall_accuracy": 0.9094265321191238,
"eval_overall_f1": 0.5217391304347827,
"eval_overall_precision": 0.5733788395904437,
"eval_overall_recall": 0.47863247863247865,
"eval_runtime": 0.373,
"eval_samples_per_second": 501.316,
"eval_steps_per_second": 8.043,
"step": 530
},
{
"epoch": 6.0,
"grad_norm": 1.2327097654342651,
"learning_rate": 4.7e-05,
"loss": 0.3388,
"step": 636
},
{
"epoch": 6.0,
"eval_LOCATION_f1": 0.567741935483871,
"eval_LOCATION_number": 73,
"eval_LOCATION_precision": 0.5365853658536586,
"eval_LOCATION_recall": 0.6027397260273972,
"eval_ORGANIZATION_f1": 0.4122137404580153,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.4090909090909091,
"eval_ORGANIZATION_recall": 0.4153846153846154,
"eval_PERSON_f1": 0.7988165680473374,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.7180851063829787,
"eval_PERSON_recall": 0.9,
"eval_QUANTITY_f1": 0.3934426229508197,
"eval_QUANTITY_number": 29,
"eval_QUANTITY_precision": 0.375,
"eval_QUANTITY_recall": 0.41379310344827586,
"eval_TIME_f1": 0.7222222222222222,
"eval_TIME_number": 34,
"eval_TIME_precision": 0.6842105263157895,
"eval_TIME_recall": 0.7647058823529411,
"eval_loss": 0.2868286073207855,
"eval_overall_accuracy": 0.9271474280088604,
"eval_overall_f1": 0.6446499339498019,
"eval_overall_precision": 0.6009852216748769,
"eval_overall_recall": 0.6951566951566952,
"eval_runtime": 0.3765,
"eval_samples_per_second": 496.697,
"eval_steps_per_second": 7.968,
"step": 636
},
{
"epoch": 7.0,
"grad_norm": 6.483063697814941,
"learning_rate": 4.6500000000000005e-05,
"loss": 0.2819,
"step": 742
},
{
"epoch": 7.0,
"eval_LOCATION_f1": 0.588957055214724,
"eval_LOCATION_number": 73,
"eval_LOCATION_precision": 0.5333333333333333,
"eval_LOCATION_recall": 0.6575342465753424,
"eval_ORGANIZATION_f1": 0.4142857142857143,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.38666666666666666,
"eval_ORGANIZATION_recall": 0.4461538461538462,
"eval_PERSON_f1": 0.8217522658610271,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.7513812154696132,
"eval_PERSON_recall": 0.9066666666666666,
"eval_QUANTITY_f1": 0.43750000000000006,
"eval_QUANTITY_number": 29,
"eval_QUANTITY_precision": 0.4,
"eval_QUANTITY_recall": 0.4827586206896552,
"eval_TIME_f1": 0.7397260273972601,
"eval_TIME_number": 34,
"eval_TIME_precision": 0.6923076923076923,
"eval_TIME_recall": 0.7941176470588235,
"eval_loss": 0.2394540160894394,
"eval_overall_accuracy": 0.9308392813192222,
"eval_overall_f1": 0.6588845654993515,
"eval_overall_precision": 0.6047619047619047,
"eval_overall_recall": 0.7236467236467237,
"eval_runtime": 0.3729,
"eval_samples_per_second": 501.505,
"eval_steps_per_second": 8.046,
"step": 742
},
{
"epoch": 8.0,
"grad_norm": 1.2606326341629028,
"learning_rate": 4.600000000000001e-05,
"loss": 0.2487,
"step": 848
},
{
"epoch": 8.0,
"eval_LOCATION_f1": 0.658682634730539,
"eval_LOCATION_number": 73,
"eval_LOCATION_precision": 0.5851063829787234,
"eval_LOCATION_recall": 0.7534246575342466,
"eval_ORGANIZATION_f1": 0.4827586206896552,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.4375,
"eval_ORGANIZATION_recall": 0.5384615384615384,
"eval_PERSON_f1": 0.8292682926829269,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.7640449438202247,
"eval_PERSON_recall": 0.9066666666666666,
"eval_QUANTITY_f1": 0.41269841269841273,
"eval_QUANTITY_number": 29,
"eval_QUANTITY_precision": 0.38235294117647056,
"eval_QUANTITY_recall": 0.4482758620689655,
"eval_TIME_f1": 0.7297297297297296,
"eval_TIME_number": 34,
"eval_TIME_precision": 0.675,
"eval_TIME_recall": 0.7941176470588235,
"eval_loss": 0.21583667397499084,
"eval_overall_accuracy": 0.9362539995077529,
"eval_overall_f1": 0.6846846846846847,
"eval_overall_precision": 0.6244131455399061,
"eval_overall_recall": 0.7578347578347578,
"eval_runtime": 0.3731,
"eval_samples_per_second": 501.231,
"eval_steps_per_second": 8.041,
"step": 848
},
{
"epoch": 9.0,
"grad_norm": 2.007969856262207,
"learning_rate": 4.55e-05,
"loss": 0.2255,
"step": 954
},
{
"epoch": 9.0,
"eval_LOCATION_f1": 0.7023809523809524,
"eval_LOCATION_number": 73,
"eval_LOCATION_precision": 0.6210526315789474,
"eval_LOCATION_recall": 0.8082191780821918,
"eval_ORGANIZATION_f1": 0.5419354838709677,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.4666666666666667,
"eval_ORGANIZATION_recall": 0.6461538461538462,
"eval_PERSON_f1": 0.8395061728395062,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.7816091954022989,
"eval_PERSON_recall": 0.9066666666666666,
"eval_QUANTITY_f1": 0.4262295081967213,
"eval_QUANTITY_number": 29,
"eval_QUANTITY_precision": 0.40625,
"eval_QUANTITY_recall": 0.4482758620689655,
"eval_TIME_f1": 0.6933333333333332,
"eval_TIME_number": 34,
"eval_TIME_precision": 0.6341463414634146,
"eval_TIME_recall": 0.7647058823529411,
"eval_loss": 0.20087261497974396,
"eval_overall_accuracy": 0.9374846172778735,
"eval_overall_f1": 0.7049808429118773,
"eval_overall_precision": 0.6388888888888888,
"eval_overall_recall": 0.7863247863247863,
"eval_runtime": 0.3737,
"eval_samples_per_second": 500.448,
"eval_steps_per_second": 8.029,
"step": 954
},
{
"epoch": 10.0,
"grad_norm": 0.8239966630935669,
"learning_rate": 4.5e-05,
"loss": 0.2062,
"step": 1060
},
{
"epoch": 10.0,
"eval_LOCATION_f1": 0.7393939393939394,
"eval_LOCATION_number": 73,
"eval_LOCATION_precision": 0.6630434782608695,
"eval_LOCATION_recall": 0.8356164383561644,
"eval_ORGANIZATION_f1": 0.5822784810126582,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.4946236559139785,
"eval_ORGANIZATION_recall": 0.7076923076923077,
"eval_PERSON_f1": 0.8363636363636363,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.7666666666666667,
"eval_PERSON_recall": 0.92,
"eval_QUANTITY_f1": 0.5245901639344263,
"eval_QUANTITY_number": 29,
"eval_QUANTITY_precision": 0.5,
"eval_QUANTITY_recall": 0.5517241379310345,
"eval_TIME_f1": 0.7567567567567567,
"eval_TIME_number": 34,
"eval_TIME_precision": 0.7,
"eval_TIME_recall": 0.8235294117647058,
"eval_loss": 0.1920880824327469,
"eval_overall_accuracy": 0.9419148412503077,
"eval_overall_f1": 0.7335025380710659,
"eval_overall_precision": 0.6613272311212814,
"eval_overall_recall": 0.8233618233618234,
"eval_runtime": 0.3738,
"eval_samples_per_second": 500.32,
"eval_steps_per_second": 8.027,
"step": 1060
},
{
"epoch": 11.0,
"grad_norm": 1.5922843217849731,
"learning_rate": 4.4500000000000004e-05,
"loss": 0.1965,
"step": 1166
},
{
"epoch": 11.0,
"eval_LOCATION_f1": 0.7100591715976331,
"eval_LOCATION_number": 73,
"eval_LOCATION_precision": 0.625,
"eval_LOCATION_recall": 0.821917808219178,
"eval_ORGANIZATION_f1": 0.5889570552147239,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.4897959183673469,
"eval_ORGANIZATION_recall": 0.7384615384615385,
"eval_PERSON_f1": 0.8353658536585366,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.7696629213483146,
"eval_PERSON_recall": 0.9133333333333333,
"eval_QUANTITY_f1": 0.5538461538461539,
"eval_QUANTITY_number": 29,
"eval_QUANTITY_precision": 0.5,
"eval_QUANTITY_recall": 0.6206896551724138,
"eval_TIME_f1": 0.7272727272727273,
"eval_TIME_number": 34,
"eval_TIME_precision": 0.6511627906976745,
"eval_TIME_recall": 0.8235294117647058,
"eval_loss": 0.1852114200592041,
"eval_overall_accuracy": 0.9396997292640906,
"eval_overall_f1": 0.7256857855361597,
"eval_overall_precision": 0.6452328159645233,
"eval_overall_recall": 0.8290598290598291,
"eval_runtime": 0.3736,
"eval_samples_per_second": 500.574,
"eval_steps_per_second": 8.031,
"step": 1166
},
{
"epoch": 12.0,
"grad_norm": 1.42921781539917,
"learning_rate": 4.4000000000000006e-05,
"loss": 0.1818,
"step": 1272
},
{
"epoch": 12.0,
"eval_LOCATION_f1": 0.7529411764705882,
"eval_LOCATION_number": 73,
"eval_LOCATION_precision": 0.6597938144329897,
"eval_LOCATION_recall": 0.8767123287671232,
"eval_ORGANIZATION_f1": 0.5853658536585367,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.48484848484848486,
"eval_ORGANIZATION_recall": 0.7384615384615385,
"eval_PERSON_f1": 0.8421052631578947,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.7861271676300579,
"eval_PERSON_recall": 0.9066666666666666,
"eval_QUANTITY_f1": 0.5074626865671642,
"eval_QUANTITY_number": 29,
"eval_QUANTITY_precision": 0.4473684210526316,
"eval_QUANTITY_recall": 0.5862068965517241,
"eval_TIME_f1": 0.7341772151898734,
"eval_TIME_number": 34,
"eval_TIME_precision": 0.6444444444444445,
"eval_TIME_recall": 0.8529411764705882,
"eval_loss": 0.1793593168258667,
"eval_overall_accuracy": 0.9419148412503077,
"eval_overall_f1": 0.7322540473225404,
"eval_overall_precision": 0.6504424778761062,
"eval_overall_recall": 0.8376068376068376,
"eval_runtime": 0.3724,
"eval_samples_per_second": 502.093,
"eval_steps_per_second": 8.055,
"step": 1272
},
{
"epoch": 13.0,
"grad_norm": 1.1510792970657349,
"learning_rate": 4.35e-05,
"loss": 0.1747,
"step": 1378
},
{
"epoch": 13.0,
"eval_LOCATION_f1": 0.7560975609756097,
"eval_LOCATION_number": 73,
"eval_LOCATION_precision": 0.6813186813186813,
"eval_LOCATION_recall": 0.8493150684931506,
"eval_ORGANIZATION_f1": 0.6233766233766234,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.5393258426966292,
"eval_ORGANIZATION_recall": 0.7384615384615385,
"eval_PERSON_f1": 0.8369230769230769,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.7771428571428571,
"eval_PERSON_recall": 0.9066666666666666,
"eval_QUANTITY_f1": 0.6031746031746031,
"eval_QUANTITY_number": 29,
"eval_QUANTITY_precision": 0.5588235294117647,
"eval_QUANTITY_recall": 0.6551724137931034,
"eval_TIME_f1": 0.767123287671233,
"eval_TIME_number": 34,
"eval_TIME_precision": 0.717948717948718,
"eval_TIME_recall": 0.8235294117647058,
"eval_loss": 0.16559341549873352,
"eval_overall_accuracy": 0.94683731233079,
"eval_overall_f1": 0.7522464698331193,
"eval_overall_precision": 0.6845794392523364,
"eval_overall_recall": 0.8347578347578347,
"eval_runtime": 0.3729,
"eval_samples_per_second": 501.412,
"eval_steps_per_second": 8.044,
"step": 1378
},
{
"epoch": 14.0,
"grad_norm": 1.169286847114563,
"learning_rate": 4.3e-05,
"loss": 0.1723,
"step": 1484
},
{
"epoch": 14.0,
"eval_LOCATION_f1": 0.7701863354037267,
"eval_LOCATION_number": 73,
"eval_LOCATION_precision": 0.7045454545454546,
"eval_LOCATION_recall": 0.8493150684931506,
"eval_ORGANIZATION_f1": 0.6012269938650306,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.5,
"eval_ORGANIZATION_recall": 0.7538461538461538,
"eval_PERSON_f1": 0.8500000000000001,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.8,
"eval_PERSON_recall": 0.9066666666666666,
"eval_QUANTITY_f1": 0.5538461538461539,
"eval_QUANTITY_number": 29,
"eval_QUANTITY_precision": 0.5,
"eval_QUANTITY_recall": 0.6206896551724138,
"eval_TIME_f1": 0.717948717948718,
"eval_TIME_number": 34,
"eval_TIME_precision": 0.6363636363636364,
"eval_TIME_recall": 0.8235294117647058,
"eval_loss": 0.16448074579238892,
"eval_overall_accuracy": 0.9456066945606695,
"eval_overall_f1": 0.7445997458703939,
"eval_overall_precision": 0.6720183486238532,
"eval_overall_recall": 0.8347578347578347,
"eval_runtime": 0.3743,
"eval_samples_per_second": 499.558,
"eval_steps_per_second": 8.014,
"step": 1484
},
{
"epoch": 15.0,
"grad_norm": 1.2472301721572876,
"learning_rate": 4.25e-05,
"loss": 0.1626,
"step": 1590
},
{
"epoch": 15.0,
"eval_LOCATION_f1": 0.75,
"eval_LOCATION_number": 73,
"eval_LOCATION_precision": 0.6631578947368421,
"eval_LOCATION_recall": 0.863013698630137,
"eval_ORGANIZATION_f1": 0.6,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.5052631578947369,
"eval_ORGANIZATION_recall": 0.7384615384615385,
"eval_PERSON_f1": 0.8473520249221183,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.7953216374269005,
"eval_PERSON_recall": 0.9066666666666666,
"eval_QUANTITY_f1": 0.5671641791044776,
"eval_QUANTITY_number": 29,
"eval_QUANTITY_precision": 0.5,
"eval_QUANTITY_recall": 0.6551724137931034,
"eval_TIME_f1": 0.7692307692307693,
"eval_TIME_number": 34,
"eval_TIME_precision": 0.6818181818181818,
"eval_TIME_recall": 0.8823529411764706,
"eval_loss": 0.16658160090446472,
"eval_overall_accuracy": 0.9441299532365247,
"eval_overall_f1": 0.7455919395465995,
"eval_overall_precision": 0.6681715575620768,
"eval_overall_recall": 0.8433048433048433,
"eval_runtime": 0.373,
"eval_samples_per_second": 501.282,
"eval_steps_per_second": 8.042,
"step": 1590
},
{
"epoch": 16.0,
"grad_norm": 1.5230070352554321,
"learning_rate": 4.2e-05,
"loss": 0.1582,
"step": 1696
},
{
"epoch": 16.0,
"eval_LOCATION_f1": 0.7393939393939394,
"eval_LOCATION_number": 73,
"eval_LOCATION_precision": 0.6630434782608695,
"eval_LOCATION_recall": 0.8356164383561644,
"eval_ORGANIZATION_f1": 0.6274509803921569,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.5454545454545454,
"eval_ORGANIZATION_recall": 0.7384615384615385,
"eval_PERSON_f1": 0.8526645768025077,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.8047337278106509,
"eval_PERSON_recall": 0.9066666666666666,
"eval_QUANTITY_f1": 0.6567164179104478,
"eval_QUANTITY_number": 29,
"eval_QUANTITY_precision": 0.5789473684210527,
"eval_QUANTITY_recall": 0.7586206896551724,
"eval_TIME_f1": 0.7435897435897436,
"eval_TIME_number": 34,
"eval_TIME_precision": 0.6590909090909091,
"eval_TIME_recall": 0.8529411764705882,
"eval_loss": 0.15897247195243835,
"eval_overall_accuracy": 0.9473295594388383,
"eval_overall_f1": 0.7570332480818415,
"eval_overall_precision": 0.6867749419953596,
"eval_overall_recall": 0.8433048433048433,
"eval_runtime": 0.3746,
"eval_samples_per_second": 499.228,
"eval_steps_per_second": 8.009,
"step": 1696
},
{
"epoch": 17.0,
"grad_norm": 0.6365993618965149,
"learning_rate": 4.15e-05,
"loss": 0.1556,
"step": 1802
},
{
"epoch": 17.0,
"eval_LOCATION_f1": 0.7607361963190183,
"eval_LOCATION_number": 73,
"eval_LOCATION_precision": 0.6888888888888889,
"eval_LOCATION_recall": 0.8493150684931506,
"eval_ORGANIZATION_f1": 0.6075949367088608,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.5161290322580645,
"eval_ORGANIZATION_recall": 0.7384615384615385,
"eval_PERSON_f1": 0.8500000000000001,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.8,
"eval_PERSON_recall": 0.9066666666666666,
"eval_QUANTITY_f1": 0.6268656716417911,
"eval_QUANTITY_number": 29,
"eval_QUANTITY_precision": 0.5526315789473685,
"eval_QUANTITY_recall": 0.7241379310344828,
"eval_TIME_f1": 0.7692307692307693,
"eval_TIME_number": 34,
"eval_TIME_precision": 0.6818181818181818,
"eval_TIME_recall": 0.8823529411764706,
"eval_loss": 0.16090132296085358,
"eval_overall_accuracy": 0.9470834358848141,
"eval_overall_f1": 0.7557251908396947,
"eval_overall_precision": 0.6827586206896552,
"eval_overall_recall": 0.8461538461538461,
"eval_runtime": 0.3703,
"eval_samples_per_second": 505.047,
"eval_steps_per_second": 8.102,
"step": 1802
},
{
"epoch": 18.0,
"grad_norm": 1.4139217138290405,
"learning_rate": 4.1e-05,
"loss": 0.1521,
"step": 1908
},
{
"epoch": 18.0,
"eval_LOCATION_f1": 0.7701863354037267,
"eval_LOCATION_number": 73,
"eval_LOCATION_precision": 0.7045454545454546,
"eval_LOCATION_recall": 0.8493150684931506,
"eval_ORGANIZATION_f1": 0.6193548387096774,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.5333333333333333,
"eval_ORGANIZATION_recall": 0.7384615384615385,
"eval_PERSON_f1": 0.8616352201257862,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.8154761904761905,
"eval_PERSON_recall": 0.9133333333333333,
"eval_QUANTITY_f1": 0.6363636363636365,
"eval_QUANTITY_number": 29,
"eval_QUANTITY_precision": 0.5675675675675675,
"eval_QUANTITY_recall": 0.7241379310344828,
"eval_TIME_f1": 0.8051948051948051,
"eval_TIME_number": 34,
"eval_TIME_precision": 0.7209302325581395,
"eval_TIME_recall": 0.9117647058823529,
"eval_loss": 0.15284273028373718,
"eval_overall_accuracy": 0.9497907949790795,
"eval_overall_f1": 0.7696267696267697,
"eval_overall_precision": 0.7018779342723005,
"eval_overall_recall": 0.8518518518518519,
"eval_runtime": 0.3713,
"eval_samples_per_second": 503.701,
"eval_steps_per_second": 8.081,
"step": 1908
},
{
"epoch": 19.0,
"grad_norm": 0.8368671536445618,
"learning_rate": 4.05e-05,
"loss": 0.1507,
"step": 2014
},
{
"epoch": 19.0,
"eval_LOCATION_f1": 0.7749999999999999,
"eval_LOCATION_number": 73,
"eval_LOCATION_precision": 0.7126436781609196,
"eval_LOCATION_recall": 0.8493150684931506,
"eval_ORGANIZATION_f1": 0.6289308176100629,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.5319148936170213,
"eval_ORGANIZATION_recall": 0.7692307692307693,
"eval_PERSON_f1": 0.8490566037735849,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.8035714285714286,
"eval_PERSON_recall": 0.9,
"eval_QUANTITY_f1": 0.6060606060606061,
"eval_QUANTITY_number": 29,
"eval_QUANTITY_precision": 0.5405405405405406,
"eval_QUANTITY_recall": 0.6896551724137931,
"eval_TIME_f1": 0.8051948051948051,
"eval_TIME_number": 34,
"eval_TIME_precision": 0.7209302325581395,
"eval_TIME_recall": 0.9117647058823529,
"eval_loss": 0.15364685654640198,
"eval_overall_accuracy": 0.9490524243170071,
"eval_overall_f1": 0.764102564102564,
"eval_overall_precision": 0.6946386946386947,
"eval_overall_recall": 0.8490028490028491,
"eval_runtime": 0.3717,
"eval_samples_per_second": 503.112,
"eval_steps_per_second": 8.071,
"step": 2014
},
{
"epoch": 20.0,
"grad_norm": 1.1445201635360718,
"learning_rate": 4e-05,
"loss": 0.1426,
"step": 2120
},
{
"epoch": 20.0,
"eval_LOCATION_f1": 0.7749999999999999,
"eval_LOCATION_number": 73,
"eval_LOCATION_precision": 0.7126436781609196,
"eval_LOCATION_recall": 0.8493150684931506,
"eval_ORGANIZATION_f1": 0.6216216216216216,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.5542168674698795,
"eval_ORGANIZATION_recall": 0.7076923076923077,
"eval_PERSON_f1": 0.8544303797468354,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.8132530120481928,
"eval_PERSON_recall": 0.9,
"eval_QUANTITY_f1": 0.5757575757575758,
"eval_QUANTITY_number": 29,
"eval_QUANTITY_precision": 0.5135135135135135,
"eval_QUANTITY_recall": 0.6551724137931034,
"eval_TIME_f1": 0.8051948051948051,
"eval_TIME_number": 34,
"eval_TIME_precision": 0.7209302325581395,
"eval_TIME_recall": 0.9117647058823529,
"eval_loss": 0.14918731153011322,
"eval_overall_accuracy": 0.9500369185331036,
"eval_overall_f1": 0.7640156453715775,
"eval_overall_precision": 0.7043269230769231,
"eval_overall_recall": 0.8347578347578347,
"eval_runtime": 0.3707,
"eval_samples_per_second": 504.495,
"eval_steps_per_second": 8.094,
"step": 2120
},
{
"epoch": 21.0,
"grad_norm": 1.6204472780227661,
"learning_rate": 3.9500000000000005e-05,
"loss": 0.1406,
"step": 2226
},
{
"epoch": 21.0,
"eval_LOCATION_f1": 0.7875,
"eval_LOCATION_number": 73,
"eval_LOCATION_precision": 0.7241379310344828,
"eval_LOCATION_recall": 0.863013698630137,
"eval_ORGANIZATION_f1": 0.6308724832214766,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.5595238095238095,
"eval_ORGANIZATION_recall": 0.7230769230769231,
"eval_PERSON_f1": 0.8454258675078864,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.8023952095808383,
"eval_PERSON_recall": 0.8933333333333333,
"eval_QUANTITY_f1": 0.6060606060606061,
"eval_QUANTITY_number": 29,
"eval_QUANTITY_precision": 0.5405405405405406,
"eval_QUANTITY_recall": 0.6896551724137931,
"eval_TIME_f1": 0.8157894736842106,
"eval_TIME_number": 34,
"eval_TIME_precision": 0.7380952380952381,
"eval_TIME_recall": 0.9117647058823529,
"eval_loss": 0.14743082225322723,
"eval_overall_accuracy": 0.9524981540733448,
"eval_overall_f1": 0.7682291666666666,
"eval_overall_precision": 0.7074340527577938,
"eval_overall_recall": 0.8404558404558404,
"eval_runtime": 0.3736,
"eval_samples_per_second": 500.485,
"eval_steps_per_second": 8.029,
"step": 2226
},
{
"epoch": 22.0,
"grad_norm": 1.1964826583862305,
"learning_rate": 3.9000000000000006e-05,
"loss": 0.1375,
"step": 2332
},
{
"epoch": 22.0,
"eval_LOCATION_f1": 0.7682926829268293,
"eval_LOCATION_number": 73,
"eval_LOCATION_precision": 0.6923076923076923,
"eval_LOCATION_recall": 0.863013698630137,
"eval_ORGANIZATION_f1": 0.6163522012578616,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.5212765957446809,
"eval_ORGANIZATION_recall": 0.7538461538461538,
"eval_PERSON_f1": 0.8500000000000001,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.8,
"eval_PERSON_recall": 0.9066666666666666,
"eval_QUANTITY_f1": 0.6363636363636365,
"eval_QUANTITY_number": 29,
"eval_QUANTITY_precision": 0.5675675675675675,
"eval_QUANTITY_recall": 0.7241379310344828,
"eval_TIME_f1": 0.8051948051948051,
"eval_TIME_number": 34,
"eval_TIME_precision": 0.7209302325581395,
"eval_TIME_recall": 0.9117647058823529,
"eval_loss": 0.15313014388084412,
"eval_overall_accuracy": 0.9478218065468865,
"eval_overall_f1": 0.7633587786259542,
"eval_overall_precision": 0.6896551724137931,
"eval_overall_recall": 0.8547008547008547,
"eval_runtime": 0.3721,
"eval_samples_per_second": 502.581,
"eval_steps_per_second": 8.063,
"step": 2332
},
{
"epoch": 23.0,
"grad_norm": 1.223521113395691,
"learning_rate": 3.85e-05,
"loss": 0.1359,
"step": 2438
},
{
"epoch": 23.0,
"eval_LOCATION_f1": 0.7848101265822783,
"eval_LOCATION_number": 73,
"eval_LOCATION_precision": 0.7294117647058823,
"eval_LOCATION_recall": 0.8493150684931506,
"eval_ORGANIZATION_f1": 0.6455696202531646,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.5483870967741935,
"eval_ORGANIZATION_recall": 0.7846153846153846,
"eval_PERSON_f1": 0.8580441640378549,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.8143712574850299,
"eval_PERSON_recall": 0.9066666666666666,
"eval_QUANTITY_f1": 0.6363636363636365,
"eval_QUANTITY_number": 29,
"eval_QUANTITY_precision": 0.5675675675675675,
"eval_QUANTITY_recall": 0.7241379310344828,
"eval_TIME_f1": 0.8311688311688312,
"eval_TIME_number": 34,
"eval_TIME_precision": 0.7441860465116279,
"eval_TIME_recall": 0.9411764705882353,
"eval_loss": 0.1469704806804657,
"eval_overall_accuracy": 0.9527442776273689,
"eval_overall_f1": 0.7783505154639175,
"eval_overall_precision": 0.7105882352941176,
"eval_overall_recall": 0.8603988603988604,
"eval_runtime": 0.3724,
"eval_samples_per_second": 502.165,
"eval_steps_per_second": 8.056,
"step": 2438
},
{
"epoch": 24.0,
"grad_norm": 1.477795958518982,
"learning_rate": 3.8e-05,
"loss": 0.1326,
"step": 2544
},
{
"epoch": 24.0,
"eval_LOCATION_f1": 0.7901234567901235,
"eval_LOCATION_number": 73,
"eval_LOCATION_precision": 0.7191011235955056,
"eval_LOCATION_recall": 0.8767123287671232,
"eval_ORGANIZATION_f1": 0.6363636363636364,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.550561797752809,
"eval_ORGANIZATION_recall": 0.7538461538461538,
"eval_PERSON_f1": 0.8634920634920634,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.8242424242424242,
"eval_PERSON_recall": 0.9066666666666666,
"eval_QUANTITY_f1": 0.6666666666666667,
"eval_QUANTITY_number": 29,
"eval_QUANTITY_precision": 0.5945945945945946,
"eval_QUANTITY_recall": 0.7586206896551724,
"eval_TIME_f1": 0.8051948051948051,
"eval_TIME_number": 34,
"eval_TIME_precision": 0.7209302325581395,
"eval_TIME_recall": 0.9117647058823529,
"eval_loss": 0.15083272755146027,
"eval_overall_accuracy": 0.9517597834112724,
"eval_overall_f1": 0.7803617571059431,
"eval_overall_precision": 0.7139479905437353,
"eval_overall_recall": 0.8603988603988604,
"eval_runtime": 0.3717,
"eval_samples_per_second": 503.084,
"eval_steps_per_second": 8.071,
"step": 2544
},
{
"epoch": 25.0,
"grad_norm": 1.213571310043335,
"learning_rate": 3.7500000000000003e-05,
"loss": 0.1278,
"step": 2650
},
{
"epoch": 25.0,
"eval_LOCATION_f1": 0.7730061349693251,
"eval_LOCATION_number": 73,
"eval_LOCATION_precision": 0.7,
"eval_LOCATION_recall": 0.863013698630137,
"eval_ORGANIZATION_f1": 0.6289308176100629,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.5319148936170213,
"eval_ORGANIZATION_recall": 0.7692307692307693,
"eval_PERSON_f1": 0.8634920634920634,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.8242424242424242,
"eval_PERSON_recall": 0.9066666666666666,
"eval_QUANTITY_f1": 0.6865671641791046,
"eval_QUANTITY_number": 29,
"eval_QUANTITY_precision": 0.6052631578947368,
"eval_QUANTITY_recall": 0.7931034482758621,
"eval_TIME_f1": 0.8051948051948051,
"eval_TIME_number": 34,
"eval_TIME_precision": 0.7209302325581395,
"eval_TIME_recall": 0.9117647058823529,
"eval_loss": 0.1542501598596573,
"eval_overall_accuracy": 0.9492985478710313,
"eval_overall_f1": 0.7759282970550576,
"eval_overall_precision": 0.7046511627906977,
"eval_overall_recall": 0.8632478632478633,
"eval_runtime": 0.373,
"eval_samples_per_second": 501.402,
"eval_steps_per_second": 8.044,
"step": 2650
},
{
"epoch": 26.0,
"grad_norm": 1.678344488143921,
"learning_rate": 3.7e-05,
"loss": 0.1302,
"step": 2756
},
{
"epoch": 26.0,
"eval_LOCATION_f1": 0.7721518987341772,
"eval_LOCATION_number": 73,
"eval_LOCATION_precision": 0.7176470588235294,
"eval_LOCATION_recall": 0.8356164383561644,
"eval_ORGANIZATION_f1": 0.6040268456375838,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.5357142857142857,
"eval_ORGANIZATION_recall": 0.6923076923076923,
"eval_PERSON_f1": 0.8544303797468354,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.8132530120481928,
"eval_PERSON_recall": 0.9,
"eval_QUANTITY_f1": 0.6461538461538462,
"eval_QUANTITY_number": 29,
"eval_QUANTITY_precision": 0.5833333333333334,
"eval_QUANTITY_recall": 0.7241379310344828,
"eval_TIME_f1": 0.8051948051948051,
"eval_TIME_number": 34,
"eval_TIME_precision": 0.7209302325581395,
"eval_TIME_recall": 0.9117647058823529,
"eval_loss": 0.14476777613162994,
"eval_overall_accuracy": 0.9505291656411519,
"eval_overall_f1": 0.7660130718954249,
"eval_overall_precision": 0.7077294685990339,
"eval_overall_recall": 0.8347578347578347,
"eval_runtime": 0.3715,
"eval_samples_per_second": 503.403,
"eval_steps_per_second": 8.076,
"step": 2756
},
{
"epoch": 27.0,
"grad_norm": 1.0448905229568481,
"learning_rate": 3.65e-05,
"loss": 0.1266,
"step": 2862
},
{
"epoch": 27.0,
"eval_LOCATION_f1": 0.7672955974842768,
"eval_LOCATION_number": 73,
"eval_LOCATION_precision": 0.7093023255813954,
"eval_LOCATION_recall": 0.8356164383561644,
"eval_ORGANIZATION_f1": 0.6308724832214766,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.5595238095238095,
"eval_ORGANIZATION_recall": 0.7230769230769231,
"eval_PERSON_f1": 0.8726114649681529,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.8353658536585366,
"eval_PERSON_recall": 0.9133333333333333,
"eval_QUANTITY_f1": 0.6666666666666667,
"eval_QUANTITY_number": 29,
"eval_QUANTITY_precision": 0.5945945945945946,
"eval_QUANTITY_recall": 0.7586206896551724,
"eval_TIME_f1": 0.8157894736842106,
"eval_TIME_number": 34,
"eval_TIME_precision": 0.7380952380952381,
"eval_TIME_recall": 0.9117647058823529,
"eval_loss": 0.14498956501483917,
"eval_overall_accuracy": 0.9527442776273689,
"eval_overall_f1": 0.7801047120418848,
"eval_overall_precision": 0.7215496368038741,
"eval_overall_recall": 0.8490028490028491,
"eval_runtime": 0.3706,
"eval_samples_per_second": 504.535,
"eval_steps_per_second": 8.094,
"step": 2862
},
{
"epoch": 28.0,
"grad_norm": 1.1935324668884277,
"learning_rate": 3.6e-05,
"loss": 0.1244,
"step": 2968
},
{
"epoch": 28.0,
"eval_LOCATION_f1": 0.7607361963190183,
"eval_LOCATION_number": 73,
"eval_LOCATION_precision": 0.6888888888888889,
"eval_LOCATION_recall": 0.8493150684931506,
"eval_ORGANIZATION_f1": 0.6490066225165563,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.5697674418604651,
"eval_ORGANIZATION_recall": 0.7538461538461538,
"eval_PERSON_f1": 0.8726114649681529,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.8353658536585366,
"eval_PERSON_recall": 0.9133333333333333,
"eval_QUANTITY_f1": 0.6567164179104478,
"eval_QUANTITY_number": 29,
"eval_QUANTITY_precision": 0.5789473684210527,
"eval_QUANTITY_recall": 0.7586206896551724,
"eval_TIME_f1": 0.7792207792207793,
"eval_TIME_number": 34,
"eval_TIME_precision": 0.6976744186046512,
"eval_TIME_recall": 0.8823529411764706,
"eval_loss": 0.14751355350017548,
"eval_overall_accuracy": 0.9520059069652966,
"eval_overall_f1": 0.7772020725388602,
"eval_overall_precision": 0.7125890736342043,
"eval_overall_recall": 0.8547008547008547,
"eval_runtime": 0.3712,
"eval_samples_per_second": 503.765,
"eval_steps_per_second": 8.082,
"step": 2968
},
{
"epoch": 29.0,
"grad_norm": 1.6158292293548584,
"learning_rate": 3.55e-05,
"loss": 0.1223,
"step": 3074
},
{
"epoch": 29.0,
"eval_LOCATION_f1": 0.7852760736196318,
"eval_LOCATION_number": 73,
"eval_LOCATION_precision": 0.7111111111111111,
"eval_LOCATION_recall": 0.8767123287671232,
"eval_ORGANIZATION_f1": 0.6363636363636364,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.550561797752809,
"eval_ORGANIZATION_recall": 0.7538461538461538,
"eval_PERSON_f1": 0.8726114649681529,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.8353658536585366,
"eval_PERSON_recall": 0.9133333333333333,
"eval_QUANTITY_f1": 0.6363636363636365,
"eval_QUANTITY_number": 29,
"eval_QUANTITY_precision": 0.5675675675675675,
"eval_QUANTITY_recall": 0.7241379310344828,
"eval_TIME_f1": 0.7792207792207793,
"eval_TIME_number": 34,
"eval_TIME_precision": 0.6976744186046512,
"eval_TIME_recall": 0.8823529411764706,
"eval_loss": 0.15049177408218384,
"eval_overall_accuracy": 0.950775289195176,
"eval_overall_f1": 0.7777777777777778,
"eval_overall_precision": 0.7115839243498818,
"eval_overall_recall": 0.8575498575498576,
"eval_runtime": 0.3729,
"eval_samples_per_second": 501.493,
"eval_steps_per_second": 8.045,
"step": 3074
},
{
"epoch": 30.0,
"grad_norm": 4.963561534881592,
"learning_rate": 3.5e-05,
"loss": 0.1216,
"step": 3180
},
{
"epoch": 30.0,
"eval_LOCATION_f1": 0.7721518987341772,
"eval_LOCATION_number": 73,
"eval_LOCATION_precision": 0.7176470588235294,
"eval_LOCATION_recall": 0.8356164383561644,
"eval_ORGANIZATION_f1": 0.6388888888888888,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.5822784810126582,
"eval_ORGANIZATION_recall": 0.7076923076923077,
"eval_PERSON_f1": 0.8634920634920634,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.8242424242424242,
"eval_PERSON_recall": 0.9066666666666666,
"eval_QUANTITY_f1": 0.6349206349206349,
"eval_QUANTITY_number": 29,
"eval_QUANTITY_precision": 0.5882352941176471,
"eval_QUANTITY_recall": 0.6896551724137931,
"eval_TIME_f1": 0.8767123287671232,
"eval_TIME_number": 34,
"eval_TIME_precision": 0.8205128205128205,
"eval_TIME_recall": 0.9411764705882353,
"eval_loss": 0.14033010601997375,
"eval_overall_accuracy": 0.9537287718434654,
"eval_overall_f1": 0.7835325365205843,
"eval_overall_precision": 0.7338308457711443,
"eval_overall_recall": 0.8404558404558404,
"eval_runtime": 0.3709,
"eval_samples_per_second": 504.137,
"eval_steps_per_second": 8.088,
"step": 3180
},
{
"epoch": 31.0,
"grad_norm": 0.5298508405685425,
"learning_rate": 3.45e-05,
"loss": 0.1197,
"step": 3286
},
{
"epoch": 31.0,
"eval_LOCATION_f1": 0.7672955974842768,
"eval_LOCATION_number": 73,
"eval_LOCATION_precision": 0.7093023255813954,
"eval_LOCATION_recall": 0.8356164383561644,
"eval_ORGANIZATION_f1": 0.6394557823129251,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.573170731707317,
"eval_ORGANIZATION_recall": 0.7230769230769231,
"eval_PERSON_f1": 0.8789808917197452,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.8414634146341463,
"eval_PERSON_recall": 0.92,
"eval_QUANTITY_f1": 0.6875,
"eval_QUANTITY_number": 29,
"eval_QUANTITY_precision": 0.6285714285714286,
"eval_QUANTITY_recall": 0.7586206896551724,
"eval_TIME_f1": 0.8266666666666665,
"eval_TIME_number": 34,
"eval_TIME_precision": 0.7560975609756098,
"eval_TIME_recall": 0.9117647058823529,
"eval_loss": 0.1418294459581375,
"eval_overall_accuracy": 0.9534826482894413,
"eval_overall_f1": 0.787878787878788,
"eval_overall_precision": 0.7328431372549019,
"eval_overall_recall": 0.8518518518518519,
"eval_runtime": 0.3711,
"eval_samples_per_second": 503.888,
"eval_steps_per_second": 8.084,
"step": 3286
},
{
"epoch": 32.0,
"grad_norm": 2.2755866050720215,
"learning_rate": 3.4000000000000007e-05,
"loss": 0.1175,
"step": 3392
},
{
"epoch": 32.0,
"eval_LOCATION_f1": 0.7749999999999999,
"eval_LOCATION_number": 73,
"eval_LOCATION_precision": 0.7126436781609196,
"eval_LOCATION_recall": 0.8493150684931506,
"eval_ORGANIZATION_f1": 0.6535947712418302,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.5681818181818182,
"eval_ORGANIZATION_recall": 0.7692307692307693,
"eval_PERSON_f1": 0.8789808917197452,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.8414634146341463,
"eval_PERSON_recall": 0.92,
"eval_QUANTITY_f1": 0.6666666666666667,
"eval_QUANTITY_number": 29,
"eval_QUANTITY_precision": 0.5945945945945946,
"eval_QUANTITY_recall": 0.7586206896551724,
"eval_TIME_f1": 0.7894736842105262,
"eval_TIME_number": 34,
"eval_TIME_precision": 0.7142857142857143,
"eval_TIME_recall": 0.8823529411764706,
"eval_loss": 0.14501163363456726,
"eval_overall_accuracy": 0.9527442776273689,
"eval_overall_f1": 0.7854356306892067,
"eval_overall_precision": 0.722488038277512,
"eval_overall_recall": 0.8603988603988604,
"eval_runtime": 0.3706,
"eval_samples_per_second": 504.644,
"eval_steps_per_second": 8.096,
"step": 3392
},
{
"epoch": 33.0,
"grad_norm": 1.624603033065796,
"learning_rate": 3.35e-05,
"loss": 0.1178,
"step": 3498
},
{
"epoch": 33.0,
"eval_LOCATION_f1": 0.7749999999999999,
"eval_LOCATION_number": 73,
"eval_LOCATION_precision": 0.7126436781609196,
"eval_LOCATION_recall": 0.8493150684931506,
"eval_ORGANIZATION_f1": 0.6266666666666667,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.5529411764705883,
"eval_ORGANIZATION_recall": 0.7230769230769231,
"eval_PERSON_f1": 0.8634920634920634,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.8242424242424242,
"eval_PERSON_recall": 0.9066666666666666,
"eval_QUANTITY_f1": 0.71875,
"eval_QUANTITY_number": 29,
"eval_QUANTITY_precision": 0.6571428571428571,
"eval_QUANTITY_recall": 0.7931034482758621,
"eval_TIME_f1": 0.8157894736842106,
"eval_TIME_number": 34,
"eval_TIME_precision": 0.7380952380952381,
"eval_TIME_recall": 0.9117647058823529,
"eval_loss": 0.14197108149528503,
"eval_overall_accuracy": 0.9520059069652966,
"eval_overall_f1": 0.7816993464052289,
"eval_overall_precision": 0.7222222222222222,
"eval_overall_recall": 0.8518518518518519,
"eval_runtime": 0.3733,
"eval_samples_per_second": 500.895,
"eval_steps_per_second": 8.036,
"step": 3498
},
{
"epoch": 34.0,
"grad_norm": 1.45547616481781,
"learning_rate": 3.3e-05,
"loss": 0.1142,
"step": 3604
},
{
"epoch": 34.0,
"eval_LOCATION_f1": 0.7749999999999999,
"eval_LOCATION_number": 73,
"eval_LOCATION_precision": 0.7126436781609196,
"eval_LOCATION_recall": 0.8493150684931506,
"eval_ORGANIZATION_f1": 0.6351351351351351,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.5662650602409639,
"eval_ORGANIZATION_recall": 0.7230769230769231,
"eval_PERSON_f1": 0.8726114649681529,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.8353658536585366,
"eval_PERSON_recall": 0.9133333333333333,
"eval_QUANTITY_f1": 0.7076923076923076,
"eval_QUANTITY_number": 29,
"eval_QUANTITY_precision": 0.6388888888888888,
"eval_QUANTITY_recall": 0.7931034482758621,
"eval_TIME_f1": 0.7894736842105262,
"eval_TIME_number": 34,
"eval_TIME_precision": 0.7142857142857143,
"eval_TIME_recall": 0.8823529411764706,
"eval_loss": 0.14198823273181915,
"eval_overall_accuracy": 0.9532365247354172,
"eval_overall_f1": 0.7837483617300132,
"eval_overall_precision": 0.7257281553398058,
"eval_overall_recall": 0.8518518518518519,
"eval_runtime": 0.3712,
"eval_samples_per_second": 503.726,
"eval_steps_per_second": 8.081,
"step": 3604
},
{
"epoch": 35.0,
"grad_norm": 1.698808193206787,
"learning_rate": 3.2500000000000004e-05,
"loss": 0.1159,
"step": 3710
},
{
"epoch": 35.0,
"eval_LOCATION_f1": 0.7875,
"eval_LOCATION_number": 73,
"eval_LOCATION_precision": 0.7241379310344828,
"eval_LOCATION_recall": 0.863013698630137,
"eval_ORGANIZATION_f1": 0.64,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.5647058823529412,
"eval_ORGANIZATION_recall": 0.7384615384615385,
"eval_PERSON_f1": 0.8789808917197452,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.8414634146341463,
"eval_PERSON_recall": 0.92,
"eval_QUANTITY_f1": 0.7058823529411765,
"eval_QUANTITY_number": 29,
"eval_QUANTITY_precision": 0.6153846153846154,
"eval_QUANTITY_recall": 0.8275862068965517,
"eval_TIME_f1": 0.7894736842105262,
"eval_TIME_number": 34,
"eval_TIME_precision": 0.7142857142857143,
"eval_TIME_recall": 0.8823529411764706,
"eval_loss": 0.14497017860412598,
"eval_overall_accuracy": 0.9532365247354172,
"eval_overall_f1": 0.7890625,
"eval_overall_precision": 0.7266187050359713,
"eval_overall_recall": 0.8632478632478633,
"eval_runtime": 0.372,
"eval_samples_per_second": 502.715,
"eval_steps_per_second": 8.065,
"step": 3710
},
{
"epoch": 36.0,
"grad_norm": 0.9385290741920471,
"learning_rate": 3.2000000000000005e-05,
"loss": 0.1131,
"step": 3816
},
{
"epoch": 36.0,
"eval_LOCATION_f1": 0.7777777777777778,
"eval_LOCATION_number": 73,
"eval_LOCATION_precision": 0.7078651685393258,
"eval_LOCATION_recall": 0.863013698630137,
"eval_ORGANIZATION_f1": 0.6490066225165563,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.5697674418604651,
"eval_ORGANIZATION_recall": 0.7538461538461538,
"eval_PERSON_f1": 0.8753993610223643,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.8404907975460123,
"eval_PERSON_recall": 0.9133333333333333,
"eval_QUANTITY_f1": 0.7076923076923076,
"eval_QUANTITY_number": 29,
"eval_QUANTITY_precision": 0.6388888888888888,
"eval_QUANTITY_recall": 0.7931034482758621,
"eval_TIME_f1": 0.7894736842105262,
"eval_TIME_number": 34,
"eval_TIME_precision": 0.7142857142857143,
"eval_TIME_recall": 0.8823529411764706,
"eval_loss": 0.14353057742118835,
"eval_overall_accuracy": 0.9539748953974896,
"eval_overall_f1": 0.78748370273794,
"eval_overall_precision": 0.7259615384615384,
"eval_overall_recall": 0.8603988603988604,
"eval_runtime": 0.3701,
"eval_samples_per_second": 505.324,
"eval_steps_per_second": 8.107,
"step": 3816
},
{
"epoch": 37.0,
"grad_norm": 1.1011046171188354,
"learning_rate": 3.15e-05,
"loss": 0.113,
"step": 3922
},
{
"epoch": 37.0,
"eval_LOCATION_f1": 0.7701863354037267,
"eval_LOCATION_number": 73,
"eval_LOCATION_precision": 0.7045454545454546,
"eval_LOCATION_recall": 0.8493150684931506,
"eval_ORGANIZATION_f1": 0.638036809815951,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.5306122448979592,
"eval_ORGANIZATION_recall": 0.8,
"eval_PERSON_f1": 0.8616352201257862,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.8154761904761905,
"eval_PERSON_recall": 0.9133333333333333,
"eval_QUANTITY_f1": 0.6470588235294118,
"eval_QUANTITY_number": 29,
"eval_QUANTITY_precision": 0.5641025641025641,
"eval_QUANTITY_recall": 0.7586206896551724,
"eval_TIME_f1": 0.7792207792207793,
"eval_TIME_number": 34,
"eval_TIME_precision": 0.6976744186046512,
"eval_TIME_recall": 0.8823529411764706,
"eval_loss": 0.15234865248203278,
"eval_overall_accuracy": 0.9492985478710313,
"eval_overall_f1": 0.7700127064803051,
"eval_overall_precision": 0.694954128440367,
"eval_overall_recall": 0.8632478632478633,
"eval_runtime": 0.3713,
"eval_samples_per_second": 503.679,
"eval_steps_per_second": 8.08,
"step": 3922
},
{
"epoch": 38.0,
"grad_norm": 0.7849928736686707,
"learning_rate": 3.1e-05,
"loss": 0.1122,
"step": 4028
},
{
"epoch": 38.0,
"eval_LOCATION_f1": 0.7848101265822783,
"eval_LOCATION_number": 73,
"eval_LOCATION_precision": 0.7294117647058823,
"eval_LOCATION_recall": 0.8493150684931506,
"eval_ORGANIZATION_f1": 0.6527777777777777,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.5949367088607594,
"eval_ORGANIZATION_recall": 0.7230769230769231,
"eval_PERSON_f1": 0.8643533123028392,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.8203592814371258,
"eval_PERSON_recall": 0.9133333333333333,
"eval_QUANTITY_f1": 0.6666666666666667,
"eval_QUANTITY_number": 29,
"eval_QUANTITY_precision": 0.5945945945945946,
"eval_QUANTITY_recall": 0.7586206896551724,
"eval_TIME_f1": 0.7894736842105262,
"eval_TIME_number": 34,
"eval_TIME_precision": 0.7142857142857143,
"eval_TIME_recall": 0.8823529411764706,
"eval_loss": 0.14123748242855072,
"eval_overall_accuracy": 0.9534826482894413,
"eval_overall_f1": 0.7831800262812089,
"eval_overall_precision": 0.7268292682926829,
"eval_overall_recall": 0.8490028490028491,
"eval_runtime": 0.3726,
"eval_samples_per_second": 501.941,
"eval_steps_per_second": 8.053,
"step": 4028
},
{
"epoch": 39.0,
"grad_norm": 3.6088364124298096,
"learning_rate": 3.05e-05,
"loss": 0.1097,
"step": 4134
},
{
"epoch": 39.0,
"eval_LOCATION_f1": 0.7875,
"eval_LOCATION_number": 73,
"eval_LOCATION_precision": 0.7241379310344828,
"eval_LOCATION_recall": 0.863013698630137,
"eval_ORGANIZATION_f1": 0.641025641025641,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.5494505494505495,
"eval_ORGANIZATION_recall": 0.7692307692307693,
"eval_PERSON_f1": 0.8761904761904761,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.8363636363636363,
"eval_PERSON_recall": 0.92,
"eval_QUANTITY_f1": 0.6865671641791046,
"eval_QUANTITY_number": 29,
"eval_QUANTITY_precision": 0.6052631578947368,
"eval_QUANTITY_recall": 0.7931034482758621,
"eval_TIME_f1": 0.7894736842105262,
"eval_TIME_number": 34,
"eval_TIME_precision": 0.7142857142857143,
"eval_TIME_recall": 0.8823529411764706,
"eval_loss": 0.14366811513900757,
"eval_overall_accuracy": 0.9532365247354172,
"eval_overall_f1": 0.7855297157622738,
"eval_overall_precision": 0.7186761229314421,
"eval_overall_recall": 0.8660968660968661,
"eval_runtime": 0.3719,
"eval_samples_per_second": 502.835,
"eval_steps_per_second": 8.067,
"step": 4134
},
{
"epoch": 40.0,
"grad_norm": 0.650290846824646,
"learning_rate": 3e-05,
"loss": 0.1098,
"step": 4240
},
{
"epoch": 40.0,
"eval_LOCATION_f1": 0.779874213836478,
"eval_LOCATION_number": 73,
"eval_LOCATION_precision": 0.7209302325581395,
"eval_LOCATION_recall": 0.8493150684931506,
"eval_ORGANIZATION_f1": 0.6490066225165563,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.5697674418604651,
"eval_ORGANIZATION_recall": 0.7538461538461538,
"eval_PERSON_f1": 0.8726114649681529,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.8353658536585366,
"eval_PERSON_recall": 0.9133333333333333,
"eval_QUANTITY_f1": 0.6865671641791046,
"eval_QUANTITY_number": 29,
"eval_QUANTITY_precision": 0.6052631578947368,
"eval_QUANTITY_recall": 0.7931034482758621,
"eval_TIME_f1": 0.7894736842105262,
"eval_TIME_number": 34,
"eval_TIME_precision": 0.7142857142857143,
"eval_TIME_recall": 0.8823529411764706,
"eval_loss": 0.14134834706783295,
"eval_overall_accuracy": 0.9539748953974896,
"eval_overall_f1": 0.7848761408083441,
"eval_overall_precision": 0.7235576923076923,
"eval_overall_recall": 0.8575498575498576,
"eval_runtime": 0.374,
"eval_samples_per_second": 500.058,
"eval_steps_per_second": 8.022,
"step": 4240
},
{
"epoch": 41.0,
"grad_norm": 1.017473816871643,
"learning_rate": 2.95e-05,
"loss": 0.1078,
"step": 4346
},
{
"epoch": 41.0,
"eval_LOCATION_f1": 0.7974683544303799,
"eval_LOCATION_number": 73,
"eval_LOCATION_precision": 0.7411764705882353,
"eval_LOCATION_recall": 0.863013698630137,
"eval_ORGANIZATION_f1": 0.6533333333333333,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.5764705882352941,
"eval_ORGANIZATION_recall": 0.7538461538461538,
"eval_PERSON_f1": 0.8598726114649682,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.823170731707317,
"eval_PERSON_recall": 0.9,
"eval_QUANTITY_f1": 0.6567164179104478,
"eval_QUANTITY_number": 29,
"eval_QUANTITY_precision": 0.5789473684210527,
"eval_QUANTITY_recall": 0.7586206896551724,
"eval_TIME_f1": 0.7894736842105262,
"eval_TIME_number": 34,
"eval_TIME_precision": 0.7142857142857143,
"eval_TIME_recall": 0.8823529411764706,
"eval_loss": 0.14262568950653076,
"eval_overall_accuracy": 0.9534826482894413,
"eval_overall_f1": 0.7816993464052289,
"eval_overall_precision": 0.7222222222222222,
"eval_overall_recall": 0.8518518518518519,
"eval_runtime": 0.3727,
"eval_samples_per_second": 501.78,
"eval_steps_per_second": 8.05,
"step": 4346
},
{
"epoch": 42.0,
"grad_norm": 0.8548632264137268,
"learning_rate": 2.9e-05,
"loss": 0.1095,
"step": 4452
},
{
"epoch": 42.0,
"eval_LOCATION_f1": 0.7875,
"eval_LOCATION_number": 73,
"eval_LOCATION_precision": 0.7241379310344828,
"eval_LOCATION_recall": 0.863013698630137,
"eval_ORGANIZATION_f1": 0.6369426751592356,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.5434782608695652,
"eval_ORGANIZATION_recall": 0.7692307692307693,
"eval_PERSON_f1": 0.8626198083067093,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.8282208588957055,
"eval_PERSON_recall": 0.9,
"eval_QUANTITY_f1": 0.6086956521739131,
"eval_QUANTITY_number": 29,
"eval_QUANTITY_precision": 0.525,
"eval_QUANTITY_recall": 0.7241379310344828,
"eval_TIME_f1": 0.7894736842105262,
"eval_TIME_number": 34,
"eval_TIME_precision": 0.7142857142857143,
"eval_TIME_recall": 0.8823529411764706,
"eval_loss": 0.1465131938457489,
"eval_overall_accuracy": 0.9524981540733448,
"eval_overall_f1": 0.7716129032258064,
"eval_overall_precision": 0.7051886792452831,
"eval_overall_recall": 0.8518518518518519,
"eval_runtime": 0.3727,
"eval_samples_per_second": 501.757,
"eval_steps_per_second": 8.05,
"step": 4452
},
{
"epoch": 43.0,
"grad_norm": 0.9329050183296204,
"learning_rate": 2.8499999999999998e-05,
"loss": 0.1082,
"step": 4558
},
{
"epoch": 43.0,
"eval_LOCATION_f1": 0.779874213836478,
"eval_LOCATION_number": 73,
"eval_LOCATION_precision": 0.7209302325581395,
"eval_LOCATION_recall": 0.8493150684931506,
"eval_ORGANIZATION_f1": 0.6530612244897959,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.5853658536585366,
"eval_ORGANIZATION_recall": 0.7384615384615385,
"eval_PERSON_f1": 0.8670886075949367,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.8253012048192772,
"eval_PERSON_recall": 0.9133333333333333,
"eval_QUANTITY_f1": 0.6865671641791046,
"eval_QUANTITY_number": 29,
"eval_QUANTITY_precision": 0.6052631578947368,
"eval_QUANTITY_recall": 0.7931034482758621,
"eval_TIME_f1": 0.7894736842105262,
"eval_TIME_number": 34,
"eval_TIME_precision": 0.7142857142857143,
"eval_TIME_recall": 0.8823529411764706,
"eval_loss": 0.14095118641853333,
"eval_overall_accuracy": 0.9542210189515137,
"eval_overall_f1": 0.7843137254901961,
"eval_overall_precision": 0.7246376811594203,
"eval_overall_recall": 0.8547008547008547,
"eval_runtime": 0.3721,
"eval_samples_per_second": 502.528,
"eval_steps_per_second": 8.062,
"step": 4558
},
{
"epoch": 44.0,
"grad_norm": 3.2247750759124756,
"learning_rate": 2.8000000000000003e-05,
"loss": 0.1065,
"step": 4664
},
{
"epoch": 44.0,
"eval_LOCATION_f1": 0.7924528301886793,
"eval_LOCATION_number": 73,
"eval_LOCATION_precision": 0.7325581395348837,
"eval_LOCATION_recall": 0.863013698630137,
"eval_ORGANIZATION_f1": 0.6530612244897959,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.5853658536585366,
"eval_ORGANIZATION_recall": 0.7384615384615385,
"eval_PERSON_f1": 0.8607594936708859,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.8192771084337349,
"eval_PERSON_recall": 0.9066666666666666,
"eval_QUANTITY_f1": 0.6666666666666667,
"eval_QUANTITY_number": 29,
"eval_QUANTITY_precision": 0.5945945945945946,
"eval_QUANTITY_recall": 0.7586206896551724,
"eval_TIME_f1": 0.8,
"eval_TIME_number": 34,
"eval_TIME_precision": 0.7317073170731707,
"eval_TIME_recall": 0.8823529411764706,
"eval_loss": 0.13867002725601196,
"eval_overall_accuracy": 0.9542210189515137,
"eval_overall_f1": 0.7837483617300132,
"eval_overall_precision": 0.7257281553398058,
"eval_overall_recall": 0.8518518518518519,
"eval_runtime": 0.3721,
"eval_samples_per_second": 502.486,
"eval_steps_per_second": 8.061,
"step": 4664
},
{
"epoch": 45.0,
"grad_norm": 3.5815913677215576,
"learning_rate": 2.7500000000000004e-05,
"loss": 0.1058,
"step": 4770
},
{
"epoch": 45.0,
"eval_LOCATION_f1": 0.8050314465408805,
"eval_LOCATION_number": 73,
"eval_LOCATION_precision": 0.7441860465116279,
"eval_LOCATION_recall": 0.8767123287671232,
"eval_ORGANIZATION_f1": 0.6666666666666666,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.5975609756097561,
"eval_ORGANIZATION_recall": 0.7538461538461538,
"eval_PERSON_f1": 0.8706624605678233,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.8263473053892215,
"eval_PERSON_recall": 0.92,
"eval_QUANTITY_f1": 0.676923076923077,
"eval_QUANTITY_number": 29,
"eval_QUANTITY_precision": 0.6111111111111112,
"eval_QUANTITY_recall": 0.7586206896551724,
"eval_TIME_f1": 0.8,
"eval_TIME_number": 34,
"eval_TIME_precision": 0.7317073170731707,
"eval_TIME_recall": 0.8823529411764706,
"eval_loss": 0.13923799991607666,
"eval_overall_accuracy": 0.9554516367216342,
"eval_overall_f1": 0.7942332896461337,
"eval_overall_precision": 0.7354368932038835,
"eval_overall_recall": 0.8632478632478633,
"eval_runtime": 0.3704,
"eval_samples_per_second": 504.88,
"eval_steps_per_second": 8.1,
"step": 4770
},
{
"epoch": 46.0,
"grad_norm": 2.907482624053955,
"learning_rate": 2.7000000000000002e-05,
"loss": 0.1033,
"step": 4876
},
{
"epoch": 46.0,
"eval_LOCATION_f1": 0.7848101265822783,
"eval_LOCATION_number": 73,
"eval_LOCATION_precision": 0.7294117647058823,
"eval_LOCATION_recall": 0.8493150684931506,
"eval_ORGANIZATION_f1": 0.6530612244897959,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.5853658536585366,
"eval_ORGANIZATION_recall": 0.7384615384615385,
"eval_PERSON_f1": 0.8717948717948718,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.8395061728395061,
"eval_PERSON_recall": 0.9066666666666666,
"eval_QUANTITY_f1": 0.65625,
"eval_QUANTITY_number": 29,
"eval_QUANTITY_precision": 0.6,
"eval_QUANTITY_recall": 0.7241379310344828,
"eval_TIME_f1": 0.8,
"eval_TIME_number": 34,
"eval_TIME_precision": 0.7317073170731707,
"eval_TIME_recall": 0.8823529411764706,
"eval_loss": 0.1363789588212967,
"eval_overall_accuracy": 0.9542210189515137,
"eval_overall_f1": 0.7857142857142856,
"eval_overall_precision": 0.7333333333333333,
"eval_overall_recall": 0.8461538461538461,
"eval_runtime": 0.3755,
"eval_samples_per_second": 497.945,
"eval_steps_per_second": 7.988,
"step": 4876
},
{
"epoch": 47.0,
"grad_norm": 1.325737714767456,
"learning_rate": 2.6500000000000004e-05,
"loss": 0.1057,
"step": 4982
},
{
"epoch": 47.0,
"eval_LOCATION_f1": 0.7875,
"eval_LOCATION_number": 73,
"eval_LOCATION_precision": 0.7241379310344828,
"eval_LOCATION_recall": 0.863013698630137,
"eval_ORGANIZATION_f1": 0.6533333333333333,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.5764705882352941,
"eval_ORGANIZATION_recall": 0.7538461538461538,
"eval_PERSON_f1": 0.8761904761904761,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.8363636363636363,
"eval_PERSON_recall": 0.92,
"eval_QUANTITY_f1": 0.676470588235294,
"eval_QUANTITY_number": 29,
"eval_QUANTITY_precision": 0.5897435897435898,
"eval_QUANTITY_recall": 0.7931034482758621,
"eval_TIME_f1": 0.7894736842105262,
"eval_TIME_number": 34,
"eval_TIME_precision": 0.7142857142857143,
"eval_TIME_recall": 0.8823529411764706,
"eval_loss": 0.1410611867904663,
"eval_overall_accuracy": 0.9547132660595619,
"eval_overall_f1": 0.788036410923277,
"eval_overall_precision": 0.7248803827751196,
"eval_overall_recall": 0.8632478632478633,
"eval_runtime": 0.3717,
"eval_samples_per_second": 503.064,
"eval_steps_per_second": 8.071,
"step": 4982
},
{
"epoch": 48.0,
"grad_norm": 6.672816753387451,
"learning_rate": 2.6000000000000002e-05,
"loss": 0.1062,
"step": 5088
},
{
"epoch": 48.0,
"eval_LOCATION_f1": 0.8050314465408805,
"eval_LOCATION_number": 73,
"eval_LOCATION_precision": 0.7441860465116279,
"eval_LOCATION_recall": 0.8767123287671232,
"eval_ORGANIZATION_f1": 0.6712328767123288,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.6049382716049383,
"eval_ORGANIZATION_recall": 0.7538461538461538,
"eval_PERSON_f1": 0.8769716088328076,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.8323353293413174,
"eval_PERSON_recall": 0.9266666666666666,
"eval_QUANTITY_f1": 0.6865671641791046,
"eval_QUANTITY_number": 29,
"eval_QUANTITY_precision": 0.6052631578947368,
"eval_QUANTITY_recall": 0.7931034482758621,
"eval_TIME_f1": 0.7894736842105262,
"eval_TIME_number": 34,
"eval_TIME_precision": 0.7142857142857143,
"eval_TIME_recall": 0.8823529411764706,
"eval_loss": 0.14320684969425201,
"eval_overall_accuracy": 0.9547132660595619,
"eval_overall_f1": 0.7973856209150327,
"eval_overall_precision": 0.7367149758454107,
"eval_overall_recall": 0.8689458689458689,
"eval_runtime": 0.373,
"eval_samples_per_second": 501.285,
"eval_steps_per_second": 8.042,
"step": 5088
},
{
"epoch": 49.0,
"grad_norm": 0.6894783973693848,
"learning_rate": 2.5500000000000003e-05,
"loss": 0.1006,
"step": 5194
},
{
"epoch": 49.0,
"eval_LOCATION_f1": 0.7924528301886793,
"eval_LOCATION_number": 73,
"eval_LOCATION_precision": 0.7325581395348837,
"eval_LOCATION_recall": 0.863013698630137,
"eval_ORGANIZATION_f1": 0.6666666666666666,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.5975609756097561,
"eval_ORGANIZATION_recall": 0.7538461538461538,
"eval_PERSON_f1": 0.8761904761904761,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.8363636363636363,
"eval_PERSON_recall": 0.92,
"eval_QUANTITY_f1": 0.676923076923077,
"eval_QUANTITY_number": 29,
"eval_QUANTITY_precision": 0.6111111111111112,
"eval_QUANTITY_recall": 0.7586206896551724,
"eval_TIME_f1": 0.7894736842105262,
"eval_TIME_number": 34,
"eval_TIME_precision": 0.7142857142857143,
"eval_TIME_recall": 0.8823529411764706,
"eval_loss": 0.14069923758506775,
"eval_overall_accuracy": 0.9552055131676102,
"eval_overall_f1": 0.7926509186351706,
"eval_overall_precision": 0.7347931873479319,
"eval_overall_recall": 0.8603988603988604,
"eval_runtime": 0.3698,
"eval_samples_per_second": 505.727,
"eval_steps_per_second": 8.113,
"step": 5194
},
{
"epoch": 50.0,
"grad_norm": 1.443442463874817,
"learning_rate": 2.5e-05,
"loss": 0.1004,
"step": 5300
},
{
"epoch": 50.0,
"eval_LOCATION_f1": 0.8050314465408805,
"eval_LOCATION_number": 73,
"eval_LOCATION_precision": 0.7441860465116279,
"eval_LOCATION_recall": 0.8767123287671232,
"eval_ORGANIZATION_f1": 0.6622516556291391,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.5813953488372093,
"eval_ORGANIZATION_recall": 0.7692307692307693,
"eval_PERSON_f1": 0.879746835443038,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.8373493975903614,
"eval_PERSON_recall": 0.9266666666666666,
"eval_QUANTITY_f1": 0.6363636363636365,
"eval_QUANTITY_number": 29,
"eval_QUANTITY_precision": 0.5675675675675675,
"eval_QUANTITY_recall": 0.7241379310344828,
"eval_TIME_f1": 0.7894736842105262,
"eval_TIME_number": 34,
"eval_TIME_precision": 0.7142857142857143,
"eval_TIME_recall": 0.8823529411764706,
"eval_loss": 0.14033810794353485,
"eval_overall_accuracy": 0.9544671425055378,
"eval_overall_f1": 0.7916666666666666,
"eval_overall_precision": 0.7290167865707434,
"eval_overall_recall": 0.8660968660968661,
"eval_runtime": 0.3746,
"eval_samples_per_second": 499.192,
"eval_steps_per_second": 8.008,
"step": 5300
},
{
"epoch": 51.0,
"grad_norm": 1.2972335815429688,
"learning_rate": 2.45e-05,
"loss": 0.1004,
"step": 5406
},
{
"epoch": 51.0,
"eval_LOCATION_f1": 0.779874213836478,
"eval_LOCATION_number": 73,
"eval_LOCATION_precision": 0.7209302325581395,
"eval_LOCATION_recall": 0.8493150684931506,
"eval_ORGANIZATION_f1": 0.6577181208053692,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.5833333333333334,
"eval_ORGANIZATION_recall": 0.7538461538461538,
"eval_PERSON_f1": 0.8734177215189873,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.8313253012048193,
"eval_PERSON_recall": 0.92,
"eval_QUANTITY_f1": 0.6461538461538462,
"eval_QUANTITY_number": 29,
"eval_QUANTITY_precision": 0.5833333333333334,
"eval_QUANTITY_recall": 0.7241379310344828,
"eval_TIME_f1": 0.7894736842105262,
"eval_TIME_number": 34,
"eval_TIME_precision": 0.7142857142857143,
"eval_TIME_recall": 0.8823529411764706,
"eval_loss": 0.13990922272205353,
"eval_overall_accuracy": 0.9544671425055378,
"eval_overall_f1": 0.7843137254901961,
"eval_overall_precision": 0.7246376811594203,
"eval_overall_recall": 0.8547008547008547,
"eval_runtime": 0.3718,
"eval_samples_per_second": 502.948,
"eval_steps_per_second": 8.069,
"step": 5406
},
{
"epoch": 52.0,
"grad_norm": 1.4539422988891602,
"learning_rate": 2.4e-05,
"loss": 0.1,
"step": 5512
},
{
"epoch": 52.0,
"eval_LOCATION_f1": 0.7924528301886793,
"eval_LOCATION_number": 73,
"eval_LOCATION_precision": 0.7325581395348837,
"eval_LOCATION_recall": 0.863013698630137,
"eval_ORGANIZATION_f1": 0.6621621621621622,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.5903614457831325,
"eval_ORGANIZATION_recall": 0.7538461538461538,
"eval_PERSON_f1": 0.8734177215189873,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.8313253012048193,
"eval_PERSON_recall": 0.92,
"eval_QUANTITY_f1": 0.676470588235294,
"eval_QUANTITY_number": 29,
"eval_QUANTITY_precision": 0.5897435897435898,
"eval_QUANTITY_recall": 0.7931034482758621,
"eval_TIME_f1": 0.7894736842105262,
"eval_TIME_number": 34,
"eval_TIME_precision": 0.7142857142857143,
"eval_TIME_recall": 0.8823529411764706,
"eval_loss": 0.14225150644779205,
"eval_overall_accuracy": 0.9542210189515137,
"eval_overall_f1": 0.7900912646675359,
"eval_overall_precision": 0.7283653846153846,
"eval_overall_recall": 0.8632478632478633,
"eval_runtime": 0.3752,
"eval_samples_per_second": 498.425,
"eval_steps_per_second": 7.996,
"step": 5512
},
{
"epoch": 53.0,
"grad_norm": 1.7125135660171509,
"learning_rate": 2.35e-05,
"loss": 0.099,
"step": 5618
},
{
"epoch": 53.0,
"eval_LOCATION_f1": 0.779874213836478,
"eval_LOCATION_number": 73,
"eval_LOCATION_precision": 0.7209302325581395,
"eval_LOCATION_recall": 0.8493150684931506,
"eval_ORGANIZATION_f1": 0.6375000000000001,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.5368421052631579,
"eval_ORGANIZATION_recall": 0.7846153846153846,
"eval_PERSON_f1": 0.8698412698412699,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.8303030303030303,
"eval_PERSON_recall": 0.9133333333333333,
"eval_QUANTITY_f1": 0.6666666666666666,
"eval_QUANTITY_number": 29,
"eval_QUANTITY_precision": 0.575,
"eval_QUANTITY_recall": 0.7931034482758621,
"eval_TIME_f1": 0.7792207792207793,
"eval_TIME_number": 34,
"eval_TIME_precision": 0.6976744186046512,
"eval_TIME_recall": 0.8823529411764706,
"eval_loss": 0.1469447910785675,
"eval_overall_accuracy": 0.9524981540733448,
"eval_overall_f1": 0.7769230769230769,
"eval_overall_precision": 0.7062937062937062,
"eval_overall_recall": 0.8632478632478633,
"eval_runtime": 0.3719,
"eval_samples_per_second": 502.81,
"eval_steps_per_second": 8.066,
"step": 5618
},
{
"epoch": 54.0,
"grad_norm": 1.7067456245422363,
"learning_rate": 2.3000000000000003e-05,
"loss": 0.0966,
"step": 5724
},
{
"epoch": 54.0,
"eval_LOCATION_f1": 0.7672955974842768,
"eval_LOCATION_number": 73,
"eval_LOCATION_precision": 0.7093023255813954,
"eval_LOCATION_recall": 0.8356164383561644,
"eval_ORGANIZATION_f1": 0.6580645161290322,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.5666666666666667,
"eval_ORGANIZATION_recall": 0.7846153846153846,
"eval_PERSON_f1": 0.8662420382165605,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.8292682926829268,
"eval_PERSON_recall": 0.9066666666666666,
"eval_QUANTITY_f1": 0.676923076923077,
"eval_QUANTITY_number": 29,
"eval_QUANTITY_precision": 0.6111111111111112,
"eval_QUANTITY_recall": 0.7586206896551724,
"eval_TIME_f1": 0.7894736842105262,
"eval_TIME_number": 34,
"eval_TIME_precision": 0.7142857142857143,
"eval_TIME_recall": 0.8823529411764706,
"eval_loss": 0.1407339721918106,
"eval_overall_accuracy": 0.9527442776273689,
"eval_overall_f1": 0.7802340702210663,
"eval_overall_precision": 0.7177033492822966,
"eval_overall_recall": 0.8547008547008547,
"eval_runtime": 0.3741,
"eval_samples_per_second": 499.806,
"eval_steps_per_second": 8.018,
"step": 5724
},
{
"epoch": 55.0,
"grad_norm": 1.2333046197891235,
"learning_rate": 2.25e-05,
"loss": 0.0993,
"step": 5830
},
{
"epoch": 55.0,
"eval_LOCATION_f1": 0.7898089171974523,
"eval_LOCATION_number": 73,
"eval_LOCATION_precision": 0.7380952380952381,
"eval_LOCATION_recall": 0.8493150684931506,
"eval_ORGANIZATION_f1": 0.6540880503144655,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.5531914893617021,
"eval_ORGANIZATION_recall": 0.8,
"eval_PERSON_f1": 0.8761904761904761,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.8363636363636363,
"eval_PERSON_recall": 0.92,
"eval_QUANTITY_f1": 0.6470588235294118,
"eval_QUANTITY_number": 29,
"eval_QUANTITY_precision": 0.5641025641025641,
"eval_QUANTITY_recall": 0.7586206896551724,
"eval_TIME_f1": 0.7894736842105262,
"eval_TIME_number": 34,
"eval_TIME_precision": 0.7142857142857143,
"eval_TIME_recall": 0.8823529411764706,
"eval_loss": 0.1426202952861786,
"eval_overall_accuracy": 0.9539748953974896,
"eval_overall_f1": 0.7845161290322581,
"eval_overall_precision": 0.7169811320754716,
"eval_overall_recall": 0.8660968660968661,
"eval_runtime": 0.3722,
"eval_samples_per_second": 502.417,
"eval_steps_per_second": 8.06,
"step": 5830
},
{
"epoch": 56.0,
"grad_norm": 2.1034226417541504,
"learning_rate": 2.2000000000000003e-05,
"loss": 0.0987,
"step": 5936
},
{
"epoch": 56.0,
"eval_LOCATION_f1": 0.7749999999999999,
"eval_LOCATION_number": 73,
"eval_LOCATION_precision": 0.7126436781609196,
"eval_LOCATION_recall": 0.8493150684931506,
"eval_ORGANIZATION_f1": 0.6710526315789473,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.5862068965517241,
"eval_ORGANIZATION_recall": 0.7846153846153846,
"eval_PERSON_f1": 0.879746835443038,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.8373493975903614,
"eval_PERSON_recall": 0.9266666666666666,
"eval_QUANTITY_f1": 0.676923076923077,
"eval_QUANTITY_number": 29,
"eval_QUANTITY_precision": 0.6111111111111112,
"eval_QUANTITY_recall": 0.7586206896551724,
"eval_TIME_f1": 0.8,
"eval_TIME_number": 34,
"eval_TIME_precision": 0.7317073170731707,
"eval_TIME_recall": 0.8823529411764706,
"eval_loss": 0.1402589976787567,
"eval_overall_accuracy": 0.9547132660595619,
"eval_overall_f1": 0.7916666666666666,
"eval_overall_precision": 0.7290167865707434,
"eval_overall_recall": 0.8660968660968661,
"eval_runtime": 0.3796,
"eval_samples_per_second": 492.597,
"eval_steps_per_second": 7.903,
"step": 5936
},
{
"epoch": 57.0,
"grad_norm": 0.6643573641777039,
"learning_rate": 2.15e-05,
"loss": 0.0994,
"step": 6042
},
{
"epoch": 57.0,
"eval_LOCATION_f1": 0.7948717948717949,
"eval_LOCATION_number": 73,
"eval_LOCATION_precision": 0.7469879518072289,
"eval_LOCATION_recall": 0.8493150684931506,
"eval_ORGANIZATION_f1": 0.65,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.5473684210526316,
"eval_ORGANIZATION_recall": 0.8,
"eval_PERSON_f1": 0.8789808917197452,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.8414634146341463,
"eval_PERSON_recall": 0.92,
"eval_QUANTITY_f1": 0.6666666666666667,
"eval_QUANTITY_number": 29,
"eval_QUANTITY_precision": 0.5945945945945946,
"eval_QUANTITY_recall": 0.7586206896551724,
"eval_TIME_f1": 0.8,
"eval_TIME_number": 34,
"eval_TIME_precision": 0.7317073170731707,
"eval_TIME_recall": 0.8823529411764706,
"eval_loss": 0.14331957697868347,
"eval_overall_accuracy": 0.9529904011813931,
"eval_overall_f1": 0.788586251621271,
"eval_overall_precision": 0.7238095238095238,
"eval_overall_recall": 0.8660968660968661,
"eval_runtime": 0.3723,
"eval_samples_per_second": 502.313,
"eval_steps_per_second": 8.058,
"step": 6042
},
{
"epoch": 58.0,
"grad_norm": 0.6412150263786316,
"learning_rate": 2.1e-05,
"loss": 0.0975,
"step": 6148
},
{
"epoch": 58.0,
"eval_LOCATION_f1": 0.7898089171974523,
"eval_LOCATION_number": 73,
"eval_LOCATION_precision": 0.7380952380952381,
"eval_LOCATION_recall": 0.8493150684931506,
"eval_ORGANIZATION_f1": 0.6666666666666666,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.5714285714285714,
"eval_ORGANIZATION_recall": 0.8,
"eval_PERSON_f1": 0.8789808917197452,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.8414634146341463,
"eval_PERSON_recall": 0.92,
"eval_QUANTITY_f1": 0.676923076923077,
"eval_QUANTITY_number": 29,
"eval_QUANTITY_precision": 0.6111111111111112,
"eval_QUANTITY_recall": 0.7586206896551724,
"eval_TIME_f1": 0.8,
"eval_TIME_number": 34,
"eval_TIME_precision": 0.7317073170731707,
"eval_TIME_recall": 0.8823529411764706,
"eval_loss": 0.14041897654533386,
"eval_overall_accuracy": 0.9539748953974896,
"eval_overall_f1": 0.7926988265971318,
"eval_overall_precision": 0.7307692307692307,
"eval_overall_recall": 0.8660968660968661,
"eval_runtime": 0.3708,
"eval_samples_per_second": 504.287,
"eval_steps_per_second": 8.09,
"step": 6148
},
{
"epoch": 59.0,
"grad_norm": 1.8468962907791138,
"learning_rate": 2.05e-05,
"loss": 0.0976,
"step": 6254
},
{
"epoch": 59.0,
"eval_LOCATION_f1": 0.7770700636942677,
"eval_LOCATION_number": 73,
"eval_LOCATION_precision": 0.7261904761904762,
"eval_LOCATION_recall": 0.8356164383561644,
"eval_ORGANIZATION_f1": 0.6891891891891891,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.6144578313253012,
"eval_ORGANIZATION_recall": 0.7846153846153846,
"eval_PERSON_f1": 0.888178913738019,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.852760736196319,
"eval_PERSON_recall": 0.9266666666666666,
"eval_QUANTITY_f1": 0.6461538461538462,
"eval_QUANTITY_number": 29,
"eval_QUANTITY_precision": 0.5833333333333334,
"eval_QUANTITY_recall": 0.7241379310344828,
"eval_TIME_f1": 0.8266666666666665,
"eval_TIME_number": 34,
"eval_TIME_precision": 0.7560975609756098,
"eval_TIME_recall": 0.9117647058823529,
"eval_loss": 0.13591574132442474,
"eval_overall_accuracy": 0.9561900073837066,
"eval_overall_f1": 0.7994722955145119,
"eval_overall_precision": 0.7444717444717445,
"eval_overall_recall": 0.8632478632478633,
"eval_runtime": 0.3721,
"eval_samples_per_second": 502.524,
"eval_steps_per_second": 8.062,
"step": 6254
},
{
"epoch": 60.0,
"grad_norm": 1.731353998184204,
"learning_rate": 2e-05,
"loss": 0.0964,
"step": 6360
},
{
"epoch": 60.0,
"eval_LOCATION_f1": 0.7721518987341772,
"eval_LOCATION_number": 73,
"eval_LOCATION_precision": 0.7176470588235294,
"eval_LOCATION_recall": 0.8356164383561644,
"eval_ORGANIZATION_f1": 0.697986577181208,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.6190476190476191,
"eval_ORGANIZATION_recall": 0.8,
"eval_PERSON_f1": 0.8789808917197452,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.8414634146341463,
"eval_PERSON_recall": 0.92,
"eval_QUANTITY_f1": 0.6666666666666667,
"eval_QUANTITY_number": 29,
"eval_QUANTITY_precision": 0.5945945945945946,
"eval_QUANTITY_recall": 0.7586206896551724,
"eval_TIME_f1": 0.8,
"eval_TIME_number": 34,
"eval_TIME_precision": 0.7317073170731707,
"eval_TIME_recall": 0.8823529411764706,
"eval_loss": 0.1385490745306015,
"eval_overall_accuracy": 0.9556977602756583,
"eval_overall_f1": 0.7952755905511811,
"eval_overall_precision": 0.7372262773722628,
"eval_overall_recall": 0.8632478632478633,
"eval_runtime": 0.3703,
"eval_samples_per_second": 505.036,
"eval_steps_per_second": 8.102,
"step": 6360
},
{
"epoch": 61.0,
"grad_norm": 1.1987533569335938,
"learning_rate": 1.9500000000000003e-05,
"loss": 0.0954,
"step": 6466
},
{
"epoch": 61.0,
"eval_LOCATION_f1": 0.7770700636942677,
"eval_LOCATION_number": 73,
"eval_LOCATION_precision": 0.7261904761904762,
"eval_LOCATION_recall": 0.8356164383561644,
"eval_ORGANIZATION_f1": 0.697986577181208,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.6190476190476191,
"eval_ORGANIZATION_recall": 0.8,
"eval_PERSON_f1": 0.8717948717948718,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.8395061728395061,
"eval_PERSON_recall": 0.9066666666666666,
"eval_QUANTITY_f1": 0.676923076923077,
"eval_QUANTITY_number": 29,
"eval_QUANTITY_precision": 0.6111111111111112,
"eval_QUANTITY_recall": 0.7586206896551724,
"eval_TIME_f1": 0.8266666666666665,
"eval_TIME_number": 34,
"eval_TIME_precision": 0.7560975609756098,
"eval_TIME_recall": 0.9117647058823529,
"eval_loss": 0.135517880320549,
"eval_overall_accuracy": 0.9554516367216342,
"eval_overall_f1": 0.7968337730870712,
"eval_overall_precision": 0.742014742014742,
"eval_overall_recall": 0.8603988603988604,
"eval_runtime": 0.373,
"eval_samples_per_second": 501.389,
"eval_steps_per_second": 8.044,
"step": 6466
},
{
"epoch": 62.0,
"grad_norm": 4.096658706665039,
"learning_rate": 1.9e-05,
"loss": 0.0938,
"step": 6572
},
{
"epoch": 62.0,
"eval_LOCATION_f1": 0.7898089171974523,
"eval_LOCATION_number": 73,
"eval_LOCATION_precision": 0.7380952380952381,
"eval_LOCATION_recall": 0.8493150684931506,
"eval_ORGANIZATION_f1": 0.7172413793103448,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.65,
"eval_ORGANIZATION_recall": 0.8,
"eval_PERSON_f1": 0.8753993610223643,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.8404907975460123,
"eval_PERSON_recall": 0.9133333333333333,
"eval_QUANTITY_f1": 0.6666666666666667,
"eval_QUANTITY_number": 29,
"eval_QUANTITY_precision": 0.5945945945945946,
"eval_QUANTITY_recall": 0.7586206896551724,
"eval_TIME_f1": 0.8,
"eval_TIME_number": 34,
"eval_TIME_precision": 0.7317073170731707,
"eval_TIME_recall": 0.8823529411764706,
"eval_loss": 0.1392134130001068,
"eval_overall_accuracy": 0.9559438838296825,
"eval_overall_f1": 0.8015873015873016,
"eval_overall_precision": 0.7481481481481481,
"eval_overall_recall": 0.8632478632478633,
"eval_runtime": 0.3713,
"eval_samples_per_second": 503.603,
"eval_steps_per_second": 8.079,
"step": 6572
},
{
"epoch": 63.0,
"grad_norm": 3.0589916706085205,
"learning_rate": 1.85e-05,
"loss": 0.0935,
"step": 6678
},
{
"epoch": 63.0,
"eval_LOCATION_f1": 0.7898089171974523,
"eval_LOCATION_number": 73,
"eval_LOCATION_precision": 0.7380952380952381,
"eval_LOCATION_recall": 0.8493150684931506,
"eval_ORGANIZATION_f1": 0.6928104575163399,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.6022727272727273,
"eval_ORGANIZATION_recall": 0.8153846153846154,
"eval_PERSON_f1": 0.8698412698412699,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.8303030303030303,
"eval_PERSON_recall": 0.9133333333333333,
"eval_QUANTITY_f1": 0.676923076923077,
"eval_QUANTITY_number": 29,
"eval_QUANTITY_precision": 0.6111111111111112,
"eval_QUANTITY_recall": 0.7586206896551724,
"eval_TIME_f1": 0.7894736842105262,
"eval_TIME_number": 34,
"eval_TIME_precision": 0.7142857142857143,
"eval_TIME_recall": 0.8823529411764706,
"eval_loss": 0.14185936748981476,
"eval_overall_accuracy": 0.9542210189515137,
"eval_overall_f1": 0.7937336814621411,
"eval_overall_precision": 0.7325301204819277,
"eval_overall_recall": 0.8660968660968661,
"eval_runtime": 0.3743,
"eval_samples_per_second": 499.638,
"eval_steps_per_second": 8.016,
"step": 6678
},
{
"epoch": 64.0,
"grad_norm": 1.2135686874389648,
"learning_rate": 1.8e-05,
"loss": 0.0943,
"step": 6784
},
{
"epoch": 64.0,
"eval_LOCATION_f1": 0.7948717948717949,
"eval_LOCATION_number": 73,
"eval_LOCATION_precision": 0.7469879518072289,
"eval_LOCATION_recall": 0.8493150684931506,
"eval_ORGANIZATION_f1": 0.7172413793103448,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.65,
"eval_ORGANIZATION_recall": 0.8,
"eval_PERSON_f1": 0.879746835443038,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.8373493975903614,
"eval_PERSON_recall": 0.9266666666666666,
"eval_QUANTITY_f1": 0.676923076923077,
"eval_QUANTITY_number": 29,
"eval_QUANTITY_precision": 0.6111111111111112,
"eval_QUANTITY_recall": 0.7586206896551724,
"eval_TIME_f1": 0.8266666666666665,
"eval_TIME_number": 34,
"eval_TIME_precision": 0.7560975609756098,
"eval_TIME_recall": 0.9117647058823529,
"eval_loss": 0.13513682782649994,
"eval_overall_accuracy": 0.9571745015998031,
"eval_overall_f1": 0.8084544253632759,
"eval_overall_precision": 0.7536945812807881,
"eval_overall_recall": 0.8717948717948718,
"eval_runtime": 0.3734,
"eval_samples_per_second": 500.828,
"eval_steps_per_second": 8.035,
"step": 6784
},
{
"epoch": 65.0,
"grad_norm": 1.0723731517791748,
"learning_rate": 1.75e-05,
"loss": 0.093,
"step": 6890
},
{
"epoch": 65.0,
"eval_LOCATION_f1": 0.779874213836478,
"eval_LOCATION_number": 73,
"eval_LOCATION_precision": 0.7209302325581395,
"eval_LOCATION_recall": 0.8493150684931506,
"eval_ORGANIZATION_f1": 0.7210884353741497,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.6463414634146342,
"eval_ORGANIZATION_recall": 0.8153846153846154,
"eval_PERSON_f1": 0.8817891373801918,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.8466257668711656,
"eval_PERSON_recall": 0.92,
"eval_QUANTITY_f1": 0.6666666666666667,
"eval_QUANTITY_number": 29,
"eval_QUANTITY_precision": 0.5945945945945946,
"eval_QUANTITY_recall": 0.7586206896551724,
"eval_TIME_f1": 0.8,
"eval_TIME_number": 34,
"eval_TIME_precision": 0.7317073170731707,
"eval_TIME_recall": 0.8823529411764706,
"eval_loss": 0.137324720621109,
"eval_overall_accuracy": 0.9554516367216342,
"eval_overall_f1": 0.8026315789473685,
"eval_overall_precision": 0.7457212713936431,
"eval_overall_recall": 0.8689458689458689,
"eval_runtime": 0.3728,
"eval_samples_per_second": 501.578,
"eval_steps_per_second": 8.047,
"step": 6890
},
{
"epoch": 66.0,
"grad_norm": 0.8052380084991455,
"learning_rate": 1.7000000000000003e-05,
"loss": 0.0922,
"step": 6996
},
{
"epoch": 66.0,
"eval_LOCATION_f1": 0.8076923076923077,
"eval_LOCATION_number": 73,
"eval_LOCATION_precision": 0.7590361445783133,
"eval_LOCATION_recall": 0.863013698630137,
"eval_ORGANIZATION_f1": 0.7074829931972789,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.6341463414634146,
"eval_ORGANIZATION_recall": 0.8,
"eval_PERSON_f1": 0.8761904761904761,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.8363636363636363,
"eval_PERSON_recall": 0.92,
"eval_QUANTITY_f1": 0.676923076923077,
"eval_QUANTITY_number": 29,
"eval_QUANTITY_precision": 0.6111111111111112,
"eval_QUANTITY_recall": 0.7586206896551724,
"eval_TIME_f1": 0.8266666666666665,
"eval_TIME_number": 34,
"eval_TIME_precision": 0.7560975609756098,
"eval_TIME_recall": 0.9117647058823529,
"eval_loss": 0.13625451922416687,
"eval_overall_accuracy": 0.956928378045779,
"eval_overall_f1": 0.8073878627968336,
"eval_overall_precision": 0.7518427518427518,
"eval_overall_recall": 0.8717948717948718,
"eval_runtime": 0.3722,
"eval_samples_per_second": 502.355,
"eval_steps_per_second": 8.059,
"step": 6996
},
{
"epoch": 67.0,
"grad_norm": 1.3482667207717896,
"learning_rate": 1.65e-05,
"loss": 0.0912,
"step": 7102
},
{
"epoch": 67.0,
"eval_LOCATION_f1": 0.802547770700637,
"eval_LOCATION_number": 73,
"eval_LOCATION_precision": 0.75,
"eval_LOCATION_recall": 0.863013698630137,
"eval_ORGANIZATION_f1": 0.7210884353741497,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.6463414634146342,
"eval_ORGANIZATION_recall": 0.8153846153846154,
"eval_PERSON_f1": 0.8753993610223643,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.8404907975460123,
"eval_PERSON_recall": 0.9133333333333333,
"eval_QUANTITY_f1": 0.6666666666666667,
"eval_QUANTITY_number": 29,
"eval_QUANTITY_precision": 0.5945945945945946,
"eval_QUANTITY_recall": 0.7586206896551724,
"eval_TIME_f1": 0.8,
"eval_TIME_number": 34,
"eval_TIME_precision": 0.7317073170731707,
"eval_TIME_recall": 0.8823529411764706,
"eval_loss": 0.13759839534759521,
"eval_overall_accuracy": 0.9556977602756583,
"eval_overall_f1": 0.804749340369393,
"eval_overall_precision": 0.7493857493857494,
"eval_overall_recall": 0.8689458689458689,
"eval_runtime": 0.3726,
"eval_samples_per_second": 501.886,
"eval_steps_per_second": 8.052,
"step": 7102
},
{
"epoch": 68.0,
"grad_norm": 1.3148181438446045,
"learning_rate": 1.6000000000000003e-05,
"loss": 0.0908,
"step": 7208
},
{
"epoch": 68.0,
"eval_LOCATION_f1": 0.7898089171974523,
"eval_LOCATION_number": 73,
"eval_LOCATION_precision": 0.7380952380952381,
"eval_LOCATION_recall": 0.8493150684931506,
"eval_ORGANIZATION_f1": 0.7162162162162162,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.6385542168674698,
"eval_ORGANIZATION_recall": 0.8153846153846154,
"eval_PERSON_f1": 0.8810289389067525,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.8509316770186336,
"eval_PERSON_recall": 0.9133333333333333,
"eval_QUANTITY_f1": 0.6666666666666667,
"eval_QUANTITY_number": 29,
"eval_QUANTITY_precision": 0.5945945945945946,
"eval_QUANTITY_recall": 0.7586206896551724,
"eval_TIME_f1": 0.8,
"eval_TIME_number": 34,
"eval_TIME_precision": 0.7317073170731707,
"eval_TIME_recall": 0.8823529411764706,
"eval_loss": 0.13887125253677368,
"eval_overall_accuracy": 0.9559438838296825,
"eval_overall_f1": 0.8031704095112285,
"eval_overall_precision": 0.7487684729064039,
"eval_overall_recall": 0.8660968660968661,
"eval_runtime": 0.3725,
"eval_samples_per_second": 501.982,
"eval_steps_per_second": 8.053,
"step": 7208
},
{
"epoch": 69.0,
"grad_norm": 1.0154967308044434,
"learning_rate": 1.55e-05,
"loss": 0.0905,
"step": 7314
},
{
"epoch": 69.0,
"eval_LOCATION_f1": 0.7848101265822783,
"eval_LOCATION_number": 73,
"eval_LOCATION_precision": 0.7294117647058823,
"eval_LOCATION_recall": 0.8493150684931506,
"eval_ORGANIZATION_f1": 0.726027397260274,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.654320987654321,
"eval_ORGANIZATION_recall": 0.8153846153846154,
"eval_PERSON_f1": 0.8817891373801918,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.8466257668711656,
"eval_PERSON_recall": 0.92,
"eval_QUANTITY_f1": 0.6865671641791046,
"eval_QUANTITY_number": 29,
"eval_QUANTITY_precision": 0.6052631578947368,
"eval_QUANTITY_recall": 0.7931034482758621,
"eval_TIME_f1": 0.8,
"eval_TIME_number": 34,
"eval_TIME_precision": 0.7317073170731707,
"eval_TIME_recall": 0.8823529411764706,
"eval_loss": 0.1376219391822815,
"eval_overall_accuracy": 0.9564361309377307,
"eval_overall_f1": 0.8063241106719368,
"eval_overall_precision": 0.75,
"eval_overall_recall": 0.8717948717948718,
"eval_runtime": 0.3733,
"eval_samples_per_second": 500.988,
"eval_steps_per_second": 8.037,
"step": 7314
},
{
"epoch": 70.0,
"grad_norm": 1.1361740827560425,
"learning_rate": 1.5e-05,
"loss": 0.0913,
"step": 7420
},
{
"epoch": 70.0,
"eval_LOCATION_f1": 0.7999999999999999,
"eval_LOCATION_number": 73,
"eval_LOCATION_precision": 0.7560975609756098,
"eval_LOCATION_recall": 0.8493150684931506,
"eval_ORGANIZATION_f1": 0.6986301369863014,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.6296296296296297,
"eval_ORGANIZATION_recall": 0.7846153846153846,
"eval_PERSON_f1": 0.8761904761904761,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.8363636363636363,
"eval_PERSON_recall": 0.92,
"eval_QUANTITY_f1": 0.6461538461538462,
"eval_QUANTITY_number": 29,
"eval_QUANTITY_precision": 0.5833333333333334,
"eval_QUANTITY_recall": 0.7241379310344828,
"eval_TIME_f1": 0.8266666666666665,
"eval_TIME_number": 34,
"eval_TIME_precision": 0.7560975609756098,
"eval_TIME_recall": 0.9117647058823529,
"eval_loss": 0.13397939503192902,
"eval_overall_accuracy": 0.9564361309377307,
"eval_overall_f1": 0.8015873015873016,
"eval_overall_precision": 0.7481481481481481,
"eval_overall_recall": 0.8632478632478633,
"eval_runtime": 0.3748,
"eval_samples_per_second": 498.915,
"eval_steps_per_second": 8.004,
"step": 7420
},
{
"epoch": 71.0,
"grad_norm": 2.124069929122925,
"learning_rate": 1.45e-05,
"loss": 0.0916,
"step": 7526
},
{
"epoch": 71.0,
"eval_LOCATION_f1": 0.7898089171974523,
"eval_LOCATION_number": 73,
"eval_LOCATION_precision": 0.7380952380952381,
"eval_LOCATION_recall": 0.8493150684931506,
"eval_ORGANIZATION_f1": 0.7058823529411765,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.6136363636363636,
"eval_ORGANIZATION_recall": 0.8307692307692308,
"eval_PERSON_f1": 0.8817891373801918,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.8466257668711656,
"eval_PERSON_recall": 0.92,
"eval_QUANTITY_f1": 0.696969696969697,
"eval_QUANTITY_number": 29,
"eval_QUANTITY_precision": 0.6216216216216216,
"eval_QUANTITY_recall": 0.7931034482758621,
"eval_TIME_f1": 0.8266666666666665,
"eval_TIME_number": 34,
"eval_TIME_precision": 0.7560975609756098,
"eval_TIME_recall": 0.9117647058823529,
"eval_loss": 0.13961876928806305,
"eval_overall_accuracy": 0.9552055131676102,
"eval_overall_f1": 0.8062827225130891,
"eval_overall_precision": 0.7457627118644068,
"eval_overall_recall": 0.8774928774928775,
"eval_runtime": 0.3756,
"eval_samples_per_second": 497.843,
"eval_steps_per_second": 7.987,
"step": 7526
},
{
"epoch": 72.0,
"grad_norm": 0.8449153304100037,
"learning_rate": 1.4000000000000001e-05,
"loss": 0.0902,
"step": 7632
},
{
"epoch": 72.0,
"eval_LOCATION_f1": 0.7948717948717949,
"eval_LOCATION_number": 73,
"eval_LOCATION_precision": 0.7469879518072289,
"eval_LOCATION_recall": 0.8493150684931506,
"eval_ORGANIZATION_f1": 0.726027397260274,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.654320987654321,
"eval_ORGANIZATION_recall": 0.8153846153846154,
"eval_PERSON_f1": 0.8789808917197452,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.8414634146341463,
"eval_PERSON_recall": 0.92,
"eval_QUANTITY_f1": 0.676923076923077,
"eval_QUANTITY_number": 29,
"eval_QUANTITY_precision": 0.6111111111111112,
"eval_QUANTITY_recall": 0.7586206896551724,
"eval_TIME_f1": 0.8266666666666665,
"eval_TIME_number": 34,
"eval_TIME_precision": 0.7560975609756098,
"eval_TIME_recall": 0.9117647058823529,
"eval_loss": 0.13548322021961212,
"eval_overall_accuracy": 0.956928378045779,
"eval_overall_f1": 0.8095238095238095,
"eval_overall_precision": 0.7555555555555555,
"eval_overall_recall": 0.8717948717948718,
"eval_runtime": 0.3739,
"eval_samples_per_second": 500.097,
"eval_steps_per_second": 8.023,
"step": 7632
},
{
"epoch": 73.0,
"grad_norm": 0.425387978553772,
"learning_rate": 1.3500000000000001e-05,
"loss": 0.0912,
"step": 7738
},
{
"epoch": 73.0,
"eval_LOCATION_f1": 0.7898089171974523,
"eval_LOCATION_number": 73,
"eval_LOCATION_precision": 0.7380952380952381,
"eval_LOCATION_recall": 0.8493150684931506,
"eval_ORGANIZATION_f1": 0.726027397260274,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.654320987654321,
"eval_ORGANIZATION_recall": 0.8153846153846154,
"eval_PERSON_f1": 0.8817891373801918,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.8466257668711656,
"eval_PERSON_recall": 0.92,
"eval_QUANTITY_f1": 0.676923076923077,
"eval_QUANTITY_number": 29,
"eval_QUANTITY_precision": 0.6111111111111112,
"eval_QUANTITY_recall": 0.7586206896551724,
"eval_TIME_f1": 0.8266666666666665,
"eval_TIME_number": 34,
"eval_TIME_precision": 0.7560975609756098,
"eval_TIME_recall": 0.9117647058823529,
"eval_loss": 0.1355520486831665,
"eval_overall_accuracy": 0.9566822544917548,
"eval_overall_f1": 0.8095238095238095,
"eval_overall_precision": 0.7555555555555555,
"eval_overall_recall": 0.8717948717948718,
"eval_runtime": 0.3723,
"eval_samples_per_second": 502.274,
"eval_steps_per_second": 8.058,
"step": 7738
},
{
"epoch": 74.0,
"grad_norm": 1.236484408378601,
"learning_rate": 1.3000000000000001e-05,
"loss": 0.0892,
"step": 7844
},
{
"epoch": 74.0,
"eval_LOCATION_f1": 0.8076923076923077,
"eval_LOCATION_number": 73,
"eval_LOCATION_precision": 0.7590361445783133,
"eval_LOCATION_recall": 0.863013698630137,
"eval_ORGANIZATION_f1": 0.6901408450704226,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.6363636363636364,
"eval_ORGANIZATION_recall": 0.7538461538461538,
"eval_PERSON_f1": 0.8846153846153846,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.8518518518518519,
"eval_PERSON_recall": 0.92,
"eval_QUANTITY_f1": 0.6461538461538462,
"eval_QUANTITY_number": 29,
"eval_QUANTITY_precision": 0.5833333333333334,
"eval_QUANTITY_recall": 0.7241379310344828,
"eval_TIME_f1": 0.8266666666666665,
"eval_TIME_number": 34,
"eval_TIME_precision": 0.7560975609756098,
"eval_TIME_recall": 0.9117647058823529,
"eval_loss": 0.13207848370075226,
"eval_overall_accuracy": 0.9566822544917548,
"eval_overall_f1": 0.8053333333333333,
"eval_overall_precision": 0.7568922305764411,
"eval_overall_recall": 0.8603988603988604,
"eval_runtime": 0.3736,
"eval_samples_per_second": 500.6,
"eval_steps_per_second": 8.031,
"step": 7844
},
{
"epoch": 75.0,
"grad_norm": 0.7426979541778564,
"learning_rate": 1.25e-05,
"loss": 0.0895,
"step": 7950
},
{
"epoch": 75.0,
"eval_LOCATION_f1": 0.7948717948717949,
"eval_LOCATION_number": 73,
"eval_LOCATION_precision": 0.7469879518072289,
"eval_LOCATION_recall": 0.8493150684931506,
"eval_ORGANIZATION_f1": 0.7083333333333334,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.6455696202531646,
"eval_ORGANIZATION_recall": 0.7846153846153846,
"eval_PERSON_f1": 0.8817891373801918,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.8466257668711656,
"eval_PERSON_recall": 0.92,
"eval_QUANTITY_f1": 0.7076923076923076,
"eval_QUANTITY_number": 29,
"eval_QUANTITY_precision": 0.6388888888888888,
"eval_QUANTITY_recall": 0.7931034482758621,
"eval_TIME_f1": 0.8266666666666665,
"eval_TIME_number": 34,
"eval_TIME_precision": 0.7560975609756098,
"eval_TIME_recall": 0.9117647058823529,
"eval_loss": 0.1352306306362152,
"eval_overall_accuracy": 0.9561900073837066,
"eval_overall_f1": 0.8100929614873837,
"eval_overall_precision": 0.7587064676616916,
"eval_overall_recall": 0.8689458689458689,
"eval_runtime": 0.3733,
"eval_samples_per_second": 500.915,
"eval_steps_per_second": 8.036,
"step": 7950
},
{
"epoch": 76.0,
"grad_norm": 1.0712276697158813,
"learning_rate": 1.2e-05,
"loss": 0.0905,
"step": 8056
},
{
"epoch": 76.0,
"eval_LOCATION_f1": 0.7948717948717949,
"eval_LOCATION_number": 73,
"eval_LOCATION_precision": 0.7469879518072289,
"eval_LOCATION_recall": 0.8493150684931506,
"eval_ORGANIZATION_f1": 0.7172413793103448,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.65,
"eval_ORGANIZATION_recall": 0.8,
"eval_PERSON_f1": 0.8817891373801918,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.8466257668711656,
"eval_PERSON_recall": 0.92,
"eval_QUANTITY_f1": 0.6461538461538462,
"eval_QUANTITY_number": 29,
"eval_QUANTITY_precision": 0.5833333333333334,
"eval_QUANTITY_recall": 0.7241379310344828,
"eval_TIME_f1": 0.8266666666666665,
"eval_TIME_number": 34,
"eval_TIME_precision": 0.7560975609756098,
"eval_TIME_recall": 0.9117647058823529,
"eval_loss": 0.13476784527301788,
"eval_overall_accuracy": 0.9561900073837066,
"eval_overall_f1": 0.8063660477453581,
"eval_overall_precision": 0.7543424317617866,
"eval_overall_recall": 0.8660968660968661,
"eval_runtime": 0.3724,
"eval_samples_per_second": 502.104,
"eval_steps_per_second": 8.055,
"step": 8056
},
{
"epoch": 77.0,
"grad_norm": 8.184710502624512,
"learning_rate": 1.1500000000000002e-05,
"loss": 0.0895,
"step": 8162
},
{
"epoch": 77.0,
"eval_LOCATION_f1": 0.7948717948717949,
"eval_LOCATION_number": 73,
"eval_LOCATION_precision": 0.7469879518072289,
"eval_LOCATION_recall": 0.8493150684931506,
"eval_ORGANIZATION_f1": 0.7172413793103448,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.65,
"eval_ORGANIZATION_recall": 0.8,
"eval_PERSON_f1": 0.8846153846153846,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.8518518518518519,
"eval_PERSON_recall": 0.92,
"eval_QUANTITY_f1": 0.7076923076923076,
"eval_QUANTITY_number": 29,
"eval_QUANTITY_precision": 0.6388888888888888,
"eval_QUANTITY_recall": 0.7931034482758621,
"eval_TIME_f1": 0.8266666666666665,
"eval_TIME_number": 34,
"eval_TIME_precision": 0.7560975609756098,
"eval_TIME_recall": 0.9117647058823529,
"eval_loss": 0.13437636196613312,
"eval_overall_accuracy": 0.9571745015998031,
"eval_overall_f1": 0.8127490039840637,
"eval_overall_precision": 0.7611940298507462,
"eval_overall_recall": 0.8717948717948718,
"eval_runtime": 0.3737,
"eval_samples_per_second": 500.407,
"eval_steps_per_second": 8.028,
"step": 8162
},
{
"epoch": 78.0,
"grad_norm": 1.3736040592193604,
"learning_rate": 1.1000000000000001e-05,
"loss": 0.0882,
"step": 8268
},
{
"epoch": 78.0,
"eval_LOCATION_f1": 0.7948717948717949,
"eval_LOCATION_number": 73,
"eval_LOCATION_precision": 0.7469879518072289,
"eval_LOCATION_recall": 0.8493150684931506,
"eval_ORGANIZATION_f1": 0.726027397260274,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.654320987654321,
"eval_ORGANIZATION_recall": 0.8153846153846154,
"eval_PERSON_f1": 0.8846153846153846,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.8518518518518519,
"eval_PERSON_recall": 0.92,
"eval_QUANTITY_f1": 0.7076923076923076,
"eval_QUANTITY_number": 29,
"eval_QUANTITY_precision": 0.6388888888888888,
"eval_QUANTITY_recall": 0.7931034482758621,
"eval_TIME_f1": 0.8266666666666665,
"eval_TIME_number": 34,
"eval_TIME_precision": 0.7560975609756098,
"eval_TIME_recall": 0.9117647058823529,
"eval_loss": 0.13567619025707245,
"eval_overall_accuracy": 0.9574206251538272,
"eval_overall_f1": 0.8143236074270558,
"eval_overall_precision": 0.7617866004962779,
"eval_overall_recall": 0.8746438746438746,
"eval_runtime": 0.3727,
"eval_samples_per_second": 501.707,
"eval_steps_per_second": 8.049,
"step": 8268
},
{
"epoch": 79.0,
"grad_norm": 0.9239408373832703,
"learning_rate": 1.05e-05,
"loss": 0.0877,
"step": 8374
},
{
"epoch": 79.0,
"eval_LOCATION_f1": 0.7898089171974523,
"eval_LOCATION_number": 73,
"eval_LOCATION_precision": 0.7380952380952381,
"eval_LOCATION_recall": 0.8493150684931506,
"eval_ORGANIZATION_f1": 0.7320261437908497,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.6363636363636364,
"eval_ORGANIZATION_recall": 0.8615384615384616,
"eval_PERSON_f1": 0.8789808917197452,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.8414634146341463,
"eval_PERSON_recall": 0.92,
"eval_QUANTITY_f1": 0.696969696969697,
"eval_QUANTITY_number": 29,
"eval_QUANTITY_precision": 0.6216216216216216,
"eval_QUANTITY_recall": 0.7931034482758621,
"eval_TIME_f1": 0.8,
"eval_TIME_number": 34,
"eval_TIME_precision": 0.7317073170731707,
"eval_TIME_recall": 0.8823529411764706,
"eval_loss": 0.1406855285167694,
"eval_overall_accuracy": 0.9561900073837066,
"eval_overall_f1": 0.807843137254902,
"eval_overall_precision": 0.7463768115942029,
"eval_overall_recall": 0.8803418803418803,
"eval_runtime": 0.3738,
"eval_samples_per_second": 500.304,
"eval_steps_per_second": 8.026,
"step": 8374
},
{
"epoch": 80.0,
"grad_norm": 0.7240285873413086,
"learning_rate": 1e-05,
"loss": 0.0876,
"step": 8480
},
{
"epoch": 80.0,
"eval_LOCATION_f1": 0.7948717948717949,
"eval_LOCATION_number": 73,
"eval_LOCATION_precision": 0.7469879518072289,
"eval_LOCATION_recall": 0.8493150684931506,
"eval_ORGANIZATION_f1": 0.7297297297297298,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.6506024096385542,
"eval_ORGANIZATION_recall": 0.8307692307692308,
"eval_PERSON_f1": 0.8789808917197452,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.8414634146341463,
"eval_PERSON_recall": 0.92,
"eval_QUANTITY_f1": 0.7076923076923076,
"eval_QUANTITY_number": 29,
"eval_QUANTITY_precision": 0.6388888888888888,
"eval_QUANTITY_recall": 0.7931034482758621,
"eval_TIME_f1": 0.8,
"eval_TIME_number": 34,
"eval_TIME_precision": 0.7317073170731707,
"eval_TIME_recall": 0.8823529411764706,
"eval_loss": 0.13832524418830872,
"eval_overall_accuracy": 0.9561900073837066,
"eval_overall_f1": 0.8100263852242744,
"eval_overall_precision": 0.7542997542997543,
"eval_overall_recall": 0.8746438746438746,
"eval_runtime": 0.3732,
"eval_samples_per_second": 501.071,
"eval_steps_per_second": 8.039,
"step": 8480
},
{
"epoch": 81.0,
"grad_norm": 0.5305002331733704,
"learning_rate": 9.5e-06,
"loss": 0.0865,
"step": 8586
},
{
"epoch": 81.0,
"eval_LOCATION_f1": 0.7948717948717949,
"eval_LOCATION_number": 73,
"eval_LOCATION_precision": 0.7469879518072289,
"eval_LOCATION_recall": 0.8493150684931506,
"eval_ORGANIZATION_f1": 0.7346938775510204,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.6585365853658537,
"eval_ORGANIZATION_recall": 0.8307692307692308,
"eval_PERSON_f1": 0.8846153846153846,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.8518518518518519,
"eval_PERSON_recall": 0.92,
"eval_QUANTITY_f1": 0.7076923076923076,
"eval_QUANTITY_number": 29,
"eval_QUANTITY_precision": 0.6388888888888888,
"eval_QUANTITY_recall": 0.7931034482758621,
"eval_TIME_f1": 0.8266666666666665,
"eval_TIME_number": 34,
"eval_TIME_precision": 0.7560975609756098,
"eval_TIME_recall": 0.9117647058823529,
"eval_loss": 0.13635414838790894,
"eval_overall_accuracy": 0.9571745015998031,
"eval_overall_f1": 0.8158940397350993,
"eval_overall_precision": 0.7623762376237624,
"eval_overall_recall": 0.8774928774928775,
"eval_runtime": 0.376,
"eval_samples_per_second": 497.277,
"eval_steps_per_second": 7.978,
"step": 8586
},
{
"epoch": 82.0,
"grad_norm": 1.9057809114456177,
"learning_rate": 9e-06,
"loss": 0.0882,
"step": 8692
},
{
"epoch": 82.0,
"eval_LOCATION_f1": 0.7948717948717949,
"eval_LOCATION_number": 73,
"eval_LOCATION_precision": 0.7469879518072289,
"eval_LOCATION_recall": 0.8493150684931506,
"eval_ORGANIZATION_f1": 0.7297297297297298,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.6506024096385542,
"eval_ORGANIZATION_recall": 0.8307692307692308,
"eval_PERSON_f1": 0.8846153846153846,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.8518518518518519,
"eval_PERSON_recall": 0.92,
"eval_QUANTITY_f1": 0.7076923076923076,
"eval_QUANTITY_number": 29,
"eval_QUANTITY_precision": 0.6388888888888888,
"eval_QUANTITY_recall": 0.7931034482758621,
"eval_TIME_f1": 0.8266666666666665,
"eval_TIME_number": 34,
"eval_TIME_precision": 0.7560975609756098,
"eval_TIME_recall": 0.9117647058823529,
"eval_loss": 0.13461817800998688,
"eval_overall_accuracy": 0.9571745015998031,
"eval_overall_f1": 0.8148148148148149,
"eval_overall_precision": 0.7604938271604939,
"eval_overall_recall": 0.8774928774928775,
"eval_runtime": 0.3748,
"eval_samples_per_second": 498.989,
"eval_steps_per_second": 8.005,
"step": 8692
},
{
"epoch": 83.0,
"grad_norm": 1.2383646965026855,
"learning_rate": 8.500000000000002e-06,
"loss": 0.0868,
"step": 8798
},
{
"epoch": 83.0,
"eval_LOCATION_f1": 0.7898089171974523,
"eval_LOCATION_number": 73,
"eval_LOCATION_precision": 0.7380952380952381,
"eval_LOCATION_recall": 0.8493150684931506,
"eval_ORGANIZATION_f1": 0.7346938775510204,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.6585365853658537,
"eval_ORGANIZATION_recall": 0.8307692307692308,
"eval_PERSON_f1": 0.8789808917197452,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.8414634146341463,
"eval_PERSON_recall": 0.92,
"eval_QUANTITY_f1": 0.7076923076923076,
"eval_QUANTITY_number": 29,
"eval_QUANTITY_precision": 0.6388888888888888,
"eval_QUANTITY_recall": 0.7931034482758621,
"eval_TIME_f1": 0.8266666666666665,
"eval_TIME_number": 34,
"eval_TIME_precision": 0.7560975609756098,
"eval_TIME_recall": 0.9117647058823529,
"eval_loss": 0.13708707690238953,
"eval_overall_accuracy": 0.956928378045779,
"eval_overall_f1": 0.8126649076517152,
"eval_overall_precision": 0.7567567567567568,
"eval_overall_recall": 0.8774928774928775,
"eval_runtime": 0.3728,
"eval_samples_per_second": 501.629,
"eval_steps_per_second": 8.048,
"step": 8798
},
{
"epoch": 84.0,
"grad_norm": 1.3145028352737427,
"learning_rate": 8.000000000000001e-06,
"loss": 0.0884,
"step": 8904
},
{
"epoch": 84.0,
"eval_LOCATION_f1": 0.7898089171974523,
"eval_LOCATION_number": 73,
"eval_LOCATION_precision": 0.7380952380952381,
"eval_LOCATION_recall": 0.8493150684931506,
"eval_ORGANIZATION_f1": 0.7346938775510204,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.6585365853658537,
"eval_ORGANIZATION_recall": 0.8307692307692308,
"eval_PERSON_f1": 0.8846153846153846,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.8518518518518519,
"eval_PERSON_recall": 0.92,
"eval_QUANTITY_f1": 0.7076923076923076,
"eval_QUANTITY_number": 29,
"eval_QUANTITY_precision": 0.6388888888888888,
"eval_QUANTITY_recall": 0.7931034482758621,
"eval_TIME_f1": 0.8266666666666665,
"eval_TIME_number": 34,
"eval_TIME_precision": 0.7560975609756098,
"eval_TIME_recall": 0.9117647058823529,
"eval_loss": 0.13608714938163757,
"eval_overall_accuracy": 0.9574206251538272,
"eval_overall_f1": 0.8148148148148149,
"eval_overall_precision": 0.7604938271604939,
"eval_overall_recall": 0.8774928774928775,
"eval_runtime": 0.3781,
"eval_samples_per_second": 494.604,
"eval_steps_per_second": 7.935,
"step": 8904
},
{
"epoch": 85.0,
"grad_norm": 3.6917648315429688,
"learning_rate": 7.5e-06,
"loss": 0.088,
"step": 9010
},
{
"epoch": 85.0,
"eval_LOCATION_f1": 0.7948717948717949,
"eval_LOCATION_number": 73,
"eval_LOCATION_precision": 0.7469879518072289,
"eval_LOCATION_recall": 0.8493150684931506,
"eval_ORGANIZATION_f1": 0.7346938775510204,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.6585365853658537,
"eval_ORGANIZATION_recall": 0.8307692307692308,
"eval_PERSON_f1": 0.8817891373801918,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.8466257668711656,
"eval_PERSON_recall": 0.92,
"eval_QUANTITY_f1": 0.676923076923077,
"eval_QUANTITY_number": 29,
"eval_QUANTITY_precision": 0.6111111111111112,
"eval_QUANTITY_recall": 0.7586206896551724,
"eval_TIME_f1": 0.8266666666666665,
"eval_TIME_number": 34,
"eval_TIME_precision": 0.7560975609756098,
"eval_TIME_recall": 0.9117647058823529,
"eval_loss": 0.13677531480789185,
"eval_overall_accuracy": 0.9571745015998031,
"eval_overall_f1": 0.8121693121693121,
"eval_overall_precision": 0.7580246913580246,
"eval_overall_recall": 0.8746438746438746,
"eval_runtime": 0.3775,
"eval_samples_per_second": 495.354,
"eval_steps_per_second": 7.947,
"step": 9010
},
{
"epoch": 86.0,
"grad_norm": 0.643048107624054,
"learning_rate": 7.000000000000001e-06,
"loss": 0.0869,
"step": 9116
},
{
"epoch": 86.0,
"eval_LOCATION_f1": 0.7948717948717949,
"eval_LOCATION_number": 73,
"eval_LOCATION_precision": 0.7469879518072289,
"eval_LOCATION_recall": 0.8493150684931506,
"eval_ORGANIZATION_f1": 0.726027397260274,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.654320987654321,
"eval_ORGANIZATION_recall": 0.8153846153846154,
"eval_PERSON_f1": 0.8817891373801918,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.8466257668711656,
"eval_PERSON_recall": 0.92,
"eval_QUANTITY_f1": 0.7076923076923076,
"eval_QUANTITY_number": 29,
"eval_QUANTITY_precision": 0.6388888888888888,
"eval_QUANTITY_recall": 0.7931034482758621,
"eval_TIME_f1": 0.8266666666666665,
"eval_TIME_number": 34,
"eval_TIME_precision": 0.7560975609756098,
"eval_TIME_recall": 0.9117647058823529,
"eval_loss": 0.1348443627357483,
"eval_overall_accuracy": 0.9574206251538272,
"eval_overall_f1": 0.8132450331125828,
"eval_overall_precision": 0.7599009900990099,
"eval_overall_recall": 0.8746438746438746,
"eval_runtime": 0.3768,
"eval_samples_per_second": 496.319,
"eval_steps_per_second": 7.962,
"step": 9116
},
{
"epoch": 87.0,
"grad_norm": 0.7794643044471741,
"learning_rate": 6.5000000000000004e-06,
"loss": 0.0861,
"step": 9222
},
{
"epoch": 87.0,
"eval_LOCATION_f1": 0.7948717948717949,
"eval_LOCATION_number": 73,
"eval_LOCATION_precision": 0.7469879518072289,
"eval_LOCATION_recall": 0.8493150684931506,
"eval_ORGANIZATION_f1": 0.7397260273972603,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.6666666666666666,
"eval_ORGANIZATION_recall": 0.8307692307692308,
"eval_PERSON_f1": 0.8817891373801918,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.8466257668711656,
"eval_PERSON_recall": 0.92,
"eval_QUANTITY_f1": 0.7076923076923076,
"eval_QUANTITY_number": 29,
"eval_QUANTITY_precision": 0.6388888888888888,
"eval_QUANTITY_recall": 0.7931034482758621,
"eval_TIME_f1": 0.8266666666666665,
"eval_TIME_number": 34,
"eval_TIME_precision": 0.7560975609756098,
"eval_TIME_recall": 0.9117647058823529,
"eval_loss": 0.1349503993988037,
"eval_overall_accuracy": 0.9576667487078513,
"eval_overall_f1": 0.8158940397350993,
"eval_overall_precision": 0.7623762376237624,
"eval_overall_recall": 0.8774928774928775,
"eval_runtime": 0.3735,
"eval_samples_per_second": 500.607,
"eval_steps_per_second": 8.031,
"step": 9222
},
{
"epoch": 88.0,
"grad_norm": 0.9696281552314758,
"learning_rate": 6e-06,
"loss": 0.0853,
"step": 9328
},
{
"epoch": 88.0,
"eval_LOCATION_f1": 0.7948717948717949,
"eval_LOCATION_number": 73,
"eval_LOCATION_precision": 0.7469879518072289,
"eval_LOCATION_recall": 0.8493150684931506,
"eval_ORGANIZATION_f1": 0.7397260273972603,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.6666666666666666,
"eval_ORGANIZATION_recall": 0.8307692307692308,
"eval_PERSON_f1": 0.8817891373801918,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.8466257668711656,
"eval_PERSON_recall": 0.92,
"eval_QUANTITY_f1": 0.7076923076923076,
"eval_QUANTITY_number": 29,
"eval_QUANTITY_precision": 0.6388888888888888,
"eval_QUANTITY_recall": 0.7931034482758621,
"eval_TIME_f1": 0.8266666666666665,
"eval_TIME_number": 34,
"eval_TIME_precision": 0.7560975609756098,
"eval_TIME_recall": 0.9117647058823529,
"eval_loss": 0.1358775496482849,
"eval_overall_accuracy": 0.9571745015998031,
"eval_overall_f1": 0.8158940397350993,
"eval_overall_precision": 0.7623762376237624,
"eval_overall_recall": 0.8774928774928775,
"eval_runtime": 0.3762,
"eval_samples_per_second": 497.14,
"eval_steps_per_second": 7.976,
"step": 9328
},
{
"epoch": 89.0,
"grad_norm": 1.8147895336151123,
"learning_rate": 5.500000000000001e-06,
"loss": 0.0873,
"step": 9434
},
{
"epoch": 89.0,
"eval_LOCATION_f1": 0.7948717948717949,
"eval_LOCATION_number": 73,
"eval_LOCATION_precision": 0.7469879518072289,
"eval_LOCATION_recall": 0.8493150684931506,
"eval_ORGANIZATION_f1": 0.7397260273972603,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.6666666666666666,
"eval_ORGANIZATION_recall": 0.8307692307692308,
"eval_PERSON_f1": 0.8846153846153846,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.8518518518518519,
"eval_PERSON_recall": 0.92,
"eval_QUANTITY_f1": 0.7076923076923076,
"eval_QUANTITY_number": 29,
"eval_QUANTITY_precision": 0.6388888888888888,
"eval_QUANTITY_recall": 0.7931034482758621,
"eval_TIME_f1": 0.8266666666666665,
"eval_TIME_number": 34,
"eval_TIME_precision": 0.7560975609756098,
"eval_TIME_recall": 0.9117647058823529,
"eval_loss": 0.1357378214597702,
"eval_overall_accuracy": 0.9574206251538272,
"eval_overall_f1": 0.8169761273209548,
"eval_overall_precision": 0.7642679900744417,
"eval_overall_recall": 0.8774928774928775,
"eval_runtime": 0.3747,
"eval_samples_per_second": 499.024,
"eval_steps_per_second": 8.006,
"step": 9434
},
{
"epoch": 90.0,
"grad_norm": 1.6982191801071167,
"learning_rate": 5e-06,
"loss": 0.0869,
"step": 9540
},
{
"epoch": 90.0,
"eval_LOCATION_f1": 0.7948717948717949,
"eval_LOCATION_number": 73,
"eval_LOCATION_precision": 0.7469879518072289,
"eval_LOCATION_recall": 0.8493150684931506,
"eval_ORGANIZATION_f1": 0.7397260273972603,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.6666666666666666,
"eval_ORGANIZATION_recall": 0.8307692307692308,
"eval_PERSON_f1": 0.8846153846153846,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.8518518518518519,
"eval_PERSON_recall": 0.92,
"eval_QUANTITY_f1": 0.7076923076923076,
"eval_QUANTITY_number": 29,
"eval_QUANTITY_precision": 0.6388888888888888,
"eval_QUANTITY_recall": 0.7931034482758621,
"eval_TIME_f1": 0.8266666666666665,
"eval_TIME_number": 34,
"eval_TIME_precision": 0.7560975609756098,
"eval_TIME_recall": 0.9117647058823529,
"eval_loss": 0.13445889949798584,
"eval_overall_accuracy": 0.9576667487078513,
"eval_overall_f1": 0.8169761273209548,
"eval_overall_precision": 0.7642679900744417,
"eval_overall_recall": 0.8774928774928775,
"eval_runtime": 0.3744,
"eval_samples_per_second": 499.404,
"eval_steps_per_second": 8.012,
"step": 9540
},
{
"epoch": 91.0,
"grad_norm": 1.2758022546768188,
"learning_rate": 4.5e-06,
"loss": 0.0855,
"step": 9646
},
{
"epoch": 91.0,
"eval_LOCATION_f1": 0.7948717948717949,
"eval_LOCATION_number": 73,
"eval_LOCATION_precision": 0.7469879518072289,
"eval_LOCATION_recall": 0.8493150684931506,
"eval_ORGANIZATION_f1": 0.7248322147651007,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.6428571428571429,
"eval_ORGANIZATION_recall": 0.8307692307692308,
"eval_PERSON_f1": 0.8846153846153846,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.8518518518518519,
"eval_PERSON_recall": 0.92,
"eval_QUANTITY_f1": 0.7076923076923076,
"eval_QUANTITY_number": 29,
"eval_QUANTITY_precision": 0.6388888888888888,
"eval_QUANTITY_recall": 0.7931034482758621,
"eval_TIME_f1": 0.8266666666666665,
"eval_TIME_number": 34,
"eval_TIME_precision": 0.7560975609756098,
"eval_TIME_recall": 0.9117647058823529,
"eval_loss": 0.13598185777664185,
"eval_overall_accuracy": 0.9566822544917548,
"eval_overall_f1": 0.8137384412153237,
"eval_overall_precision": 0.7586206896551724,
"eval_overall_recall": 0.8774928774928775,
"eval_runtime": 0.3733,
"eval_samples_per_second": 500.966,
"eval_steps_per_second": 8.037,
"step": 9646
},
{
"epoch": 92.0,
"grad_norm": 1.1231157779693604,
"learning_rate": 4.000000000000001e-06,
"loss": 0.0863,
"step": 9752
},
{
"epoch": 92.0,
"eval_LOCATION_f1": 0.7948717948717949,
"eval_LOCATION_number": 73,
"eval_LOCATION_precision": 0.7469879518072289,
"eval_LOCATION_recall": 0.8493150684931506,
"eval_ORGANIZATION_f1": 0.7346938775510204,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.6585365853658537,
"eval_ORGANIZATION_recall": 0.8307692307692308,
"eval_PERSON_f1": 0.8846153846153846,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.8518518518518519,
"eval_PERSON_recall": 0.92,
"eval_QUANTITY_f1": 0.7076923076923076,
"eval_QUANTITY_number": 29,
"eval_QUANTITY_precision": 0.6388888888888888,
"eval_QUANTITY_recall": 0.7931034482758621,
"eval_TIME_f1": 0.8266666666666665,
"eval_TIME_number": 34,
"eval_TIME_precision": 0.7560975609756098,
"eval_TIME_recall": 0.9117647058823529,
"eval_loss": 0.13555923104286194,
"eval_overall_accuracy": 0.9571745015998031,
"eval_overall_f1": 0.8158940397350993,
"eval_overall_precision": 0.7623762376237624,
"eval_overall_recall": 0.8774928774928775,
"eval_runtime": 0.3733,
"eval_samples_per_second": 500.907,
"eval_steps_per_second": 8.036,
"step": 9752
},
{
"epoch": 93.0,
"grad_norm": 3.048227071762085,
"learning_rate": 3.5000000000000004e-06,
"loss": 0.0858,
"step": 9858
},
{
"epoch": 93.0,
"eval_LOCATION_f1": 0.7948717948717949,
"eval_LOCATION_number": 73,
"eval_LOCATION_precision": 0.7469879518072289,
"eval_LOCATION_recall": 0.8493150684931506,
"eval_ORGANIZATION_f1": 0.7397260273972603,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.6666666666666666,
"eval_ORGANIZATION_recall": 0.8307692307692308,
"eval_PERSON_f1": 0.8817891373801918,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.8466257668711656,
"eval_PERSON_recall": 0.92,
"eval_QUANTITY_f1": 0.7076923076923076,
"eval_QUANTITY_number": 29,
"eval_QUANTITY_precision": 0.6388888888888888,
"eval_QUANTITY_recall": 0.7931034482758621,
"eval_TIME_f1": 0.8266666666666665,
"eval_TIME_number": 34,
"eval_TIME_precision": 0.7560975609756098,
"eval_TIME_recall": 0.9117647058823529,
"eval_loss": 0.13597699999809265,
"eval_overall_accuracy": 0.9571745015998031,
"eval_overall_f1": 0.8158940397350993,
"eval_overall_precision": 0.7623762376237624,
"eval_overall_recall": 0.8774928774928775,
"eval_runtime": 0.3756,
"eval_samples_per_second": 497.847,
"eval_steps_per_second": 7.987,
"step": 9858
},
{
"epoch": 94.0,
"grad_norm": 1.3223367929458618,
"learning_rate": 3e-06,
"loss": 0.0857,
"step": 9964
},
{
"epoch": 94.0,
"eval_LOCATION_f1": 0.7948717948717949,
"eval_LOCATION_number": 73,
"eval_LOCATION_precision": 0.7469879518072289,
"eval_LOCATION_recall": 0.8493150684931506,
"eval_ORGANIZATION_f1": 0.7397260273972603,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.6666666666666666,
"eval_ORGANIZATION_recall": 0.8307692307692308,
"eval_PERSON_f1": 0.8846153846153846,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.8518518518518519,
"eval_PERSON_recall": 0.92,
"eval_QUANTITY_f1": 0.7076923076923076,
"eval_QUANTITY_number": 29,
"eval_QUANTITY_precision": 0.6388888888888888,
"eval_QUANTITY_recall": 0.7931034482758621,
"eval_TIME_f1": 0.8266666666666665,
"eval_TIME_number": 34,
"eval_TIME_precision": 0.7560975609756098,
"eval_TIME_recall": 0.9117647058823529,
"eval_loss": 0.13530442118644714,
"eval_overall_accuracy": 0.9574206251538272,
"eval_overall_f1": 0.8169761273209548,
"eval_overall_precision": 0.7642679900744417,
"eval_overall_recall": 0.8774928774928775,
"eval_runtime": 0.3728,
"eval_samples_per_second": 501.55,
"eval_steps_per_second": 8.046,
"step": 9964
},
{
"epoch": 95.0,
"grad_norm": 2.3395557403564453,
"learning_rate": 2.5e-06,
"loss": 0.0862,
"step": 10070
},
{
"epoch": 95.0,
"eval_LOCATION_f1": 0.7948717948717949,
"eval_LOCATION_number": 73,
"eval_LOCATION_precision": 0.7469879518072289,
"eval_LOCATION_recall": 0.8493150684931506,
"eval_ORGANIZATION_f1": 0.7397260273972603,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.6666666666666666,
"eval_ORGANIZATION_recall": 0.8307692307692308,
"eval_PERSON_f1": 0.8817891373801918,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.8466257668711656,
"eval_PERSON_recall": 0.92,
"eval_QUANTITY_f1": 0.676923076923077,
"eval_QUANTITY_number": 29,
"eval_QUANTITY_precision": 0.6111111111111112,
"eval_QUANTITY_recall": 0.7586206896551724,
"eval_TIME_f1": 0.8266666666666665,
"eval_TIME_number": 34,
"eval_TIME_precision": 0.7560975609756098,
"eval_TIME_recall": 0.9117647058823529,
"eval_loss": 0.1362064629793167,
"eval_overall_accuracy": 0.956928378045779,
"eval_overall_f1": 0.8132450331125828,
"eval_overall_precision": 0.7599009900990099,
"eval_overall_recall": 0.8746438746438746,
"eval_runtime": 0.3718,
"eval_samples_per_second": 502.962,
"eval_steps_per_second": 8.069,
"step": 10070
},
{
"epoch": 96.0,
"grad_norm": 1.0705591440200806,
"learning_rate": 2.0000000000000003e-06,
"loss": 0.0864,
"step": 10176
},
{
"epoch": 96.0,
"eval_LOCATION_f1": 0.7948717948717949,
"eval_LOCATION_number": 73,
"eval_LOCATION_precision": 0.7469879518072289,
"eval_LOCATION_recall": 0.8493150684931506,
"eval_ORGANIZATION_f1": 0.7397260273972603,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.6666666666666666,
"eval_ORGANIZATION_recall": 0.8307692307692308,
"eval_PERSON_f1": 0.8817891373801918,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.8466257668711656,
"eval_PERSON_recall": 0.92,
"eval_QUANTITY_f1": 0.676923076923077,
"eval_QUANTITY_number": 29,
"eval_QUANTITY_precision": 0.6111111111111112,
"eval_QUANTITY_recall": 0.7586206896551724,
"eval_TIME_f1": 0.8266666666666665,
"eval_TIME_number": 34,
"eval_TIME_precision": 0.7560975609756098,
"eval_TIME_recall": 0.9117647058823529,
"eval_loss": 0.13568849861621857,
"eval_overall_accuracy": 0.9566822544917548,
"eval_overall_f1": 0.8132450331125828,
"eval_overall_precision": 0.7599009900990099,
"eval_overall_recall": 0.8746438746438746,
"eval_runtime": 0.3725,
"eval_samples_per_second": 502.042,
"eval_steps_per_second": 8.054,
"step": 10176
},
{
"epoch": 97.0,
"grad_norm": 0.9012406468391418,
"learning_rate": 1.5e-06,
"loss": 0.0849,
"step": 10282
},
{
"epoch": 97.0,
"eval_LOCATION_f1": 0.7948717948717949,
"eval_LOCATION_number": 73,
"eval_LOCATION_precision": 0.7469879518072289,
"eval_LOCATION_recall": 0.8493150684931506,
"eval_ORGANIZATION_f1": 0.7397260273972603,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.6666666666666666,
"eval_ORGANIZATION_recall": 0.8307692307692308,
"eval_PERSON_f1": 0.8817891373801918,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.8466257668711656,
"eval_PERSON_recall": 0.92,
"eval_QUANTITY_f1": 0.676923076923077,
"eval_QUANTITY_number": 29,
"eval_QUANTITY_precision": 0.6111111111111112,
"eval_QUANTITY_recall": 0.7586206896551724,
"eval_TIME_f1": 0.8266666666666665,
"eval_TIME_number": 34,
"eval_TIME_precision": 0.7560975609756098,
"eval_TIME_recall": 0.9117647058823529,
"eval_loss": 0.13571688532829285,
"eval_overall_accuracy": 0.9566822544917548,
"eval_overall_f1": 0.8132450331125828,
"eval_overall_precision": 0.7599009900990099,
"eval_overall_recall": 0.8746438746438746,
"eval_runtime": 0.3741,
"eval_samples_per_second": 499.84,
"eval_steps_per_second": 8.019,
"step": 10282
},
{
"epoch": 98.0,
"grad_norm": 0.9204326868057251,
"learning_rate": 1.0000000000000002e-06,
"loss": 0.0836,
"step": 10388
},
{
"epoch": 98.0,
"eval_LOCATION_f1": 0.7948717948717949,
"eval_LOCATION_number": 73,
"eval_LOCATION_precision": 0.7469879518072289,
"eval_LOCATION_recall": 0.8493150684931506,
"eval_ORGANIZATION_f1": 0.7397260273972603,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.6666666666666666,
"eval_ORGANIZATION_recall": 0.8307692307692308,
"eval_PERSON_f1": 0.8817891373801918,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.8466257668711656,
"eval_PERSON_recall": 0.92,
"eval_QUANTITY_f1": 0.676923076923077,
"eval_QUANTITY_number": 29,
"eval_QUANTITY_precision": 0.6111111111111112,
"eval_QUANTITY_recall": 0.7586206896551724,
"eval_TIME_f1": 0.8,
"eval_TIME_number": 34,
"eval_TIME_precision": 0.7317073170731707,
"eval_TIME_recall": 0.8823529411764706,
"eval_loss": 0.13613446056842804,
"eval_overall_accuracy": 0.9564361309377307,
"eval_overall_f1": 0.8105960264900662,
"eval_overall_precision": 0.7574257425742574,
"eval_overall_recall": 0.8717948717948718,
"eval_runtime": 0.3746,
"eval_samples_per_second": 499.155,
"eval_steps_per_second": 8.008,
"step": 10388
},
{
"epoch": 99.0,
"grad_norm": 1.0252379179000854,
"learning_rate": 5.000000000000001e-07,
"loss": 0.0831,
"step": 10494
},
{
"epoch": 99.0,
"eval_LOCATION_f1": 0.7948717948717949,
"eval_LOCATION_number": 73,
"eval_LOCATION_precision": 0.7469879518072289,
"eval_LOCATION_recall": 0.8493150684931506,
"eval_ORGANIZATION_f1": 0.7397260273972603,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.6666666666666666,
"eval_ORGANIZATION_recall": 0.8307692307692308,
"eval_PERSON_f1": 0.8817891373801918,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.8466257668711656,
"eval_PERSON_recall": 0.92,
"eval_QUANTITY_f1": 0.676923076923077,
"eval_QUANTITY_number": 29,
"eval_QUANTITY_precision": 0.6111111111111112,
"eval_QUANTITY_recall": 0.7586206896551724,
"eval_TIME_f1": 0.8,
"eval_TIME_number": 34,
"eval_TIME_precision": 0.7317073170731707,
"eval_TIME_recall": 0.8823529411764706,
"eval_loss": 0.13595184683799744,
"eval_overall_accuracy": 0.9566822544917548,
"eval_overall_f1": 0.8105960264900662,
"eval_overall_precision": 0.7574257425742574,
"eval_overall_recall": 0.8717948717948718,
"eval_runtime": 0.3713,
"eval_samples_per_second": 503.665,
"eval_steps_per_second": 8.08,
"step": 10494
},
{
"epoch": 100.0,
"grad_norm": 1.394977331161499,
"learning_rate": 0.0,
"loss": 0.085,
"step": 10600
},
{
"epoch": 100.0,
"eval_LOCATION_f1": 0.7948717948717949,
"eval_LOCATION_number": 73,
"eval_LOCATION_precision": 0.7469879518072289,
"eval_LOCATION_recall": 0.8493150684931506,
"eval_ORGANIZATION_f1": 0.7397260273972603,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.6666666666666666,
"eval_ORGANIZATION_recall": 0.8307692307692308,
"eval_PERSON_f1": 0.8817891373801918,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.8466257668711656,
"eval_PERSON_recall": 0.92,
"eval_QUANTITY_f1": 0.676923076923077,
"eval_QUANTITY_number": 29,
"eval_QUANTITY_precision": 0.6111111111111112,
"eval_QUANTITY_recall": 0.7586206896551724,
"eval_TIME_f1": 0.8,
"eval_TIME_number": 34,
"eval_TIME_precision": 0.7317073170731707,
"eval_TIME_recall": 0.8823529411764706,
"eval_loss": 0.1360514611005783,
"eval_overall_accuracy": 0.9564361309377307,
"eval_overall_f1": 0.8105960264900662,
"eval_overall_precision": 0.7574257425742574,
"eval_overall_recall": 0.8717948717948718,
"eval_runtime": 0.3715,
"eval_samples_per_second": 503.418,
"eval_steps_per_second": 8.076,
"step": 10600
},
{
"epoch": 100.0,
"step": 10600,
"total_flos": 4535917761443712.0,
"train_loss": 0.14489822162772126,
"train_runtime": 603.3251,
"train_samples_per_second": 279.783,
"train_steps_per_second": 17.569
}
],
"logging_steps": 500,
"max_steps": 10600,
"num_input_tokens_seen": 0,
"num_train_epochs": 100,
"save_steps": 500,
"total_flos": 4535917761443712.0,
"train_batch_size": 16,
"trial_name": null,
"trial_params": null
}