nerugm-pt-pl50-4 / trainer_state.json
apwic's picture
End of training
513ed94 verified
{
"best_metric": null,
"best_model_checkpoint": null,
"epoch": 100.0,
"eval_steps": 500,
"global_step": 10600,
"is_hyper_param_search": false,
"is_local_process_zero": true,
"is_world_process_zero": true,
"log_history": [
{
"epoch": 1.0,
"grad_norm": 1.875795841217041,
"learning_rate": 4.9500000000000004e-05,
"loss": 0.9784,
"step": 106
},
{
"epoch": 1.0,
"eval_LOCATION_f1": 0.0,
"eval_LOCATION_number": 73,
"eval_LOCATION_precision": 0.0,
"eval_LOCATION_recall": 0.0,
"eval_ORGANIZATION_f1": 0.0,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.0,
"eval_ORGANIZATION_recall": 0.0,
"eval_PERSON_f1": 0.024390243902439025,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.14285714285714285,
"eval_PERSON_recall": 0.013333333333333334,
"eval_QUANTITY_f1": 0.0,
"eval_QUANTITY_number": 29,
"eval_QUANTITY_precision": 0.0,
"eval_QUANTITY_recall": 0.0,
"eval_TIME_f1": 0.0,
"eval_TIME_number": 34,
"eval_TIME_precision": 0.0,
"eval_TIME_recall": 0.0,
"eval_loss": 0.5909550189971924,
"eval_overall_accuracy": 0.8392813192222496,
"eval_overall_f1": 0.010638297872340425,
"eval_overall_precision": 0.08,
"eval_overall_recall": 0.005698005698005698,
"eval_runtime": 0.3532,
"eval_samples_per_second": 529.423,
"eval_steps_per_second": 8.493,
"step": 106
},
{
"epoch": 2.0,
"grad_norm": 1.4692219495773315,
"learning_rate": 4.9e-05,
"loss": 0.4893,
"step": 212
},
{
"epoch": 2.0,
"eval_LOCATION_f1": 0.4444444444444445,
"eval_LOCATION_number": 73,
"eval_LOCATION_precision": 0.5909090909090909,
"eval_LOCATION_recall": 0.3561643835616438,
"eval_ORGANIZATION_f1": 0.12328767123287672,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.1111111111111111,
"eval_ORGANIZATION_recall": 0.13846153846153847,
"eval_PERSON_f1": 0.6703910614525139,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.5769230769230769,
"eval_PERSON_recall": 0.8,
"eval_QUANTITY_f1": 0.2857142857142857,
"eval_QUANTITY_number": 29,
"eval_QUANTITY_precision": 0.2962962962962963,
"eval_QUANTITY_recall": 0.27586206896551724,
"eval_TIME_f1": 0.6301369863013699,
"eval_TIME_number": 34,
"eval_TIME_precision": 0.5897435897435898,
"eval_TIME_recall": 0.6764705882352942,
"eval_loss": 0.35233741998672485,
"eval_overall_accuracy": 0.9020428254984002,
"eval_overall_f1": 0.496,
"eval_overall_precision": 0.46616541353383456,
"eval_overall_recall": 0.5299145299145299,
"eval_runtime": 0.3497,
"eval_samples_per_second": 534.772,
"eval_steps_per_second": 8.579,
"step": 212
},
{
"epoch": 3.0,
"grad_norm": 0.853384792804718,
"learning_rate": 4.85e-05,
"loss": 0.2876,
"step": 318
},
{
"epoch": 3.0,
"eval_LOCATION_f1": 0.6242038216560509,
"eval_LOCATION_number": 73,
"eval_LOCATION_precision": 0.5833333333333334,
"eval_LOCATION_recall": 0.6712328767123288,
"eval_ORGANIZATION_f1": 0.4090909090909091,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.40298507462686567,
"eval_ORGANIZATION_recall": 0.4153846153846154,
"eval_PERSON_f1": 0.8500000000000001,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.8,
"eval_PERSON_recall": 0.9066666666666666,
"eval_QUANTITY_f1": 0.6268656716417911,
"eval_QUANTITY_number": 29,
"eval_QUANTITY_precision": 0.5526315789473685,
"eval_QUANTITY_recall": 0.7241379310344828,
"eval_TIME_f1": 0.8571428571428571,
"eval_TIME_number": 34,
"eval_TIME_precision": 0.8333333333333334,
"eval_TIME_recall": 0.8823529411764706,
"eval_loss": 0.19235990941524506,
"eval_overall_accuracy": 0.9369923701698253,
"eval_overall_f1": 0.7050938337801608,
"eval_overall_precision": 0.6658227848101266,
"eval_overall_recall": 0.7492877492877493,
"eval_runtime": 0.3493,
"eval_samples_per_second": 535.38,
"eval_steps_per_second": 8.589,
"step": 318
},
{
"epoch": 4.0,
"grad_norm": 0.8233245015144348,
"learning_rate": 4.8e-05,
"loss": 0.2003,
"step": 424
},
{
"epoch": 4.0,
"eval_LOCATION_f1": 0.7295597484276729,
"eval_LOCATION_number": 73,
"eval_LOCATION_precision": 0.6744186046511628,
"eval_LOCATION_recall": 0.7945205479452054,
"eval_ORGANIZATION_f1": 0.6144578313253013,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.504950495049505,
"eval_ORGANIZATION_recall": 0.7846153846153846,
"eval_PERSON_f1": 0.8698412698412699,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.8303030303030303,
"eval_PERSON_recall": 0.9133333333333333,
"eval_QUANTITY_f1": 0.7042253521126761,
"eval_QUANTITY_number": 29,
"eval_QUANTITY_precision": 0.5952380952380952,
"eval_QUANTITY_recall": 0.8620689655172413,
"eval_TIME_f1": 0.8493150684931507,
"eval_TIME_number": 34,
"eval_TIME_precision": 0.7948717948717948,
"eval_TIME_recall": 0.9117647058823529,
"eval_loss": 0.16705787181854248,
"eval_overall_accuracy": 0.9414225941422594,
"eval_overall_f1": 0.7704081632653061,
"eval_overall_precision": 0.6974595842956121,
"eval_overall_recall": 0.8603988603988604,
"eval_runtime": 0.3492,
"eval_samples_per_second": 535.517,
"eval_steps_per_second": 8.591,
"step": 424
},
{
"epoch": 5.0,
"grad_norm": 1.155442476272583,
"learning_rate": 4.75e-05,
"loss": 0.1732,
"step": 530
},
{
"epoch": 5.0,
"eval_LOCATION_f1": 0.7672955974842768,
"eval_LOCATION_number": 73,
"eval_LOCATION_precision": 0.7093023255813954,
"eval_LOCATION_recall": 0.8356164383561644,
"eval_ORGANIZATION_f1": 0.6011560693641619,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.48148148148148145,
"eval_ORGANIZATION_recall": 0.8,
"eval_PERSON_f1": 0.8690095846645367,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.8343558282208589,
"eval_PERSON_recall": 0.9066666666666666,
"eval_QUANTITY_f1": 0.7272727272727273,
"eval_QUANTITY_number": 29,
"eval_QUANTITY_precision": 0.6486486486486487,
"eval_QUANTITY_recall": 0.8275862068965517,
"eval_TIME_f1": 0.7594936708860759,
"eval_TIME_number": 34,
"eval_TIME_precision": 0.6666666666666666,
"eval_TIME_recall": 0.8823529411764706,
"eval_loss": 0.15311911702156067,
"eval_overall_accuracy": 0.94683731233079,
"eval_overall_f1": 0.7670886075949367,
"eval_overall_precision": 0.6902050113895216,
"eval_overall_recall": 0.8632478632478633,
"eval_runtime": 0.3497,
"eval_samples_per_second": 534.75,
"eval_steps_per_second": 8.579,
"step": 530
},
{
"epoch": 6.0,
"grad_norm": 1.4915152788162231,
"learning_rate": 4.7e-05,
"loss": 0.1556,
"step": 636
},
{
"epoch": 6.0,
"eval_LOCATION_f1": 0.7560975609756097,
"eval_LOCATION_number": 73,
"eval_LOCATION_precision": 0.6813186813186813,
"eval_LOCATION_recall": 0.8493150684931506,
"eval_ORGANIZATION_f1": 0.631578947368421,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.5094339622641509,
"eval_ORGANIZATION_recall": 0.8307692307692308,
"eval_PERSON_f1": 0.8789808917197452,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.8414634146341463,
"eval_PERSON_recall": 0.92,
"eval_QUANTITY_f1": 0.631578947368421,
"eval_QUANTITY_number": 29,
"eval_QUANTITY_precision": 0.5106382978723404,
"eval_QUANTITY_recall": 0.8275862068965517,
"eval_TIME_f1": 0.6829268292682927,
"eval_TIME_number": 34,
"eval_TIME_precision": 0.5833333333333334,
"eval_TIME_recall": 0.8235294117647058,
"eval_loss": 0.17121362686157227,
"eval_overall_accuracy": 0.9396997292640906,
"eval_overall_f1": 0.758364312267658,
"eval_overall_precision": 0.6710526315789473,
"eval_overall_recall": 0.8717948717948718,
"eval_runtime": 0.3488,
"eval_samples_per_second": 536.19,
"eval_steps_per_second": 8.602,
"step": 636
},
{
"epoch": 7.0,
"grad_norm": 0.9724661111831665,
"learning_rate": 4.6500000000000005e-05,
"loss": 0.1437,
"step": 742
},
{
"epoch": 7.0,
"eval_LOCATION_f1": 0.7924528301886793,
"eval_LOCATION_number": 73,
"eval_LOCATION_precision": 0.7325581395348837,
"eval_LOCATION_recall": 0.863013698630137,
"eval_ORGANIZATION_f1": 0.6623376623376623,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.5730337078651685,
"eval_ORGANIZATION_recall": 0.7846153846153846,
"eval_PERSON_f1": 0.8761904761904761,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.8363636363636363,
"eval_PERSON_recall": 0.92,
"eval_QUANTITY_f1": 0.6956521739130435,
"eval_QUANTITY_number": 29,
"eval_QUANTITY_precision": 0.6,
"eval_QUANTITY_recall": 0.8275862068965517,
"eval_TIME_f1": 0.8219178082191781,
"eval_TIME_number": 34,
"eval_TIME_precision": 0.7692307692307693,
"eval_TIME_recall": 0.8823529411764706,
"eval_loss": 0.14172205328941345,
"eval_overall_accuracy": 0.9534826482894413,
"eval_overall_f1": 0.7948051948051948,
"eval_overall_precision": 0.7303102625298329,
"eval_overall_recall": 0.8717948717948718,
"eval_runtime": 0.3495,
"eval_samples_per_second": 534.982,
"eval_steps_per_second": 8.583,
"step": 742
},
{
"epoch": 8.0,
"grad_norm": 0.9051221609115601,
"learning_rate": 4.600000000000001e-05,
"loss": 0.1338,
"step": 848
},
{
"epoch": 8.0,
"eval_LOCATION_f1": 0.7590361445783131,
"eval_LOCATION_number": 73,
"eval_LOCATION_precision": 0.6774193548387096,
"eval_LOCATION_recall": 0.863013698630137,
"eval_ORGANIZATION_f1": 0.6883116883116883,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.5955056179775281,
"eval_ORGANIZATION_recall": 0.8153846153846154,
"eval_PERSON_f1": 0.887459807073955,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.8571428571428571,
"eval_PERSON_recall": 0.92,
"eval_QUANTITY_f1": 0.6956521739130435,
"eval_QUANTITY_number": 29,
"eval_QUANTITY_precision": 0.6,
"eval_QUANTITY_recall": 0.8275862068965517,
"eval_TIME_f1": 0.7532467532467532,
"eval_TIME_number": 34,
"eval_TIME_precision": 0.6744186046511628,
"eval_TIME_recall": 0.8529411764705882,
"eval_loss": 0.14630907773971558,
"eval_overall_accuracy": 0.9529904011813931,
"eval_overall_f1": 0.7902187902187902,
"eval_overall_precision": 0.7206572769953051,
"eval_overall_recall": 0.8746438746438746,
"eval_runtime": 0.3496,
"eval_samples_per_second": 534.867,
"eval_steps_per_second": 8.581,
"step": 848
},
{
"epoch": 9.0,
"grad_norm": 1.2815150022506714,
"learning_rate": 4.55e-05,
"loss": 0.1237,
"step": 954
},
{
"epoch": 9.0,
"eval_LOCATION_f1": 0.8079470198675496,
"eval_LOCATION_number": 73,
"eval_LOCATION_precision": 0.782051282051282,
"eval_LOCATION_recall": 0.8356164383561644,
"eval_ORGANIZATION_f1": 0.670886075949367,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.5698924731182796,
"eval_ORGANIZATION_recall": 0.8153846153846154,
"eval_PERSON_f1": 0.8932038834951457,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.8679245283018868,
"eval_PERSON_recall": 0.92,
"eval_QUANTITY_f1": 0.716417910447761,
"eval_QUANTITY_number": 29,
"eval_QUANTITY_precision": 0.631578947368421,
"eval_QUANTITY_recall": 0.8275862068965517,
"eval_TIME_f1": 0.8219178082191781,
"eval_TIME_number": 34,
"eval_TIME_precision": 0.7692307692307693,
"eval_TIME_recall": 0.8823529411764706,
"eval_loss": 0.1243952140212059,
"eval_overall_accuracy": 0.9571745015998031,
"eval_overall_f1": 0.8073878627968336,
"eval_overall_precision": 0.7518427518427518,
"eval_overall_recall": 0.8717948717948718,
"eval_runtime": 0.3487,
"eval_samples_per_second": 536.261,
"eval_steps_per_second": 8.603,
"step": 954
},
{
"epoch": 10.0,
"grad_norm": 0.8149334788322449,
"learning_rate": 4.5e-05,
"loss": 0.1189,
"step": 1060
},
{
"epoch": 10.0,
"eval_LOCATION_f1": 0.8026315789473685,
"eval_LOCATION_number": 73,
"eval_LOCATION_precision": 0.7721518987341772,
"eval_LOCATION_recall": 0.8356164383561644,
"eval_ORGANIZATION_f1": 0.6751592356687899,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.5760869565217391,
"eval_ORGANIZATION_recall": 0.8153846153846154,
"eval_PERSON_f1": 0.8753993610223643,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.8404907975460123,
"eval_PERSON_recall": 0.9133333333333333,
"eval_QUANTITY_f1": 0.716417910447761,
"eval_QUANTITY_number": 29,
"eval_QUANTITY_precision": 0.631578947368421,
"eval_QUANTITY_recall": 0.8275862068965517,
"eval_TIME_f1": 0.8333333333333333,
"eval_TIME_number": 34,
"eval_TIME_precision": 0.7894736842105263,
"eval_TIME_recall": 0.8823529411764706,
"eval_loss": 0.13834965229034424,
"eval_overall_accuracy": 0.9532365247354172,
"eval_overall_f1": 0.8015768725361366,
"eval_overall_precision": 0.7439024390243902,
"eval_overall_recall": 0.8689458689458689,
"eval_runtime": 0.3499,
"eval_samples_per_second": 534.481,
"eval_steps_per_second": 8.575,
"step": 1060
},
{
"epoch": 11.0,
"grad_norm": 1.1204177141189575,
"learning_rate": 4.4500000000000004e-05,
"loss": 0.1139,
"step": 1166
},
{
"epoch": 11.0,
"eval_LOCATION_f1": 0.8235294117647058,
"eval_LOCATION_number": 73,
"eval_LOCATION_precision": 0.7875,
"eval_LOCATION_recall": 0.863013698630137,
"eval_ORGANIZATION_f1": 0.6620689655172414,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.6,
"eval_ORGANIZATION_recall": 0.7384615384615385,
"eval_PERSON_f1": 0.8996763754045306,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.8742138364779874,
"eval_PERSON_recall": 0.9266666666666666,
"eval_QUANTITY_f1": 0.6666666666666666,
"eval_QUANTITY_number": 29,
"eval_QUANTITY_precision": 0.575,
"eval_QUANTITY_recall": 0.7931034482758621,
"eval_TIME_f1": 0.7837837837837837,
"eval_TIME_number": 34,
"eval_TIME_precision": 0.725,
"eval_TIME_recall": 0.8529411764705882,
"eval_loss": 0.14040923118591309,
"eval_overall_accuracy": 0.9554516367216342,
"eval_overall_f1": 0.8053333333333333,
"eval_overall_precision": 0.7568922305764411,
"eval_overall_recall": 0.8603988603988604,
"eval_runtime": 0.351,
"eval_samples_per_second": 532.751,
"eval_steps_per_second": 8.547,
"step": 1166
},
{
"epoch": 12.0,
"grad_norm": 1.1477428674697876,
"learning_rate": 4.4000000000000006e-05,
"loss": 0.1056,
"step": 1272
},
{
"epoch": 12.0,
"eval_LOCATION_f1": 0.8076923076923077,
"eval_LOCATION_number": 73,
"eval_LOCATION_precision": 0.7590361445783133,
"eval_LOCATION_recall": 0.863013698630137,
"eval_ORGANIZATION_f1": 0.7058823529411765,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.6136363636363636,
"eval_ORGANIZATION_recall": 0.8307692307692308,
"eval_PERSON_f1": 0.888178913738019,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.852760736196319,
"eval_PERSON_recall": 0.9266666666666666,
"eval_QUANTITY_f1": 0.7272727272727273,
"eval_QUANTITY_number": 29,
"eval_QUANTITY_precision": 0.6486486486486487,
"eval_QUANTITY_recall": 0.8275862068965517,
"eval_TIME_f1": 0.8055555555555555,
"eval_TIME_number": 34,
"eval_TIME_precision": 0.7631578947368421,
"eval_TIME_recall": 0.8529411764705882,
"eval_loss": 0.13301722705364227,
"eval_overall_accuracy": 0.9579128722618755,
"eval_overall_f1": 0.8131578947368421,
"eval_overall_precision": 0.7555012224938875,
"eval_overall_recall": 0.8803418803418803,
"eval_runtime": 0.3491,
"eval_samples_per_second": 535.587,
"eval_steps_per_second": 8.592,
"step": 1272
},
{
"epoch": 13.0,
"grad_norm": 0.6786032319068909,
"learning_rate": 4.35e-05,
"loss": 0.1032,
"step": 1378
},
{
"epoch": 13.0,
"eval_LOCATION_f1": 0.8211920529801324,
"eval_LOCATION_number": 73,
"eval_LOCATION_precision": 0.7948717948717948,
"eval_LOCATION_recall": 0.8493150684931506,
"eval_ORGANIZATION_f1": 0.675,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.5684210526315789,
"eval_ORGANIZATION_recall": 0.8307692307692308,
"eval_PERSON_f1": 0.8945686900958466,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.8588957055214724,
"eval_PERSON_recall": 0.9333333333333333,
"eval_QUANTITY_f1": 0.7058823529411765,
"eval_QUANTITY_number": 29,
"eval_QUANTITY_precision": 0.6153846153846154,
"eval_QUANTITY_recall": 0.8275862068965517,
"eval_TIME_f1": 0.8285714285714286,
"eval_TIME_number": 34,
"eval_TIME_precision": 0.8055555555555556,
"eval_TIME_recall": 0.8529411764705882,
"eval_loss": 0.1293208748102188,
"eval_overall_accuracy": 0.956928378045779,
"eval_overall_f1": 0.811023622047244,
"eval_overall_precision": 0.7518248175182481,
"eval_overall_recall": 0.8803418803418803,
"eval_runtime": 0.3485,
"eval_samples_per_second": 536.51,
"eval_steps_per_second": 8.607,
"step": 1378
},
{
"epoch": 14.0,
"grad_norm": 1.0159380435943604,
"learning_rate": 4.3e-05,
"loss": 0.1013,
"step": 1484
},
{
"epoch": 14.0,
"eval_LOCATION_f1": 0.7973856209150326,
"eval_LOCATION_number": 73,
"eval_LOCATION_precision": 0.7625,
"eval_LOCATION_recall": 0.8356164383561644,
"eval_ORGANIZATION_f1": 0.6666666666666666,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.6301369863013698,
"eval_ORGANIZATION_recall": 0.7076923076923077,
"eval_PERSON_f1": 0.8717948717948718,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.8395061728395061,
"eval_PERSON_recall": 0.9066666666666666,
"eval_QUANTITY_f1": 0.746268656716418,
"eval_QUANTITY_number": 29,
"eval_QUANTITY_precision": 0.6578947368421053,
"eval_QUANTITY_recall": 0.8620689655172413,
"eval_TIME_f1": 0.7777777777777778,
"eval_TIME_number": 34,
"eval_TIME_precision": 0.7368421052631579,
"eval_TIME_recall": 0.8235294117647058,
"eval_loss": 0.14084841310977936,
"eval_overall_accuracy": 0.9564361309377307,
"eval_overall_f1": 0.7978436657681941,
"eval_overall_precision": 0.7570332480818415,
"eval_overall_recall": 0.8433048433048433,
"eval_runtime": 0.3493,
"eval_samples_per_second": 535.324,
"eval_steps_per_second": 8.588,
"step": 1484
},
{
"epoch": 15.0,
"grad_norm": 1.4810669422149658,
"learning_rate": 4.25e-05,
"loss": 0.0926,
"step": 1590
},
{
"epoch": 15.0,
"eval_LOCATION_f1": 0.8211920529801324,
"eval_LOCATION_number": 73,
"eval_LOCATION_precision": 0.7948717948717948,
"eval_LOCATION_recall": 0.8493150684931506,
"eval_ORGANIZATION_f1": 0.6794871794871795,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.5824175824175825,
"eval_ORGANIZATION_recall": 0.8153846153846154,
"eval_PERSON_f1": 0.8945686900958466,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.8588957055214724,
"eval_PERSON_recall": 0.9333333333333333,
"eval_QUANTITY_f1": 0.7647058823529411,
"eval_QUANTITY_number": 29,
"eval_QUANTITY_precision": 0.6666666666666666,
"eval_QUANTITY_recall": 0.896551724137931,
"eval_TIME_f1": 0.8285714285714286,
"eval_TIME_number": 34,
"eval_TIME_precision": 0.8055555555555556,
"eval_TIME_recall": 0.8529411764705882,
"eval_loss": 0.13149809837341309,
"eval_overall_accuracy": 0.956928378045779,
"eval_overall_f1": 0.8179419525065963,
"eval_overall_precision": 0.7616707616707616,
"eval_overall_recall": 0.8831908831908832,
"eval_runtime": 0.35,
"eval_samples_per_second": 534.326,
"eval_steps_per_second": 8.572,
"step": 1590
},
{
"epoch": 16.0,
"grad_norm": 1.0576220750808716,
"learning_rate": 4.2e-05,
"loss": 0.0913,
"step": 1696
},
{
"epoch": 16.0,
"eval_LOCATION_f1": 0.8157894736842105,
"eval_LOCATION_number": 73,
"eval_LOCATION_precision": 0.7848101265822784,
"eval_LOCATION_recall": 0.8493150684931506,
"eval_ORGANIZATION_f1": 0.7083333333333334,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.6455696202531646,
"eval_ORGANIZATION_recall": 0.7846153846153846,
"eval_PERSON_f1": 0.888888888888889,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.8484848484848485,
"eval_PERSON_recall": 0.9333333333333333,
"eval_QUANTITY_f1": 0.6575342465753425,
"eval_QUANTITY_number": 29,
"eval_QUANTITY_precision": 0.5454545454545454,
"eval_QUANTITY_recall": 0.8275862068965517,
"eval_TIME_f1": 0.767123287671233,
"eval_TIME_number": 34,
"eval_TIME_precision": 0.717948717948718,
"eval_TIME_recall": 0.8235294117647058,
"eval_loss": 0.14829330146312714,
"eval_overall_accuracy": 0.9554516367216342,
"eval_overall_f1": 0.8058124174372523,
"eval_overall_precision": 0.7512315270935961,
"eval_overall_recall": 0.8689458689458689,
"eval_runtime": 0.349,
"eval_samples_per_second": 535.785,
"eval_steps_per_second": 8.595,
"step": 1696
},
{
"epoch": 17.0,
"grad_norm": 0.3293265998363495,
"learning_rate": 4.15e-05,
"loss": 0.0888,
"step": 1802
},
{
"epoch": 17.0,
"eval_LOCATION_f1": 0.794701986754967,
"eval_LOCATION_number": 73,
"eval_LOCATION_precision": 0.7692307692307693,
"eval_LOCATION_recall": 0.821917808219178,
"eval_ORGANIZATION_f1": 0.7210884353741497,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.6463414634146342,
"eval_ORGANIZATION_recall": 0.8153846153846154,
"eval_PERSON_f1": 0.8917197452229298,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.8536585365853658,
"eval_PERSON_recall": 0.9333333333333333,
"eval_QUANTITY_f1": 0.8253968253968255,
"eval_QUANTITY_number": 29,
"eval_QUANTITY_precision": 0.7647058823529411,
"eval_QUANTITY_recall": 0.896551724137931,
"eval_TIME_f1": 0.7567567567567567,
"eval_TIME_number": 34,
"eval_TIME_precision": 0.7,
"eval_TIME_recall": 0.8235294117647058,
"eval_loss": 0.13628779351711273,
"eval_overall_accuracy": 0.9584051193699237,
"eval_overall_f1": 0.8197596795727637,
"eval_overall_precision": 0.7713567839195979,
"eval_overall_recall": 0.8746438746438746,
"eval_runtime": 0.3508,
"eval_samples_per_second": 533.043,
"eval_steps_per_second": 8.551,
"step": 1802
},
{
"epoch": 18.0,
"grad_norm": 0.991680920124054,
"learning_rate": 4.1e-05,
"loss": 0.0861,
"step": 1908
},
{
"epoch": 18.0,
"eval_LOCATION_f1": 0.7692307692307693,
"eval_LOCATION_number": 73,
"eval_LOCATION_precision": 0.7228915662650602,
"eval_LOCATION_recall": 0.821917808219178,
"eval_ORGANIZATION_f1": 0.7114093959731543,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.6309523809523809,
"eval_ORGANIZATION_recall": 0.8153846153846154,
"eval_PERSON_f1": 0.8980891719745222,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.8597560975609756,
"eval_PERSON_recall": 0.94,
"eval_QUANTITY_f1": 0.7761194029850746,
"eval_QUANTITY_number": 29,
"eval_QUANTITY_precision": 0.6842105263157895,
"eval_QUANTITY_recall": 0.896551724137931,
"eval_TIME_f1": 0.7777777777777778,
"eval_TIME_number": 34,
"eval_TIME_precision": 0.7368421052631579,
"eval_TIME_recall": 0.8235294117647058,
"eval_loss": 0.1477837860584259,
"eval_overall_accuracy": 0.9559438838296825,
"eval_overall_f1": 0.8126649076517152,
"eval_overall_precision": 0.7567567567567568,
"eval_overall_recall": 0.8774928774928775,
"eval_runtime": 0.3475,
"eval_samples_per_second": 538.055,
"eval_steps_per_second": 8.632,
"step": 1908
},
{
"epoch": 19.0,
"grad_norm": 1.0064384937286377,
"learning_rate": 4.05e-05,
"loss": 0.0862,
"step": 2014
},
{
"epoch": 19.0,
"eval_LOCATION_f1": 0.8187919463087249,
"eval_LOCATION_number": 73,
"eval_LOCATION_precision": 0.8026315789473685,
"eval_LOCATION_recall": 0.8356164383561644,
"eval_ORGANIZATION_f1": 0.7210884353741497,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.6463414634146342,
"eval_ORGANIZATION_recall": 0.8153846153846154,
"eval_PERSON_f1": 0.887459807073955,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.8571428571428571,
"eval_PERSON_recall": 0.92,
"eval_QUANTITY_f1": 0.8125,
"eval_QUANTITY_number": 29,
"eval_QUANTITY_precision": 0.7428571428571429,
"eval_QUANTITY_recall": 0.896551724137931,
"eval_TIME_f1": 0.767123287671233,
"eval_TIME_number": 34,
"eval_TIME_precision": 0.717948717948718,
"eval_TIME_recall": 0.8235294117647058,
"eval_loss": 0.12853632867336273,
"eval_overall_accuracy": 0.961112478464189,
"eval_overall_f1": 0.8225806451612903,
"eval_overall_precision": 0.7786259541984732,
"eval_overall_recall": 0.8717948717948718,
"eval_runtime": 0.3498,
"eval_samples_per_second": 534.521,
"eval_steps_per_second": 8.575,
"step": 2014
},
{
"epoch": 20.0,
"grad_norm": 0.54794842004776,
"learning_rate": 4e-05,
"loss": 0.0787,
"step": 2120
},
{
"epoch": 20.0,
"eval_LOCATION_f1": 0.8026315789473685,
"eval_LOCATION_number": 73,
"eval_LOCATION_precision": 0.7721518987341772,
"eval_LOCATION_recall": 0.8356164383561644,
"eval_ORGANIZATION_f1": 0.7027027027027027,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.6265060240963856,
"eval_ORGANIZATION_recall": 0.8,
"eval_PERSON_f1": 0.8910256410256411,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.8580246913580247,
"eval_PERSON_recall": 0.9266666666666666,
"eval_QUANTITY_f1": 0.7246376811594203,
"eval_QUANTITY_number": 29,
"eval_QUANTITY_precision": 0.625,
"eval_QUANTITY_recall": 0.8620689655172413,
"eval_TIME_f1": 0.8285714285714286,
"eval_TIME_number": 34,
"eval_TIME_precision": 0.8055555555555556,
"eval_TIME_recall": 0.8529411764705882,
"eval_loss": 0.1396997570991516,
"eval_overall_accuracy": 0.956928378045779,
"eval_overall_f1": 0.8149134487350199,
"eval_overall_precision": 0.765,
"eval_overall_recall": 0.8717948717948718,
"eval_runtime": 0.3498,
"eval_samples_per_second": 534.561,
"eval_steps_per_second": 8.576,
"step": 2120
},
{
"epoch": 21.0,
"grad_norm": 1.174849510192871,
"learning_rate": 3.9500000000000005e-05,
"loss": 0.0787,
"step": 2226
},
{
"epoch": 21.0,
"eval_LOCATION_f1": 0.8079470198675496,
"eval_LOCATION_number": 73,
"eval_LOCATION_precision": 0.782051282051282,
"eval_LOCATION_recall": 0.8356164383561644,
"eval_ORGANIZATION_f1": 0.7007299270072994,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.6666666666666666,
"eval_ORGANIZATION_recall": 0.7384615384615385,
"eval_PERSON_f1": 0.8846153846153846,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.8518518518518519,
"eval_PERSON_recall": 0.92,
"eval_QUANTITY_f1": 0.6216216216216216,
"eval_QUANTITY_number": 29,
"eval_QUANTITY_precision": 0.5111111111111111,
"eval_QUANTITY_recall": 0.7931034482758621,
"eval_TIME_f1": 0.8405797101449276,
"eval_TIME_number": 34,
"eval_TIME_precision": 0.8285714285714286,
"eval_TIME_recall": 0.8529411764705882,
"eval_loss": 0.13471455872058868,
"eval_overall_accuracy": 0.9576667487078513,
"eval_overall_f1": 0.8048452220726783,
"eval_overall_precision": 0.7627551020408163,
"eval_overall_recall": 0.8518518518518519,
"eval_runtime": 0.349,
"eval_samples_per_second": 535.833,
"eval_steps_per_second": 8.596,
"step": 2226
},
{
"epoch": 22.0,
"grad_norm": 2.117086887359619,
"learning_rate": 3.9000000000000006e-05,
"loss": 0.0776,
"step": 2332
},
{
"epoch": 22.0,
"eval_LOCATION_f1": 0.7922077922077922,
"eval_LOCATION_number": 73,
"eval_LOCATION_precision": 0.7530864197530864,
"eval_LOCATION_recall": 0.8356164383561644,
"eval_ORGANIZATION_f1": 0.6751592356687899,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.5760869565217391,
"eval_ORGANIZATION_recall": 0.8153846153846154,
"eval_PERSON_f1": 0.8954248366013071,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.8782051282051282,
"eval_PERSON_recall": 0.9133333333333333,
"eval_QUANTITY_f1": 0.7812500000000001,
"eval_QUANTITY_number": 29,
"eval_QUANTITY_precision": 0.7142857142857143,
"eval_QUANTITY_recall": 0.8620689655172413,
"eval_TIME_f1": 0.8450704225352113,
"eval_TIME_number": 34,
"eval_TIME_precision": 0.8108108108108109,
"eval_TIME_recall": 0.8823529411764706,
"eval_loss": 0.13748787343502045,
"eval_overall_accuracy": 0.9556977602756583,
"eval_overall_f1": 0.8138297872340426,
"eval_overall_precision": 0.7630922693266833,
"eval_overall_recall": 0.8717948717948718,
"eval_runtime": 0.3484,
"eval_samples_per_second": 536.695,
"eval_steps_per_second": 8.61,
"step": 2332
},
{
"epoch": 23.0,
"grad_norm": 0.9372581839561462,
"learning_rate": 3.85e-05,
"loss": 0.0735,
"step": 2438
},
{
"epoch": 23.0,
"eval_LOCATION_f1": 0.8157894736842105,
"eval_LOCATION_number": 73,
"eval_LOCATION_precision": 0.7848101265822784,
"eval_LOCATION_recall": 0.8493150684931506,
"eval_ORGANIZATION_f1": 0.7412587412587412,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.6794871794871795,
"eval_ORGANIZATION_recall": 0.8153846153846154,
"eval_PERSON_f1": 0.8817891373801918,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.8466257668711656,
"eval_PERSON_recall": 0.92,
"eval_QUANTITY_f1": 0.8064516129032258,
"eval_QUANTITY_number": 29,
"eval_QUANTITY_precision": 0.7575757575757576,
"eval_QUANTITY_recall": 0.8620689655172413,
"eval_TIME_f1": 0.8732394366197184,
"eval_TIME_number": 34,
"eval_TIME_precision": 0.8378378378378378,
"eval_TIME_recall": 0.9117647058823529,
"eval_loss": 0.13373343646526337,
"eval_overall_accuracy": 0.9618508491262614,
"eval_overall_f1": 0.8340080971659919,
"eval_overall_precision": 0.7923076923076923,
"eval_overall_recall": 0.8803418803418803,
"eval_runtime": 0.3486,
"eval_samples_per_second": 536.447,
"eval_steps_per_second": 8.606,
"step": 2438
},
{
"epoch": 24.0,
"grad_norm": 1.0222715139389038,
"learning_rate": 3.8e-05,
"loss": 0.073,
"step": 2544
},
{
"epoch": 24.0,
"eval_LOCATION_f1": 0.8026315789473685,
"eval_LOCATION_number": 73,
"eval_LOCATION_precision": 0.7721518987341772,
"eval_LOCATION_recall": 0.8356164383561644,
"eval_ORGANIZATION_f1": 0.6883116883116883,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.5955056179775281,
"eval_ORGANIZATION_recall": 0.8153846153846154,
"eval_PERSON_f1": 0.8996763754045306,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.8742138364779874,
"eval_PERSON_recall": 0.9266666666666666,
"eval_QUANTITY_f1": 0.7692307692307692,
"eval_QUANTITY_number": 29,
"eval_QUANTITY_precision": 0.6944444444444444,
"eval_QUANTITY_recall": 0.8620689655172413,
"eval_TIME_f1": 0.8285714285714286,
"eval_TIME_number": 34,
"eval_TIME_precision": 0.8055555555555556,
"eval_TIME_recall": 0.8529411764705882,
"eval_loss": 0.1394394040107727,
"eval_overall_accuracy": 0.9581589958158996,
"eval_overall_f1": 0.8186666666666667,
"eval_overall_precision": 0.7694235588972431,
"eval_overall_recall": 0.8746438746438746,
"eval_runtime": 0.3498,
"eval_samples_per_second": 534.589,
"eval_steps_per_second": 8.576,
"step": 2544
},
{
"epoch": 25.0,
"grad_norm": 0.7979212403297424,
"learning_rate": 3.7500000000000003e-05,
"loss": 0.0713,
"step": 2650
},
{
"epoch": 25.0,
"eval_LOCATION_f1": 0.7894736842105263,
"eval_LOCATION_number": 73,
"eval_LOCATION_precision": 0.759493670886076,
"eval_LOCATION_recall": 0.821917808219178,
"eval_ORGANIZATION_f1": 0.7310344827586207,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.6625,
"eval_ORGANIZATION_recall": 0.8153846153846154,
"eval_PERSON_f1": 0.8932038834951457,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.8679245283018868,
"eval_PERSON_recall": 0.92,
"eval_QUANTITY_f1": 0.6956521739130435,
"eval_QUANTITY_number": 29,
"eval_QUANTITY_precision": 0.6,
"eval_QUANTITY_recall": 0.8275862068965517,
"eval_TIME_f1": 0.7887323943661971,
"eval_TIME_number": 34,
"eval_TIME_precision": 0.7567567567567568,
"eval_TIME_recall": 0.8235294117647058,
"eval_loss": 0.14228081703186035,
"eval_overall_accuracy": 0.9598818606940684,
"eval_overall_f1": 0.8123324396782841,
"eval_overall_precision": 0.7670886075949367,
"eval_overall_recall": 0.8632478632478633,
"eval_runtime": 0.3501,
"eval_samples_per_second": 534.14,
"eval_steps_per_second": 8.569,
"step": 2650
},
{
"epoch": 26.0,
"grad_norm": 0.5613954663276672,
"learning_rate": 3.7e-05,
"loss": 0.0672,
"step": 2756
},
{
"epoch": 26.0,
"eval_LOCATION_f1": 0.7843137254901962,
"eval_LOCATION_number": 73,
"eval_LOCATION_precision": 0.75,
"eval_LOCATION_recall": 0.821917808219178,
"eval_ORGANIZATION_f1": 0.7172413793103448,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.65,
"eval_ORGANIZATION_recall": 0.8,
"eval_PERSON_f1": 0.9067524115755627,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.8757763975155279,
"eval_PERSON_recall": 0.94,
"eval_QUANTITY_f1": 0.6857142857142856,
"eval_QUANTITY_number": 29,
"eval_QUANTITY_precision": 0.5853658536585366,
"eval_QUANTITY_recall": 0.8275862068965517,
"eval_TIME_f1": 0.7567567567567567,
"eval_TIME_number": 34,
"eval_TIME_precision": 0.7,
"eval_TIME_recall": 0.8235294117647058,
"eval_loss": 0.15085051953792572,
"eval_overall_accuracy": 0.956928378045779,
"eval_overall_f1": 0.8100929614873837,
"eval_overall_precision": 0.7587064676616916,
"eval_overall_recall": 0.8689458689458689,
"eval_runtime": 0.3515,
"eval_samples_per_second": 532.067,
"eval_steps_per_second": 8.536,
"step": 2756
},
{
"epoch": 27.0,
"grad_norm": 0.650170624256134,
"learning_rate": 3.65e-05,
"loss": 0.0651,
"step": 2862
},
{
"epoch": 27.0,
"eval_LOCATION_f1": 0.7866666666666666,
"eval_LOCATION_number": 73,
"eval_LOCATION_precision": 0.7662337662337663,
"eval_LOCATION_recall": 0.8082191780821918,
"eval_ORGANIZATION_f1": 0.7248322147651007,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.6428571428571429,
"eval_ORGANIZATION_recall": 0.8307692307692308,
"eval_PERSON_f1": 0.8896103896103896,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.8670886075949367,
"eval_PERSON_recall": 0.9133333333333333,
"eval_QUANTITY_f1": 0.716417910447761,
"eval_QUANTITY_number": 29,
"eval_QUANTITY_precision": 0.631578947368421,
"eval_QUANTITY_recall": 0.8275862068965517,
"eval_TIME_f1": 0.8169014084507041,
"eval_TIME_number": 34,
"eval_TIME_precision": 0.7837837837837838,
"eval_TIME_recall": 0.8529411764705882,
"eval_loss": 0.14231501519680023,
"eval_overall_accuracy": 0.9581589958158996,
"eval_overall_f1": 0.8134228187919463,
"eval_overall_precision": 0.7690355329949239,
"eval_overall_recall": 0.8632478632478633,
"eval_runtime": 0.3486,
"eval_samples_per_second": 536.421,
"eval_steps_per_second": 8.606,
"step": 2862
},
{
"epoch": 28.0,
"grad_norm": 1.0213465690612793,
"learning_rate": 3.6e-05,
"loss": 0.0659,
"step": 2968
},
{
"epoch": 28.0,
"eval_LOCATION_f1": 0.8400000000000001,
"eval_LOCATION_number": 73,
"eval_LOCATION_precision": 0.8181818181818182,
"eval_LOCATION_recall": 0.863013698630137,
"eval_ORGANIZATION_f1": 0.7142857142857142,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.6666666666666666,
"eval_ORGANIZATION_recall": 0.7692307692307693,
"eval_PERSON_f1": 0.9019607843137256,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.8846153846153846,
"eval_PERSON_recall": 0.92,
"eval_QUANTITY_f1": 0.7936507936507937,
"eval_QUANTITY_number": 29,
"eval_QUANTITY_precision": 0.7352941176470589,
"eval_QUANTITY_recall": 0.8620689655172413,
"eval_TIME_f1": 0.8571428571428571,
"eval_TIME_number": 34,
"eval_TIME_precision": 0.8333333333333334,
"eval_TIME_recall": 0.8823529411764706,
"eval_loss": 0.13195978105068207,
"eval_overall_accuracy": 0.9616047255722373,
"eval_overall_f1": 0.8395061728395062,
"eval_overall_precision": 0.8095238095238095,
"eval_overall_recall": 0.8717948717948718,
"eval_runtime": 0.3507,
"eval_samples_per_second": 533.256,
"eval_steps_per_second": 8.555,
"step": 2968
},
{
"epoch": 29.0,
"grad_norm": 1.3771088123321533,
"learning_rate": 3.55e-05,
"loss": 0.0619,
"step": 3074
},
{
"epoch": 29.0,
"eval_LOCATION_f1": 0.8344370860927152,
"eval_LOCATION_number": 73,
"eval_LOCATION_precision": 0.8076923076923077,
"eval_LOCATION_recall": 0.863013698630137,
"eval_ORGANIZATION_f1": 0.6956521739130436,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.5833333333333334,
"eval_ORGANIZATION_recall": 0.8615384615384616,
"eval_PERSON_f1": 0.9144736842105262,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.9025974025974026,
"eval_PERSON_recall": 0.9266666666666666,
"eval_QUANTITY_f1": 0.75,
"eval_QUANTITY_number": 29,
"eval_QUANTITY_precision": 0.6857142857142857,
"eval_QUANTITY_recall": 0.8275862068965517,
"eval_TIME_f1": 0.8732394366197184,
"eval_TIME_number": 34,
"eval_TIME_precision": 0.8378378378378378,
"eval_TIME_recall": 0.9117647058823529,
"eval_loss": 0.1354289948940277,
"eval_overall_accuracy": 0.9616047255722373,
"eval_overall_f1": 0.833555259653795,
"eval_overall_precision": 0.7825,
"eval_overall_recall": 0.8917378917378918,
"eval_runtime": 0.3485,
"eval_samples_per_second": 536.594,
"eval_steps_per_second": 8.608,
"step": 3074
},
{
"epoch": 30.0,
"grad_norm": 1.0532158613204956,
"learning_rate": 3.5e-05,
"loss": 0.06,
"step": 3180
},
{
"epoch": 30.0,
"eval_LOCATION_f1": 0.8211920529801324,
"eval_LOCATION_number": 73,
"eval_LOCATION_precision": 0.7948717948717948,
"eval_LOCATION_recall": 0.8493150684931506,
"eval_ORGANIZATION_f1": 0.7083333333333334,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.6455696202531646,
"eval_ORGANIZATION_recall": 0.7846153846153846,
"eval_PERSON_f1": 0.8925081433224756,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.8726114649681529,
"eval_PERSON_recall": 0.9133333333333333,
"eval_QUANTITY_f1": 0.7741935483870968,
"eval_QUANTITY_number": 29,
"eval_QUANTITY_precision": 0.7272727272727273,
"eval_QUANTITY_recall": 0.8275862068965517,
"eval_TIME_f1": 0.7887323943661971,
"eval_TIME_number": 34,
"eval_TIME_precision": 0.7567567567567568,
"eval_TIME_recall": 0.8235294117647058,
"eval_loss": 0.1394852250814438,
"eval_overall_accuracy": 0.9613586020182131,
"eval_overall_f1": 0.8217687074829932,
"eval_overall_precision": 0.7864583333333334,
"eval_overall_recall": 0.8603988603988604,
"eval_runtime": 0.3484,
"eval_samples_per_second": 536.678,
"eval_steps_per_second": 8.61,
"step": 3180
},
{
"epoch": 31.0,
"grad_norm": 0.5543320178985596,
"learning_rate": 3.45e-05,
"loss": 0.0597,
"step": 3286
},
{
"epoch": 31.0,
"eval_LOCATION_f1": 0.8258064516129032,
"eval_LOCATION_number": 73,
"eval_LOCATION_precision": 0.7804878048780488,
"eval_LOCATION_recall": 0.8767123287671232,
"eval_ORGANIZATION_f1": 0.6861313868613138,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.6527777777777778,
"eval_ORGANIZATION_recall": 0.7230769230769231,
"eval_PERSON_f1": 0.9114754098360656,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.896774193548387,
"eval_PERSON_recall": 0.9266666666666666,
"eval_QUANTITY_f1": 0.7575757575757576,
"eval_QUANTITY_number": 29,
"eval_QUANTITY_precision": 0.6756756756756757,
"eval_QUANTITY_recall": 0.8620689655172413,
"eval_TIME_f1": 0.8450704225352113,
"eval_TIME_number": 34,
"eval_TIME_precision": 0.8108108108108109,
"eval_TIME_recall": 0.8823529411764706,
"eval_loss": 0.1364583671092987,
"eval_overall_accuracy": 0.9623430962343096,
"eval_overall_f1": 0.8310626702997275,
"eval_overall_precision": 0.7963446475195822,
"eval_overall_recall": 0.8689458689458689,
"eval_runtime": 0.3487,
"eval_samples_per_second": 536.339,
"eval_steps_per_second": 8.604,
"step": 3286
},
{
"epoch": 32.0,
"grad_norm": 0.2729957103729248,
"learning_rate": 3.4000000000000007e-05,
"loss": 0.0571,
"step": 3392
},
{
"epoch": 32.0,
"eval_LOCATION_f1": 0.8421052631578948,
"eval_LOCATION_number": 73,
"eval_LOCATION_precision": 0.810126582278481,
"eval_LOCATION_recall": 0.8767123287671232,
"eval_ORGANIZATION_f1": 0.6962025316455697,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.5913978494623656,
"eval_ORGANIZATION_recall": 0.8461538461538461,
"eval_PERSON_f1": 0.9120521172638437,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.89171974522293,
"eval_PERSON_recall": 0.9333333333333333,
"eval_QUANTITY_f1": 0.7352941176470588,
"eval_QUANTITY_number": 29,
"eval_QUANTITY_precision": 0.6410256410256411,
"eval_QUANTITY_recall": 0.8620689655172413,
"eval_TIME_f1": 0.7999999999999999,
"eval_TIME_number": 34,
"eval_TIME_precision": 0.7777777777777778,
"eval_TIME_recall": 0.8235294117647058,
"eval_loss": 0.15985752642154694,
"eval_overall_accuracy": 0.9571745015998031,
"eval_overall_f1": 0.8264900662251655,
"eval_overall_precision": 0.7722772277227723,
"eval_overall_recall": 0.8888888888888888,
"eval_runtime": 0.3483,
"eval_samples_per_second": 536.94,
"eval_steps_per_second": 8.614,
"step": 3392
},
{
"epoch": 33.0,
"grad_norm": 1.3724058866500854,
"learning_rate": 3.35e-05,
"loss": 0.0567,
"step": 3498
},
{
"epoch": 33.0,
"eval_LOCATION_f1": 0.8496732026143791,
"eval_LOCATION_number": 73,
"eval_LOCATION_precision": 0.8125,
"eval_LOCATION_recall": 0.8904109589041096,
"eval_ORGANIZATION_f1": 0.7310344827586207,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.6625,
"eval_ORGANIZATION_recall": 0.8153846153846154,
"eval_PERSON_f1": 0.9055374592833875,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.8853503184713376,
"eval_PERSON_recall": 0.9266666666666666,
"eval_QUANTITY_f1": 0.7936507936507937,
"eval_QUANTITY_number": 29,
"eval_QUANTITY_precision": 0.7352941176470589,
"eval_QUANTITY_recall": 0.8620689655172413,
"eval_TIME_f1": 0.8285714285714286,
"eval_TIME_number": 34,
"eval_TIME_precision": 0.8055555555555556,
"eval_TIME_recall": 0.8529411764705882,
"eval_loss": 0.14525863528251648,
"eval_overall_accuracy": 0.9633275904504061,
"eval_overall_f1": 0.8428184281842819,
"eval_overall_precision": 0.8036175710594315,
"eval_overall_recall": 0.886039886039886,
"eval_runtime": 0.3505,
"eval_samples_per_second": 533.595,
"eval_steps_per_second": 8.56,
"step": 3498
},
{
"epoch": 34.0,
"grad_norm": 1.019172191619873,
"learning_rate": 3.3e-05,
"loss": 0.0538,
"step": 3604
},
{
"epoch": 34.0,
"eval_LOCATION_f1": 0.794701986754967,
"eval_LOCATION_number": 73,
"eval_LOCATION_precision": 0.7692307692307693,
"eval_LOCATION_recall": 0.821917808219178,
"eval_ORGANIZATION_f1": 0.7222222222222222,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.6582278481012658,
"eval_ORGANIZATION_recall": 0.8,
"eval_PERSON_f1": 0.8896103896103896,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.8670886075949367,
"eval_PERSON_recall": 0.9133333333333333,
"eval_QUANTITY_f1": 0.8253968253968255,
"eval_QUANTITY_number": 29,
"eval_QUANTITY_precision": 0.7647058823529411,
"eval_QUANTITY_recall": 0.896551724137931,
"eval_TIME_f1": 0.8285714285714286,
"eval_TIME_number": 34,
"eval_TIME_precision": 0.8055555555555556,
"eval_TIME_recall": 0.8529411764705882,
"eval_loss": 0.14389275014400482,
"eval_overall_accuracy": 0.9618508491262614,
"eval_overall_f1": 0.8260869565217391,
"eval_overall_precision": 0.7896103896103897,
"eval_overall_recall": 0.8660968660968661,
"eval_runtime": 0.3478,
"eval_samples_per_second": 537.643,
"eval_steps_per_second": 8.625,
"step": 3604
},
{
"epoch": 35.0,
"grad_norm": 0.2027391493320465,
"learning_rate": 3.2500000000000004e-05,
"loss": 0.055,
"step": 3710
},
{
"epoch": 35.0,
"eval_LOCATION_f1": 0.8051948051948052,
"eval_LOCATION_number": 73,
"eval_LOCATION_precision": 0.7654320987654321,
"eval_LOCATION_recall": 0.8493150684931506,
"eval_ORGANIZATION_f1": 0.7092198581560285,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.6578947368421053,
"eval_ORGANIZATION_recall": 0.7692307692307693,
"eval_PERSON_f1": 0.896103896103896,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.8734177215189873,
"eval_PERSON_recall": 0.92,
"eval_QUANTITY_f1": 0.71875,
"eval_QUANTITY_number": 29,
"eval_QUANTITY_precision": 0.6571428571428571,
"eval_QUANTITY_recall": 0.7931034482758621,
"eval_TIME_f1": 0.7887323943661971,
"eval_TIME_number": 34,
"eval_TIME_precision": 0.7567567567567568,
"eval_TIME_recall": 0.8235294117647058,
"eval_loss": 0.14834968745708466,
"eval_overall_accuracy": 0.9591434900319961,
"eval_overall_f1": 0.8157181571815719,
"eval_overall_precision": 0.7777777777777778,
"eval_overall_recall": 0.8575498575498576,
"eval_runtime": 0.3492,
"eval_samples_per_second": 535.458,
"eval_steps_per_second": 8.59,
"step": 3710
},
{
"epoch": 36.0,
"grad_norm": 1.058028221130371,
"learning_rate": 3.2000000000000005e-05,
"loss": 0.051,
"step": 3816
},
{
"epoch": 36.0,
"eval_LOCATION_f1": 0.8243243243243243,
"eval_LOCATION_number": 73,
"eval_LOCATION_precision": 0.8133333333333334,
"eval_LOCATION_recall": 0.8356164383561644,
"eval_ORGANIZATION_f1": 0.6896551724137931,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.625,
"eval_ORGANIZATION_recall": 0.7692307692307693,
"eval_PERSON_f1": 0.8938906752411575,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.8633540372670807,
"eval_PERSON_recall": 0.9266666666666666,
"eval_QUANTITY_f1": 0.7692307692307692,
"eval_QUANTITY_number": 29,
"eval_QUANTITY_precision": 0.6944444444444444,
"eval_QUANTITY_recall": 0.8620689655172413,
"eval_TIME_f1": 0.8285714285714286,
"eval_TIME_number": 34,
"eval_TIME_precision": 0.8055555555555556,
"eval_TIME_recall": 0.8529411764705882,
"eval_loss": 0.15179765224456787,
"eval_overall_accuracy": 0.9586512429239479,
"eval_overall_f1": 0.8227334235453315,
"eval_overall_precision": 0.7835051546391752,
"eval_overall_recall": 0.8660968660968661,
"eval_runtime": 0.35,
"eval_samples_per_second": 534.248,
"eval_steps_per_second": 8.571,
"step": 3816
},
{
"epoch": 37.0,
"grad_norm": 0.6165934205055237,
"learning_rate": 3.15e-05,
"loss": 0.0525,
"step": 3922
},
{
"epoch": 37.0,
"eval_LOCATION_f1": 0.8211920529801324,
"eval_LOCATION_number": 73,
"eval_LOCATION_precision": 0.7948717948717948,
"eval_LOCATION_recall": 0.8493150684931506,
"eval_ORGANIZATION_f1": 0.7042253521126761,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.6493506493506493,
"eval_ORGANIZATION_recall": 0.7692307692307693,
"eval_PERSON_f1": 0.8990228013029316,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.8789808917197452,
"eval_PERSON_recall": 0.92,
"eval_QUANTITY_f1": 0.75,
"eval_QUANTITY_number": 29,
"eval_QUANTITY_precision": 0.6857142857142857,
"eval_QUANTITY_recall": 0.8275862068965517,
"eval_TIME_f1": 0.7887323943661971,
"eval_TIME_number": 34,
"eval_TIME_precision": 0.7567567567567568,
"eval_TIME_recall": 0.8235294117647058,
"eval_loss": 0.1549917459487915,
"eval_overall_accuracy": 0.9586512429239479,
"eval_overall_f1": 0.8217687074829932,
"eval_overall_precision": 0.7864583333333334,
"eval_overall_recall": 0.8603988603988604,
"eval_runtime": 0.3479,
"eval_samples_per_second": 537.465,
"eval_steps_per_second": 8.622,
"step": 3922
},
{
"epoch": 38.0,
"grad_norm": 0.6908597350120544,
"learning_rate": 3.1e-05,
"loss": 0.0513,
"step": 4028
},
{
"epoch": 38.0,
"eval_LOCATION_f1": 0.8344370860927152,
"eval_LOCATION_number": 73,
"eval_LOCATION_precision": 0.8076923076923077,
"eval_LOCATION_recall": 0.863013698630137,
"eval_ORGANIZATION_f1": 0.7407407407407408,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.7142857142857143,
"eval_ORGANIZATION_recall": 0.7692307692307693,
"eval_PERSON_f1": 0.8925081433224756,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.8726114649681529,
"eval_PERSON_recall": 0.9133333333333333,
"eval_QUANTITY_f1": 0.7575757575757576,
"eval_QUANTITY_number": 29,
"eval_QUANTITY_precision": 0.6756756756756757,
"eval_QUANTITY_recall": 0.8620689655172413,
"eval_TIME_f1": 0.8169014084507041,
"eval_TIME_number": 34,
"eval_TIME_precision": 0.7837837837837838,
"eval_TIME_recall": 0.8529411764705882,
"eval_loss": 0.13987548649311066,
"eval_overall_accuracy": 0.9616047255722373,
"eval_overall_f1": 0.832876712328767,
"eval_overall_precision": 0.8021108179419525,
"eval_overall_recall": 0.8660968660968661,
"eval_runtime": 0.3495,
"eval_samples_per_second": 535.055,
"eval_steps_per_second": 8.584,
"step": 4028
},
{
"epoch": 39.0,
"grad_norm": 0.47891664505004883,
"learning_rate": 3.05e-05,
"loss": 0.0511,
"step": 4134
},
{
"epoch": 39.0,
"eval_LOCATION_f1": 0.8533333333333334,
"eval_LOCATION_number": 73,
"eval_LOCATION_precision": 0.8311688311688312,
"eval_LOCATION_recall": 0.8767123287671232,
"eval_ORGANIZATION_f1": 0.7162162162162162,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.6385542168674698,
"eval_ORGANIZATION_recall": 0.8153846153846154,
"eval_PERSON_f1": 0.896774193548387,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.86875,
"eval_PERSON_recall": 0.9266666666666666,
"eval_QUANTITY_f1": 0.7619047619047619,
"eval_QUANTITY_number": 29,
"eval_QUANTITY_precision": 0.7058823529411765,
"eval_QUANTITY_recall": 0.8275862068965517,
"eval_TIME_f1": 0.8055555555555555,
"eval_TIME_number": 34,
"eval_TIME_precision": 0.7631578947368421,
"eval_TIME_recall": 0.8529411764705882,
"eval_loss": 0.14294342696666718,
"eval_overall_accuracy": 0.9613586020182131,
"eval_overall_f1": 0.8317631224764468,
"eval_overall_precision": 0.7882653061224489,
"eval_overall_recall": 0.8803418803418803,
"eval_runtime": 0.349,
"eval_samples_per_second": 535.775,
"eval_steps_per_second": 8.595,
"step": 4134
},
{
"epoch": 40.0,
"grad_norm": 0.5005225539207458,
"learning_rate": 3e-05,
"loss": 0.0479,
"step": 4240
},
{
"epoch": 40.0,
"eval_LOCATION_f1": 0.8289473684210525,
"eval_LOCATION_number": 73,
"eval_LOCATION_precision": 0.7974683544303798,
"eval_LOCATION_recall": 0.863013698630137,
"eval_ORGANIZATION_f1": 0.6709677419354838,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.5777777777777777,
"eval_ORGANIZATION_recall": 0.8,
"eval_PERSON_f1": 0.9084967320261438,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.8910256410256411,
"eval_PERSON_recall": 0.9266666666666666,
"eval_QUANTITY_f1": 0.716417910447761,
"eval_QUANTITY_number": 29,
"eval_QUANTITY_precision": 0.631578947368421,
"eval_QUANTITY_recall": 0.8275862068965517,
"eval_TIME_f1": 0.7887323943661971,
"eval_TIME_number": 34,
"eval_TIME_precision": 0.7567567567567568,
"eval_TIME_recall": 0.8235294117647058,
"eval_loss": 0.16042561829090118,
"eval_overall_accuracy": 0.9566822544917548,
"eval_overall_f1": 0.8149134487350199,
"eval_overall_precision": 0.765,
"eval_overall_recall": 0.8717948717948718,
"eval_runtime": 0.3494,
"eval_samples_per_second": 535.212,
"eval_steps_per_second": 8.586,
"step": 4240
},
{
"epoch": 41.0,
"grad_norm": 1.4673404693603516,
"learning_rate": 2.95e-05,
"loss": 0.0478,
"step": 4346
},
{
"epoch": 41.0,
"eval_LOCATION_f1": 0.8533333333333334,
"eval_LOCATION_number": 73,
"eval_LOCATION_precision": 0.8311688311688312,
"eval_LOCATION_recall": 0.8767123287671232,
"eval_ORGANIZATION_f1": 0.7132867132867133,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.6538461538461539,
"eval_ORGANIZATION_recall": 0.7846153846153846,
"eval_PERSON_f1": 0.8896103896103896,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.8670886075949367,
"eval_PERSON_recall": 0.9133333333333333,
"eval_QUANTITY_f1": 0.8571428571428571,
"eval_QUANTITY_number": 29,
"eval_QUANTITY_precision": 0.7941176470588235,
"eval_QUANTITY_recall": 0.9310344827586207,
"eval_TIME_f1": 0.8571428571428571,
"eval_TIME_number": 34,
"eval_TIME_precision": 0.8333333333333334,
"eval_TIME_recall": 0.8823529411764706,
"eval_loss": 0.14638105034828186,
"eval_overall_accuracy": 0.9620969726802855,
"eval_overall_f1": 0.8419618528610354,
"eval_overall_precision": 0.8067885117493473,
"eval_overall_recall": 0.8803418803418803,
"eval_runtime": 0.3474,
"eval_samples_per_second": 538.243,
"eval_steps_per_second": 8.635,
"step": 4346
},
{
"epoch": 42.0,
"grad_norm": 0.4796440303325653,
"learning_rate": 2.9e-05,
"loss": 0.0452,
"step": 4452
},
{
"epoch": 42.0,
"eval_LOCATION_f1": 0.8266666666666668,
"eval_LOCATION_number": 73,
"eval_LOCATION_precision": 0.8051948051948052,
"eval_LOCATION_recall": 0.8493150684931506,
"eval_ORGANIZATION_f1": 0.7222222222222222,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.6582278481012658,
"eval_ORGANIZATION_recall": 0.8,
"eval_PERSON_f1": 0.9025974025974027,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.879746835443038,
"eval_PERSON_recall": 0.9266666666666666,
"eval_QUANTITY_f1": 0.7812500000000001,
"eval_QUANTITY_number": 29,
"eval_QUANTITY_precision": 0.7142857142857143,
"eval_QUANTITY_recall": 0.8620689655172413,
"eval_TIME_f1": 0.8169014084507041,
"eval_TIME_number": 34,
"eval_TIME_precision": 0.7837837837837838,
"eval_TIME_recall": 0.8529411764705882,
"eval_loss": 0.14712657034397125,
"eval_overall_accuracy": 0.9616047255722373,
"eval_overall_f1": 0.8331071913161466,
"eval_overall_precision": 0.7953367875647669,
"eval_overall_recall": 0.8746438746438746,
"eval_runtime": 0.3492,
"eval_samples_per_second": 535.483,
"eval_steps_per_second": 8.591,
"step": 4452
},
{
"epoch": 43.0,
"grad_norm": 0.6836230754852295,
"learning_rate": 2.8499999999999998e-05,
"loss": 0.0444,
"step": 4558
},
{
"epoch": 43.0,
"eval_LOCATION_f1": 0.8441558441558442,
"eval_LOCATION_number": 73,
"eval_LOCATION_precision": 0.8024691358024691,
"eval_LOCATION_recall": 0.8904109589041096,
"eval_ORGANIZATION_f1": 0.7428571428571429,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.6933333333333334,
"eval_ORGANIZATION_recall": 0.8,
"eval_PERSON_f1": 0.8918032786885245,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.8774193548387097,
"eval_PERSON_recall": 0.9066666666666666,
"eval_QUANTITY_f1": 0.7812500000000001,
"eval_QUANTITY_number": 29,
"eval_QUANTITY_precision": 0.7142857142857143,
"eval_QUANTITY_recall": 0.8620689655172413,
"eval_TIME_f1": 0.8055555555555555,
"eval_TIME_number": 34,
"eval_TIME_precision": 0.7631578947368421,
"eval_TIME_recall": 0.8529411764705882,
"eval_loss": 0.15814396739006042,
"eval_overall_accuracy": 0.9618508491262614,
"eval_overall_f1": 0.8353741496598639,
"eval_overall_precision": 0.7994791666666666,
"eval_overall_recall": 0.8746438746438746,
"eval_runtime": 0.3485,
"eval_samples_per_second": 536.57,
"eval_steps_per_second": 8.608,
"step": 4558
},
{
"epoch": 44.0,
"grad_norm": 1.3571970462799072,
"learning_rate": 2.8000000000000003e-05,
"loss": 0.0444,
"step": 4664
},
{
"epoch": 44.0,
"eval_LOCATION_f1": 0.8513513513513513,
"eval_LOCATION_number": 73,
"eval_LOCATION_precision": 0.84,
"eval_LOCATION_recall": 0.863013698630137,
"eval_ORGANIZATION_f1": 0.7272727272727272,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.6666666666666666,
"eval_ORGANIZATION_recall": 0.8,
"eval_PERSON_f1": 0.8990228013029316,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.8789808917197452,
"eval_PERSON_recall": 0.92,
"eval_QUANTITY_f1": 0.8253968253968255,
"eval_QUANTITY_number": 29,
"eval_QUANTITY_precision": 0.7647058823529411,
"eval_QUANTITY_recall": 0.896551724137931,
"eval_TIME_f1": 0.8823529411764706,
"eval_TIME_number": 34,
"eval_TIME_precision": 0.8823529411764706,
"eval_TIME_recall": 0.8823529411764706,
"eval_loss": 0.14802251756191254,
"eval_overall_accuracy": 0.9643120846665025,
"eval_overall_f1": 0.8477366255144033,
"eval_overall_precision": 0.8174603174603174,
"eval_overall_recall": 0.8803418803418803,
"eval_runtime": 0.3488,
"eval_samples_per_second": 536.133,
"eval_steps_per_second": 8.601,
"step": 4664
},
{
"epoch": 45.0,
"grad_norm": 1.737742304801941,
"learning_rate": 2.7500000000000004e-05,
"loss": 0.0449,
"step": 4770
},
{
"epoch": 45.0,
"eval_LOCATION_f1": 0.8421052631578948,
"eval_LOCATION_number": 73,
"eval_LOCATION_precision": 0.810126582278481,
"eval_LOCATION_recall": 0.8767123287671232,
"eval_ORGANIZATION_f1": 0.6845637583892618,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.6071428571428571,
"eval_ORGANIZATION_recall": 0.7846153846153846,
"eval_PERSON_f1": 0.8925081433224756,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.8726114649681529,
"eval_PERSON_recall": 0.9133333333333333,
"eval_QUANTITY_f1": 0.7272727272727273,
"eval_QUANTITY_number": 29,
"eval_QUANTITY_precision": 0.6486486486486487,
"eval_QUANTITY_recall": 0.8275862068965517,
"eval_TIME_f1": 0.8695652173913043,
"eval_TIME_number": 34,
"eval_TIME_precision": 0.8571428571428571,
"eval_TIME_recall": 0.8823529411764706,
"eval_loss": 0.1639709323644638,
"eval_overall_accuracy": 0.9584051193699237,
"eval_overall_f1": 0.8236877523553163,
"eval_overall_precision": 0.7806122448979592,
"eval_overall_recall": 0.8717948717948718,
"eval_runtime": 0.3494,
"eval_samples_per_second": 535.143,
"eval_steps_per_second": 8.585,
"step": 4770
},
{
"epoch": 46.0,
"grad_norm": 0.6632001996040344,
"learning_rate": 2.7000000000000002e-05,
"loss": 0.0415,
"step": 4876
},
{
"epoch": 46.0,
"eval_LOCATION_f1": 0.847682119205298,
"eval_LOCATION_number": 73,
"eval_LOCATION_precision": 0.8205128205128205,
"eval_LOCATION_recall": 0.8767123287671232,
"eval_ORGANIZATION_f1": 0.7313432835820897,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.7101449275362319,
"eval_ORGANIZATION_recall": 0.7538461538461538,
"eval_PERSON_f1": 0.8794788273615636,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.8598726114649682,
"eval_PERSON_recall": 0.9,
"eval_QUANTITY_f1": 0.7936507936507937,
"eval_QUANTITY_number": 29,
"eval_QUANTITY_precision": 0.7352941176470589,
"eval_QUANTITY_recall": 0.8620689655172413,
"eval_TIME_f1": 0.8285714285714286,
"eval_TIME_number": 34,
"eval_TIME_precision": 0.8055555555555556,
"eval_TIME_recall": 0.8529411764705882,
"eval_loss": 0.14749835431575775,
"eval_overall_accuracy": 0.9620969726802855,
"eval_overall_f1": 0.833103448275862,
"eval_overall_precision": 0.8074866310160428,
"eval_overall_recall": 0.8603988603988604,
"eval_runtime": 0.3486,
"eval_samples_per_second": 536.455,
"eval_steps_per_second": 8.606,
"step": 4876
},
{
"epoch": 47.0,
"grad_norm": 0.8617376685142517,
"learning_rate": 2.6500000000000004e-05,
"loss": 0.0427,
"step": 4982
},
{
"epoch": 47.0,
"eval_LOCATION_f1": 0.8421052631578948,
"eval_LOCATION_number": 73,
"eval_LOCATION_precision": 0.810126582278481,
"eval_LOCATION_recall": 0.8767123287671232,
"eval_ORGANIZATION_f1": 0.7285714285714285,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.68,
"eval_ORGANIZATION_recall": 0.7846153846153846,
"eval_PERSON_f1": 0.8846153846153846,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.8518518518518519,
"eval_PERSON_recall": 0.92,
"eval_QUANTITY_f1": 0.7812500000000001,
"eval_QUANTITY_number": 29,
"eval_QUANTITY_precision": 0.7142857142857143,
"eval_QUANTITY_recall": 0.8620689655172413,
"eval_TIME_f1": 0.8450704225352113,
"eval_TIME_number": 34,
"eval_TIME_precision": 0.8108108108108109,
"eval_TIME_recall": 0.8823529411764706,
"eval_loss": 0.1591494381427765,
"eval_overall_accuracy": 0.9606202313561408,
"eval_overall_f1": 0.8335588633288227,
"eval_overall_precision": 0.7938144329896907,
"eval_overall_recall": 0.8774928774928775,
"eval_runtime": 0.3508,
"eval_samples_per_second": 533.01,
"eval_steps_per_second": 8.551,
"step": 4982
},
{
"epoch": 48.0,
"grad_norm": 1.4177937507629395,
"learning_rate": 2.6000000000000002e-05,
"loss": 0.0424,
"step": 5088
},
{
"epoch": 48.0,
"eval_LOCATION_f1": 0.8289473684210525,
"eval_LOCATION_number": 73,
"eval_LOCATION_precision": 0.7974683544303798,
"eval_LOCATION_recall": 0.863013698630137,
"eval_ORGANIZATION_f1": 0.7218045112781954,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.7058823529411765,
"eval_ORGANIZATION_recall": 0.7384615384615385,
"eval_PERSON_f1": 0.8903225806451613,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.8625,
"eval_PERSON_recall": 0.92,
"eval_QUANTITY_f1": 0.7936507936507937,
"eval_QUANTITY_number": 29,
"eval_QUANTITY_precision": 0.7352941176470589,
"eval_QUANTITY_recall": 0.8620689655172413,
"eval_TIME_f1": 0.7887323943661971,
"eval_TIME_number": 34,
"eval_TIME_precision": 0.7567567567567568,
"eval_TIME_recall": 0.8235294117647058,
"eval_loss": 0.16404277086257935,
"eval_overall_accuracy": 0.961112478464189,
"eval_overall_f1": 0.8285322359396434,
"eval_overall_precision": 0.798941798941799,
"eval_overall_recall": 0.8603988603988604,
"eval_runtime": 0.3479,
"eval_samples_per_second": 537.567,
"eval_steps_per_second": 8.624,
"step": 5088
},
{
"epoch": 49.0,
"grad_norm": 0.5694997310638428,
"learning_rate": 2.5500000000000003e-05,
"loss": 0.0408,
"step": 5194
},
{
"epoch": 49.0,
"eval_LOCATION_f1": 0.8441558441558442,
"eval_LOCATION_number": 73,
"eval_LOCATION_precision": 0.8024691358024691,
"eval_LOCATION_recall": 0.8904109589041096,
"eval_ORGANIZATION_f1": 0.7313432835820897,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.7101449275362319,
"eval_ORGANIZATION_recall": 0.7538461538461538,
"eval_PERSON_f1": 0.8990228013029316,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.8789808917197452,
"eval_PERSON_recall": 0.92,
"eval_QUANTITY_f1": 0.7575757575757576,
"eval_QUANTITY_number": 29,
"eval_QUANTITY_precision": 0.6756756756756757,
"eval_QUANTITY_recall": 0.8620689655172413,
"eval_TIME_f1": 0.8285714285714286,
"eval_TIME_number": 34,
"eval_TIME_precision": 0.8055555555555556,
"eval_TIME_recall": 0.8529411764705882,
"eval_loss": 0.16149596869945526,
"eval_overall_accuracy": 0.9620969726802855,
"eval_overall_f1": 0.8372093023255812,
"eval_overall_precision": 0.8052631578947368,
"eval_overall_recall": 0.8717948717948718,
"eval_runtime": 0.3491,
"eval_samples_per_second": 535.625,
"eval_steps_per_second": 8.593,
"step": 5194
},
{
"epoch": 50.0,
"grad_norm": 1.3638904094696045,
"learning_rate": 2.5e-05,
"loss": 0.0403,
"step": 5300
},
{
"epoch": 50.0,
"eval_LOCATION_f1": 0.8441558441558442,
"eval_LOCATION_number": 73,
"eval_LOCATION_precision": 0.8024691358024691,
"eval_LOCATION_recall": 0.8904109589041096,
"eval_ORGANIZATION_f1": 0.7142857142857142,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.6666666666666666,
"eval_ORGANIZATION_recall": 0.7692307692307693,
"eval_PERSON_f1": 0.8867313915857605,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.8616352201257862,
"eval_PERSON_recall": 0.9133333333333333,
"eval_QUANTITY_f1": 0.75,
"eval_QUANTITY_number": 29,
"eval_QUANTITY_precision": 0.6857142857142857,
"eval_QUANTITY_recall": 0.8275862068965517,
"eval_TIME_f1": 0.8169014084507041,
"eval_TIME_number": 34,
"eval_TIME_precision": 0.7837837837837838,
"eval_TIME_recall": 0.8529411764705882,
"eval_loss": 0.1615622639656067,
"eval_overall_accuracy": 0.9598818606940684,
"eval_overall_f1": 0.8265582655826558,
"eval_overall_precision": 0.7881136950904393,
"eval_overall_recall": 0.8689458689458689,
"eval_runtime": 0.3494,
"eval_samples_per_second": 535.228,
"eval_steps_per_second": 8.587,
"step": 5300
},
{
"epoch": 51.0,
"grad_norm": 0.6612288951873779,
"learning_rate": 2.45e-05,
"loss": 0.0374,
"step": 5406
},
{
"epoch": 51.0,
"eval_LOCATION_f1": 0.8441558441558442,
"eval_LOCATION_number": 73,
"eval_LOCATION_precision": 0.8024691358024691,
"eval_LOCATION_recall": 0.8904109589041096,
"eval_ORGANIZATION_f1": 0.7424242424242424,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.7313432835820896,
"eval_ORGANIZATION_recall": 0.7538461538461538,
"eval_PERSON_f1": 0.8774193548387097,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.85,
"eval_PERSON_recall": 0.9066666666666666,
"eval_QUANTITY_f1": 0.7812500000000001,
"eval_QUANTITY_number": 29,
"eval_QUANTITY_precision": 0.7142857142857143,
"eval_QUANTITY_recall": 0.8620689655172413,
"eval_TIME_f1": 0.8695652173913043,
"eval_TIME_number": 34,
"eval_TIME_precision": 0.8571428571428571,
"eval_TIME_recall": 0.8823529411764706,
"eval_loss": 0.16601917147636414,
"eval_overall_accuracy": 0.9628353433423579,
"eval_overall_f1": 0.8367626886145405,
"eval_overall_precision": 0.8068783068783069,
"eval_overall_recall": 0.8689458689458689,
"eval_runtime": 0.3497,
"eval_samples_per_second": 534.82,
"eval_steps_per_second": 8.58,
"step": 5406
},
{
"epoch": 52.0,
"grad_norm": 1.5069667100906372,
"learning_rate": 2.4e-05,
"loss": 0.0382,
"step": 5512
},
{
"epoch": 52.0,
"eval_LOCATION_f1": 0.8211920529801324,
"eval_LOCATION_number": 73,
"eval_LOCATION_precision": 0.7948717948717948,
"eval_LOCATION_recall": 0.8493150684931506,
"eval_ORGANIZATION_f1": 0.7152317880794703,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.627906976744186,
"eval_ORGANIZATION_recall": 0.8307692307692308,
"eval_PERSON_f1": 0.8896103896103896,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.8670886075949367,
"eval_PERSON_recall": 0.9133333333333333,
"eval_QUANTITY_f1": 0.7936507936507937,
"eval_QUANTITY_number": 29,
"eval_QUANTITY_precision": 0.7352941176470589,
"eval_QUANTITY_recall": 0.8620689655172413,
"eval_TIME_f1": 0.7777777777777778,
"eval_TIME_number": 34,
"eval_TIME_precision": 0.7368421052631579,
"eval_TIME_recall": 0.8235294117647058,
"eval_loss": 0.17699261009693146,
"eval_overall_accuracy": 0.9576667487078513,
"eval_overall_f1": 0.8214765100671142,
"eval_overall_precision": 0.7766497461928934,
"eval_overall_recall": 0.8717948717948718,
"eval_runtime": 0.3471,
"eval_samples_per_second": 538.682,
"eval_steps_per_second": 8.642,
"step": 5512
},
{
"epoch": 53.0,
"grad_norm": 1.0662306547164917,
"learning_rate": 2.35e-05,
"loss": 0.038,
"step": 5618
},
{
"epoch": 53.0,
"eval_LOCATION_f1": 0.846153846153846,
"eval_LOCATION_number": 73,
"eval_LOCATION_precision": 0.7951807228915663,
"eval_LOCATION_recall": 0.9041095890410958,
"eval_ORGANIZATION_f1": 0.7391304347826088,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.6986301369863014,
"eval_ORGANIZATION_recall": 0.7846153846153846,
"eval_PERSON_f1": 0.887459807073955,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.8571428571428571,
"eval_PERSON_recall": 0.92,
"eval_QUANTITY_f1": 0.7812500000000001,
"eval_QUANTITY_number": 29,
"eval_QUANTITY_precision": 0.7142857142857143,
"eval_QUANTITY_recall": 0.8620689655172413,
"eval_TIME_f1": 0.7999999999999999,
"eval_TIME_number": 34,
"eval_TIME_precision": 0.7777777777777778,
"eval_TIME_recall": 0.8235294117647058,
"eval_loss": 0.17185063660144806,
"eval_overall_accuracy": 0.9596357371400444,
"eval_overall_f1": 0.8335588633288227,
"eval_overall_precision": 0.7938144329896907,
"eval_overall_recall": 0.8774928774928775,
"eval_runtime": 0.3507,
"eval_samples_per_second": 533.285,
"eval_steps_per_second": 8.555,
"step": 5618
},
{
"epoch": 54.0,
"grad_norm": 0.5915600061416626,
"learning_rate": 2.3000000000000003e-05,
"loss": 0.0362,
"step": 5724
},
{
"epoch": 54.0,
"eval_LOCATION_f1": 0.8366013071895425,
"eval_LOCATION_number": 73,
"eval_LOCATION_precision": 0.8,
"eval_LOCATION_recall": 0.8767123287671232,
"eval_ORGANIZATION_f1": 0.7183098591549296,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.6623376623376623,
"eval_ORGANIZATION_recall": 0.7846153846153846,
"eval_PERSON_f1": 0.8802588996763754,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.8553459119496856,
"eval_PERSON_recall": 0.9066666666666666,
"eval_QUANTITY_f1": 0.8387096774193549,
"eval_QUANTITY_number": 29,
"eval_QUANTITY_precision": 0.7878787878787878,
"eval_QUANTITY_recall": 0.896551724137931,
"eval_TIME_f1": 0.8571428571428571,
"eval_TIME_number": 34,
"eval_TIME_precision": 0.8333333333333334,
"eval_TIME_recall": 0.8823529411764706,
"eval_loss": 0.1768696904182434,
"eval_overall_accuracy": 0.958897366477972,
"eval_overall_f1": 0.8342391304347826,
"eval_overall_precision": 0.7974025974025974,
"eval_overall_recall": 0.8746438746438746,
"eval_runtime": 0.3484,
"eval_samples_per_second": 536.69,
"eval_steps_per_second": 8.61,
"step": 5724
},
{
"epoch": 55.0,
"grad_norm": 0.5453677773475647,
"learning_rate": 2.25e-05,
"loss": 0.034,
"step": 5830
},
{
"epoch": 55.0,
"eval_LOCATION_f1": 0.8311688311688312,
"eval_LOCATION_number": 73,
"eval_LOCATION_precision": 0.7901234567901234,
"eval_LOCATION_recall": 0.8767123287671232,
"eval_ORGANIZATION_f1": 0.7285714285714285,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.68,
"eval_ORGANIZATION_recall": 0.7846153846153846,
"eval_PERSON_f1": 0.8888888888888887,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.8717948717948718,
"eval_PERSON_recall": 0.9066666666666666,
"eval_QUANTITY_f1": 0.8571428571428571,
"eval_QUANTITY_number": 29,
"eval_QUANTITY_precision": 0.7941176470588235,
"eval_QUANTITY_recall": 0.9310344827586207,
"eval_TIME_f1": 0.8571428571428571,
"eval_TIME_number": 34,
"eval_TIME_precision": 0.8333333333333334,
"eval_TIME_recall": 0.8823529411764706,
"eval_loss": 0.16523310542106628,
"eval_overall_accuracy": 0.9616047255722373,
"eval_overall_f1": 0.840381991814461,
"eval_overall_precision": 0.806282722513089,
"eval_overall_recall": 0.8774928774928775,
"eval_runtime": 0.3497,
"eval_samples_per_second": 534.694,
"eval_steps_per_second": 8.578,
"step": 5830
},
{
"epoch": 56.0,
"grad_norm": 1.1855400800704956,
"learning_rate": 2.2000000000000003e-05,
"loss": 0.033,
"step": 5936
},
{
"epoch": 56.0,
"eval_LOCATION_f1": 0.8344370860927152,
"eval_LOCATION_number": 73,
"eval_LOCATION_precision": 0.8076923076923077,
"eval_LOCATION_recall": 0.863013698630137,
"eval_ORGANIZATION_f1": 0.7480916030534351,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.7424242424242424,
"eval_ORGANIZATION_recall": 0.7538461538461538,
"eval_PERSON_f1": 0.8838709677419355,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.85625,
"eval_PERSON_recall": 0.9133333333333333,
"eval_QUANTITY_f1": 0.7936507936507937,
"eval_QUANTITY_number": 29,
"eval_QUANTITY_precision": 0.7352941176470589,
"eval_QUANTITY_recall": 0.8620689655172413,
"eval_TIME_f1": 0.8450704225352113,
"eval_TIME_number": 34,
"eval_TIME_precision": 0.8108108108108109,
"eval_TIME_recall": 0.8823529411764706,
"eval_loss": 0.16871850192546844,
"eval_overall_accuracy": 0.9623430962343096,
"eval_overall_f1": 0.837465564738292,
"eval_overall_precision": 0.8106666666666666,
"eval_overall_recall": 0.8660968660968661,
"eval_runtime": 0.3502,
"eval_samples_per_second": 534.014,
"eval_steps_per_second": 8.567,
"step": 5936
},
{
"epoch": 57.0,
"grad_norm": 0.6215670704841614,
"learning_rate": 2.15e-05,
"loss": 0.0357,
"step": 6042
},
{
"epoch": 57.0,
"eval_LOCATION_f1": 0.8456375838926175,
"eval_LOCATION_number": 73,
"eval_LOCATION_precision": 0.8289473684210527,
"eval_LOCATION_recall": 0.863013698630137,
"eval_ORGANIZATION_f1": 0.7619047619047619,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.7868852459016393,
"eval_ORGANIZATION_recall": 0.7384615384615385,
"eval_PERSON_f1": 0.8831168831168831,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.8607594936708861,
"eval_PERSON_recall": 0.9066666666666666,
"eval_QUANTITY_f1": 0.8125,
"eval_QUANTITY_number": 29,
"eval_QUANTITY_precision": 0.7428571428571429,
"eval_QUANTITY_recall": 0.896551724137931,
"eval_TIME_f1": 0.8169014084507041,
"eval_TIME_number": 34,
"eval_TIME_precision": 0.7837837837837838,
"eval_TIME_recall": 0.8529411764705882,
"eval_loss": 0.16778957843780518,
"eval_overall_accuracy": 0.9618508491262614,
"eval_overall_f1": 0.841225626740947,
"eval_overall_precision": 0.8228882833787466,
"eval_overall_recall": 0.8603988603988604,
"eval_runtime": 0.3498,
"eval_samples_per_second": 534.631,
"eval_steps_per_second": 8.577,
"step": 6042
},
{
"epoch": 58.0,
"grad_norm": 0.38038042187690735,
"learning_rate": 2.1e-05,
"loss": 0.0341,
"step": 6148
},
{
"epoch": 58.0,
"eval_LOCATION_f1": 0.8533333333333334,
"eval_LOCATION_number": 73,
"eval_LOCATION_precision": 0.8311688311688312,
"eval_LOCATION_recall": 0.8767123287671232,
"eval_ORGANIZATION_f1": 0.7258064516129032,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.7627118644067796,
"eval_ORGANIZATION_recall": 0.6923076923076923,
"eval_PERSON_f1": 0.8823529411764707,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.8653846153846154,
"eval_PERSON_recall": 0.9,
"eval_QUANTITY_f1": 0.8253968253968255,
"eval_QUANTITY_number": 29,
"eval_QUANTITY_precision": 0.7647058823529411,
"eval_QUANTITY_recall": 0.896551724137931,
"eval_TIME_f1": 0.7999999999999999,
"eval_TIME_number": 34,
"eval_TIME_precision": 0.7777777777777778,
"eval_TIME_recall": 0.8235294117647058,
"eval_loss": 0.16733954846858978,
"eval_overall_accuracy": 0.961112478464189,
"eval_overall_f1": 0.8359046283309959,
"eval_overall_precision": 0.8232044198895028,
"eval_overall_recall": 0.8490028490028491,
"eval_runtime": 0.3504,
"eval_samples_per_second": 533.675,
"eval_steps_per_second": 8.562,
"step": 6148
},
{
"epoch": 59.0,
"grad_norm": 0.5302915573120117,
"learning_rate": 2.05e-05,
"loss": 0.0324,
"step": 6254
},
{
"epoch": 59.0,
"eval_LOCATION_f1": 0.8366013071895425,
"eval_LOCATION_number": 73,
"eval_LOCATION_precision": 0.8,
"eval_LOCATION_recall": 0.8767123287671232,
"eval_ORGANIZATION_f1": 0.7375886524822695,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.6842105263157895,
"eval_ORGANIZATION_recall": 0.8,
"eval_PERSON_f1": 0.8925081433224756,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.8726114649681529,
"eval_PERSON_recall": 0.9133333333333333,
"eval_QUANTITY_f1": 0.7741935483870968,
"eval_QUANTITY_number": 29,
"eval_QUANTITY_precision": 0.7272727272727273,
"eval_QUANTITY_recall": 0.8275862068965517,
"eval_TIME_f1": 0.8285714285714286,
"eval_TIME_number": 34,
"eval_TIME_precision": 0.8055555555555556,
"eval_TIME_recall": 0.8529411764705882,
"eval_loss": 0.17023777961730957,
"eval_overall_accuracy": 0.9633275904504061,
"eval_overall_f1": 0.834924965893588,
"eval_overall_precision": 0.8010471204188482,
"eval_overall_recall": 0.8717948717948718,
"eval_runtime": 0.3498,
"eval_samples_per_second": 534.593,
"eval_steps_per_second": 8.576,
"step": 6254
},
{
"epoch": 60.0,
"grad_norm": 1.338559627532959,
"learning_rate": 2e-05,
"loss": 0.0333,
"step": 6360
},
{
"epoch": 60.0,
"eval_LOCATION_f1": 0.8609271523178808,
"eval_LOCATION_number": 73,
"eval_LOCATION_precision": 0.8333333333333334,
"eval_LOCATION_recall": 0.8904109589041096,
"eval_ORGANIZATION_f1": 0.7368421052631577,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.7205882352941176,
"eval_ORGANIZATION_recall": 0.7538461538461538,
"eval_PERSON_f1": 0.9013157894736842,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.8896103896103896,
"eval_PERSON_recall": 0.9133333333333333,
"eval_QUANTITY_f1": 0.8064516129032258,
"eval_QUANTITY_number": 29,
"eval_QUANTITY_precision": 0.7575757575757576,
"eval_QUANTITY_recall": 0.8620689655172413,
"eval_TIME_f1": 0.8571428571428571,
"eval_TIME_number": 34,
"eval_TIME_precision": 0.8333333333333334,
"eval_TIME_recall": 0.8823529411764706,
"eval_loss": 0.16547058522701263,
"eval_overall_accuracy": 0.9657888259906473,
"eval_overall_f1": 0.8500000000000001,
"eval_overall_precision": 0.8292682926829268,
"eval_overall_recall": 0.8717948717948718,
"eval_runtime": 0.3501,
"eval_samples_per_second": 534.07,
"eval_steps_per_second": 8.568,
"step": 6360
},
{
"epoch": 61.0,
"grad_norm": 0.4147072434425354,
"learning_rate": 1.9500000000000003e-05,
"loss": 0.0327,
"step": 6466
},
{
"epoch": 61.0,
"eval_LOCATION_f1": 0.8400000000000001,
"eval_LOCATION_number": 73,
"eval_LOCATION_precision": 0.8181818181818182,
"eval_LOCATION_recall": 0.863013698630137,
"eval_ORGANIZATION_f1": 0.7428571428571429,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.6933333333333334,
"eval_ORGANIZATION_recall": 0.8,
"eval_PERSON_f1": 0.8817891373801918,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.8466257668711656,
"eval_PERSON_recall": 0.92,
"eval_QUANTITY_f1": 0.75,
"eval_QUANTITY_number": 29,
"eval_QUANTITY_precision": 0.6857142857142857,
"eval_QUANTITY_recall": 0.8275862068965517,
"eval_TIME_f1": 0.8695652173913043,
"eval_TIME_number": 34,
"eval_TIME_precision": 0.8571428571428571,
"eval_TIME_recall": 0.8823529411764706,
"eval_loss": 0.17973226308822632,
"eval_overall_accuracy": 0.9608663549101649,
"eval_overall_f1": 0.8342391304347826,
"eval_overall_precision": 0.7974025974025974,
"eval_overall_recall": 0.8746438746438746,
"eval_runtime": 0.3496,
"eval_samples_per_second": 534.945,
"eval_steps_per_second": 8.582,
"step": 6466
},
{
"epoch": 62.0,
"grad_norm": 0.6705744862556458,
"learning_rate": 1.9e-05,
"loss": 0.0315,
"step": 6572
},
{
"epoch": 62.0,
"eval_LOCATION_f1": 0.8421052631578948,
"eval_LOCATION_number": 73,
"eval_LOCATION_precision": 0.810126582278481,
"eval_LOCATION_recall": 0.8767123287671232,
"eval_ORGANIZATION_f1": 0.7352941176470589,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.704225352112676,
"eval_ORGANIZATION_recall": 0.7692307692307693,
"eval_PERSON_f1": 0.8802588996763754,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.8553459119496856,
"eval_PERSON_recall": 0.9066666666666666,
"eval_QUANTITY_f1": 0.7936507936507937,
"eval_QUANTITY_number": 29,
"eval_QUANTITY_precision": 0.7352941176470589,
"eval_QUANTITY_recall": 0.8620689655172413,
"eval_TIME_f1": 0.7999999999999999,
"eval_TIME_number": 34,
"eval_TIME_precision": 0.7777777777777778,
"eval_TIME_recall": 0.8235294117647058,
"eval_loss": 0.1808030903339386,
"eval_overall_accuracy": 0.9601279842480925,
"eval_overall_f1": 0.8301369863013699,
"eval_overall_precision": 0.7994722955145118,
"eval_overall_recall": 0.8632478632478633,
"eval_runtime": 0.3485,
"eval_samples_per_second": 536.545,
"eval_steps_per_second": 8.608,
"step": 6572
},
{
"epoch": 63.0,
"grad_norm": 0.7228378653526306,
"learning_rate": 1.85e-05,
"loss": 0.0295,
"step": 6678
},
{
"epoch": 63.0,
"eval_LOCATION_f1": 0.8571428571428571,
"eval_LOCATION_number": 73,
"eval_LOCATION_precision": 0.8148148148148148,
"eval_LOCATION_recall": 0.9041095890410958,
"eval_ORGANIZATION_f1": 0.7153284671532848,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.6805555555555556,
"eval_ORGANIZATION_recall": 0.7538461538461538,
"eval_PERSON_f1": 0.8903225806451613,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.8625,
"eval_PERSON_recall": 0.92,
"eval_QUANTITY_f1": 0.8709677419354839,
"eval_QUANTITY_number": 29,
"eval_QUANTITY_precision": 0.8181818181818182,
"eval_QUANTITY_recall": 0.9310344827586207,
"eval_TIME_f1": 0.8571428571428571,
"eval_TIME_number": 34,
"eval_TIME_precision": 0.8333333333333334,
"eval_TIME_recall": 0.8823529411764706,
"eval_loss": 0.17379428446292877,
"eval_overall_accuracy": 0.9625892197883338,
"eval_overall_f1": 0.8458390177353343,
"eval_overall_precision": 0.8115183246073299,
"eval_overall_recall": 0.8831908831908832,
"eval_runtime": 0.3488,
"eval_samples_per_second": 536.14,
"eval_steps_per_second": 8.601,
"step": 6678
},
{
"epoch": 64.0,
"grad_norm": 0.5657730102539062,
"learning_rate": 1.8e-05,
"loss": 0.0296,
"step": 6784
},
{
"epoch": 64.0,
"eval_LOCATION_f1": 0.8366013071895425,
"eval_LOCATION_number": 73,
"eval_LOCATION_precision": 0.8,
"eval_LOCATION_recall": 0.8767123287671232,
"eval_ORGANIZATION_f1": 0.7424242424242424,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.7313432835820896,
"eval_ORGANIZATION_recall": 0.7538461538461538,
"eval_PERSON_f1": 0.887459807073955,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.8571428571428571,
"eval_PERSON_recall": 0.92,
"eval_QUANTITY_f1": 0.8571428571428571,
"eval_QUANTITY_number": 29,
"eval_QUANTITY_precision": 0.7941176470588235,
"eval_QUANTITY_recall": 0.9310344827586207,
"eval_TIME_f1": 0.8571428571428571,
"eval_TIME_number": 34,
"eval_TIME_precision": 0.8333333333333334,
"eval_TIME_recall": 0.8823529411764706,
"eval_loss": 0.1676260232925415,
"eval_overall_accuracy": 0.963081466896382,
"eval_overall_f1": 0.8449931412894376,
"eval_overall_precision": 0.8148148148148148,
"eval_overall_recall": 0.8774928774928775,
"eval_runtime": 0.3485,
"eval_samples_per_second": 536.562,
"eval_steps_per_second": 8.608,
"step": 6784
},
{
"epoch": 65.0,
"grad_norm": 0.8568927645683289,
"learning_rate": 1.75e-05,
"loss": 0.0297,
"step": 6890
},
{
"epoch": 65.0,
"eval_LOCATION_f1": 0.8533333333333334,
"eval_LOCATION_number": 73,
"eval_LOCATION_precision": 0.8311688311688312,
"eval_LOCATION_recall": 0.8767123287671232,
"eval_ORGANIZATION_f1": 0.75,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.7183098591549296,
"eval_ORGANIZATION_recall": 0.7846153846153846,
"eval_PERSON_f1": 0.8786885245901639,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.864516129032258,
"eval_PERSON_recall": 0.8933333333333333,
"eval_QUANTITY_f1": 0.7936507936507937,
"eval_QUANTITY_number": 29,
"eval_QUANTITY_precision": 0.7352941176470589,
"eval_QUANTITY_recall": 0.8620689655172413,
"eval_TIME_f1": 0.8115942028985507,
"eval_TIME_number": 34,
"eval_TIME_precision": 0.8,
"eval_TIME_recall": 0.8235294117647058,
"eval_loss": 0.1690235435962677,
"eval_overall_accuracy": 0.9620969726802855,
"eval_overall_f1": 0.8354080221300137,
"eval_overall_precision": 0.8118279569892473,
"eval_overall_recall": 0.8603988603988604,
"eval_runtime": 0.3507,
"eval_samples_per_second": 533.268,
"eval_steps_per_second": 8.555,
"step": 6890
},
{
"epoch": 66.0,
"grad_norm": 0.7192606329917908,
"learning_rate": 1.7000000000000003e-05,
"loss": 0.028,
"step": 6996
},
{
"epoch": 66.0,
"eval_LOCATION_f1": 0.8235294117647058,
"eval_LOCATION_number": 73,
"eval_LOCATION_precision": 0.7875,
"eval_LOCATION_recall": 0.863013698630137,
"eval_ORGANIZATION_f1": 0.7575757575757576,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.746268656716418,
"eval_ORGANIZATION_recall": 0.7692307692307693,
"eval_PERSON_f1": 0.8932038834951457,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.8679245283018868,
"eval_PERSON_recall": 0.92,
"eval_QUANTITY_f1": 0.8709677419354839,
"eval_QUANTITY_number": 29,
"eval_QUANTITY_precision": 0.8181818181818182,
"eval_QUANTITY_recall": 0.9310344827586207,
"eval_TIME_f1": 0.8571428571428571,
"eval_TIME_number": 34,
"eval_TIME_precision": 0.8333333333333334,
"eval_TIME_recall": 0.8823529411764706,
"eval_loss": 0.17469918727874756,
"eval_overall_accuracy": 0.9648043317745508,
"eval_overall_f1": 0.8484848484848485,
"eval_overall_precision": 0.8213333333333334,
"eval_overall_recall": 0.8774928774928775,
"eval_runtime": 0.3489,
"eval_samples_per_second": 535.899,
"eval_steps_per_second": 8.597,
"step": 6996
},
{
"epoch": 67.0,
"grad_norm": 0.2507493793964386,
"learning_rate": 1.65e-05,
"loss": 0.0278,
"step": 7102
},
{
"epoch": 67.0,
"eval_LOCATION_f1": 0.8400000000000001,
"eval_LOCATION_number": 73,
"eval_LOCATION_precision": 0.8181818181818182,
"eval_LOCATION_recall": 0.863013698630137,
"eval_ORGANIZATION_f1": 0.7391304347826088,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.6986301369863014,
"eval_ORGANIZATION_recall": 0.7846153846153846,
"eval_PERSON_f1": 0.8786885245901639,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.864516129032258,
"eval_PERSON_recall": 0.8933333333333333,
"eval_QUANTITY_f1": 0.8387096774193549,
"eval_QUANTITY_number": 29,
"eval_QUANTITY_precision": 0.7878787878787878,
"eval_QUANTITY_recall": 0.896551724137931,
"eval_TIME_f1": 0.8571428571428571,
"eval_TIME_number": 34,
"eval_TIME_precision": 0.8333333333333334,
"eval_TIME_recall": 0.8823529411764706,
"eval_loss": 0.17670658230781555,
"eval_overall_accuracy": 0.9616047255722373,
"eval_overall_f1": 0.8386206896551723,
"eval_overall_precision": 0.8128342245989305,
"eval_overall_recall": 0.8660968660968661,
"eval_runtime": 0.3485,
"eval_samples_per_second": 536.521,
"eval_steps_per_second": 8.607,
"step": 7102
},
{
"epoch": 68.0,
"grad_norm": 0.48297932744026184,
"learning_rate": 1.6000000000000003e-05,
"loss": 0.0292,
"step": 7208
},
{
"epoch": 68.0,
"eval_LOCATION_f1": 0.8235294117647058,
"eval_LOCATION_number": 73,
"eval_LOCATION_precision": 0.7875,
"eval_LOCATION_recall": 0.863013698630137,
"eval_ORGANIZATION_f1": 0.7246376811594203,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.684931506849315,
"eval_ORGANIZATION_recall": 0.7692307692307693,
"eval_PERSON_f1": 0.9042904290429042,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.8954248366013072,
"eval_PERSON_recall": 0.9133333333333333,
"eval_QUANTITY_f1": 0.8253968253968255,
"eval_QUANTITY_number": 29,
"eval_QUANTITY_precision": 0.7647058823529411,
"eval_QUANTITY_recall": 0.896551724137931,
"eval_TIME_f1": 0.8169014084507041,
"eval_TIME_number": 34,
"eval_TIME_precision": 0.7837837837837838,
"eval_TIME_recall": 0.8529411764705882,
"eval_loss": 0.18086454272270203,
"eval_overall_accuracy": 0.9625892197883338,
"eval_overall_f1": 0.8379120879120879,
"eval_overall_precision": 0.8090185676392573,
"eval_overall_recall": 0.8689458689458689,
"eval_runtime": 0.3491,
"eval_samples_per_second": 535.689,
"eval_steps_per_second": 8.594,
"step": 7208
},
{
"epoch": 69.0,
"grad_norm": 0.1779003143310547,
"learning_rate": 1.55e-05,
"loss": 0.0264,
"step": 7314
},
{
"epoch": 69.0,
"eval_LOCATION_f1": 0.8496732026143791,
"eval_LOCATION_number": 73,
"eval_LOCATION_precision": 0.8125,
"eval_LOCATION_recall": 0.8904109589041096,
"eval_ORGANIZATION_f1": 0.7092198581560285,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.6578947368421053,
"eval_ORGANIZATION_recall": 0.7692307692307693,
"eval_PERSON_f1": 0.8954248366013071,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.8782051282051282,
"eval_PERSON_recall": 0.9133333333333333,
"eval_QUANTITY_f1": 0.8709677419354839,
"eval_QUANTITY_number": 29,
"eval_QUANTITY_precision": 0.8181818181818182,
"eval_QUANTITY_recall": 0.9310344827586207,
"eval_TIME_f1": 0.8571428571428571,
"eval_TIME_number": 34,
"eval_TIME_precision": 0.8333333333333334,
"eval_TIME_recall": 0.8823529411764706,
"eval_loss": 0.17253029346466064,
"eval_overall_accuracy": 0.9640659611124784,
"eval_overall_f1": 0.8442622950819673,
"eval_overall_precision": 0.8110236220472441,
"eval_overall_recall": 0.8803418803418803,
"eval_runtime": 0.3497,
"eval_samples_per_second": 534.704,
"eval_steps_per_second": 8.578,
"step": 7314
},
{
"epoch": 70.0,
"grad_norm": 0.405724436044693,
"learning_rate": 1.5e-05,
"loss": 0.0259,
"step": 7420
},
{
"epoch": 70.0,
"eval_LOCATION_f1": 0.855263157894737,
"eval_LOCATION_number": 73,
"eval_LOCATION_precision": 0.8227848101265823,
"eval_LOCATION_recall": 0.8904109589041096,
"eval_ORGANIZATION_f1": 0.7445255474452555,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.7083333333333334,
"eval_ORGANIZATION_recall": 0.7846153846153846,
"eval_PERSON_f1": 0.8954248366013071,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.8782051282051282,
"eval_PERSON_recall": 0.9133333333333333,
"eval_QUANTITY_f1": 0.7812500000000001,
"eval_QUANTITY_number": 29,
"eval_QUANTITY_precision": 0.7142857142857143,
"eval_QUANTITY_recall": 0.8620689655172413,
"eval_TIME_f1": 0.8571428571428571,
"eval_TIME_number": 34,
"eval_TIME_precision": 0.8333333333333334,
"eval_TIME_recall": 0.8823529411764706,
"eval_loss": 0.17524121701717377,
"eval_overall_accuracy": 0.9638198375584544,
"eval_overall_f1": 0.8449931412894376,
"eval_overall_precision": 0.8148148148148148,
"eval_overall_recall": 0.8774928774928775,
"eval_runtime": 0.3487,
"eval_samples_per_second": 536.201,
"eval_steps_per_second": 8.602,
"step": 7420
},
{
"epoch": 71.0,
"grad_norm": 1.9814850091934204,
"learning_rate": 1.45e-05,
"loss": 0.0274,
"step": 7526
},
{
"epoch": 71.0,
"eval_LOCATION_f1": 0.855263157894737,
"eval_LOCATION_number": 73,
"eval_LOCATION_precision": 0.8227848101265823,
"eval_LOCATION_recall": 0.8904109589041096,
"eval_ORGANIZATION_f1": 0.7445255474452555,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.7083333333333334,
"eval_ORGANIZATION_recall": 0.7846153846153846,
"eval_PERSON_f1": 0.8810289389067525,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.8509316770186336,
"eval_PERSON_recall": 0.9133333333333333,
"eval_QUANTITY_f1": 0.8125,
"eval_QUANTITY_number": 29,
"eval_QUANTITY_precision": 0.7428571428571429,
"eval_QUANTITY_recall": 0.896551724137931,
"eval_TIME_f1": 0.8285714285714286,
"eval_TIME_number": 34,
"eval_TIME_precision": 0.8055555555555556,
"eval_TIME_recall": 0.8529411764705882,
"eval_loss": 0.19072633981704712,
"eval_overall_accuracy": 0.961112478464189,
"eval_overall_f1": 0.8392370572207084,
"eval_overall_precision": 0.804177545691906,
"eval_overall_recall": 0.8774928774928775,
"eval_runtime": 0.349,
"eval_samples_per_second": 535.864,
"eval_steps_per_second": 8.597,
"step": 7526
},
{
"epoch": 72.0,
"grad_norm": 0.3593089282512665,
"learning_rate": 1.4000000000000001e-05,
"loss": 0.0273,
"step": 7632
},
{
"epoch": 72.0,
"eval_LOCATION_f1": 0.8496732026143791,
"eval_LOCATION_number": 73,
"eval_LOCATION_precision": 0.8125,
"eval_LOCATION_recall": 0.8904109589041096,
"eval_ORGANIZATION_f1": 0.7518796992481205,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.7352941176470589,
"eval_ORGANIZATION_recall": 0.7692307692307693,
"eval_PERSON_f1": 0.8737864077669903,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.8490566037735849,
"eval_PERSON_recall": 0.9,
"eval_QUANTITY_f1": 0.8253968253968255,
"eval_QUANTITY_number": 29,
"eval_QUANTITY_precision": 0.7647058823529411,
"eval_QUANTITY_recall": 0.896551724137931,
"eval_TIME_f1": 0.7777777777777778,
"eval_TIME_number": 34,
"eval_TIME_precision": 0.7368421052631579,
"eval_TIME_recall": 0.8235294117647058,
"eval_loss": 0.1915425956249237,
"eval_overall_accuracy": 0.9598818606940684,
"eval_overall_f1": 0.832876712328767,
"eval_overall_precision": 0.8021108179419525,
"eval_overall_recall": 0.8660968660968661,
"eval_runtime": 0.3484,
"eval_samples_per_second": 536.761,
"eval_steps_per_second": 8.611,
"step": 7632
},
{
"epoch": 73.0,
"grad_norm": 0.8845640420913696,
"learning_rate": 1.3500000000000001e-05,
"loss": 0.0279,
"step": 7738
},
{
"epoch": 73.0,
"eval_LOCATION_f1": 0.8289473684210525,
"eval_LOCATION_number": 73,
"eval_LOCATION_precision": 0.7974683544303798,
"eval_LOCATION_recall": 0.863013698630137,
"eval_ORGANIZATION_f1": 0.7323943661971831,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.6753246753246753,
"eval_ORGANIZATION_recall": 0.8,
"eval_PERSON_f1": 0.8802588996763754,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.8553459119496856,
"eval_PERSON_recall": 0.9066666666666666,
"eval_QUANTITY_f1": 0.8571428571428571,
"eval_QUANTITY_number": 29,
"eval_QUANTITY_precision": 0.7941176470588235,
"eval_QUANTITY_recall": 0.9310344827586207,
"eval_TIME_f1": 0.7999999999999999,
"eval_TIME_number": 34,
"eval_TIME_precision": 0.7777777777777778,
"eval_TIME_recall": 0.8235294117647058,
"eval_loss": 0.1847066581249237,
"eval_overall_accuracy": 0.9613586020182131,
"eval_overall_f1": 0.8315217391304348,
"eval_overall_precision": 0.7948051948051948,
"eval_overall_recall": 0.8717948717948718,
"eval_runtime": 0.3502,
"eval_samples_per_second": 534.048,
"eval_steps_per_second": 8.568,
"step": 7738
},
{
"epoch": 74.0,
"grad_norm": 0.45966747403144836,
"learning_rate": 1.3000000000000001e-05,
"loss": 0.0267,
"step": 7844
},
{
"epoch": 74.0,
"eval_LOCATION_f1": 0.8421052631578948,
"eval_LOCATION_number": 73,
"eval_LOCATION_precision": 0.810126582278481,
"eval_LOCATION_recall": 0.8767123287671232,
"eval_ORGANIZATION_f1": 0.7480916030534351,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.7424242424242424,
"eval_ORGANIZATION_recall": 0.7538461538461538,
"eval_PERSON_f1": 0.870967741935484,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.84375,
"eval_PERSON_recall": 0.9,
"eval_QUANTITY_f1": 0.8125,
"eval_QUANTITY_number": 29,
"eval_QUANTITY_precision": 0.7428571428571429,
"eval_QUANTITY_recall": 0.896551724137931,
"eval_TIME_f1": 0.8285714285714286,
"eval_TIME_number": 34,
"eval_TIME_precision": 0.8055555555555556,
"eval_TIME_recall": 0.8529411764705882,
"eval_loss": 0.18399041891098022,
"eval_overall_accuracy": 0.9625892197883338,
"eval_overall_f1": 0.8335625859697385,
"eval_overall_precision": 0.8058510638297872,
"eval_overall_recall": 0.8632478632478633,
"eval_runtime": 0.3487,
"eval_samples_per_second": 536.311,
"eval_steps_per_second": 8.604,
"step": 7844
},
{
"epoch": 75.0,
"grad_norm": 0.6150727868080139,
"learning_rate": 1.25e-05,
"loss": 0.0257,
"step": 7950
},
{
"epoch": 75.0,
"eval_LOCATION_f1": 0.846153846153846,
"eval_LOCATION_number": 73,
"eval_LOCATION_precision": 0.7951807228915663,
"eval_LOCATION_recall": 0.9041095890410958,
"eval_ORGANIZATION_f1": 0.726027397260274,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.654320987654321,
"eval_ORGANIZATION_recall": 0.8153846153846154,
"eval_PERSON_f1": 0.8774193548387097,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.85,
"eval_PERSON_recall": 0.9066666666666666,
"eval_QUANTITY_f1": 0.8571428571428571,
"eval_QUANTITY_number": 29,
"eval_QUANTITY_precision": 0.7941176470588235,
"eval_QUANTITY_recall": 0.9310344827586207,
"eval_TIME_f1": 0.8285714285714286,
"eval_TIME_number": 34,
"eval_TIME_precision": 0.8055555555555556,
"eval_TIME_recall": 0.8529411764705882,
"eval_loss": 0.18748342990875244,
"eval_overall_accuracy": 0.9618508491262614,
"eval_overall_f1": 0.8348993288590604,
"eval_overall_precision": 0.7893401015228426,
"eval_overall_recall": 0.886039886039886,
"eval_runtime": 0.3479,
"eval_samples_per_second": 537.546,
"eval_steps_per_second": 8.624,
"step": 7950
},
{
"epoch": 76.0,
"grad_norm": 0.12720619142055511,
"learning_rate": 1.2e-05,
"loss": 0.0257,
"step": 8056
},
{
"epoch": 76.0,
"eval_LOCATION_f1": 0.8421052631578948,
"eval_LOCATION_number": 73,
"eval_LOCATION_precision": 0.810126582278481,
"eval_LOCATION_recall": 0.8767123287671232,
"eval_ORGANIZATION_f1": 0.7246376811594203,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.684931506849315,
"eval_ORGANIZATION_recall": 0.7692307692307693,
"eval_PERSON_f1": 0.8852459016393444,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.8709677419354839,
"eval_PERSON_recall": 0.9,
"eval_QUANTITY_f1": 0.8571428571428571,
"eval_QUANTITY_number": 29,
"eval_QUANTITY_precision": 0.7941176470588235,
"eval_QUANTITY_recall": 0.9310344827586207,
"eval_TIME_f1": 0.8571428571428571,
"eval_TIME_number": 34,
"eval_TIME_precision": 0.8333333333333334,
"eval_TIME_recall": 0.8823529411764706,
"eval_loss": 0.18419043719768524,
"eval_overall_accuracy": 0.9628353433423579,
"eval_overall_f1": 0.8406593406593407,
"eval_overall_precision": 0.8116710875331565,
"eval_overall_recall": 0.8717948717948718,
"eval_runtime": 0.3487,
"eval_samples_per_second": 536.289,
"eval_steps_per_second": 8.604,
"step": 8056
},
{
"epoch": 77.0,
"grad_norm": 1.0697262287139893,
"learning_rate": 1.1500000000000002e-05,
"loss": 0.0248,
"step": 8162
},
{
"epoch": 77.0,
"eval_LOCATION_f1": 0.8289473684210525,
"eval_LOCATION_number": 73,
"eval_LOCATION_precision": 0.7974683544303798,
"eval_LOCATION_recall": 0.863013698630137,
"eval_ORGANIZATION_f1": 0.7142857142857142,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.6666666666666666,
"eval_ORGANIZATION_recall": 0.7692307692307693,
"eval_PERSON_f1": 0.8766233766233766,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.8544303797468354,
"eval_PERSON_recall": 0.9,
"eval_QUANTITY_f1": 0.8387096774193549,
"eval_QUANTITY_number": 29,
"eval_QUANTITY_precision": 0.7878787878787878,
"eval_QUANTITY_recall": 0.896551724137931,
"eval_TIME_f1": 0.8285714285714286,
"eval_TIME_number": 34,
"eval_TIME_precision": 0.8055555555555556,
"eval_TIME_recall": 0.8529411764705882,
"eval_loss": 0.19783645868301392,
"eval_overall_accuracy": 0.958897366477972,
"eval_overall_f1": 0.8278688524590164,
"eval_overall_precision": 0.7952755905511811,
"eval_overall_recall": 0.8632478632478633,
"eval_runtime": 0.3502,
"eval_samples_per_second": 534.03,
"eval_steps_per_second": 8.567,
"step": 8162
},
{
"epoch": 78.0,
"grad_norm": 1.0857927799224854,
"learning_rate": 1.1000000000000001e-05,
"loss": 0.0248,
"step": 8268
},
{
"epoch": 78.0,
"eval_LOCATION_f1": 0.8129032258064516,
"eval_LOCATION_number": 73,
"eval_LOCATION_precision": 0.7682926829268293,
"eval_LOCATION_recall": 0.863013698630137,
"eval_ORGANIZATION_f1": 0.7407407407407408,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.7142857142857143,
"eval_ORGANIZATION_recall": 0.7692307692307693,
"eval_PERSON_f1": 0.8774193548387097,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.85,
"eval_PERSON_recall": 0.9066666666666666,
"eval_QUANTITY_f1": 0.8571428571428571,
"eval_QUANTITY_number": 29,
"eval_QUANTITY_precision": 0.7941176470588235,
"eval_QUANTITY_recall": 0.9310344827586207,
"eval_TIME_f1": 0.8285714285714286,
"eval_TIME_number": 34,
"eval_TIME_precision": 0.8055555555555556,
"eval_TIME_recall": 0.8529411764705882,
"eval_loss": 0.19514693319797516,
"eval_overall_accuracy": 0.9606202313561408,
"eval_overall_f1": 0.8321964529331515,
"eval_overall_precision": 0.7984293193717278,
"eval_overall_recall": 0.8689458689458689,
"eval_runtime": 0.3504,
"eval_samples_per_second": 533.645,
"eval_steps_per_second": 8.561,
"step": 8268
},
{
"epoch": 79.0,
"grad_norm": 0.4629979431629181,
"learning_rate": 1.05e-05,
"loss": 0.0237,
"step": 8374
},
{
"epoch": 79.0,
"eval_LOCATION_f1": 0.8441558441558442,
"eval_LOCATION_number": 73,
"eval_LOCATION_precision": 0.8024691358024691,
"eval_LOCATION_recall": 0.8904109589041096,
"eval_ORGANIZATION_f1": 0.75,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.7183098591549296,
"eval_ORGANIZATION_recall": 0.7846153846153846,
"eval_PERSON_f1": 0.8758169934640523,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.8589743589743589,
"eval_PERSON_recall": 0.8933333333333333,
"eval_QUANTITY_f1": 0.8253968253968255,
"eval_QUANTITY_number": 29,
"eval_QUANTITY_precision": 0.7647058823529411,
"eval_QUANTITY_recall": 0.896551724137931,
"eval_TIME_f1": 0.8285714285714286,
"eval_TIME_number": 34,
"eval_TIME_precision": 0.8055555555555556,
"eval_TIME_recall": 0.8529411764705882,
"eval_loss": 0.19404210150241852,
"eval_overall_accuracy": 0.9603741078021166,
"eval_overall_f1": 0.8367626886145405,
"eval_overall_precision": 0.8068783068783069,
"eval_overall_recall": 0.8689458689458689,
"eval_runtime": 0.3494,
"eval_samples_per_second": 535.278,
"eval_steps_per_second": 8.587,
"step": 8374
},
{
"epoch": 80.0,
"grad_norm": 0.49161767959594727,
"learning_rate": 1e-05,
"loss": 0.0261,
"step": 8480
},
{
"epoch": 80.0,
"eval_LOCATION_f1": 0.8366013071895425,
"eval_LOCATION_number": 73,
"eval_LOCATION_precision": 0.8,
"eval_LOCATION_recall": 0.8767123287671232,
"eval_ORGANIZATION_f1": 0.7703703703703704,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.7428571428571429,
"eval_ORGANIZATION_recall": 0.8,
"eval_PERSON_f1": 0.870967741935484,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.84375,
"eval_PERSON_recall": 0.9,
"eval_QUANTITY_f1": 0.7692307692307692,
"eval_QUANTITY_number": 29,
"eval_QUANTITY_precision": 0.6944444444444444,
"eval_QUANTITY_recall": 0.8620689655172413,
"eval_TIME_f1": 0.8285714285714286,
"eval_TIME_number": 34,
"eval_TIME_precision": 0.8055555555555556,
"eval_TIME_recall": 0.8529411764705882,
"eval_loss": 0.19337113201618195,
"eval_overall_accuracy": 0.9613586020182131,
"eval_overall_f1": 0.8321964529331515,
"eval_overall_precision": 0.7984293193717278,
"eval_overall_recall": 0.8689458689458689,
"eval_runtime": 0.3493,
"eval_samples_per_second": 535.38,
"eval_steps_per_second": 8.589,
"step": 8480
},
{
"epoch": 81.0,
"grad_norm": 1.3529359102249146,
"learning_rate": 9.5e-06,
"loss": 0.0234,
"step": 8586
},
{
"epoch": 81.0,
"eval_LOCATION_f1": 0.8441558441558442,
"eval_LOCATION_number": 73,
"eval_LOCATION_precision": 0.8024691358024691,
"eval_LOCATION_recall": 0.8904109589041096,
"eval_ORGANIZATION_f1": 0.7462686567164178,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.7246376811594203,
"eval_ORGANIZATION_recall": 0.7692307692307693,
"eval_PERSON_f1": 0.8823529411764707,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.8653846153846154,
"eval_PERSON_recall": 0.9,
"eval_QUANTITY_f1": 0.8307692307692308,
"eval_QUANTITY_number": 29,
"eval_QUANTITY_precision": 0.75,
"eval_QUANTITY_recall": 0.9310344827586207,
"eval_TIME_f1": 0.8285714285714286,
"eval_TIME_number": 34,
"eval_TIME_precision": 0.8055555555555556,
"eval_TIME_recall": 0.8529411764705882,
"eval_loss": 0.19133438169956207,
"eval_overall_accuracy": 0.9625892197883338,
"eval_overall_f1": 0.8395061728395062,
"eval_overall_precision": 0.8095238095238095,
"eval_overall_recall": 0.8717948717948718,
"eval_runtime": 0.3476,
"eval_samples_per_second": 537.954,
"eval_steps_per_second": 8.63,
"step": 8586
},
{
"epoch": 82.0,
"grad_norm": 0.8348244428634644,
"learning_rate": 9e-06,
"loss": 0.0217,
"step": 8692
},
{
"epoch": 82.0,
"eval_LOCATION_f1": 0.8441558441558442,
"eval_LOCATION_number": 73,
"eval_LOCATION_precision": 0.8024691358024691,
"eval_LOCATION_recall": 0.8904109589041096,
"eval_ORGANIZATION_f1": 0.7391304347826088,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.6986301369863014,
"eval_ORGANIZATION_recall": 0.7846153846153846,
"eval_PERSON_f1": 0.8794788273615636,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.8598726114649682,
"eval_PERSON_recall": 0.9,
"eval_QUANTITY_f1": 0.8709677419354839,
"eval_QUANTITY_number": 29,
"eval_QUANTITY_precision": 0.8181818181818182,
"eval_QUANTITY_recall": 0.9310344827586207,
"eval_TIME_f1": 0.8285714285714286,
"eval_TIME_number": 34,
"eval_TIME_precision": 0.8055555555555556,
"eval_TIME_recall": 0.8529411764705882,
"eval_loss": 0.19519662857055664,
"eval_overall_accuracy": 0.9623430962343096,
"eval_overall_f1": 0.8399452804377566,
"eval_overall_precision": 0.8078947368421052,
"eval_overall_recall": 0.8746438746438746,
"eval_runtime": 0.3492,
"eval_samples_per_second": 535.512,
"eval_steps_per_second": 8.591,
"step": 8692
},
{
"epoch": 83.0,
"grad_norm": 1.4528393745422363,
"learning_rate": 8.500000000000002e-06,
"loss": 0.0234,
"step": 8798
},
{
"epoch": 83.0,
"eval_LOCATION_f1": 0.8441558441558442,
"eval_LOCATION_number": 73,
"eval_LOCATION_precision": 0.8024691358024691,
"eval_LOCATION_recall": 0.8904109589041096,
"eval_ORGANIZATION_f1": 0.7846153846153847,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.7846153846153846,
"eval_ORGANIZATION_recall": 0.7846153846153846,
"eval_PERSON_f1": 0.8896103896103896,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.8670886075949367,
"eval_PERSON_recall": 0.9133333333333333,
"eval_QUANTITY_f1": 0.8571428571428571,
"eval_QUANTITY_number": 29,
"eval_QUANTITY_precision": 0.7941176470588235,
"eval_QUANTITY_recall": 0.9310344827586207,
"eval_TIME_f1": 0.8571428571428571,
"eval_TIME_number": 34,
"eval_TIME_precision": 0.8333333333333334,
"eval_TIME_recall": 0.8823529411764706,
"eval_loss": 0.19463619589805603,
"eval_overall_accuracy": 0.9655427024366232,
"eval_overall_f1": 0.8551724137931035,
"eval_overall_precision": 0.8288770053475936,
"eval_overall_recall": 0.8831908831908832,
"eval_runtime": 0.3489,
"eval_samples_per_second": 536.036,
"eval_steps_per_second": 8.6,
"step": 8798
},
{
"epoch": 84.0,
"grad_norm": 0.33660465478897095,
"learning_rate": 8.000000000000001e-06,
"loss": 0.0237,
"step": 8904
},
{
"epoch": 84.0,
"eval_LOCATION_f1": 0.8387096774193549,
"eval_LOCATION_number": 73,
"eval_LOCATION_precision": 0.7926829268292683,
"eval_LOCATION_recall": 0.8904109589041096,
"eval_ORGANIZATION_f1": 0.7462686567164178,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.7246376811594203,
"eval_ORGANIZATION_recall": 0.7692307692307693,
"eval_PERSON_f1": 0.8867313915857605,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.8616352201257862,
"eval_PERSON_recall": 0.9133333333333333,
"eval_QUANTITY_f1": 0.7999999999999999,
"eval_QUANTITY_number": 29,
"eval_QUANTITY_precision": 0.7222222222222222,
"eval_QUANTITY_recall": 0.896551724137931,
"eval_TIME_f1": 0.8285714285714286,
"eval_TIME_number": 34,
"eval_TIME_precision": 0.8055555555555556,
"eval_TIME_recall": 0.8529411764705882,
"eval_loss": 0.19823411107063293,
"eval_overall_accuracy": 0.9616047255722373,
"eval_overall_f1": 0.8376534788540245,
"eval_overall_precision": 0.8036649214659686,
"eval_overall_recall": 0.8746438746438746,
"eval_runtime": 0.3505,
"eval_samples_per_second": 533.564,
"eval_steps_per_second": 8.56,
"step": 8904
},
{
"epoch": 85.0,
"grad_norm": 0.6225272417068481,
"learning_rate": 7.5e-06,
"loss": 0.0247,
"step": 9010
},
{
"epoch": 85.0,
"eval_LOCATION_f1": 0.8441558441558442,
"eval_LOCATION_number": 73,
"eval_LOCATION_precision": 0.8024691358024691,
"eval_LOCATION_recall": 0.8904109589041096,
"eval_ORGANIZATION_f1": 0.7445255474452555,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.7083333333333334,
"eval_ORGANIZATION_recall": 0.7846153846153846,
"eval_PERSON_f1": 0.8867313915857605,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.8616352201257862,
"eval_PERSON_recall": 0.9133333333333333,
"eval_QUANTITY_f1": 0.7812500000000001,
"eval_QUANTITY_number": 29,
"eval_QUANTITY_precision": 0.7142857142857143,
"eval_QUANTITY_recall": 0.8620689655172413,
"eval_TIME_f1": 0.8285714285714286,
"eval_TIME_number": 34,
"eval_TIME_precision": 0.8055555555555556,
"eval_TIME_recall": 0.8529411764705882,
"eval_loss": 0.2002585530281067,
"eval_overall_accuracy": 0.9618508491262614,
"eval_overall_f1": 0.8365122615803815,
"eval_overall_precision": 0.8015665796344648,
"eval_overall_recall": 0.8746438746438746,
"eval_runtime": 0.3497,
"eval_samples_per_second": 534.708,
"eval_steps_per_second": 8.578,
"step": 9010
},
{
"epoch": 86.0,
"grad_norm": 0.7242019772529602,
"learning_rate": 7.000000000000001e-06,
"loss": 0.0218,
"step": 9116
},
{
"epoch": 86.0,
"eval_LOCATION_f1": 0.8366013071895425,
"eval_LOCATION_number": 73,
"eval_LOCATION_precision": 0.8,
"eval_LOCATION_recall": 0.8767123287671232,
"eval_ORGANIZATION_f1": 0.7352941176470589,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.704225352112676,
"eval_ORGANIZATION_recall": 0.7692307692307693,
"eval_PERSON_f1": 0.8925081433224756,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.8726114649681529,
"eval_PERSON_recall": 0.9133333333333333,
"eval_QUANTITY_f1": 0.8571428571428571,
"eval_QUANTITY_number": 29,
"eval_QUANTITY_precision": 0.7941176470588235,
"eval_QUANTITY_recall": 0.9310344827586207,
"eval_TIME_f1": 0.8285714285714286,
"eval_TIME_number": 34,
"eval_TIME_precision": 0.8055555555555556,
"eval_TIME_recall": 0.8529411764705882,
"eval_loss": 0.19523298740386963,
"eval_overall_accuracy": 0.9640659611124784,
"eval_overall_f1": 0.8422496570644719,
"eval_overall_precision": 0.8121693121693122,
"eval_overall_recall": 0.8746438746438746,
"eval_runtime": 0.3519,
"eval_samples_per_second": 531.467,
"eval_steps_per_second": 8.526,
"step": 9116
},
{
"epoch": 87.0,
"grad_norm": 1.2844712734222412,
"learning_rate": 6.5000000000000004e-06,
"loss": 0.0224,
"step": 9222
},
{
"epoch": 87.0,
"eval_LOCATION_f1": 0.8496732026143791,
"eval_LOCATION_number": 73,
"eval_LOCATION_precision": 0.8125,
"eval_LOCATION_recall": 0.8904109589041096,
"eval_ORGANIZATION_f1": 0.7611940298507462,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.7391304347826086,
"eval_ORGANIZATION_recall": 0.7846153846153846,
"eval_PERSON_f1": 0.8896103896103896,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.8670886075949367,
"eval_PERSON_recall": 0.9133333333333333,
"eval_QUANTITY_f1": 0.7812500000000001,
"eval_QUANTITY_number": 29,
"eval_QUANTITY_precision": 0.7142857142857143,
"eval_QUANTITY_recall": 0.8620689655172413,
"eval_TIME_f1": 0.8285714285714286,
"eval_TIME_number": 34,
"eval_TIME_precision": 0.8055555555555556,
"eval_TIME_recall": 0.8529411764705882,
"eval_loss": 0.1952124983072281,
"eval_overall_accuracy": 0.9640659611124784,
"eval_overall_f1": 0.8422496570644719,
"eval_overall_precision": 0.8121693121693122,
"eval_overall_recall": 0.8746438746438746,
"eval_runtime": 0.349,
"eval_samples_per_second": 535.792,
"eval_steps_per_second": 8.596,
"step": 9222
},
{
"epoch": 88.0,
"grad_norm": 0.27208393812179565,
"learning_rate": 6e-06,
"loss": 0.0211,
"step": 9328
},
{
"epoch": 88.0,
"eval_LOCATION_f1": 0.8366013071895425,
"eval_LOCATION_number": 73,
"eval_LOCATION_precision": 0.8,
"eval_LOCATION_recall": 0.8767123287671232,
"eval_ORGANIZATION_f1": 0.7338129496402878,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.6891891891891891,
"eval_ORGANIZATION_recall": 0.7846153846153846,
"eval_PERSON_f1": 0.8925081433224756,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.8726114649681529,
"eval_PERSON_recall": 0.9133333333333333,
"eval_QUANTITY_f1": 0.7812500000000001,
"eval_QUANTITY_number": 29,
"eval_QUANTITY_precision": 0.7142857142857143,
"eval_QUANTITY_recall": 0.8620689655172413,
"eval_TIME_f1": 0.8285714285714286,
"eval_TIME_number": 34,
"eval_TIME_precision": 0.8055555555555556,
"eval_TIME_recall": 0.8529411764705882,
"eval_loss": 0.1970175951719284,
"eval_overall_accuracy": 0.9620969726802855,
"eval_overall_f1": 0.834924965893588,
"eval_overall_precision": 0.8010471204188482,
"eval_overall_recall": 0.8717948717948718,
"eval_runtime": 0.3477,
"eval_samples_per_second": 537.813,
"eval_steps_per_second": 8.628,
"step": 9328
},
{
"epoch": 89.0,
"grad_norm": 0.7367871999740601,
"learning_rate": 5.500000000000001e-06,
"loss": 0.021,
"step": 9434
},
{
"epoch": 89.0,
"eval_LOCATION_f1": 0.8289473684210525,
"eval_LOCATION_number": 73,
"eval_LOCATION_precision": 0.7974683544303798,
"eval_LOCATION_recall": 0.863013698630137,
"eval_ORGANIZATION_f1": 0.75,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.7183098591549296,
"eval_ORGANIZATION_recall": 0.7846153846153846,
"eval_PERSON_f1": 0.8802588996763754,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.8553459119496856,
"eval_PERSON_recall": 0.9066666666666666,
"eval_QUANTITY_f1": 0.7812500000000001,
"eval_QUANTITY_number": 29,
"eval_QUANTITY_precision": 0.7142857142857143,
"eval_QUANTITY_recall": 0.8620689655172413,
"eval_TIME_f1": 0.8285714285714286,
"eval_TIME_number": 34,
"eval_TIME_precision": 0.8055555555555556,
"eval_TIME_recall": 0.8529411764705882,
"eval_loss": 0.20013782382011414,
"eval_overall_accuracy": 0.9613586020182131,
"eval_overall_f1": 0.8317373461012312,
"eval_overall_precision": 0.8,
"eval_overall_recall": 0.8660968660968661,
"eval_runtime": 0.3491,
"eval_samples_per_second": 535.725,
"eval_steps_per_second": 8.595,
"step": 9434
},
{
"epoch": 90.0,
"grad_norm": 0.4959828555583954,
"learning_rate": 5e-06,
"loss": 0.0216,
"step": 9540
},
{
"epoch": 90.0,
"eval_LOCATION_f1": 0.8211920529801324,
"eval_LOCATION_number": 73,
"eval_LOCATION_precision": 0.7948717948717948,
"eval_LOCATION_recall": 0.8493150684931506,
"eval_ORGANIZATION_f1": 0.7611940298507462,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.7391304347826086,
"eval_ORGANIZATION_recall": 0.7846153846153846,
"eval_PERSON_f1": 0.8896103896103896,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.8670886075949367,
"eval_PERSON_recall": 0.9133333333333333,
"eval_QUANTITY_f1": 0.7936507936507937,
"eval_QUANTITY_number": 29,
"eval_QUANTITY_precision": 0.7352941176470589,
"eval_QUANTITY_recall": 0.8620689655172413,
"eval_TIME_f1": 0.8169014084507041,
"eval_TIME_number": 34,
"eval_TIME_precision": 0.7837837837837838,
"eval_TIME_recall": 0.8529411764705882,
"eval_loss": 0.19662083685398102,
"eval_overall_accuracy": 0.963081466896382,
"eval_overall_f1": 0.8363136176066025,
"eval_overall_precision": 0.8085106382978723,
"eval_overall_recall": 0.8660968660968661,
"eval_runtime": 0.3491,
"eval_samples_per_second": 535.654,
"eval_steps_per_second": 8.593,
"step": 9540
},
{
"epoch": 91.0,
"grad_norm": 0.6600481867790222,
"learning_rate": 4.5e-06,
"loss": 0.0217,
"step": 9646
},
{
"epoch": 91.0,
"eval_LOCATION_f1": 0.8366013071895425,
"eval_LOCATION_number": 73,
"eval_LOCATION_precision": 0.8,
"eval_LOCATION_recall": 0.8767123287671232,
"eval_ORGANIZATION_f1": 0.7445255474452555,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.7083333333333334,
"eval_ORGANIZATION_recall": 0.7846153846153846,
"eval_PERSON_f1": 0.8867313915857605,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.8616352201257862,
"eval_PERSON_recall": 0.9133333333333333,
"eval_QUANTITY_f1": 0.8253968253968255,
"eval_QUANTITY_number": 29,
"eval_QUANTITY_precision": 0.7647058823529411,
"eval_QUANTITY_recall": 0.896551724137931,
"eval_TIME_f1": 0.8285714285714286,
"eval_TIME_number": 34,
"eval_TIME_precision": 0.8055555555555556,
"eval_TIME_recall": 0.8529411764705882,
"eval_loss": 0.19578596949577332,
"eval_overall_accuracy": 0.9625892197883338,
"eval_overall_f1": 0.8387978142076502,
"eval_overall_precision": 0.8057742782152231,
"eval_overall_recall": 0.8746438746438746,
"eval_runtime": 0.3484,
"eval_samples_per_second": 536.773,
"eval_steps_per_second": 8.611,
"step": 9646
},
{
"epoch": 92.0,
"grad_norm": 0.1194983422756195,
"learning_rate": 4.000000000000001e-06,
"loss": 0.0198,
"step": 9752
},
{
"epoch": 92.0,
"eval_LOCATION_f1": 0.8366013071895425,
"eval_LOCATION_number": 73,
"eval_LOCATION_precision": 0.8,
"eval_LOCATION_recall": 0.8767123287671232,
"eval_ORGANIZATION_f1": 0.7611940298507462,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.7391304347826086,
"eval_ORGANIZATION_recall": 0.7846153846153846,
"eval_PERSON_f1": 0.8896103896103896,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.8670886075949367,
"eval_PERSON_recall": 0.9133333333333333,
"eval_QUANTITY_f1": 0.8253968253968255,
"eval_QUANTITY_number": 29,
"eval_QUANTITY_precision": 0.7647058823529411,
"eval_QUANTITY_recall": 0.896551724137931,
"eval_TIME_f1": 0.8169014084507041,
"eval_TIME_number": 34,
"eval_TIME_precision": 0.7837837837837838,
"eval_TIME_recall": 0.8529411764705882,
"eval_loss": 0.19786879420280457,
"eval_overall_accuracy": 0.9635737140044303,
"eval_overall_f1": 0.8422496570644719,
"eval_overall_precision": 0.8121693121693122,
"eval_overall_recall": 0.8746438746438746,
"eval_runtime": 0.3495,
"eval_samples_per_second": 535.03,
"eval_steps_per_second": 8.583,
"step": 9752
},
{
"epoch": 93.0,
"grad_norm": 0.16003356873989105,
"learning_rate": 3.5000000000000004e-06,
"loss": 0.0205,
"step": 9858
},
{
"epoch": 93.0,
"eval_LOCATION_f1": 0.8289473684210525,
"eval_LOCATION_number": 73,
"eval_LOCATION_precision": 0.7974683544303798,
"eval_LOCATION_recall": 0.863013698630137,
"eval_ORGANIZATION_f1": 0.7669172932330828,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.75,
"eval_ORGANIZATION_recall": 0.7846153846153846,
"eval_PERSON_f1": 0.8896103896103896,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.8670886075949367,
"eval_PERSON_recall": 0.9133333333333333,
"eval_QUANTITY_f1": 0.8125,
"eval_QUANTITY_number": 29,
"eval_QUANTITY_precision": 0.7428571428571429,
"eval_QUANTITY_recall": 0.896551724137931,
"eval_TIME_f1": 0.8450704225352113,
"eval_TIME_number": 34,
"eval_TIME_precision": 0.8108108108108109,
"eval_TIME_recall": 0.8823529411764706,
"eval_loss": 0.19753791391849518,
"eval_overall_accuracy": 0.9635737140044303,
"eval_overall_f1": 0.8434065934065934,
"eval_overall_precision": 0.8143236074270557,
"eval_overall_recall": 0.8746438746438746,
"eval_runtime": 0.3492,
"eval_samples_per_second": 535.578,
"eval_steps_per_second": 8.592,
"step": 9858
},
{
"epoch": 94.0,
"grad_norm": 0.8688186407089233,
"learning_rate": 3e-06,
"loss": 0.0206,
"step": 9964
},
{
"epoch": 94.0,
"eval_LOCATION_f1": 0.8289473684210525,
"eval_LOCATION_number": 73,
"eval_LOCATION_precision": 0.7974683544303798,
"eval_LOCATION_recall": 0.863013698630137,
"eval_ORGANIZATION_f1": 0.7555555555555555,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.7285714285714285,
"eval_ORGANIZATION_recall": 0.7846153846153846,
"eval_PERSON_f1": 0.8859934853420196,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.8662420382165605,
"eval_PERSON_recall": 0.9066666666666666,
"eval_QUANTITY_f1": 0.8125,
"eval_QUANTITY_number": 29,
"eval_QUANTITY_precision": 0.7428571428571429,
"eval_QUANTITY_recall": 0.896551724137931,
"eval_TIME_f1": 0.8169014084507041,
"eval_TIME_number": 34,
"eval_TIME_precision": 0.7837837837837838,
"eval_TIME_recall": 0.8529411764705882,
"eval_loss": 0.1996561884880066,
"eval_overall_accuracy": 0.9623430962343096,
"eval_overall_f1": 0.8367626886145405,
"eval_overall_precision": 0.8068783068783069,
"eval_overall_recall": 0.8689458689458689,
"eval_runtime": 0.3491,
"eval_samples_per_second": 535.588,
"eval_steps_per_second": 8.592,
"step": 9964
},
{
"epoch": 95.0,
"grad_norm": 0.6198663115501404,
"learning_rate": 2.5e-06,
"loss": 0.0214,
"step": 10070
},
{
"epoch": 95.0,
"eval_LOCATION_f1": 0.8387096774193549,
"eval_LOCATION_number": 73,
"eval_LOCATION_precision": 0.7926829268292683,
"eval_LOCATION_recall": 0.8904109589041096,
"eval_ORGANIZATION_f1": 0.7445255474452555,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.7083333333333334,
"eval_ORGANIZATION_recall": 0.7846153846153846,
"eval_PERSON_f1": 0.8802588996763754,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.8553459119496856,
"eval_PERSON_recall": 0.9066666666666666,
"eval_QUANTITY_f1": 0.8253968253968255,
"eval_QUANTITY_number": 29,
"eval_QUANTITY_precision": 0.7647058823529411,
"eval_QUANTITY_recall": 0.896551724137931,
"eval_TIME_f1": 0.8169014084507041,
"eval_TIME_number": 34,
"eval_TIME_precision": 0.7837837837837838,
"eval_TIME_recall": 0.8529411764705882,
"eval_loss": 0.19923867285251617,
"eval_overall_accuracy": 0.9613586020182131,
"eval_overall_f1": 0.8353741496598639,
"eval_overall_precision": 0.7994791666666666,
"eval_overall_recall": 0.8746438746438746,
"eval_runtime": 0.3512,
"eval_samples_per_second": 532.477,
"eval_steps_per_second": 8.542,
"step": 10070
},
{
"epoch": 96.0,
"grad_norm": 0.5730480551719666,
"learning_rate": 2.0000000000000003e-06,
"loss": 0.0208,
"step": 10176
},
{
"epoch": 96.0,
"eval_LOCATION_f1": 0.8333333333333334,
"eval_LOCATION_number": 73,
"eval_LOCATION_precision": 0.7831325301204819,
"eval_LOCATION_recall": 0.8904109589041096,
"eval_ORGANIZATION_f1": 0.7669172932330828,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.75,
"eval_ORGANIZATION_recall": 0.7846153846153846,
"eval_PERSON_f1": 0.8802588996763754,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.8553459119496856,
"eval_PERSON_recall": 0.9066666666666666,
"eval_QUANTITY_f1": 0.7936507936507937,
"eval_QUANTITY_number": 29,
"eval_QUANTITY_precision": 0.7352941176470589,
"eval_QUANTITY_recall": 0.8620689655172413,
"eval_TIME_f1": 0.8450704225352113,
"eval_TIME_number": 34,
"eval_TIME_precision": 0.8108108108108109,
"eval_TIME_recall": 0.8823529411764706,
"eval_loss": 0.19816720485687256,
"eval_overall_accuracy": 0.9623430962343096,
"eval_overall_f1": 0.8387978142076502,
"eval_overall_precision": 0.8057742782152231,
"eval_overall_recall": 0.8746438746438746,
"eval_runtime": 0.3492,
"eval_samples_per_second": 535.457,
"eval_steps_per_second": 8.59,
"step": 10176
},
{
"epoch": 97.0,
"grad_norm": 0.7892258167266846,
"learning_rate": 1.5e-06,
"loss": 0.0217,
"step": 10282
},
{
"epoch": 97.0,
"eval_LOCATION_f1": 0.8441558441558442,
"eval_LOCATION_number": 73,
"eval_LOCATION_precision": 0.8024691358024691,
"eval_LOCATION_recall": 0.8904109589041096,
"eval_ORGANIZATION_f1": 0.7669172932330828,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.75,
"eval_ORGANIZATION_recall": 0.7846153846153846,
"eval_PERSON_f1": 0.8831168831168831,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.8607594936708861,
"eval_PERSON_recall": 0.9066666666666666,
"eval_QUANTITY_f1": 0.7936507936507937,
"eval_QUANTITY_number": 29,
"eval_QUANTITY_precision": 0.7352941176470589,
"eval_QUANTITY_recall": 0.8620689655172413,
"eval_TIME_f1": 0.8169014084507041,
"eval_TIME_number": 34,
"eval_TIME_precision": 0.7837837837837838,
"eval_TIME_recall": 0.8529411764705882,
"eval_loss": 0.19672809541225433,
"eval_overall_accuracy": 0.963081466896382,
"eval_overall_f1": 0.8395061728395062,
"eval_overall_precision": 0.8095238095238095,
"eval_overall_recall": 0.8717948717948718,
"eval_runtime": 0.348,
"eval_samples_per_second": 537.376,
"eval_steps_per_second": 8.621,
"step": 10282
},
{
"epoch": 98.0,
"grad_norm": 0.4192006289958954,
"learning_rate": 1.0000000000000002e-06,
"loss": 0.0205,
"step": 10388
},
{
"epoch": 98.0,
"eval_LOCATION_f1": 0.8387096774193549,
"eval_LOCATION_number": 73,
"eval_LOCATION_precision": 0.7926829268292683,
"eval_LOCATION_recall": 0.8904109589041096,
"eval_ORGANIZATION_f1": 0.7669172932330828,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.75,
"eval_ORGANIZATION_recall": 0.7846153846153846,
"eval_PERSON_f1": 0.8802588996763754,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.8553459119496856,
"eval_PERSON_recall": 0.9066666666666666,
"eval_QUANTITY_f1": 0.7936507936507937,
"eval_QUANTITY_number": 29,
"eval_QUANTITY_precision": 0.7352941176470589,
"eval_QUANTITY_recall": 0.8620689655172413,
"eval_TIME_f1": 0.8169014084507041,
"eval_TIME_number": 34,
"eval_TIME_precision": 0.7837837837837838,
"eval_TIME_recall": 0.8529411764705882,
"eval_loss": 0.19882169365882874,
"eval_overall_accuracy": 0.9620969726802855,
"eval_overall_f1": 0.8372093023255812,
"eval_overall_precision": 0.8052631578947368,
"eval_overall_recall": 0.8717948717948718,
"eval_runtime": 0.35,
"eval_samples_per_second": 534.343,
"eval_steps_per_second": 8.572,
"step": 10388
},
{
"epoch": 99.0,
"grad_norm": 0.21814487874507904,
"learning_rate": 5.000000000000001e-07,
"loss": 0.0204,
"step": 10494
},
{
"epoch": 99.0,
"eval_LOCATION_f1": 0.8441558441558442,
"eval_LOCATION_number": 73,
"eval_LOCATION_precision": 0.8024691358024691,
"eval_LOCATION_recall": 0.8904109589041096,
"eval_ORGANIZATION_f1": 0.7669172932330828,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.75,
"eval_ORGANIZATION_recall": 0.7846153846153846,
"eval_PERSON_f1": 0.8831168831168831,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.8607594936708861,
"eval_PERSON_recall": 0.9066666666666666,
"eval_QUANTITY_f1": 0.7812500000000001,
"eval_QUANTITY_number": 29,
"eval_QUANTITY_precision": 0.7142857142857143,
"eval_QUANTITY_recall": 0.8620689655172413,
"eval_TIME_f1": 0.8169014084507041,
"eval_TIME_number": 34,
"eval_TIME_precision": 0.7837837837837838,
"eval_TIME_recall": 0.8529411764705882,
"eval_loss": 0.19684545695781708,
"eval_overall_accuracy": 0.9628353433423579,
"eval_overall_f1": 0.8383561643835615,
"eval_overall_precision": 0.8073878627968337,
"eval_overall_recall": 0.8717948717948718,
"eval_runtime": 0.3493,
"eval_samples_per_second": 535.431,
"eval_steps_per_second": 8.59,
"step": 10494
},
{
"epoch": 100.0,
"grad_norm": 0.46098318696022034,
"learning_rate": 0.0,
"loss": 0.022,
"step": 10600
},
{
"epoch": 100.0,
"eval_LOCATION_f1": 0.8441558441558442,
"eval_LOCATION_number": 73,
"eval_LOCATION_precision": 0.8024691358024691,
"eval_LOCATION_recall": 0.8904109589041096,
"eval_ORGANIZATION_f1": 0.7669172932330828,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.75,
"eval_ORGANIZATION_recall": 0.7846153846153846,
"eval_PERSON_f1": 0.8802588996763754,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.8553459119496856,
"eval_PERSON_recall": 0.9066666666666666,
"eval_QUANTITY_f1": 0.7936507936507937,
"eval_QUANTITY_number": 29,
"eval_QUANTITY_precision": 0.7352941176470589,
"eval_QUANTITY_recall": 0.8620689655172413,
"eval_TIME_f1": 0.8169014084507041,
"eval_TIME_number": 34,
"eval_TIME_precision": 0.7837837837837838,
"eval_TIME_recall": 0.8529411764705882,
"eval_loss": 0.19717250764369965,
"eval_overall_accuracy": 0.9625892197883338,
"eval_overall_f1": 0.8383561643835615,
"eval_overall_precision": 0.8073878627968337,
"eval_overall_recall": 0.8717948717948718,
"eval_runtime": 0.3485,
"eval_samples_per_second": 536.575,
"eval_steps_per_second": 8.608,
"step": 10600
},
{
"epoch": 100.0,
"step": 10600,
"total_flos": 5043631411410816.0,
"train_loss": 0.06754140655949431,
"train_runtime": 594.8485,
"train_samples_per_second": 283.77,
"train_steps_per_second": 17.82
}
],
"logging_steps": 500,
"max_steps": 10600,
"num_input_tokens_seen": 0,
"num_train_epochs": 100,
"save_steps": 500,
"total_flos": 5043631411410816.0,
"train_batch_size": 16,
"trial_name": null,
"trial_params": null
}