nerugm-lora-r16-2 / trainer_state.json
apwic's picture
End of training
249e382 verified
{
"best_metric": null,
"best_model_checkpoint": null,
"epoch": 100.0,
"eval_steps": 500,
"global_step": 10600,
"is_hyper_param_search": false,
"is_local_process_zero": true,
"is_world_process_zero": true,
"log_history": [
{
"epoch": 1.0,
"grad_norm": 1.8945987224578857,
"learning_rate": 4.9500000000000004e-05,
"loss": 1.1381,
"step": 106
},
{
"epoch": 1.0,
"eval_LOCATION_f1": 0.0,
"eval_LOCATION_number": 72,
"eval_LOCATION_precision": 0.0,
"eval_LOCATION_recall": 0.0,
"eval_ORGANIZATION_f1": 0.0,
"eval_ORGANIZATION_number": 75,
"eval_ORGANIZATION_precision": 0.0,
"eval_ORGANIZATION_recall": 0.0,
"eval_PERSON_f1": 0.0,
"eval_PERSON_number": 143,
"eval_PERSON_precision": 0.0,
"eval_PERSON_recall": 0.0,
"eval_QUANTITY_f1": 0.0,
"eval_QUANTITY_number": 23,
"eval_QUANTITY_precision": 0.0,
"eval_QUANTITY_recall": 0.0,
"eval_TIME_f1": 0.0,
"eval_TIME_number": 26,
"eval_TIME_precision": 0.0,
"eval_TIME_recall": 0.0,
"eval_loss": 0.6853168606758118,
"eval_overall_accuracy": 0.8448836627470603,
"eval_overall_f1": 0.0,
"eval_overall_precision": 0.0,
"eval_overall_recall": 0.0,
"eval_runtime": 0.3663,
"eval_samples_per_second": 510.496,
"eval_steps_per_second": 8.19,
"step": 106
},
{
"epoch": 2.0,
"grad_norm": 1.1807020902633667,
"learning_rate": 4.9e-05,
"loss": 0.6775,
"step": 212
},
{
"epoch": 2.0,
"eval_LOCATION_f1": 0.0,
"eval_LOCATION_number": 72,
"eval_LOCATION_precision": 0.0,
"eval_LOCATION_recall": 0.0,
"eval_ORGANIZATION_f1": 0.0,
"eval_ORGANIZATION_number": 75,
"eval_ORGANIZATION_precision": 0.0,
"eval_ORGANIZATION_recall": 0.0,
"eval_PERSON_f1": 0.0,
"eval_PERSON_number": 143,
"eval_PERSON_precision": 0.0,
"eval_PERSON_recall": 0.0,
"eval_QUANTITY_f1": 0.0,
"eval_QUANTITY_number": 23,
"eval_QUANTITY_precision": 0.0,
"eval_QUANTITY_recall": 0.0,
"eval_TIME_f1": 0.0,
"eval_TIME_number": 26,
"eval_TIME_precision": 0.0,
"eval_TIME_recall": 0.0,
"eval_loss": 0.5612640976905823,
"eval_overall_accuracy": 0.8466349762321741,
"eval_overall_f1": 0.0,
"eval_overall_precision": 0.0,
"eval_overall_recall": 0.0,
"eval_runtime": 0.3703,
"eval_samples_per_second": 505.03,
"eval_steps_per_second": 8.102,
"step": 212
},
{
"epoch": 3.0,
"grad_norm": 1.3289912939071655,
"learning_rate": 4.85e-05,
"loss": 0.5563,
"step": 318
},
{
"epoch": 3.0,
"eval_LOCATION_f1": 0.1818181818181818,
"eval_LOCATION_number": 72,
"eval_LOCATION_precision": 0.5,
"eval_LOCATION_recall": 0.1111111111111111,
"eval_ORGANIZATION_f1": 0.021276595744680854,
"eval_ORGANIZATION_number": 75,
"eval_ORGANIZATION_precision": 0.05263157894736842,
"eval_ORGANIZATION_recall": 0.013333333333333334,
"eval_PERSON_f1": 0.2980392156862745,
"eval_PERSON_number": 143,
"eval_PERSON_precision": 0.3392857142857143,
"eval_PERSON_recall": 0.26573426573426573,
"eval_QUANTITY_f1": 0.0,
"eval_QUANTITY_number": 23,
"eval_QUANTITY_precision": 0.0,
"eval_QUANTITY_recall": 0.0,
"eval_TIME_f1": 0.18181818181818185,
"eval_TIME_number": 26,
"eval_TIME_precision": 0.2222222222222222,
"eval_TIME_recall": 0.15384615384615385,
"eval_loss": 0.42658355832099915,
"eval_overall_accuracy": 0.877658243682762,
"eval_overall_f1": 0.201980198019802,
"eval_overall_precision": 0.3072289156626506,
"eval_overall_recall": 0.1504424778761062,
"eval_runtime": 0.3682,
"eval_samples_per_second": 507.92,
"eval_steps_per_second": 8.148,
"step": 318
},
{
"epoch": 4.0,
"grad_norm": 2.218233346939087,
"learning_rate": 4.8e-05,
"loss": 0.4194,
"step": 424
},
{
"epoch": 4.0,
"eval_LOCATION_f1": 0.4426229508196721,
"eval_LOCATION_number": 72,
"eval_LOCATION_precision": 0.54,
"eval_LOCATION_recall": 0.375,
"eval_ORGANIZATION_f1": 0.3597122302158273,
"eval_ORGANIZATION_number": 75,
"eval_ORGANIZATION_precision": 0.390625,
"eval_ORGANIZATION_recall": 0.3333333333333333,
"eval_PERSON_f1": 0.5964912280701755,
"eval_PERSON_number": 143,
"eval_PERSON_precision": 0.5125628140703518,
"eval_PERSON_recall": 0.7132867132867133,
"eval_QUANTITY_f1": 0.0,
"eval_QUANTITY_number": 23,
"eval_QUANTITY_precision": 0.0,
"eval_QUANTITY_recall": 0.0,
"eval_TIME_f1": 0.5925925925925927,
"eval_TIME_number": 26,
"eval_TIME_precision": 0.5714285714285714,
"eval_TIME_recall": 0.6153846153846154,
"eval_loss": 0.3157876431941986,
"eval_overall_accuracy": 0.9126845133850388,
"eval_overall_f1": 0.4892086330935252,
"eval_overall_precision": 0.47752808988764045,
"eval_overall_recall": 0.5014749262536873,
"eval_runtime": 0.3699,
"eval_samples_per_second": 505.61,
"eval_steps_per_second": 8.111,
"step": 424
},
{
"epoch": 5.0,
"grad_norm": 1.1470197439193726,
"learning_rate": 4.75e-05,
"loss": 0.3199,
"step": 530
},
{
"epoch": 5.0,
"eval_LOCATION_f1": 0.625,
"eval_LOCATION_number": 72,
"eval_LOCATION_precision": 0.5681818181818182,
"eval_LOCATION_recall": 0.6944444444444444,
"eval_ORGANIZATION_f1": 0.47500000000000003,
"eval_ORGANIZATION_number": 75,
"eval_ORGANIZATION_precision": 0.4470588235294118,
"eval_ORGANIZATION_recall": 0.5066666666666667,
"eval_PERSON_f1": 0.764525993883792,
"eval_PERSON_number": 143,
"eval_PERSON_precision": 0.6793478260869565,
"eval_PERSON_recall": 0.8741258741258742,
"eval_QUANTITY_f1": 0.35294117647058826,
"eval_QUANTITY_number": 23,
"eval_QUANTITY_precision": 0.32142857142857145,
"eval_QUANTITY_recall": 0.391304347826087,
"eval_TIME_f1": 0.7307692307692306,
"eval_TIME_number": 26,
"eval_TIME_precision": 0.7307692307692307,
"eval_TIME_recall": 0.7307692307692307,
"eval_loss": 0.25322219729423523,
"eval_overall_accuracy": 0.9301976482361771,
"eval_overall_f1": 0.6426666666666666,
"eval_overall_precision": 0.5863746958637469,
"eval_overall_recall": 0.7109144542772862,
"eval_runtime": 0.3708,
"eval_samples_per_second": 504.27,
"eval_steps_per_second": 8.09,
"step": 530
},
{
"epoch": 6.0,
"grad_norm": 0.8425076603889465,
"learning_rate": 4.7e-05,
"loss": 0.2663,
"step": 636
},
{
"epoch": 6.0,
"eval_LOCATION_f1": 0.679245283018868,
"eval_LOCATION_number": 72,
"eval_LOCATION_precision": 0.6206896551724138,
"eval_LOCATION_recall": 0.75,
"eval_ORGANIZATION_f1": 0.5764705882352941,
"eval_ORGANIZATION_number": 75,
"eval_ORGANIZATION_precision": 0.5157894736842106,
"eval_ORGANIZATION_recall": 0.6533333333333333,
"eval_PERSON_f1": 0.8125,
"eval_PERSON_number": 143,
"eval_PERSON_precision": 0.7344632768361582,
"eval_PERSON_recall": 0.9090909090909091,
"eval_QUANTITY_f1": 0.35294117647058826,
"eval_QUANTITY_number": 23,
"eval_QUANTITY_precision": 0.32142857142857145,
"eval_QUANTITY_recall": 0.391304347826087,
"eval_TIME_f1": 0.7241379310344829,
"eval_TIME_number": 26,
"eval_TIME_precision": 0.65625,
"eval_TIME_recall": 0.8076923076923077,
"eval_loss": 0.2125054895877838,
"eval_overall_accuracy": 0.9362021516137102,
"eval_overall_f1": 0.6939313984168866,
"eval_overall_precision": 0.6276849642004774,
"eval_overall_recall": 0.775811209439528,
"eval_runtime": 0.3723,
"eval_samples_per_second": 502.303,
"eval_steps_per_second": 8.058,
"step": 636
},
{
"epoch": 7.0,
"grad_norm": 0.9470153450965881,
"learning_rate": 4.6500000000000005e-05,
"loss": 0.2335,
"step": 742
},
{
"epoch": 7.0,
"eval_LOCATION_f1": 0.751592356687898,
"eval_LOCATION_number": 72,
"eval_LOCATION_precision": 0.6941176470588235,
"eval_LOCATION_recall": 0.8194444444444444,
"eval_ORGANIZATION_f1": 0.5862068965517241,
"eval_ORGANIZATION_number": 75,
"eval_ORGANIZATION_precision": 0.5151515151515151,
"eval_ORGANIZATION_recall": 0.68,
"eval_PERSON_f1": 0.8148148148148148,
"eval_PERSON_number": 143,
"eval_PERSON_precision": 0.7292817679558011,
"eval_PERSON_recall": 0.9230769230769231,
"eval_QUANTITY_f1": 0.4444444444444444,
"eval_QUANTITY_number": 23,
"eval_QUANTITY_precision": 0.3870967741935484,
"eval_QUANTITY_recall": 0.5217391304347826,
"eval_TIME_f1": 0.7017543859649122,
"eval_TIME_number": 26,
"eval_TIME_precision": 0.6451612903225806,
"eval_TIME_recall": 0.7692307692307693,
"eval_loss": 0.1960044652223587,
"eval_overall_accuracy": 0.9392044033024769,
"eval_overall_f1": 0.7154046997389034,
"eval_overall_precision": 0.6416861826697893,
"eval_overall_recall": 0.8082595870206489,
"eval_runtime": 0.3721,
"eval_samples_per_second": 502.608,
"eval_steps_per_second": 8.063,
"step": 742
},
{
"epoch": 8.0,
"grad_norm": 1.4180433750152588,
"learning_rate": 4.600000000000001e-05,
"loss": 0.2093,
"step": 848
},
{
"epoch": 8.0,
"eval_LOCATION_f1": 0.7625000000000001,
"eval_LOCATION_number": 72,
"eval_LOCATION_precision": 0.6931818181818182,
"eval_LOCATION_recall": 0.8472222222222222,
"eval_ORGANIZATION_f1": 0.6101694915254237,
"eval_ORGANIZATION_number": 75,
"eval_ORGANIZATION_precision": 0.5294117647058824,
"eval_ORGANIZATION_recall": 0.72,
"eval_PERSON_f1": 0.8490566037735848,
"eval_PERSON_number": 143,
"eval_PERSON_precision": 0.7714285714285715,
"eval_PERSON_recall": 0.9440559440559441,
"eval_QUANTITY_f1": 0.47058823529411764,
"eval_QUANTITY_number": 23,
"eval_QUANTITY_precision": 0.42857142857142855,
"eval_QUANTITY_recall": 0.5217391304347826,
"eval_TIME_f1": 0.7457627118644068,
"eval_TIME_number": 26,
"eval_TIME_precision": 0.6666666666666666,
"eval_TIME_recall": 0.8461538461538461,
"eval_loss": 0.17360921204090118,
"eval_overall_accuracy": 0.9449587190392794,
"eval_overall_f1": 0.7424836601307189,
"eval_overall_precision": 0.6666666666666666,
"eval_overall_recall": 0.8377581120943953,
"eval_runtime": 0.3739,
"eval_samples_per_second": 500.185,
"eval_steps_per_second": 8.024,
"step": 848
},
{
"epoch": 9.0,
"grad_norm": 1.8917080163955688,
"learning_rate": 4.55e-05,
"loss": 0.1945,
"step": 954
},
{
"epoch": 9.0,
"eval_LOCATION_f1": 0.7682926829268292,
"eval_LOCATION_number": 72,
"eval_LOCATION_precision": 0.6847826086956522,
"eval_LOCATION_recall": 0.875,
"eval_ORGANIZATION_f1": 0.6179775280898877,
"eval_ORGANIZATION_number": 75,
"eval_ORGANIZATION_precision": 0.5339805825242718,
"eval_ORGANIZATION_recall": 0.7333333333333333,
"eval_PERSON_f1": 0.8553054662379421,
"eval_PERSON_number": 143,
"eval_PERSON_precision": 0.7916666666666666,
"eval_PERSON_recall": 0.9300699300699301,
"eval_QUANTITY_f1": 0.4814814814814815,
"eval_QUANTITY_number": 23,
"eval_QUANTITY_precision": 0.41935483870967744,
"eval_QUANTITY_recall": 0.5652173913043478,
"eval_TIME_f1": 0.7241379310344829,
"eval_TIME_number": 26,
"eval_TIME_precision": 0.65625,
"eval_TIME_recall": 0.8076923076923077,
"eval_loss": 0.17519919574260712,
"eval_overall_accuracy": 0.9439579684763573,
"eval_overall_f1": 0.7450980392156863,
"eval_overall_precision": 0.6690140845070423,
"eval_overall_recall": 0.8407079646017699,
"eval_runtime": 0.3696,
"eval_samples_per_second": 505.937,
"eval_steps_per_second": 8.117,
"step": 954
},
{
"epoch": 10.0,
"grad_norm": 2.473076343536377,
"learning_rate": 4.5e-05,
"loss": 0.1804,
"step": 1060
},
{
"epoch": 10.0,
"eval_LOCATION_f1": 0.779874213836478,
"eval_LOCATION_number": 72,
"eval_LOCATION_precision": 0.7126436781609196,
"eval_LOCATION_recall": 0.8611111111111112,
"eval_ORGANIZATION_f1": 0.627906976744186,
"eval_ORGANIZATION_number": 75,
"eval_ORGANIZATION_precision": 0.5567010309278351,
"eval_ORGANIZATION_recall": 0.72,
"eval_PERSON_f1": 0.8434504792332268,
"eval_PERSON_number": 143,
"eval_PERSON_precision": 0.7764705882352941,
"eval_PERSON_recall": 0.9230769230769231,
"eval_QUANTITY_f1": 0.5423728813559322,
"eval_QUANTITY_number": 23,
"eval_QUANTITY_precision": 0.4444444444444444,
"eval_QUANTITY_recall": 0.6956521739130435,
"eval_TIME_f1": 0.7457627118644068,
"eval_TIME_number": 26,
"eval_TIME_precision": 0.6666666666666666,
"eval_TIME_recall": 0.8461538461538461,
"eval_loss": 0.16381332278251648,
"eval_overall_accuracy": 0.9457092819614711,
"eval_overall_f1": 0.7506561679790027,
"eval_overall_precision": 0.6761229314420804,
"eval_overall_recall": 0.8436578171091446,
"eval_runtime": 0.3732,
"eval_samples_per_second": 501.085,
"eval_steps_per_second": 8.039,
"step": 1060
},
{
"epoch": 11.0,
"grad_norm": 1.6517131328582764,
"learning_rate": 4.4500000000000004e-05,
"loss": 0.1692,
"step": 1166
},
{
"epoch": 11.0,
"eval_LOCATION_f1": 0.823529411764706,
"eval_LOCATION_number": 72,
"eval_LOCATION_precision": 0.7777777777777778,
"eval_LOCATION_recall": 0.875,
"eval_ORGANIZATION_f1": 0.6775956284153005,
"eval_ORGANIZATION_number": 75,
"eval_ORGANIZATION_precision": 0.5740740740740741,
"eval_ORGANIZATION_recall": 0.8266666666666667,
"eval_PERSON_f1": 0.8444444444444446,
"eval_PERSON_number": 143,
"eval_PERSON_precision": 0.7732558139534884,
"eval_PERSON_recall": 0.9300699300699301,
"eval_QUANTITY_f1": 0.5357142857142857,
"eval_QUANTITY_number": 23,
"eval_QUANTITY_precision": 0.45454545454545453,
"eval_QUANTITY_recall": 0.6521739130434783,
"eval_TIME_f1": 0.8363636363636363,
"eval_TIME_number": 26,
"eval_TIME_precision": 0.7931034482758621,
"eval_TIME_recall": 0.8846153846153846,
"eval_loss": 0.15897886455059052,
"eval_overall_accuracy": 0.9499624718538904,
"eval_overall_f1": 0.7769028871391076,
"eval_overall_precision": 0.6997635933806147,
"eval_overall_recall": 0.8731563421828908,
"eval_runtime": 0.3708,
"eval_samples_per_second": 504.355,
"eval_steps_per_second": 8.091,
"step": 1166
},
{
"epoch": 12.0,
"grad_norm": 2.3833324909210205,
"learning_rate": 4.4000000000000006e-05,
"loss": 0.1645,
"step": 1272
},
{
"epoch": 12.0,
"eval_LOCATION_f1": 0.7947019867549668,
"eval_LOCATION_number": 72,
"eval_LOCATION_precision": 0.759493670886076,
"eval_LOCATION_recall": 0.8333333333333334,
"eval_ORGANIZATION_f1": 0.6511627906976744,
"eval_ORGANIZATION_number": 75,
"eval_ORGANIZATION_precision": 0.5773195876288659,
"eval_ORGANIZATION_recall": 0.7466666666666667,
"eval_PERSON_f1": 0.8571428571428571,
"eval_PERSON_number": 143,
"eval_PERSON_precision": 0.8,
"eval_PERSON_recall": 0.9230769230769231,
"eval_QUANTITY_f1": 0.5925925925925926,
"eval_QUANTITY_number": 23,
"eval_QUANTITY_precision": 0.5161290322580645,
"eval_QUANTITY_recall": 0.6956521739130435,
"eval_TIME_f1": 0.8518518518518519,
"eval_TIME_number": 26,
"eval_TIME_precision": 0.8214285714285714,
"eval_TIME_recall": 0.8846153846153846,
"eval_loss": 0.1452288031578064,
"eval_overall_accuracy": 0.9514635976982737,
"eval_overall_f1": 0.7767253044654939,
"eval_overall_precision": 0.7175,
"eval_overall_recall": 0.8466076696165191,
"eval_runtime": 0.3708,
"eval_samples_per_second": 504.307,
"eval_steps_per_second": 8.09,
"step": 1272
},
{
"epoch": 13.0,
"grad_norm": 1.4393219947814941,
"learning_rate": 4.35e-05,
"loss": 0.1572,
"step": 1378
},
{
"epoch": 13.0,
"eval_LOCATION_f1": 0.8079470198675496,
"eval_LOCATION_number": 72,
"eval_LOCATION_precision": 0.7721518987341772,
"eval_LOCATION_recall": 0.8472222222222222,
"eval_ORGANIZATION_f1": 0.6775956284153005,
"eval_ORGANIZATION_number": 75,
"eval_ORGANIZATION_precision": 0.5740740740740741,
"eval_ORGANIZATION_recall": 0.8266666666666667,
"eval_PERSON_f1": 0.8562300319488818,
"eval_PERSON_number": 143,
"eval_PERSON_precision": 0.788235294117647,
"eval_PERSON_recall": 0.9370629370629371,
"eval_QUANTITY_f1": 0.6923076923076923,
"eval_QUANTITY_number": 23,
"eval_QUANTITY_precision": 0.6206896551724138,
"eval_QUANTITY_recall": 0.782608695652174,
"eval_TIME_f1": 0.8070175438596492,
"eval_TIME_number": 26,
"eval_TIME_precision": 0.7419354838709677,
"eval_TIME_recall": 0.8846153846153846,
"eval_loss": 0.1519501805305481,
"eval_overall_accuracy": 0.9514635976982737,
"eval_overall_f1": 0.7883597883597884,
"eval_overall_precision": 0.7146282973621103,
"eval_overall_recall": 0.8790560471976401,
"eval_runtime": 0.3713,
"eval_samples_per_second": 503.618,
"eval_steps_per_second": 8.079,
"step": 1378
},
{
"epoch": 14.0,
"grad_norm": 1.3148809671401978,
"learning_rate": 4.3e-05,
"loss": 0.1538,
"step": 1484
},
{
"epoch": 14.0,
"eval_LOCATION_f1": 0.7972972972972973,
"eval_LOCATION_number": 72,
"eval_LOCATION_precision": 0.7763157894736842,
"eval_LOCATION_recall": 0.8194444444444444,
"eval_ORGANIZATION_f1": 0.6630434782608695,
"eval_ORGANIZATION_number": 75,
"eval_ORGANIZATION_precision": 0.5596330275229358,
"eval_ORGANIZATION_recall": 0.8133333333333334,
"eval_PERSON_f1": 0.8664495114006516,
"eval_PERSON_number": 143,
"eval_PERSON_precision": 0.8109756097560976,
"eval_PERSON_recall": 0.9300699300699301,
"eval_QUANTITY_f1": 0.7169811320754716,
"eval_QUANTITY_number": 23,
"eval_QUANTITY_precision": 0.6333333333333333,
"eval_QUANTITY_recall": 0.8260869565217391,
"eval_TIME_f1": 0.8214285714285715,
"eval_TIME_number": 26,
"eval_TIME_precision": 0.7666666666666667,
"eval_TIME_recall": 0.8846153846153846,
"eval_loss": 0.1491760015487671,
"eval_overall_accuracy": 0.9509632224168126,
"eval_overall_f1": 0.788770053475936,
"eval_overall_precision": 0.7212713936430318,
"eval_overall_recall": 0.8702064896755162,
"eval_runtime": 0.3732,
"eval_samples_per_second": 501.038,
"eval_steps_per_second": 8.038,
"step": 1484
},
{
"epoch": 15.0,
"grad_norm": 0.9081311225891113,
"learning_rate": 4.25e-05,
"loss": 0.1483,
"step": 1590
},
{
"epoch": 15.0,
"eval_LOCATION_f1": 0.7919463087248323,
"eval_LOCATION_number": 72,
"eval_LOCATION_precision": 0.7662337662337663,
"eval_LOCATION_recall": 0.8194444444444444,
"eval_ORGANIZATION_f1": 0.6666666666666666,
"eval_ORGANIZATION_number": 75,
"eval_ORGANIZATION_precision": 0.59375,
"eval_ORGANIZATION_recall": 0.76,
"eval_PERSON_f1": 0.8721311475409836,
"eval_PERSON_number": 143,
"eval_PERSON_precision": 0.8209876543209876,
"eval_PERSON_recall": 0.9300699300699301,
"eval_QUANTITY_f1": 0.6923076923076923,
"eval_QUANTITY_number": 23,
"eval_QUANTITY_precision": 0.6206896551724138,
"eval_QUANTITY_recall": 0.782608695652174,
"eval_TIME_f1": 0.8518518518518519,
"eval_TIME_number": 26,
"eval_TIME_precision": 0.8214285714285714,
"eval_TIME_recall": 0.8846153846153846,
"eval_loss": 0.1384066790342331,
"eval_overall_accuracy": 0.9549662246685013,
"eval_overall_f1": 0.7934336525307797,
"eval_overall_precision": 0.7397959183673469,
"eval_overall_recall": 0.855457227138643,
"eval_runtime": 0.3693,
"eval_samples_per_second": 506.326,
"eval_steps_per_second": 8.123,
"step": 1590
},
{
"epoch": 16.0,
"grad_norm": 1.228157877922058,
"learning_rate": 4.2e-05,
"loss": 0.145,
"step": 1696
},
{
"epoch": 16.0,
"eval_LOCATION_f1": 0.7792207792207793,
"eval_LOCATION_number": 72,
"eval_LOCATION_precision": 0.7317073170731707,
"eval_LOCATION_recall": 0.8333333333333334,
"eval_ORGANIZATION_f1": 0.6737967914438503,
"eval_ORGANIZATION_number": 75,
"eval_ORGANIZATION_precision": 0.5625,
"eval_ORGANIZATION_recall": 0.84,
"eval_PERSON_f1": 0.8681672025723473,
"eval_PERSON_number": 143,
"eval_PERSON_precision": 0.8035714285714286,
"eval_PERSON_recall": 0.9440559440559441,
"eval_QUANTITY_f1": 0.7407407407407407,
"eval_QUANTITY_number": 23,
"eval_QUANTITY_precision": 0.6451612903225806,
"eval_QUANTITY_recall": 0.8695652173913043,
"eval_TIME_f1": 0.7857142857142856,
"eval_TIME_number": 26,
"eval_TIME_precision": 0.7333333333333333,
"eval_TIME_recall": 0.8461538461538461,
"eval_loss": 0.15306319296360016,
"eval_overall_accuracy": 0.9497122842131599,
"eval_overall_f1": 0.7874015748031495,
"eval_overall_precision": 0.7092198581560284,
"eval_overall_recall": 0.8849557522123894,
"eval_runtime": 0.3725,
"eval_samples_per_second": 502.005,
"eval_steps_per_second": 8.054,
"step": 1696
},
{
"epoch": 17.0,
"grad_norm": 0.6019057035446167,
"learning_rate": 4.15e-05,
"loss": 0.1378,
"step": 1802
},
{
"epoch": 17.0,
"eval_LOCATION_f1": 0.7770700636942675,
"eval_LOCATION_number": 72,
"eval_LOCATION_precision": 0.7176470588235294,
"eval_LOCATION_recall": 0.8472222222222222,
"eval_ORGANIZATION_f1": 0.6703296703296704,
"eval_ORGANIZATION_number": 75,
"eval_ORGANIZATION_precision": 0.5700934579439252,
"eval_ORGANIZATION_recall": 0.8133333333333334,
"eval_PERSON_f1": 0.8778877887788779,
"eval_PERSON_number": 143,
"eval_PERSON_precision": 0.83125,
"eval_PERSON_recall": 0.9300699300699301,
"eval_QUANTITY_f1": 0.7272727272727273,
"eval_QUANTITY_number": 23,
"eval_QUANTITY_precision": 0.625,
"eval_QUANTITY_recall": 0.8695652173913043,
"eval_TIME_f1": 0.8363636363636363,
"eval_TIME_number": 26,
"eval_TIME_precision": 0.7931034482758621,
"eval_TIME_recall": 0.8846153846153846,
"eval_loss": 0.146218940615654,
"eval_overall_accuracy": 0.9514635976982737,
"eval_overall_f1": 0.7925531914893617,
"eval_overall_precision": 0.7215496368038741,
"eval_overall_recall": 0.8790560471976401,
"eval_runtime": 0.3673,
"eval_samples_per_second": 509.115,
"eval_steps_per_second": 8.168,
"step": 1802
},
{
"epoch": 18.0,
"grad_norm": 0.6048269867897034,
"learning_rate": 4.1e-05,
"loss": 0.137,
"step": 1908
},
{
"epoch": 18.0,
"eval_LOCATION_f1": 0.7898089171974522,
"eval_LOCATION_number": 72,
"eval_LOCATION_precision": 0.7294117647058823,
"eval_LOCATION_recall": 0.8611111111111112,
"eval_ORGANIZATION_f1": 0.6486486486486486,
"eval_ORGANIZATION_number": 75,
"eval_ORGANIZATION_precision": 0.5454545454545454,
"eval_ORGANIZATION_recall": 0.8,
"eval_PERSON_f1": 0.8837209302325583,
"eval_PERSON_number": 143,
"eval_PERSON_precision": 0.8417721518987342,
"eval_PERSON_recall": 0.9300699300699301,
"eval_QUANTITY_f1": 0.7407407407407407,
"eval_QUANTITY_number": 23,
"eval_QUANTITY_precision": 0.6451612903225806,
"eval_QUANTITY_recall": 0.8695652173913043,
"eval_TIME_f1": 0.8363636363636363,
"eval_TIME_number": 26,
"eval_TIME_precision": 0.7931034482758621,
"eval_TIME_recall": 0.8846153846153846,
"eval_loss": 0.143734872341156,
"eval_overall_accuracy": 0.9522141606204654,
"eval_overall_f1": 0.7925531914893617,
"eval_overall_precision": 0.7215496368038741,
"eval_overall_recall": 0.8790560471976401,
"eval_runtime": 0.3712,
"eval_samples_per_second": 503.734,
"eval_steps_per_second": 8.081,
"step": 1908
},
{
"epoch": 19.0,
"grad_norm": 0.9862064719200134,
"learning_rate": 4.05e-05,
"loss": 0.1316,
"step": 2014
},
{
"epoch": 19.0,
"eval_LOCATION_f1": 0.7792207792207793,
"eval_LOCATION_number": 72,
"eval_LOCATION_precision": 0.7317073170731707,
"eval_LOCATION_recall": 0.8333333333333334,
"eval_ORGANIZATION_f1": 0.6931818181818181,
"eval_ORGANIZATION_number": 75,
"eval_ORGANIZATION_precision": 0.6039603960396039,
"eval_ORGANIZATION_recall": 0.8133333333333334,
"eval_PERSON_f1": 0.868421052631579,
"eval_PERSON_number": 143,
"eval_PERSON_precision": 0.8198757763975155,
"eval_PERSON_recall": 0.9230769230769231,
"eval_QUANTITY_f1": 0.7407407407407407,
"eval_QUANTITY_number": 23,
"eval_QUANTITY_precision": 0.6451612903225806,
"eval_QUANTITY_recall": 0.8695652173913043,
"eval_TIME_f1": 0.8,
"eval_TIME_number": 26,
"eval_TIME_precision": 0.7586206896551724,
"eval_TIME_recall": 0.8461538461538461,
"eval_loss": 0.13715997338294983,
"eval_overall_accuracy": 0.9542156617463098,
"eval_overall_f1": 0.7940780619111709,
"eval_overall_precision": 0.7301980198019802,
"eval_overall_recall": 0.8702064896755162,
"eval_runtime": 0.3712,
"eval_samples_per_second": 503.829,
"eval_steps_per_second": 8.083,
"step": 2014
},
{
"epoch": 20.0,
"grad_norm": 1.5772024393081665,
"learning_rate": 4e-05,
"loss": 0.1274,
"step": 2120
},
{
"epoch": 20.0,
"eval_LOCATION_f1": 0.7875000000000001,
"eval_LOCATION_number": 72,
"eval_LOCATION_precision": 0.7159090909090909,
"eval_LOCATION_recall": 0.875,
"eval_ORGANIZATION_f1": 0.6918918918918919,
"eval_ORGANIZATION_number": 75,
"eval_ORGANIZATION_precision": 0.5818181818181818,
"eval_ORGANIZATION_recall": 0.8533333333333334,
"eval_PERSON_f1": 0.8721311475409836,
"eval_PERSON_number": 143,
"eval_PERSON_precision": 0.8209876543209876,
"eval_PERSON_recall": 0.9300699300699301,
"eval_QUANTITY_f1": 0.7272727272727273,
"eval_QUANTITY_number": 23,
"eval_QUANTITY_precision": 0.625,
"eval_QUANTITY_recall": 0.8695652173913043,
"eval_TIME_f1": 0.7586206896551724,
"eval_TIME_number": 26,
"eval_TIME_precision": 0.6875,
"eval_TIME_recall": 0.8461538461538461,
"eval_loss": 0.1509571373462677,
"eval_overall_accuracy": 0.950212659494621,
"eval_overall_f1": 0.7916120576671036,
"eval_overall_precision": 0.7122641509433962,
"eval_overall_recall": 0.8908554572271387,
"eval_runtime": 0.3724,
"eval_samples_per_second": 502.213,
"eval_steps_per_second": 8.057,
"step": 2120
},
{
"epoch": 21.0,
"grad_norm": 1.3061535358428955,
"learning_rate": 3.9500000000000005e-05,
"loss": 0.1279,
"step": 2226
},
{
"epoch": 21.0,
"eval_LOCATION_f1": 0.7898089171974522,
"eval_LOCATION_number": 72,
"eval_LOCATION_precision": 0.7294117647058823,
"eval_LOCATION_recall": 0.8611111111111112,
"eval_ORGANIZATION_f1": 0.7111111111111111,
"eval_ORGANIZATION_number": 75,
"eval_ORGANIZATION_precision": 0.6095238095238096,
"eval_ORGANIZATION_recall": 0.8533333333333334,
"eval_PERSON_f1": 0.8737864077669902,
"eval_PERSON_number": 143,
"eval_PERSON_precision": 0.8132530120481928,
"eval_PERSON_recall": 0.9440559440559441,
"eval_QUANTITY_f1": 0.7407407407407407,
"eval_QUANTITY_number": 23,
"eval_QUANTITY_precision": 0.6451612903225806,
"eval_QUANTITY_recall": 0.8695652173913043,
"eval_TIME_f1": 0.8363636363636363,
"eval_TIME_number": 26,
"eval_TIME_precision": 0.7931034482758621,
"eval_TIME_recall": 0.8846153846153846,
"eval_loss": 0.14436930418014526,
"eval_overall_accuracy": 0.9532149111833875,
"eval_overall_f1": 0.8052980132450331,
"eval_overall_precision": 0.7307692307692307,
"eval_overall_recall": 0.8967551622418879,
"eval_runtime": 0.3764,
"eval_samples_per_second": 496.865,
"eval_steps_per_second": 7.971,
"step": 2226
},
{
"epoch": 22.0,
"grad_norm": 0.9500447511672974,
"learning_rate": 3.9000000000000006e-05,
"loss": 0.1256,
"step": 2332
},
{
"epoch": 22.0,
"eval_LOCATION_f1": 0.8051948051948052,
"eval_LOCATION_number": 72,
"eval_LOCATION_precision": 0.7560975609756098,
"eval_LOCATION_recall": 0.8611111111111112,
"eval_ORGANIZATION_f1": 0.7159090909090909,
"eval_ORGANIZATION_number": 75,
"eval_ORGANIZATION_precision": 0.6237623762376238,
"eval_ORGANIZATION_recall": 0.84,
"eval_PERSON_f1": 0.8852459016393444,
"eval_PERSON_number": 143,
"eval_PERSON_precision": 0.8333333333333334,
"eval_PERSON_recall": 0.9440559440559441,
"eval_QUANTITY_f1": 0.7142857142857143,
"eval_QUANTITY_number": 23,
"eval_QUANTITY_precision": 0.6060606060606061,
"eval_QUANTITY_recall": 0.8695652173913043,
"eval_TIME_f1": 0.8363636363636363,
"eval_TIME_number": 26,
"eval_TIME_precision": 0.7931034482758621,
"eval_TIME_recall": 0.8846153846153846,
"eval_loss": 0.13468235731124878,
"eval_overall_accuracy": 0.9567175381536153,
"eval_overall_f1": 0.8123324396782842,
"eval_overall_precision": 0.7444717444717445,
"eval_overall_recall": 0.8938053097345132,
"eval_runtime": 0.3693,
"eval_samples_per_second": 506.364,
"eval_steps_per_second": 8.123,
"step": 2332
},
{
"epoch": 23.0,
"grad_norm": 1.3265873193740845,
"learning_rate": 3.85e-05,
"loss": 0.123,
"step": 2438
},
{
"epoch": 23.0,
"eval_LOCATION_f1": 0.781456953642384,
"eval_LOCATION_number": 72,
"eval_LOCATION_precision": 0.7468354430379747,
"eval_LOCATION_recall": 0.8194444444444444,
"eval_ORGANIZATION_f1": 0.7262569832402236,
"eval_ORGANIZATION_number": 75,
"eval_ORGANIZATION_precision": 0.625,
"eval_ORGANIZATION_recall": 0.8666666666666667,
"eval_PERSON_f1": 0.8831168831168831,
"eval_PERSON_number": 143,
"eval_PERSON_precision": 0.8242424242424242,
"eval_PERSON_recall": 0.951048951048951,
"eval_QUANTITY_f1": 0.6785714285714286,
"eval_QUANTITY_number": 23,
"eval_QUANTITY_precision": 0.5757575757575758,
"eval_QUANTITY_recall": 0.8260869565217391,
"eval_TIME_f1": 0.8,
"eval_TIME_number": 26,
"eval_TIME_precision": 0.7586206896551724,
"eval_TIME_recall": 0.8461538461538461,
"eval_loss": 0.13530714809894562,
"eval_overall_accuracy": 0.955716787590693,
"eval_overall_f1": 0.8037383177570093,
"eval_overall_precision": 0.7341463414634146,
"eval_overall_recall": 0.887905604719764,
"eval_runtime": 0.3693,
"eval_samples_per_second": 506.356,
"eval_steps_per_second": 8.123,
"step": 2438
},
{
"epoch": 24.0,
"grad_norm": 1.4870867729187012,
"learning_rate": 3.8e-05,
"loss": 0.1219,
"step": 2544
},
{
"epoch": 24.0,
"eval_LOCATION_f1": 0.7654320987654321,
"eval_LOCATION_number": 72,
"eval_LOCATION_precision": 0.6888888888888889,
"eval_LOCATION_recall": 0.8611111111111112,
"eval_ORGANIZATION_f1": 0.7032967032967032,
"eval_ORGANIZATION_number": 75,
"eval_ORGANIZATION_precision": 0.5981308411214953,
"eval_ORGANIZATION_recall": 0.8533333333333334,
"eval_PERSON_f1": 0.8794788273615636,
"eval_PERSON_number": 143,
"eval_PERSON_precision": 0.823170731707317,
"eval_PERSON_recall": 0.9440559440559441,
"eval_QUANTITY_f1": 0.7017543859649124,
"eval_QUANTITY_number": 23,
"eval_QUANTITY_precision": 0.5882352941176471,
"eval_QUANTITY_recall": 0.8695652173913043,
"eval_TIME_f1": 0.7586206896551724,
"eval_TIME_number": 26,
"eval_TIME_precision": 0.6875,
"eval_TIME_recall": 0.8461538461538461,
"eval_loss": 0.14730946719646454,
"eval_overall_accuracy": 0.9519639729797348,
"eval_overall_f1": 0.7911227154046998,
"eval_overall_precision": 0.7096018735362998,
"eval_overall_recall": 0.8938053097345132,
"eval_runtime": 0.3722,
"eval_samples_per_second": 502.446,
"eval_steps_per_second": 8.061,
"step": 2544
},
{
"epoch": 25.0,
"grad_norm": 1.858078956604004,
"learning_rate": 3.7500000000000003e-05,
"loss": 0.1193,
"step": 2650
},
{
"epoch": 25.0,
"eval_LOCATION_f1": 0.8051948051948052,
"eval_LOCATION_number": 72,
"eval_LOCATION_precision": 0.7560975609756098,
"eval_LOCATION_recall": 0.8611111111111112,
"eval_ORGANIZATION_f1": 0.735632183908046,
"eval_ORGANIZATION_number": 75,
"eval_ORGANIZATION_precision": 0.6464646464646465,
"eval_ORGANIZATION_recall": 0.8533333333333334,
"eval_PERSON_f1": 0.8896103896103895,
"eval_PERSON_number": 143,
"eval_PERSON_precision": 0.8303030303030303,
"eval_PERSON_recall": 0.958041958041958,
"eval_QUANTITY_f1": 0.6785714285714286,
"eval_QUANTITY_number": 23,
"eval_QUANTITY_precision": 0.5757575757575758,
"eval_QUANTITY_recall": 0.8260869565217391,
"eval_TIME_f1": 0.7857142857142856,
"eval_TIME_number": 26,
"eval_TIME_precision": 0.7333333333333333,
"eval_TIME_recall": 0.8461538461538461,
"eval_loss": 0.1400519758462906,
"eval_overall_accuracy": 0.9567175381536153,
"eval_overall_f1": 0.8128342245989304,
"eval_overall_precision": 0.7432762836185819,
"eval_overall_recall": 0.8967551622418879,
"eval_runtime": 0.368,
"eval_samples_per_second": 508.1,
"eval_steps_per_second": 8.151,
"step": 2650
},
{
"epoch": 26.0,
"grad_norm": 0.955053985118866,
"learning_rate": 3.7e-05,
"loss": 0.1168,
"step": 2756
},
{
"epoch": 26.0,
"eval_LOCATION_f1": 0.7948717948717949,
"eval_LOCATION_number": 72,
"eval_LOCATION_precision": 0.7380952380952381,
"eval_LOCATION_recall": 0.8611111111111112,
"eval_ORGANIZATION_f1": 0.7159090909090909,
"eval_ORGANIZATION_number": 75,
"eval_ORGANIZATION_precision": 0.6237623762376238,
"eval_ORGANIZATION_recall": 0.84,
"eval_PERSON_f1": 0.8881578947368421,
"eval_PERSON_number": 143,
"eval_PERSON_precision": 0.8385093167701864,
"eval_PERSON_recall": 0.9440559440559441,
"eval_QUANTITY_f1": 0.6792452830188679,
"eval_QUANTITY_number": 23,
"eval_QUANTITY_precision": 0.6,
"eval_QUANTITY_recall": 0.782608695652174,
"eval_TIME_f1": 0.7857142857142856,
"eval_TIME_number": 26,
"eval_TIME_precision": 0.7333333333333333,
"eval_TIME_recall": 0.8461538461538461,
"eval_loss": 0.13576149940490723,
"eval_overall_accuracy": 0.955716787590693,
"eval_overall_f1": 0.8053691275167786,
"eval_overall_precision": 0.7389162561576355,
"eval_overall_recall": 0.8849557522123894,
"eval_runtime": 0.3716,
"eval_samples_per_second": 503.212,
"eval_steps_per_second": 8.073,
"step": 2756
},
{
"epoch": 27.0,
"grad_norm": 1.6411521434783936,
"learning_rate": 3.65e-05,
"loss": 0.1132,
"step": 2862
},
{
"epoch": 27.0,
"eval_LOCATION_f1": 0.7625000000000001,
"eval_LOCATION_number": 72,
"eval_LOCATION_precision": 0.6931818181818182,
"eval_LOCATION_recall": 0.8472222222222222,
"eval_ORGANIZATION_f1": 0.7073170731707319,
"eval_ORGANIZATION_number": 75,
"eval_ORGANIZATION_precision": 0.651685393258427,
"eval_ORGANIZATION_recall": 0.7733333333333333,
"eval_PERSON_f1": 0.8852459016393444,
"eval_PERSON_number": 143,
"eval_PERSON_precision": 0.8333333333333334,
"eval_PERSON_recall": 0.9440559440559441,
"eval_QUANTITY_f1": 0.6785714285714286,
"eval_QUANTITY_number": 23,
"eval_QUANTITY_precision": 0.5757575757575758,
"eval_QUANTITY_recall": 0.8260869565217391,
"eval_TIME_f1": 0.8,
"eval_TIME_number": 26,
"eval_TIME_precision": 0.7586206896551724,
"eval_TIME_recall": 0.8461538461538461,
"eval_loss": 0.14072290062904358,
"eval_overall_accuracy": 0.9547160370277709,
"eval_overall_f1": 0.7972972972972973,
"eval_overall_precision": 0.7356608478802993,
"eval_overall_recall": 0.8702064896755162,
"eval_runtime": 0.3708,
"eval_samples_per_second": 504.296,
"eval_steps_per_second": 8.09,
"step": 2862
},
{
"epoch": 28.0,
"grad_norm": 1.1676483154296875,
"learning_rate": 3.6e-05,
"loss": 0.115,
"step": 2968
},
{
"epoch": 28.0,
"eval_LOCATION_f1": 0.7922077922077924,
"eval_LOCATION_number": 72,
"eval_LOCATION_precision": 0.7439024390243902,
"eval_LOCATION_recall": 0.8472222222222222,
"eval_ORGANIZATION_f1": 0.7231638418079096,
"eval_ORGANIZATION_number": 75,
"eval_ORGANIZATION_precision": 0.6274509803921569,
"eval_ORGANIZATION_recall": 0.8533333333333334,
"eval_PERSON_f1": 0.881578947368421,
"eval_PERSON_number": 143,
"eval_PERSON_precision": 0.8322981366459627,
"eval_PERSON_recall": 0.9370629370629371,
"eval_QUANTITY_f1": 0.6909090909090908,
"eval_QUANTITY_number": 23,
"eval_QUANTITY_precision": 0.59375,
"eval_QUANTITY_recall": 0.8260869565217391,
"eval_TIME_f1": 0.8363636363636363,
"eval_TIME_number": 26,
"eval_TIME_precision": 0.7931034482758621,
"eval_TIME_recall": 0.8846153846153846,
"eval_loss": 0.13657206296920776,
"eval_overall_accuracy": 0.9567175381536153,
"eval_overall_f1": 0.8080536912751678,
"eval_overall_precision": 0.7413793103448276,
"eval_overall_recall": 0.887905604719764,
"eval_runtime": 0.3699,
"eval_samples_per_second": 505.486,
"eval_steps_per_second": 8.109,
"step": 2968
},
{
"epoch": 29.0,
"grad_norm": 1.2002038955688477,
"learning_rate": 3.55e-05,
"loss": 0.112,
"step": 3074
},
{
"epoch": 29.0,
"eval_LOCATION_f1": 0.8,
"eval_LOCATION_number": 72,
"eval_LOCATION_precision": 0.7469879518072289,
"eval_LOCATION_recall": 0.8611111111111112,
"eval_ORGANIZATION_f1": 0.7386363636363636,
"eval_ORGANIZATION_number": 75,
"eval_ORGANIZATION_precision": 0.6435643564356436,
"eval_ORGANIZATION_recall": 0.8666666666666667,
"eval_PERSON_f1": 0.9006622516556291,
"eval_PERSON_number": 143,
"eval_PERSON_precision": 0.8553459119496856,
"eval_PERSON_recall": 0.951048951048951,
"eval_QUANTITY_f1": 0.6909090909090908,
"eval_QUANTITY_number": 23,
"eval_QUANTITY_precision": 0.59375,
"eval_QUANTITY_recall": 0.8260869565217391,
"eval_TIME_f1": 0.8,
"eval_TIME_number": 26,
"eval_TIME_precision": 0.7586206896551724,
"eval_TIME_recall": 0.8461538461538461,
"eval_loss": 0.13843736052513123,
"eval_overall_accuracy": 0.9559669752314236,
"eval_overall_f1": 0.8183041722745626,
"eval_overall_precision": 0.7524752475247525,
"eval_overall_recall": 0.8967551622418879,
"eval_runtime": 0.371,
"eval_samples_per_second": 504.044,
"eval_steps_per_second": 8.086,
"step": 3074
},
{
"epoch": 30.0,
"grad_norm": 1.0138002634048462,
"learning_rate": 3.5e-05,
"loss": 0.1112,
"step": 3180
},
{
"epoch": 30.0,
"eval_LOCATION_f1": 0.7701863354037267,
"eval_LOCATION_number": 72,
"eval_LOCATION_precision": 0.6966292134831461,
"eval_LOCATION_recall": 0.8611111111111112,
"eval_ORGANIZATION_f1": 0.7303370786516854,
"eval_ORGANIZATION_number": 75,
"eval_ORGANIZATION_precision": 0.6310679611650486,
"eval_ORGANIZATION_recall": 0.8666666666666667,
"eval_PERSON_f1": 0.8947368421052632,
"eval_PERSON_number": 143,
"eval_PERSON_precision": 0.84472049689441,
"eval_PERSON_recall": 0.951048951048951,
"eval_QUANTITY_f1": 0.6545454545454547,
"eval_QUANTITY_number": 23,
"eval_QUANTITY_precision": 0.5625,
"eval_QUANTITY_recall": 0.782608695652174,
"eval_TIME_f1": 0.8,
"eval_TIME_number": 26,
"eval_TIME_precision": 0.7586206896551724,
"eval_TIME_recall": 0.8461538461538461,
"eval_loss": 0.13617390394210815,
"eval_overall_accuracy": 0.955716787590693,
"eval_overall_f1": 0.804780876494024,
"eval_overall_precision": 0.7318840579710145,
"eval_overall_recall": 0.8938053097345132,
"eval_runtime": 0.3711,
"eval_samples_per_second": 503.907,
"eval_steps_per_second": 8.084,
"step": 3180
},
{
"epoch": 31.0,
"grad_norm": 0.6963276863098145,
"learning_rate": 3.45e-05,
"loss": 0.1093,
"step": 3286
},
{
"epoch": 31.0,
"eval_LOCATION_f1": 0.782051282051282,
"eval_LOCATION_number": 72,
"eval_LOCATION_precision": 0.7261904761904762,
"eval_LOCATION_recall": 0.8472222222222222,
"eval_ORGANIZATION_f1": 0.7455621301775148,
"eval_ORGANIZATION_number": 75,
"eval_ORGANIZATION_precision": 0.6702127659574468,
"eval_ORGANIZATION_recall": 0.84,
"eval_PERSON_f1": 0.8947368421052632,
"eval_PERSON_number": 143,
"eval_PERSON_precision": 0.84472049689441,
"eval_PERSON_recall": 0.951048951048951,
"eval_QUANTITY_f1": 0.6909090909090908,
"eval_QUANTITY_number": 23,
"eval_QUANTITY_precision": 0.59375,
"eval_QUANTITY_recall": 0.8260869565217391,
"eval_TIME_f1": 0.8363636363636363,
"eval_TIME_number": 26,
"eval_TIME_precision": 0.7931034482758621,
"eval_TIME_recall": 0.8846153846153846,
"eval_loss": 0.13229180872440338,
"eval_overall_accuracy": 0.9577182887165374,
"eval_overall_f1": 0.817320703653586,
"eval_overall_precision": 0.755,
"eval_overall_recall": 0.8908554572271387,
"eval_runtime": 0.369,
"eval_samples_per_second": 506.747,
"eval_steps_per_second": 8.13,
"step": 3286
},
{
"epoch": 32.0,
"grad_norm": 2.4005796909332275,
"learning_rate": 3.4000000000000007e-05,
"loss": 0.1075,
"step": 3392
},
{
"epoch": 32.0,
"eval_LOCATION_f1": 0.8157894736842106,
"eval_LOCATION_number": 72,
"eval_LOCATION_precision": 0.775,
"eval_LOCATION_recall": 0.8611111111111112,
"eval_ORGANIZATION_f1": 0.7425149700598803,
"eval_ORGANIZATION_number": 75,
"eval_ORGANIZATION_precision": 0.6739130434782609,
"eval_ORGANIZATION_recall": 0.8266666666666667,
"eval_PERSON_f1": 0.9,
"eval_PERSON_number": 143,
"eval_PERSON_precision": 0.8598726114649682,
"eval_PERSON_recall": 0.9440559440559441,
"eval_QUANTITY_f1": 0.6909090909090908,
"eval_QUANTITY_number": 23,
"eval_QUANTITY_precision": 0.59375,
"eval_QUANTITY_recall": 0.8260869565217391,
"eval_TIME_f1": 0.8363636363636363,
"eval_TIME_number": 26,
"eval_TIME_precision": 0.7931034482758621,
"eval_TIME_recall": 0.8846153846153846,
"eval_loss": 0.12926289439201355,
"eval_overall_accuracy": 0.9597197898423818,
"eval_overall_f1": 0.8257887517146778,
"eval_overall_precision": 0.7717948717948718,
"eval_overall_recall": 0.887905604719764,
"eval_runtime": 0.3724,
"eval_samples_per_second": 502.175,
"eval_steps_per_second": 8.056,
"step": 3392
},
{
"epoch": 33.0,
"grad_norm": 1.497031807899475,
"learning_rate": 3.35e-05,
"loss": 0.1046,
"step": 3498
},
{
"epoch": 33.0,
"eval_LOCATION_f1": 0.7770700636942675,
"eval_LOCATION_number": 72,
"eval_LOCATION_precision": 0.7176470588235294,
"eval_LOCATION_recall": 0.8472222222222222,
"eval_ORGANIZATION_f1": 0.744186046511628,
"eval_ORGANIZATION_number": 75,
"eval_ORGANIZATION_precision": 0.6597938144329897,
"eval_ORGANIZATION_recall": 0.8533333333333334,
"eval_PERSON_f1": 0.9158249158249158,
"eval_PERSON_number": 143,
"eval_PERSON_precision": 0.8831168831168831,
"eval_PERSON_recall": 0.951048951048951,
"eval_QUANTITY_f1": 0.6545454545454547,
"eval_QUANTITY_number": 23,
"eval_QUANTITY_precision": 0.5625,
"eval_QUANTITY_recall": 0.782608695652174,
"eval_TIME_f1": 0.8214285714285715,
"eval_TIME_number": 26,
"eval_TIME_precision": 0.7666666666666667,
"eval_TIME_recall": 0.8846153846153846,
"eval_loss": 0.13126622140407562,
"eval_overall_accuracy": 0.9594696022016512,
"eval_overall_f1": 0.819538670284939,
"eval_overall_precision": 0.7587939698492462,
"eval_overall_recall": 0.8908554572271387,
"eval_runtime": 0.3762,
"eval_samples_per_second": 497.031,
"eval_steps_per_second": 7.974,
"step": 3498
},
{
"epoch": 34.0,
"grad_norm": 0.8285422921180725,
"learning_rate": 3.3e-05,
"loss": 0.1017,
"step": 3604
},
{
"epoch": 34.0,
"eval_LOCATION_f1": 0.7848101265822784,
"eval_LOCATION_number": 72,
"eval_LOCATION_precision": 0.7209302325581395,
"eval_LOCATION_recall": 0.8611111111111112,
"eval_ORGANIZATION_f1": 0.7314285714285714,
"eval_ORGANIZATION_number": 75,
"eval_ORGANIZATION_precision": 0.64,
"eval_ORGANIZATION_recall": 0.8533333333333334,
"eval_PERSON_f1": 0.8823529411764706,
"eval_PERSON_number": 143,
"eval_PERSON_precision": 0.8282208588957055,
"eval_PERSON_recall": 0.9440559440559441,
"eval_QUANTITY_f1": 0.6428571428571429,
"eval_QUANTITY_number": 23,
"eval_QUANTITY_precision": 0.5454545454545454,
"eval_QUANTITY_recall": 0.782608695652174,
"eval_TIME_f1": 0.7586206896551724,
"eval_TIME_number": 26,
"eval_TIME_precision": 0.6875,
"eval_TIME_recall": 0.8461538461538461,
"eval_loss": 0.1426933854818344,
"eval_overall_accuracy": 0.9547160370277709,
"eval_overall_f1": 0.799468791500664,
"eval_overall_precision": 0.7270531400966184,
"eval_overall_recall": 0.887905604719764,
"eval_runtime": 0.3722,
"eval_samples_per_second": 502.449,
"eval_steps_per_second": 8.061,
"step": 3604
},
{
"epoch": 35.0,
"grad_norm": 1.9264658689498901,
"learning_rate": 3.2500000000000004e-05,
"loss": 0.1071,
"step": 3710
},
{
"epoch": 35.0,
"eval_LOCATION_f1": 0.779874213836478,
"eval_LOCATION_number": 72,
"eval_LOCATION_precision": 0.7126436781609196,
"eval_LOCATION_recall": 0.8611111111111112,
"eval_ORGANIZATION_f1": 0.7231638418079096,
"eval_ORGANIZATION_number": 75,
"eval_ORGANIZATION_precision": 0.6274509803921569,
"eval_ORGANIZATION_recall": 0.8533333333333334,
"eval_PERSON_f1": 0.9066666666666667,
"eval_PERSON_number": 143,
"eval_PERSON_precision": 0.8662420382165605,
"eval_PERSON_recall": 0.951048951048951,
"eval_QUANTITY_f1": 0.6428571428571429,
"eval_QUANTITY_number": 23,
"eval_QUANTITY_precision": 0.5454545454545454,
"eval_QUANTITY_recall": 0.782608695652174,
"eval_TIME_f1": 0.8363636363636363,
"eval_TIME_number": 26,
"eval_TIME_precision": 0.7931034482758621,
"eval_TIME_recall": 0.8846153846153846,
"eval_loss": 0.14034150540828705,
"eval_overall_accuracy": 0.9562171628721541,
"eval_overall_f1": 0.8112449799196788,
"eval_overall_precision": 0.7426470588235294,
"eval_overall_recall": 0.8938053097345132,
"eval_runtime": 0.3705,
"eval_samples_per_second": 504.772,
"eval_steps_per_second": 8.098,
"step": 3710
},
{
"epoch": 36.0,
"grad_norm": 1.7772150039672852,
"learning_rate": 3.2000000000000005e-05,
"loss": 0.1026,
"step": 3816
},
{
"epoch": 36.0,
"eval_LOCATION_f1": 0.782051282051282,
"eval_LOCATION_number": 72,
"eval_LOCATION_precision": 0.7261904761904762,
"eval_LOCATION_recall": 0.8472222222222222,
"eval_ORGANIZATION_f1": 0.7407407407407408,
"eval_ORGANIZATION_number": 75,
"eval_ORGANIZATION_precision": 0.6896551724137931,
"eval_ORGANIZATION_recall": 0.8,
"eval_PERSON_f1": 0.8976897689768978,
"eval_PERSON_number": 143,
"eval_PERSON_precision": 0.85,
"eval_PERSON_recall": 0.951048951048951,
"eval_QUANTITY_f1": 0.6545454545454547,
"eval_QUANTITY_number": 23,
"eval_QUANTITY_precision": 0.5625,
"eval_QUANTITY_recall": 0.782608695652174,
"eval_TIME_f1": 0.8363636363636363,
"eval_TIME_number": 26,
"eval_TIME_precision": 0.7931034482758621,
"eval_TIME_recall": 0.8846153846153846,
"eval_loss": 0.12969908118247986,
"eval_overall_accuracy": 0.9589692269201902,
"eval_overall_f1": 0.8153214774281805,
"eval_overall_precision": 0.7602040816326531,
"eval_overall_recall": 0.8790560471976401,
"eval_runtime": 0.3711,
"eval_samples_per_second": 503.942,
"eval_steps_per_second": 8.085,
"step": 3816
},
{
"epoch": 37.0,
"grad_norm": 5.3707380294799805,
"learning_rate": 3.15e-05,
"loss": 0.1005,
"step": 3922
},
{
"epoch": 37.0,
"eval_LOCATION_f1": 0.7848101265822784,
"eval_LOCATION_number": 72,
"eval_LOCATION_precision": 0.7209302325581395,
"eval_LOCATION_recall": 0.8611111111111112,
"eval_ORGANIZATION_f1": 0.7570621468926553,
"eval_ORGANIZATION_number": 75,
"eval_ORGANIZATION_precision": 0.6568627450980392,
"eval_ORGANIZATION_recall": 0.8933333333333333,
"eval_PERSON_f1": 0.8954248366013072,
"eval_PERSON_number": 143,
"eval_PERSON_precision": 0.8404907975460123,
"eval_PERSON_recall": 0.958041958041958,
"eval_QUANTITY_f1": 0.6071428571428571,
"eval_QUANTITY_number": 23,
"eval_QUANTITY_precision": 0.5151515151515151,
"eval_QUANTITY_recall": 0.7391304347826086,
"eval_TIME_f1": 0.8214285714285715,
"eval_TIME_number": 26,
"eval_TIME_precision": 0.7666666666666667,
"eval_TIME_recall": 0.8846153846153846,
"eval_loss": 0.14334312081336975,
"eval_overall_accuracy": 0.9549662246685013,
"eval_overall_f1": 0.8127490039840637,
"eval_overall_precision": 0.7391304347826086,
"eval_overall_recall": 0.9026548672566371,
"eval_runtime": 0.3705,
"eval_samples_per_second": 504.68,
"eval_steps_per_second": 8.096,
"step": 3922
},
{
"epoch": 38.0,
"grad_norm": 1.382991075515747,
"learning_rate": 3.1e-05,
"loss": 0.0981,
"step": 4028
},
{
"epoch": 38.0,
"eval_LOCATION_f1": 0.8157894736842106,
"eval_LOCATION_number": 72,
"eval_LOCATION_precision": 0.775,
"eval_LOCATION_recall": 0.8611111111111112,
"eval_ORGANIZATION_f1": 0.7386363636363636,
"eval_ORGANIZATION_number": 75,
"eval_ORGANIZATION_precision": 0.6435643564356436,
"eval_ORGANIZATION_recall": 0.8666666666666667,
"eval_PERSON_f1": 0.8990228013029316,
"eval_PERSON_number": 143,
"eval_PERSON_precision": 0.8414634146341463,
"eval_PERSON_recall": 0.965034965034965,
"eval_QUANTITY_f1": 0.6428571428571429,
"eval_QUANTITY_number": 23,
"eval_QUANTITY_precision": 0.5454545454545454,
"eval_QUANTITY_recall": 0.782608695652174,
"eval_TIME_f1": 0.8214285714285715,
"eval_TIME_number": 26,
"eval_TIME_precision": 0.7666666666666667,
"eval_TIME_recall": 0.8846153846153846,
"eval_loss": 0.14039599895477295,
"eval_overall_accuracy": 0.9572179134350763,
"eval_overall_f1": 0.8192771084337348,
"eval_overall_precision": 0.75,
"eval_overall_recall": 0.9026548672566371,
"eval_runtime": 0.371,
"eval_samples_per_second": 503.978,
"eval_steps_per_second": 8.085,
"step": 4028
},
{
"epoch": 39.0,
"grad_norm": 0.9052088260650635,
"learning_rate": 3.05e-05,
"loss": 0.0982,
"step": 4134
},
{
"epoch": 39.0,
"eval_LOCATION_f1": 0.8104575163398693,
"eval_LOCATION_number": 72,
"eval_LOCATION_precision": 0.7654320987654321,
"eval_LOCATION_recall": 0.8611111111111112,
"eval_ORGANIZATION_f1": 0.7745664739884393,
"eval_ORGANIZATION_number": 75,
"eval_ORGANIZATION_precision": 0.6836734693877551,
"eval_ORGANIZATION_recall": 0.8933333333333333,
"eval_PERSON_f1": 0.8888888888888888,
"eval_PERSON_number": 143,
"eval_PERSON_precision": 0.8343558282208589,
"eval_PERSON_recall": 0.951048951048951,
"eval_QUANTITY_f1": 0.6428571428571429,
"eval_QUANTITY_number": 23,
"eval_QUANTITY_precision": 0.5454545454545454,
"eval_QUANTITY_recall": 0.782608695652174,
"eval_TIME_f1": 0.8214285714285715,
"eval_TIME_number": 26,
"eval_TIME_precision": 0.7666666666666667,
"eval_TIME_recall": 0.8846153846153846,
"eval_loss": 0.1408725529909134,
"eval_overall_accuracy": 0.957968476357268,
"eval_overall_f1": 0.8225806451612903,
"eval_overall_precision": 0.7555555555555555,
"eval_overall_recall": 0.9026548672566371,
"eval_runtime": 0.3728,
"eval_samples_per_second": 501.569,
"eval_steps_per_second": 8.047,
"step": 4134
},
{
"epoch": 40.0,
"grad_norm": 1.2666678428649902,
"learning_rate": 3e-05,
"loss": 0.0986,
"step": 4240
},
{
"epoch": 40.0,
"eval_LOCATION_f1": 0.7973856209150327,
"eval_LOCATION_number": 72,
"eval_LOCATION_precision": 0.7530864197530864,
"eval_LOCATION_recall": 0.8472222222222222,
"eval_ORGANIZATION_f1": 0.7810650887573964,
"eval_ORGANIZATION_number": 75,
"eval_ORGANIZATION_precision": 0.7021276595744681,
"eval_ORGANIZATION_recall": 0.88,
"eval_PERSON_f1": 0.8859934853420195,
"eval_PERSON_number": 143,
"eval_PERSON_precision": 0.8292682926829268,
"eval_PERSON_recall": 0.951048951048951,
"eval_QUANTITY_f1": 0.6296296296296297,
"eval_QUANTITY_number": 23,
"eval_QUANTITY_precision": 0.5483870967741935,
"eval_QUANTITY_recall": 0.7391304347826086,
"eval_TIME_f1": 0.8363636363636363,
"eval_TIME_number": 26,
"eval_TIME_precision": 0.7931034482758621,
"eval_TIME_recall": 0.8846153846153846,
"eval_loss": 0.13242048025131226,
"eval_overall_accuracy": 0.9587190392794596,
"eval_overall_f1": 0.8211382113821138,
"eval_overall_precision": 0.7593984962406015,
"eval_overall_recall": 0.8938053097345132,
"eval_runtime": 0.3704,
"eval_samples_per_second": 504.864,
"eval_steps_per_second": 8.099,
"step": 4240
},
{
"epoch": 41.0,
"grad_norm": 1.3640594482421875,
"learning_rate": 2.95e-05,
"loss": 0.0963,
"step": 4346
},
{
"epoch": 41.0,
"eval_LOCATION_f1": 0.8051948051948052,
"eval_LOCATION_number": 72,
"eval_LOCATION_precision": 0.7560975609756098,
"eval_LOCATION_recall": 0.8611111111111112,
"eval_ORGANIZATION_f1": 0.7674418604651163,
"eval_ORGANIZATION_number": 75,
"eval_ORGANIZATION_precision": 0.6804123711340206,
"eval_ORGANIZATION_recall": 0.88,
"eval_PERSON_f1": 0.8888888888888888,
"eval_PERSON_number": 143,
"eval_PERSON_precision": 0.8343558282208589,
"eval_PERSON_recall": 0.951048951048951,
"eval_QUANTITY_f1": 0.6538461538461539,
"eval_QUANTITY_number": 23,
"eval_QUANTITY_precision": 0.5862068965517241,
"eval_QUANTITY_recall": 0.7391304347826086,
"eval_TIME_f1": 0.8363636363636363,
"eval_TIME_number": 26,
"eval_TIME_precision": 0.7931034482758621,
"eval_TIME_recall": 0.8846153846153846,
"eval_loss": 0.1359548419713974,
"eval_overall_accuracy": 0.9577182887165374,
"eval_overall_f1": 0.8227334235453315,
"eval_overall_precision": 0.76,
"eval_overall_recall": 0.8967551622418879,
"eval_runtime": 0.3704,
"eval_samples_per_second": 504.827,
"eval_steps_per_second": 8.099,
"step": 4346
},
{
"epoch": 42.0,
"grad_norm": 1.9110503196716309,
"learning_rate": 2.9e-05,
"loss": 0.096,
"step": 4452
},
{
"epoch": 42.0,
"eval_LOCATION_f1": 0.8,
"eval_LOCATION_number": 72,
"eval_LOCATION_precision": 0.7469879518072289,
"eval_LOCATION_recall": 0.8611111111111112,
"eval_ORGANIZATION_f1": 0.7719298245614036,
"eval_ORGANIZATION_number": 75,
"eval_ORGANIZATION_precision": 0.6875,
"eval_ORGANIZATION_recall": 0.88,
"eval_PERSON_f1": 0.8983606557377047,
"eval_PERSON_number": 143,
"eval_PERSON_precision": 0.845679012345679,
"eval_PERSON_recall": 0.958041958041958,
"eval_QUANTITY_f1": 0.6545454545454547,
"eval_QUANTITY_number": 23,
"eval_QUANTITY_precision": 0.5625,
"eval_QUANTITY_recall": 0.782608695652174,
"eval_TIME_f1": 0.8070175438596492,
"eval_TIME_number": 26,
"eval_TIME_precision": 0.7419354838709677,
"eval_TIME_recall": 0.8846153846153846,
"eval_loss": 0.1379159390926361,
"eval_overall_accuracy": 0.9584688516387291,
"eval_overall_f1": 0.8236877523553163,
"eval_overall_precision": 0.7574257425742574,
"eval_overall_recall": 0.9026548672566371,
"eval_runtime": 0.3712,
"eval_samples_per_second": 503.833,
"eval_steps_per_second": 8.083,
"step": 4452
},
{
"epoch": 43.0,
"grad_norm": 0.9015399813652039,
"learning_rate": 2.8499999999999998e-05,
"loss": 0.0944,
"step": 4558
},
{
"epoch": 43.0,
"eval_LOCATION_f1": 0.8026315789473685,
"eval_LOCATION_number": 72,
"eval_LOCATION_precision": 0.7625,
"eval_LOCATION_recall": 0.8472222222222222,
"eval_ORGANIZATION_f1": 0.8,
"eval_ORGANIZATION_number": 75,
"eval_ORGANIZATION_precision": 0.7333333333333333,
"eval_ORGANIZATION_recall": 0.88,
"eval_PERSON_f1": 0.9066666666666667,
"eval_PERSON_number": 143,
"eval_PERSON_precision": 0.8662420382165605,
"eval_PERSON_recall": 0.951048951048951,
"eval_QUANTITY_f1": 0.6538461538461539,
"eval_QUANTITY_number": 23,
"eval_QUANTITY_precision": 0.5862068965517241,
"eval_QUANTITY_recall": 0.7391304347826086,
"eval_TIME_f1": 0.8,
"eval_TIME_number": 26,
"eval_TIME_precision": 0.7586206896551724,
"eval_TIME_recall": 0.8461538461538461,
"eval_loss": 0.12910011410713196,
"eval_overall_accuracy": 0.9617212909682261,
"eval_overall_f1": 0.8342541436464089,
"eval_overall_precision": 0.7844155844155845,
"eval_overall_recall": 0.8908554572271387,
"eval_runtime": 0.3719,
"eval_samples_per_second": 502.787,
"eval_steps_per_second": 8.066,
"step": 4558
},
{
"epoch": 44.0,
"grad_norm": 1.5744454860687256,
"learning_rate": 2.8000000000000003e-05,
"loss": 0.0959,
"step": 4664
},
{
"epoch": 44.0,
"eval_LOCATION_f1": 0.8129032258064516,
"eval_LOCATION_number": 72,
"eval_LOCATION_precision": 0.7590361445783133,
"eval_LOCATION_recall": 0.875,
"eval_ORGANIZATION_f1": 0.788235294117647,
"eval_ORGANIZATION_number": 75,
"eval_ORGANIZATION_precision": 0.7052631578947368,
"eval_ORGANIZATION_recall": 0.8933333333333333,
"eval_PERSON_f1": 0.9013157894736843,
"eval_PERSON_number": 143,
"eval_PERSON_precision": 0.8509316770186336,
"eval_PERSON_recall": 0.958041958041958,
"eval_QUANTITY_f1": 0.6296296296296297,
"eval_QUANTITY_number": 23,
"eval_QUANTITY_precision": 0.5483870967741935,
"eval_QUANTITY_recall": 0.7391304347826086,
"eval_TIME_f1": 0.7272727272727274,
"eval_TIME_number": 26,
"eval_TIME_precision": 0.6896551724137931,
"eval_TIME_recall": 0.7692307692307693,
"eval_loss": 0.13805752992630005,
"eval_overall_accuracy": 0.9569677257943457,
"eval_overall_f1": 0.8238482384823848,
"eval_overall_precision": 0.7619047619047619,
"eval_overall_recall": 0.8967551622418879,
"eval_runtime": 0.3727,
"eval_samples_per_second": 501.769,
"eval_steps_per_second": 8.05,
"step": 4664
},
{
"epoch": 45.0,
"grad_norm": 1.3224737644195557,
"learning_rate": 2.7500000000000004e-05,
"loss": 0.0935,
"step": 4770
},
{
"epoch": 45.0,
"eval_LOCATION_f1": 0.823529411764706,
"eval_LOCATION_number": 72,
"eval_LOCATION_precision": 0.7777777777777778,
"eval_LOCATION_recall": 0.875,
"eval_ORGANIZATION_f1": 0.7647058823529413,
"eval_ORGANIZATION_number": 75,
"eval_ORGANIZATION_precision": 0.6842105263157895,
"eval_ORGANIZATION_recall": 0.8666666666666667,
"eval_PERSON_f1": 0.9078947368421052,
"eval_PERSON_number": 143,
"eval_PERSON_precision": 0.8571428571428571,
"eval_PERSON_recall": 0.965034965034965,
"eval_QUANTITY_f1": 0.6181818181818182,
"eval_QUANTITY_number": 23,
"eval_QUANTITY_precision": 0.53125,
"eval_QUANTITY_recall": 0.7391304347826086,
"eval_TIME_f1": 0.7636363636363636,
"eval_TIME_number": 26,
"eval_TIME_precision": 0.7241379310344828,
"eval_TIME_recall": 0.8076923076923077,
"eval_loss": 0.13827811181545258,
"eval_overall_accuracy": 0.9584688516387291,
"eval_overall_f1": 0.8249660786974219,
"eval_overall_precision": 0.7638190954773869,
"eval_overall_recall": 0.8967551622418879,
"eval_runtime": 0.3741,
"eval_samples_per_second": 499.811,
"eval_steps_per_second": 8.018,
"step": 4770
},
{
"epoch": 46.0,
"grad_norm": 0.8794982433319092,
"learning_rate": 2.7000000000000002e-05,
"loss": 0.0903,
"step": 4876
},
{
"epoch": 46.0,
"eval_LOCATION_f1": 0.8,
"eval_LOCATION_number": 72,
"eval_LOCATION_precision": 0.7469879518072289,
"eval_LOCATION_recall": 0.8611111111111112,
"eval_ORGANIZATION_f1": 0.7514450867052023,
"eval_ORGANIZATION_number": 75,
"eval_ORGANIZATION_precision": 0.6632653061224489,
"eval_ORGANIZATION_recall": 0.8666666666666667,
"eval_PERSON_f1": 0.9042904290429041,
"eval_PERSON_number": 143,
"eval_PERSON_precision": 0.85625,
"eval_PERSON_recall": 0.958041958041958,
"eval_QUANTITY_f1": 0.6415094339622641,
"eval_QUANTITY_number": 23,
"eval_QUANTITY_precision": 0.5666666666666667,
"eval_QUANTITY_recall": 0.7391304347826086,
"eval_TIME_f1": 0.8363636363636363,
"eval_TIME_number": 26,
"eval_TIME_precision": 0.7931034482758621,
"eval_TIME_recall": 0.8846153846153846,
"eval_loss": 0.13555409014225006,
"eval_overall_accuracy": 0.9582186639979985,
"eval_overall_f1": 0.8227334235453315,
"eval_overall_precision": 0.76,
"eval_overall_recall": 0.8967551622418879,
"eval_runtime": 0.3704,
"eval_samples_per_second": 504.861,
"eval_steps_per_second": 8.099,
"step": 4876
},
{
"epoch": 47.0,
"grad_norm": 1.307417869567871,
"learning_rate": 2.6500000000000004e-05,
"loss": 0.0933,
"step": 4982
},
{
"epoch": 47.0,
"eval_LOCATION_f1": 0.7973856209150327,
"eval_LOCATION_number": 72,
"eval_LOCATION_precision": 0.7530864197530864,
"eval_LOCATION_recall": 0.8472222222222222,
"eval_ORGANIZATION_f1": 0.7816091954022988,
"eval_ORGANIZATION_number": 75,
"eval_ORGANIZATION_precision": 0.6868686868686869,
"eval_ORGANIZATION_recall": 0.9066666666666666,
"eval_PERSON_f1": 0.9019607843137255,
"eval_PERSON_number": 143,
"eval_PERSON_precision": 0.8466257668711656,
"eval_PERSON_recall": 0.965034965034965,
"eval_QUANTITY_f1": 0.5964912280701754,
"eval_QUANTITY_number": 23,
"eval_QUANTITY_precision": 0.5,
"eval_QUANTITY_recall": 0.7391304347826086,
"eval_TIME_f1": 0.7272727272727274,
"eval_TIME_number": 26,
"eval_TIME_precision": 0.6896551724137931,
"eval_TIME_recall": 0.7692307692307693,
"eval_loss": 0.15163101255893707,
"eval_overall_accuracy": 0.9552164123092319,
"eval_overall_f1": 0.8161073825503355,
"eval_overall_precision": 0.7487684729064039,
"eval_overall_recall": 0.8967551622418879,
"eval_runtime": 0.3701,
"eval_samples_per_second": 505.224,
"eval_steps_per_second": 8.105,
"step": 4982
},
{
"epoch": 48.0,
"grad_norm": 1.3334672451019287,
"learning_rate": 2.6000000000000002e-05,
"loss": 0.093,
"step": 5088
},
{
"epoch": 48.0,
"eval_LOCATION_f1": 0.8,
"eval_LOCATION_number": 72,
"eval_LOCATION_precision": 0.7469879518072289,
"eval_LOCATION_recall": 0.8611111111111112,
"eval_ORGANIZATION_f1": 0.7647058823529413,
"eval_ORGANIZATION_number": 75,
"eval_ORGANIZATION_precision": 0.6842105263157895,
"eval_ORGANIZATION_recall": 0.8666666666666667,
"eval_PERSON_f1": 0.8976897689768978,
"eval_PERSON_number": 143,
"eval_PERSON_precision": 0.85,
"eval_PERSON_recall": 0.951048951048951,
"eval_QUANTITY_f1": 0.6296296296296297,
"eval_QUANTITY_number": 23,
"eval_QUANTITY_precision": 0.5483870967741935,
"eval_QUANTITY_recall": 0.7391304347826086,
"eval_TIME_f1": 0.7636363636363636,
"eval_TIME_number": 26,
"eval_TIME_precision": 0.7241379310344828,
"eval_TIME_recall": 0.8076923076923077,
"eval_loss": 0.13479116559028625,
"eval_overall_accuracy": 0.957968476357268,
"eval_overall_f1": 0.8168249660786975,
"eval_overall_precision": 0.7562814070351759,
"eval_overall_recall": 0.887905604719764,
"eval_runtime": 0.3689,
"eval_samples_per_second": 506.907,
"eval_steps_per_second": 8.132,
"step": 5088
},
{
"epoch": 49.0,
"grad_norm": 2.846377372741699,
"learning_rate": 2.5500000000000003e-05,
"loss": 0.0906,
"step": 5194
},
{
"epoch": 49.0,
"eval_LOCATION_f1": 0.8,
"eval_LOCATION_number": 72,
"eval_LOCATION_precision": 0.7469879518072289,
"eval_LOCATION_recall": 0.8611111111111112,
"eval_ORGANIZATION_f1": 0.7640449438202248,
"eval_ORGANIZATION_number": 75,
"eval_ORGANIZATION_precision": 0.6601941747572816,
"eval_ORGANIZATION_recall": 0.9066666666666666,
"eval_PERSON_f1": 0.9042904290429041,
"eval_PERSON_number": 143,
"eval_PERSON_precision": 0.85625,
"eval_PERSON_recall": 0.958041958041958,
"eval_QUANTITY_f1": 0.6666666666666667,
"eval_QUANTITY_number": 23,
"eval_QUANTITY_precision": 0.5806451612903226,
"eval_QUANTITY_recall": 0.782608695652174,
"eval_TIME_f1": 0.7636363636363636,
"eval_TIME_number": 26,
"eval_TIME_precision": 0.7241379310344828,
"eval_TIME_recall": 0.8076923076923077,
"eval_loss": 0.14537392556667328,
"eval_overall_accuracy": 0.9569677257943457,
"eval_overall_f1": 0.8214765100671141,
"eval_overall_precision": 0.7536945812807881,
"eval_overall_recall": 0.9026548672566371,
"eval_runtime": 0.3727,
"eval_samples_per_second": 501.678,
"eval_steps_per_second": 8.048,
"step": 5194
},
{
"epoch": 50.0,
"grad_norm": 1.0936921834945679,
"learning_rate": 2.5e-05,
"loss": 0.0894,
"step": 5300
},
{
"epoch": 50.0,
"eval_LOCATION_f1": 0.8026315789473685,
"eval_LOCATION_number": 72,
"eval_LOCATION_precision": 0.7625,
"eval_LOCATION_recall": 0.8472222222222222,
"eval_ORGANIZATION_f1": 0.7730061349693251,
"eval_ORGANIZATION_number": 75,
"eval_ORGANIZATION_precision": 0.7159090909090909,
"eval_ORGANIZATION_recall": 0.84,
"eval_PERSON_f1": 0.8918032786885245,
"eval_PERSON_number": 143,
"eval_PERSON_precision": 0.8395061728395061,
"eval_PERSON_recall": 0.951048951048951,
"eval_QUANTITY_f1": 0.6666666666666667,
"eval_QUANTITY_number": 23,
"eval_QUANTITY_precision": 0.5806451612903226,
"eval_QUANTITY_recall": 0.782608695652174,
"eval_TIME_f1": 0.8518518518518519,
"eval_TIME_number": 26,
"eval_TIME_precision": 0.8214285714285714,
"eval_TIME_recall": 0.8846153846153846,
"eval_loss": 0.13398553431034088,
"eval_overall_accuracy": 0.9609707280460346,
"eval_overall_f1": 0.8269230769230769,
"eval_overall_precision": 0.7737789203084833,
"eval_overall_recall": 0.887905604719764,
"eval_runtime": 0.3704,
"eval_samples_per_second": 504.87,
"eval_steps_per_second": 8.1,
"step": 5300
},
{
"epoch": 51.0,
"grad_norm": 1.3817942142486572,
"learning_rate": 2.45e-05,
"loss": 0.0882,
"step": 5406
},
{
"epoch": 51.0,
"eval_LOCATION_f1": 0.8104575163398693,
"eval_LOCATION_number": 72,
"eval_LOCATION_precision": 0.7654320987654321,
"eval_LOCATION_recall": 0.8611111111111112,
"eval_ORGANIZATION_f1": 0.7602339181286549,
"eval_ORGANIZATION_number": 75,
"eval_ORGANIZATION_precision": 0.6770833333333334,
"eval_ORGANIZATION_recall": 0.8666666666666667,
"eval_PERSON_f1": 0.9013157894736843,
"eval_PERSON_number": 143,
"eval_PERSON_precision": 0.8509316770186336,
"eval_PERSON_recall": 0.958041958041958,
"eval_QUANTITY_f1": 0.6415094339622641,
"eval_QUANTITY_number": 23,
"eval_QUANTITY_precision": 0.5666666666666667,
"eval_QUANTITY_recall": 0.7391304347826086,
"eval_TIME_f1": 0.8,
"eval_TIME_number": 26,
"eval_TIME_precision": 0.7586206896551724,
"eval_TIME_recall": 0.8461538461538461,
"eval_loss": 0.1364634782075882,
"eval_overall_accuracy": 0.9594696022016512,
"eval_overall_f1": 0.8233695652173914,
"eval_overall_precision": 0.7632241813602015,
"eval_overall_recall": 0.8938053097345132,
"eval_runtime": 0.3697,
"eval_samples_per_second": 505.839,
"eval_steps_per_second": 8.115,
"step": 5406
},
{
"epoch": 52.0,
"grad_norm": 0.8930407762527466,
"learning_rate": 2.4e-05,
"loss": 0.0886,
"step": 5512
},
{
"epoch": 52.0,
"eval_LOCATION_f1": 0.8051948051948052,
"eval_LOCATION_number": 72,
"eval_LOCATION_precision": 0.7560975609756098,
"eval_LOCATION_recall": 0.8611111111111112,
"eval_ORGANIZATION_f1": 0.7701149425287357,
"eval_ORGANIZATION_number": 75,
"eval_ORGANIZATION_precision": 0.6767676767676768,
"eval_ORGANIZATION_recall": 0.8933333333333333,
"eval_PERSON_f1": 0.9049180327868852,
"eval_PERSON_number": 143,
"eval_PERSON_precision": 0.8518518518518519,
"eval_PERSON_recall": 0.965034965034965,
"eval_QUANTITY_f1": 0.6296296296296297,
"eval_QUANTITY_number": 23,
"eval_QUANTITY_precision": 0.5483870967741935,
"eval_QUANTITY_recall": 0.7391304347826086,
"eval_TIME_f1": 0.7636363636363636,
"eval_TIME_number": 26,
"eval_TIME_precision": 0.7241379310344828,
"eval_TIME_recall": 0.8076923076923077,
"eval_loss": 0.14068011939525604,
"eval_overall_accuracy": 0.9587190392794596,
"eval_overall_f1": 0.8221024258760108,
"eval_overall_precision": 0.7568238213399504,
"eval_overall_recall": 0.8997050147492626,
"eval_runtime": 0.3699,
"eval_samples_per_second": 505.493,
"eval_steps_per_second": 8.11,
"step": 5512
},
{
"epoch": 53.0,
"grad_norm": 1.4923311471939087,
"learning_rate": 2.35e-05,
"loss": 0.086,
"step": 5618
},
{
"epoch": 53.0,
"eval_LOCATION_f1": 0.8051948051948052,
"eval_LOCATION_number": 72,
"eval_LOCATION_precision": 0.7560975609756098,
"eval_LOCATION_recall": 0.8611111111111112,
"eval_ORGANIZATION_f1": 0.7790697674418604,
"eval_ORGANIZATION_number": 75,
"eval_ORGANIZATION_precision": 0.6907216494845361,
"eval_ORGANIZATION_recall": 0.8933333333333333,
"eval_PERSON_f1": 0.8947368421052632,
"eval_PERSON_number": 143,
"eval_PERSON_precision": 0.84472049689441,
"eval_PERSON_recall": 0.951048951048951,
"eval_QUANTITY_f1": 0.6666666666666667,
"eval_QUANTITY_number": 23,
"eval_QUANTITY_precision": 0.5806451612903226,
"eval_QUANTITY_recall": 0.782608695652174,
"eval_TIME_f1": 0.7857142857142856,
"eval_TIME_number": 26,
"eval_TIME_precision": 0.7333333333333333,
"eval_TIME_recall": 0.8461538461538461,
"eval_loss": 0.13908393681049347,
"eval_overall_accuracy": 0.9592194145609206,
"eval_overall_f1": 0.8243243243243245,
"eval_overall_precision": 0.7605985037406484,
"eval_overall_recall": 0.8997050147492626,
"eval_runtime": 0.3682,
"eval_samples_per_second": 507.889,
"eval_steps_per_second": 8.148,
"step": 5618
},
{
"epoch": 54.0,
"grad_norm": 2.1307640075683594,
"learning_rate": 2.3000000000000003e-05,
"loss": 0.0872,
"step": 5724
},
{
"epoch": 54.0,
"eval_LOCATION_f1": 0.8051948051948052,
"eval_LOCATION_number": 72,
"eval_LOCATION_precision": 0.7560975609756098,
"eval_LOCATION_recall": 0.8611111111111112,
"eval_ORGANIZATION_f1": 0.7810650887573964,
"eval_ORGANIZATION_number": 75,
"eval_ORGANIZATION_precision": 0.7021276595744681,
"eval_ORGANIZATION_recall": 0.88,
"eval_PERSON_f1": 0.903654485049834,
"eval_PERSON_number": 143,
"eval_PERSON_precision": 0.8607594936708861,
"eval_PERSON_recall": 0.951048951048951,
"eval_QUANTITY_f1": 0.6181818181818182,
"eval_QUANTITY_number": 23,
"eval_QUANTITY_precision": 0.53125,
"eval_QUANTITY_recall": 0.7391304347826086,
"eval_TIME_f1": 0.8,
"eval_TIME_number": 26,
"eval_TIME_precision": 0.7586206896551724,
"eval_TIME_recall": 0.8461538461538461,
"eval_loss": 0.1391591876745224,
"eval_overall_accuracy": 0.9589692269201902,
"eval_overall_f1": 0.8256130790190735,
"eval_overall_precision": 0.7670886075949367,
"eval_overall_recall": 0.8938053097345132,
"eval_runtime": 0.3712,
"eval_samples_per_second": 503.825,
"eval_steps_per_second": 8.083,
"step": 5724
},
{
"epoch": 55.0,
"grad_norm": 2.045675277709961,
"learning_rate": 2.25e-05,
"loss": 0.0897,
"step": 5830
},
{
"epoch": 55.0,
"eval_LOCATION_f1": 0.7948717948717949,
"eval_LOCATION_number": 72,
"eval_LOCATION_precision": 0.7380952380952381,
"eval_LOCATION_recall": 0.8611111111111112,
"eval_ORGANIZATION_f1": 0.7640449438202248,
"eval_ORGANIZATION_number": 75,
"eval_ORGANIZATION_precision": 0.6601941747572816,
"eval_ORGANIZATION_recall": 0.9066666666666666,
"eval_PERSON_f1": 0.9078947368421052,
"eval_PERSON_number": 143,
"eval_PERSON_precision": 0.8571428571428571,
"eval_PERSON_recall": 0.965034965034965,
"eval_QUANTITY_f1": 0.6071428571428571,
"eval_QUANTITY_number": 23,
"eval_QUANTITY_precision": 0.5151515151515151,
"eval_QUANTITY_recall": 0.7391304347826086,
"eval_TIME_f1": 0.7142857142857142,
"eval_TIME_number": 26,
"eval_TIME_precision": 0.6666666666666666,
"eval_TIME_recall": 0.7692307692307693,
"eval_loss": 0.1569395512342453,
"eval_overall_accuracy": 0.9534650988241181,
"eval_overall_f1": 0.8133333333333332,
"eval_overall_precision": 0.7420924574209246,
"eval_overall_recall": 0.8997050147492626,
"eval_runtime": 0.3688,
"eval_samples_per_second": 507.118,
"eval_steps_per_second": 8.136,
"step": 5830
},
{
"epoch": 56.0,
"grad_norm": 0.979404091835022,
"learning_rate": 2.2000000000000003e-05,
"loss": 0.0881,
"step": 5936
},
{
"epoch": 56.0,
"eval_LOCATION_f1": 0.7973856209150327,
"eval_LOCATION_number": 72,
"eval_LOCATION_precision": 0.7530864197530864,
"eval_LOCATION_recall": 0.8472222222222222,
"eval_ORGANIZATION_f1": 0.7831325301204819,
"eval_ORGANIZATION_number": 75,
"eval_ORGANIZATION_precision": 0.7142857142857143,
"eval_ORGANIZATION_recall": 0.8666666666666667,
"eval_PERSON_f1": 0.9006622516556291,
"eval_PERSON_number": 143,
"eval_PERSON_precision": 0.8553459119496856,
"eval_PERSON_recall": 0.951048951048951,
"eval_QUANTITY_f1": 0.6181818181818182,
"eval_QUANTITY_number": 23,
"eval_QUANTITY_precision": 0.53125,
"eval_QUANTITY_recall": 0.7391304347826086,
"eval_TIME_f1": 0.7636363636363636,
"eval_TIME_number": 26,
"eval_TIME_precision": 0.7241379310344828,
"eval_TIME_recall": 0.8076923076923077,
"eval_loss": 0.13650928437709808,
"eval_overall_accuracy": 0.9597197898423818,
"eval_overall_f1": 0.8207934336525308,
"eval_overall_precision": 0.7653061224489796,
"eval_overall_recall": 0.8849557522123894,
"eval_runtime": 0.372,
"eval_samples_per_second": 502.676,
"eval_steps_per_second": 8.064,
"step": 5936
},
{
"epoch": 57.0,
"grad_norm": 1.4905277490615845,
"learning_rate": 2.15e-05,
"loss": 0.0857,
"step": 6042
},
{
"epoch": 57.0,
"eval_LOCATION_f1": 0.8051948051948052,
"eval_LOCATION_number": 72,
"eval_LOCATION_precision": 0.7560975609756098,
"eval_LOCATION_recall": 0.8611111111111112,
"eval_ORGANIZATION_f1": 0.8,
"eval_ORGANIZATION_number": 75,
"eval_ORGANIZATION_precision": 0.7333333333333333,
"eval_ORGANIZATION_recall": 0.88,
"eval_PERSON_f1": 0.8976897689768978,
"eval_PERSON_number": 143,
"eval_PERSON_precision": 0.85,
"eval_PERSON_recall": 0.951048951048951,
"eval_QUANTITY_f1": 0.6296296296296297,
"eval_QUANTITY_number": 23,
"eval_QUANTITY_precision": 0.5483870967741935,
"eval_QUANTITY_recall": 0.7391304347826086,
"eval_TIME_f1": 0.7777777777777779,
"eval_TIME_number": 26,
"eval_TIME_precision": 0.75,
"eval_TIME_recall": 0.8076923076923077,
"eval_loss": 0.13628903031349182,
"eval_overall_accuracy": 0.961220915686765,
"eval_overall_f1": 0.8273972602739725,
"eval_overall_precision": 0.7723785166240409,
"eval_overall_recall": 0.8908554572271387,
"eval_runtime": 0.3704,
"eval_samples_per_second": 504.837,
"eval_steps_per_second": 8.099,
"step": 6042
},
{
"epoch": 58.0,
"grad_norm": 0.8609861135482788,
"learning_rate": 2.1e-05,
"loss": 0.0846,
"step": 6148
},
{
"epoch": 58.0,
"eval_LOCATION_f1": 0.7973856209150327,
"eval_LOCATION_number": 72,
"eval_LOCATION_precision": 0.7530864197530864,
"eval_LOCATION_recall": 0.8472222222222222,
"eval_ORGANIZATION_f1": 0.783625730994152,
"eval_ORGANIZATION_number": 75,
"eval_ORGANIZATION_precision": 0.6979166666666666,
"eval_ORGANIZATION_recall": 0.8933333333333333,
"eval_PERSON_f1": 0.8976897689768978,
"eval_PERSON_number": 143,
"eval_PERSON_precision": 0.85,
"eval_PERSON_recall": 0.951048951048951,
"eval_QUANTITY_f1": 0.6296296296296297,
"eval_QUANTITY_number": 23,
"eval_QUANTITY_precision": 0.5483870967741935,
"eval_QUANTITY_recall": 0.7391304347826086,
"eval_TIME_f1": 0.8,
"eval_TIME_number": 26,
"eval_TIME_precision": 0.7586206896551724,
"eval_TIME_recall": 0.8461538461538461,
"eval_loss": 0.14013363420963287,
"eval_overall_accuracy": 0.9594696022016512,
"eval_overall_f1": 0.8233695652173914,
"eval_overall_precision": 0.7632241813602015,
"eval_overall_recall": 0.8938053097345132,
"eval_runtime": 0.3725,
"eval_samples_per_second": 502.031,
"eval_steps_per_second": 8.054,
"step": 6148
},
{
"epoch": 59.0,
"grad_norm": 1.2671494483947754,
"learning_rate": 2.05e-05,
"loss": 0.0843,
"step": 6254
},
{
"epoch": 59.0,
"eval_LOCATION_f1": 0.7922077922077924,
"eval_LOCATION_number": 72,
"eval_LOCATION_precision": 0.7439024390243902,
"eval_LOCATION_recall": 0.8472222222222222,
"eval_ORGANIZATION_f1": 0.7928994082840236,
"eval_ORGANIZATION_number": 75,
"eval_ORGANIZATION_precision": 0.7127659574468085,
"eval_ORGANIZATION_recall": 0.8933333333333333,
"eval_PERSON_f1": 0.9078947368421052,
"eval_PERSON_number": 143,
"eval_PERSON_precision": 0.8571428571428571,
"eval_PERSON_recall": 0.965034965034965,
"eval_QUANTITY_f1": 0.6181818181818182,
"eval_QUANTITY_number": 23,
"eval_QUANTITY_precision": 0.53125,
"eval_QUANTITY_recall": 0.7391304347826086,
"eval_TIME_f1": 0.75,
"eval_TIME_number": 26,
"eval_TIME_precision": 0.7,
"eval_TIME_recall": 0.8076923076923077,
"eval_loss": 0.14256823062896729,
"eval_overall_accuracy": 0.9594696022016512,
"eval_overall_f1": 0.8238482384823848,
"eval_overall_precision": 0.7619047619047619,
"eval_overall_recall": 0.8967551622418879,
"eval_runtime": 0.3732,
"eval_samples_per_second": 501.11,
"eval_steps_per_second": 8.039,
"step": 6254
},
{
"epoch": 60.0,
"grad_norm": 0.5702971816062927,
"learning_rate": 2e-05,
"loss": 0.087,
"step": 6360
},
{
"epoch": 60.0,
"eval_LOCATION_f1": 0.7922077922077924,
"eval_LOCATION_number": 72,
"eval_LOCATION_precision": 0.7439024390243902,
"eval_LOCATION_recall": 0.8472222222222222,
"eval_ORGANIZATION_f1": 0.7738095238095238,
"eval_ORGANIZATION_number": 75,
"eval_ORGANIZATION_precision": 0.6989247311827957,
"eval_ORGANIZATION_recall": 0.8666666666666667,
"eval_PERSON_f1": 0.9006622516556291,
"eval_PERSON_number": 143,
"eval_PERSON_precision": 0.8553459119496856,
"eval_PERSON_recall": 0.951048951048951,
"eval_QUANTITY_f1": 0.6545454545454547,
"eval_QUANTITY_number": 23,
"eval_QUANTITY_precision": 0.5625,
"eval_QUANTITY_recall": 0.782608695652174,
"eval_TIME_f1": 0.8148148148148148,
"eval_TIME_number": 26,
"eval_TIME_precision": 0.7857142857142857,
"eval_TIME_recall": 0.8461538461538461,
"eval_loss": 0.13854016363620758,
"eval_overall_accuracy": 0.9594696022016512,
"eval_overall_f1": 0.8240109140518419,
"eval_overall_precision": 0.766497461928934,
"eval_overall_recall": 0.8908554572271387,
"eval_runtime": 0.3704,
"eval_samples_per_second": 504.86,
"eval_steps_per_second": 8.099,
"step": 6360
},
{
"epoch": 61.0,
"grad_norm": 1.0941648483276367,
"learning_rate": 1.9500000000000003e-05,
"loss": 0.0836,
"step": 6466
},
{
"epoch": 61.0,
"eval_LOCATION_f1": 0.8051948051948052,
"eval_LOCATION_number": 72,
"eval_LOCATION_precision": 0.7560975609756098,
"eval_LOCATION_recall": 0.8611111111111112,
"eval_ORGANIZATION_f1": 0.7745664739884393,
"eval_ORGANIZATION_number": 75,
"eval_ORGANIZATION_precision": 0.6836734693877551,
"eval_ORGANIZATION_recall": 0.8933333333333333,
"eval_PERSON_f1": 0.9108910891089109,
"eval_PERSON_number": 143,
"eval_PERSON_precision": 0.8625,
"eval_PERSON_recall": 0.965034965034965,
"eval_QUANTITY_f1": 0.6545454545454547,
"eval_QUANTITY_number": 23,
"eval_QUANTITY_precision": 0.5625,
"eval_QUANTITY_recall": 0.782608695652174,
"eval_TIME_f1": 0.7636363636363636,
"eval_TIME_number": 26,
"eval_TIME_precision": 0.7241379310344828,
"eval_TIME_recall": 0.8076923076923077,
"eval_loss": 0.14069223403930664,
"eval_overall_accuracy": 0.9602201651238429,
"eval_overall_f1": 0.827027027027027,
"eval_overall_precision": 0.7630922693266833,
"eval_overall_recall": 0.9026548672566371,
"eval_runtime": 0.3687,
"eval_samples_per_second": 507.138,
"eval_steps_per_second": 8.136,
"step": 6466
},
{
"epoch": 62.0,
"grad_norm": 0.9212659597396851,
"learning_rate": 1.9e-05,
"loss": 0.0823,
"step": 6572
},
{
"epoch": 62.0,
"eval_LOCATION_f1": 0.8026315789473685,
"eval_LOCATION_number": 72,
"eval_LOCATION_precision": 0.7625,
"eval_LOCATION_recall": 0.8472222222222222,
"eval_ORGANIZATION_f1": 0.7710843373493976,
"eval_ORGANIZATION_number": 75,
"eval_ORGANIZATION_precision": 0.7032967032967034,
"eval_ORGANIZATION_recall": 0.8533333333333334,
"eval_PERSON_f1": 0.8976897689768978,
"eval_PERSON_number": 143,
"eval_PERSON_precision": 0.85,
"eval_PERSON_recall": 0.951048951048951,
"eval_QUANTITY_f1": 0.6415094339622641,
"eval_QUANTITY_number": 23,
"eval_QUANTITY_precision": 0.5666666666666667,
"eval_QUANTITY_recall": 0.7391304347826086,
"eval_TIME_f1": 0.8,
"eval_TIME_number": 26,
"eval_TIME_precision": 0.7586206896551724,
"eval_TIME_recall": 0.8461538461538461,
"eval_loss": 0.13715825974941254,
"eval_overall_accuracy": 0.9602201651238429,
"eval_overall_f1": 0.823045267489712,
"eval_overall_precision": 0.7692307692307693,
"eval_overall_recall": 0.8849557522123894,
"eval_runtime": 0.3668,
"eval_samples_per_second": 509.835,
"eval_steps_per_second": 8.179,
"step": 6572
},
{
"epoch": 63.0,
"grad_norm": 0.8010810613632202,
"learning_rate": 1.85e-05,
"loss": 0.0814,
"step": 6678
},
{
"epoch": 63.0,
"eval_LOCATION_f1": 0.8051948051948052,
"eval_LOCATION_number": 72,
"eval_LOCATION_precision": 0.7560975609756098,
"eval_LOCATION_recall": 0.8611111111111112,
"eval_ORGANIZATION_f1": 0.7674418604651163,
"eval_ORGANIZATION_number": 75,
"eval_ORGANIZATION_precision": 0.6804123711340206,
"eval_ORGANIZATION_recall": 0.88,
"eval_PERSON_f1": 0.8976897689768978,
"eval_PERSON_number": 143,
"eval_PERSON_precision": 0.85,
"eval_PERSON_recall": 0.951048951048951,
"eval_QUANTITY_f1": 0.6181818181818182,
"eval_QUANTITY_number": 23,
"eval_QUANTITY_precision": 0.53125,
"eval_QUANTITY_recall": 0.7391304347826086,
"eval_TIME_f1": 0.7272727272727274,
"eval_TIME_number": 26,
"eval_TIME_precision": 0.6896551724137931,
"eval_TIME_recall": 0.7692307692307693,
"eval_loss": 0.1415587216615677,
"eval_overall_accuracy": 0.957968476357268,
"eval_overall_f1": 0.814614343707713,
"eval_overall_precision": 0.7525,
"eval_overall_recall": 0.887905604719764,
"eval_runtime": 0.3713,
"eval_samples_per_second": 503.694,
"eval_steps_per_second": 8.081,
"step": 6678
},
{
"epoch": 64.0,
"grad_norm": 1.7902244329452515,
"learning_rate": 1.8e-05,
"loss": 0.0806,
"step": 6784
},
{
"epoch": 64.0,
"eval_LOCATION_f1": 0.8051948051948052,
"eval_LOCATION_number": 72,
"eval_LOCATION_precision": 0.7560975609756098,
"eval_LOCATION_recall": 0.8611111111111112,
"eval_ORGANIZATION_f1": 0.7486033519553071,
"eval_ORGANIZATION_number": 75,
"eval_ORGANIZATION_precision": 0.6442307692307693,
"eval_ORGANIZATION_recall": 0.8933333333333333,
"eval_PERSON_f1": 0.9078947368421052,
"eval_PERSON_number": 143,
"eval_PERSON_precision": 0.8571428571428571,
"eval_PERSON_recall": 0.965034965034965,
"eval_QUANTITY_f1": 0.6545454545454547,
"eval_QUANTITY_number": 23,
"eval_QUANTITY_precision": 0.5625,
"eval_QUANTITY_recall": 0.782608695652174,
"eval_TIME_f1": 0.7142857142857142,
"eval_TIME_number": 26,
"eval_TIME_precision": 0.6666666666666666,
"eval_TIME_recall": 0.7692307692307693,
"eval_loss": 0.1516939103603363,
"eval_overall_accuracy": 0.9564673505128847,
"eval_overall_f1": 0.8155080213903745,
"eval_overall_precision": 0.7457212713936431,
"eval_overall_recall": 0.8997050147492626,
"eval_runtime": 0.372,
"eval_samples_per_second": 502.674,
"eval_steps_per_second": 8.064,
"step": 6784
},
{
"epoch": 65.0,
"grad_norm": 0.6327823400497437,
"learning_rate": 1.75e-05,
"loss": 0.0794,
"step": 6890
},
{
"epoch": 65.0,
"eval_LOCATION_f1": 0.8051948051948052,
"eval_LOCATION_number": 72,
"eval_LOCATION_precision": 0.7560975609756098,
"eval_LOCATION_recall": 0.8611111111111112,
"eval_ORGANIZATION_f1": 0.7784431137724551,
"eval_ORGANIZATION_number": 75,
"eval_ORGANIZATION_precision": 0.7065217391304348,
"eval_ORGANIZATION_recall": 0.8666666666666667,
"eval_PERSON_f1": 0.8976897689768978,
"eval_PERSON_number": 143,
"eval_PERSON_precision": 0.85,
"eval_PERSON_recall": 0.951048951048951,
"eval_QUANTITY_f1": 0.6181818181818182,
"eval_QUANTITY_number": 23,
"eval_QUANTITY_precision": 0.53125,
"eval_QUANTITY_recall": 0.7391304347826086,
"eval_TIME_f1": 0.7636363636363636,
"eval_TIME_number": 26,
"eval_TIME_precision": 0.7241379310344828,
"eval_TIME_recall": 0.8076923076923077,
"eval_loss": 0.14160560071468353,
"eval_overall_accuracy": 0.9589692269201902,
"eval_overall_f1": 0.8201634877384195,
"eval_overall_precision": 0.7620253164556962,
"eval_overall_recall": 0.887905604719764,
"eval_runtime": 0.3687,
"eval_samples_per_second": 507.195,
"eval_steps_per_second": 8.137,
"step": 6890
},
{
"epoch": 66.0,
"grad_norm": 0.9762814044952393,
"learning_rate": 1.7000000000000003e-05,
"loss": 0.079,
"step": 6996
},
{
"epoch": 66.0,
"eval_LOCATION_f1": 0.8051948051948052,
"eval_LOCATION_number": 72,
"eval_LOCATION_precision": 0.7560975609756098,
"eval_LOCATION_recall": 0.8611111111111112,
"eval_ORGANIZATION_f1": 0.7861271676300577,
"eval_ORGANIZATION_number": 75,
"eval_ORGANIZATION_precision": 0.6938775510204082,
"eval_ORGANIZATION_recall": 0.9066666666666666,
"eval_PERSON_f1": 0.9078947368421052,
"eval_PERSON_number": 143,
"eval_PERSON_precision": 0.8571428571428571,
"eval_PERSON_recall": 0.965034965034965,
"eval_QUANTITY_f1": 0.6545454545454547,
"eval_QUANTITY_number": 23,
"eval_QUANTITY_precision": 0.5625,
"eval_QUANTITY_recall": 0.782608695652174,
"eval_TIME_f1": 0.7636363636363636,
"eval_TIME_number": 26,
"eval_TIME_precision": 0.7241379310344828,
"eval_TIME_recall": 0.8076923076923077,
"eval_loss": 0.1456669718027115,
"eval_overall_accuracy": 0.9592194145609206,
"eval_overall_f1": 0.8286099865047233,
"eval_overall_precision": 0.763681592039801,
"eval_overall_recall": 0.9056047197640118,
"eval_runtime": 0.3699,
"eval_samples_per_second": 505.498,
"eval_steps_per_second": 8.11,
"step": 6996
},
{
"epoch": 67.0,
"grad_norm": 0.4873846173286438,
"learning_rate": 1.65e-05,
"loss": 0.0811,
"step": 7102
},
{
"epoch": 67.0,
"eval_LOCATION_f1": 0.8104575163398693,
"eval_LOCATION_number": 72,
"eval_LOCATION_precision": 0.7654320987654321,
"eval_LOCATION_recall": 0.8611111111111112,
"eval_ORGANIZATION_f1": 0.7738095238095238,
"eval_ORGANIZATION_number": 75,
"eval_ORGANIZATION_precision": 0.6989247311827957,
"eval_ORGANIZATION_recall": 0.8666666666666667,
"eval_PERSON_f1": 0.9006622516556291,
"eval_PERSON_number": 143,
"eval_PERSON_precision": 0.8553459119496856,
"eval_PERSON_recall": 0.951048951048951,
"eval_QUANTITY_f1": 0.6545454545454547,
"eval_QUANTITY_number": 23,
"eval_QUANTITY_precision": 0.5625,
"eval_QUANTITY_recall": 0.782608695652174,
"eval_TIME_f1": 0.8,
"eval_TIME_number": 26,
"eval_TIME_precision": 0.7586206896551724,
"eval_TIME_recall": 0.8461538461538461,
"eval_loss": 0.13851337134838104,
"eval_overall_accuracy": 0.9604703527645734,
"eval_overall_f1": 0.8267394270122784,
"eval_overall_precision": 0.7690355329949239,
"eval_overall_recall": 0.8938053097345132,
"eval_runtime": 0.3724,
"eval_samples_per_second": 502.102,
"eval_steps_per_second": 8.055,
"step": 7102
},
{
"epoch": 68.0,
"grad_norm": 0.9525014758110046,
"learning_rate": 1.6000000000000003e-05,
"loss": 0.0792,
"step": 7208
},
{
"epoch": 68.0,
"eval_LOCATION_f1": 0.7870967741935484,
"eval_LOCATION_number": 72,
"eval_LOCATION_precision": 0.7349397590361446,
"eval_LOCATION_recall": 0.8472222222222222,
"eval_ORGANIZATION_f1": 0.7570621468926553,
"eval_ORGANIZATION_number": 75,
"eval_ORGANIZATION_precision": 0.6568627450980392,
"eval_ORGANIZATION_recall": 0.8933333333333333,
"eval_PERSON_f1": 0.9072847682119206,
"eval_PERSON_number": 143,
"eval_PERSON_precision": 0.8616352201257862,
"eval_PERSON_recall": 0.958041958041958,
"eval_QUANTITY_f1": 0.6181818181818182,
"eval_QUANTITY_number": 23,
"eval_QUANTITY_precision": 0.53125,
"eval_QUANTITY_recall": 0.7391304347826086,
"eval_TIME_f1": 0.7636363636363636,
"eval_TIME_number": 26,
"eval_TIME_precision": 0.7241379310344828,
"eval_TIME_recall": 0.8076923076923077,
"eval_loss": 0.14804454147815704,
"eval_overall_accuracy": 0.9572179134350763,
"eval_overall_f1": 0.814516129032258,
"eval_overall_precision": 0.7481481481481481,
"eval_overall_recall": 0.8938053097345132,
"eval_runtime": 0.3712,
"eval_samples_per_second": 503.718,
"eval_steps_per_second": 8.081,
"step": 7208
},
{
"epoch": 69.0,
"grad_norm": 2.1547799110412598,
"learning_rate": 1.55e-05,
"loss": 0.0795,
"step": 7314
},
{
"epoch": 69.0,
"eval_LOCATION_f1": 0.8,
"eval_LOCATION_number": 72,
"eval_LOCATION_precision": 0.7469879518072289,
"eval_LOCATION_recall": 0.8611111111111112,
"eval_ORGANIZATION_f1": 0.7701149425287357,
"eval_ORGANIZATION_number": 75,
"eval_ORGANIZATION_precision": 0.6767676767676768,
"eval_ORGANIZATION_recall": 0.8933333333333333,
"eval_PERSON_f1": 0.8918032786885245,
"eval_PERSON_number": 143,
"eval_PERSON_precision": 0.8395061728395061,
"eval_PERSON_recall": 0.951048951048951,
"eval_QUANTITY_f1": 0.6545454545454547,
"eval_QUANTITY_number": 23,
"eval_QUANTITY_precision": 0.5625,
"eval_QUANTITY_recall": 0.782608695652174,
"eval_TIME_f1": 0.8,
"eval_TIME_number": 26,
"eval_TIME_precision": 0.7586206896551724,
"eval_TIME_recall": 0.8461538461538461,
"eval_loss": 0.1455415040254593,
"eval_overall_accuracy": 0.9584688516387291,
"eval_overall_f1": 0.8198924731182796,
"eval_overall_precision": 0.7530864197530864,
"eval_overall_recall": 0.8997050147492626,
"eval_runtime": 0.3711,
"eval_samples_per_second": 503.946,
"eval_steps_per_second": 8.085,
"step": 7314
},
{
"epoch": 70.0,
"grad_norm": 1.8800172805786133,
"learning_rate": 1.5e-05,
"loss": 0.0805,
"step": 7420
},
{
"epoch": 70.0,
"eval_LOCATION_f1": 0.8104575163398693,
"eval_LOCATION_number": 72,
"eval_LOCATION_precision": 0.7654320987654321,
"eval_LOCATION_recall": 0.8611111111111112,
"eval_ORGANIZATION_f1": 0.7738095238095238,
"eval_ORGANIZATION_number": 75,
"eval_ORGANIZATION_precision": 0.6989247311827957,
"eval_ORGANIZATION_recall": 0.8666666666666667,
"eval_PERSON_f1": 0.9013157894736843,
"eval_PERSON_number": 143,
"eval_PERSON_precision": 0.8509316770186336,
"eval_PERSON_recall": 0.958041958041958,
"eval_QUANTITY_f1": 0.6545454545454547,
"eval_QUANTITY_number": 23,
"eval_QUANTITY_precision": 0.5625,
"eval_QUANTITY_recall": 0.782608695652174,
"eval_TIME_f1": 0.8,
"eval_TIME_number": 26,
"eval_TIME_precision": 0.7586206896551724,
"eval_TIME_recall": 0.8461538461538461,
"eval_loss": 0.14219874143600464,
"eval_overall_accuracy": 0.9599699774831123,
"eval_overall_f1": 0.8272108843537416,
"eval_overall_precision": 0.7676767676767676,
"eval_overall_recall": 0.8967551622418879,
"eval_runtime": 0.3708,
"eval_samples_per_second": 504.365,
"eval_steps_per_second": 8.091,
"step": 7420
},
{
"epoch": 71.0,
"grad_norm": 2.311293363571167,
"learning_rate": 1.45e-05,
"loss": 0.0809,
"step": 7526
},
{
"epoch": 71.0,
"eval_LOCATION_f1": 0.8051948051948052,
"eval_LOCATION_number": 72,
"eval_LOCATION_precision": 0.7560975609756098,
"eval_LOCATION_recall": 0.8611111111111112,
"eval_ORGANIZATION_f1": 0.788235294117647,
"eval_ORGANIZATION_number": 75,
"eval_ORGANIZATION_precision": 0.7052631578947368,
"eval_ORGANIZATION_recall": 0.8933333333333333,
"eval_PERSON_f1": 0.9013157894736843,
"eval_PERSON_number": 143,
"eval_PERSON_precision": 0.8509316770186336,
"eval_PERSON_recall": 0.958041958041958,
"eval_QUANTITY_f1": 0.6545454545454547,
"eval_QUANTITY_number": 23,
"eval_QUANTITY_precision": 0.5625,
"eval_QUANTITY_recall": 0.782608695652174,
"eval_TIME_f1": 0.7636363636363636,
"eval_TIME_number": 26,
"eval_TIME_precision": 0.7241379310344828,
"eval_TIME_recall": 0.8076923076923077,
"eval_loss": 0.14474977552890778,
"eval_overall_accuracy": 0.9594696022016512,
"eval_overall_f1": 0.8265582655826559,
"eval_overall_precision": 0.7644110275689223,
"eval_overall_recall": 0.8997050147492626,
"eval_runtime": 0.3706,
"eval_samples_per_second": 504.553,
"eval_steps_per_second": 8.094,
"step": 7526
},
{
"epoch": 72.0,
"grad_norm": 1.1506495475769043,
"learning_rate": 1.4000000000000001e-05,
"loss": 0.0787,
"step": 7632
},
{
"epoch": 72.0,
"eval_LOCATION_f1": 0.7922077922077924,
"eval_LOCATION_number": 72,
"eval_LOCATION_precision": 0.7439024390243902,
"eval_LOCATION_recall": 0.8472222222222222,
"eval_ORGANIZATION_f1": 0.7976190476190477,
"eval_ORGANIZATION_number": 75,
"eval_ORGANIZATION_precision": 0.7204301075268817,
"eval_ORGANIZATION_recall": 0.8933333333333333,
"eval_PERSON_f1": 0.9013157894736843,
"eval_PERSON_number": 143,
"eval_PERSON_precision": 0.8509316770186336,
"eval_PERSON_recall": 0.958041958041958,
"eval_QUANTITY_f1": 0.6181818181818182,
"eval_QUANTITY_number": 23,
"eval_QUANTITY_precision": 0.53125,
"eval_QUANTITY_recall": 0.7391304347826086,
"eval_TIME_f1": 0.7636363636363636,
"eval_TIME_number": 26,
"eval_TIME_precision": 0.7241379310344828,
"eval_TIME_recall": 0.8076923076923077,
"eval_loss": 0.1447576880455017,
"eval_overall_accuracy": 0.9597197898423818,
"eval_overall_f1": 0.8233695652173914,
"eval_overall_precision": 0.7632241813602015,
"eval_overall_recall": 0.8938053097345132,
"eval_runtime": 0.3738,
"eval_samples_per_second": 500.28,
"eval_steps_per_second": 8.026,
"step": 7632
},
{
"epoch": 73.0,
"grad_norm": 1.78630793094635,
"learning_rate": 1.3500000000000001e-05,
"loss": 0.0792,
"step": 7738
},
{
"epoch": 73.0,
"eval_LOCATION_f1": 0.7922077922077924,
"eval_LOCATION_number": 72,
"eval_LOCATION_precision": 0.7439024390243902,
"eval_LOCATION_recall": 0.8472222222222222,
"eval_ORGANIZATION_f1": 0.7590361445783131,
"eval_ORGANIZATION_number": 75,
"eval_ORGANIZATION_precision": 0.6923076923076923,
"eval_ORGANIZATION_recall": 0.84,
"eval_PERSON_f1": 0.9013157894736843,
"eval_PERSON_number": 143,
"eval_PERSON_precision": 0.8509316770186336,
"eval_PERSON_recall": 0.958041958041958,
"eval_QUANTITY_f1": 0.6792452830188679,
"eval_QUANTITY_number": 23,
"eval_QUANTITY_precision": 0.6,
"eval_QUANTITY_recall": 0.782608695652174,
"eval_TIME_f1": 0.8,
"eval_TIME_number": 26,
"eval_TIME_precision": 0.7586206896551724,
"eval_TIME_recall": 0.8461538461538461,
"eval_loss": 0.14058354496955872,
"eval_overall_accuracy": 0.9602201651238429,
"eval_overall_f1": 0.8224043715846995,
"eval_overall_precision": 0.7659033078880407,
"eval_overall_recall": 0.887905604719764,
"eval_runtime": 0.3699,
"eval_samples_per_second": 505.587,
"eval_steps_per_second": 8.111,
"step": 7738
},
{
"epoch": 74.0,
"grad_norm": 1.3375426530838013,
"learning_rate": 1.3000000000000001e-05,
"loss": 0.078,
"step": 7844
},
{
"epoch": 74.0,
"eval_LOCATION_f1": 0.7922077922077924,
"eval_LOCATION_number": 72,
"eval_LOCATION_precision": 0.7439024390243902,
"eval_LOCATION_recall": 0.8472222222222222,
"eval_ORGANIZATION_f1": 0.7857142857142856,
"eval_ORGANIZATION_number": 75,
"eval_ORGANIZATION_precision": 0.7096774193548387,
"eval_ORGANIZATION_recall": 0.88,
"eval_PERSON_f1": 0.8976897689768978,
"eval_PERSON_number": 143,
"eval_PERSON_precision": 0.85,
"eval_PERSON_recall": 0.951048951048951,
"eval_QUANTITY_f1": 0.6071428571428571,
"eval_QUANTITY_number": 23,
"eval_QUANTITY_precision": 0.5151515151515151,
"eval_QUANTITY_recall": 0.7391304347826086,
"eval_TIME_f1": 0.7636363636363636,
"eval_TIME_number": 26,
"eval_TIME_precision": 0.7241379310344828,
"eval_TIME_recall": 0.8076923076923077,
"eval_loss": 0.14712856709957123,
"eval_overall_accuracy": 0.9582186639979985,
"eval_overall_f1": 0.8179347826086957,
"eval_overall_precision": 0.7581863979848866,
"eval_overall_recall": 0.887905604719764,
"eval_runtime": 0.3703,
"eval_samples_per_second": 505.025,
"eval_steps_per_second": 8.102,
"step": 7844
},
{
"epoch": 75.0,
"grad_norm": 1.585189938545227,
"learning_rate": 1.25e-05,
"loss": 0.0773,
"step": 7950
},
{
"epoch": 75.0,
"eval_LOCATION_f1": 0.7922077922077924,
"eval_LOCATION_number": 72,
"eval_LOCATION_precision": 0.7439024390243902,
"eval_LOCATION_recall": 0.8472222222222222,
"eval_ORGANIZATION_f1": 0.783625730994152,
"eval_ORGANIZATION_number": 75,
"eval_ORGANIZATION_precision": 0.6979166666666666,
"eval_ORGANIZATION_recall": 0.8933333333333333,
"eval_PERSON_f1": 0.9013157894736843,
"eval_PERSON_number": 143,
"eval_PERSON_precision": 0.8509316770186336,
"eval_PERSON_recall": 0.958041958041958,
"eval_QUANTITY_f1": 0.6545454545454547,
"eval_QUANTITY_number": 23,
"eval_QUANTITY_precision": 0.5625,
"eval_QUANTITY_recall": 0.782608695652174,
"eval_TIME_f1": 0.7636363636363636,
"eval_TIME_number": 26,
"eval_TIME_precision": 0.7241379310344828,
"eval_TIME_recall": 0.8076923076923077,
"eval_loss": 0.1459941565990448,
"eval_overall_accuracy": 0.9589692269201902,
"eval_overall_f1": 0.8227334235453315,
"eval_overall_precision": 0.76,
"eval_overall_recall": 0.8967551622418879,
"eval_runtime": 0.3706,
"eval_samples_per_second": 504.644,
"eval_steps_per_second": 8.096,
"step": 7950
},
{
"epoch": 76.0,
"grad_norm": 1.1429756879806519,
"learning_rate": 1.2e-05,
"loss": 0.0772,
"step": 8056
},
{
"epoch": 76.0,
"eval_LOCATION_f1": 0.8051948051948052,
"eval_LOCATION_number": 72,
"eval_LOCATION_precision": 0.7560975609756098,
"eval_LOCATION_recall": 0.8611111111111112,
"eval_ORGANIZATION_f1": 0.783625730994152,
"eval_ORGANIZATION_number": 75,
"eval_ORGANIZATION_precision": 0.6979166666666666,
"eval_ORGANIZATION_recall": 0.8933333333333333,
"eval_PERSON_f1": 0.9042904290429041,
"eval_PERSON_number": 143,
"eval_PERSON_precision": 0.85625,
"eval_PERSON_recall": 0.958041958041958,
"eval_QUANTITY_f1": 0.6545454545454547,
"eval_QUANTITY_number": 23,
"eval_QUANTITY_precision": 0.5625,
"eval_QUANTITY_recall": 0.782608695652174,
"eval_TIME_f1": 0.7636363636363636,
"eval_TIME_number": 26,
"eval_TIME_precision": 0.7241379310344828,
"eval_TIME_recall": 0.8076923076923077,
"eval_loss": 0.14840912818908691,
"eval_overall_accuracy": 0.9584688516387291,
"eval_overall_f1": 0.8265582655826559,
"eval_overall_precision": 0.7644110275689223,
"eval_overall_recall": 0.8997050147492626,
"eval_runtime": 0.3692,
"eval_samples_per_second": 506.499,
"eval_steps_per_second": 8.126,
"step": 8056
},
{
"epoch": 77.0,
"grad_norm": 1.014310359954834,
"learning_rate": 1.1500000000000002e-05,
"loss": 0.0767,
"step": 8162
},
{
"epoch": 77.0,
"eval_LOCATION_f1": 0.8051948051948052,
"eval_LOCATION_number": 72,
"eval_LOCATION_precision": 0.7560975609756098,
"eval_LOCATION_recall": 0.8611111111111112,
"eval_ORGANIZATION_f1": 0.7790697674418604,
"eval_ORGANIZATION_number": 75,
"eval_ORGANIZATION_precision": 0.6907216494845361,
"eval_ORGANIZATION_recall": 0.8933333333333333,
"eval_PERSON_f1": 0.9072847682119206,
"eval_PERSON_number": 143,
"eval_PERSON_precision": 0.8616352201257862,
"eval_PERSON_recall": 0.958041958041958,
"eval_QUANTITY_f1": 0.6071428571428571,
"eval_QUANTITY_number": 23,
"eval_QUANTITY_precision": 0.5151515151515151,
"eval_QUANTITY_recall": 0.7391304347826086,
"eval_TIME_f1": 0.7636363636363636,
"eval_TIME_number": 26,
"eval_TIME_precision": 0.7241379310344828,
"eval_TIME_recall": 0.8076923076923077,
"eval_loss": 0.15152573585510254,
"eval_overall_accuracy": 0.9574681010758068,
"eval_overall_f1": 0.8227334235453315,
"eval_overall_precision": 0.76,
"eval_overall_recall": 0.8967551622418879,
"eval_runtime": 0.3708,
"eval_samples_per_second": 504.318,
"eval_steps_per_second": 8.091,
"step": 8162
},
{
"epoch": 78.0,
"grad_norm": 1.17866051197052,
"learning_rate": 1.1000000000000001e-05,
"loss": 0.0757,
"step": 8268
},
{
"epoch": 78.0,
"eval_LOCATION_f1": 0.8289473684210527,
"eval_LOCATION_number": 72,
"eval_LOCATION_precision": 0.7875,
"eval_LOCATION_recall": 0.875,
"eval_ORGANIZATION_f1": 0.7682926829268292,
"eval_ORGANIZATION_number": 75,
"eval_ORGANIZATION_precision": 0.7078651685393258,
"eval_ORGANIZATION_recall": 0.84,
"eval_PERSON_f1": 0.8970099667774087,
"eval_PERSON_number": 143,
"eval_PERSON_precision": 0.8544303797468354,
"eval_PERSON_recall": 0.9440559440559441,
"eval_QUANTITY_f1": 0.6545454545454547,
"eval_QUANTITY_number": 23,
"eval_QUANTITY_precision": 0.5625,
"eval_QUANTITY_recall": 0.782608695652174,
"eval_TIME_f1": 0.7636363636363636,
"eval_TIME_number": 26,
"eval_TIME_precision": 0.7241379310344828,
"eval_TIME_recall": 0.8076923076923077,
"eval_loss": 0.14352728426456451,
"eval_overall_accuracy": 0.9589692269201902,
"eval_overall_f1": 0.8253094910591473,
"eval_overall_precision": 0.7731958762886598,
"eval_overall_recall": 0.8849557522123894,
"eval_runtime": 0.374,
"eval_samples_per_second": 500.053,
"eval_steps_per_second": 8.022,
"step": 8268
},
{
"epoch": 79.0,
"grad_norm": 2.2889716625213623,
"learning_rate": 1.05e-05,
"loss": 0.0767,
"step": 8374
},
{
"epoch": 79.0,
"eval_LOCATION_f1": 0.8104575163398693,
"eval_LOCATION_number": 72,
"eval_LOCATION_precision": 0.7654320987654321,
"eval_LOCATION_recall": 0.8611111111111112,
"eval_ORGANIZATION_f1": 0.7904191616766466,
"eval_ORGANIZATION_number": 75,
"eval_ORGANIZATION_precision": 0.717391304347826,
"eval_ORGANIZATION_recall": 0.88,
"eval_PERSON_f1": 0.9042904290429041,
"eval_PERSON_number": 143,
"eval_PERSON_precision": 0.85625,
"eval_PERSON_recall": 0.958041958041958,
"eval_QUANTITY_f1": 0.6181818181818182,
"eval_QUANTITY_number": 23,
"eval_QUANTITY_precision": 0.53125,
"eval_QUANTITY_recall": 0.7391304347826086,
"eval_TIME_f1": 0.7636363636363636,
"eval_TIME_number": 26,
"eval_TIME_precision": 0.7241379310344828,
"eval_TIME_recall": 0.8076923076923077,
"eval_loss": 0.14561718702316284,
"eval_overall_accuracy": 0.9602201651238429,
"eval_overall_f1": 0.8267394270122784,
"eval_overall_precision": 0.7690355329949239,
"eval_overall_recall": 0.8938053097345132,
"eval_runtime": 0.3708,
"eval_samples_per_second": 504.277,
"eval_steps_per_second": 8.09,
"step": 8374
},
{
"epoch": 80.0,
"grad_norm": 0.5872527956962585,
"learning_rate": 1e-05,
"loss": 0.0752,
"step": 8480
},
{
"epoch": 80.0,
"eval_LOCATION_f1": 0.823529411764706,
"eval_LOCATION_number": 72,
"eval_LOCATION_precision": 0.7777777777777778,
"eval_LOCATION_recall": 0.875,
"eval_ORGANIZATION_f1": 0.7570621468926553,
"eval_ORGANIZATION_number": 75,
"eval_ORGANIZATION_precision": 0.6568627450980392,
"eval_ORGANIZATION_recall": 0.8933333333333333,
"eval_PERSON_f1": 0.9042904290429041,
"eval_PERSON_number": 143,
"eval_PERSON_precision": 0.85625,
"eval_PERSON_recall": 0.958041958041958,
"eval_QUANTITY_f1": 0.6071428571428571,
"eval_QUANTITY_number": 23,
"eval_QUANTITY_precision": 0.5151515151515151,
"eval_QUANTITY_recall": 0.7391304347826086,
"eval_TIME_f1": 0.7142857142857142,
"eval_TIME_number": 26,
"eval_TIME_precision": 0.6666666666666666,
"eval_TIME_recall": 0.7692307692307693,
"eval_loss": 0.15562912821769714,
"eval_overall_accuracy": 0.9554665999499625,
"eval_overall_f1": 0.8161073825503355,
"eval_overall_precision": 0.7487684729064039,
"eval_overall_recall": 0.8967551622418879,
"eval_runtime": 0.3781,
"eval_samples_per_second": 494.629,
"eval_steps_per_second": 7.935,
"step": 8480
},
{
"epoch": 81.0,
"grad_norm": 1.4843671321868896,
"learning_rate": 9.5e-06,
"loss": 0.078,
"step": 8586
},
{
"epoch": 81.0,
"eval_LOCATION_f1": 0.8051948051948052,
"eval_LOCATION_number": 72,
"eval_LOCATION_precision": 0.7560975609756098,
"eval_LOCATION_recall": 0.8611111111111112,
"eval_ORGANIZATION_f1": 0.7810650887573964,
"eval_ORGANIZATION_number": 75,
"eval_ORGANIZATION_precision": 0.7021276595744681,
"eval_ORGANIZATION_recall": 0.88,
"eval_PERSON_f1": 0.9013157894736843,
"eval_PERSON_number": 143,
"eval_PERSON_precision": 0.8509316770186336,
"eval_PERSON_recall": 0.958041958041958,
"eval_QUANTITY_f1": 0.6545454545454547,
"eval_QUANTITY_number": 23,
"eval_QUANTITY_precision": 0.5625,
"eval_QUANTITY_recall": 0.782608695652174,
"eval_TIME_f1": 0.75,
"eval_TIME_number": 26,
"eval_TIME_precision": 0.7,
"eval_TIME_recall": 0.8076923076923077,
"eval_loss": 0.14394411444664001,
"eval_overall_accuracy": 0.9599699774831123,
"eval_overall_f1": 0.8238482384823848,
"eval_overall_precision": 0.7619047619047619,
"eval_overall_recall": 0.8967551622418879,
"eval_runtime": 0.3729,
"eval_samples_per_second": 501.415,
"eval_steps_per_second": 8.044,
"step": 8586
},
{
"epoch": 82.0,
"grad_norm": 1.6159791946411133,
"learning_rate": 9e-06,
"loss": 0.0733,
"step": 8692
},
{
"epoch": 82.0,
"eval_LOCATION_f1": 0.8051948051948052,
"eval_LOCATION_number": 72,
"eval_LOCATION_precision": 0.7560975609756098,
"eval_LOCATION_recall": 0.8611111111111112,
"eval_ORGANIZATION_f1": 0.788235294117647,
"eval_ORGANIZATION_number": 75,
"eval_ORGANIZATION_precision": 0.7052631578947368,
"eval_ORGANIZATION_recall": 0.8933333333333333,
"eval_PERSON_f1": 0.8976897689768978,
"eval_PERSON_number": 143,
"eval_PERSON_precision": 0.85,
"eval_PERSON_recall": 0.951048951048951,
"eval_QUANTITY_f1": 0.6071428571428571,
"eval_QUANTITY_number": 23,
"eval_QUANTITY_precision": 0.5151515151515151,
"eval_QUANTITY_recall": 0.7391304347826086,
"eval_TIME_f1": 0.7142857142857142,
"eval_TIME_number": 26,
"eval_TIME_precision": 0.6666666666666666,
"eval_TIME_recall": 0.7692307692307693,
"eval_loss": 0.14782680571079254,
"eval_overall_accuracy": 0.9587190392794596,
"eval_overall_f1": 0.817320703653586,
"eval_overall_precision": 0.755,
"eval_overall_recall": 0.8908554572271387,
"eval_runtime": 0.3733,
"eval_samples_per_second": 500.893,
"eval_steps_per_second": 8.036,
"step": 8692
},
{
"epoch": 83.0,
"grad_norm": 1.871289610862732,
"learning_rate": 8.500000000000002e-06,
"loss": 0.0747,
"step": 8798
},
{
"epoch": 83.0,
"eval_LOCATION_f1": 0.7973856209150327,
"eval_LOCATION_number": 72,
"eval_LOCATION_precision": 0.7530864197530864,
"eval_LOCATION_recall": 0.8472222222222222,
"eval_ORGANIZATION_f1": 0.7831325301204819,
"eval_ORGANIZATION_number": 75,
"eval_ORGANIZATION_precision": 0.7142857142857143,
"eval_ORGANIZATION_recall": 0.8666666666666667,
"eval_PERSON_f1": 0.8976897689768978,
"eval_PERSON_number": 143,
"eval_PERSON_precision": 0.85,
"eval_PERSON_recall": 0.951048951048951,
"eval_QUANTITY_f1": 0.6545454545454547,
"eval_QUANTITY_number": 23,
"eval_QUANTITY_precision": 0.5625,
"eval_QUANTITY_recall": 0.782608695652174,
"eval_TIME_f1": 0.7636363636363636,
"eval_TIME_number": 26,
"eval_TIME_precision": 0.7241379310344828,
"eval_TIME_recall": 0.8076923076923077,
"eval_loss": 0.14479823410511017,
"eval_overall_accuracy": 0.9599699774831123,
"eval_overall_f1": 0.8224043715846995,
"eval_overall_precision": 0.7659033078880407,
"eval_overall_recall": 0.887905604719764,
"eval_runtime": 0.3747,
"eval_samples_per_second": 499.023,
"eval_steps_per_second": 8.006,
"step": 8798
},
{
"epoch": 84.0,
"grad_norm": 2.436727285385132,
"learning_rate": 8.000000000000001e-06,
"loss": 0.0755,
"step": 8904
},
{
"epoch": 84.0,
"eval_LOCATION_f1": 0.8051948051948052,
"eval_LOCATION_number": 72,
"eval_LOCATION_precision": 0.7560975609756098,
"eval_LOCATION_recall": 0.8611111111111112,
"eval_ORGANIZATION_f1": 0.7928994082840236,
"eval_ORGANIZATION_number": 75,
"eval_ORGANIZATION_precision": 0.7127659574468085,
"eval_ORGANIZATION_recall": 0.8933333333333333,
"eval_PERSON_f1": 0.8976897689768978,
"eval_PERSON_number": 143,
"eval_PERSON_precision": 0.85,
"eval_PERSON_recall": 0.951048951048951,
"eval_QUANTITY_f1": 0.6071428571428571,
"eval_QUANTITY_number": 23,
"eval_QUANTITY_precision": 0.5151515151515151,
"eval_QUANTITY_recall": 0.7391304347826086,
"eval_TIME_f1": 0.7777777777777779,
"eval_TIME_number": 26,
"eval_TIME_precision": 0.75,
"eval_TIME_recall": 0.8076923076923077,
"eval_loss": 0.14651836454868317,
"eval_overall_accuracy": 0.9597197898423818,
"eval_overall_f1": 0.8233695652173914,
"eval_overall_precision": 0.7632241813602015,
"eval_overall_recall": 0.8938053097345132,
"eval_runtime": 0.3731,
"eval_samples_per_second": 501.201,
"eval_steps_per_second": 8.041,
"step": 8904
},
{
"epoch": 85.0,
"grad_norm": 1.8641331195831299,
"learning_rate": 7.5e-06,
"loss": 0.0757,
"step": 9010
},
{
"epoch": 85.0,
"eval_LOCATION_f1": 0.8051948051948052,
"eval_LOCATION_number": 72,
"eval_LOCATION_precision": 0.7560975609756098,
"eval_LOCATION_recall": 0.8611111111111112,
"eval_ORGANIZATION_f1": 0.7682926829268292,
"eval_ORGANIZATION_number": 75,
"eval_ORGANIZATION_precision": 0.7078651685393258,
"eval_ORGANIZATION_recall": 0.84,
"eval_PERSON_f1": 0.8881578947368421,
"eval_PERSON_number": 143,
"eval_PERSON_precision": 0.8385093167701864,
"eval_PERSON_recall": 0.9440559440559441,
"eval_QUANTITY_f1": 0.6545454545454547,
"eval_QUANTITY_number": 23,
"eval_QUANTITY_precision": 0.5625,
"eval_QUANTITY_recall": 0.782608695652174,
"eval_TIME_f1": 0.7636363636363636,
"eval_TIME_number": 26,
"eval_TIME_precision": 0.7241379310344828,
"eval_TIME_recall": 0.8076923076923077,
"eval_loss": 0.14340606331825256,
"eval_overall_accuracy": 0.9592194145609206,
"eval_overall_f1": 0.8169398907103824,
"eval_overall_precision": 0.7608142493638677,
"eval_overall_recall": 0.8820058997050148,
"eval_runtime": 0.3727,
"eval_samples_per_second": 501.795,
"eval_steps_per_second": 8.05,
"step": 9010
},
{
"epoch": 86.0,
"grad_norm": 2.203537702560425,
"learning_rate": 7.000000000000001e-06,
"loss": 0.076,
"step": 9116
},
{
"epoch": 86.0,
"eval_LOCATION_f1": 0.8051948051948052,
"eval_LOCATION_number": 72,
"eval_LOCATION_precision": 0.7560975609756098,
"eval_LOCATION_recall": 0.8611111111111112,
"eval_ORGANIZATION_f1": 0.7710843373493976,
"eval_ORGANIZATION_number": 75,
"eval_ORGANIZATION_precision": 0.7032967032967034,
"eval_ORGANIZATION_recall": 0.8533333333333334,
"eval_PERSON_f1": 0.8976897689768978,
"eval_PERSON_number": 143,
"eval_PERSON_precision": 0.85,
"eval_PERSON_recall": 0.951048951048951,
"eval_QUANTITY_f1": 0.6181818181818182,
"eval_QUANTITY_number": 23,
"eval_QUANTITY_precision": 0.53125,
"eval_QUANTITY_recall": 0.7391304347826086,
"eval_TIME_f1": 0.7636363636363636,
"eval_TIME_number": 26,
"eval_TIME_precision": 0.7241379310344828,
"eval_TIME_recall": 0.8076923076923077,
"eval_loss": 0.1468215435743332,
"eval_overall_accuracy": 0.9587190392794596,
"eval_overall_f1": 0.8185538881309687,
"eval_overall_precision": 0.7614213197969543,
"eval_overall_recall": 0.8849557522123894,
"eval_runtime": 0.3717,
"eval_samples_per_second": 503.095,
"eval_steps_per_second": 8.071,
"step": 9116
},
{
"epoch": 87.0,
"grad_norm": 1.147968053817749,
"learning_rate": 6.5000000000000004e-06,
"loss": 0.0721,
"step": 9222
},
{
"epoch": 87.0,
"eval_LOCATION_f1": 0.8051948051948052,
"eval_LOCATION_number": 72,
"eval_LOCATION_precision": 0.7560975609756098,
"eval_LOCATION_recall": 0.8611111111111112,
"eval_ORGANIZATION_f1": 0.7710843373493976,
"eval_ORGANIZATION_number": 75,
"eval_ORGANIZATION_precision": 0.7032967032967034,
"eval_ORGANIZATION_recall": 0.8533333333333334,
"eval_PERSON_f1": 0.8947368421052632,
"eval_PERSON_number": 143,
"eval_PERSON_precision": 0.84472049689441,
"eval_PERSON_recall": 0.951048951048951,
"eval_QUANTITY_f1": 0.6545454545454547,
"eval_QUANTITY_number": 23,
"eval_QUANTITY_precision": 0.5625,
"eval_QUANTITY_recall": 0.782608695652174,
"eval_TIME_f1": 0.7777777777777779,
"eval_TIME_number": 26,
"eval_TIME_precision": 0.75,
"eval_TIME_recall": 0.8076923076923077,
"eval_loss": 0.14543673396110535,
"eval_overall_accuracy": 0.9592194145609206,
"eval_overall_f1": 0.8212824010914053,
"eval_overall_precision": 0.7639593908629442,
"eval_overall_recall": 0.887905604719764,
"eval_runtime": 0.3713,
"eval_samples_per_second": 503.66,
"eval_steps_per_second": 8.08,
"step": 9222
},
{
"epoch": 88.0,
"grad_norm": 1.8473503589630127,
"learning_rate": 6e-06,
"loss": 0.0724,
"step": 9328
},
{
"epoch": 88.0,
"eval_LOCATION_f1": 0.8051948051948052,
"eval_LOCATION_number": 72,
"eval_LOCATION_precision": 0.7560975609756098,
"eval_LOCATION_recall": 0.8611111111111112,
"eval_ORGANIZATION_f1": 0.7784431137724551,
"eval_ORGANIZATION_number": 75,
"eval_ORGANIZATION_precision": 0.7065217391304348,
"eval_ORGANIZATION_recall": 0.8666666666666667,
"eval_PERSON_f1": 0.8976897689768978,
"eval_PERSON_number": 143,
"eval_PERSON_precision": 0.85,
"eval_PERSON_recall": 0.951048951048951,
"eval_QUANTITY_f1": 0.6666666666666667,
"eval_QUANTITY_number": 23,
"eval_QUANTITY_precision": 0.5806451612903226,
"eval_QUANTITY_recall": 0.782608695652174,
"eval_TIME_f1": 0.7636363636363636,
"eval_TIME_number": 26,
"eval_TIME_precision": 0.7241379310344828,
"eval_TIME_recall": 0.8076923076923077,
"eval_loss": 0.14697220921516418,
"eval_overall_accuracy": 0.9594696022016512,
"eval_overall_f1": 0.8240109140518419,
"eval_overall_precision": 0.766497461928934,
"eval_overall_recall": 0.8908554572271387,
"eval_runtime": 0.3718,
"eval_samples_per_second": 502.894,
"eval_steps_per_second": 8.068,
"step": 9328
},
{
"epoch": 89.0,
"grad_norm": 1.6724920272827148,
"learning_rate": 5.500000000000001e-06,
"loss": 0.074,
"step": 9434
},
{
"epoch": 89.0,
"eval_LOCATION_f1": 0.8051948051948052,
"eval_LOCATION_number": 72,
"eval_LOCATION_precision": 0.7560975609756098,
"eval_LOCATION_recall": 0.8611111111111112,
"eval_ORGANIZATION_f1": 0.7738095238095238,
"eval_ORGANIZATION_number": 75,
"eval_ORGANIZATION_precision": 0.6989247311827957,
"eval_ORGANIZATION_recall": 0.8666666666666667,
"eval_PERSON_f1": 0.8976897689768978,
"eval_PERSON_number": 143,
"eval_PERSON_precision": 0.85,
"eval_PERSON_recall": 0.951048951048951,
"eval_QUANTITY_f1": 0.6545454545454547,
"eval_QUANTITY_number": 23,
"eval_QUANTITY_precision": 0.5625,
"eval_QUANTITY_recall": 0.782608695652174,
"eval_TIME_f1": 0.7636363636363636,
"eval_TIME_number": 26,
"eval_TIME_precision": 0.7241379310344828,
"eval_TIME_recall": 0.8076923076923077,
"eval_loss": 0.14885887503623962,
"eval_overall_accuracy": 0.9589692269201902,
"eval_overall_f1": 0.8217687074829931,
"eval_overall_precision": 0.7626262626262627,
"eval_overall_recall": 0.8908554572271387,
"eval_runtime": 0.373,
"eval_samples_per_second": 501.288,
"eval_steps_per_second": 8.042,
"step": 9434
},
{
"epoch": 90.0,
"grad_norm": 1.6046056747436523,
"learning_rate": 5e-06,
"loss": 0.0721,
"step": 9540
},
{
"epoch": 90.0,
"eval_LOCATION_f1": 0.8051948051948052,
"eval_LOCATION_number": 72,
"eval_LOCATION_precision": 0.7560975609756098,
"eval_LOCATION_recall": 0.8611111111111112,
"eval_ORGANIZATION_f1": 0.7810650887573964,
"eval_ORGANIZATION_number": 75,
"eval_ORGANIZATION_precision": 0.7021276595744681,
"eval_ORGANIZATION_recall": 0.88,
"eval_PERSON_f1": 0.8976897689768978,
"eval_PERSON_number": 143,
"eval_PERSON_precision": 0.85,
"eval_PERSON_recall": 0.951048951048951,
"eval_QUANTITY_f1": 0.6071428571428571,
"eval_QUANTITY_number": 23,
"eval_QUANTITY_precision": 0.5151515151515151,
"eval_QUANTITY_recall": 0.7391304347826086,
"eval_TIME_f1": 0.7636363636363636,
"eval_TIME_number": 26,
"eval_TIME_precision": 0.7241379310344828,
"eval_TIME_recall": 0.8076923076923077,
"eval_loss": 0.14962825179100037,
"eval_overall_accuracy": 0.9587190392794596,
"eval_overall_f1": 0.819538670284939,
"eval_overall_precision": 0.7587939698492462,
"eval_overall_recall": 0.8908554572271387,
"eval_runtime": 0.3743,
"eval_samples_per_second": 499.541,
"eval_steps_per_second": 8.014,
"step": 9540
},
{
"epoch": 91.0,
"grad_norm": 0.5925461649894714,
"learning_rate": 4.5e-06,
"loss": 0.0766,
"step": 9646
},
{
"epoch": 91.0,
"eval_LOCATION_f1": 0.8051948051948052,
"eval_LOCATION_number": 72,
"eval_LOCATION_precision": 0.7560975609756098,
"eval_LOCATION_recall": 0.8611111111111112,
"eval_ORGANIZATION_f1": 0.7664670658682634,
"eval_ORGANIZATION_number": 75,
"eval_ORGANIZATION_precision": 0.6956521739130435,
"eval_ORGANIZATION_recall": 0.8533333333333334,
"eval_PERSON_f1": 0.8881578947368421,
"eval_PERSON_number": 143,
"eval_PERSON_precision": 0.8385093167701864,
"eval_PERSON_recall": 0.9440559440559441,
"eval_QUANTITY_f1": 0.6071428571428571,
"eval_QUANTITY_number": 23,
"eval_QUANTITY_precision": 0.5151515151515151,
"eval_QUANTITY_recall": 0.7391304347826086,
"eval_TIME_f1": 0.7636363636363636,
"eval_TIME_number": 26,
"eval_TIME_precision": 0.7241379310344828,
"eval_TIME_recall": 0.8076923076923077,
"eval_loss": 0.14539198577404022,
"eval_overall_accuracy": 0.9587190392794596,
"eval_overall_f1": 0.8125000000000001,
"eval_overall_precision": 0.7531486146095718,
"eval_overall_recall": 0.8820058997050148,
"eval_runtime": 0.3743,
"eval_samples_per_second": 499.533,
"eval_steps_per_second": 8.014,
"step": 9646
},
{
"epoch": 92.0,
"grad_norm": 2.1363561153411865,
"learning_rate": 4.000000000000001e-06,
"loss": 0.075,
"step": 9752
},
{
"epoch": 92.0,
"eval_LOCATION_f1": 0.8051948051948052,
"eval_LOCATION_number": 72,
"eval_LOCATION_precision": 0.7560975609756098,
"eval_LOCATION_recall": 0.8611111111111112,
"eval_ORGANIZATION_f1": 0.7810650887573964,
"eval_ORGANIZATION_number": 75,
"eval_ORGANIZATION_precision": 0.7021276595744681,
"eval_ORGANIZATION_recall": 0.88,
"eval_PERSON_f1": 0.8947368421052632,
"eval_PERSON_number": 143,
"eval_PERSON_precision": 0.84472049689441,
"eval_PERSON_recall": 0.951048951048951,
"eval_QUANTITY_f1": 0.6071428571428571,
"eval_QUANTITY_number": 23,
"eval_QUANTITY_precision": 0.5151515151515151,
"eval_QUANTITY_recall": 0.7391304347826086,
"eval_TIME_f1": 0.7636363636363636,
"eval_TIME_number": 26,
"eval_TIME_precision": 0.7241379310344828,
"eval_TIME_recall": 0.8076923076923077,
"eval_loss": 0.1483411341905594,
"eval_overall_accuracy": 0.9587190392794596,
"eval_overall_f1": 0.8184281842818428,
"eval_overall_precision": 0.7568922305764411,
"eval_overall_recall": 0.8908554572271387,
"eval_runtime": 0.3707,
"eval_samples_per_second": 504.407,
"eval_steps_per_second": 8.092,
"step": 9752
},
{
"epoch": 93.0,
"grad_norm": 0.5211588144302368,
"learning_rate": 3.5000000000000004e-06,
"loss": 0.0713,
"step": 9858
},
{
"epoch": 93.0,
"eval_LOCATION_f1": 0.8051948051948052,
"eval_LOCATION_number": 72,
"eval_LOCATION_precision": 0.7560975609756098,
"eval_LOCATION_recall": 0.8611111111111112,
"eval_ORGANIZATION_f1": 0.7810650887573964,
"eval_ORGANIZATION_number": 75,
"eval_ORGANIZATION_precision": 0.7021276595744681,
"eval_ORGANIZATION_recall": 0.88,
"eval_PERSON_f1": 0.8910891089108911,
"eval_PERSON_number": 143,
"eval_PERSON_precision": 0.84375,
"eval_PERSON_recall": 0.9440559440559441,
"eval_QUANTITY_f1": 0.6071428571428571,
"eval_QUANTITY_number": 23,
"eval_QUANTITY_precision": 0.5151515151515151,
"eval_QUANTITY_recall": 0.7391304347826086,
"eval_TIME_f1": 0.7636363636363636,
"eval_TIME_number": 26,
"eval_TIME_precision": 0.7241379310344828,
"eval_TIME_recall": 0.8076923076923077,
"eval_loss": 0.14794917404651642,
"eval_overall_accuracy": 0.9587190392794596,
"eval_overall_f1": 0.8168249660786975,
"eval_overall_precision": 0.7562814070351759,
"eval_overall_recall": 0.887905604719764,
"eval_runtime": 0.374,
"eval_samples_per_second": 500.047,
"eval_steps_per_second": 8.022,
"step": 9858
},
{
"epoch": 94.0,
"grad_norm": 0.8026951551437378,
"learning_rate": 3e-06,
"loss": 0.0727,
"step": 9964
},
{
"epoch": 94.0,
"eval_LOCATION_f1": 0.8051948051948052,
"eval_LOCATION_number": 72,
"eval_LOCATION_precision": 0.7560975609756098,
"eval_LOCATION_recall": 0.8611111111111112,
"eval_ORGANIZATION_f1": 0.7810650887573964,
"eval_ORGANIZATION_number": 75,
"eval_ORGANIZATION_precision": 0.7021276595744681,
"eval_ORGANIZATION_recall": 0.88,
"eval_PERSON_f1": 0.9013157894736843,
"eval_PERSON_number": 143,
"eval_PERSON_precision": 0.8509316770186336,
"eval_PERSON_recall": 0.958041958041958,
"eval_QUANTITY_f1": 0.6071428571428571,
"eval_QUANTITY_number": 23,
"eval_QUANTITY_precision": 0.5151515151515151,
"eval_QUANTITY_recall": 0.7391304347826086,
"eval_TIME_f1": 0.7636363636363636,
"eval_TIME_number": 26,
"eval_TIME_precision": 0.7241379310344828,
"eval_TIME_recall": 0.8076923076923077,
"eval_loss": 0.1480274349451065,
"eval_overall_accuracy": 0.9589692269201902,
"eval_overall_f1": 0.8211382113821138,
"eval_overall_precision": 0.7593984962406015,
"eval_overall_recall": 0.8938053097345132,
"eval_runtime": 0.3712,
"eval_samples_per_second": 503.809,
"eval_steps_per_second": 8.083,
"step": 9964
},
{
"epoch": 95.0,
"grad_norm": 0.5980091691017151,
"learning_rate": 2.5e-06,
"loss": 0.0726,
"step": 10070
},
{
"epoch": 95.0,
"eval_LOCATION_f1": 0.8051948051948052,
"eval_LOCATION_number": 72,
"eval_LOCATION_precision": 0.7560975609756098,
"eval_LOCATION_recall": 0.8611111111111112,
"eval_ORGANIZATION_f1": 0.7857142857142856,
"eval_ORGANIZATION_number": 75,
"eval_ORGANIZATION_precision": 0.7096774193548387,
"eval_ORGANIZATION_recall": 0.88,
"eval_PERSON_f1": 0.8947368421052632,
"eval_PERSON_number": 143,
"eval_PERSON_precision": 0.84472049689441,
"eval_PERSON_recall": 0.951048951048951,
"eval_QUANTITY_f1": 0.6071428571428571,
"eval_QUANTITY_number": 23,
"eval_QUANTITY_precision": 0.5151515151515151,
"eval_QUANTITY_recall": 0.7391304347826086,
"eval_TIME_f1": 0.7636363636363636,
"eval_TIME_number": 26,
"eval_TIME_precision": 0.7241379310344828,
"eval_TIME_recall": 0.8076923076923077,
"eval_loss": 0.14869406819343567,
"eval_overall_accuracy": 0.9587190392794596,
"eval_overall_f1": 0.819538670284939,
"eval_overall_precision": 0.7587939698492462,
"eval_overall_recall": 0.8908554572271387,
"eval_runtime": 0.3746,
"eval_samples_per_second": 499.2,
"eval_steps_per_second": 8.009,
"step": 10070
},
{
"epoch": 96.0,
"grad_norm": 0.48421594500541687,
"learning_rate": 2.0000000000000003e-06,
"loss": 0.0733,
"step": 10176
},
{
"epoch": 96.0,
"eval_LOCATION_f1": 0.8051948051948052,
"eval_LOCATION_number": 72,
"eval_LOCATION_precision": 0.7560975609756098,
"eval_LOCATION_recall": 0.8611111111111112,
"eval_ORGANIZATION_f1": 0.7810650887573964,
"eval_ORGANIZATION_number": 75,
"eval_ORGANIZATION_precision": 0.7021276595744681,
"eval_ORGANIZATION_recall": 0.88,
"eval_PERSON_f1": 0.8844884488448846,
"eval_PERSON_number": 143,
"eval_PERSON_precision": 0.8375,
"eval_PERSON_recall": 0.9370629370629371,
"eval_QUANTITY_f1": 0.6071428571428571,
"eval_QUANTITY_number": 23,
"eval_QUANTITY_precision": 0.5151515151515151,
"eval_QUANTITY_recall": 0.7391304347826086,
"eval_TIME_f1": 0.7636363636363636,
"eval_TIME_number": 26,
"eval_TIME_precision": 0.7241379310344828,
"eval_TIME_recall": 0.8076923076923077,
"eval_loss": 0.14902207255363464,
"eval_overall_accuracy": 0.957968476357268,
"eval_overall_f1": 0.814111261872456,
"eval_overall_precision": 0.7537688442211056,
"eval_overall_recall": 0.8849557522123894,
"eval_runtime": 0.3742,
"eval_samples_per_second": 499.722,
"eval_steps_per_second": 8.017,
"step": 10176
},
{
"epoch": 97.0,
"grad_norm": 0.8765180110931396,
"learning_rate": 1.5e-06,
"loss": 0.0721,
"step": 10282
},
{
"epoch": 97.0,
"eval_LOCATION_f1": 0.8051948051948052,
"eval_LOCATION_number": 72,
"eval_LOCATION_precision": 0.7560975609756098,
"eval_LOCATION_recall": 0.8611111111111112,
"eval_ORGANIZATION_f1": 0.7692307692307693,
"eval_ORGANIZATION_number": 75,
"eval_ORGANIZATION_precision": 0.6914893617021277,
"eval_ORGANIZATION_recall": 0.8666666666666667,
"eval_PERSON_f1": 0.8881578947368421,
"eval_PERSON_number": 143,
"eval_PERSON_precision": 0.8385093167701864,
"eval_PERSON_recall": 0.9440559440559441,
"eval_QUANTITY_f1": 0.6428571428571429,
"eval_QUANTITY_number": 23,
"eval_QUANTITY_precision": 0.5454545454545454,
"eval_QUANTITY_recall": 0.782608695652174,
"eval_TIME_f1": 0.7636363636363636,
"eval_TIME_number": 26,
"eval_TIME_precision": 0.7241379310344828,
"eval_TIME_recall": 0.8076923076923077,
"eval_loss": 0.14730840921401978,
"eval_overall_accuracy": 0.9584688516387291,
"eval_overall_f1": 0.8157181571815718,
"eval_overall_precision": 0.7543859649122807,
"eval_overall_recall": 0.887905604719764,
"eval_runtime": 0.3716,
"eval_samples_per_second": 503.173,
"eval_steps_per_second": 8.072,
"step": 10282
},
{
"epoch": 98.0,
"grad_norm": 0.884979784488678,
"learning_rate": 1.0000000000000002e-06,
"loss": 0.0722,
"step": 10388
},
{
"epoch": 98.0,
"eval_LOCATION_f1": 0.8051948051948052,
"eval_LOCATION_number": 72,
"eval_LOCATION_precision": 0.7560975609756098,
"eval_LOCATION_recall": 0.8611111111111112,
"eval_ORGANIZATION_f1": 0.7810650887573964,
"eval_ORGANIZATION_number": 75,
"eval_ORGANIZATION_precision": 0.7021276595744681,
"eval_ORGANIZATION_recall": 0.88,
"eval_PERSON_f1": 0.8881578947368421,
"eval_PERSON_number": 143,
"eval_PERSON_precision": 0.8385093167701864,
"eval_PERSON_recall": 0.9440559440559441,
"eval_QUANTITY_f1": 0.6428571428571429,
"eval_QUANTITY_number": 23,
"eval_QUANTITY_precision": 0.5454545454545454,
"eval_QUANTITY_recall": 0.782608695652174,
"eval_TIME_f1": 0.7636363636363636,
"eval_TIME_number": 26,
"eval_TIME_precision": 0.7241379310344828,
"eval_TIME_recall": 0.8076923076923077,
"eval_loss": 0.14785435795783997,
"eval_overall_accuracy": 0.9589692269201902,
"eval_overall_f1": 0.8184281842818428,
"eval_overall_precision": 0.7568922305764411,
"eval_overall_recall": 0.8908554572271387,
"eval_runtime": 0.3715,
"eval_samples_per_second": 503.38,
"eval_steps_per_second": 8.076,
"step": 10388
},
{
"epoch": 99.0,
"grad_norm": 1.1624181270599365,
"learning_rate": 5.000000000000001e-07,
"loss": 0.0729,
"step": 10494
},
{
"epoch": 99.0,
"eval_LOCATION_f1": 0.8051948051948052,
"eval_LOCATION_number": 72,
"eval_LOCATION_precision": 0.7560975609756098,
"eval_LOCATION_recall": 0.8611111111111112,
"eval_ORGANIZATION_f1": 0.7810650887573964,
"eval_ORGANIZATION_number": 75,
"eval_ORGANIZATION_precision": 0.7021276595744681,
"eval_ORGANIZATION_recall": 0.88,
"eval_PERSON_f1": 0.8881578947368421,
"eval_PERSON_number": 143,
"eval_PERSON_precision": 0.8385093167701864,
"eval_PERSON_recall": 0.9440559440559441,
"eval_QUANTITY_f1": 0.6071428571428571,
"eval_QUANTITY_number": 23,
"eval_QUANTITY_precision": 0.5151515151515151,
"eval_QUANTITY_recall": 0.7391304347826086,
"eval_TIME_f1": 0.7636363636363636,
"eval_TIME_number": 26,
"eval_TIME_precision": 0.7241379310344828,
"eval_TIME_recall": 0.8076923076923077,
"eval_loss": 0.14793308079242706,
"eval_overall_accuracy": 0.9587190392794596,
"eval_overall_f1": 0.8157181571815718,
"eval_overall_precision": 0.7543859649122807,
"eval_overall_recall": 0.887905604719764,
"eval_runtime": 0.3726,
"eval_samples_per_second": 501.877,
"eval_steps_per_second": 8.051,
"step": 10494
},
{
"epoch": 100.0,
"grad_norm": 1.330012559890747,
"learning_rate": 0.0,
"loss": 0.0718,
"step": 10600
},
{
"epoch": 100.0,
"eval_LOCATION_f1": 0.8051948051948052,
"eval_LOCATION_number": 72,
"eval_LOCATION_precision": 0.7560975609756098,
"eval_LOCATION_recall": 0.8611111111111112,
"eval_ORGANIZATION_f1": 0.7810650887573964,
"eval_ORGANIZATION_number": 75,
"eval_ORGANIZATION_precision": 0.7021276595744681,
"eval_ORGANIZATION_recall": 0.88,
"eval_PERSON_f1": 0.8881578947368421,
"eval_PERSON_number": 143,
"eval_PERSON_precision": 0.8385093167701864,
"eval_PERSON_recall": 0.9440559440559441,
"eval_QUANTITY_f1": 0.6428571428571429,
"eval_QUANTITY_number": 23,
"eval_QUANTITY_precision": 0.5454545454545454,
"eval_QUANTITY_recall": 0.782608695652174,
"eval_TIME_f1": 0.7636363636363636,
"eval_TIME_number": 26,
"eval_TIME_precision": 0.7241379310344828,
"eval_TIME_recall": 0.8076923076923077,
"eval_loss": 0.14785712957382202,
"eval_overall_accuracy": 0.9589692269201902,
"eval_overall_f1": 0.8184281842818428,
"eval_overall_precision": 0.7568922305764411,
"eval_overall_recall": 0.8908554572271387,
"eval_runtime": 0.3703,
"eval_samples_per_second": 504.948,
"eval_steps_per_second": 8.101,
"step": 10600
},
{
"epoch": 100.0,
"step": 10600,
"total_flos": 4533533359897542.0,
"train_loss": 0.12740072155898471,
"train_runtime": 632.9493,
"train_samples_per_second": 266.53,
"train_steps_per_second": 16.747
}
],
"logging_steps": 500,
"max_steps": 10600,
"num_input_tokens_seen": 0,
"num_train_epochs": 100,
"save_steps": 500,
"total_flos": 4533533359897542.0,
"train_batch_size": 16,
"trial_name": null,
"trial_params": null
}