{ "best_metric": null, "best_model_checkpoint": null, "epoch": 100.0, "eval_steps": 500, "global_step": 10600, "is_hyper_param_search": false, "is_local_process_zero": true, "is_world_process_zero": true, "log_history": [ { "epoch": 1.0, "grad_norm": 1.7605067491531372, "learning_rate": 4.9500000000000004e-05, "loss": 0.9861, "step": 106 }, { "epoch": 1.0, "eval_LOCATION_f1": 0.0, "eval_LOCATION_number": 72, "eval_LOCATION_precision": 0.0, "eval_LOCATION_recall": 0.0, "eval_ORGANIZATION_f1": 0.0, "eval_ORGANIZATION_number": 75, "eval_ORGANIZATION_precision": 0.0, "eval_ORGANIZATION_recall": 0.0, "eval_PERSON_f1": 0.012820512820512822, "eval_PERSON_number": 143, "eval_PERSON_precision": 0.07692307692307693, "eval_PERSON_recall": 0.006993006993006993, "eval_QUANTITY_f1": 0.0, "eval_QUANTITY_number": 23, "eval_QUANTITY_precision": 0.0, "eval_QUANTITY_recall": 0.0, "eval_TIME_f1": 0.0, "eval_TIME_number": 26, "eval_TIME_precision": 0.0, "eval_TIME_recall": 0.0, "eval_loss": 0.5554673075675964, "eval_overall_accuracy": 0.8468851638729047, "eval_overall_f1": 0.0055248618784530384, "eval_overall_precision": 0.043478260869565216, "eval_overall_recall": 0.0029498525073746312, "eval_runtime": 0.9128, "eval_samples_per_second": 204.873, "eval_steps_per_second": 3.287, "step": 106 }, { "epoch": 2.0, "grad_norm": 1.7613551616668701, "learning_rate": 4.9e-05, "loss": 0.5078, "step": 212 }, { "epoch": 2.0, "eval_LOCATION_f1": 0.2150537634408602, "eval_LOCATION_number": 72, "eval_LOCATION_precision": 0.47619047619047616, "eval_LOCATION_recall": 0.1388888888888889, "eval_ORGANIZATION_f1": 0.019417475728155338, "eval_ORGANIZATION_number": 75, "eval_ORGANIZATION_precision": 0.03571428571428571, "eval_ORGANIZATION_recall": 0.013333333333333334, "eval_PERSON_f1": 0.6392961876832844, "eval_PERSON_number": 143, "eval_PERSON_precision": 0.5505050505050505, "eval_PERSON_recall": 0.7622377622377622, "eval_QUANTITY_f1": 0.0, "eval_QUANTITY_number": 23, "eval_QUANTITY_precision": 0.0, "eval_QUANTITY_recall": 0.0, "eval_TIME_f1": 0.6206896551724138, "eval_TIME_number": 26, "eval_TIME_precision": 0.5625, "eval_TIME_recall": 0.6923076923076923, "eval_loss": 0.3412609398365021, "eval_overall_accuracy": 0.8961721290968226, "eval_overall_f1": 0.43740095087163233, "eval_overall_precision": 0.4726027397260274, "eval_overall_recall": 0.40707964601769914, "eval_runtime": 0.9577, "eval_samples_per_second": 195.257, "eval_steps_per_second": 3.132, "step": 212 }, { "epoch": 3.0, "grad_norm": 1.2087492942810059, "learning_rate": 4.85e-05, "loss": 0.3115, "step": 318 }, { "epoch": 3.0, "eval_LOCATION_f1": 0.5696969696969698, "eval_LOCATION_number": 72, "eval_LOCATION_precision": 0.5053763440860215, "eval_LOCATION_recall": 0.6527777777777778, "eval_ORGANIZATION_f1": 0.5125628140703519, "eval_ORGANIZATION_number": 75, "eval_ORGANIZATION_precision": 0.4112903225806452, "eval_ORGANIZATION_recall": 0.68, "eval_PERSON_f1": 0.8231511254019294, "eval_PERSON_number": 143, "eval_PERSON_precision": 0.7619047619047619, "eval_PERSON_recall": 0.8951048951048951, "eval_QUANTITY_f1": 0.4590163934426229, "eval_QUANTITY_number": 23, "eval_QUANTITY_precision": 0.3684210526315789, "eval_QUANTITY_recall": 0.6086956521739131, "eval_TIME_f1": 0.7777777777777779, "eval_TIME_number": 26, "eval_TIME_precision": 0.75, "eval_TIME_recall": 0.8076923076923077, "eval_loss": 0.22766432166099548, "eval_overall_accuracy": 0.9256942707030272, "eval_overall_f1": 0.6607594936708862, "eval_overall_precision": 0.5787139689578714, "eval_overall_recall": 0.7699115044247787, "eval_runtime": 0.9809, "eval_samples_per_second": 190.638, "eval_steps_per_second": 3.058, "step": 318 }, { "epoch": 4.0, "grad_norm": 0.9383460283279419, "learning_rate": 4.8e-05, "loss": 0.2203, "step": 424 }, { "epoch": 4.0, "eval_LOCATION_f1": 0.6993865030674847, "eval_LOCATION_number": 72, "eval_LOCATION_precision": 0.6263736263736264, "eval_LOCATION_recall": 0.7916666666666666, "eval_ORGANIZATION_f1": 0.6162790697674418, "eval_ORGANIZATION_number": 75, "eval_ORGANIZATION_precision": 0.5463917525773195, "eval_ORGANIZATION_recall": 0.7066666666666667, "eval_PERSON_f1": 0.8498402555910544, "eval_PERSON_number": 143, "eval_PERSON_precision": 0.7823529411764706, "eval_PERSON_recall": 0.9300699300699301, "eval_QUANTITY_f1": 0.410958904109589, "eval_QUANTITY_number": 23, "eval_QUANTITY_precision": 0.3, "eval_QUANTITY_recall": 0.6521739130434783, "eval_TIME_f1": 0.7419354838709676, "eval_TIME_number": 26, "eval_TIME_precision": 0.6388888888888888, "eval_TIME_recall": 0.8846153846153846, "eval_loss": 0.21552342176437378, "eval_overall_accuracy": 0.9316987740805605, "eval_overall_f1": 0.7177522349936143, "eval_overall_precision": 0.6328828828828829, "eval_overall_recall": 0.8289085545722714, "eval_runtime": 0.9352, "eval_samples_per_second": 199.955, "eval_steps_per_second": 3.208, "step": 424 }, { "epoch": 5.0, "grad_norm": 2.1988296508789062, "learning_rate": 4.75e-05, "loss": 0.1816, "step": 530 }, { "epoch": 5.0, "eval_LOCATION_f1": 0.7516778523489932, "eval_LOCATION_number": 72, "eval_LOCATION_precision": 0.7272727272727273, "eval_LOCATION_recall": 0.7777777777777778, "eval_ORGANIZATION_f1": 0.6553672316384181, "eval_ORGANIZATION_number": 75, "eval_ORGANIZATION_precision": 0.5686274509803921, "eval_ORGANIZATION_recall": 0.7733333333333333, "eval_PERSON_f1": 0.8794788273615636, "eval_PERSON_number": 143, "eval_PERSON_precision": 0.823170731707317, "eval_PERSON_recall": 0.9440559440559441, "eval_QUANTITY_f1": 0.7142857142857143, "eval_QUANTITY_number": 23, "eval_QUANTITY_precision": 0.6060606060606061, "eval_QUANTITY_recall": 0.8695652173913043, "eval_TIME_f1": 0.9230769230769231, "eval_TIME_number": 26, "eval_TIME_precision": 0.9230769230769231, "eval_TIME_recall": 0.9230769230769231, "eval_loss": 0.15413647890090942, "eval_overall_accuracy": 0.9489617212909682, "eval_overall_f1": 0.7908232118758435, "eval_overall_precision": 0.7288557213930348, "eval_overall_recall": 0.8643067846607669, "eval_runtime": 0.9063, "eval_samples_per_second": 206.339, "eval_steps_per_second": 3.31, "step": 530 }, { "epoch": 6.0, "grad_norm": 0.9543836116790771, "learning_rate": 4.7e-05, "loss": 0.1655, "step": 636 }, { "epoch": 6.0, "eval_LOCATION_f1": 0.7317073170731708, "eval_LOCATION_number": 72, "eval_LOCATION_precision": 0.6521739130434783, "eval_LOCATION_recall": 0.8333333333333334, "eval_ORGANIZATION_f1": 0.7078651685393258, "eval_ORGANIZATION_number": 75, "eval_ORGANIZATION_precision": 0.6116504854368932, "eval_ORGANIZATION_recall": 0.84, "eval_PERSON_f1": 0.8918032786885245, "eval_PERSON_number": 143, "eval_PERSON_precision": 0.8395061728395061, "eval_PERSON_recall": 0.951048951048951, "eval_QUANTITY_f1": 0.6909090909090908, "eval_QUANTITY_number": 23, "eval_QUANTITY_precision": 0.59375, "eval_QUANTITY_recall": 0.8260869565217391, "eval_TIME_f1": 0.7241379310344829, "eval_TIME_number": 26, "eval_TIME_precision": 0.65625, "eval_TIME_recall": 0.8076923076923077, "eval_loss": 0.15523788332939148, "eval_overall_accuracy": 0.9504628471353516, "eval_overall_f1": 0.7868421052631579, "eval_overall_precision": 0.7102137767220903, "eval_overall_recall": 0.8820058997050148, "eval_runtime": 0.9116, "eval_samples_per_second": 205.138, "eval_steps_per_second": 3.291, "step": 636 }, { "epoch": 7.0, "grad_norm": 0.4434598982334137, "learning_rate": 4.6500000000000005e-05, "loss": 0.1513, "step": 742 }, { "epoch": 7.0, "eval_LOCATION_f1": 0.7631578947368423, "eval_LOCATION_number": 72, "eval_LOCATION_precision": 0.725, "eval_LOCATION_recall": 0.8055555555555556, "eval_ORGANIZATION_f1": 0.7111111111111111, "eval_ORGANIZATION_number": 75, "eval_ORGANIZATION_precision": 0.6095238095238096, "eval_ORGANIZATION_recall": 0.8533333333333334, "eval_PERSON_f1": 0.8758169934640523, "eval_PERSON_number": 143, "eval_PERSON_precision": 0.8220858895705522, "eval_PERSON_recall": 0.9370629370629371, "eval_QUANTITY_f1": 0.7017543859649124, "eval_QUANTITY_number": 23, "eval_QUANTITY_precision": 0.5882352941176471, "eval_QUANTITY_recall": 0.8695652173913043, "eval_TIME_f1": 0.7142857142857142, "eval_TIME_number": 26, "eval_TIME_precision": 0.6666666666666666, "eval_TIME_recall": 0.7692307692307693, "eval_loss": 0.14643213152885437, "eval_overall_accuracy": 0.952964723542657, "eval_overall_f1": 0.7882822902796273, "eval_overall_precision": 0.7184466019417476, "eval_overall_recall": 0.8731563421828908, "eval_runtime": 0.9227, "eval_samples_per_second": 202.669, "eval_steps_per_second": 3.251, "step": 742 }, { "epoch": 8.0, "grad_norm": 0.7223401069641113, "learning_rate": 4.600000000000001e-05, "loss": 0.1403, "step": 848 }, { "epoch": 8.0, "eval_LOCATION_f1": 0.7549668874172185, "eval_LOCATION_number": 72, "eval_LOCATION_precision": 0.7215189873417721, "eval_LOCATION_recall": 0.7916666666666666, "eval_ORGANIZATION_f1": 0.7093023255813953, "eval_ORGANIZATION_number": 75, "eval_ORGANIZATION_precision": 0.6288659793814433, "eval_ORGANIZATION_recall": 0.8133333333333334, "eval_PERSON_f1": 0.8829431438127091, "eval_PERSON_number": 143, "eval_PERSON_precision": 0.8461538461538461, "eval_PERSON_recall": 0.9230769230769231, "eval_QUANTITY_f1": 0.7272727272727273, "eval_QUANTITY_number": 23, "eval_QUANTITY_precision": 0.625, "eval_QUANTITY_recall": 0.8695652173913043, "eval_TIME_f1": 0.6779661016949152, "eval_TIME_number": 26, "eval_TIME_precision": 0.6060606060606061, "eval_TIME_recall": 0.7692307692307693, "eval_loss": 0.14050298929214478, "eval_overall_accuracy": 0.9542156617463098, "eval_overall_f1": 0.7880434782608694, "eval_overall_precision": 0.7304785894206549, "eval_overall_recall": 0.855457227138643, "eval_runtime": 0.9407, "eval_samples_per_second": 198.786, "eval_steps_per_second": 3.189, "step": 848 }, { "epoch": 9.0, "grad_norm": 1.0728905200958252, "learning_rate": 4.55e-05, "loss": 0.138, "step": 954 }, { "epoch": 9.0, "eval_LOCATION_f1": 0.8079470198675496, "eval_LOCATION_number": 72, "eval_LOCATION_precision": 0.7721518987341772, "eval_LOCATION_recall": 0.8472222222222222, "eval_ORGANIZATION_f1": 0.711864406779661, "eval_ORGANIZATION_number": 75, "eval_ORGANIZATION_precision": 0.6176470588235294, "eval_ORGANIZATION_recall": 0.84, "eval_PERSON_f1": 0.9066666666666667, "eval_PERSON_number": 143, "eval_PERSON_precision": 0.8662420382165605, "eval_PERSON_recall": 0.951048951048951, "eval_QUANTITY_f1": 0.7169811320754716, "eval_QUANTITY_number": 23, "eval_QUANTITY_precision": 0.6333333333333333, "eval_QUANTITY_recall": 0.8260869565217391, "eval_TIME_f1": 0.75, "eval_TIME_number": 26, "eval_TIME_precision": 0.7, "eval_TIME_recall": 0.8076923076923077, "eval_loss": 0.14766837656497955, "eval_overall_accuracy": 0.9527145359019265, "eval_overall_f1": 0.814111261872456, "eval_overall_precision": 0.7537688442211056, "eval_overall_recall": 0.8849557522123894, "eval_runtime": 0.9393, "eval_samples_per_second": 199.079, "eval_steps_per_second": 3.194, "step": 954 }, { "epoch": 10.0, "grad_norm": 2.3210840225219727, "learning_rate": 4.5e-05, "loss": 0.1301, "step": 1060 }, { "epoch": 10.0, "eval_LOCATION_f1": 0.8, "eval_LOCATION_number": 72, "eval_LOCATION_precision": 0.7692307692307693, "eval_LOCATION_recall": 0.8333333333333334, "eval_ORGANIZATION_f1": 0.7349397590361445, "eval_ORGANIZATION_number": 75, "eval_ORGANIZATION_precision": 0.6703296703296703, "eval_ORGANIZATION_recall": 0.8133333333333334, "eval_PERSON_f1": 0.8940397350993377, "eval_PERSON_number": 143, "eval_PERSON_precision": 0.8490566037735849, "eval_PERSON_recall": 0.9440559440559441, "eval_QUANTITY_f1": 0.6666666666666667, "eval_QUANTITY_number": 23, "eval_QUANTITY_precision": 0.5588235294117647, "eval_QUANTITY_recall": 0.8260869565217391, "eval_TIME_f1": 0.75, "eval_TIME_number": 26, "eval_TIME_precision": 0.7, "eval_TIME_recall": 0.8076923076923077, "eval_loss": 0.13562895357608795, "eval_overall_accuracy": 0.9564673505128847, "eval_overall_f1": 0.8098495212038302, "eval_overall_precision": 0.7551020408163265, "eval_overall_recall": 0.8731563421828908, "eval_runtime": 0.9309, "eval_samples_per_second": 200.881, "eval_steps_per_second": 3.223, "step": 1060 }, { "epoch": 11.0, "grad_norm": 0.8354237675666809, "learning_rate": 4.4500000000000004e-05, "loss": 0.12, "step": 1166 }, { "epoch": 11.0, "eval_LOCATION_f1": 0.7733333333333334, "eval_LOCATION_number": 72, "eval_LOCATION_precision": 0.7435897435897436, "eval_LOCATION_recall": 0.8055555555555556, "eval_ORGANIZATION_f1": 0.7682926829268292, "eval_ORGANIZATION_number": 75, "eval_ORGANIZATION_precision": 0.7078651685393258, "eval_ORGANIZATION_recall": 0.84, "eval_PERSON_f1": 0.8926174496644295, "eval_PERSON_number": 143, "eval_PERSON_precision": 0.8580645161290322, "eval_PERSON_recall": 0.9300699300699301, "eval_QUANTITY_f1": 0.7037037037037037, "eval_QUANTITY_number": 23, "eval_QUANTITY_precision": 0.6129032258064516, "eval_QUANTITY_recall": 0.8260869565217391, "eval_TIME_f1": 0.7636363636363636, "eval_TIME_number": 26, "eval_TIME_precision": 0.7241379310344828, "eval_TIME_recall": 0.8076923076923077, "eval_loss": 0.12984243035316467, "eval_overall_accuracy": 0.9587190392794596, "eval_overall_f1": 0.8155339805825244, "eval_overall_precision": 0.7696335078534031, "eval_overall_recall": 0.8672566371681416, "eval_runtime": 0.9242, "eval_samples_per_second": 202.333, "eval_steps_per_second": 3.246, "step": 1166 }, { "epoch": 12.0, "grad_norm": 2.3830783367156982, "learning_rate": 4.4000000000000006e-05, "loss": 0.1171, "step": 1272 }, { "epoch": 12.0, "eval_LOCATION_f1": 0.7945205479452055, "eval_LOCATION_number": 72, "eval_LOCATION_precision": 0.7837837837837838, "eval_LOCATION_recall": 0.8055555555555556, "eval_ORGANIZATION_f1": 0.7195121951219511, "eval_ORGANIZATION_number": 75, "eval_ORGANIZATION_precision": 0.6629213483146067, "eval_ORGANIZATION_recall": 0.7866666666666666, "eval_PERSON_f1": 0.8844884488448846, "eval_PERSON_number": 143, "eval_PERSON_precision": 0.8375, "eval_PERSON_recall": 0.9370629370629371, "eval_QUANTITY_f1": 0.6428571428571429, "eval_QUANTITY_number": 23, "eval_QUANTITY_precision": 0.5454545454545454, "eval_QUANTITY_recall": 0.782608695652174, "eval_TIME_f1": 0.8461538461538461, "eval_TIME_number": 26, "eval_TIME_precision": 0.8461538461538461, "eval_TIME_recall": 0.8461538461538461, "eval_loss": 0.13061821460723877, "eval_overall_accuracy": 0.9574681010758068, "eval_overall_f1": 0.8072122052704578, "eval_overall_precision": 0.7617801047120419, "eval_overall_recall": 0.8584070796460177, "eval_runtime": 0.9196, "eval_samples_per_second": 203.355, "eval_steps_per_second": 3.262, "step": 1272 }, { "epoch": 13.0, "grad_norm": 0.5705311894416809, "learning_rate": 4.35e-05, "loss": 0.1129, "step": 1378 }, { "epoch": 13.0, "eval_LOCATION_f1": 0.781456953642384, "eval_LOCATION_number": 72, "eval_LOCATION_precision": 0.7468354430379747, "eval_LOCATION_recall": 0.8194444444444444, "eval_ORGANIZATION_f1": 0.7597765363128492, "eval_ORGANIZATION_number": 75, "eval_ORGANIZATION_precision": 0.6538461538461539, "eval_ORGANIZATION_recall": 0.9066666666666666, "eval_PERSON_f1": 0.8940397350993377, "eval_PERSON_number": 143, "eval_PERSON_precision": 0.8490566037735849, "eval_PERSON_recall": 0.9440559440559441, "eval_QUANTITY_f1": 0.7142857142857143, "eval_QUANTITY_number": 23, "eval_QUANTITY_precision": 0.6060606060606061, "eval_QUANTITY_recall": 0.8695652173913043, "eval_TIME_f1": 0.7857142857142856, "eval_TIME_number": 26, "eval_TIME_precision": 0.7333333333333333, "eval_TIME_recall": 0.8461538461538461, "eval_loss": 0.13694216310977936, "eval_overall_accuracy": 0.9564673505128847, "eval_overall_f1": 0.8172043010752689, "eval_overall_precision": 0.7506172839506173, "eval_overall_recall": 0.8967551622418879, "eval_runtime": 0.9213, "eval_samples_per_second": 202.983, "eval_steps_per_second": 3.256, "step": 1378 }, { "epoch": 14.0, "grad_norm": 1.2299761772155762, "learning_rate": 4.3e-05, "loss": 0.1076, "step": 1484 }, { "epoch": 14.0, "eval_LOCATION_f1": 0.7919463087248323, "eval_LOCATION_number": 72, "eval_LOCATION_precision": 0.7662337662337663, "eval_LOCATION_recall": 0.8194444444444444, "eval_ORGANIZATION_f1": 0.7613636363636365, "eval_ORGANIZATION_number": 75, "eval_ORGANIZATION_precision": 0.6633663366336634, "eval_ORGANIZATION_recall": 0.8933333333333333, "eval_PERSON_f1": 0.8910891089108911, "eval_PERSON_number": 143, "eval_PERSON_precision": 0.84375, "eval_PERSON_recall": 0.9440559440559441, "eval_QUANTITY_f1": 0.6206896551724138, "eval_QUANTITY_number": 23, "eval_QUANTITY_precision": 0.5142857142857142, "eval_QUANTITY_recall": 0.782608695652174, "eval_TIME_f1": 0.7241379310344829, "eval_TIME_number": 26, "eval_TIME_precision": 0.65625, "eval_TIME_recall": 0.8076923076923077, "eval_loss": 0.1426171064376831, "eval_overall_accuracy": 0.9524643482611959, "eval_overall_f1": 0.8064516129032259, "eval_overall_precision": 0.7407407407407407, "eval_overall_recall": 0.8849557522123894, "eval_runtime": 0.9372, "eval_samples_per_second": 199.528, "eval_steps_per_second": 3.201, "step": 1484 }, { "epoch": 15.0, "grad_norm": 0.628875732421875, "learning_rate": 4.25e-05, "loss": 0.1056, "step": 1590 }, { "epoch": 15.0, "eval_LOCATION_f1": 0.8082191780821918, "eval_LOCATION_number": 72, "eval_LOCATION_precision": 0.7972972972972973, "eval_LOCATION_recall": 0.8194444444444444, "eval_ORGANIZATION_f1": 0.7674418604651163, "eval_ORGANIZATION_number": 75, "eval_ORGANIZATION_precision": 0.6804123711340206, "eval_ORGANIZATION_recall": 0.88, "eval_PERSON_f1": 0.8859060402684563, "eval_PERSON_number": 143, "eval_PERSON_precision": 0.8516129032258064, "eval_PERSON_recall": 0.9230769230769231, "eval_QUANTITY_f1": 0.6181818181818182, "eval_QUANTITY_number": 23, "eval_QUANTITY_precision": 0.53125, "eval_QUANTITY_recall": 0.7391304347826086, "eval_TIME_f1": 0.8214285714285715, "eval_TIME_number": 26, "eval_TIME_precision": 0.7666666666666667, "eval_TIME_recall": 0.8846153846153846, "eval_loss": 0.1336900293827057, "eval_overall_accuracy": 0.9569677257943457, "eval_overall_f1": 0.8170563961485556, "eval_overall_precision": 0.7654639175257731, "eval_overall_recall": 0.8761061946902655, "eval_runtime": 0.9357, "eval_samples_per_second": 199.851, "eval_steps_per_second": 3.206, "step": 1590 }, { "epoch": 16.0, "grad_norm": 0.9760724902153015, "learning_rate": 4.2e-05, "loss": 0.1003, "step": 1696 }, { "epoch": 16.0, "eval_LOCATION_f1": 0.8133333333333332, "eval_LOCATION_number": 72, "eval_LOCATION_precision": 0.782051282051282, "eval_LOCATION_recall": 0.8472222222222222, "eval_ORGANIZATION_f1": 0.7657142857142857, "eval_ORGANIZATION_number": 75, "eval_ORGANIZATION_precision": 0.67, "eval_ORGANIZATION_recall": 0.8933333333333333, "eval_PERSON_f1": 0.8963210702341137, "eval_PERSON_number": 143, "eval_PERSON_precision": 0.8589743589743589, "eval_PERSON_recall": 0.9370629370629371, "eval_QUANTITY_f1": 0.6785714285714286, "eval_QUANTITY_number": 23, "eval_QUANTITY_precision": 0.5757575757575758, "eval_QUANTITY_recall": 0.8260869565217391, "eval_TIME_f1": 0.75, "eval_TIME_number": 26, "eval_TIME_precision": 0.7, "eval_TIME_recall": 0.8076923076923077, "eval_loss": 0.145399808883667, "eval_overall_accuracy": 0.9574681010758068, "eval_overall_f1": 0.8206521739130435, "eval_overall_precision": 0.760705289672544, "eval_overall_recall": 0.8908554572271387, "eval_runtime": 0.9425, "eval_samples_per_second": 198.413, "eval_steps_per_second": 3.183, "step": 1696 }, { "epoch": 17.0, "grad_norm": 0.18460078537464142, "learning_rate": 4.15e-05, "loss": 0.0997, "step": 1802 }, { "epoch": 17.0, "eval_LOCATION_f1": 0.8, "eval_LOCATION_number": 72, "eval_LOCATION_precision": 0.7692307692307693, "eval_LOCATION_recall": 0.8333333333333334, "eval_ORGANIZATION_f1": 0.7602339181286549, "eval_ORGANIZATION_number": 75, "eval_ORGANIZATION_precision": 0.6770833333333334, "eval_ORGANIZATION_recall": 0.8666666666666667, "eval_PERSON_f1": 0.8851351351351351, "eval_PERSON_number": 143, "eval_PERSON_precision": 0.8562091503267973, "eval_PERSON_recall": 0.916083916083916, "eval_QUANTITY_f1": 0.6428571428571429, "eval_QUANTITY_number": 23, "eval_QUANTITY_precision": 0.5454545454545454, "eval_QUANTITY_recall": 0.782608695652174, "eval_TIME_f1": 0.7272727272727274, "eval_TIME_number": 26, "eval_TIME_precision": 0.6896551724137931, "eval_TIME_recall": 0.7692307692307693, "eval_loss": 0.1395619809627533, "eval_overall_accuracy": 0.955716787590693, "eval_overall_f1": 0.8076923076923076, "eval_overall_precision": 0.7557840616966581, "eval_overall_recall": 0.8672566371681416, "eval_runtime": 0.923, "eval_samples_per_second": 202.596, "eval_steps_per_second": 3.25, "step": 1802 }, { "epoch": 18.0, "grad_norm": 0.43792226910591125, "learning_rate": 4.1e-05, "loss": 0.0956, "step": 1908 }, { "epoch": 18.0, "eval_LOCATION_f1": 0.8169014084507044, "eval_LOCATION_number": 72, "eval_LOCATION_precision": 0.8285714285714286, "eval_LOCATION_recall": 0.8055555555555556, "eval_ORGANIZATION_f1": 0.726190476190476, "eval_ORGANIZATION_number": 75, "eval_ORGANIZATION_precision": 0.6559139784946236, "eval_ORGANIZATION_recall": 0.8133333333333334, "eval_PERSON_f1": 0.8926174496644295, "eval_PERSON_number": 143, "eval_PERSON_precision": 0.8580645161290322, "eval_PERSON_recall": 0.9300699300699301, "eval_QUANTITY_f1": 0.6909090909090908, "eval_QUANTITY_number": 23, "eval_QUANTITY_precision": 0.59375, "eval_QUANTITY_recall": 0.8260869565217391, "eval_TIME_f1": 0.7636363636363636, "eval_TIME_number": 26, "eval_TIME_precision": 0.7241379310344828, "eval_TIME_recall": 0.8076923076923077, "eval_loss": 0.13341191411018372, "eval_overall_accuracy": 0.9587190392794596, "eval_overall_f1": 0.8133704735376045, "eval_overall_precision": 0.7704485488126649, "eval_overall_recall": 0.8613569321533924, "eval_runtime": 0.9563, "eval_samples_per_second": 195.551, "eval_steps_per_second": 3.137, "step": 1908 }, { "epoch": 19.0, "grad_norm": 0.8807380795478821, "learning_rate": 4.05e-05, "loss": 0.0906, "step": 2014 }, { "epoch": 19.0, "eval_LOCATION_f1": 0.8, "eval_LOCATION_number": 72, "eval_LOCATION_precision": 0.7945205479452054, "eval_LOCATION_recall": 0.8055555555555556, "eval_ORGANIZATION_f1": 0.7542857142857142, "eval_ORGANIZATION_number": 75, "eval_ORGANIZATION_precision": 0.66, "eval_ORGANIZATION_recall": 0.88, "eval_PERSON_f1": 0.8926174496644295, "eval_PERSON_number": 143, "eval_PERSON_precision": 0.8580645161290322, "eval_PERSON_recall": 0.9300699300699301, "eval_QUANTITY_f1": 0.6428571428571429, "eval_QUANTITY_number": 23, "eval_QUANTITY_precision": 0.5454545454545454, "eval_QUANTITY_recall": 0.782608695652174, "eval_TIME_f1": 0.7636363636363636, "eval_TIME_number": 26, "eval_TIME_precision": 0.7241379310344828, "eval_TIME_recall": 0.8076923076923077, "eval_loss": 0.13378730416297913, "eval_overall_accuracy": 0.9572179134350763, "eval_overall_f1": 0.8120713305898491, "eval_overall_precision": 0.7589743589743589, "eval_overall_recall": 0.8731563421828908, "eval_runtime": 0.9383, "eval_samples_per_second": 199.303, "eval_steps_per_second": 3.197, "step": 2014 }, { "epoch": 20.0, "grad_norm": 0.726658046245575, "learning_rate": 4e-05, "loss": 0.0876, "step": 2120 }, { "epoch": 20.0, "eval_LOCATION_f1": 0.8187919463087249, "eval_LOCATION_number": 72, "eval_LOCATION_precision": 0.7922077922077922, "eval_LOCATION_recall": 0.8472222222222222, "eval_ORGANIZATION_f1": 0.7727272727272727, "eval_ORGANIZATION_number": 75, "eval_ORGANIZATION_precision": 0.6732673267326733, "eval_ORGANIZATION_recall": 0.9066666666666666, "eval_PERSON_f1": 0.881578947368421, "eval_PERSON_number": 143, "eval_PERSON_precision": 0.8322981366459627, "eval_PERSON_recall": 0.9370629370629371, "eval_QUANTITY_f1": 0.6909090909090908, "eval_QUANTITY_number": 23, "eval_QUANTITY_precision": 0.59375, "eval_QUANTITY_recall": 0.8260869565217391, "eval_TIME_f1": 0.7636363636363636, "eval_TIME_number": 26, "eval_TIME_precision": 0.7241379310344828, "eval_TIME_recall": 0.8076923076923077, "eval_loss": 0.1531873345375061, "eval_overall_accuracy": 0.9564673505128847, "eval_overall_f1": 0.8200270635994586, "eval_overall_precision": 0.7575, "eval_overall_recall": 0.8938053097345132, "eval_runtime": 0.9428, "eval_samples_per_second": 198.355, "eval_steps_per_second": 3.182, "step": 2120 }, { "epoch": 21.0, "grad_norm": 1.286189317703247, "learning_rate": 3.9500000000000005e-05, "loss": 0.0841, "step": 2226 }, { "epoch": 21.0, "eval_LOCATION_f1": 0.8079470198675496, "eval_LOCATION_number": 72, "eval_LOCATION_precision": 0.7721518987341772, "eval_LOCATION_recall": 0.8472222222222222, "eval_ORGANIZATION_f1": 0.7560975609756098, "eval_ORGANIZATION_number": 75, "eval_ORGANIZATION_precision": 0.6966292134831461, "eval_ORGANIZATION_recall": 0.8266666666666667, "eval_PERSON_f1": 0.8866666666666668, "eval_PERSON_number": 143, "eval_PERSON_precision": 0.8471337579617835, "eval_PERSON_recall": 0.9300699300699301, "eval_QUANTITY_f1": 0.6428571428571429, "eval_QUANTITY_number": 23, "eval_QUANTITY_precision": 0.5454545454545454, "eval_QUANTITY_recall": 0.782608695652174, "eval_TIME_f1": 0.7636363636363636, "eval_TIME_number": 26, "eval_TIME_precision": 0.7241379310344828, "eval_TIME_recall": 0.8076923076923077, "eval_loss": 0.1474735289812088, "eval_overall_accuracy": 0.9567175381536153, "eval_overall_f1": 0.8126721763085399, "eval_overall_precision": 0.7622739018087855, "eval_overall_recall": 0.8702064896755162, "eval_runtime": 0.9368, "eval_samples_per_second": 199.611, "eval_steps_per_second": 3.202, "step": 2226 }, { "epoch": 22.0, "grad_norm": 0.40452536940574646, "learning_rate": 3.9000000000000006e-05, "loss": 0.0842, "step": 2332 }, { "epoch": 22.0, "eval_LOCATION_f1": 0.8133333333333332, "eval_LOCATION_number": 72, "eval_LOCATION_precision": 0.782051282051282, "eval_LOCATION_recall": 0.8472222222222222, "eval_ORGANIZATION_f1": 0.7861271676300577, "eval_ORGANIZATION_number": 75, "eval_ORGANIZATION_precision": 0.6938775510204082, "eval_ORGANIZATION_recall": 0.9066666666666666, "eval_PERSON_f1": 0.8970099667774087, "eval_PERSON_number": 143, "eval_PERSON_precision": 0.8544303797468354, "eval_PERSON_recall": 0.9440559440559441, "eval_QUANTITY_f1": 0.6428571428571429, "eval_QUANTITY_number": 23, "eval_QUANTITY_precision": 0.5454545454545454, "eval_QUANTITY_recall": 0.782608695652174, "eval_TIME_f1": 0.7407407407407408, "eval_TIME_number": 26, "eval_TIME_precision": 0.7142857142857143, "eval_TIME_recall": 0.7692307692307693, "eval_loss": 0.13896140456199646, "eval_overall_accuracy": 0.9569677257943457, "eval_overall_f1": 0.8228882833787466, "eval_overall_precision": 0.7645569620253164, "eval_overall_recall": 0.8908554572271387, "eval_runtime": 0.9322, "eval_samples_per_second": 200.611, "eval_steps_per_second": 3.218, "step": 2332 }, { "epoch": 23.0, "grad_norm": 0.6667360663414001, "learning_rate": 3.85e-05, "loss": 0.0798, "step": 2438 }, { "epoch": 23.0, "eval_LOCATION_f1": 0.7945205479452055, "eval_LOCATION_number": 72, "eval_LOCATION_precision": 0.7837837837837838, "eval_LOCATION_recall": 0.8055555555555556, "eval_ORGANIZATION_f1": 0.7666666666666667, "eval_ORGANIZATION_number": 75, "eval_ORGANIZATION_precision": 0.6571428571428571, "eval_ORGANIZATION_recall": 0.92, "eval_PERSON_f1": 0.8933333333333333, "eval_PERSON_number": 143, "eval_PERSON_precision": 0.8535031847133758, "eval_PERSON_recall": 0.9370629370629371, "eval_QUANTITY_f1": 0.631578947368421, "eval_QUANTITY_number": 23, "eval_QUANTITY_precision": 0.5294117647058824, "eval_QUANTITY_recall": 0.782608695652174, "eval_TIME_f1": 0.7777777777777779, "eval_TIME_number": 26, "eval_TIME_precision": 0.75, "eval_TIME_recall": 0.8076923076923077, "eval_loss": 0.15068964660167694, "eval_overall_accuracy": 0.9542156617463098, "eval_overall_f1": 0.814111261872456, "eval_overall_precision": 0.7537688442211056, "eval_overall_recall": 0.8849557522123894, "eval_runtime": 1.0035, "eval_samples_per_second": 186.346, "eval_steps_per_second": 2.99, "step": 2438 }, { "epoch": 24.0, "grad_norm": 0.6917049884796143, "learning_rate": 3.8e-05, "loss": 0.0775, "step": 2544 }, { "epoch": 24.0, "eval_LOCATION_f1": 0.8108108108108109, "eval_LOCATION_number": 72, "eval_LOCATION_precision": 0.7894736842105263, "eval_LOCATION_recall": 0.8333333333333334, "eval_ORGANIZATION_f1": 0.7721518987341773, "eval_ORGANIZATION_number": 75, "eval_ORGANIZATION_precision": 0.7349397590361446, "eval_ORGANIZATION_recall": 0.8133333333333334, "eval_PERSON_f1": 0.8970099667774087, "eval_PERSON_number": 143, "eval_PERSON_precision": 0.8544303797468354, "eval_PERSON_recall": 0.9440559440559441, "eval_QUANTITY_f1": 0.7692307692307693, "eval_QUANTITY_number": 23, "eval_QUANTITY_precision": 0.6896551724137931, "eval_QUANTITY_recall": 0.8695652173913043, "eval_TIME_f1": 0.7636363636363636, "eval_TIME_number": 26, "eval_TIME_precision": 0.7241379310344828, "eval_TIME_recall": 0.8076923076923077, "eval_loss": 0.14417295157909393, "eval_overall_accuracy": 0.9604703527645734, "eval_overall_f1": 0.8319327731092437, "eval_overall_precision": 0.792, "eval_overall_recall": 0.8761061946902655, "eval_runtime": 0.9311, "eval_samples_per_second": 200.829, "eval_steps_per_second": 3.222, "step": 2544 }, { "epoch": 25.0, "grad_norm": 0.38176143169403076, "learning_rate": 3.7500000000000003e-05, "loss": 0.0759, "step": 2650 }, { "epoch": 25.0, "eval_LOCATION_f1": 0.8322147651006712, "eval_LOCATION_number": 72, "eval_LOCATION_precision": 0.8051948051948052, "eval_LOCATION_recall": 0.8611111111111112, "eval_ORGANIZATION_f1": 0.783625730994152, "eval_ORGANIZATION_number": 75, "eval_ORGANIZATION_precision": 0.6979166666666666, "eval_ORGANIZATION_recall": 0.8933333333333333, "eval_PERSON_f1": 0.8963210702341137, "eval_PERSON_number": 143, "eval_PERSON_precision": 0.8589743589743589, "eval_PERSON_recall": 0.9370629370629371, "eval_QUANTITY_f1": 0.6440677966101694, "eval_QUANTITY_number": 23, "eval_QUANTITY_precision": 0.5277777777777778, "eval_QUANTITY_recall": 0.8260869565217391, "eval_TIME_f1": 0.7368421052631579, "eval_TIME_number": 26, "eval_TIME_precision": 0.6774193548387096, "eval_TIME_recall": 0.8076923076923077, "eval_loss": 0.14586655795574188, "eval_overall_accuracy": 0.9582186639979985, "eval_overall_f1": 0.8244897959183674, "eval_overall_precision": 0.7651515151515151, "eval_overall_recall": 0.8938053097345132, "eval_runtime": 0.9333, "eval_samples_per_second": 200.36, "eval_steps_per_second": 3.214, "step": 2650 }, { "epoch": 26.0, "grad_norm": 0.690096914768219, "learning_rate": 3.7e-05, "loss": 0.0731, "step": 2756 }, { "epoch": 26.0, "eval_LOCATION_f1": 0.8, "eval_LOCATION_number": 72, "eval_LOCATION_precision": 0.7945205479452054, "eval_LOCATION_recall": 0.8055555555555556, "eval_ORGANIZATION_f1": 0.7975460122699386, "eval_ORGANIZATION_number": 75, "eval_ORGANIZATION_precision": 0.7386363636363636, "eval_ORGANIZATION_recall": 0.8666666666666667, "eval_PERSON_f1": 0.8940397350993377, "eval_PERSON_number": 143, "eval_PERSON_precision": 0.8490566037735849, "eval_PERSON_recall": 0.9440559440559441, "eval_QUANTITY_f1": 0.7169811320754716, "eval_QUANTITY_number": 23, "eval_QUANTITY_precision": 0.6333333333333333, "eval_QUANTITY_recall": 0.8260869565217391, "eval_TIME_f1": 0.7777777777777779, "eval_TIME_number": 26, "eval_TIME_precision": 0.75, "eval_TIME_recall": 0.8076923076923077, "eval_loss": 0.151327446103096, "eval_overall_accuracy": 0.9587190392794596, "eval_overall_f1": 0.8312412831241284, "eval_overall_precision": 0.7883597883597884, "eval_overall_recall": 0.8790560471976401, "eval_runtime": 0.9254, "eval_samples_per_second": 202.071, "eval_steps_per_second": 3.242, "step": 2756 }, { "epoch": 27.0, "grad_norm": 0.562192440032959, "learning_rate": 3.65e-05, "loss": 0.0714, "step": 2862 }, { "epoch": 27.0, "eval_LOCATION_f1": 0.7891156462585034, "eval_LOCATION_number": 72, "eval_LOCATION_precision": 0.7733333333333333, "eval_LOCATION_recall": 0.8055555555555556, "eval_ORGANIZATION_f1": 0.7654320987654321, "eval_ORGANIZATION_number": 75, "eval_ORGANIZATION_precision": 0.7126436781609196, "eval_ORGANIZATION_recall": 0.8266666666666667, "eval_PERSON_f1": 0.8903654485049833, "eval_PERSON_number": 143, "eval_PERSON_precision": 0.8481012658227848, "eval_PERSON_recall": 0.9370629370629371, "eval_QUANTITY_f1": 0.76, "eval_QUANTITY_number": 23, "eval_QUANTITY_precision": 0.7037037037037037, "eval_QUANTITY_recall": 0.8260869565217391, "eval_TIME_f1": 0.7407407407407408, "eval_TIME_number": 26, "eval_TIME_precision": 0.7142857142857143, "eval_TIME_recall": 0.7692307692307693, "eval_loss": 0.15548019111156464, "eval_overall_accuracy": 0.9577182887165374, "eval_overall_f1": 0.8207282913165266, "eval_overall_precision": 0.7813333333333333, "eval_overall_recall": 0.8643067846607669, "eval_runtime": 0.9366, "eval_samples_per_second": 199.663, "eval_steps_per_second": 3.203, "step": 2862 }, { "epoch": 28.0, "grad_norm": 1.1344366073608398, "learning_rate": 3.6e-05, "loss": 0.0697, "step": 2968 }, { "epoch": 28.0, "eval_LOCATION_f1": 0.7808219178082192, "eval_LOCATION_number": 72, "eval_LOCATION_precision": 0.7702702702702703, "eval_LOCATION_recall": 0.7916666666666666, "eval_ORGANIZATION_f1": 0.7607361963190183, "eval_ORGANIZATION_number": 75, "eval_ORGANIZATION_precision": 0.7045454545454546, "eval_ORGANIZATION_recall": 0.8266666666666667, "eval_PERSON_f1": 0.8993288590604027, "eval_PERSON_number": 143, "eval_PERSON_precision": 0.864516129032258, "eval_PERSON_recall": 0.9370629370629371, "eval_QUANTITY_f1": 0.7450980392156864, "eval_QUANTITY_number": 23, "eval_QUANTITY_precision": 0.6785714285714286, "eval_QUANTITY_recall": 0.8260869565217391, "eval_TIME_f1": 0.7407407407407408, "eval_TIME_number": 26, "eval_TIME_precision": 0.7142857142857143, "eval_TIME_recall": 0.7692307692307693, "eval_loss": 0.14587517082691193, "eval_overall_accuracy": 0.9587190392794596, "eval_overall_f1": 0.8202247191011236, "eval_overall_precision": 0.7828418230563002, "eval_overall_recall": 0.8613569321533924, "eval_runtime": 0.92, "eval_samples_per_second": 203.25, "eval_steps_per_second": 3.261, "step": 2968 }, { "epoch": 29.0, "grad_norm": 0.7924529910087585, "learning_rate": 3.55e-05, "loss": 0.0701, "step": 3074 }, { "epoch": 29.0, "eval_LOCATION_f1": 0.8356164383561645, "eval_LOCATION_number": 72, "eval_LOCATION_precision": 0.8243243243243243, "eval_LOCATION_recall": 0.8472222222222222, "eval_ORGANIZATION_f1": 0.7176470588235295, "eval_ORGANIZATION_number": 75, "eval_ORGANIZATION_precision": 0.6421052631578947, "eval_ORGANIZATION_recall": 0.8133333333333334, "eval_PERSON_f1": 0.8986486486486487, "eval_PERSON_number": 143, "eval_PERSON_precision": 0.869281045751634, "eval_PERSON_recall": 0.9300699300699301, "eval_QUANTITY_f1": 0.5862068965517241, "eval_QUANTITY_number": 23, "eval_QUANTITY_precision": 0.4857142857142857, "eval_QUANTITY_recall": 0.7391304347826086, "eval_TIME_f1": 0.7272727272727274, "eval_TIME_number": 26, "eval_TIME_precision": 0.6896551724137931, "eval_TIME_recall": 0.7692307692307693, "eval_loss": 0.1690864861011505, "eval_overall_accuracy": 0.9532149111833875, "eval_overall_f1": 0.8055172413793102, "eval_overall_precision": 0.7564766839378239, "eval_overall_recall": 0.8613569321533924, "eval_runtime": 0.929, "eval_samples_per_second": 201.295, "eval_steps_per_second": 3.229, "step": 3074 }, { "epoch": 30.0, "grad_norm": 1.1464416980743408, "learning_rate": 3.5e-05, "loss": 0.0678, "step": 3180 }, { "epoch": 30.0, "eval_LOCATION_f1": 0.8251748251748252, "eval_LOCATION_number": 72, "eval_LOCATION_precision": 0.8309859154929577, "eval_LOCATION_recall": 0.8194444444444444, "eval_ORGANIZATION_f1": 0.7484662576687117, "eval_ORGANIZATION_number": 75, "eval_ORGANIZATION_precision": 0.6931818181818182, "eval_ORGANIZATION_recall": 0.8133333333333334, "eval_PERSON_f1": 0.8963210702341137, "eval_PERSON_number": 143, "eval_PERSON_precision": 0.8589743589743589, "eval_PERSON_recall": 0.9370629370629371, "eval_QUANTITY_f1": 0.7450980392156864, "eval_QUANTITY_number": 23, "eval_QUANTITY_precision": 0.6785714285714286, "eval_QUANTITY_recall": 0.8260869565217391, "eval_TIME_f1": 0.7857142857142856, "eval_TIME_number": 26, "eval_TIME_precision": 0.7333333333333333, "eval_TIME_recall": 0.8461538461538461, "eval_loss": 0.14405371248722076, "eval_overall_accuracy": 0.9582186639979985, "eval_overall_f1": 0.8286516853932584, "eval_overall_precision": 0.7908847184986595, "eval_overall_recall": 0.8702064896755162, "eval_runtime": 1.0504, "eval_samples_per_second": 178.034, "eval_steps_per_second": 2.856, "step": 3180 }, { "epoch": 31.0, "grad_norm": 0.38195714354515076, "learning_rate": 3.45e-05, "loss": 0.0658, "step": 3286 }, { "epoch": 31.0, "eval_LOCATION_f1": 0.8322147651006712, "eval_LOCATION_number": 72, "eval_LOCATION_precision": 0.8051948051948052, "eval_LOCATION_recall": 0.8611111111111112, "eval_ORGANIZATION_f1": 0.7861271676300577, "eval_ORGANIZATION_number": 75, "eval_ORGANIZATION_precision": 0.6938775510204082, "eval_ORGANIZATION_recall": 0.9066666666666666, "eval_PERSON_f1": 0.8993288590604027, "eval_PERSON_number": 143, "eval_PERSON_precision": 0.864516129032258, "eval_PERSON_recall": 0.9370629370629371, "eval_QUANTITY_f1": 0.7755102040816326, "eval_QUANTITY_number": 23, "eval_QUANTITY_precision": 0.7307692307692307, "eval_QUANTITY_recall": 0.8260869565217391, "eval_TIME_f1": 0.7407407407407408, "eval_TIME_number": 26, "eval_TIME_precision": 0.7142857142857143, "eval_TIME_recall": 0.7692307692307693, "eval_loss": 0.15743257105350494, "eval_overall_accuracy": 0.9584688516387291, "eval_overall_f1": 0.8381742738589212, "eval_overall_precision": 0.7890625, "eval_overall_recall": 0.8938053097345132, "eval_runtime": 0.9177, "eval_samples_per_second": 203.771, "eval_steps_per_second": 3.269, "step": 3286 }, { "epoch": 32.0, "grad_norm": 0.8308860659599304, "learning_rate": 3.4000000000000007e-05, "loss": 0.0648, "step": 3392 }, { "epoch": 32.0, "eval_LOCATION_f1": 0.8428571428571429, "eval_LOCATION_number": 72, "eval_LOCATION_precision": 0.8676470588235294, "eval_LOCATION_recall": 0.8194444444444444, "eval_ORGANIZATION_f1": 0.7619047619047621, "eval_ORGANIZATION_number": 75, "eval_ORGANIZATION_precision": 0.6881720430107527, "eval_ORGANIZATION_recall": 0.8533333333333334, "eval_PERSON_f1": 0.9016949152542374, "eval_PERSON_number": 143, "eval_PERSON_precision": 0.875, "eval_PERSON_recall": 0.9300699300699301, "eval_QUANTITY_f1": 0.7169811320754716, "eval_QUANTITY_number": 23, "eval_QUANTITY_precision": 0.6333333333333333, "eval_QUANTITY_recall": 0.8260869565217391, "eval_TIME_f1": 0.8, "eval_TIME_number": 26, "eval_TIME_precision": 0.7586206896551724, "eval_TIME_recall": 0.8461538461538461, "eval_loss": 0.1516529768705368, "eval_overall_accuracy": 0.9597197898423818, "eval_overall_f1": 0.8354430379746836, "eval_overall_precision": 0.7983870967741935, "eval_overall_recall": 0.8761061946902655, "eval_runtime": 1.0211, "eval_samples_per_second": 183.135, "eval_steps_per_second": 2.938, "step": 3392 }, { "epoch": 33.0, "grad_norm": 0.37685203552246094, "learning_rate": 3.35e-05, "loss": 0.0626, "step": 3498 }, { "epoch": 33.0, "eval_LOCATION_f1": 0.7945205479452055, "eval_LOCATION_number": 72, "eval_LOCATION_precision": 0.7837837837837838, "eval_LOCATION_recall": 0.8055555555555556, "eval_ORGANIZATION_f1": 0.7810650887573964, "eval_ORGANIZATION_number": 75, "eval_ORGANIZATION_precision": 0.7021276595744681, "eval_ORGANIZATION_recall": 0.88, "eval_PERSON_f1": 0.9016949152542374, "eval_PERSON_number": 143, "eval_PERSON_precision": 0.875, "eval_PERSON_recall": 0.9300699300699301, "eval_QUANTITY_f1": 0.6792452830188679, "eval_QUANTITY_number": 23, "eval_QUANTITY_precision": 0.6, "eval_QUANTITY_recall": 0.782608695652174, "eval_TIME_f1": 0.75, "eval_TIME_number": 26, "eval_TIME_precision": 0.7, "eval_TIME_recall": 0.8076923076923077, "eval_loss": 0.15304860472679138, "eval_overall_accuracy": 0.9584688516387291, "eval_overall_f1": 0.82336578581363, "eval_overall_precision": 0.7789473684210526, "eval_overall_recall": 0.8731563421828908, "eval_runtime": 0.9446, "eval_samples_per_second": 197.961, "eval_steps_per_second": 3.176, "step": 3498 }, { "epoch": 34.0, "grad_norm": 1.1034225225448608, "learning_rate": 3.3e-05, "loss": 0.0631, "step": 3604 }, { "epoch": 34.0, "eval_LOCATION_f1": 0.8378378378378377, "eval_LOCATION_number": 72, "eval_LOCATION_precision": 0.8157894736842105, "eval_LOCATION_recall": 0.8611111111111112, "eval_ORGANIZATION_f1": 0.7953216374269007, "eval_ORGANIZATION_number": 75, "eval_ORGANIZATION_precision": 0.7083333333333334, "eval_ORGANIZATION_recall": 0.9066666666666666, "eval_PERSON_f1": 0.903010033444816, "eval_PERSON_number": 143, "eval_PERSON_precision": 0.8653846153846154, "eval_PERSON_recall": 0.9440559440559441, "eval_QUANTITY_f1": 0.6545454545454547, "eval_QUANTITY_number": 23, "eval_QUANTITY_precision": 0.5625, "eval_QUANTITY_recall": 0.782608695652174, "eval_TIME_f1": 0.7241379310344829, "eval_TIME_number": 26, "eval_TIME_precision": 0.65625, "eval_TIME_recall": 0.8076923076923077, "eval_loss": 0.16854536533355713, "eval_overall_accuracy": 0.9572179134350763, "eval_overall_f1": 0.8317373461012312, "eval_overall_precision": 0.7755102040816326, "eval_overall_recall": 0.8967551622418879, "eval_runtime": 0.937, "eval_samples_per_second": 199.569, "eval_steps_per_second": 3.202, "step": 3604 }, { "epoch": 35.0, "grad_norm": 1.6754740476608276, "learning_rate": 3.2500000000000004e-05, "loss": 0.0598, "step": 3710 }, { "epoch": 35.0, "eval_LOCATION_f1": 0.8707482993197277, "eval_LOCATION_number": 72, "eval_LOCATION_precision": 0.8533333333333334, "eval_LOCATION_recall": 0.8888888888888888, "eval_ORGANIZATION_f1": 0.7784431137724551, "eval_ORGANIZATION_number": 75, "eval_ORGANIZATION_precision": 0.7065217391304348, "eval_ORGANIZATION_recall": 0.8666666666666667, "eval_PERSON_f1": 0.8986486486486487, "eval_PERSON_number": 143, "eval_PERSON_precision": 0.869281045751634, "eval_PERSON_recall": 0.9300699300699301, "eval_QUANTITY_f1": 0.631578947368421, "eval_QUANTITY_number": 23, "eval_QUANTITY_precision": 0.5294117647058824, "eval_QUANTITY_recall": 0.782608695652174, "eval_TIME_f1": 0.7547169811320754, "eval_TIME_number": 26, "eval_TIME_precision": 0.7407407407407407, "eval_TIME_recall": 0.7692307692307693, "eval_loss": 0.1640816181898117, "eval_overall_accuracy": 0.957968476357268, "eval_overall_f1": 0.8333333333333335, "eval_overall_precision": 0.7874015748031497, "eval_overall_recall": 0.8849557522123894, "eval_runtime": 0.9325, "eval_samples_per_second": 200.545, "eval_steps_per_second": 3.217, "step": 3710 }, { "epoch": 36.0, "grad_norm": 0.5667424201965332, "learning_rate": 3.2000000000000005e-05, "loss": 0.06, "step": 3816 }, { "epoch": 36.0, "eval_LOCATION_f1": 0.8053691275167787, "eval_LOCATION_number": 72, "eval_LOCATION_precision": 0.7792207792207793, "eval_LOCATION_recall": 0.8333333333333334, "eval_ORGANIZATION_f1": 0.7738095238095238, "eval_ORGANIZATION_number": 75, "eval_ORGANIZATION_precision": 0.6989247311827957, "eval_ORGANIZATION_recall": 0.8666666666666667, "eval_PERSON_f1": 0.8963210702341137, "eval_PERSON_number": 143, "eval_PERSON_precision": 0.8589743589743589, "eval_PERSON_recall": 0.9370629370629371, "eval_QUANTITY_f1": 0.7346938775510203, "eval_QUANTITY_number": 23, "eval_QUANTITY_precision": 0.6923076923076923, "eval_QUANTITY_recall": 0.782608695652174, "eval_TIME_f1": 0.75, "eval_TIME_number": 26, "eval_TIME_precision": 0.7, "eval_TIME_recall": 0.8076923076923077, "eval_loss": 0.1585589498281479, "eval_overall_accuracy": 0.9589692269201902, "eval_overall_f1": 0.826629680998613, "eval_overall_precision": 0.7801047120418848, "eval_overall_recall": 0.8790560471976401, "eval_runtime": 0.9262, "eval_samples_per_second": 201.894, "eval_steps_per_second": 3.239, "step": 3816 }, { "epoch": 37.0, "grad_norm": 2.2813751697540283, "learning_rate": 3.15e-05, "loss": 0.0564, "step": 3922 }, { "epoch": 37.0, "eval_LOCATION_f1": 0.8322147651006712, "eval_LOCATION_number": 72, "eval_LOCATION_precision": 0.8051948051948052, "eval_LOCATION_recall": 0.8611111111111112, "eval_ORGANIZATION_f1": 0.7701149425287357, "eval_ORGANIZATION_number": 75, "eval_ORGANIZATION_precision": 0.6767676767676768, "eval_ORGANIZATION_recall": 0.8933333333333333, "eval_PERSON_f1": 0.8993288590604027, "eval_PERSON_number": 143, "eval_PERSON_precision": 0.864516129032258, "eval_PERSON_recall": 0.9370629370629371, "eval_QUANTITY_f1": 0.7058823529411765, "eval_QUANTITY_number": 23, "eval_QUANTITY_precision": 0.6428571428571429, "eval_QUANTITY_recall": 0.782608695652174, "eval_TIME_f1": 0.75, "eval_TIME_number": 26, "eval_TIME_precision": 0.7, "eval_TIME_recall": 0.8076923076923077, "eval_loss": 0.16692771017551422, "eval_overall_accuracy": 0.9594696022016512, "eval_overall_f1": 0.8296703296703297, "eval_overall_precision": 0.7763496143958869, "eval_overall_recall": 0.8908554572271387, "eval_runtime": 0.9304, "eval_samples_per_second": 200.987, "eval_steps_per_second": 3.224, "step": 3922 }, { "epoch": 38.0, "grad_norm": 1.5005148649215698, "learning_rate": 3.1e-05, "loss": 0.0583, "step": 4028 }, { "epoch": 38.0, "eval_LOCATION_f1": 0.8169014084507044, "eval_LOCATION_number": 72, "eval_LOCATION_precision": 0.8285714285714286, "eval_LOCATION_recall": 0.8055555555555556, "eval_ORGANIZATION_f1": 0.7721518987341773, "eval_ORGANIZATION_number": 75, "eval_ORGANIZATION_precision": 0.7349397590361446, "eval_ORGANIZATION_recall": 0.8133333333333334, "eval_PERSON_f1": 0.9090909090909092, "eval_PERSON_number": 143, "eval_PERSON_precision": 0.8766233766233766, "eval_PERSON_recall": 0.9440559440559441, "eval_QUANTITY_f1": 0.72, "eval_QUANTITY_number": 23, "eval_QUANTITY_precision": 0.6666666666666666, "eval_QUANTITY_recall": 0.782608695652174, "eval_TIME_f1": 0.7924528301886792, "eval_TIME_number": 26, "eval_TIME_precision": 0.7777777777777778, "eval_TIME_recall": 0.8076923076923077, "eval_loss": 0.15361984074115753, "eval_overall_accuracy": 0.960720540405304, "eval_overall_f1": 0.8371428571428572, "eval_overall_precision": 0.8116343490304709, "eval_overall_recall": 0.8643067846607669, "eval_runtime": 0.9285, "eval_samples_per_second": 201.402, "eval_steps_per_second": 3.231, "step": 4028 }, { "epoch": 39.0, "grad_norm": 0.37653887271881104, "learning_rate": 3.05e-05, "loss": 0.0545, "step": 4134 }, { "epoch": 39.0, "eval_LOCATION_f1": 0.8111888111888113, "eval_LOCATION_number": 72, "eval_LOCATION_precision": 0.8169014084507042, "eval_LOCATION_recall": 0.8055555555555556, "eval_ORGANIZATION_f1": 0.7647058823529413, "eval_ORGANIZATION_number": 75, "eval_ORGANIZATION_precision": 0.6842105263157895, "eval_ORGANIZATION_recall": 0.8666666666666667, "eval_PERSON_f1": 0.9, "eval_PERSON_number": 143, "eval_PERSON_precision": 0.8598726114649682, "eval_PERSON_recall": 0.9440559440559441, "eval_QUANTITY_f1": 0.7307692307692308, "eval_QUANTITY_number": 23, "eval_QUANTITY_precision": 0.6551724137931034, "eval_QUANTITY_recall": 0.8260869565217391, "eval_TIME_f1": 0.7407407407407408, "eval_TIME_number": 26, "eval_TIME_precision": 0.7142857142857143, "eval_TIME_recall": 0.7692307692307693, "eval_loss": 0.16966940462589264, "eval_overall_accuracy": 0.957968476357268, "eval_overall_f1": 0.8261474269819195, "eval_overall_precision": 0.781578947368421, "eval_overall_recall": 0.8761061946902655, "eval_runtime": 0.9372, "eval_samples_per_second": 199.533, "eval_steps_per_second": 3.201, "step": 4134 }, { "epoch": 40.0, "grad_norm": 1.0764912366867065, "learning_rate": 3e-05, "loss": 0.0555, "step": 4240 }, { "epoch": 40.0, "eval_LOCATION_f1": 0.8456375838926175, "eval_LOCATION_number": 72, "eval_LOCATION_precision": 0.8181818181818182, "eval_LOCATION_recall": 0.875, "eval_ORGANIZATION_f1": 0.7784431137724551, "eval_ORGANIZATION_number": 75, "eval_ORGANIZATION_precision": 0.7065217391304348, "eval_ORGANIZATION_recall": 0.8666666666666667, "eval_PERSON_f1": 0.8963210702341137, "eval_PERSON_number": 143, "eval_PERSON_precision": 0.8589743589743589, "eval_PERSON_recall": 0.9370629370629371, "eval_QUANTITY_f1": 0.6923076923076923, "eval_QUANTITY_number": 23, "eval_QUANTITY_precision": 0.6206896551724138, "eval_QUANTITY_recall": 0.782608695652174, "eval_TIME_f1": 0.6896551724137931, "eval_TIME_number": 26, "eval_TIME_precision": 0.625, "eval_TIME_recall": 0.7692307692307693, "eval_loss": 0.16699136793613434, "eval_overall_accuracy": 0.9587190392794596, "eval_overall_f1": 0.8275862068965517, "eval_overall_precision": 0.7772020725388601, "eval_overall_recall": 0.8849557522123894, "eval_runtime": 0.9355, "eval_samples_per_second": 199.887, "eval_steps_per_second": 3.207, "step": 4240 }, { "epoch": 41.0, "grad_norm": 1.2565559148788452, "learning_rate": 2.95e-05, "loss": 0.0536, "step": 4346 }, { "epoch": 41.0, "eval_LOCATION_f1": 0.8513513513513513, "eval_LOCATION_number": 72, "eval_LOCATION_precision": 0.8289473684210527, "eval_LOCATION_recall": 0.875, "eval_ORGANIZATION_f1": 0.7928994082840236, "eval_ORGANIZATION_number": 75, "eval_ORGANIZATION_precision": 0.7127659574468085, "eval_ORGANIZATION_recall": 0.8933333333333333, "eval_PERSON_f1": 0.8963210702341137, "eval_PERSON_number": 143, "eval_PERSON_precision": 0.8589743589743589, "eval_PERSON_recall": 0.9370629370629371, "eval_QUANTITY_f1": 0.72, "eval_QUANTITY_number": 23, "eval_QUANTITY_precision": 0.6666666666666666, "eval_QUANTITY_recall": 0.782608695652174, "eval_TIME_f1": 0.7368421052631579, "eval_TIME_number": 26, "eval_TIME_precision": 0.6774193548387096, "eval_TIME_recall": 0.8076923076923077, "eval_loss": 0.16643501818180084, "eval_overall_accuracy": 0.9599699774831123, "eval_overall_f1": 0.8381742738589212, "eval_overall_precision": 0.7890625, "eval_overall_recall": 0.8938053097345132, "eval_runtime": 0.9907, "eval_samples_per_second": 188.749, "eval_steps_per_second": 3.028, "step": 4346 }, { "epoch": 42.0, "grad_norm": 0.8656229376792908, "learning_rate": 2.9e-05, "loss": 0.0528, "step": 4452 }, { "epoch": 42.0, "eval_LOCATION_f1": 0.8827586206896552, "eval_LOCATION_number": 72, "eval_LOCATION_precision": 0.8767123287671232, "eval_LOCATION_recall": 0.8888888888888888, "eval_ORGANIZATION_f1": 0.7607361963190183, "eval_ORGANIZATION_number": 75, "eval_ORGANIZATION_precision": 0.7045454545454546, "eval_ORGANIZATION_recall": 0.8266666666666667, "eval_PERSON_f1": 0.903010033444816, "eval_PERSON_number": 143, "eval_PERSON_precision": 0.8653846153846154, "eval_PERSON_recall": 0.9440559440559441, "eval_QUANTITY_f1": 0.6206896551724138, "eval_QUANTITY_number": 23, "eval_QUANTITY_precision": 0.5142857142857142, "eval_QUANTITY_recall": 0.782608695652174, "eval_TIME_f1": 0.7272727272727274, "eval_TIME_number": 26, "eval_TIME_precision": 0.6896551724137931, "eval_TIME_recall": 0.7692307692307693, "eval_loss": 0.1719001978635788, "eval_overall_accuracy": 0.9574681010758068, "eval_overall_f1": 0.8305555555555555, "eval_overall_precision": 0.7847769028871391, "eval_overall_recall": 0.8820058997050148, "eval_runtime": 0.9302, "eval_samples_per_second": 201.029, "eval_steps_per_second": 3.225, "step": 4452 }, { "epoch": 43.0, "grad_norm": 0.4717106819152832, "learning_rate": 2.8499999999999998e-05, "loss": 0.0505, "step": 4558 }, { "epoch": 43.0, "eval_LOCATION_f1": 0.8413793103448277, "eval_LOCATION_number": 72, "eval_LOCATION_precision": 0.8356164383561644, "eval_LOCATION_recall": 0.8472222222222222, "eval_ORGANIZATION_f1": 0.7469879518072289, "eval_ORGANIZATION_number": 75, "eval_ORGANIZATION_precision": 0.6813186813186813, "eval_ORGANIZATION_recall": 0.8266666666666667, "eval_PERSON_f1": 0.8926174496644295, "eval_PERSON_number": 143, "eval_PERSON_precision": 0.8580645161290322, "eval_PERSON_recall": 0.9300699300699301, "eval_QUANTITY_f1": 0.6428571428571429, "eval_QUANTITY_number": 23, "eval_QUANTITY_precision": 0.5454545454545454, "eval_QUANTITY_recall": 0.782608695652174, "eval_TIME_f1": 0.7272727272727274, "eval_TIME_number": 26, "eval_TIME_precision": 0.6896551724137931, "eval_TIME_recall": 0.7692307692307693, "eval_loss": 0.1703517884016037, "eval_overall_accuracy": 0.9552164123092319, "eval_overall_f1": 0.8166666666666667, "eval_overall_precision": 0.7716535433070866, "eval_overall_recall": 0.8672566371681416, "eval_runtime": 0.9281, "eval_samples_per_second": 201.476, "eval_steps_per_second": 3.232, "step": 4558 }, { "epoch": 44.0, "grad_norm": 0.6283421516418457, "learning_rate": 2.8000000000000003e-05, "loss": 0.05, "step": 4664 }, { "epoch": 44.0, "eval_LOCATION_f1": 0.8053691275167787, "eval_LOCATION_number": 72, "eval_LOCATION_precision": 0.7792207792207793, "eval_LOCATION_recall": 0.8333333333333334, "eval_ORGANIZATION_f1": 0.7607361963190183, "eval_ORGANIZATION_number": 75, "eval_ORGANIZATION_precision": 0.7045454545454546, "eval_ORGANIZATION_recall": 0.8266666666666667, "eval_PERSON_f1": 0.903010033444816, "eval_PERSON_number": 143, "eval_PERSON_precision": 0.8653846153846154, "eval_PERSON_recall": 0.9440559440559441, "eval_QUANTITY_f1": 0.6792452830188679, "eval_QUANTITY_number": 23, "eval_QUANTITY_precision": 0.6, "eval_QUANTITY_recall": 0.782608695652174, "eval_TIME_f1": 0.7272727272727274, "eval_TIME_number": 26, "eval_TIME_precision": 0.6896551724137931, "eval_TIME_recall": 0.7692307692307693, "eval_loss": 0.16587650775909424, "eval_overall_accuracy": 0.9574681010758068, "eval_overall_f1": 0.8205841446453408, "eval_overall_precision": 0.7763157894736842, "eval_overall_recall": 0.8702064896755162, "eval_runtime": 0.933, "eval_samples_per_second": 200.427, "eval_steps_per_second": 3.215, "step": 4664 }, { "epoch": 45.0, "grad_norm": 0.7488293051719666, "learning_rate": 2.7500000000000004e-05, "loss": 0.0515, "step": 4770 }, { "epoch": 45.0, "eval_LOCATION_f1": 0.8611111111111112, "eval_LOCATION_number": 72, "eval_LOCATION_precision": 0.8611111111111112, "eval_LOCATION_recall": 0.8611111111111112, "eval_ORGANIZATION_f1": 0.759493670886076, "eval_ORGANIZATION_number": 75, "eval_ORGANIZATION_precision": 0.7228915662650602, "eval_ORGANIZATION_recall": 0.8, "eval_PERSON_f1": 0.8874172185430464, "eval_PERSON_number": 143, "eval_PERSON_precision": 0.8427672955974843, "eval_PERSON_recall": 0.9370629370629371, "eval_QUANTITY_f1": 0.631578947368421, "eval_QUANTITY_number": 23, "eval_QUANTITY_precision": 0.5294117647058824, "eval_QUANTITY_recall": 0.782608695652174, "eval_TIME_f1": 0.7407407407407408, "eval_TIME_number": 26, "eval_TIME_precision": 0.7142857142857143, "eval_TIME_recall": 0.7692307692307693, "eval_loss": 0.17817422747612, "eval_overall_accuracy": 0.9544658493870403, "eval_overall_f1": 0.8223776223776224, "eval_overall_precision": 0.7819148936170213, "eval_overall_recall": 0.8672566371681416, "eval_runtime": 0.9321, "eval_samples_per_second": 200.616, "eval_steps_per_second": 3.218, "step": 4770 }, { "epoch": 46.0, "grad_norm": 0.3455760180950165, "learning_rate": 2.7000000000000002e-05, "loss": 0.0484, "step": 4876 }, { "epoch": 46.0, "eval_LOCATION_f1": 0.8356164383561645, "eval_LOCATION_number": 72, "eval_LOCATION_precision": 0.8243243243243243, "eval_LOCATION_recall": 0.8472222222222222, "eval_ORGANIZATION_f1": 0.7672955974842767, "eval_ORGANIZATION_number": 75, "eval_ORGANIZATION_precision": 0.7261904761904762, "eval_ORGANIZATION_recall": 0.8133333333333334, "eval_PERSON_f1": 0.8750000000000001, "eval_PERSON_number": 143, "eval_PERSON_precision": 0.8260869565217391, "eval_PERSON_recall": 0.9300699300699301, "eval_QUANTITY_f1": 0.6792452830188679, "eval_QUANTITY_number": 23, "eval_QUANTITY_precision": 0.6, "eval_QUANTITY_recall": 0.782608695652174, "eval_TIME_f1": 0.7547169811320754, "eval_TIME_number": 26, "eval_TIME_precision": 0.7407407407407407, "eval_TIME_recall": 0.7692307692307693, "eval_loss": 0.1757228672504425, "eval_overall_accuracy": 0.9549662246685013, "eval_overall_f1": 0.8195804195804196, "eval_overall_precision": 0.7792553191489362, "eval_overall_recall": 0.8643067846607669, "eval_runtime": 0.9328, "eval_samples_per_second": 200.479, "eval_steps_per_second": 3.216, "step": 4876 }, { "epoch": 47.0, "grad_norm": 0.9659437537193298, "learning_rate": 2.6500000000000004e-05, "loss": 0.0477, "step": 4982 }, { "epoch": 47.0, "eval_LOCATION_f1": 0.8413793103448277, "eval_LOCATION_number": 72, "eval_LOCATION_precision": 0.8356164383561644, "eval_LOCATION_recall": 0.8472222222222222, "eval_ORGANIZATION_f1": 0.7547169811320756, "eval_ORGANIZATION_number": 75, "eval_ORGANIZATION_precision": 0.7142857142857143, "eval_ORGANIZATION_recall": 0.8, "eval_PERSON_f1": 0.8844884488448846, "eval_PERSON_number": 143, "eval_PERSON_precision": 0.8375, "eval_PERSON_recall": 0.9370629370629371, "eval_QUANTITY_f1": 0.6545454545454547, "eval_QUANTITY_number": 23, "eval_QUANTITY_precision": 0.5625, "eval_QUANTITY_recall": 0.782608695652174, "eval_TIME_f1": 0.7272727272727274, "eval_TIME_number": 26, "eval_TIME_precision": 0.6896551724137931, "eval_TIME_recall": 0.7692307692307693, "eval_loss": 0.17942465841770172, "eval_overall_accuracy": 0.9549662246685013, "eval_overall_f1": 0.8172942817294282, "eval_overall_precision": 0.7751322751322751, "eval_overall_recall": 0.8643067846607669, "eval_runtime": 0.9384, "eval_samples_per_second": 199.28, "eval_steps_per_second": 3.197, "step": 4982 }, { "epoch": 48.0, "grad_norm": 0.39018484950065613, "learning_rate": 2.6000000000000002e-05, "loss": 0.0456, "step": 5088 }, { "epoch": 48.0, "eval_LOCATION_f1": 0.8472222222222222, "eval_LOCATION_number": 72, "eval_LOCATION_precision": 0.8472222222222222, "eval_LOCATION_recall": 0.8472222222222222, "eval_ORGANIZATION_f1": 0.779874213836478, "eval_ORGANIZATION_number": 75, "eval_ORGANIZATION_precision": 0.7380952380952381, "eval_ORGANIZATION_recall": 0.8266666666666667, "eval_PERSON_f1": 0.9060402684563759, "eval_PERSON_number": 143, "eval_PERSON_precision": 0.8709677419354839, "eval_PERSON_recall": 0.9440559440559441, "eval_QUANTITY_f1": 0.7058823529411765, "eval_QUANTITY_number": 23, "eval_QUANTITY_precision": 0.6428571428571429, "eval_QUANTITY_recall": 0.782608695652174, "eval_TIME_f1": 0.7272727272727274, "eval_TIME_number": 26, "eval_TIME_precision": 0.6896551724137931, "eval_TIME_recall": 0.7692307692307693, "eval_loss": 0.16816405951976776, "eval_overall_accuracy": 0.9609707280460346, "eval_overall_f1": 0.8373408769448375, "eval_overall_precision": 0.8043478260869565, "eval_overall_recall": 0.8731563421828908, "eval_runtime": 0.9286, "eval_samples_per_second": 201.387, "eval_steps_per_second": 3.231, "step": 5088 }, { "epoch": 49.0, "grad_norm": 0.4282808303833008, "learning_rate": 2.5500000000000003e-05, "loss": 0.0458, "step": 5194 }, { "epoch": 49.0, "eval_LOCATION_f1": 0.8689655172413793, "eval_LOCATION_number": 72, "eval_LOCATION_precision": 0.863013698630137, "eval_LOCATION_recall": 0.875, "eval_ORGANIZATION_f1": 0.7052023121387283, "eval_ORGANIZATION_number": 75, "eval_ORGANIZATION_precision": 0.6224489795918368, "eval_ORGANIZATION_recall": 0.8133333333333334, "eval_PERSON_f1": 0.8903654485049833, "eval_PERSON_number": 143, "eval_PERSON_precision": 0.8481012658227848, "eval_PERSON_recall": 0.9370629370629371, "eval_QUANTITY_f1": 0.6545454545454547, "eval_QUANTITY_number": 23, "eval_QUANTITY_precision": 0.5625, "eval_QUANTITY_recall": 0.782608695652174, "eval_TIME_f1": 0.7407407407407408, "eval_TIME_number": 26, "eval_TIME_precision": 0.7142857142857143, "eval_TIME_recall": 0.7692307692307693, "eval_loss": 0.18153227865695953, "eval_overall_accuracy": 0.9547160370277709, "eval_overall_f1": 0.8131868131868133, "eval_overall_precision": 0.7609254498714653, "eval_overall_recall": 0.8731563421828908, "eval_runtime": 0.927, "eval_samples_per_second": 201.727, "eval_steps_per_second": 3.236, "step": 5194 }, { "epoch": 50.0, "grad_norm": 0.5775999426841736, "learning_rate": 2.5e-05, "loss": 0.0449, "step": 5300 }, { "epoch": 50.0, "eval_LOCATION_f1": 0.8571428571428572, "eval_LOCATION_number": 72, "eval_LOCATION_precision": 0.84, "eval_LOCATION_recall": 0.875, "eval_ORGANIZATION_f1": 0.728395061728395, "eval_ORGANIZATION_number": 75, "eval_ORGANIZATION_precision": 0.6781609195402298, "eval_ORGANIZATION_recall": 0.7866666666666666, "eval_PERSON_f1": 0.9054054054054055, "eval_PERSON_number": 143, "eval_PERSON_precision": 0.8758169934640523, "eval_PERSON_recall": 0.9370629370629371, "eval_QUANTITY_f1": 0.6666666666666667, "eval_QUANTITY_number": 23, "eval_QUANTITY_precision": 0.5806451612903226, "eval_QUANTITY_recall": 0.782608695652174, "eval_TIME_f1": 0.7142857142857142, "eval_TIME_number": 26, "eval_TIME_precision": 0.6666666666666666, "eval_TIME_recall": 0.7692307692307693, "eval_loss": 0.17358513176441193, "eval_overall_accuracy": 0.9577182887165374, "eval_overall_f1": 0.8223776223776224, "eval_overall_precision": 0.7819148936170213, "eval_overall_recall": 0.8672566371681416, "eval_runtime": 0.9332, "eval_samples_per_second": 200.395, "eval_steps_per_second": 3.215, "step": 5300 }, { "epoch": 51.0, "grad_norm": 0.8392077684402466, "learning_rate": 2.45e-05, "loss": 0.0443, "step": 5406 }, { "epoch": 51.0, "eval_LOCATION_f1": 0.8378378378378377, "eval_LOCATION_number": 72, "eval_LOCATION_precision": 0.8157894736842105, "eval_LOCATION_recall": 0.8611111111111112, "eval_ORGANIZATION_f1": 0.7636363636363636, "eval_ORGANIZATION_number": 75, "eval_ORGANIZATION_precision": 0.7, "eval_ORGANIZATION_recall": 0.84, "eval_PERSON_f1": 0.8721311475409836, "eval_PERSON_number": 143, "eval_PERSON_precision": 0.8209876543209876, "eval_PERSON_recall": 0.9300699300699301, "eval_QUANTITY_f1": 0.7058823529411765, "eval_QUANTITY_number": 23, "eval_QUANTITY_precision": 0.6428571428571429, "eval_QUANTITY_recall": 0.782608695652174, "eval_TIME_f1": 0.7407407407407408, "eval_TIME_number": 26, "eval_TIME_precision": 0.7142857142857143, "eval_TIME_recall": 0.7692307692307693, "eval_loss": 0.17768125236034393, "eval_overall_accuracy": 0.9572179134350763, "eval_overall_f1": 0.8188105117565698, "eval_overall_precision": 0.7708333333333334, "eval_overall_recall": 0.8731563421828908, "eval_runtime": 0.9419, "eval_samples_per_second": 198.534, "eval_steps_per_second": 3.185, "step": 5406 }, { "epoch": 52.0, "grad_norm": 0.5880552530288696, "learning_rate": 2.4e-05, "loss": 0.044, "step": 5512 }, { "epoch": 52.0, "eval_LOCATION_f1": 0.8648648648648649, "eval_LOCATION_number": 72, "eval_LOCATION_precision": 0.8421052631578947, "eval_LOCATION_recall": 0.8888888888888888, "eval_ORGANIZATION_f1": 0.7484662576687117, "eval_ORGANIZATION_number": 75, "eval_ORGANIZATION_precision": 0.6931818181818182, "eval_ORGANIZATION_recall": 0.8133333333333334, "eval_PERSON_f1": 0.9023569023569024, "eval_PERSON_number": 143, "eval_PERSON_precision": 0.8701298701298701, "eval_PERSON_recall": 0.9370629370629371, "eval_QUANTITY_f1": 0.6792452830188679, "eval_QUANTITY_number": 23, "eval_QUANTITY_precision": 0.6, "eval_QUANTITY_recall": 0.782608695652174, "eval_TIME_f1": 0.7272727272727274, "eval_TIME_number": 26, "eval_TIME_precision": 0.6896551724137931, "eval_TIME_recall": 0.7692307692307693, "eval_loss": 0.17750605940818787, "eval_overall_accuracy": 0.9574681010758068, "eval_overall_f1": 0.8296089385474861, "eval_overall_precision": 0.7877984084880637, "eval_overall_recall": 0.8761061946902655, "eval_runtime": 0.9391, "eval_samples_per_second": 199.121, "eval_steps_per_second": 3.194, "step": 5512 }, { "epoch": 53.0, "grad_norm": 0.7479882836341858, "learning_rate": 2.35e-05, "loss": 0.0436, "step": 5618 }, { "epoch": 53.0, "eval_LOCATION_f1": 0.8648648648648649, "eval_LOCATION_number": 72, "eval_LOCATION_precision": 0.8421052631578947, "eval_LOCATION_recall": 0.8888888888888888, "eval_ORGANIZATION_f1": 0.7469879518072289, "eval_ORGANIZATION_number": 75, "eval_ORGANIZATION_precision": 0.6813186813186813, "eval_ORGANIZATION_recall": 0.8266666666666667, "eval_PERSON_f1": 0.8933333333333333, "eval_PERSON_number": 143, "eval_PERSON_precision": 0.8535031847133758, "eval_PERSON_recall": 0.9370629370629371, "eval_QUANTITY_f1": 0.6545454545454547, "eval_QUANTITY_number": 23, "eval_QUANTITY_precision": 0.5625, "eval_QUANTITY_recall": 0.782608695652174, "eval_TIME_f1": 0.7142857142857142, "eval_TIME_number": 26, "eval_TIME_precision": 0.6666666666666666, "eval_TIME_recall": 0.7692307692307693, "eval_loss": 0.17619207501411438, "eval_overall_accuracy": 0.9572179134350763, "eval_overall_f1": 0.8220689655172414, "eval_overall_precision": 0.772020725388601, "eval_overall_recall": 0.8790560471976401, "eval_runtime": 0.9329, "eval_samples_per_second": 200.454, "eval_steps_per_second": 3.216, "step": 5618 }, { "epoch": 54.0, "grad_norm": 0.6151536703109741, "learning_rate": 2.3000000000000003e-05, "loss": 0.0416, "step": 5724 }, { "epoch": 54.0, "eval_LOCATION_f1": 0.8611111111111112, "eval_LOCATION_number": 72, "eval_LOCATION_precision": 0.8611111111111112, "eval_LOCATION_recall": 0.8611111111111112, "eval_ORGANIZATION_f1": 0.7393939393939395, "eval_ORGANIZATION_number": 75, "eval_ORGANIZATION_precision": 0.6777777777777778, "eval_ORGANIZATION_recall": 0.8133333333333334, "eval_PERSON_f1": 0.8844884488448846, "eval_PERSON_number": 143, "eval_PERSON_precision": 0.8375, "eval_PERSON_recall": 0.9370629370629371, "eval_QUANTITY_f1": 0.7058823529411765, "eval_QUANTITY_number": 23, "eval_QUANTITY_precision": 0.6428571428571429, "eval_QUANTITY_recall": 0.782608695652174, "eval_TIME_f1": 0.7777777777777779, "eval_TIME_number": 26, "eval_TIME_precision": 0.75, "eval_TIME_recall": 0.8076923076923077, "eval_loss": 0.18319469690322876, "eval_overall_accuracy": 0.9569677257943457, "eval_overall_f1": 0.8256624825662482, "eval_overall_precision": 0.783068783068783, "eval_overall_recall": 0.8731563421828908, "eval_runtime": 0.9355, "eval_samples_per_second": 199.902, "eval_steps_per_second": 3.207, "step": 5724 }, { "epoch": 55.0, "grad_norm": 0.720840334892273, "learning_rate": 2.25e-05, "loss": 0.0403, "step": 5830 }, { "epoch": 55.0, "eval_LOCATION_f1": 0.8322147651006712, "eval_LOCATION_number": 72, "eval_LOCATION_precision": 0.8051948051948052, "eval_LOCATION_recall": 0.8611111111111112, "eval_ORGANIZATION_f1": 0.7471264367816093, "eval_ORGANIZATION_number": 75, "eval_ORGANIZATION_precision": 0.6565656565656566, "eval_ORGANIZATION_recall": 0.8666666666666667, "eval_PERSON_f1": 0.8786885245901639, "eval_PERSON_number": 143, "eval_PERSON_precision": 0.8271604938271605, "eval_PERSON_recall": 0.9370629370629371, "eval_QUANTITY_f1": 0.7058823529411765, "eval_QUANTITY_number": 23, "eval_QUANTITY_precision": 0.6428571428571429, "eval_QUANTITY_recall": 0.782608695652174, "eval_TIME_f1": 0.7272727272727274, "eval_TIME_number": 26, "eval_TIME_precision": 0.6896551724137931, "eval_TIME_recall": 0.7692307692307693, "eval_loss": 0.1950027197599411, "eval_overall_accuracy": 0.9542156617463098, "eval_overall_f1": 0.8147138964577656, "eval_overall_precision": 0.7569620253164557, "eval_overall_recall": 0.8820058997050148, "eval_runtime": 0.9369, "eval_samples_per_second": 199.604, "eval_steps_per_second": 3.202, "step": 5830 }, { "epoch": 56.0, "grad_norm": 0.4839901924133301, "learning_rate": 2.2000000000000003e-05, "loss": 0.0422, "step": 5936 }, { "epoch": 56.0, "eval_LOCATION_f1": 0.8275862068965517, "eval_LOCATION_number": 72, "eval_LOCATION_precision": 0.821917808219178, "eval_LOCATION_recall": 0.8333333333333334, "eval_ORGANIZATION_f1": 0.7439024390243902, "eval_ORGANIZATION_number": 75, "eval_ORGANIZATION_precision": 0.6853932584269663, "eval_ORGANIZATION_recall": 0.8133333333333334, "eval_PERSON_f1": 0.8933333333333333, "eval_PERSON_number": 143, "eval_PERSON_precision": 0.8535031847133758, "eval_PERSON_recall": 0.9370629370629371, "eval_QUANTITY_f1": 0.6792452830188679, "eval_QUANTITY_number": 23, "eval_QUANTITY_precision": 0.6, "eval_QUANTITY_recall": 0.782608695652174, "eval_TIME_f1": 0.7407407407407408, "eval_TIME_number": 26, "eval_TIME_precision": 0.7142857142857143, "eval_TIME_recall": 0.7692307692307693, "eval_loss": 0.17818213999271393, "eval_overall_accuracy": 0.9569677257943457, "eval_overall_f1": 0.8184357541899441, "eval_overall_precision": 0.7771883289124668, "eval_overall_recall": 0.8643067846607669, "eval_runtime": 0.9337, "eval_samples_per_second": 200.278, "eval_steps_per_second": 3.213, "step": 5936 }, { "epoch": 57.0, "grad_norm": 0.7197099924087524, "learning_rate": 2.15e-05, "loss": 0.0394, "step": 6042 }, { "epoch": 57.0, "eval_LOCATION_f1": 0.8333333333333334, "eval_LOCATION_number": 72, "eval_LOCATION_precision": 0.8333333333333334, "eval_LOCATION_recall": 0.8333333333333334, "eval_ORGANIZATION_f1": 0.7468354430379747, "eval_ORGANIZATION_number": 75, "eval_ORGANIZATION_precision": 0.7108433734939759, "eval_ORGANIZATION_recall": 0.7866666666666666, "eval_PERSON_f1": 0.8896321070234114, "eval_PERSON_number": 143, "eval_PERSON_precision": 0.8525641025641025, "eval_PERSON_recall": 0.9300699300699301, "eval_QUANTITY_f1": 0.7058823529411765, "eval_QUANTITY_number": 23, "eval_QUANTITY_precision": 0.6428571428571429, "eval_QUANTITY_recall": 0.782608695652174, "eval_TIME_f1": 0.7407407407407408, "eval_TIME_number": 26, "eval_TIME_precision": 0.7142857142857143, "eval_TIME_recall": 0.7692307692307693, "eval_loss": 0.17426693439483643, "eval_overall_accuracy": 0.9589692269201902, "eval_overall_f1": 0.8215297450424929, "eval_overall_precision": 0.7901907356948229, "eval_overall_recall": 0.855457227138643, "eval_runtime": 0.9259, "eval_samples_per_second": 201.976, "eval_steps_per_second": 3.24, "step": 6042 }, { "epoch": 58.0, "grad_norm": 0.526695191860199, "learning_rate": 2.1e-05, "loss": 0.0409, "step": 6148 }, { "epoch": 58.0, "eval_LOCATION_f1": 0.8299319727891157, "eval_LOCATION_number": 72, "eval_LOCATION_precision": 0.8133333333333334, "eval_LOCATION_recall": 0.8472222222222222, "eval_ORGANIZATION_f1": 0.7643312101910827, "eval_ORGANIZATION_number": 75, "eval_ORGANIZATION_precision": 0.7317073170731707, "eval_ORGANIZATION_recall": 0.8, "eval_PERSON_f1": 0.8874172185430464, "eval_PERSON_number": 143, "eval_PERSON_precision": 0.8427672955974843, "eval_PERSON_recall": 0.9370629370629371, "eval_QUANTITY_f1": 0.6792452830188679, "eval_QUANTITY_number": 23, "eval_QUANTITY_precision": 0.6, "eval_QUANTITY_recall": 0.782608695652174, "eval_TIME_f1": 0.7142857142857142, "eval_TIME_number": 26, "eval_TIME_precision": 0.6666666666666666, "eval_TIME_recall": 0.7692307692307693, "eval_loss": 0.17505142092704773, "eval_overall_accuracy": 0.9567175381536153, "eval_overall_f1": 0.8195804195804196, "eval_overall_precision": 0.7792553191489362, "eval_overall_recall": 0.8643067846607669, "eval_runtime": 0.9256, "eval_samples_per_second": 202.037, "eval_steps_per_second": 3.241, "step": 6148 }, { "epoch": 59.0, "grad_norm": 0.38071247935295105, "learning_rate": 2.05e-05, "loss": 0.0384, "step": 6254 }, { "epoch": 59.0, "eval_LOCATION_f1": 0.8133333333333332, "eval_LOCATION_number": 72, "eval_LOCATION_precision": 0.782051282051282, "eval_LOCATION_recall": 0.8472222222222222, "eval_ORGANIZATION_f1": 0.7749999999999999, "eval_ORGANIZATION_number": 75, "eval_ORGANIZATION_precision": 0.7294117647058823, "eval_ORGANIZATION_recall": 0.8266666666666667, "eval_PERSON_f1": 0.8896321070234114, "eval_PERSON_number": 143, "eval_PERSON_precision": 0.8525641025641025, "eval_PERSON_recall": 0.9300699300699301, "eval_QUANTITY_f1": 0.6923076923076923, "eval_QUANTITY_number": 23, "eval_QUANTITY_precision": 0.6206896551724138, "eval_QUANTITY_recall": 0.782608695652174, "eval_TIME_f1": 0.75, "eval_TIME_number": 26, "eval_TIME_precision": 0.7, "eval_TIME_recall": 0.8076923076923077, "eval_loss": 0.17447121441364288, "eval_overall_accuracy": 0.957968476357268, "eval_overall_f1": 0.8228730822873082, "eval_overall_precision": 0.7804232804232805, "eval_overall_recall": 0.8702064896755162, "eval_runtime": 0.9356, "eval_samples_per_second": 199.869, "eval_steps_per_second": 3.206, "step": 6254 }, { "epoch": 60.0, "grad_norm": 0.4309019446372986, "learning_rate": 2e-05, "loss": 0.0385, "step": 6360 }, { "epoch": 60.0, "eval_LOCATION_f1": 0.8590604026845637, "eval_LOCATION_number": 72, "eval_LOCATION_precision": 0.8311688311688312, "eval_LOCATION_recall": 0.8888888888888888, "eval_ORGANIZATION_f1": 0.7757575757575759, "eval_ORGANIZATION_number": 75, "eval_ORGANIZATION_precision": 0.7111111111111111, "eval_ORGANIZATION_recall": 0.8533333333333334, "eval_PERSON_f1": 0.8874172185430464, "eval_PERSON_number": 143, "eval_PERSON_precision": 0.8427672955974843, "eval_PERSON_recall": 0.9370629370629371, "eval_QUANTITY_f1": 0.6428571428571429, "eval_QUANTITY_number": 23, "eval_QUANTITY_precision": 0.5454545454545454, "eval_QUANTITY_recall": 0.782608695652174, "eval_TIME_f1": 0.7407407407407408, "eval_TIME_number": 26, "eval_TIME_precision": 0.7142857142857143, "eval_TIME_recall": 0.7692307692307693, "eval_loss": 0.18776963651180267, "eval_overall_accuracy": 0.955716787590693, "eval_overall_f1": 0.8264462809917357, "eval_overall_precision": 0.7751937984496124, "eval_overall_recall": 0.8849557522123894, "eval_runtime": 0.9372, "eval_samples_per_second": 199.53, "eval_steps_per_second": 3.201, "step": 6360 }, { "epoch": 61.0, "grad_norm": 1.0351260900497437, "learning_rate": 1.9500000000000003e-05, "loss": 0.0371, "step": 6466 }, { "epoch": 61.0, "eval_LOCATION_f1": 0.8309859154929577, "eval_LOCATION_number": 72, "eval_LOCATION_precision": 0.8428571428571429, "eval_LOCATION_recall": 0.8194444444444444, "eval_ORGANIZATION_f1": 0.763157894736842, "eval_ORGANIZATION_number": 75, "eval_ORGANIZATION_precision": 0.7532467532467533, "eval_ORGANIZATION_recall": 0.7733333333333333, "eval_PERSON_f1": 0.8778877887788779, "eval_PERSON_number": 143, "eval_PERSON_precision": 0.83125, "eval_PERSON_recall": 0.9300699300699301, "eval_QUANTITY_f1": 0.6792452830188679, "eval_QUANTITY_number": 23, "eval_QUANTITY_precision": 0.6, "eval_QUANTITY_recall": 0.782608695652174, "eval_TIME_f1": 0.7407407407407408, "eval_TIME_number": 26, "eval_TIME_precision": 0.7142857142857143, "eval_TIME_recall": 0.7692307692307693, "eval_loss": 0.18786616623401642, "eval_overall_accuracy": 0.9562171628721541, "eval_overall_f1": 0.8181818181818181, "eval_overall_precision": 0.7890410958904109, "eval_overall_recall": 0.8495575221238938, "eval_runtime": 0.9236, "eval_samples_per_second": 202.479, "eval_steps_per_second": 3.248, "step": 6466 }, { "epoch": 62.0, "grad_norm": 0.6741280555725098, "learning_rate": 1.9e-05, "loss": 0.0385, "step": 6572 }, { "epoch": 62.0, "eval_LOCATION_f1": 0.7972972972972973, "eval_LOCATION_number": 72, "eval_LOCATION_precision": 0.7763157894736842, "eval_LOCATION_recall": 0.8194444444444444, "eval_ORGANIZATION_f1": 0.7894736842105264, "eval_ORGANIZATION_number": 75, "eval_ORGANIZATION_precision": 0.7792207792207793, "eval_ORGANIZATION_recall": 0.8, "eval_PERSON_f1": 0.8940397350993377, "eval_PERSON_number": 143, "eval_PERSON_precision": 0.8490566037735849, "eval_PERSON_recall": 0.9440559440559441, "eval_QUANTITY_f1": 0.6792452830188679, "eval_QUANTITY_number": 23, "eval_QUANTITY_precision": 0.6, "eval_QUANTITY_recall": 0.782608695652174, "eval_TIME_f1": 0.7142857142857142, "eval_TIME_number": 26, "eval_TIME_precision": 0.6666666666666666, "eval_TIME_recall": 0.7692307692307693, "eval_loss": 0.18338263034820557, "eval_overall_accuracy": 0.9574681010758068, "eval_overall_f1": 0.8213783403656821, "eval_overall_precision": 0.7849462365591398, "eval_overall_recall": 0.8613569321533924, "eval_runtime": 0.9302, "eval_samples_per_second": 201.036, "eval_steps_per_second": 3.225, "step": 6572 }, { "epoch": 63.0, "grad_norm": 0.2608901560306549, "learning_rate": 1.85e-05, "loss": 0.0359, "step": 6678 }, { "epoch": 63.0, "eval_LOCATION_f1": 0.816326530612245, "eval_LOCATION_number": 72, "eval_LOCATION_precision": 0.8, "eval_LOCATION_recall": 0.8333333333333334, "eval_ORGANIZATION_f1": 0.7777777777777777, "eval_ORGANIZATION_number": 75, "eval_ORGANIZATION_precision": 0.7241379310344828, "eval_ORGANIZATION_recall": 0.84, "eval_PERSON_f1": 0.9084745762711864, "eval_PERSON_number": 143, "eval_PERSON_precision": 0.881578947368421, "eval_PERSON_recall": 0.9370629370629371, "eval_QUANTITY_f1": 0.6545454545454547, "eval_QUANTITY_number": 23, "eval_QUANTITY_precision": 0.5625, "eval_QUANTITY_recall": 0.782608695652174, "eval_TIME_f1": 0.7017543859649122, "eval_TIME_number": 26, "eval_TIME_precision": 0.6451612903225806, "eval_TIME_recall": 0.7692307692307693, "eval_loss": 0.18453986942768097, "eval_overall_accuracy": 0.9587190392794596, "eval_overall_f1": 0.8240223463687151, "eval_overall_precision": 0.7824933687002652, "eval_overall_recall": 0.8702064896755162, "eval_runtime": 0.9321, "eval_samples_per_second": 200.623, "eval_steps_per_second": 3.219, "step": 6678 }, { "epoch": 64.0, "grad_norm": 0.7726385593414307, "learning_rate": 1.8e-05, "loss": 0.0355, "step": 6784 }, { "epoch": 64.0, "eval_LOCATION_f1": 0.816326530612245, "eval_LOCATION_number": 72, "eval_LOCATION_precision": 0.8, "eval_LOCATION_recall": 0.8333333333333334, "eval_ORGANIZATION_f1": 0.7484662576687117, "eval_ORGANIZATION_number": 75, "eval_ORGANIZATION_precision": 0.6931818181818182, "eval_ORGANIZATION_recall": 0.8133333333333334, "eval_PERSON_f1": 0.881578947368421, "eval_PERSON_number": 143, "eval_PERSON_precision": 0.8322981366459627, "eval_PERSON_recall": 0.9370629370629371, "eval_QUANTITY_f1": 0.6792452830188679, "eval_QUANTITY_number": 23, "eval_QUANTITY_precision": 0.6, "eval_QUANTITY_recall": 0.782608695652174, "eval_TIME_f1": 0.7407407407407408, "eval_TIME_number": 26, "eval_TIME_precision": 0.7142857142857143, "eval_TIME_recall": 0.7692307692307693, "eval_loss": 0.20165307819843292, "eval_overall_accuracy": 0.9542156617463098, "eval_overall_f1": 0.812760055478502, "eval_overall_precision": 0.7670157068062827, "eval_overall_recall": 0.8643067846607669, "eval_runtime": 0.957, "eval_samples_per_second": 195.402, "eval_steps_per_second": 3.135, "step": 6784 }, { "epoch": 65.0, "grad_norm": 0.47850877046585083, "learning_rate": 1.75e-05, "loss": 0.0338, "step": 6890 }, { "epoch": 65.0, "eval_LOCATION_f1": 0.7972972972972973, "eval_LOCATION_number": 72, "eval_LOCATION_precision": 0.7763157894736842, "eval_LOCATION_recall": 0.8194444444444444, "eval_ORGANIZATION_f1": 0.7712418300653594, "eval_ORGANIZATION_number": 75, "eval_ORGANIZATION_precision": 0.7564102564102564, "eval_ORGANIZATION_recall": 0.7866666666666666, "eval_PERSON_f1": 0.8903654485049833, "eval_PERSON_number": 143, "eval_PERSON_precision": 0.8481012658227848, "eval_PERSON_recall": 0.9370629370629371, "eval_QUANTITY_f1": 0.7058823529411765, "eval_QUANTITY_number": 23, "eval_QUANTITY_precision": 0.6428571428571429, "eval_QUANTITY_recall": 0.782608695652174, "eval_TIME_f1": 0.7547169811320754, "eval_TIME_number": 26, "eval_TIME_precision": 0.7407407407407407, "eval_TIME_recall": 0.7692307692307693, "eval_loss": 0.1862517148256302, "eval_overall_accuracy": 0.9569677257943457, "eval_overall_f1": 0.8215297450424929, "eval_overall_precision": 0.7901907356948229, "eval_overall_recall": 0.855457227138643, "eval_runtime": 0.9305, "eval_samples_per_second": 200.976, "eval_steps_per_second": 3.224, "step": 6890 }, { "epoch": 66.0, "grad_norm": 1.3503855466842651, "learning_rate": 1.7000000000000003e-05, "loss": 0.0376, "step": 6996 }, { "epoch": 66.0, "eval_LOCATION_f1": 0.8219178082191781, "eval_LOCATION_number": 72, "eval_LOCATION_precision": 0.8108108108108109, "eval_LOCATION_recall": 0.8333333333333334, "eval_ORGANIZATION_f1": 0.7792207792207794, "eval_ORGANIZATION_number": 75, "eval_ORGANIZATION_precision": 0.759493670886076, "eval_ORGANIZATION_recall": 0.8, "eval_PERSON_f1": 0.8852459016393444, "eval_PERSON_number": 143, "eval_PERSON_precision": 0.8333333333333334, "eval_PERSON_recall": 0.9440559440559441, "eval_QUANTITY_f1": 0.6666666666666667, "eval_QUANTITY_number": 23, "eval_QUANTITY_precision": 0.5806451612903226, "eval_QUANTITY_recall": 0.782608695652174, "eval_TIME_f1": 0.7407407407407408, "eval_TIME_number": 26, "eval_TIME_precision": 0.7142857142857143, "eval_TIME_recall": 0.7692307692307693, "eval_loss": 0.1855112761259079, "eval_overall_accuracy": 0.9564673505128847, "eval_overall_f1": 0.8218793828892006, "eval_overall_precision": 0.7834224598930482, "eval_overall_recall": 0.8643067846607669, "eval_runtime": 0.9291, "eval_samples_per_second": 201.265, "eval_steps_per_second": 3.229, "step": 6996 }, { "epoch": 67.0, "grad_norm": 0.09078435599803925, "learning_rate": 1.65e-05, "loss": 0.0324, "step": 7102 }, { "epoch": 67.0, "eval_LOCATION_f1": 0.816326530612245, "eval_LOCATION_number": 72, "eval_LOCATION_precision": 0.8, "eval_LOCATION_recall": 0.8333333333333334, "eval_ORGANIZATION_f1": 0.7712418300653594, "eval_ORGANIZATION_number": 75, "eval_ORGANIZATION_precision": 0.7564102564102564, "eval_ORGANIZATION_recall": 0.7866666666666666, "eval_PERSON_f1": 0.8675496688741723, "eval_PERSON_number": 143, "eval_PERSON_precision": 0.8238993710691824, "eval_PERSON_recall": 0.916083916083916, "eval_QUANTITY_f1": 0.6666666666666667, "eval_QUANTITY_number": 23, "eval_QUANTITY_precision": 0.5806451612903226, "eval_QUANTITY_recall": 0.782608695652174, "eval_TIME_f1": 0.7272727272727274, "eval_TIME_number": 26, "eval_TIME_precision": 0.6896551724137931, "eval_TIME_recall": 0.7692307692307693, "eval_loss": 0.19535928964614868, "eval_overall_accuracy": 0.9547160370277709, "eval_overall_f1": 0.810126582278481, "eval_overall_precision": 0.7741935483870968, "eval_overall_recall": 0.8495575221238938, "eval_runtime": 0.923, "eval_samples_per_second": 202.594, "eval_steps_per_second": 3.25, "step": 7102 }, { "epoch": 68.0, "grad_norm": 0.13197369873523712, "learning_rate": 1.6000000000000003e-05, "loss": 0.0361, "step": 7208 }, { "epoch": 68.0, "eval_LOCATION_f1": 0.8299319727891157, "eval_LOCATION_number": 72, "eval_LOCATION_precision": 0.8133333333333334, "eval_LOCATION_recall": 0.8472222222222222, "eval_ORGANIZATION_f1": 0.7407407407407408, "eval_ORGANIZATION_number": 75, "eval_ORGANIZATION_precision": 0.6896551724137931, "eval_ORGANIZATION_recall": 0.8, "eval_PERSON_f1": 0.8770764119601329, "eval_PERSON_number": 143, "eval_PERSON_precision": 0.8354430379746836, "eval_PERSON_recall": 0.9230769230769231, "eval_QUANTITY_f1": 0.6792452830188679, "eval_QUANTITY_number": 23, "eval_QUANTITY_precision": 0.6, "eval_QUANTITY_recall": 0.782608695652174, "eval_TIME_f1": 0.7407407407407408, "eval_TIME_number": 26, "eval_TIME_precision": 0.7142857142857143, "eval_TIME_recall": 0.7692307692307693, "eval_loss": 0.2019178867340088, "eval_overall_accuracy": 0.9534650988241181, "eval_overall_f1": 0.8117154811715481, "eval_overall_precision": 0.7698412698412699, "eval_overall_recall": 0.8584070796460177, "eval_runtime": 0.9293, "eval_samples_per_second": 201.226, "eval_steps_per_second": 3.228, "step": 7208 }, { "epoch": 69.0, "grad_norm": 0.3539793789386749, "learning_rate": 1.55e-05, "loss": 0.0329, "step": 7314 }, { "epoch": 69.0, "eval_LOCATION_f1": 0.8243243243243243, "eval_LOCATION_number": 72, "eval_LOCATION_precision": 0.8026315789473685, "eval_LOCATION_recall": 0.8472222222222222, "eval_ORGANIZATION_f1": 0.7468354430379747, "eval_ORGANIZATION_number": 75, "eval_ORGANIZATION_precision": 0.7108433734939759, "eval_ORGANIZATION_recall": 0.7866666666666666, "eval_PERSON_f1": 0.8741721854304637, "eval_PERSON_number": 143, "eval_PERSON_precision": 0.8301886792452831, "eval_PERSON_recall": 0.9230769230769231, "eval_QUANTITY_f1": 0.72, "eval_QUANTITY_number": 23, "eval_QUANTITY_precision": 0.6666666666666666, "eval_QUANTITY_recall": 0.782608695652174, "eval_TIME_f1": 0.7547169811320754, "eval_TIME_number": 26, "eval_TIME_precision": 0.7407407407407407, "eval_TIME_recall": 0.7692307692307693, "eval_loss": 0.1934998482465744, "eval_overall_accuracy": 0.9559669752314236, "eval_overall_f1": 0.8157524613220816, "eval_overall_precision": 0.7795698924731183, "eval_overall_recall": 0.855457227138643, "eval_runtime": 0.9314, "eval_samples_per_second": 200.776, "eval_steps_per_second": 3.221, "step": 7314 }, { "epoch": 70.0, "grad_norm": 0.4102155566215515, "learning_rate": 1.5e-05, "loss": 0.0336, "step": 7420 }, { "epoch": 70.0, "eval_LOCATION_f1": 0.8590604026845637, "eval_LOCATION_number": 72, "eval_LOCATION_precision": 0.8311688311688312, "eval_LOCATION_recall": 0.8888888888888888, "eval_ORGANIZATION_f1": 0.7407407407407408, "eval_ORGANIZATION_number": 75, "eval_ORGANIZATION_precision": 0.6896551724137931, "eval_ORGANIZATION_recall": 0.8, "eval_PERSON_f1": 0.8844884488448846, "eval_PERSON_number": 143, "eval_PERSON_precision": 0.8375, "eval_PERSON_recall": 0.9370629370629371, "eval_QUANTITY_f1": 0.72, "eval_QUANTITY_number": 23, "eval_QUANTITY_precision": 0.6666666666666666, "eval_QUANTITY_recall": 0.782608695652174, "eval_TIME_f1": 0.7547169811320754, "eval_TIME_number": 26, "eval_TIME_precision": 0.7407407407407407, "eval_TIME_recall": 0.7692307692307693, "eval_loss": 0.18642878532409668, "eval_overall_accuracy": 0.9582186639979985, "eval_overall_f1": 0.8256624825662482, "eval_overall_precision": 0.783068783068783, "eval_overall_recall": 0.8731563421828908, "eval_runtime": 0.9273, "eval_samples_per_second": 201.662, "eval_steps_per_second": 3.235, "step": 7420 }, { "epoch": 71.0, "grad_norm": 0.9542334675788879, "learning_rate": 1.45e-05, "loss": 0.0346, "step": 7526 }, { "epoch": 71.0, "eval_LOCATION_f1": 0.8413793103448277, "eval_LOCATION_number": 72, "eval_LOCATION_precision": 0.8356164383561644, "eval_LOCATION_recall": 0.8472222222222222, "eval_ORGANIZATION_f1": 0.6987951807228915, "eval_ORGANIZATION_number": 75, "eval_ORGANIZATION_precision": 0.6373626373626373, "eval_ORGANIZATION_recall": 0.7733333333333333, "eval_PERSON_f1": 0.8721311475409836, "eval_PERSON_number": 143, "eval_PERSON_precision": 0.8209876543209876, "eval_PERSON_recall": 0.9300699300699301, "eval_QUANTITY_f1": 0.6923076923076923, "eval_QUANTITY_number": 23, "eval_QUANTITY_precision": 0.6206896551724138, "eval_QUANTITY_recall": 0.782608695652174, "eval_TIME_f1": 0.7547169811320754, "eval_TIME_number": 26, "eval_TIME_precision": 0.7407407407407407, "eval_TIME_recall": 0.7692307692307693, "eval_loss": 0.18929119408130646, "eval_overall_accuracy": 0.9549662246685013, "eval_overall_f1": 0.8044382801664355, "eval_overall_precision": 0.7591623036649214, "eval_overall_recall": 0.855457227138643, "eval_runtime": 0.9224, "eval_samples_per_second": 202.728, "eval_steps_per_second": 3.252, "step": 7526 }, { "epoch": 72.0, "grad_norm": 0.808494508266449, "learning_rate": 1.4000000000000001e-05, "loss": 0.0312, "step": 7632 }, { "epoch": 72.0, "eval_LOCATION_f1": 0.8493150684931507, "eval_LOCATION_number": 72, "eval_LOCATION_precision": 0.8378378378378378, "eval_LOCATION_recall": 0.8611111111111112, "eval_ORGANIZATION_f1": 0.7407407407407408, "eval_ORGANIZATION_number": 75, "eval_ORGANIZATION_precision": 0.6896551724137931, "eval_ORGANIZATION_recall": 0.8, "eval_PERSON_f1": 0.8903654485049833, "eval_PERSON_number": 143, "eval_PERSON_precision": 0.8481012658227848, "eval_PERSON_recall": 0.9370629370629371, "eval_QUANTITY_f1": 0.6666666666666667, "eval_QUANTITY_number": 23, "eval_QUANTITY_precision": 0.5806451612903226, "eval_QUANTITY_recall": 0.782608695652174, "eval_TIME_f1": 0.7547169811320754, "eval_TIME_number": 26, "eval_TIME_precision": 0.7407407407407407, "eval_TIME_recall": 0.7692307692307693, "eval_loss": 0.1959969848394394, "eval_overall_accuracy": 0.9569677257943457, "eval_overall_f1": 0.8212290502793296, "eval_overall_precision": 0.7798408488063661, "eval_overall_recall": 0.8672566371681416, "eval_runtime": 0.9295, "eval_samples_per_second": 201.192, "eval_steps_per_second": 3.228, "step": 7632 }, { "epoch": 73.0, "grad_norm": 1.9524306058883667, "learning_rate": 1.3500000000000001e-05, "loss": 0.0342, "step": 7738 }, { "epoch": 73.0, "eval_LOCATION_f1": 0.8378378378378377, "eval_LOCATION_number": 72, "eval_LOCATION_precision": 0.8157894736842105, "eval_LOCATION_recall": 0.8611111111111112, "eval_ORGANIZATION_f1": 0.7544910179640718, "eval_ORGANIZATION_number": 75, "eval_ORGANIZATION_precision": 0.6847826086956522, "eval_ORGANIZATION_recall": 0.84, "eval_PERSON_f1": 0.8800000000000001, "eval_PERSON_number": 143, "eval_PERSON_precision": 0.8407643312101911, "eval_PERSON_recall": 0.9230769230769231, "eval_QUANTITY_f1": 0.7058823529411765, "eval_QUANTITY_number": 23, "eval_QUANTITY_precision": 0.6428571428571429, "eval_QUANTITY_recall": 0.782608695652174, "eval_TIME_f1": 0.7272727272727274, "eval_TIME_number": 26, "eval_TIME_precision": 0.6896551724137931, "eval_TIME_recall": 0.7692307692307693, "eval_loss": 0.19410043954849243, "eval_overall_accuracy": 0.9554665999499625, "eval_overall_f1": 0.8183079056865463, "eval_overall_precision": 0.7722513089005235, "eval_overall_recall": 0.8702064896755162, "eval_runtime": 1.0344, "eval_samples_per_second": 180.783, "eval_steps_per_second": 2.9, "step": 7738 }, { "epoch": 74.0, "grad_norm": 1.1691898107528687, "learning_rate": 1.3000000000000001e-05, "loss": 0.0319, "step": 7844 }, { "epoch": 74.0, "eval_LOCATION_f1": 0.847682119205298, "eval_LOCATION_number": 72, "eval_LOCATION_precision": 0.810126582278481, "eval_LOCATION_recall": 0.8888888888888888, "eval_ORGANIZATION_f1": 0.7701863354037267, "eval_ORGANIZATION_number": 75, "eval_ORGANIZATION_precision": 0.7209302325581395, "eval_ORGANIZATION_recall": 0.8266666666666667, "eval_PERSON_f1": 0.8823529411764706, "eval_PERSON_number": 143, "eval_PERSON_precision": 0.8282208588957055, "eval_PERSON_recall": 0.9440559440559441, "eval_QUANTITY_f1": 0.6923076923076923, "eval_QUANTITY_number": 23, "eval_QUANTITY_precision": 0.6206896551724138, "eval_QUANTITY_recall": 0.782608695652174, "eval_TIME_f1": 0.7142857142857142, "eval_TIME_number": 26, "eval_TIME_precision": 0.6666666666666666, "eval_TIME_recall": 0.7692307692307693, "eval_loss": 0.1930677443742752, "eval_overall_accuracy": 0.9582186639979985, "eval_overall_f1": 0.8236914600550964, "eval_overall_precision": 0.772609819121447, "eval_overall_recall": 0.8820058997050148, "eval_runtime": 0.9301, "eval_samples_per_second": 201.064, "eval_steps_per_second": 3.226, "step": 7844 }, { "epoch": 75.0, "grad_norm": 1.1448065042495728, "learning_rate": 1.25e-05, "loss": 0.0293, "step": 7950 }, { "epoch": 75.0, "eval_LOCATION_f1": 0.8322147651006712, "eval_LOCATION_number": 72, "eval_LOCATION_precision": 0.8051948051948052, "eval_LOCATION_recall": 0.8611111111111112, "eval_ORGANIZATION_f1": 0.7500000000000001, "eval_ORGANIZATION_number": 75, "eval_ORGANIZATION_precision": 0.7058823529411765, "eval_ORGANIZATION_recall": 0.8, "eval_PERSON_f1": 0.8712871287128713, "eval_PERSON_number": 143, "eval_PERSON_precision": 0.825, "eval_PERSON_recall": 0.9230769230769231, "eval_QUANTITY_f1": 0.6923076923076923, "eval_QUANTITY_number": 23, "eval_QUANTITY_precision": 0.6206896551724138, "eval_QUANTITY_recall": 0.782608695652174, "eval_TIME_f1": 0.7547169811320754, "eval_TIME_number": 26, "eval_TIME_precision": 0.7407407407407407, "eval_TIME_recall": 0.7692307692307693, "eval_loss": 0.1969723254442215, "eval_overall_accuracy": 0.9552164123092319, "eval_overall_f1": 0.8145048814504882, "eval_overall_precision": 0.7724867724867724, "eval_overall_recall": 0.8613569321533924, "eval_runtime": 0.934, "eval_samples_per_second": 200.216, "eval_steps_per_second": 3.212, "step": 7950 }, { "epoch": 76.0, "grad_norm": 0.8883477449417114, "learning_rate": 1.2e-05, "loss": 0.0311, "step": 8056 }, { "epoch": 76.0, "eval_LOCATION_f1": 0.8400000000000001, "eval_LOCATION_number": 72, "eval_LOCATION_precision": 0.8076923076923077, "eval_LOCATION_recall": 0.875, "eval_ORGANIZATION_f1": 0.7530864197530864, "eval_ORGANIZATION_number": 75, "eval_ORGANIZATION_precision": 0.7011494252873564, "eval_ORGANIZATION_recall": 0.8133333333333334, "eval_PERSON_f1": 0.8823529411764706, "eval_PERSON_number": 143, "eval_PERSON_precision": 0.8282208588957055, "eval_PERSON_recall": 0.9440559440559441, "eval_QUANTITY_f1": 0.7058823529411765, "eval_QUANTITY_number": 23, "eval_QUANTITY_precision": 0.6428571428571429, "eval_QUANTITY_recall": 0.782608695652174, "eval_TIME_f1": 0.7777777777777779, "eval_TIME_number": 26, "eval_TIME_precision": 0.75, "eval_TIME_recall": 0.8076923076923077, "eval_loss": 0.18665479123592377, "eval_overall_accuracy": 0.9582186639979985, "eval_overall_f1": 0.8243430152143844, "eval_overall_precision": 0.7760416666666666, "eval_overall_recall": 0.8790560471976401, "eval_runtime": 0.9252, "eval_samples_per_second": 202.11, "eval_steps_per_second": 3.242, "step": 8056 }, { "epoch": 77.0, "grad_norm": 0.35357949137687683, "learning_rate": 1.1500000000000002e-05, "loss": 0.0299, "step": 8162 }, { "epoch": 77.0, "eval_LOCATION_f1": 0.8344370860927153, "eval_LOCATION_number": 72, "eval_LOCATION_precision": 0.7974683544303798, "eval_LOCATION_recall": 0.875, "eval_ORGANIZATION_f1": 0.7530864197530864, "eval_ORGANIZATION_number": 75, "eval_ORGANIZATION_precision": 0.7011494252873564, "eval_ORGANIZATION_recall": 0.8133333333333334, "eval_PERSON_f1": 0.8852459016393444, "eval_PERSON_number": 143, "eval_PERSON_precision": 0.8333333333333334, "eval_PERSON_recall": 0.9440559440559441, "eval_QUANTITY_f1": 0.6923076923076923, "eval_QUANTITY_number": 23, "eval_QUANTITY_precision": 0.6206896551724138, "eval_QUANTITY_recall": 0.782608695652174, "eval_TIME_f1": 0.7142857142857142, "eval_TIME_number": 26, "eval_TIME_precision": 0.6666666666666666, "eval_TIME_recall": 0.7692307692307693, "eval_loss": 0.19146093726158142, "eval_overall_accuracy": 0.9564673505128847, "eval_overall_f1": 0.8181818181818181, "eval_overall_precision": 0.7674418604651163, "eval_overall_recall": 0.8761061946902655, "eval_runtime": 0.9261, "eval_samples_per_second": 201.927, "eval_steps_per_second": 3.239, "step": 8162 }, { "epoch": 78.0, "grad_norm": 0.7683406472206116, "learning_rate": 1.1000000000000001e-05, "loss": 0.03, "step": 8268 }, { "epoch": 78.0, "eval_LOCATION_f1": 0.8219178082191781, "eval_LOCATION_number": 72, "eval_LOCATION_precision": 0.8108108108108109, "eval_LOCATION_recall": 0.8333333333333334, "eval_ORGANIZATION_f1": 0.7354838709677418, "eval_ORGANIZATION_number": 75, "eval_ORGANIZATION_precision": 0.7125, "eval_ORGANIZATION_recall": 0.76, "eval_PERSON_f1": 0.8844884488448846, "eval_PERSON_number": 143, "eval_PERSON_precision": 0.8375, "eval_PERSON_recall": 0.9370629370629371, "eval_QUANTITY_f1": 0.7058823529411765, "eval_QUANTITY_number": 23, "eval_QUANTITY_precision": 0.6428571428571429, "eval_QUANTITY_recall": 0.782608695652174, "eval_TIME_f1": 0.7272727272727274, "eval_TIME_number": 26, "eval_TIME_precision": 0.6896551724137931, "eval_TIME_recall": 0.7692307692307693, "eval_loss": 0.19335182011127472, "eval_overall_accuracy": 0.9569677257943457, "eval_overall_f1": 0.8140845070422535, "eval_overall_precision": 0.7789757412398922, "eval_overall_recall": 0.8525073746312685, "eval_runtime": 0.9288, "eval_samples_per_second": 201.33, "eval_steps_per_second": 3.23, "step": 8268 }, { "epoch": 79.0, "grad_norm": 1.1292208433151245, "learning_rate": 1.05e-05, "loss": 0.0305, "step": 8374 }, { "epoch": 79.0, "eval_LOCATION_f1": 0.816326530612245, "eval_LOCATION_number": 72, "eval_LOCATION_precision": 0.8, "eval_LOCATION_recall": 0.8333333333333334, "eval_ORGANIZATION_f1": 0.7577639751552795, "eval_ORGANIZATION_number": 75, "eval_ORGANIZATION_precision": 0.7093023255813954, "eval_ORGANIZATION_recall": 0.8133333333333334, "eval_PERSON_f1": 0.8874172185430464, "eval_PERSON_number": 143, "eval_PERSON_precision": 0.8427672955974843, "eval_PERSON_recall": 0.9370629370629371, "eval_QUANTITY_f1": 0.6923076923076923, "eval_QUANTITY_number": 23, "eval_QUANTITY_precision": 0.6206896551724138, "eval_QUANTITY_recall": 0.782608695652174, "eval_TIME_f1": 0.7272727272727274, "eval_TIME_number": 26, "eval_TIME_precision": 0.6896551724137931, "eval_TIME_recall": 0.7692307692307693, "eval_loss": 0.1943107694387436, "eval_overall_accuracy": 0.9567175381536153, "eval_overall_f1": 0.8172942817294282, "eval_overall_precision": 0.7751322751322751, "eval_overall_recall": 0.8643067846607669, "eval_runtime": 0.9335, "eval_samples_per_second": 200.331, "eval_steps_per_second": 3.214, "step": 8374 }, { "epoch": 80.0, "grad_norm": 0.6603876948356628, "learning_rate": 1e-05, "loss": 0.0306, "step": 8480 }, { "epoch": 80.0, "eval_LOCATION_f1": 0.8, "eval_LOCATION_number": 72, "eval_LOCATION_precision": 0.7945205479452054, "eval_LOCATION_recall": 0.8055555555555556, "eval_ORGANIZATION_f1": 0.7577639751552795, "eval_ORGANIZATION_number": 75, "eval_ORGANIZATION_precision": 0.7093023255813954, "eval_ORGANIZATION_recall": 0.8133333333333334, "eval_PERSON_f1": 0.8823529411764706, "eval_PERSON_number": 143, "eval_PERSON_precision": 0.8282208588957055, "eval_PERSON_recall": 0.9440559440559441, "eval_QUANTITY_f1": 0.7058823529411765, "eval_QUANTITY_number": 23, "eval_QUANTITY_precision": 0.6428571428571429, "eval_QUANTITY_recall": 0.782608695652174, "eval_TIME_f1": 0.7636363636363636, "eval_TIME_number": 26, "eval_TIME_precision": 0.7241379310344828, "eval_TIME_recall": 0.8076923076923077, "eval_loss": 0.19313213229179382, "eval_overall_accuracy": 0.9574681010758068, "eval_overall_f1": 0.8161559888579387, "eval_overall_precision": 0.7730870712401056, "eval_overall_recall": 0.8643067846607669, "eval_runtime": 0.9289, "eval_samples_per_second": 201.304, "eval_steps_per_second": 3.229, "step": 8480 }, { "epoch": 81.0, "grad_norm": 0.466139554977417, "learning_rate": 9.5e-06, "loss": 0.0286, "step": 8586 }, { "epoch": 81.0, "eval_LOCATION_f1": 0.802721088435374, "eval_LOCATION_number": 72, "eval_LOCATION_precision": 0.7866666666666666, "eval_LOCATION_recall": 0.8194444444444444, "eval_ORGANIZATION_f1": 0.7701863354037267, "eval_ORGANIZATION_number": 75, "eval_ORGANIZATION_precision": 0.7209302325581395, "eval_ORGANIZATION_recall": 0.8266666666666667, "eval_PERSON_f1": 0.8758169934640523, "eval_PERSON_number": 143, "eval_PERSON_precision": 0.8220858895705522, "eval_PERSON_recall": 0.9370629370629371, "eval_QUANTITY_f1": 0.7058823529411765, "eval_QUANTITY_number": 23, "eval_QUANTITY_precision": 0.6428571428571429, "eval_QUANTITY_recall": 0.782608695652174, "eval_TIME_f1": 0.7272727272727274, "eval_TIME_number": 26, "eval_TIME_precision": 0.6896551724137931, "eval_TIME_recall": 0.7692307692307693, "eval_loss": 0.19068394601345062, "eval_overall_accuracy": 0.955716787590693, "eval_overall_f1": 0.8138888888888888, "eval_overall_precision": 0.7690288713910761, "eval_overall_recall": 0.8643067846607669, "eval_runtime": 0.9312, "eval_samples_per_second": 200.826, "eval_steps_per_second": 3.222, "step": 8586 }, { "epoch": 82.0, "grad_norm": 0.6404593586921692, "learning_rate": 9e-06, "loss": 0.0283, "step": 8692 }, { "epoch": 82.0, "eval_LOCATION_f1": 0.8322147651006712, "eval_LOCATION_number": 72, "eval_LOCATION_precision": 0.8051948051948052, "eval_LOCATION_recall": 0.8611111111111112, "eval_ORGANIZATION_f1": 0.7483870967741936, "eval_ORGANIZATION_number": 75, "eval_ORGANIZATION_precision": 0.725, "eval_ORGANIZATION_recall": 0.7733333333333333, "eval_PERSON_f1": 0.8692810457516339, "eval_PERSON_number": 143, "eval_PERSON_precision": 0.8159509202453987, "eval_PERSON_recall": 0.9300699300699301, "eval_QUANTITY_f1": 0.6923076923076923, "eval_QUANTITY_number": 23, "eval_QUANTITY_precision": 0.6206896551724138, "eval_QUANTITY_recall": 0.782608695652174, "eval_TIME_f1": 0.7142857142857142, "eval_TIME_number": 26, "eval_TIME_precision": 0.6666666666666666, "eval_TIME_recall": 0.7692307692307693, "eval_loss": 0.19274306297302246, "eval_overall_accuracy": 0.957968476357268, "eval_overall_f1": 0.8105849582172702, "eval_overall_precision": 0.7678100263852242, "eval_overall_recall": 0.8584070796460177, "eval_runtime": 0.9998, "eval_samples_per_second": 187.045, "eval_steps_per_second": 3.001, "step": 8692 }, { "epoch": 83.0, "grad_norm": 0.17559492588043213, "learning_rate": 8.500000000000002e-06, "loss": 0.0289, "step": 8798 }, { "epoch": 83.0, "eval_LOCATION_f1": 0.8, "eval_LOCATION_number": 72, "eval_LOCATION_precision": 0.7945205479452054, "eval_LOCATION_recall": 0.8055555555555556, "eval_ORGANIZATION_f1": 0.7500000000000001, "eval_ORGANIZATION_number": 75, "eval_ORGANIZATION_precision": 0.7058823529411765, "eval_ORGANIZATION_recall": 0.8, "eval_PERSON_f1": 0.8750000000000001, "eval_PERSON_number": 143, "eval_PERSON_precision": 0.8260869565217391, "eval_PERSON_recall": 0.9300699300699301, "eval_QUANTITY_f1": 0.7058823529411765, "eval_QUANTITY_number": 23, "eval_QUANTITY_precision": 0.6428571428571429, "eval_QUANTITY_recall": 0.782608695652174, "eval_TIME_f1": 0.7272727272727274, "eval_TIME_number": 26, "eval_TIME_precision": 0.6896551724137931, "eval_TIME_recall": 0.7692307692307693, "eval_loss": 0.1927793323993683, "eval_overall_accuracy": 0.9564673505128847, "eval_overall_f1": 0.8083916083916084, "eval_overall_precision": 0.7686170212765957, "eval_overall_recall": 0.8525073746312685, "eval_runtime": 0.9268, "eval_samples_per_second": 201.759, "eval_steps_per_second": 3.237, "step": 8798 }, { "epoch": 84.0, "grad_norm": 1.3301130533218384, "learning_rate": 8.000000000000001e-06, "loss": 0.0289, "step": 8904 }, { "epoch": 84.0, "eval_LOCATION_f1": 0.8082191780821918, "eval_LOCATION_number": 72, "eval_LOCATION_precision": 0.7972972972972973, "eval_LOCATION_recall": 0.8194444444444444, "eval_ORGANIZATION_f1": 0.7530864197530864, "eval_ORGANIZATION_number": 75, "eval_ORGANIZATION_precision": 0.7011494252873564, "eval_ORGANIZATION_recall": 0.8133333333333334, "eval_PERSON_f1": 0.8844884488448846, "eval_PERSON_number": 143, "eval_PERSON_precision": 0.8375, "eval_PERSON_recall": 0.9370629370629371, "eval_QUANTITY_f1": 0.7058823529411765, "eval_QUANTITY_number": 23, "eval_QUANTITY_precision": 0.6428571428571429, "eval_QUANTITY_recall": 0.782608695652174, "eval_TIME_f1": 0.7636363636363636, "eval_TIME_number": 26, "eval_TIME_precision": 0.7241379310344828, "eval_TIME_recall": 0.8076923076923077, "eval_loss": 0.19638177752494812, "eval_overall_accuracy": 0.9572179134350763, "eval_overall_f1": 0.8172942817294282, "eval_overall_precision": 0.7751322751322751, "eval_overall_recall": 0.8643067846607669, "eval_runtime": 0.9332, "eval_samples_per_second": 200.396, "eval_steps_per_second": 3.215, "step": 8904 }, { "epoch": 85.0, "grad_norm": 0.19960090517997742, "learning_rate": 7.5e-06, "loss": 0.0283, "step": 9010 }, { "epoch": 85.0, "eval_LOCATION_f1": 0.8053691275167787, "eval_LOCATION_number": 72, "eval_LOCATION_precision": 0.7792207792207793, "eval_LOCATION_recall": 0.8333333333333334, "eval_ORGANIZATION_f1": 0.7564102564102564, "eval_ORGANIZATION_number": 75, "eval_ORGANIZATION_precision": 0.7283950617283951, "eval_ORGANIZATION_recall": 0.7866666666666666, "eval_PERSON_f1": 0.8823529411764706, "eval_PERSON_number": 143, "eval_PERSON_precision": 0.8282208588957055, "eval_PERSON_recall": 0.9440559440559441, "eval_QUANTITY_f1": 0.6923076923076923, "eval_QUANTITY_number": 23, "eval_QUANTITY_precision": 0.6206896551724138, "eval_QUANTITY_recall": 0.782608695652174, "eval_TIME_f1": 0.7407407407407408, "eval_TIME_number": 26, "eval_TIME_precision": 0.7142857142857143, "eval_TIME_recall": 0.7692307692307693, "eval_loss": 0.19612807035446167, "eval_overall_accuracy": 0.9572179134350763, "eval_overall_f1": 0.8145048814504882, "eval_overall_precision": 0.7724867724867724, "eval_overall_recall": 0.8613569321533924, "eval_runtime": 0.9383, "eval_samples_per_second": 199.303, "eval_steps_per_second": 3.197, "step": 9010 }, { "epoch": 86.0, "grad_norm": 0.7677280306816101, "learning_rate": 7.000000000000001e-06, "loss": 0.0279, "step": 9116 }, { "epoch": 86.0, "eval_LOCATION_f1": 0.7919463087248323, "eval_LOCATION_number": 72, "eval_LOCATION_precision": 0.7662337662337663, "eval_LOCATION_recall": 0.8194444444444444, "eval_ORGANIZATION_f1": 0.7564102564102564, "eval_ORGANIZATION_number": 75, "eval_ORGANIZATION_precision": 0.7283950617283951, "eval_ORGANIZATION_recall": 0.7866666666666666, "eval_PERSON_f1": 0.8786885245901639, "eval_PERSON_number": 143, "eval_PERSON_precision": 0.8271604938271605, "eval_PERSON_recall": 0.9370629370629371, "eval_QUANTITY_f1": 0.6923076923076923, "eval_QUANTITY_number": 23, "eval_QUANTITY_precision": 0.6206896551724138, "eval_QUANTITY_recall": 0.782608695652174, "eval_TIME_f1": 0.7272727272727274, "eval_TIME_number": 26, "eval_TIME_precision": 0.6896551724137931, "eval_TIME_recall": 0.7692307692307693, "eval_loss": 0.20059086382389069, "eval_overall_accuracy": 0.9549662246685013, "eval_overall_f1": 0.8089260808926081, "eval_overall_precision": 0.7671957671957672, "eval_overall_recall": 0.855457227138643, "eval_runtime": 0.9285, "eval_samples_per_second": 201.396, "eval_steps_per_second": 3.231, "step": 9116 }, { "epoch": 87.0, "grad_norm": 0.65785813331604, "learning_rate": 6.5000000000000004e-06, "loss": 0.0288, "step": 9222 }, { "epoch": 87.0, "eval_LOCATION_f1": 0.8053691275167787, "eval_LOCATION_number": 72, "eval_LOCATION_precision": 0.7792207792207793, "eval_LOCATION_recall": 0.8333333333333334, "eval_ORGANIZATION_f1": 0.7701863354037267, "eval_ORGANIZATION_number": 75, "eval_ORGANIZATION_precision": 0.7209302325581395, "eval_ORGANIZATION_recall": 0.8266666666666667, "eval_PERSON_f1": 0.8758169934640523, "eval_PERSON_number": 143, "eval_PERSON_precision": 0.8220858895705522, "eval_PERSON_recall": 0.9370629370629371, "eval_QUANTITY_f1": 0.6923076923076923, "eval_QUANTITY_number": 23, "eval_QUANTITY_precision": 0.6206896551724138, "eval_QUANTITY_recall": 0.782608695652174, "eval_TIME_f1": 0.7407407407407408, "eval_TIME_number": 26, "eval_TIME_precision": 0.7142857142857143, "eval_TIME_recall": 0.7692307692307693, "eval_loss": 0.20255452394485474, "eval_overall_accuracy": 0.9559669752314236, "eval_overall_f1": 0.8144044321329639, "eval_overall_precision": 0.7676240208877284, "eval_overall_recall": 0.8672566371681416, "eval_runtime": 0.9402, "eval_samples_per_second": 198.885, "eval_steps_per_second": 3.191, "step": 9222 }, { "epoch": 88.0, "grad_norm": 1.4090750217437744, "learning_rate": 6e-06, "loss": 0.0275, "step": 9328 }, { "epoch": 88.0, "eval_LOCATION_f1": 0.8026315789473685, "eval_LOCATION_number": 72, "eval_LOCATION_precision": 0.7625, "eval_LOCATION_recall": 0.8472222222222222, "eval_ORGANIZATION_f1": 0.7450980392156863, "eval_ORGANIZATION_number": 75, "eval_ORGANIZATION_precision": 0.7307692307692307, "eval_ORGANIZATION_recall": 0.76, "eval_PERSON_f1": 0.8831168831168831, "eval_PERSON_number": 143, "eval_PERSON_precision": 0.8242424242424242, "eval_PERSON_recall": 0.951048951048951, "eval_QUANTITY_f1": 0.6923076923076923, "eval_QUANTITY_number": 23, "eval_QUANTITY_precision": 0.6206896551724138, "eval_QUANTITY_recall": 0.782608695652174, "eval_TIME_f1": 0.7407407407407408, "eval_TIME_number": 26, "eval_TIME_precision": 0.7142857142857143, "eval_TIME_recall": 0.7692307692307693, "eval_loss": 0.19975264370441437, "eval_overall_accuracy": 0.9569677257943457, "eval_overall_f1": 0.812239221140473, "eval_overall_precision": 0.7684210526315789, "eval_overall_recall": 0.8613569321533924, "eval_runtime": 0.9248, "eval_samples_per_second": 202.217, "eval_steps_per_second": 3.244, "step": 9328 }, { "epoch": 89.0, "grad_norm": 0.6550692319869995, "learning_rate": 5.500000000000001e-06, "loss": 0.0272, "step": 9434 }, { "epoch": 89.0, "eval_LOCATION_f1": 0.8211920529801324, "eval_LOCATION_number": 72, "eval_LOCATION_precision": 0.7848101265822784, "eval_LOCATION_recall": 0.8611111111111112, "eval_ORGANIZATION_f1": 0.7515151515151515, "eval_ORGANIZATION_number": 75, "eval_ORGANIZATION_precision": 0.6888888888888889, "eval_ORGANIZATION_recall": 0.8266666666666667, "eval_PERSON_f1": 0.8794788273615636, "eval_PERSON_number": 143, "eval_PERSON_precision": 0.823170731707317, "eval_PERSON_recall": 0.9440559440559441, "eval_QUANTITY_f1": 0.7058823529411765, "eval_QUANTITY_number": 23, "eval_QUANTITY_precision": 0.6428571428571429, "eval_QUANTITY_recall": 0.782608695652174, "eval_TIME_f1": 0.7407407407407408, "eval_TIME_number": 26, "eval_TIME_precision": 0.7142857142857143, "eval_TIME_recall": 0.7692307692307693, "eval_loss": 0.19843065738677979, "eval_overall_accuracy": 0.9562171628721541, "eval_overall_f1": 0.8159340659340658, "eval_overall_precision": 0.7634961439588689, "eval_overall_recall": 0.8761061946902655, "eval_runtime": 0.9223, "eval_samples_per_second": 202.76, "eval_steps_per_second": 3.253, "step": 9434 }, { "epoch": 90.0, "grad_norm": 1.794690489768982, "learning_rate": 5e-06, "loss": 0.0265, "step": 9540 }, { "epoch": 90.0, "eval_LOCATION_f1": 0.8275862068965517, "eval_LOCATION_number": 72, "eval_LOCATION_precision": 0.821917808219178, "eval_LOCATION_recall": 0.8333333333333334, "eval_ORGANIZATION_f1": 0.7770700636942677, "eval_ORGANIZATION_number": 75, "eval_ORGANIZATION_precision": 0.7439024390243902, "eval_ORGANIZATION_recall": 0.8133333333333334, "eval_PERSON_f1": 0.8823529411764706, "eval_PERSON_number": 143, "eval_PERSON_precision": 0.8282208588957055, "eval_PERSON_recall": 0.9440559440559441, "eval_QUANTITY_f1": 0.6923076923076923, "eval_QUANTITY_number": 23, "eval_QUANTITY_precision": 0.6206896551724138, "eval_QUANTITY_recall": 0.782608695652174, "eval_TIME_f1": 0.7272727272727274, "eval_TIME_number": 26, "eval_TIME_precision": 0.6896551724137931, "eval_TIME_recall": 0.7692307692307693, "eval_loss": 0.20021091401576996, "eval_overall_accuracy": 0.9574681010758068, "eval_overall_f1": 0.8223776223776224, "eval_overall_precision": 0.7819148936170213, "eval_overall_recall": 0.8672566371681416, "eval_runtime": 0.9203, "eval_samples_per_second": 203.198, "eval_steps_per_second": 3.26, "step": 9540 }, { "epoch": 91.0, "grad_norm": 0.0694357305765152, "learning_rate": 4.5e-06, "loss": 0.0258, "step": 9646 }, { "epoch": 91.0, "eval_LOCATION_f1": 0.8187919463087249, "eval_LOCATION_number": 72, "eval_LOCATION_precision": 0.7922077922077922, "eval_LOCATION_recall": 0.8472222222222222, "eval_ORGANIZATION_f1": 0.7547169811320756, "eval_ORGANIZATION_number": 75, "eval_ORGANIZATION_precision": 0.7142857142857143, "eval_ORGANIZATION_recall": 0.8, "eval_PERSON_f1": 0.8729641693811075, "eval_PERSON_number": 143, "eval_PERSON_precision": 0.8170731707317073, "eval_PERSON_recall": 0.9370629370629371, "eval_QUANTITY_f1": 0.6923076923076923, "eval_QUANTITY_number": 23, "eval_QUANTITY_precision": 0.6206896551724138, "eval_QUANTITY_recall": 0.782608695652174, "eval_TIME_f1": 0.7407407407407408, "eval_TIME_number": 26, "eval_TIME_precision": 0.7142857142857143, "eval_TIME_recall": 0.7692307692307693, "eval_loss": 0.1959146112203598, "eval_overall_accuracy": 0.9574681010758068, "eval_overall_f1": 0.812760055478502, "eval_overall_precision": 0.7670157068062827, "eval_overall_recall": 0.8643067846607669, "eval_runtime": 0.9378, "eval_samples_per_second": 199.393, "eval_steps_per_second": 3.199, "step": 9646 }, { "epoch": 92.0, "grad_norm": 0.7855161428451538, "learning_rate": 4.000000000000001e-06, "loss": 0.0256, "step": 9752 }, { "epoch": 92.0, "eval_LOCATION_f1": 0.8344370860927153, "eval_LOCATION_number": 72, "eval_LOCATION_precision": 0.7974683544303798, "eval_LOCATION_recall": 0.875, "eval_ORGANIZATION_f1": 0.7625, "eval_ORGANIZATION_number": 75, "eval_ORGANIZATION_precision": 0.7176470588235294, "eval_ORGANIZATION_recall": 0.8133333333333334, "eval_PERSON_f1": 0.868421052631579, "eval_PERSON_number": 143, "eval_PERSON_precision": 0.8198757763975155, "eval_PERSON_recall": 0.9230769230769231, "eval_QUANTITY_f1": 0.7058823529411765, "eval_QUANTITY_number": 23, "eval_QUANTITY_precision": 0.6428571428571429, "eval_QUANTITY_recall": 0.782608695652174, "eval_TIME_f1": 0.7407407407407408, "eval_TIME_number": 26, "eval_TIME_precision": 0.7142857142857143, "eval_TIME_recall": 0.7692307692307693, "eval_loss": 0.20366288721561432, "eval_overall_accuracy": 0.955716787590693, "eval_overall_f1": 0.8166666666666667, "eval_overall_precision": 0.7716535433070866, "eval_overall_recall": 0.8672566371681416, "eval_runtime": 0.9223, "eval_samples_per_second": 202.758, "eval_steps_per_second": 3.253, "step": 9752 }, { "epoch": 93.0, "grad_norm": 0.923471212387085, "learning_rate": 3.5000000000000004e-06, "loss": 0.026, "step": 9858 }, { "epoch": 93.0, "eval_LOCATION_f1": 0.8211920529801324, "eval_LOCATION_number": 72, "eval_LOCATION_precision": 0.7848101265822784, "eval_LOCATION_recall": 0.8611111111111112, "eval_ORGANIZATION_f1": 0.779874213836478, "eval_ORGANIZATION_number": 75, "eval_ORGANIZATION_precision": 0.7380952380952381, "eval_ORGANIZATION_recall": 0.8266666666666667, "eval_PERSON_f1": 0.8712871287128713, "eval_PERSON_number": 143, "eval_PERSON_precision": 0.825, "eval_PERSON_recall": 0.9230769230769231, "eval_QUANTITY_f1": 0.6923076923076923, "eval_QUANTITY_number": 23, "eval_QUANTITY_precision": 0.6206896551724138, "eval_QUANTITY_recall": 0.782608695652174, "eval_TIME_f1": 0.7272727272727274, "eval_TIME_number": 26, "eval_TIME_precision": 0.6896551724137931, "eval_TIME_recall": 0.7692307692307693, "eval_loss": 0.20790377259254456, "eval_overall_accuracy": 0.9547160370277709, "eval_overall_f1": 0.8166666666666667, "eval_overall_precision": 0.7716535433070866, "eval_overall_recall": 0.8672566371681416, "eval_runtime": 0.9308, "eval_samples_per_second": 200.901, "eval_steps_per_second": 3.223, "step": 9858 }, { "epoch": 94.0, "grad_norm": 0.5129814147949219, "learning_rate": 3e-06, "loss": 0.0269, "step": 9964 }, { "epoch": 94.0, "eval_LOCATION_f1": 0.8211920529801324, "eval_LOCATION_number": 72, "eval_LOCATION_precision": 0.7848101265822784, "eval_LOCATION_recall": 0.8611111111111112, "eval_ORGANIZATION_f1": 0.7672955974842767, "eval_ORGANIZATION_number": 75, "eval_ORGANIZATION_precision": 0.7261904761904762, "eval_ORGANIZATION_recall": 0.8133333333333334, "eval_PERSON_f1": 0.868421052631579, "eval_PERSON_number": 143, "eval_PERSON_precision": 0.8198757763975155, "eval_PERSON_recall": 0.9230769230769231, "eval_QUANTITY_f1": 0.6923076923076923, "eval_QUANTITY_number": 23, "eval_QUANTITY_precision": 0.6206896551724138, "eval_QUANTITY_recall": 0.782608695652174, "eval_TIME_f1": 0.7407407407407408, "eval_TIME_number": 26, "eval_TIME_precision": 0.7142857142857143, "eval_TIME_recall": 0.7692307692307693, "eval_loss": 0.2034631371498108, "eval_overall_accuracy": 0.9552164123092319, "eval_overall_f1": 0.8138888888888888, "eval_overall_precision": 0.7690288713910761, "eval_overall_recall": 0.8643067846607669, "eval_runtime": 0.9303, "eval_samples_per_second": 201.002, "eval_steps_per_second": 3.225, "step": 9964 }, { "epoch": 95.0, "grad_norm": 0.9843897819519043, "learning_rate": 2.5e-06, "loss": 0.0254, "step": 10070 }, { "epoch": 95.0, "eval_LOCATION_f1": 0.8211920529801324, "eval_LOCATION_number": 72, "eval_LOCATION_precision": 0.7848101265822784, "eval_LOCATION_recall": 0.8611111111111112, "eval_ORGANIZATION_f1": 0.7625, "eval_ORGANIZATION_number": 75, "eval_ORGANIZATION_precision": 0.7176470588235294, "eval_ORGANIZATION_recall": 0.8133333333333334, "eval_PERSON_f1": 0.8721311475409836, "eval_PERSON_number": 143, "eval_PERSON_precision": 0.8209876543209876, "eval_PERSON_recall": 0.9300699300699301, "eval_QUANTITY_f1": 0.6923076923076923, "eval_QUANTITY_number": 23, "eval_QUANTITY_precision": 0.6206896551724138, "eval_QUANTITY_recall": 0.782608695652174, "eval_TIME_f1": 0.7407407407407408, "eval_TIME_number": 26, "eval_TIME_precision": 0.7142857142857143, "eval_TIME_recall": 0.7692307692307693, "eval_loss": 0.20722047984600067, "eval_overall_accuracy": 0.9549662246685013, "eval_overall_f1": 0.8144044321329639, "eval_overall_precision": 0.7676240208877284, "eval_overall_recall": 0.8672566371681416, "eval_runtime": 0.9384, "eval_samples_per_second": 199.274, "eval_steps_per_second": 3.197, "step": 10070 }, { "epoch": 96.0, "grad_norm": 0.45156100392341614, "learning_rate": 2.0000000000000003e-06, "loss": 0.0255, "step": 10176 }, { "epoch": 96.0, "eval_LOCATION_f1": 0.8344370860927153, "eval_LOCATION_number": 72, "eval_LOCATION_precision": 0.7974683544303798, "eval_LOCATION_recall": 0.875, "eval_ORGANIZATION_f1": 0.759493670886076, "eval_ORGANIZATION_number": 75, "eval_ORGANIZATION_precision": 0.7228915662650602, "eval_ORGANIZATION_recall": 0.8, "eval_PERSON_f1": 0.868421052631579, "eval_PERSON_number": 143, "eval_PERSON_precision": 0.8198757763975155, "eval_PERSON_recall": 0.9230769230769231, "eval_QUANTITY_f1": 0.6923076923076923, "eval_QUANTITY_number": 23, "eval_QUANTITY_precision": 0.6206896551724138, "eval_QUANTITY_recall": 0.782608695652174, "eval_TIME_f1": 0.7407407407407408, "eval_TIME_number": 26, "eval_TIME_precision": 0.7142857142857143, "eval_TIME_recall": 0.7692307692307693, "eval_loss": 0.20072737336158752, "eval_overall_accuracy": 0.9554665999499625, "eval_overall_f1": 0.8150208623087621, "eval_overall_precision": 0.7710526315789473, "eval_overall_recall": 0.8643067846607669, "eval_runtime": 0.93, "eval_samples_per_second": 201.077, "eval_steps_per_second": 3.226, "step": 10176 }, { "epoch": 97.0, "grad_norm": 0.905977725982666, "learning_rate": 1.5e-06, "loss": 0.0248, "step": 10282 }, { "epoch": 97.0, "eval_LOCATION_f1": 0.8211920529801324, "eval_LOCATION_number": 72, "eval_LOCATION_precision": 0.7848101265822784, "eval_LOCATION_recall": 0.8611111111111112, "eval_ORGANIZATION_f1": 0.7612903225806452, "eval_ORGANIZATION_number": 75, "eval_ORGANIZATION_precision": 0.7375, "eval_ORGANIZATION_recall": 0.7866666666666666, "eval_PERSON_f1": 0.8721311475409836, "eval_PERSON_number": 143, "eval_PERSON_precision": 0.8209876543209876, "eval_PERSON_recall": 0.9300699300699301, "eval_QUANTITY_f1": 0.6923076923076923, "eval_QUANTITY_number": 23, "eval_QUANTITY_precision": 0.6206896551724138, "eval_QUANTITY_recall": 0.782608695652174, "eval_TIME_f1": 0.7407407407407408, "eval_TIME_number": 26, "eval_TIME_precision": 0.7142857142857143, "eval_TIME_recall": 0.7692307692307693, "eval_loss": 0.201884463429451, "eval_overall_accuracy": 0.955716787590693, "eval_overall_f1": 0.8145048814504882, "eval_overall_precision": 0.7724867724867724, "eval_overall_recall": 0.8613569321533924, "eval_runtime": 0.9411, "eval_samples_per_second": 198.713, "eval_steps_per_second": 3.188, "step": 10282 }, { "epoch": 98.0, "grad_norm": 0.701413631439209, "learning_rate": 1.0000000000000002e-06, "loss": 0.0258, "step": 10388 }, { "epoch": 98.0, "eval_LOCATION_f1": 0.8211920529801324, "eval_LOCATION_number": 72, "eval_LOCATION_precision": 0.7848101265822784, "eval_LOCATION_recall": 0.8611111111111112, "eval_ORGANIZATION_f1": 0.759493670886076, "eval_ORGANIZATION_number": 75, "eval_ORGANIZATION_precision": 0.7228915662650602, "eval_ORGANIZATION_recall": 0.8, "eval_PERSON_f1": 0.868421052631579, "eval_PERSON_number": 143, "eval_PERSON_precision": 0.8198757763975155, "eval_PERSON_recall": 0.9230769230769231, "eval_QUANTITY_f1": 0.6923076923076923, "eval_QUANTITY_number": 23, "eval_QUANTITY_precision": 0.6206896551724138, "eval_QUANTITY_recall": 0.782608695652174, "eval_TIME_f1": 0.7407407407407408, "eval_TIME_number": 26, "eval_TIME_precision": 0.7142857142857143, "eval_TIME_recall": 0.7692307692307693, "eval_loss": 0.20242148637771606, "eval_overall_accuracy": 0.9554665999499625, "eval_overall_f1": 0.812239221140473, "eval_overall_precision": 0.7684210526315789, "eval_overall_recall": 0.8613569321533924, "eval_runtime": 0.9222, "eval_samples_per_second": 202.767, "eval_steps_per_second": 3.253, "step": 10388 }, { "epoch": 99.0, "grad_norm": 0.5330938696861267, "learning_rate": 5.000000000000001e-07, "loss": 0.0251, "step": 10494 }, { "epoch": 99.0, "eval_LOCATION_f1": 0.8211920529801324, "eval_LOCATION_number": 72, "eval_LOCATION_precision": 0.7848101265822784, "eval_LOCATION_recall": 0.8611111111111112, "eval_ORGANIZATION_f1": 0.7721518987341773, "eval_ORGANIZATION_number": 75, "eval_ORGANIZATION_precision": 0.7349397590361446, "eval_ORGANIZATION_recall": 0.8133333333333334, "eval_PERSON_f1": 0.8721311475409836, "eval_PERSON_number": 143, "eval_PERSON_precision": 0.8209876543209876, "eval_PERSON_recall": 0.9300699300699301, "eval_QUANTITY_f1": 0.6923076923076923, "eval_QUANTITY_number": 23, "eval_QUANTITY_precision": 0.6206896551724138, "eval_QUANTITY_recall": 0.782608695652174, "eval_TIME_f1": 0.7407407407407408, "eval_TIME_number": 26, "eval_TIME_precision": 0.7142857142857143, "eval_TIME_recall": 0.7692307692307693, "eval_loss": 0.2052735686302185, "eval_overall_accuracy": 0.9559669752314236, "eval_overall_f1": 0.8166666666666667, "eval_overall_precision": 0.7716535433070866, "eval_overall_recall": 0.8672566371681416, "eval_runtime": 0.9322, "eval_samples_per_second": 200.61, "eval_steps_per_second": 3.218, "step": 10494 }, { "epoch": 100.0, "grad_norm": 0.6201446652412415, "learning_rate": 0.0, "loss": 0.0255, "step": 10600 }, { "epoch": 100.0, "eval_LOCATION_f1": 0.8133333333333332, "eval_LOCATION_number": 72, "eval_LOCATION_precision": 0.782051282051282, "eval_LOCATION_recall": 0.8472222222222222, "eval_ORGANIZATION_f1": 0.7643312101910827, "eval_ORGANIZATION_number": 75, "eval_ORGANIZATION_precision": 0.7317073170731707, "eval_ORGANIZATION_recall": 0.8, "eval_PERSON_f1": 0.8721311475409836, "eval_PERSON_number": 143, "eval_PERSON_precision": 0.8209876543209876, "eval_PERSON_recall": 0.9300699300699301, "eval_QUANTITY_f1": 0.6923076923076923, "eval_QUANTITY_number": 23, "eval_QUANTITY_precision": 0.6206896551724138, "eval_QUANTITY_recall": 0.782608695652174, "eval_TIME_f1": 0.7407407407407408, "eval_TIME_number": 26, "eval_TIME_precision": 0.7142857142857143, "eval_TIME_recall": 0.7692307692307693, "eval_loss": 0.20351509749889374, "eval_overall_accuracy": 0.9554665999499625, "eval_overall_f1": 0.8133704735376045, "eval_overall_precision": 0.7704485488126649, "eval_overall_recall": 0.8613569321533924, "eval_runtime": 0.9365, "eval_samples_per_second": 199.684, "eval_steps_per_second": 3.203, "step": 10600 }, { "epoch": 100.0, "step": 10600, "total_flos": 5023623771566022.0, "train_loss": 0.07431833881252217, "train_runtime": 1320.4476, "train_samples_per_second": 127.76, "train_steps_per_second": 8.028 } ], "logging_steps": 500, "max_steps": 10600, "num_input_tokens_seen": 0, "num_train_epochs": 100, "save_steps": 500, "total_flos": 5023623771566022.0, "train_batch_size": 16, "trial_name": null, "trial_params": null }