|
{ |
|
"best_metric": null, |
|
"best_model_checkpoint": null, |
|
"epoch": 100.0, |
|
"eval_steps": 500, |
|
"global_step": 10600, |
|
"is_hyper_param_search": false, |
|
"is_local_process_zero": true, |
|
"is_world_process_zero": true, |
|
"log_history": [ |
|
{ |
|
"epoch": 1.0, |
|
"grad_norm": 1.7605067491531372, |
|
"learning_rate": 4.9500000000000004e-05, |
|
"loss": 0.9861, |
|
"step": 106 |
|
}, |
|
{ |
|
"epoch": 1.0, |
|
"eval_LOCATION_f1": 0.0, |
|
"eval_LOCATION_number": 72, |
|
"eval_LOCATION_precision": 0.0, |
|
"eval_LOCATION_recall": 0.0, |
|
"eval_ORGANIZATION_f1": 0.0, |
|
"eval_ORGANIZATION_number": 75, |
|
"eval_ORGANIZATION_precision": 0.0, |
|
"eval_ORGANIZATION_recall": 0.0, |
|
"eval_PERSON_f1": 0.012820512820512822, |
|
"eval_PERSON_number": 143, |
|
"eval_PERSON_precision": 0.07692307692307693, |
|
"eval_PERSON_recall": 0.006993006993006993, |
|
"eval_QUANTITY_f1": 0.0, |
|
"eval_QUANTITY_number": 23, |
|
"eval_QUANTITY_precision": 0.0, |
|
"eval_QUANTITY_recall": 0.0, |
|
"eval_TIME_f1": 0.0, |
|
"eval_TIME_number": 26, |
|
"eval_TIME_precision": 0.0, |
|
"eval_TIME_recall": 0.0, |
|
"eval_loss": 0.5554673075675964, |
|
"eval_overall_accuracy": 0.8468851638729047, |
|
"eval_overall_f1": 0.0055248618784530384, |
|
"eval_overall_precision": 0.043478260869565216, |
|
"eval_overall_recall": 0.0029498525073746312, |
|
"eval_runtime": 0.9128, |
|
"eval_samples_per_second": 204.873, |
|
"eval_steps_per_second": 3.287, |
|
"step": 106 |
|
}, |
|
{ |
|
"epoch": 2.0, |
|
"grad_norm": 1.7613551616668701, |
|
"learning_rate": 4.9e-05, |
|
"loss": 0.5078, |
|
"step": 212 |
|
}, |
|
{ |
|
"epoch": 2.0, |
|
"eval_LOCATION_f1": 0.2150537634408602, |
|
"eval_LOCATION_number": 72, |
|
"eval_LOCATION_precision": 0.47619047619047616, |
|
"eval_LOCATION_recall": 0.1388888888888889, |
|
"eval_ORGANIZATION_f1": 0.019417475728155338, |
|
"eval_ORGANIZATION_number": 75, |
|
"eval_ORGANIZATION_precision": 0.03571428571428571, |
|
"eval_ORGANIZATION_recall": 0.013333333333333334, |
|
"eval_PERSON_f1": 0.6392961876832844, |
|
"eval_PERSON_number": 143, |
|
"eval_PERSON_precision": 0.5505050505050505, |
|
"eval_PERSON_recall": 0.7622377622377622, |
|
"eval_QUANTITY_f1": 0.0, |
|
"eval_QUANTITY_number": 23, |
|
"eval_QUANTITY_precision": 0.0, |
|
"eval_QUANTITY_recall": 0.0, |
|
"eval_TIME_f1": 0.6206896551724138, |
|
"eval_TIME_number": 26, |
|
"eval_TIME_precision": 0.5625, |
|
"eval_TIME_recall": 0.6923076923076923, |
|
"eval_loss": 0.3412609398365021, |
|
"eval_overall_accuracy": 0.8961721290968226, |
|
"eval_overall_f1": 0.43740095087163233, |
|
"eval_overall_precision": 0.4726027397260274, |
|
"eval_overall_recall": 0.40707964601769914, |
|
"eval_runtime": 0.9577, |
|
"eval_samples_per_second": 195.257, |
|
"eval_steps_per_second": 3.132, |
|
"step": 212 |
|
}, |
|
{ |
|
"epoch": 3.0, |
|
"grad_norm": 1.2087492942810059, |
|
"learning_rate": 4.85e-05, |
|
"loss": 0.3115, |
|
"step": 318 |
|
}, |
|
{ |
|
"epoch": 3.0, |
|
"eval_LOCATION_f1": 0.5696969696969698, |
|
"eval_LOCATION_number": 72, |
|
"eval_LOCATION_precision": 0.5053763440860215, |
|
"eval_LOCATION_recall": 0.6527777777777778, |
|
"eval_ORGANIZATION_f1": 0.5125628140703519, |
|
"eval_ORGANIZATION_number": 75, |
|
"eval_ORGANIZATION_precision": 0.4112903225806452, |
|
"eval_ORGANIZATION_recall": 0.68, |
|
"eval_PERSON_f1": 0.8231511254019294, |
|
"eval_PERSON_number": 143, |
|
"eval_PERSON_precision": 0.7619047619047619, |
|
"eval_PERSON_recall": 0.8951048951048951, |
|
"eval_QUANTITY_f1": 0.4590163934426229, |
|
"eval_QUANTITY_number": 23, |
|
"eval_QUANTITY_precision": 0.3684210526315789, |
|
"eval_QUANTITY_recall": 0.6086956521739131, |
|
"eval_TIME_f1": 0.7777777777777779, |
|
"eval_TIME_number": 26, |
|
"eval_TIME_precision": 0.75, |
|
"eval_TIME_recall": 0.8076923076923077, |
|
"eval_loss": 0.22766432166099548, |
|
"eval_overall_accuracy": 0.9256942707030272, |
|
"eval_overall_f1": 0.6607594936708862, |
|
"eval_overall_precision": 0.5787139689578714, |
|
"eval_overall_recall": 0.7699115044247787, |
|
"eval_runtime": 0.9809, |
|
"eval_samples_per_second": 190.638, |
|
"eval_steps_per_second": 3.058, |
|
"step": 318 |
|
}, |
|
{ |
|
"epoch": 4.0, |
|
"grad_norm": 0.9383460283279419, |
|
"learning_rate": 4.8e-05, |
|
"loss": 0.2203, |
|
"step": 424 |
|
}, |
|
{ |
|
"epoch": 4.0, |
|
"eval_LOCATION_f1": 0.6993865030674847, |
|
"eval_LOCATION_number": 72, |
|
"eval_LOCATION_precision": 0.6263736263736264, |
|
"eval_LOCATION_recall": 0.7916666666666666, |
|
"eval_ORGANIZATION_f1": 0.6162790697674418, |
|
"eval_ORGANIZATION_number": 75, |
|
"eval_ORGANIZATION_precision": 0.5463917525773195, |
|
"eval_ORGANIZATION_recall": 0.7066666666666667, |
|
"eval_PERSON_f1": 0.8498402555910544, |
|
"eval_PERSON_number": 143, |
|
"eval_PERSON_precision": 0.7823529411764706, |
|
"eval_PERSON_recall": 0.9300699300699301, |
|
"eval_QUANTITY_f1": 0.410958904109589, |
|
"eval_QUANTITY_number": 23, |
|
"eval_QUANTITY_precision": 0.3, |
|
"eval_QUANTITY_recall": 0.6521739130434783, |
|
"eval_TIME_f1": 0.7419354838709676, |
|
"eval_TIME_number": 26, |
|
"eval_TIME_precision": 0.6388888888888888, |
|
"eval_TIME_recall": 0.8846153846153846, |
|
"eval_loss": 0.21552342176437378, |
|
"eval_overall_accuracy": 0.9316987740805605, |
|
"eval_overall_f1": 0.7177522349936143, |
|
"eval_overall_precision": 0.6328828828828829, |
|
"eval_overall_recall": 0.8289085545722714, |
|
"eval_runtime": 0.9352, |
|
"eval_samples_per_second": 199.955, |
|
"eval_steps_per_second": 3.208, |
|
"step": 424 |
|
}, |
|
{ |
|
"epoch": 5.0, |
|
"grad_norm": 2.1988296508789062, |
|
"learning_rate": 4.75e-05, |
|
"loss": 0.1816, |
|
"step": 530 |
|
}, |
|
{ |
|
"epoch": 5.0, |
|
"eval_LOCATION_f1": 0.7516778523489932, |
|
"eval_LOCATION_number": 72, |
|
"eval_LOCATION_precision": 0.7272727272727273, |
|
"eval_LOCATION_recall": 0.7777777777777778, |
|
"eval_ORGANIZATION_f1": 0.6553672316384181, |
|
"eval_ORGANIZATION_number": 75, |
|
"eval_ORGANIZATION_precision": 0.5686274509803921, |
|
"eval_ORGANIZATION_recall": 0.7733333333333333, |
|
"eval_PERSON_f1": 0.8794788273615636, |
|
"eval_PERSON_number": 143, |
|
"eval_PERSON_precision": 0.823170731707317, |
|
"eval_PERSON_recall": 0.9440559440559441, |
|
"eval_QUANTITY_f1": 0.7142857142857143, |
|
"eval_QUANTITY_number": 23, |
|
"eval_QUANTITY_precision": 0.6060606060606061, |
|
"eval_QUANTITY_recall": 0.8695652173913043, |
|
"eval_TIME_f1": 0.9230769230769231, |
|
"eval_TIME_number": 26, |
|
"eval_TIME_precision": 0.9230769230769231, |
|
"eval_TIME_recall": 0.9230769230769231, |
|
"eval_loss": 0.15413647890090942, |
|
"eval_overall_accuracy": 0.9489617212909682, |
|
"eval_overall_f1": 0.7908232118758435, |
|
"eval_overall_precision": 0.7288557213930348, |
|
"eval_overall_recall": 0.8643067846607669, |
|
"eval_runtime": 0.9063, |
|
"eval_samples_per_second": 206.339, |
|
"eval_steps_per_second": 3.31, |
|
"step": 530 |
|
}, |
|
{ |
|
"epoch": 6.0, |
|
"grad_norm": 0.9543836116790771, |
|
"learning_rate": 4.7e-05, |
|
"loss": 0.1655, |
|
"step": 636 |
|
}, |
|
{ |
|
"epoch": 6.0, |
|
"eval_LOCATION_f1": 0.7317073170731708, |
|
"eval_LOCATION_number": 72, |
|
"eval_LOCATION_precision": 0.6521739130434783, |
|
"eval_LOCATION_recall": 0.8333333333333334, |
|
"eval_ORGANIZATION_f1": 0.7078651685393258, |
|
"eval_ORGANIZATION_number": 75, |
|
"eval_ORGANIZATION_precision": 0.6116504854368932, |
|
"eval_ORGANIZATION_recall": 0.84, |
|
"eval_PERSON_f1": 0.8918032786885245, |
|
"eval_PERSON_number": 143, |
|
"eval_PERSON_precision": 0.8395061728395061, |
|
"eval_PERSON_recall": 0.951048951048951, |
|
"eval_QUANTITY_f1": 0.6909090909090908, |
|
"eval_QUANTITY_number": 23, |
|
"eval_QUANTITY_precision": 0.59375, |
|
"eval_QUANTITY_recall": 0.8260869565217391, |
|
"eval_TIME_f1": 0.7241379310344829, |
|
"eval_TIME_number": 26, |
|
"eval_TIME_precision": 0.65625, |
|
"eval_TIME_recall": 0.8076923076923077, |
|
"eval_loss": 0.15523788332939148, |
|
"eval_overall_accuracy": 0.9504628471353516, |
|
"eval_overall_f1": 0.7868421052631579, |
|
"eval_overall_precision": 0.7102137767220903, |
|
"eval_overall_recall": 0.8820058997050148, |
|
"eval_runtime": 0.9116, |
|
"eval_samples_per_second": 205.138, |
|
"eval_steps_per_second": 3.291, |
|
"step": 636 |
|
}, |
|
{ |
|
"epoch": 7.0, |
|
"grad_norm": 0.4434598982334137, |
|
"learning_rate": 4.6500000000000005e-05, |
|
"loss": 0.1513, |
|
"step": 742 |
|
}, |
|
{ |
|
"epoch": 7.0, |
|
"eval_LOCATION_f1": 0.7631578947368423, |
|
"eval_LOCATION_number": 72, |
|
"eval_LOCATION_precision": 0.725, |
|
"eval_LOCATION_recall": 0.8055555555555556, |
|
"eval_ORGANIZATION_f1": 0.7111111111111111, |
|
"eval_ORGANIZATION_number": 75, |
|
"eval_ORGANIZATION_precision": 0.6095238095238096, |
|
"eval_ORGANIZATION_recall": 0.8533333333333334, |
|
"eval_PERSON_f1": 0.8758169934640523, |
|
"eval_PERSON_number": 143, |
|
"eval_PERSON_precision": 0.8220858895705522, |
|
"eval_PERSON_recall": 0.9370629370629371, |
|
"eval_QUANTITY_f1": 0.7017543859649124, |
|
"eval_QUANTITY_number": 23, |
|
"eval_QUANTITY_precision": 0.5882352941176471, |
|
"eval_QUANTITY_recall": 0.8695652173913043, |
|
"eval_TIME_f1": 0.7142857142857142, |
|
"eval_TIME_number": 26, |
|
"eval_TIME_precision": 0.6666666666666666, |
|
"eval_TIME_recall": 0.7692307692307693, |
|
"eval_loss": 0.14643213152885437, |
|
"eval_overall_accuracy": 0.952964723542657, |
|
"eval_overall_f1": 0.7882822902796273, |
|
"eval_overall_precision": 0.7184466019417476, |
|
"eval_overall_recall": 0.8731563421828908, |
|
"eval_runtime": 0.9227, |
|
"eval_samples_per_second": 202.669, |
|
"eval_steps_per_second": 3.251, |
|
"step": 742 |
|
}, |
|
{ |
|
"epoch": 8.0, |
|
"grad_norm": 0.7223401069641113, |
|
"learning_rate": 4.600000000000001e-05, |
|
"loss": 0.1403, |
|
"step": 848 |
|
}, |
|
{ |
|
"epoch": 8.0, |
|
"eval_LOCATION_f1": 0.7549668874172185, |
|
"eval_LOCATION_number": 72, |
|
"eval_LOCATION_precision": 0.7215189873417721, |
|
"eval_LOCATION_recall": 0.7916666666666666, |
|
"eval_ORGANIZATION_f1": 0.7093023255813953, |
|
"eval_ORGANIZATION_number": 75, |
|
"eval_ORGANIZATION_precision": 0.6288659793814433, |
|
"eval_ORGANIZATION_recall": 0.8133333333333334, |
|
"eval_PERSON_f1": 0.8829431438127091, |
|
"eval_PERSON_number": 143, |
|
"eval_PERSON_precision": 0.8461538461538461, |
|
"eval_PERSON_recall": 0.9230769230769231, |
|
"eval_QUANTITY_f1": 0.7272727272727273, |
|
"eval_QUANTITY_number": 23, |
|
"eval_QUANTITY_precision": 0.625, |
|
"eval_QUANTITY_recall": 0.8695652173913043, |
|
"eval_TIME_f1": 0.6779661016949152, |
|
"eval_TIME_number": 26, |
|
"eval_TIME_precision": 0.6060606060606061, |
|
"eval_TIME_recall": 0.7692307692307693, |
|
"eval_loss": 0.14050298929214478, |
|
"eval_overall_accuracy": 0.9542156617463098, |
|
"eval_overall_f1": 0.7880434782608694, |
|
"eval_overall_precision": 0.7304785894206549, |
|
"eval_overall_recall": 0.855457227138643, |
|
"eval_runtime": 0.9407, |
|
"eval_samples_per_second": 198.786, |
|
"eval_steps_per_second": 3.189, |
|
"step": 848 |
|
}, |
|
{ |
|
"epoch": 9.0, |
|
"grad_norm": 1.0728905200958252, |
|
"learning_rate": 4.55e-05, |
|
"loss": 0.138, |
|
"step": 954 |
|
}, |
|
{ |
|
"epoch": 9.0, |
|
"eval_LOCATION_f1": 0.8079470198675496, |
|
"eval_LOCATION_number": 72, |
|
"eval_LOCATION_precision": 0.7721518987341772, |
|
"eval_LOCATION_recall": 0.8472222222222222, |
|
"eval_ORGANIZATION_f1": 0.711864406779661, |
|
"eval_ORGANIZATION_number": 75, |
|
"eval_ORGANIZATION_precision": 0.6176470588235294, |
|
"eval_ORGANIZATION_recall": 0.84, |
|
"eval_PERSON_f1": 0.9066666666666667, |
|
"eval_PERSON_number": 143, |
|
"eval_PERSON_precision": 0.8662420382165605, |
|
"eval_PERSON_recall": 0.951048951048951, |
|
"eval_QUANTITY_f1": 0.7169811320754716, |
|
"eval_QUANTITY_number": 23, |
|
"eval_QUANTITY_precision": 0.6333333333333333, |
|
"eval_QUANTITY_recall": 0.8260869565217391, |
|
"eval_TIME_f1": 0.75, |
|
"eval_TIME_number": 26, |
|
"eval_TIME_precision": 0.7, |
|
"eval_TIME_recall": 0.8076923076923077, |
|
"eval_loss": 0.14766837656497955, |
|
"eval_overall_accuracy": 0.9527145359019265, |
|
"eval_overall_f1": 0.814111261872456, |
|
"eval_overall_precision": 0.7537688442211056, |
|
"eval_overall_recall": 0.8849557522123894, |
|
"eval_runtime": 0.9393, |
|
"eval_samples_per_second": 199.079, |
|
"eval_steps_per_second": 3.194, |
|
"step": 954 |
|
}, |
|
{ |
|
"epoch": 10.0, |
|
"grad_norm": 2.3210840225219727, |
|
"learning_rate": 4.5e-05, |
|
"loss": 0.1301, |
|
"step": 1060 |
|
}, |
|
{ |
|
"epoch": 10.0, |
|
"eval_LOCATION_f1": 0.8, |
|
"eval_LOCATION_number": 72, |
|
"eval_LOCATION_precision": 0.7692307692307693, |
|
"eval_LOCATION_recall": 0.8333333333333334, |
|
"eval_ORGANIZATION_f1": 0.7349397590361445, |
|
"eval_ORGANIZATION_number": 75, |
|
"eval_ORGANIZATION_precision": 0.6703296703296703, |
|
"eval_ORGANIZATION_recall": 0.8133333333333334, |
|
"eval_PERSON_f1": 0.8940397350993377, |
|
"eval_PERSON_number": 143, |
|
"eval_PERSON_precision": 0.8490566037735849, |
|
"eval_PERSON_recall": 0.9440559440559441, |
|
"eval_QUANTITY_f1": 0.6666666666666667, |
|
"eval_QUANTITY_number": 23, |
|
"eval_QUANTITY_precision": 0.5588235294117647, |
|
"eval_QUANTITY_recall": 0.8260869565217391, |
|
"eval_TIME_f1": 0.75, |
|
"eval_TIME_number": 26, |
|
"eval_TIME_precision": 0.7, |
|
"eval_TIME_recall": 0.8076923076923077, |
|
"eval_loss": 0.13562895357608795, |
|
"eval_overall_accuracy": 0.9564673505128847, |
|
"eval_overall_f1": 0.8098495212038302, |
|
"eval_overall_precision": 0.7551020408163265, |
|
"eval_overall_recall": 0.8731563421828908, |
|
"eval_runtime": 0.9309, |
|
"eval_samples_per_second": 200.881, |
|
"eval_steps_per_second": 3.223, |
|
"step": 1060 |
|
}, |
|
{ |
|
"epoch": 11.0, |
|
"grad_norm": 0.8354237675666809, |
|
"learning_rate": 4.4500000000000004e-05, |
|
"loss": 0.12, |
|
"step": 1166 |
|
}, |
|
{ |
|
"epoch": 11.0, |
|
"eval_LOCATION_f1": 0.7733333333333334, |
|
"eval_LOCATION_number": 72, |
|
"eval_LOCATION_precision": 0.7435897435897436, |
|
"eval_LOCATION_recall": 0.8055555555555556, |
|
"eval_ORGANIZATION_f1": 0.7682926829268292, |
|
"eval_ORGANIZATION_number": 75, |
|
"eval_ORGANIZATION_precision": 0.7078651685393258, |
|
"eval_ORGANIZATION_recall": 0.84, |
|
"eval_PERSON_f1": 0.8926174496644295, |
|
"eval_PERSON_number": 143, |
|
"eval_PERSON_precision": 0.8580645161290322, |
|
"eval_PERSON_recall": 0.9300699300699301, |
|
"eval_QUANTITY_f1": 0.7037037037037037, |
|
"eval_QUANTITY_number": 23, |
|
"eval_QUANTITY_precision": 0.6129032258064516, |
|
"eval_QUANTITY_recall": 0.8260869565217391, |
|
"eval_TIME_f1": 0.7636363636363636, |
|
"eval_TIME_number": 26, |
|
"eval_TIME_precision": 0.7241379310344828, |
|
"eval_TIME_recall": 0.8076923076923077, |
|
"eval_loss": 0.12984243035316467, |
|
"eval_overall_accuracy": 0.9587190392794596, |
|
"eval_overall_f1": 0.8155339805825244, |
|
"eval_overall_precision": 0.7696335078534031, |
|
"eval_overall_recall": 0.8672566371681416, |
|
"eval_runtime": 0.9242, |
|
"eval_samples_per_second": 202.333, |
|
"eval_steps_per_second": 3.246, |
|
"step": 1166 |
|
}, |
|
{ |
|
"epoch": 12.0, |
|
"grad_norm": 2.3830783367156982, |
|
"learning_rate": 4.4000000000000006e-05, |
|
"loss": 0.1171, |
|
"step": 1272 |
|
}, |
|
{ |
|
"epoch": 12.0, |
|
"eval_LOCATION_f1": 0.7945205479452055, |
|
"eval_LOCATION_number": 72, |
|
"eval_LOCATION_precision": 0.7837837837837838, |
|
"eval_LOCATION_recall": 0.8055555555555556, |
|
"eval_ORGANIZATION_f1": 0.7195121951219511, |
|
"eval_ORGANIZATION_number": 75, |
|
"eval_ORGANIZATION_precision": 0.6629213483146067, |
|
"eval_ORGANIZATION_recall": 0.7866666666666666, |
|
"eval_PERSON_f1": 0.8844884488448846, |
|
"eval_PERSON_number": 143, |
|
"eval_PERSON_precision": 0.8375, |
|
"eval_PERSON_recall": 0.9370629370629371, |
|
"eval_QUANTITY_f1": 0.6428571428571429, |
|
"eval_QUANTITY_number": 23, |
|
"eval_QUANTITY_precision": 0.5454545454545454, |
|
"eval_QUANTITY_recall": 0.782608695652174, |
|
"eval_TIME_f1": 0.8461538461538461, |
|
"eval_TIME_number": 26, |
|
"eval_TIME_precision": 0.8461538461538461, |
|
"eval_TIME_recall": 0.8461538461538461, |
|
"eval_loss": 0.13061821460723877, |
|
"eval_overall_accuracy": 0.9574681010758068, |
|
"eval_overall_f1": 0.8072122052704578, |
|
"eval_overall_precision": 0.7617801047120419, |
|
"eval_overall_recall": 0.8584070796460177, |
|
"eval_runtime": 0.9196, |
|
"eval_samples_per_second": 203.355, |
|
"eval_steps_per_second": 3.262, |
|
"step": 1272 |
|
}, |
|
{ |
|
"epoch": 13.0, |
|
"grad_norm": 0.5705311894416809, |
|
"learning_rate": 4.35e-05, |
|
"loss": 0.1129, |
|
"step": 1378 |
|
}, |
|
{ |
|
"epoch": 13.0, |
|
"eval_LOCATION_f1": 0.781456953642384, |
|
"eval_LOCATION_number": 72, |
|
"eval_LOCATION_precision": 0.7468354430379747, |
|
"eval_LOCATION_recall": 0.8194444444444444, |
|
"eval_ORGANIZATION_f1": 0.7597765363128492, |
|
"eval_ORGANIZATION_number": 75, |
|
"eval_ORGANIZATION_precision": 0.6538461538461539, |
|
"eval_ORGANIZATION_recall": 0.9066666666666666, |
|
"eval_PERSON_f1": 0.8940397350993377, |
|
"eval_PERSON_number": 143, |
|
"eval_PERSON_precision": 0.8490566037735849, |
|
"eval_PERSON_recall": 0.9440559440559441, |
|
"eval_QUANTITY_f1": 0.7142857142857143, |
|
"eval_QUANTITY_number": 23, |
|
"eval_QUANTITY_precision": 0.6060606060606061, |
|
"eval_QUANTITY_recall": 0.8695652173913043, |
|
"eval_TIME_f1": 0.7857142857142856, |
|
"eval_TIME_number": 26, |
|
"eval_TIME_precision": 0.7333333333333333, |
|
"eval_TIME_recall": 0.8461538461538461, |
|
"eval_loss": 0.13694216310977936, |
|
"eval_overall_accuracy": 0.9564673505128847, |
|
"eval_overall_f1": 0.8172043010752689, |
|
"eval_overall_precision": 0.7506172839506173, |
|
"eval_overall_recall": 0.8967551622418879, |
|
"eval_runtime": 0.9213, |
|
"eval_samples_per_second": 202.983, |
|
"eval_steps_per_second": 3.256, |
|
"step": 1378 |
|
}, |
|
{ |
|
"epoch": 14.0, |
|
"grad_norm": 1.2299761772155762, |
|
"learning_rate": 4.3e-05, |
|
"loss": 0.1076, |
|
"step": 1484 |
|
}, |
|
{ |
|
"epoch": 14.0, |
|
"eval_LOCATION_f1": 0.7919463087248323, |
|
"eval_LOCATION_number": 72, |
|
"eval_LOCATION_precision": 0.7662337662337663, |
|
"eval_LOCATION_recall": 0.8194444444444444, |
|
"eval_ORGANIZATION_f1": 0.7613636363636365, |
|
"eval_ORGANIZATION_number": 75, |
|
"eval_ORGANIZATION_precision": 0.6633663366336634, |
|
"eval_ORGANIZATION_recall": 0.8933333333333333, |
|
"eval_PERSON_f1": 0.8910891089108911, |
|
"eval_PERSON_number": 143, |
|
"eval_PERSON_precision": 0.84375, |
|
"eval_PERSON_recall": 0.9440559440559441, |
|
"eval_QUANTITY_f1": 0.6206896551724138, |
|
"eval_QUANTITY_number": 23, |
|
"eval_QUANTITY_precision": 0.5142857142857142, |
|
"eval_QUANTITY_recall": 0.782608695652174, |
|
"eval_TIME_f1": 0.7241379310344829, |
|
"eval_TIME_number": 26, |
|
"eval_TIME_precision": 0.65625, |
|
"eval_TIME_recall": 0.8076923076923077, |
|
"eval_loss": 0.1426171064376831, |
|
"eval_overall_accuracy": 0.9524643482611959, |
|
"eval_overall_f1": 0.8064516129032259, |
|
"eval_overall_precision": 0.7407407407407407, |
|
"eval_overall_recall": 0.8849557522123894, |
|
"eval_runtime": 0.9372, |
|
"eval_samples_per_second": 199.528, |
|
"eval_steps_per_second": 3.201, |
|
"step": 1484 |
|
}, |
|
{ |
|
"epoch": 15.0, |
|
"grad_norm": 0.628875732421875, |
|
"learning_rate": 4.25e-05, |
|
"loss": 0.1056, |
|
"step": 1590 |
|
}, |
|
{ |
|
"epoch": 15.0, |
|
"eval_LOCATION_f1": 0.8082191780821918, |
|
"eval_LOCATION_number": 72, |
|
"eval_LOCATION_precision": 0.7972972972972973, |
|
"eval_LOCATION_recall": 0.8194444444444444, |
|
"eval_ORGANIZATION_f1": 0.7674418604651163, |
|
"eval_ORGANIZATION_number": 75, |
|
"eval_ORGANIZATION_precision": 0.6804123711340206, |
|
"eval_ORGANIZATION_recall": 0.88, |
|
"eval_PERSON_f1": 0.8859060402684563, |
|
"eval_PERSON_number": 143, |
|
"eval_PERSON_precision": 0.8516129032258064, |
|
"eval_PERSON_recall": 0.9230769230769231, |
|
"eval_QUANTITY_f1": 0.6181818181818182, |
|
"eval_QUANTITY_number": 23, |
|
"eval_QUANTITY_precision": 0.53125, |
|
"eval_QUANTITY_recall": 0.7391304347826086, |
|
"eval_TIME_f1": 0.8214285714285715, |
|
"eval_TIME_number": 26, |
|
"eval_TIME_precision": 0.7666666666666667, |
|
"eval_TIME_recall": 0.8846153846153846, |
|
"eval_loss": 0.1336900293827057, |
|
"eval_overall_accuracy": 0.9569677257943457, |
|
"eval_overall_f1": 0.8170563961485556, |
|
"eval_overall_precision": 0.7654639175257731, |
|
"eval_overall_recall": 0.8761061946902655, |
|
"eval_runtime": 0.9357, |
|
"eval_samples_per_second": 199.851, |
|
"eval_steps_per_second": 3.206, |
|
"step": 1590 |
|
}, |
|
{ |
|
"epoch": 16.0, |
|
"grad_norm": 0.9760724902153015, |
|
"learning_rate": 4.2e-05, |
|
"loss": 0.1003, |
|
"step": 1696 |
|
}, |
|
{ |
|
"epoch": 16.0, |
|
"eval_LOCATION_f1": 0.8133333333333332, |
|
"eval_LOCATION_number": 72, |
|
"eval_LOCATION_precision": 0.782051282051282, |
|
"eval_LOCATION_recall": 0.8472222222222222, |
|
"eval_ORGANIZATION_f1": 0.7657142857142857, |
|
"eval_ORGANIZATION_number": 75, |
|
"eval_ORGANIZATION_precision": 0.67, |
|
"eval_ORGANIZATION_recall": 0.8933333333333333, |
|
"eval_PERSON_f1": 0.8963210702341137, |
|
"eval_PERSON_number": 143, |
|
"eval_PERSON_precision": 0.8589743589743589, |
|
"eval_PERSON_recall": 0.9370629370629371, |
|
"eval_QUANTITY_f1": 0.6785714285714286, |
|
"eval_QUANTITY_number": 23, |
|
"eval_QUANTITY_precision": 0.5757575757575758, |
|
"eval_QUANTITY_recall": 0.8260869565217391, |
|
"eval_TIME_f1": 0.75, |
|
"eval_TIME_number": 26, |
|
"eval_TIME_precision": 0.7, |
|
"eval_TIME_recall": 0.8076923076923077, |
|
"eval_loss": 0.145399808883667, |
|
"eval_overall_accuracy": 0.9574681010758068, |
|
"eval_overall_f1": 0.8206521739130435, |
|
"eval_overall_precision": 0.760705289672544, |
|
"eval_overall_recall": 0.8908554572271387, |
|
"eval_runtime": 0.9425, |
|
"eval_samples_per_second": 198.413, |
|
"eval_steps_per_second": 3.183, |
|
"step": 1696 |
|
}, |
|
{ |
|
"epoch": 17.0, |
|
"grad_norm": 0.18460078537464142, |
|
"learning_rate": 4.15e-05, |
|
"loss": 0.0997, |
|
"step": 1802 |
|
}, |
|
{ |
|
"epoch": 17.0, |
|
"eval_LOCATION_f1": 0.8, |
|
"eval_LOCATION_number": 72, |
|
"eval_LOCATION_precision": 0.7692307692307693, |
|
"eval_LOCATION_recall": 0.8333333333333334, |
|
"eval_ORGANIZATION_f1": 0.7602339181286549, |
|
"eval_ORGANIZATION_number": 75, |
|
"eval_ORGANIZATION_precision": 0.6770833333333334, |
|
"eval_ORGANIZATION_recall": 0.8666666666666667, |
|
"eval_PERSON_f1": 0.8851351351351351, |
|
"eval_PERSON_number": 143, |
|
"eval_PERSON_precision": 0.8562091503267973, |
|
"eval_PERSON_recall": 0.916083916083916, |
|
"eval_QUANTITY_f1": 0.6428571428571429, |
|
"eval_QUANTITY_number": 23, |
|
"eval_QUANTITY_precision": 0.5454545454545454, |
|
"eval_QUANTITY_recall": 0.782608695652174, |
|
"eval_TIME_f1": 0.7272727272727274, |
|
"eval_TIME_number": 26, |
|
"eval_TIME_precision": 0.6896551724137931, |
|
"eval_TIME_recall": 0.7692307692307693, |
|
"eval_loss": 0.1395619809627533, |
|
"eval_overall_accuracy": 0.955716787590693, |
|
"eval_overall_f1": 0.8076923076923076, |
|
"eval_overall_precision": 0.7557840616966581, |
|
"eval_overall_recall": 0.8672566371681416, |
|
"eval_runtime": 0.923, |
|
"eval_samples_per_second": 202.596, |
|
"eval_steps_per_second": 3.25, |
|
"step": 1802 |
|
}, |
|
{ |
|
"epoch": 18.0, |
|
"grad_norm": 0.43792226910591125, |
|
"learning_rate": 4.1e-05, |
|
"loss": 0.0956, |
|
"step": 1908 |
|
}, |
|
{ |
|
"epoch": 18.0, |
|
"eval_LOCATION_f1": 0.8169014084507044, |
|
"eval_LOCATION_number": 72, |
|
"eval_LOCATION_precision": 0.8285714285714286, |
|
"eval_LOCATION_recall": 0.8055555555555556, |
|
"eval_ORGANIZATION_f1": 0.726190476190476, |
|
"eval_ORGANIZATION_number": 75, |
|
"eval_ORGANIZATION_precision": 0.6559139784946236, |
|
"eval_ORGANIZATION_recall": 0.8133333333333334, |
|
"eval_PERSON_f1": 0.8926174496644295, |
|
"eval_PERSON_number": 143, |
|
"eval_PERSON_precision": 0.8580645161290322, |
|
"eval_PERSON_recall": 0.9300699300699301, |
|
"eval_QUANTITY_f1": 0.6909090909090908, |
|
"eval_QUANTITY_number": 23, |
|
"eval_QUANTITY_precision": 0.59375, |
|
"eval_QUANTITY_recall": 0.8260869565217391, |
|
"eval_TIME_f1": 0.7636363636363636, |
|
"eval_TIME_number": 26, |
|
"eval_TIME_precision": 0.7241379310344828, |
|
"eval_TIME_recall": 0.8076923076923077, |
|
"eval_loss": 0.13341191411018372, |
|
"eval_overall_accuracy": 0.9587190392794596, |
|
"eval_overall_f1": 0.8133704735376045, |
|
"eval_overall_precision": 0.7704485488126649, |
|
"eval_overall_recall": 0.8613569321533924, |
|
"eval_runtime": 0.9563, |
|
"eval_samples_per_second": 195.551, |
|
"eval_steps_per_second": 3.137, |
|
"step": 1908 |
|
}, |
|
{ |
|
"epoch": 19.0, |
|
"grad_norm": 0.8807380795478821, |
|
"learning_rate": 4.05e-05, |
|
"loss": 0.0906, |
|
"step": 2014 |
|
}, |
|
{ |
|
"epoch": 19.0, |
|
"eval_LOCATION_f1": 0.8, |
|
"eval_LOCATION_number": 72, |
|
"eval_LOCATION_precision": 0.7945205479452054, |
|
"eval_LOCATION_recall": 0.8055555555555556, |
|
"eval_ORGANIZATION_f1": 0.7542857142857142, |
|
"eval_ORGANIZATION_number": 75, |
|
"eval_ORGANIZATION_precision": 0.66, |
|
"eval_ORGANIZATION_recall": 0.88, |
|
"eval_PERSON_f1": 0.8926174496644295, |
|
"eval_PERSON_number": 143, |
|
"eval_PERSON_precision": 0.8580645161290322, |
|
"eval_PERSON_recall": 0.9300699300699301, |
|
"eval_QUANTITY_f1": 0.6428571428571429, |
|
"eval_QUANTITY_number": 23, |
|
"eval_QUANTITY_precision": 0.5454545454545454, |
|
"eval_QUANTITY_recall": 0.782608695652174, |
|
"eval_TIME_f1": 0.7636363636363636, |
|
"eval_TIME_number": 26, |
|
"eval_TIME_precision": 0.7241379310344828, |
|
"eval_TIME_recall": 0.8076923076923077, |
|
"eval_loss": 0.13378730416297913, |
|
"eval_overall_accuracy": 0.9572179134350763, |
|
"eval_overall_f1": 0.8120713305898491, |
|
"eval_overall_precision": 0.7589743589743589, |
|
"eval_overall_recall": 0.8731563421828908, |
|
"eval_runtime": 0.9383, |
|
"eval_samples_per_second": 199.303, |
|
"eval_steps_per_second": 3.197, |
|
"step": 2014 |
|
}, |
|
{ |
|
"epoch": 20.0, |
|
"grad_norm": 0.726658046245575, |
|
"learning_rate": 4e-05, |
|
"loss": 0.0876, |
|
"step": 2120 |
|
}, |
|
{ |
|
"epoch": 20.0, |
|
"eval_LOCATION_f1": 0.8187919463087249, |
|
"eval_LOCATION_number": 72, |
|
"eval_LOCATION_precision": 0.7922077922077922, |
|
"eval_LOCATION_recall": 0.8472222222222222, |
|
"eval_ORGANIZATION_f1": 0.7727272727272727, |
|
"eval_ORGANIZATION_number": 75, |
|
"eval_ORGANIZATION_precision": 0.6732673267326733, |
|
"eval_ORGANIZATION_recall": 0.9066666666666666, |
|
"eval_PERSON_f1": 0.881578947368421, |
|
"eval_PERSON_number": 143, |
|
"eval_PERSON_precision": 0.8322981366459627, |
|
"eval_PERSON_recall": 0.9370629370629371, |
|
"eval_QUANTITY_f1": 0.6909090909090908, |
|
"eval_QUANTITY_number": 23, |
|
"eval_QUANTITY_precision": 0.59375, |
|
"eval_QUANTITY_recall": 0.8260869565217391, |
|
"eval_TIME_f1": 0.7636363636363636, |
|
"eval_TIME_number": 26, |
|
"eval_TIME_precision": 0.7241379310344828, |
|
"eval_TIME_recall": 0.8076923076923077, |
|
"eval_loss": 0.1531873345375061, |
|
"eval_overall_accuracy": 0.9564673505128847, |
|
"eval_overall_f1": 0.8200270635994586, |
|
"eval_overall_precision": 0.7575, |
|
"eval_overall_recall": 0.8938053097345132, |
|
"eval_runtime": 0.9428, |
|
"eval_samples_per_second": 198.355, |
|
"eval_steps_per_second": 3.182, |
|
"step": 2120 |
|
}, |
|
{ |
|
"epoch": 21.0, |
|
"grad_norm": 1.286189317703247, |
|
"learning_rate": 3.9500000000000005e-05, |
|
"loss": 0.0841, |
|
"step": 2226 |
|
}, |
|
{ |
|
"epoch": 21.0, |
|
"eval_LOCATION_f1": 0.8079470198675496, |
|
"eval_LOCATION_number": 72, |
|
"eval_LOCATION_precision": 0.7721518987341772, |
|
"eval_LOCATION_recall": 0.8472222222222222, |
|
"eval_ORGANIZATION_f1": 0.7560975609756098, |
|
"eval_ORGANIZATION_number": 75, |
|
"eval_ORGANIZATION_precision": 0.6966292134831461, |
|
"eval_ORGANIZATION_recall": 0.8266666666666667, |
|
"eval_PERSON_f1": 0.8866666666666668, |
|
"eval_PERSON_number": 143, |
|
"eval_PERSON_precision": 0.8471337579617835, |
|
"eval_PERSON_recall": 0.9300699300699301, |
|
"eval_QUANTITY_f1": 0.6428571428571429, |
|
"eval_QUANTITY_number": 23, |
|
"eval_QUANTITY_precision": 0.5454545454545454, |
|
"eval_QUANTITY_recall": 0.782608695652174, |
|
"eval_TIME_f1": 0.7636363636363636, |
|
"eval_TIME_number": 26, |
|
"eval_TIME_precision": 0.7241379310344828, |
|
"eval_TIME_recall": 0.8076923076923077, |
|
"eval_loss": 0.1474735289812088, |
|
"eval_overall_accuracy": 0.9567175381536153, |
|
"eval_overall_f1": 0.8126721763085399, |
|
"eval_overall_precision": 0.7622739018087855, |
|
"eval_overall_recall": 0.8702064896755162, |
|
"eval_runtime": 0.9368, |
|
"eval_samples_per_second": 199.611, |
|
"eval_steps_per_second": 3.202, |
|
"step": 2226 |
|
}, |
|
{ |
|
"epoch": 22.0, |
|
"grad_norm": 0.40452536940574646, |
|
"learning_rate": 3.9000000000000006e-05, |
|
"loss": 0.0842, |
|
"step": 2332 |
|
}, |
|
{ |
|
"epoch": 22.0, |
|
"eval_LOCATION_f1": 0.8133333333333332, |
|
"eval_LOCATION_number": 72, |
|
"eval_LOCATION_precision": 0.782051282051282, |
|
"eval_LOCATION_recall": 0.8472222222222222, |
|
"eval_ORGANIZATION_f1": 0.7861271676300577, |
|
"eval_ORGANIZATION_number": 75, |
|
"eval_ORGANIZATION_precision": 0.6938775510204082, |
|
"eval_ORGANIZATION_recall": 0.9066666666666666, |
|
"eval_PERSON_f1": 0.8970099667774087, |
|
"eval_PERSON_number": 143, |
|
"eval_PERSON_precision": 0.8544303797468354, |
|
"eval_PERSON_recall": 0.9440559440559441, |
|
"eval_QUANTITY_f1": 0.6428571428571429, |
|
"eval_QUANTITY_number": 23, |
|
"eval_QUANTITY_precision": 0.5454545454545454, |
|
"eval_QUANTITY_recall": 0.782608695652174, |
|
"eval_TIME_f1": 0.7407407407407408, |
|
"eval_TIME_number": 26, |
|
"eval_TIME_precision": 0.7142857142857143, |
|
"eval_TIME_recall": 0.7692307692307693, |
|
"eval_loss": 0.13896140456199646, |
|
"eval_overall_accuracy": 0.9569677257943457, |
|
"eval_overall_f1": 0.8228882833787466, |
|
"eval_overall_precision": 0.7645569620253164, |
|
"eval_overall_recall": 0.8908554572271387, |
|
"eval_runtime": 0.9322, |
|
"eval_samples_per_second": 200.611, |
|
"eval_steps_per_second": 3.218, |
|
"step": 2332 |
|
}, |
|
{ |
|
"epoch": 23.0, |
|
"grad_norm": 0.6667360663414001, |
|
"learning_rate": 3.85e-05, |
|
"loss": 0.0798, |
|
"step": 2438 |
|
}, |
|
{ |
|
"epoch": 23.0, |
|
"eval_LOCATION_f1": 0.7945205479452055, |
|
"eval_LOCATION_number": 72, |
|
"eval_LOCATION_precision": 0.7837837837837838, |
|
"eval_LOCATION_recall": 0.8055555555555556, |
|
"eval_ORGANIZATION_f1": 0.7666666666666667, |
|
"eval_ORGANIZATION_number": 75, |
|
"eval_ORGANIZATION_precision": 0.6571428571428571, |
|
"eval_ORGANIZATION_recall": 0.92, |
|
"eval_PERSON_f1": 0.8933333333333333, |
|
"eval_PERSON_number": 143, |
|
"eval_PERSON_precision": 0.8535031847133758, |
|
"eval_PERSON_recall": 0.9370629370629371, |
|
"eval_QUANTITY_f1": 0.631578947368421, |
|
"eval_QUANTITY_number": 23, |
|
"eval_QUANTITY_precision": 0.5294117647058824, |
|
"eval_QUANTITY_recall": 0.782608695652174, |
|
"eval_TIME_f1": 0.7777777777777779, |
|
"eval_TIME_number": 26, |
|
"eval_TIME_precision": 0.75, |
|
"eval_TIME_recall": 0.8076923076923077, |
|
"eval_loss": 0.15068964660167694, |
|
"eval_overall_accuracy": 0.9542156617463098, |
|
"eval_overall_f1": 0.814111261872456, |
|
"eval_overall_precision": 0.7537688442211056, |
|
"eval_overall_recall": 0.8849557522123894, |
|
"eval_runtime": 1.0035, |
|
"eval_samples_per_second": 186.346, |
|
"eval_steps_per_second": 2.99, |
|
"step": 2438 |
|
}, |
|
{ |
|
"epoch": 24.0, |
|
"grad_norm": 0.6917049884796143, |
|
"learning_rate": 3.8e-05, |
|
"loss": 0.0775, |
|
"step": 2544 |
|
}, |
|
{ |
|
"epoch": 24.0, |
|
"eval_LOCATION_f1": 0.8108108108108109, |
|
"eval_LOCATION_number": 72, |
|
"eval_LOCATION_precision": 0.7894736842105263, |
|
"eval_LOCATION_recall": 0.8333333333333334, |
|
"eval_ORGANIZATION_f1": 0.7721518987341773, |
|
"eval_ORGANIZATION_number": 75, |
|
"eval_ORGANIZATION_precision": 0.7349397590361446, |
|
"eval_ORGANIZATION_recall": 0.8133333333333334, |
|
"eval_PERSON_f1": 0.8970099667774087, |
|
"eval_PERSON_number": 143, |
|
"eval_PERSON_precision": 0.8544303797468354, |
|
"eval_PERSON_recall": 0.9440559440559441, |
|
"eval_QUANTITY_f1": 0.7692307692307693, |
|
"eval_QUANTITY_number": 23, |
|
"eval_QUANTITY_precision": 0.6896551724137931, |
|
"eval_QUANTITY_recall": 0.8695652173913043, |
|
"eval_TIME_f1": 0.7636363636363636, |
|
"eval_TIME_number": 26, |
|
"eval_TIME_precision": 0.7241379310344828, |
|
"eval_TIME_recall": 0.8076923076923077, |
|
"eval_loss": 0.14417295157909393, |
|
"eval_overall_accuracy": 0.9604703527645734, |
|
"eval_overall_f1": 0.8319327731092437, |
|
"eval_overall_precision": 0.792, |
|
"eval_overall_recall": 0.8761061946902655, |
|
"eval_runtime": 0.9311, |
|
"eval_samples_per_second": 200.829, |
|
"eval_steps_per_second": 3.222, |
|
"step": 2544 |
|
}, |
|
{ |
|
"epoch": 25.0, |
|
"grad_norm": 0.38176143169403076, |
|
"learning_rate": 3.7500000000000003e-05, |
|
"loss": 0.0759, |
|
"step": 2650 |
|
}, |
|
{ |
|
"epoch": 25.0, |
|
"eval_LOCATION_f1": 0.8322147651006712, |
|
"eval_LOCATION_number": 72, |
|
"eval_LOCATION_precision": 0.8051948051948052, |
|
"eval_LOCATION_recall": 0.8611111111111112, |
|
"eval_ORGANIZATION_f1": 0.783625730994152, |
|
"eval_ORGANIZATION_number": 75, |
|
"eval_ORGANIZATION_precision": 0.6979166666666666, |
|
"eval_ORGANIZATION_recall": 0.8933333333333333, |
|
"eval_PERSON_f1": 0.8963210702341137, |
|
"eval_PERSON_number": 143, |
|
"eval_PERSON_precision": 0.8589743589743589, |
|
"eval_PERSON_recall": 0.9370629370629371, |
|
"eval_QUANTITY_f1": 0.6440677966101694, |
|
"eval_QUANTITY_number": 23, |
|
"eval_QUANTITY_precision": 0.5277777777777778, |
|
"eval_QUANTITY_recall": 0.8260869565217391, |
|
"eval_TIME_f1": 0.7368421052631579, |
|
"eval_TIME_number": 26, |
|
"eval_TIME_precision": 0.6774193548387096, |
|
"eval_TIME_recall": 0.8076923076923077, |
|
"eval_loss": 0.14586655795574188, |
|
"eval_overall_accuracy": 0.9582186639979985, |
|
"eval_overall_f1": 0.8244897959183674, |
|
"eval_overall_precision": 0.7651515151515151, |
|
"eval_overall_recall": 0.8938053097345132, |
|
"eval_runtime": 0.9333, |
|
"eval_samples_per_second": 200.36, |
|
"eval_steps_per_second": 3.214, |
|
"step": 2650 |
|
}, |
|
{ |
|
"epoch": 26.0, |
|
"grad_norm": 0.690096914768219, |
|
"learning_rate": 3.7e-05, |
|
"loss": 0.0731, |
|
"step": 2756 |
|
}, |
|
{ |
|
"epoch": 26.0, |
|
"eval_LOCATION_f1": 0.8, |
|
"eval_LOCATION_number": 72, |
|
"eval_LOCATION_precision": 0.7945205479452054, |
|
"eval_LOCATION_recall": 0.8055555555555556, |
|
"eval_ORGANIZATION_f1": 0.7975460122699386, |
|
"eval_ORGANIZATION_number": 75, |
|
"eval_ORGANIZATION_precision": 0.7386363636363636, |
|
"eval_ORGANIZATION_recall": 0.8666666666666667, |
|
"eval_PERSON_f1": 0.8940397350993377, |
|
"eval_PERSON_number": 143, |
|
"eval_PERSON_precision": 0.8490566037735849, |
|
"eval_PERSON_recall": 0.9440559440559441, |
|
"eval_QUANTITY_f1": 0.7169811320754716, |
|
"eval_QUANTITY_number": 23, |
|
"eval_QUANTITY_precision": 0.6333333333333333, |
|
"eval_QUANTITY_recall": 0.8260869565217391, |
|
"eval_TIME_f1": 0.7777777777777779, |
|
"eval_TIME_number": 26, |
|
"eval_TIME_precision": 0.75, |
|
"eval_TIME_recall": 0.8076923076923077, |
|
"eval_loss": 0.151327446103096, |
|
"eval_overall_accuracy": 0.9587190392794596, |
|
"eval_overall_f1": 0.8312412831241284, |
|
"eval_overall_precision": 0.7883597883597884, |
|
"eval_overall_recall": 0.8790560471976401, |
|
"eval_runtime": 0.9254, |
|
"eval_samples_per_second": 202.071, |
|
"eval_steps_per_second": 3.242, |
|
"step": 2756 |
|
}, |
|
{ |
|
"epoch": 27.0, |
|
"grad_norm": 0.562192440032959, |
|
"learning_rate": 3.65e-05, |
|
"loss": 0.0714, |
|
"step": 2862 |
|
}, |
|
{ |
|
"epoch": 27.0, |
|
"eval_LOCATION_f1": 0.7891156462585034, |
|
"eval_LOCATION_number": 72, |
|
"eval_LOCATION_precision": 0.7733333333333333, |
|
"eval_LOCATION_recall": 0.8055555555555556, |
|
"eval_ORGANIZATION_f1": 0.7654320987654321, |
|
"eval_ORGANIZATION_number": 75, |
|
"eval_ORGANIZATION_precision": 0.7126436781609196, |
|
"eval_ORGANIZATION_recall": 0.8266666666666667, |
|
"eval_PERSON_f1": 0.8903654485049833, |
|
"eval_PERSON_number": 143, |
|
"eval_PERSON_precision": 0.8481012658227848, |
|
"eval_PERSON_recall": 0.9370629370629371, |
|
"eval_QUANTITY_f1": 0.76, |
|
"eval_QUANTITY_number": 23, |
|
"eval_QUANTITY_precision": 0.7037037037037037, |
|
"eval_QUANTITY_recall": 0.8260869565217391, |
|
"eval_TIME_f1": 0.7407407407407408, |
|
"eval_TIME_number": 26, |
|
"eval_TIME_precision": 0.7142857142857143, |
|
"eval_TIME_recall": 0.7692307692307693, |
|
"eval_loss": 0.15548019111156464, |
|
"eval_overall_accuracy": 0.9577182887165374, |
|
"eval_overall_f1": 0.8207282913165266, |
|
"eval_overall_precision": 0.7813333333333333, |
|
"eval_overall_recall": 0.8643067846607669, |
|
"eval_runtime": 0.9366, |
|
"eval_samples_per_second": 199.663, |
|
"eval_steps_per_second": 3.203, |
|
"step": 2862 |
|
}, |
|
{ |
|
"epoch": 28.0, |
|
"grad_norm": 1.1344366073608398, |
|
"learning_rate": 3.6e-05, |
|
"loss": 0.0697, |
|
"step": 2968 |
|
}, |
|
{ |
|
"epoch": 28.0, |
|
"eval_LOCATION_f1": 0.7808219178082192, |
|
"eval_LOCATION_number": 72, |
|
"eval_LOCATION_precision": 0.7702702702702703, |
|
"eval_LOCATION_recall": 0.7916666666666666, |
|
"eval_ORGANIZATION_f1": 0.7607361963190183, |
|
"eval_ORGANIZATION_number": 75, |
|
"eval_ORGANIZATION_precision": 0.7045454545454546, |
|
"eval_ORGANIZATION_recall": 0.8266666666666667, |
|
"eval_PERSON_f1": 0.8993288590604027, |
|
"eval_PERSON_number": 143, |
|
"eval_PERSON_precision": 0.864516129032258, |
|
"eval_PERSON_recall": 0.9370629370629371, |
|
"eval_QUANTITY_f1": 0.7450980392156864, |
|
"eval_QUANTITY_number": 23, |
|
"eval_QUANTITY_precision": 0.6785714285714286, |
|
"eval_QUANTITY_recall": 0.8260869565217391, |
|
"eval_TIME_f1": 0.7407407407407408, |
|
"eval_TIME_number": 26, |
|
"eval_TIME_precision": 0.7142857142857143, |
|
"eval_TIME_recall": 0.7692307692307693, |
|
"eval_loss": 0.14587517082691193, |
|
"eval_overall_accuracy": 0.9587190392794596, |
|
"eval_overall_f1": 0.8202247191011236, |
|
"eval_overall_precision": 0.7828418230563002, |
|
"eval_overall_recall": 0.8613569321533924, |
|
"eval_runtime": 0.92, |
|
"eval_samples_per_second": 203.25, |
|
"eval_steps_per_second": 3.261, |
|
"step": 2968 |
|
}, |
|
{ |
|
"epoch": 29.0, |
|
"grad_norm": 0.7924529910087585, |
|
"learning_rate": 3.55e-05, |
|
"loss": 0.0701, |
|
"step": 3074 |
|
}, |
|
{ |
|
"epoch": 29.0, |
|
"eval_LOCATION_f1": 0.8356164383561645, |
|
"eval_LOCATION_number": 72, |
|
"eval_LOCATION_precision": 0.8243243243243243, |
|
"eval_LOCATION_recall": 0.8472222222222222, |
|
"eval_ORGANIZATION_f1": 0.7176470588235295, |
|
"eval_ORGANIZATION_number": 75, |
|
"eval_ORGANIZATION_precision": 0.6421052631578947, |
|
"eval_ORGANIZATION_recall": 0.8133333333333334, |
|
"eval_PERSON_f1": 0.8986486486486487, |
|
"eval_PERSON_number": 143, |
|
"eval_PERSON_precision": 0.869281045751634, |
|
"eval_PERSON_recall": 0.9300699300699301, |
|
"eval_QUANTITY_f1": 0.5862068965517241, |
|
"eval_QUANTITY_number": 23, |
|
"eval_QUANTITY_precision": 0.4857142857142857, |
|
"eval_QUANTITY_recall": 0.7391304347826086, |
|
"eval_TIME_f1": 0.7272727272727274, |
|
"eval_TIME_number": 26, |
|
"eval_TIME_precision": 0.6896551724137931, |
|
"eval_TIME_recall": 0.7692307692307693, |
|
"eval_loss": 0.1690864861011505, |
|
"eval_overall_accuracy": 0.9532149111833875, |
|
"eval_overall_f1": 0.8055172413793102, |
|
"eval_overall_precision": 0.7564766839378239, |
|
"eval_overall_recall": 0.8613569321533924, |
|
"eval_runtime": 0.929, |
|
"eval_samples_per_second": 201.295, |
|
"eval_steps_per_second": 3.229, |
|
"step": 3074 |
|
}, |
|
{ |
|
"epoch": 30.0, |
|
"grad_norm": 1.1464416980743408, |
|
"learning_rate": 3.5e-05, |
|
"loss": 0.0678, |
|
"step": 3180 |
|
}, |
|
{ |
|
"epoch": 30.0, |
|
"eval_LOCATION_f1": 0.8251748251748252, |
|
"eval_LOCATION_number": 72, |
|
"eval_LOCATION_precision": 0.8309859154929577, |
|
"eval_LOCATION_recall": 0.8194444444444444, |
|
"eval_ORGANIZATION_f1": 0.7484662576687117, |
|
"eval_ORGANIZATION_number": 75, |
|
"eval_ORGANIZATION_precision": 0.6931818181818182, |
|
"eval_ORGANIZATION_recall": 0.8133333333333334, |
|
"eval_PERSON_f1": 0.8963210702341137, |
|
"eval_PERSON_number": 143, |
|
"eval_PERSON_precision": 0.8589743589743589, |
|
"eval_PERSON_recall": 0.9370629370629371, |
|
"eval_QUANTITY_f1": 0.7450980392156864, |
|
"eval_QUANTITY_number": 23, |
|
"eval_QUANTITY_precision": 0.6785714285714286, |
|
"eval_QUANTITY_recall": 0.8260869565217391, |
|
"eval_TIME_f1": 0.7857142857142856, |
|
"eval_TIME_number": 26, |
|
"eval_TIME_precision": 0.7333333333333333, |
|
"eval_TIME_recall": 0.8461538461538461, |
|
"eval_loss": 0.14405371248722076, |
|
"eval_overall_accuracy": 0.9582186639979985, |
|
"eval_overall_f1": 0.8286516853932584, |
|
"eval_overall_precision": 0.7908847184986595, |
|
"eval_overall_recall": 0.8702064896755162, |
|
"eval_runtime": 1.0504, |
|
"eval_samples_per_second": 178.034, |
|
"eval_steps_per_second": 2.856, |
|
"step": 3180 |
|
}, |
|
{ |
|
"epoch": 31.0, |
|
"grad_norm": 0.38195714354515076, |
|
"learning_rate": 3.45e-05, |
|
"loss": 0.0658, |
|
"step": 3286 |
|
}, |
|
{ |
|
"epoch": 31.0, |
|
"eval_LOCATION_f1": 0.8322147651006712, |
|
"eval_LOCATION_number": 72, |
|
"eval_LOCATION_precision": 0.8051948051948052, |
|
"eval_LOCATION_recall": 0.8611111111111112, |
|
"eval_ORGANIZATION_f1": 0.7861271676300577, |
|
"eval_ORGANIZATION_number": 75, |
|
"eval_ORGANIZATION_precision": 0.6938775510204082, |
|
"eval_ORGANIZATION_recall": 0.9066666666666666, |
|
"eval_PERSON_f1": 0.8993288590604027, |
|
"eval_PERSON_number": 143, |
|
"eval_PERSON_precision": 0.864516129032258, |
|
"eval_PERSON_recall": 0.9370629370629371, |
|
"eval_QUANTITY_f1": 0.7755102040816326, |
|
"eval_QUANTITY_number": 23, |
|
"eval_QUANTITY_precision": 0.7307692307692307, |
|
"eval_QUANTITY_recall": 0.8260869565217391, |
|
"eval_TIME_f1": 0.7407407407407408, |
|
"eval_TIME_number": 26, |
|
"eval_TIME_precision": 0.7142857142857143, |
|
"eval_TIME_recall": 0.7692307692307693, |
|
"eval_loss": 0.15743257105350494, |
|
"eval_overall_accuracy": 0.9584688516387291, |
|
"eval_overall_f1": 0.8381742738589212, |
|
"eval_overall_precision": 0.7890625, |
|
"eval_overall_recall": 0.8938053097345132, |
|
"eval_runtime": 0.9177, |
|
"eval_samples_per_second": 203.771, |
|
"eval_steps_per_second": 3.269, |
|
"step": 3286 |
|
}, |
|
{ |
|
"epoch": 32.0, |
|
"grad_norm": 0.8308860659599304, |
|
"learning_rate": 3.4000000000000007e-05, |
|
"loss": 0.0648, |
|
"step": 3392 |
|
}, |
|
{ |
|
"epoch": 32.0, |
|
"eval_LOCATION_f1": 0.8428571428571429, |
|
"eval_LOCATION_number": 72, |
|
"eval_LOCATION_precision": 0.8676470588235294, |
|
"eval_LOCATION_recall": 0.8194444444444444, |
|
"eval_ORGANIZATION_f1": 0.7619047619047621, |
|
"eval_ORGANIZATION_number": 75, |
|
"eval_ORGANIZATION_precision": 0.6881720430107527, |
|
"eval_ORGANIZATION_recall": 0.8533333333333334, |
|
"eval_PERSON_f1": 0.9016949152542374, |
|
"eval_PERSON_number": 143, |
|
"eval_PERSON_precision": 0.875, |
|
"eval_PERSON_recall": 0.9300699300699301, |
|
"eval_QUANTITY_f1": 0.7169811320754716, |
|
"eval_QUANTITY_number": 23, |
|
"eval_QUANTITY_precision": 0.6333333333333333, |
|
"eval_QUANTITY_recall": 0.8260869565217391, |
|
"eval_TIME_f1": 0.8, |
|
"eval_TIME_number": 26, |
|
"eval_TIME_precision": 0.7586206896551724, |
|
"eval_TIME_recall": 0.8461538461538461, |
|
"eval_loss": 0.1516529768705368, |
|
"eval_overall_accuracy": 0.9597197898423818, |
|
"eval_overall_f1": 0.8354430379746836, |
|
"eval_overall_precision": 0.7983870967741935, |
|
"eval_overall_recall": 0.8761061946902655, |
|
"eval_runtime": 1.0211, |
|
"eval_samples_per_second": 183.135, |
|
"eval_steps_per_second": 2.938, |
|
"step": 3392 |
|
}, |
|
{ |
|
"epoch": 33.0, |
|
"grad_norm": 0.37685203552246094, |
|
"learning_rate": 3.35e-05, |
|
"loss": 0.0626, |
|
"step": 3498 |
|
}, |
|
{ |
|
"epoch": 33.0, |
|
"eval_LOCATION_f1": 0.7945205479452055, |
|
"eval_LOCATION_number": 72, |
|
"eval_LOCATION_precision": 0.7837837837837838, |
|
"eval_LOCATION_recall": 0.8055555555555556, |
|
"eval_ORGANIZATION_f1": 0.7810650887573964, |
|
"eval_ORGANIZATION_number": 75, |
|
"eval_ORGANIZATION_precision": 0.7021276595744681, |
|
"eval_ORGANIZATION_recall": 0.88, |
|
"eval_PERSON_f1": 0.9016949152542374, |
|
"eval_PERSON_number": 143, |
|
"eval_PERSON_precision": 0.875, |
|
"eval_PERSON_recall": 0.9300699300699301, |
|
"eval_QUANTITY_f1": 0.6792452830188679, |
|
"eval_QUANTITY_number": 23, |
|
"eval_QUANTITY_precision": 0.6, |
|
"eval_QUANTITY_recall": 0.782608695652174, |
|
"eval_TIME_f1": 0.75, |
|
"eval_TIME_number": 26, |
|
"eval_TIME_precision": 0.7, |
|
"eval_TIME_recall": 0.8076923076923077, |
|
"eval_loss": 0.15304860472679138, |
|
"eval_overall_accuracy": 0.9584688516387291, |
|
"eval_overall_f1": 0.82336578581363, |
|
"eval_overall_precision": 0.7789473684210526, |
|
"eval_overall_recall": 0.8731563421828908, |
|
"eval_runtime": 0.9446, |
|
"eval_samples_per_second": 197.961, |
|
"eval_steps_per_second": 3.176, |
|
"step": 3498 |
|
}, |
|
{ |
|
"epoch": 34.0, |
|
"grad_norm": 1.1034225225448608, |
|
"learning_rate": 3.3e-05, |
|
"loss": 0.0631, |
|
"step": 3604 |
|
}, |
|
{ |
|
"epoch": 34.0, |
|
"eval_LOCATION_f1": 0.8378378378378377, |
|
"eval_LOCATION_number": 72, |
|
"eval_LOCATION_precision": 0.8157894736842105, |
|
"eval_LOCATION_recall": 0.8611111111111112, |
|
"eval_ORGANIZATION_f1": 0.7953216374269007, |
|
"eval_ORGANIZATION_number": 75, |
|
"eval_ORGANIZATION_precision": 0.7083333333333334, |
|
"eval_ORGANIZATION_recall": 0.9066666666666666, |
|
"eval_PERSON_f1": 0.903010033444816, |
|
"eval_PERSON_number": 143, |
|
"eval_PERSON_precision": 0.8653846153846154, |
|
"eval_PERSON_recall": 0.9440559440559441, |
|
"eval_QUANTITY_f1": 0.6545454545454547, |
|
"eval_QUANTITY_number": 23, |
|
"eval_QUANTITY_precision": 0.5625, |
|
"eval_QUANTITY_recall": 0.782608695652174, |
|
"eval_TIME_f1": 0.7241379310344829, |
|
"eval_TIME_number": 26, |
|
"eval_TIME_precision": 0.65625, |
|
"eval_TIME_recall": 0.8076923076923077, |
|
"eval_loss": 0.16854536533355713, |
|
"eval_overall_accuracy": 0.9572179134350763, |
|
"eval_overall_f1": 0.8317373461012312, |
|
"eval_overall_precision": 0.7755102040816326, |
|
"eval_overall_recall": 0.8967551622418879, |
|
"eval_runtime": 0.937, |
|
"eval_samples_per_second": 199.569, |
|
"eval_steps_per_second": 3.202, |
|
"step": 3604 |
|
}, |
|
{ |
|
"epoch": 35.0, |
|
"grad_norm": 1.6754740476608276, |
|
"learning_rate": 3.2500000000000004e-05, |
|
"loss": 0.0598, |
|
"step": 3710 |
|
}, |
|
{ |
|
"epoch": 35.0, |
|
"eval_LOCATION_f1": 0.8707482993197277, |
|
"eval_LOCATION_number": 72, |
|
"eval_LOCATION_precision": 0.8533333333333334, |
|
"eval_LOCATION_recall": 0.8888888888888888, |
|
"eval_ORGANIZATION_f1": 0.7784431137724551, |
|
"eval_ORGANIZATION_number": 75, |
|
"eval_ORGANIZATION_precision": 0.7065217391304348, |
|
"eval_ORGANIZATION_recall": 0.8666666666666667, |
|
"eval_PERSON_f1": 0.8986486486486487, |
|
"eval_PERSON_number": 143, |
|
"eval_PERSON_precision": 0.869281045751634, |
|
"eval_PERSON_recall": 0.9300699300699301, |
|
"eval_QUANTITY_f1": 0.631578947368421, |
|
"eval_QUANTITY_number": 23, |
|
"eval_QUANTITY_precision": 0.5294117647058824, |
|
"eval_QUANTITY_recall": 0.782608695652174, |
|
"eval_TIME_f1": 0.7547169811320754, |
|
"eval_TIME_number": 26, |
|
"eval_TIME_precision": 0.7407407407407407, |
|
"eval_TIME_recall": 0.7692307692307693, |
|
"eval_loss": 0.1640816181898117, |
|
"eval_overall_accuracy": 0.957968476357268, |
|
"eval_overall_f1": 0.8333333333333335, |
|
"eval_overall_precision": 0.7874015748031497, |
|
"eval_overall_recall": 0.8849557522123894, |
|
"eval_runtime": 0.9325, |
|
"eval_samples_per_second": 200.545, |
|
"eval_steps_per_second": 3.217, |
|
"step": 3710 |
|
}, |
|
{ |
|
"epoch": 36.0, |
|
"grad_norm": 0.5667424201965332, |
|
"learning_rate": 3.2000000000000005e-05, |
|
"loss": 0.06, |
|
"step": 3816 |
|
}, |
|
{ |
|
"epoch": 36.0, |
|
"eval_LOCATION_f1": 0.8053691275167787, |
|
"eval_LOCATION_number": 72, |
|
"eval_LOCATION_precision": 0.7792207792207793, |
|
"eval_LOCATION_recall": 0.8333333333333334, |
|
"eval_ORGANIZATION_f1": 0.7738095238095238, |
|
"eval_ORGANIZATION_number": 75, |
|
"eval_ORGANIZATION_precision": 0.6989247311827957, |
|
"eval_ORGANIZATION_recall": 0.8666666666666667, |
|
"eval_PERSON_f1": 0.8963210702341137, |
|
"eval_PERSON_number": 143, |
|
"eval_PERSON_precision": 0.8589743589743589, |
|
"eval_PERSON_recall": 0.9370629370629371, |
|
"eval_QUANTITY_f1": 0.7346938775510203, |
|
"eval_QUANTITY_number": 23, |
|
"eval_QUANTITY_precision": 0.6923076923076923, |
|
"eval_QUANTITY_recall": 0.782608695652174, |
|
"eval_TIME_f1": 0.75, |
|
"eval_TIME_number": 26, |
|
"eval_TIME_precision": 0.7, |
|
"eval_TIME_recall": 0.8076923076923077, |
|
"eval_loss": 0.1585589498281479, |
|
"eval_overall_accuracy": 0.9589692269201902, |
|
"eval_overall_f1": 0.826629680998613, |
|
"eval_overall_precision": 0.7801047120418848, |
|
"eval_overall_recall": 0.8790560471976401, |
|
"eval_runtime": 0.9262, |
|
"eval_samples_per_second": 201.894, |
|
"eval_steps_per_second": 3.239, |
|
"step": 3816 |
|
}, |
|
{ |
|
"epoch": 37.0, |
|
"grad_norm": 2.2813751697540283, |
|
"learning_rate": 3.15e-05, |
|
"loss": 0.0564, |
|
"step": 3922 |
|
}, |
|
{ |
|
"epoch": 37.0, |
|
"eval_LOCATION_f1": 0.8322147651006712, |
|
"eval_LOCATION_number": 72, |
|
"eval_LOCATION_precision": 0.8051948051948052, |
|
"eval_LOCATION_recall": 0.8611111111111112, |
|
"eval_ORGANIZATION_f1": 0.7701149425287357, |
|
"eval_ORGANIZATION_number": 75, |
|
"eval_ORGANIZATION_precision": 0.6767676767676768, |
|
"eval_ORGANIZATION_recall": 0.8933333333333333, |
|
"eval_PERSON_f1": 0.8993288590604027, |
|
"eval_PERSON_number": 143, |
|
"eval_PERSON_precision": 0.864516129032258, |
|
"eval_PERSON_recall": 0.9370629370629371, |
|
"eval_QUANTITY_f1": 0.7058823529411765, |
|
"eval_QUANTITY_number": 23, |
|
"eval_QUANTITY_precision": 0.6428571428571429, |
|
"eval_QUANTITY_recall": 0.782608695652174, |
|
"eval_TIME_f1": 0.75, |
|
"eval_TIME_number": 26, |
|
"eval_TIME_precision": 0.7, |
|
"eval_TIME_recall": 0.8076923076923077, |
|
"eval_loss": 0.16692771017551422, |
|
"eval_overall_accuracy": 0.9594696022016512, |
|
"eval_overall_f1": 0.8296703296703297, |
|
"eval_overall_precision": 0.7763496143958869, |
|
"eval_overall_recall": 0.8908554572271387, |
|
"eval_runtime": 0.9304, |
|
"eval_samples_per_second": 200.987, |
|
"eval_steps_per_second": 3.224, |
|
"step": 3922 |
|
}, |
|
{ |
|
"epoch": 38.0, |
|
"grad_norm": 1.5005148649215698, |
|
"learning_rate": 3.1e-05, |
|
"loss": 0.0583, |
|
"step": 4028 |
|
}, |
|
{ |
|
"epoch": 38.0, |
|
"eval_LOCATION_f1": 0.8169014084507044, |
|
"eval_LOCATION_number": 72, |
|
"eval_LOCATION_precision": 0.8285714285714286, |
|
"eval_LOCATION_recall": 0.8055555555555556, |
|
"eval_ORGANIZATION_f1": 0.7721518987341773, |
|
"eval_ORGANIZATION_number": 75, |
|
"eval_ORGANIZATION_precision": 0.7349397590361446, |
|
"eval_ORGANIZATION_recall": 0.8133333333333334, |
|
"eval_PERSON_f1": 0.9090909090909092, |
|
"eval_PERSON_number": 143, |
|
"eval_PERSON_precision": 0.8766233766233766, |
|
"eval_PERSON_recall": 0.9440559440559441, |
|
"eval_QUANTITY_f1": 0.72, |
|
"eval_QUANTITY_number": 23, |
|
"eval_QUANTITY_precision": 0.6666666666666666, |
|
"eval_QUANTITY_recall": 0.782608695652174, |
|
"eval_TIME_f1": 0.7924528301886792, |
|
"eval_TIME_number": 26, |
|
"eval_TIME_precision": 0.7777777777777778, |
|
"eval_TIME_recall": 0.8076923076923077, |
|
"eval_loss": 0.15361984074115753, |
|
"eval_overall_accuracy": 0.960720540405304, |
|
"eval_overall_f1": 0.8371428571428572, |
|
"eval_overall_precision": 0.8116343490304709, |
|
"eval_overall_recall": 0.8643067846607669, |
|
"eval_runtime": 0.9285, |
|
"eval_samples_per_second": 201.402, |
|
"eval_steps_per_second": 3.231, |
|
"step": 4028 |
|
}, |
|
{ |
|
"epoch": 39.0, |
|
"grad_norm": 0.37653887271881104, |
|
"learning_rate": 3.05e-05, |
|
"loss": 0.0545, |
|
"step": 4134 |
|
}, |
|
{ |
|
"epoch": 39.0, |
|
"eval_LOCATION_f1": 0.8111888111888113, |
|
"eval_LOCATION_number": 72, |
|
"eval_LOCATION_precision": 0.8169014084507042, |
|
"eval_LOCATION_recall": 0.8055555555555556, |
|
"eval_ORGANIZATION_f1": 0.7647058823529413, |
|
"eval_ORGANIZATION_number": 75, |
|
"eval_ORGANIZATION_precision": 0.6842105263157895, |
|
"eval_ORGANIZATION_recall": 0.8666666666666667, |
|
"eval_PERSON_f1": 0.9, |
|
"eval_PERSON_number": 143, |
|
"eval_PERSON_precision": 0.8598726114649682, |
|
"eval_PERSON_recall": 0.9440559440559441, |
|
"eval_QUANTITY_f1": 0.7307692307692308, |
|
"eval_QUANTITY_number": 23, |
|
"eval_QUANTITY_precision": 0.6551724137931034, |
|
"eval_QUANTITY_recall": 0.8260869565217391, |
|
"eval_TIME_f1": 0.7407407407407408, |
|
"eval_TIME_number": 26, |
|
"eval_TIME_precision": 0.7142857142857143, |
|
"eval_TIME_recall": 0.7692307692307693, |
|
"eval_loss": 0.16966940462589264, |
|
"eval_overall_accuracy": 0.957968476357268, |
|
"eval_overall_f1": 0.8261474269819195, |
|
"eval_overall_precision": 0.781578947368421, |
|
"eval_overall_recall": 0.8761061946902655, |
|
"eval_runtime": 0.9372, |
|
"eval_samples_per_second": 199.533, |
|
"eval_steps_per_second": 3.201, |
|
"step": 4134 |
|
}, |
|
{ |
|
"epoch": 40.0, |
|
"grad_norm": 1.0764912366867065, |
|
"learning_rate": 3e-05, |
|
"loss": 0.0555, |
|
"step": 4240 |
|
}, |
|
{ |
|
"epoch": 40.0, |
|
"eval_LOCATION_f1": 0.8456375838926175, |
|
"eval_LOCATION_number": 72, |
|
"eval_LOCATION_precision": 0.8181818181818182, |
|
"eval_LOCATION_recall": 0.875, |
|
"eval_ORGANIZATION_f1": 0.7784431137724551, |
|
"eval_ORGANIZATION_number": 75, |
|
"eval_ORGANIZATION_precision": 0.7065217391304348, |
|
"eval_ORGANIZATION_recall": 0.8666666666666667, |
|
"eval_PERSON_f1": 0.8963210702341137, |
|
"eval_PERSON_number": 143, |
|
"eval_PERSON_precision": 0.8589743589743589, |
|
"eval_PERSON_recall": 0.9370629370629371, |
|
"eval_QUANTITY_f1": 0.6923076923076923, |
|
"eval_QUANTITY_number": 23, |
|
"eval_QUANTITY_precision": 0.6206896551724138, |
|
"eval_QUANTITY_recall": 0.782608695652174, |
|
"eval_TIME_f1": 0.6896551724137931, |
|
"eval_TIME_number": 26, |
|
"eval_TIME_precision": 0.625, |
|
"eval_TIME_recall": 0.7692307692307693, |
|
"eval_loss": 0.16699136793613434, |
|
"eval_overall_accuracy": 0.9587190392794596, |
|
"eval_overall_f1": 0.8275862068965517, |
|
"eval_overall_precision": 0.7772020725388601, |
|
"eval_overall_recall": 0.8849557522123894, |
|
"eval_runtime": 0.9355, |
|
"eval_samples_per_second": 199.887, |
|
"eval_steps_per_second": 3.207, |
|
"step": 4240 |
|
}, |
|
{ |
|
"epoch": 41.0, |
|
"grad_norm": 1.2565559148788452, |
|
"learning_rate": 2.95e-05, |
|
"loss": 0.0536, |
|
"step": 4346 |
|
}, |
|
{ |
|
"epoch": 41.0, |
|
"eval_LOCATION_f1": 0.8513513513513513, |
|
"eval_LOCATION_number": 72, |
|
"eval_LOCATION_precision": 0.8289473684210527, |
|
"eval_LOCATION_recall": 0.875, |
|
"eval_ORGANIZATION_f1": 0.7928994082840236, |
|
"eval_ORGANIZATION_number": 75, |
|
"eval_ORGANIZATION_precision": 0.7127659574468085, |
|
"eval_ORGANIZATION_recall": 0.8933333333333333, |
|
"eval_PERSON_f1": 0.8963210702341137, |
|
"eval_PERSON_number": 143, |
|
"eval_PERSON_precision": 0.8589743589743589, |
|
"eval_PERSON_recall": 0.9370629370629371, |
|
"eval_QUANTITY_f1": 0.72, |
|
"eval_QUANTITY_number": 23, |
|
"eval_QUANTITY_precision": 0.6666666666666666, |
|
"eval_QUANTITY_recall": 0.782608695652174, |
|
"eval_TIME_f1": 0.7368421052631579, |
|
"eval_TIME_number": 26, |
|
"eval_TIME_precision": 0.6774193548387096, |
|
"eval_TIME_recall": 0.8076923076923077, |
|
"eval_loss": 0.16643501818180084, |
|
"eval_overall_accuracy": 0.9599699774831123, |
|
"eval_overall_f1": 0.8381742738589212, |
|
"eval_overall_precision": 0.7890625, |
|
"eval_overall_recall": 0.8938053097345132, |
|
"eval_runtime": 0.9907, |
|
"eval_samples_per_second": 188.749, |
|
"eval_steps_per_second": 3.028, |
|
"step": 4346 |
|
}, |
|
{ |
|
"epoch": 42.0, |
|
"grad_norm": 0.8656229376792908, |
|
"learning_rate": 2.9e-05, |
|
"loss": 0.0528, |
|
"step": 4452 |
|
}, |
|
{ |
|
"epoch": 42.0, |
|
"eval_LOCATION_f1": 0.8827586206896552, |
|
"eval_LOCATION_number": 72, |
|
"eval_LOCATION_precision": 0.8767123287671232, |
|
"eval_LOCATION_recall": 0.8888888888888888, |
|
"eval_ORGANIZATION_f1": 0.7607361963190183, |
|
"eval_ORGANIZATION_number": 75, |
|
"eval_ORGANIZATION_precision": 0.7045454545454546, |
|
"eval_ORGANIZATION_recall": 0.8266666666666667, |
|
"eval_PERSON_f1": 0.903010033444816, |
|
"eval_PERSON_number": 143, |
|
"eval_PERSON_precision": 0.8653846153846154, |
|
"eval_PERSON_recall": 0.9440559440559441, |
|
"eval_QUANTITY_f1": 0.6206896551724138, |
|
"eval_QUANTITY_number": 23, |
|
"eval_QUANTITY_precision": 0.5142857142857142, |
|
"eval_QUANTITY_recall": 0.782608695652174, |
|
"eval_TIME_f1": 0.7272727272727274, |
|
"eval_TIME_number": 26, |
|
"eval_TIME_precision": 0.6896551724137931, |
|
"eval_TIME_recall": 0.7692307692307693, |
|
"eval_loss": 0.1719001978635788, |
|
"eval_overall_accuracy": 0.9574681010758068, |
|
"eval_overall_f1": 0.8305555555555555, |
|
"eval_overall_precision": 0.7847769028871391, |
|
"eval_overall_recall": 0.8820058997050148, |
|
"eval_runtime": 0.9302, |
|
"eval_samples_per_second": 201.029, |
|
"eval_steps_per_second": 3.225, |
|
"step": 4452 |
|
}, |
|
{ |
|
"epoch": 43.0, |
|
"grad_norm": 0.4717106819152832, |
|
"learning_rate": 2.8499999999999998e-05, |
|
"loss": 0.0505, |
|
"step": 4558 |
|
}, |
|
{ |
|
"epoch": 43.0, |
|
"eval_LOCATION_f1": 0.8413793103448277, |
|
"eval_LOCATION_number": 72, |
|
"eval_LOCATION_precision": 0.8356164383561644, |
|
"eval_LOCATION_recall": 0.8472222222222222, |
|
"eval_ORGANIZATION_f1": 0.7469879518072289, |
|
"eval_ORGANIZATION_number": 75, |
|
"eval_ORGANIZATION_precision": 0.6813186813186813, |
|
"eval_ORGANIZATION_recall": 0.8266666666666667, |
|
"eval_PERSON_f1": 0.8926174496644295, |
|
"eval_PERSON_number": 143, |
|
"eval_PERSON_precision": 0.8580645161290322, |
|
"eval_PERSON_recall": 0.9300699300699301, |
|
"eval_QUANTITY_f1": 0.6428571428571429, |
|
"eval_QUANTITY_number": 23, |
|
"eval_QUANTITY_precision": 0.5454545454545454, |
|
"eval_QUANTITY_recall": 0.782608695652174, |
|
"eval_TIME_f1": 0.7272727272727274, |
|
"eval_TIME_number": 26, |
|
"eval_TIME_precision": 0.6896551724137931, |
|
"eval_TIME_recall": 0.7692307692307693, |
|
"eval_loss": 0.1703517884016037, |
|
"eval_overall_accuracy": 0.9552164123092319, |
|
"eval_overall_f1": 0.8166666666666667, |
|
"eval_overall_precision": 0.7716535433070866, |
|
"eval_overall_recall": 0.8672566371681416, |
|
"eval_runtime": 0.9281, |
|
"eval_samples_per_second": 201.476, |
|
"eval_steps_per_second": 3.232, |
|
"step": 4558 |
|
}, |
|
{ |
|
"epoch": 44.0, |
|
"grad_norm": 0.6283421516418457, |
|
"learning_rate": 2.8000000000000003e-05, |
|
"loss": 0.05, |
|
"step": 4664 |
|
}, |
|
{ |
|
"epoch": 44.0, |
|
"eval_LOCATION_f1": 0.8053691275167787, |
|
"eval_LOCATION_number": 72, |
|
"eval_LOCATION_precision": 0.7792207792207793, |
|
"eval_LOCATION_recall": 0.8333333333333334, |
|
"eval_ORGANIZATION_f1": 0.7607361963190183, |
|
"eval_ORGANIZATION_number": 75, |
|
"eval_ORGANIZATION_precision": 0.7045454545454546, |
|
"eval_ORGANIZATION_recall": 0.8266666666666667, |
|
"eval_PERSON_f1": 0.903010033444816, |
|
"eval_PERSON_number": 143, |
|
"eval_PERSON_precision": 0.8653846153846154, |
|
"eval_PERSON_recall": 0.9440559440559441, |
|
"eval_QUANTITY_f1": 0.6792452830188679, |
|
"eval_QUANTITY_number": 23, |
|
"eval_QUANTITY_precision": 0.6, |
|
"eval_QUANTITY_recall": 0.782608695652174, |
|
"eval_TIME_f1": 0.7272727272727274, |
|
"eval_TIME_number": 26, |
|
"eval_TIME_precision": 0.6896551724137931, |
|
"eval_TIME_recall": 0.7692307692307693, |
|
"eval_loss": 0.16587650775909424, |
|
"eval_overall_accuracy": 0.9574681010758068, |
|
"eval_overall_f1": 0.8205841446453408, |
|
"eval_overall_precision": 0.7763157894736842, |
|
"eval_overall_recall": 0.8702064896755162, |
|
"eval_runtime": 0.933, |
|
"eval_samples_per_second": 200.427, |
|
"eval_steps_per_second": 3.215, |
|
"step": 4664 |
|
}, |
|
{ |
|
"epoch": 45.0, |
|
"grad_norm": 0.7488293051719666, |
|
"learning_rate": 2.7500000000000004e-05, |
|
"loss": 0.0515, |
|
"step": 4770 |
|
}, |
|
{ |
|
"epoch": 45.0, |
|
"eval_LOCATION_f1": 0.8611111111111112, |
|
"eval_LOCATION_number": 72, |
|
"eval_LOCATION_precision": 0.8611111111111112, |
|
"eval_LOCATION_recall": 0.8611111111111112, |
|
"eval_ORGANIZATION_f1": 0.759493670886076, |
|
"eval_ORGANIZATION_number": 75, |
|
"eval_ORGANIZATION_precision": 0.7228915662650602, |
|
"eval_ORGANIZATION_recall": 0.8, |
|
"eval_PERSON_f1": 0.8874172185430464, |
|
"eval_PERSON_number": 143, |
|
"eval_PERSON_precision": 0.8427672955974843, |
|
"eval_PERSON_recall": 0.9370629370629371, |
|
"eval_QUANTITY_f1": 0.631578947368421, |
|
"eval_QUANTITY_number": 23, |
|
"eval_QUANTITY_precision": 0.5294117647058824, |
|
"eval_QUANTITY_recall": 0.782608695652174, |
|
"eval_TIME_f1": 0.7407407407407408, |
|
"eval_TIME_number": 26, |
|
"eval_TIME_precision": 0.7142857142857143, |
|
"eval_TIME_recall": 0.7692307692307693, |
|
"eval_loss": 0.17817422747612, |
|
"eval_overall_accuracy": 0.9544658493870403, |
|
"eval_overall_f1": 0.8223776223776224, |
|
"eval_overall_precision": 0.7819148936170213, |
|
"eval_overall_recall": 0.8672566371681416, |
|
"eval_runtime": 0.9321, |
|
"eval_samples_per_second": 200.616, |
|
"eval_steps_per_second": 3.218, |
|
"step": 4770 |
|
}, |
|
{ |
|
"epoch": 46.0, |
|
"grad_norm": 0.3455760180950165, |
|
"learning_rate": 2.7000000000000002e-05, |
|
"loss": 0.0484, |
|
"step": 4876 |
|
}, |
|
{ |
|
"epoch": 46.0, |
|
"eval_LOCATION_f1": 0.8356164383561645, |
|
"eval_LOCATION_number": 72, |
|
"eval_LOCATION_precision": 0.8243243243243243, |
|
"eval_LOCATION_recall": 0.8472222222222222, |
|
"eval_ORGANIZATION_f1": 0.7672955974842767, |
|
"eval_ORGANIZATION_number": 75, |
|
"eval_ORGANIZATION_precision": 0.7261904761904762, |
|
"eval_ORGANIZATION_recall": 0.8133333333333334, |
|
"eval_PERSON_f1": 0.8750000000000001, |
|
"eval_PERSON_number": 143, |
|
"eval_PERSON_precision": 0.8260869565217391, |
|
"eval_PERSON_recall": 0.9300699300699301, |
|
"eval_QUANTITY_f1": 0.6792452830188679, |
|
"eval_QUANTITY_number": 23, |
|
"eval_QUANTITY_precision": 0.6, |
|
"eval_QUANTITY_recall": 0.782608695652174, |
|
"eval_TIME_f1": 0.7547169811320754, |
|
"eval_TIME_number": 26, |
|
"eval_TIME_precision": 0.7407407407407407, |
|
"eval_TIME_recall": 0.7692307692307693, |
|
"eval_loss": 0.1757228672504425, |
|
"eval_overall_accuracy": 0.9549662246685013, |
|
"eval_overall_f1": 0.8195804195804196, |
|
"eval_overall_precision": 0.7792553191489362, |
|
"eval_overall_recall": 0.8643067846607669, |
|
"eval_runtime": 0.9328, |
|
"eval_samples_per_second": 200.479, |
|
"eval_steps_per_second": 3.216, |
|
"step": 4876 |
|
}, |
|
{ |
|
"epoch": 47.0, |
|
"grad_norm": 0.9659437537193298, |
|
"learning_rate": 2.6500000000000004e-05, |
|
"loss": 0.0477, |
|
"step": 4982 |
|
}, |
|
{ |
|
"epoch": 47.0, |
|
"eval_LOCATION_f1": 0.8413793103448277, |
|
"eval_LOCATION_number": 72, |
|
"eval_LOCATION_precision": 0.8356164383561644, |
|
"eval_LOCATION_recall": 0.8472222222222222, |
|
"eval_ORGANIZATION_f1": 0.7547169811320756, |
|
"eval_ORGANIZATION_number": 75, |
|
"eval_ORGANIZATION_precision": 0.7142857142857143, |
|
"eval_ORGANIZATION_recall": 0.8, |
|
"eval_PERSON_f1": 0.8844884488448846, |
|
"eval_PERSON_number": 143, |
|
"eval_PERSON_precision": 0.8375, |
|
"eval_PERSON_recall": 0.9370629370629371, |
|
"eval_QUANTITY_f1": 0.6545454545454547, |
|
"eval_QUANTITY_number": 23, |
|
"eval_QUANTITY_precision": 0.5625, |
|
"eval_QUANTITY_recall": 0.782608695652174, |
|
"eval_TIME_f1": 0.7272727272727274, |
|
"eval_TIME_number": 26, |
|
"eval_TIME_precision": 0.6896551724137931, |
|
"eval_TIME_recall": 0.7692307692307693, |
|
"eval_loss": 0.17942465841770172, |
|
"eval_overall_accuracy": 0.9549662246685013, |
|
"eval_overall_f1": 0.8172942817294282, |
|
"eval_overall_precision": 0.7751322751322751, |
|
"eval_overall_recall": 0.8643067846607669, |
|
"eval_runtime": 0.9384, |
|
"eval_samples_per_second": 199.28, |
|
"eval_steps_per_second": 3.197, |
|
"step": 4982 |
|
}, |
|
{ |
|
"epoch": 48.0, |
|
"grad_norm": 0.39018484950065613, |
|
"learning_rate": 2.6000000000000002e-05, |
|
"loss": 0.0456, |
|
"step": 5088 |
|
}, |
|
{ |
|
"epoch": 48.0, |
|
"eval_LOCATION_f1": 0.8472222222222222, |
|
"eval_LOCATION_number": 72, |
|
"eval_LOCATION_precision": 0.8472222222222222, |
|
"eval_LOCATION_recall": 0.8472222222222222, |
|
"eval_ORGANIZATION_f1": 0.779874213836478, |
|
"eval_ORGANIZATION_number": 75, |
|
"eval_ORGANIZATION_precision": 0.7380952380952381, |
|
"eval_ORGANIZATION_recall": 0.8266666666666667, |
|
"eval_PERSON_f1": 0.9060402684563759, |
|
"eval_PERSON_number": 143, |
|
"eval_PERSON_precision": 0.8709677419354839, |
|
"eval_PERSON_recall": 0.9440559440559441, |
|
"eval_QUANTITY_f1": 0.7058823529411765, |
|
"eval_QUANTITY_number": 23, |
|
"eval_QUANTITY_precision": 0.6428571428571429, |
|
"eval_QUANTITY_recall": 0.782608695652174, |
|
"eval_TIME_f1": 0.7272727272727274, |
|
"eval_TIME_number": 26, |
|
"eval_TIME_precision": 0.6896551724137931, |
|
"eval_TIME_recall": 0.7692307692307693, |
|
"eval_loss": 0.16816405951976776, |
|
"eval_overall_accuracy": 0.9609707280460346, |
|
"eval_overall_f1": 0.8373408769448375, |
|
"eval_overall_precision": 0.8043478260869565, |
|
"eval_overall_recall": 0.8731563421828908, |
|
"eval_runtime": 0.9286, |
|
"eval_samples_per_second": 201.387, |
|
"eval_steps_per_second": 3.231, |
|
"step": 5088 |
|
}, |
|
{ |
|
"epoch": 49.0, |
|
"grad_norm": 0.4282808303833008, |
|
"learning_rate": 2.5500000000000003e-05, |
|
"loss": 0.0458, |
|
"step": 5194 |
|
}, |
|
{ |
|
"epoch": 49.0, |
|
"eval_LOCATION_f1": 0.8689655172413793, |
|
"eval_LOCATION_number": 72, |
|
"eval_LOCATION_precision": 0.863013698630137, |
|
"eval_LOCATION_recall": 0.875, |
|
"eval_ORGANIZATION_f1": 0.7052023121387283, |
|
"eval_ORGANIZATION_number": 75, |
|
"eval_ORGANIZATION_precision": 0.6224489795918368, |
|
"eval_ORGANIZATION_recall": 0.8133333333333334, |
|
"eval_PERSON_f1": 0.8903654485049833, |
|
"eval_PERSON_number": 143, |
|
"eval_PERSON_precision": 0.8481012658227848, |
|
"eval_PERSON_recall": 0.9370629370629371, |
|
"eval_QUANTITY_f1": 0.6545454545454547, |
|
"eval_QUANTITY_number": 23, |
|
"eval_QUANTITY_precision": 0.5625, |
|
"eval_QUANTITY_recall": 0.782608695652174, |
|
"eval_TIME_f1": 0.7407407407407408, |
|
"eval_TIME_number": 26, |
|
"eval_TIME_precision": 0.7142857142857143, |
|
"eval_TIME_recall": 0.7692307692307693, |
|
"eval_loss": 0.18153227865695953, |
|
"eval_overall_accuracy": 0.9547160370277709, |
|
"eval_overall_f1": 0.8131868131868133, |
|
"eval_overall_precision": 0.7609254498714653, |
|
"eval_overall_recall": 0.8731563421828908, |
|
"eval_runtime": 0.927, |
|
"eval_samples_per_second": 201.727, |
|
"eval_steps_per_second": 3.236, |
|
"step": 5194 |
|
}, |
|
{ |
|
"epoch": 50.0, |
|
"grad_norm": 0.5775999426841736, |
|
"learning_rate": 2.5e-05, |
|
"loss": 0.0449, |
|
"step": 5300 |
|
}, |
|
{ |
|
"epoch": 50.0, |
|
"eval_LOCATION_f1": 0.8571428571428572, |
|
"eval_LOCATION_number": 72, |
|
"eval_LOCATION_precision": 0.84, |
|
"eval_LOCATION_recall": 0.875, |
|
"eval_ORGANIZATION_f1": 0.728395061728395, |
|
"eval_ORGANIZATION_number": 75, |
|
"eval_ORGANIZATION_precision": 0.6781609195402298, |
|
"eval_ORGANIZATION_recall": 0.7866666666666666, |
|
"eval_PERSON_f1": 0.9054054054054055, |
|
"eval_PERSON_number": 143, |
|
"eval_PERSON_precision": 0.8758169934640523, |
|
"eval_PERSON_recall": 0.9370629370629371, |
|
"eval_QUANTITY_f1": 0.6666666666666667, |
|
"eval_QUANTITY_number": 23, |
|
"eval_QUANTITY_precision": 0.5806451612903226, |
|
"eval_QUANTITY_recall": 0.782608695652174, |
|
"eval_TIME_f1": 0.7142857142857142, |
|
"eval_TIME_number": 26, |
|
"eval_TIME_precision": 0.6666666666666666, |
|
"eval_TIME_recall": 0.7692307692307693, |
|
"eval_loss": 0.17358513176441193, |
|
"eval_overall_accuracy": 0.9577182887165374, |
|
"eval_overall_f1": 0.8223776223776224, |
|
"eval_overall_precision": 0.7819148936170213, |
|
"eval_overall_recall": 0.8672566371681416, |
|
"eval_runtime": 0.9332, |
|
"eval_samples_per_second": 200.395, |
|
"eval_steps_per_second": 3.215, |
|
"step": 5300 |
|
}, |
|
{ |
|
"epoch": 51.0, |
|
"grad_norm": 0.8392077684402466, |
|
"learning_rate": 2.45e-05, |
|
"loss": 0.0443, |
|
"step": 5406 |
|
}, |
|
{ |
|
"epoch": 51.0, |
|
"eval_LOCATION_f1": 0.8378378378378377, |
|
"eval_LOCATION_number": 72, |
|
"eval_LOCATION_precision": 0.8157894736842105, |
|
"eval_LOCATION_recall": 0.8611111111111112, |
|
"eval_ORGANIZATION_f1": 0.7636363636363636, |
|
"eval_ORGANIZATION_number": 75, |
|
"eval_ORGANIZATION_precision": 0.7, |
|
"eval_ORGANIZATION_recall": 0.84, |
|
"eval_PERSON_f1": 0.8721311475409836, |
|
"eval_PERSON_number": 143, |
|
"eval_PERSON_precision": 0.8209876543209876, |
|
"eval_PERSON_recall": 0.9300699300699301, |
|
"eval_QUANTITY_f1": 0.7058823529411765, |
|
"eval_QUANTITY_number": 23, |
|
"eval_QUANTITY_precision": 0.6428571428571429, |
|
"eval_QUANTITY_recall": 0.782608695652174, |
|
"eval_TIME_f1": 0.7407407407407408, |
|
"eval_TIME_number": 26, |
|
"eval_TIME_precision": 0.7142857142857143, |
|
"eval_TIME_recall": 0.7692307692307693, |
|
"eval_loss": 0.17768125236034393, |
|
"eval_overall_accuracy": 0.9572179134350763, |
|
"eval_overall_f1": 0.8188105117565698, |
|
"eval_overall_precision": 0.7708333333333334, |
|
"eval_overall_recall": 0.8731563421828908, |
|
"eval_runtime": 0.9419, |
|
"eval_samples_per_second": 198.534, |
|
"eval_steps_per_second": 3.185, |
|
"step": 5406 |
|
}, |
|
{ |
|
"epoch": 52.0, |
|
"grad_norm": 0.5880552530288696, |
|
"learning_rate": 2.4e-05, |
|
"loss": 0.044, |
|
"step": 5512 |
|
}, |
|
{ |
|
"epoch": 52.0, |
|
"eval_LOCATION_f1": 0.8648648648648649, |
|
"eval_LOCATION_number": 72, |
|
"eval_LOCATION_precision": 0.8421052631578947, |
|
"eval_LOCATION_recall": 0.8888888888888888, |
|
"eval_ORGANIZATION_f1": 0.7484662576687117, |
|
"eval_ORGANIZATION_number": 75, |
|
"eval_ORGANIZATION_precision": 0.6931818181818182, |
|
"eval_ORGANIZATION_recall": 0.8133333333333334, |
|
"eval_PERSON_f1": 0.9023569023569024, |
|
"eval_PERSON_number": 143, |
|
"eval_PERSON_precision": 0.8701298701298701, |
|
"eval_PERSON_recall": 0.9370629370629371, |
|
"eval_QUANTITY_f1": 0.6792452830188679, |
|
"eval_QUANTITY_number": 23, |
|
"eval_QUANTITY_precision": 0.6, |
|
"eval_QUANTITY_recall": 0.782608695652174, |
|
"eval_TIME_f1": 0.7272727272727274, |
|
"eval_TIME_number": 26, |
|
"eval_TIME_precision": 0.6896551724137931, |
|
"eval_TIME_recall": 0.7692307692307693, |
|
"eval_loss": 0.17750605940818787, |
|
"eval_overall_accuracy": 0.9574681010758068, |
|
"eval_overall_f1": 0.8296089385474861, |
|
"eval_overall_precision": 0.7877984084880637, |
|
"eval_overall_recall": 0.8761061946902655, |
|
"eval_runtime": 0.9391, |
|
"eval_samples_per_second": 199.121, |
|
"eval_steps_per_second": 3.194, |
|
"step": 5512 |
|
}, |
|
{ |
|
"epoch": 53.0, |
|
"grad_norm": 0.7479882836341858, |
|
"learning_rate": 2.35e-05, |
|
"loss": 0.0436, |
|
"step": 5618 |
|
}, |
|
{ |
|
"epoch": 53.0, |
|
"eval_LOCATION_f1": 0.8648648648648649, |
|
"eval_LOCATION_number": 72, |
|
"eval_LOCATION_precision": 0.8421052631578947, |
|
"eval_LOCATION_recall": 0.8888888888888888, |
|
"eval_ORGANIZATION_f1": 0.7469879518072289, |
|
"eval_ORGANIZATION_number": 75, |
|
"eval_ORGANIZATION_precision": 0.6813186813186813, |
|
"eval_ORGANIZATION_recall": 0.8266666666666667, |
|
"eval_PERSON_f1": 0.8933333333333333, |
|
"eval_PERSON_number": 143, |
|
"eval_PERSON_precision": 0.8535031847133758, |
|
"eval_PERSON_recall": 0.9370629370629371, |
|
"eval_QUANTITY_f1": 0.6545454545454547, |
|
"eval_QUANTITY_number": 23, |
|
"eval_QUANTITY_precision": 0.5625, |
|
"eval_QUANTITY_recall": 0.782608695652174, |
|
"eval_TIME_f1": 0.7142857142857142, |
|
"eval_TIME_number": 26, |
|
"eval_TIME_precision": 0.6666666666666666, |
|
"eval_TIME_recall": 0.7692307692307693, |
|
"eval_loss": 0.17619207501411438, |
|
"eval_overall_accuracy": 0.9572179134350763, |
|
"eval_overall_f1": 0.8220689655172414, |
|
"eval_overall_precision": 0.772020725388601, |
|
"eval_overall_recall": 0.8790560471976401, |
|
"eval_runtime": 0.9329, |
|
"eval_samples_per_second": 200.454, |
|
"eval_steps_per_second": 3.216, |
|
"step": 5618 |
|
}, |
|
{ |
|
"epoch": 54.0, |
|
"grad_norm": 0.6151536703109741, |
|
"learning_rate": 2.3000000000000003e-05, |
|
"loss": 0.0416, |
|
"step": 5724 |
|
}, |
|
{ |
|
"epoch": 54.0, |
|
"eval_LOCATION_f1": 0.8611111111111112, |
|
"eval_LOCATION_number": 72, |
|
"eval_LOCATION_precision": 0.8611111111111112, |
|
"eval_LOCATION_recall": 0.8611111111111112, |
|
"eval_ORGANIZATION_f1": 0.7393939393939395, |
|
"eval_ORGANIZATION_number": 75, |
|
"eval_ORGANIZATION_precision": 0.6777777777777778, |
|
"eval_ORGANIZATION_recall": 0.8133333333333334, |
|
"eval_PERSON_f1": 0.8844884488448846, |
|
"eval_PERSON_number": 143, |
|
"eval_PERSON_precision": 0.8375, |
|
"eval_PERSON_recall": 0.9370629370629371, |
|
"eval_QUANTITY_f1": 0.7058823529411765, |
|
"eval_QUANTITY_number": 23, |
|
"eval_QUANTITY_precision": 0.6428571428571429, |
|
"eval_QUANTITY_recall": 0.782608695652174, |
|
"eval_TIME_f1": 0.7777777777777779, |
|
"eval_TIME_number": 26, |
|
"eval_TIME_precision": 0.75, |
|
"eval_TIME_recall": 0.8076923076923077, |
|
"eval_loss": 0.18319469690322876, |
|
"eval_overall_accuracy": 0.9569677257943457, |
|
"eval_overall_f1": 0.8256624825662482, |
|
"eval_overall_precision": 0.783068783068783, |
|
"eval_overall_recall": 0.8731563421828908, |
|
"eval_runtime": 0.9355, |
|
"eval_samples_per_second": 199.902, |
|
"eval_steps_per_second": 3.207, |
|
"step": 5724 |
|
}, |
|
{ |
|
"epoch": 55.0, |
|
"grad_norm": 0.720840334892273, |
|
"learning_rate": 2.25e-05, |
|
"loss": 0.0403, |
|
"step": 5830 |
|
}, |
|
{ |
|
"epoch": 55.0, |
|
"eval_LOCATION_f1": 0.8322147651006712, |
|
"eval_LOCATION_number": 72, |
|
"eval_LOCATION_precision": 0.8051948051948052, |
|
"eval_LOCATION_recall": 0.8611111111111112, |
|
"eval_ORGANIZATION_f1": 0.7471264367816093, |
|
"eval_ORGANIZATION_number": 75, |
|
"eval_ORGANIZATION_precision": 0.6565656565656566, |
|
"eval_ORGANIZATION_recall": 0.8666666666666667, |
|
"eval_PERSON_f1": 0.8786885245901639, |
|
"eval_PERSON_number": 143, |
|
"eval_PERSON_precision": 0.8271604938271605, |
|
"eval_PERSON_recall": 0.9370629370629371, |
|
"eval_QUANTITY_f1": 0.7058823529411765, |
|
"eval_QUANTITY_number": 23, |
|
"eval_QUANTITY_precision": 0.6428571428571429, |
|
"eval_QUANTITY_recall": 0.782608695652174, |
|
"eval_TIME_f1": 0.7272727272727274, |
|
"eval_TIME_number": 26, |
|
"eval_TIME_precision": 0.6896551724137931, |
|
"eval_TIME_recall": 0.7692307692307693, |
|
"eval_loss": 0.1950027197599411, |
|
"eval_overall_accuracy": 0.9542156617463098, |
|
"eval_overall_f1": 0.8147138964577656, |
|
"eval_overall_precision": 0.7569620253164557, |
|
"eval_overall_recall": 0.8820058997050148, |
|
"eval_runtime": 0.9369, |
|
"eval_samples_per_second": 199.604, |
|
"eval_steps_per_second": 3.202, |
|
"step": 5830 |
|
}, |
|
{ |
|
"epoch": 56.0, |
|
"grad_norm": 0.4839901924133301, |
|
"learning_rate": 2.2000000000000003e-05, |
|
"loss": 0.0422, |
|
"step": 5936 |
|
}, |
|
{ |
|
"epoch": 56.0, |
|
"eval_LOCATION_f1": 0.8275862068965517, |
|
"eval_LOCATION_number": 72, |
|
"eval_LOCATION_precision": 0.821917808219178, |
|
"eval_LOCATION_recall": 0.8333333333333334, |
|
"eval_ORGANIZATION_f1": 0.7439024390243902, |
|
"eval_ORGANIZATION_number": 75, |
|
"eval_ORGANIZATION_precision": 0.6853932584269663, |
|
"eval_ORGANIZATION_recall": 0.8133333333333334, |
|
"eval_PERSON_f1": 0.8933333333333333, |
|
"eval_PERSON_number": 143, |
|
"eval_PERSON_precision": 0.8535031847133758, |
|
"eval_PERSON_recall": 0.9370629370629371, |
|
"eval_QUANTITY_f1": 0.6792452830188679, |
|
"eval_QUANTITY_number": 23, |
|
"eval_QUANTITY_precision": 0.6, |
|
"eval_QUANTITY_recall": 0.782608695652174, |
|
"eval_TIME_f1": 0.7407407407407408, |
|
"eval_TIME_number": 26, |
|
"eval_TIME_precision": 0.7142857142857143, |
|
"eval_TIME_recall": 0.7692307692307693, |
|
"eval_loss": 0.17818213999271393, |
|
"eval_overall_accuracy": 0.9569677257943457, |
|
"eval_overall_f1": 0.8184357541899441, |
|
"eval_overall_precision": 0.7771883289124668, |
|
"eval_overall_recall": 0.8643067846607669, |
|
"eval_runtime": 0.9337, |
|
"eval_samples_per_second": 200.278, |
|
"eval_steps_per_second": 3.213, |
|
"step": 5936 |
|
}, |
|
{ |
|
"epoch": 57.0, |
|
"grad_norm": 0.7197099924087524, |
|
"learning_rate": 2.15e-05, |
|
"loss": 0.0394, |
|
"step": 6042 |
|
}, |
|
{ |
|
"epoch": 57.0, |
|
"eval_LOCATION_f1": 0.8333333333333334, |
|
"eval_LOCATION_number": 72, |
|
"eval_LOCATION_precision": 0.8333333333333334, |
|
"eval_LOCATION_recall": 0.8333333333333334, |
|
"eval_ORGANIZATION_f1": 0.7468354430379747, |
|
"eval_ORGANIZATION_number": 75, |
|
"eval_ORGANIZATION_precision": 0.7108433734939759, |
|
"eval_ORGANIZATION_recall": 0.7866666666666666, |
|
"eval_PERSON_f1": 0.8896321070234114, |
|
"eval_PERSON_number": 143, |
|
"eval_PERSON_precision": 0.8525641025641025, |
|
"eval_PERSON_recall": 0.9300699300699301, |
|
"eval_QUANTITY_f1": 0.7058823529411765, |
|
"eval_QUANTITY_number": 23, |
|
"eval_QUANTITY_precision": 0.6428571428571429, |
|
"eval_QUANTITY_recall": 0.782608695652174, |
|
"eval_TIME_f1": 0.7407407407407408, |
|
"eval_TIME_number": 26, |
|
"eval_TIME_precision": 0.7142857142857143, |
|
"eval_TIME_recall": 0.7692307692307693, |
|
"eval_loss": 0.17426693439483643, |
|
"eval_overall_accuracy": 0.9589692269201902, |
|
"eval_overall_f1": 0.8215297450424929, |
|
"eval_overall_precision": 0.7901907356948229, |
|
"eval_overall_recall": 0.855457227138643, |
|
"eval_runtime": 0.9259, |
|
"eval_samples_per_second": 201.976, |
|
"eval_steps_per_second": 3.24, |
|
"step": 6042 |
|
}, |
|
{ |
|
"epoch": 58.0, |
|
"grad_norm": 0.526695191860199, |
|
"learning_rate": 2.1e-05, |
|
"loss": 0.0409, |
|
"step": 6148 |
|
}, |
|
{ |
|
"epoch": 58.0, |
|
"eval_LOCATION_f1": 0.8299319727891157, |
|
"eval_LOCATION_number": 72, |
|
"eval_LOCATION_precision": 0.8133333333333334, |
|
"eval_LOCATION_recall": 0.8472222222222222, |
|
"eval_ORGANIZATION_f1": 0.7643312101910827, |
|
"eval_ORGANIZATION_number": 75, |
|
"eval_ORGANIZATION_precision": 0.7317073170731707, |
|
"eval_ORGANIZATION_recall": 0.8, |
|
"eval_PERSON_f1": 0.8874172185430464, |
|
"eval_PERSON_number": 143, |
|
"eval_PERSON_precision": 0.8427672955974843, |
|
"eval_PERSON_recall": 0.9370629370629371, |
|
"eval_QUANTITY_f1": 0.6792452830188679, |
|
"eval_QUANTITY_number": 23, |
|
"eval_QUANTITY_precision": 0.6, |
|
"eval_QUANTITY_recall": 0.782608695652174, |
|
"eval_TIME_f1": 0.7142857142857142, |
|
"eval_TIME_number": 26, |
|
"eval_TIME_precision": 0.6666666666666666, |
|
"eval_TIME_recall": 0.7692307692307693, |
|
"eval_loss": 0.17505142092704773, |
|
"eval_overall_accuracy": 0.9567175381536153, |
|
"eval_overall_f1": 0.8195804195804196, |
|
"eval_overall_precision": 0.7792553191489362, |
|
"eval_overall_recall": 0.8643067846607669, |
|
"eval_runtime": 0.9256, |
|
"eval_samples_per_second": 202.037, |
|
"eval_steps_per_second": 3.241, |
|
"step": 6148 |
|
}, |
|
{ |
|
"epoch": 59.0, |
|
"grad_norm": 0.38071247935295105, |
|
"learning_rate": 2.05e-05, |
|
"loss": 0.0384, |
|
"step": 6254 |
|
}, |
|
{ |
|
"epoch": 59.0, |
|
"eval_LOCATION_f1": 0.8133333333333332, |
|
"eval_LOCATION_number": 72, |
|
"eval_LOCATION_precision": 0.782051282051282, |
|
"eval_LOCATION_recall": 0.8472222222222222, |
|
"eval_ORGANIZATION_f1": 0.7749999999999999, |
|
"eval_ORGANIZATION_number": 75, |
|
"eval_ORGANIZATION_precision": 0.7294117647058823, |
|
"eval_ORGANIZATION_recall": 0.8266666666666667, |
|
"eval_PERSON_f1": 0.8896321070234114, |
|
"eval_PERSON_number": 143, |
|
"eval_PERSON_precision": 0.8525641025641025, |
|
"eval_PERSON_recall": 0.9300699300699301, |
|
"eval_QUANTITY_f1": 0.6923076923076923, |
|
"eval_QUANTITY_number": 23, |
|
"eval_QUANTITY_precision": 0.6206896551724138, |
|
"eval_QUANTITY_recall": 0.782608695652174, |
|
"eval_TIME_f1": 0.75, |
|
"eval_TIME_number": 26, |
|
"eval_TIME_precision": 0.7, |
|
"eval_TIME_recall": 0.8076923076923077, |
|
"eval_loss": 0.17447121441364288, |
|
"eval_overall_accuracy": 0.957968476357268, |
|
"eval_overall_f1": 0.8228730822873082, |
|
"eval_overall_precision": 0.7804232804232805, |
|
"eval_overall_recall": 0.8702064896755162, |
|
"eval_runtime": 0.9356, |
|
"eval_samples_per_second": 199.869, |
|
"eval_steps_per_second": 3.206, |
|
"step": 6254 |
|
}, |
|
{ |
|
"epoch": 60.0, |
|
"grad_norm": 0.4309019446372986, |
|
"learning_rate": 2e-05, |
|
"loss": 0.0385, |
|
"step": 6360 |
|
}, |
|
{ |
|
"epoch": 60.0, |
|
"eval_LOCATION_f1": 0.8590604026845637, |
|
"eval_LOCATION_number": 72, |
|
"eval_LOCATION_precision": 0.8311688311688312, |
|
"eval_LOCATION_recall": 0.8888888888888888, |
|
"eval_ORGANIZATION_f1": 0.7757575757575759, |
|
"eval_ORGANIZATION_number": 75, |
|
"eval_ORGANIZATION_precision": 0.7111111111111111, |
|
"eval_ORGANIZATION_recall": 0.8533333333333334, |
|
"eval_PERSON_f1": 0.8874172185430464, |
|
"eval_PERSON_number": 143, |
|
"eval_PERSON_precision": 0.8427672955974843, |
|
"eval_PERSON_recall": 0.9370629370629371, |
|
"eval_QUANTITY_f1": 0.6428571428571429, |
|
"eval_QUANTITY_number": 23, |
|
"eval_QUANTITY_precision": 0.5454545454545454, |
|
"eval_QUANTITY_recall": 0.782608695652174, |
|
"eval_TIME_f1": 0.7407407407407408, |
|
"eval_TIME_number": 26, |
|
"eval_TIME_precision": 0.7142857142857143, |
|
"eval_TIME_recall": 0.7692307692307693, |
|
"eval_loss": 0.18776963651180267, |
|
"eval_overall_accuracy": 0.955716787590693, |
|
"eval_overall_f1": 0.8264462809917357, |
|
"eval_overall_precision": 0.7751937984496124, |
|
"eval_overall_recall": 0.8849557522123894, |
|
"eval_runtime": 0.9372, |
|
"eval_samples_per_second": 199.53, |
|
"eval_steps_per_second": 3.201, |
|
"step": 6360 |
|
}, |
|
{ |
|
"epoch": 61.0, |
|
"grad_norm": 1.0351260900497437, |
|
"learning_rate": 1.9500000000000003e-05, |
|
"loss": 0.0371, |
|
"step": 6466 |
|
}, |
|
{ |
|
"epoch": 61.0, |
|
"eval_LOCATION_f1": 0.8309859154929577, |
|
"eval_LOCATION_number": 72, |
|
"eval_LOCATION_precision": 0.8428571428571429, |
|
"eval_LOCATION_recall": 0.8194444444444444, |
|
"eval_ORGANIZATION_f1": 0.763157894736842, |
|
"eval_ORGANIZATION_number": 75, |
|
"eval_ORGANIZATION_precision": 0.7532467532467533, |
|
"eval_ORGANIZATION_recall": 0.7733333333333333, |
|
"eval_PERSON_f1": 0.8778877887788779, |
|
"eval_PERSON_number": 143, |
|
"eval_PERSON_precision": 0.83125, |
|
"eval_PERSON_recall": 0.9300699300699301, |
|
"eval_QUANTITY_f1": 0.6792452830188679, |
|
"eval_QUANTITY_number": 23, |
|
"eval_QUANTITY_precision": 0.6, |
|
"eval_QUANTITY_recall": 0.782608695652174, |
|
"eval_TIME_f1": 0.7407407407407408, |
|
"eval_TIME_number": 26, |
|
"eval_TIME_precision": 0.7142857142857143, |
|
"eval_TIME_recall": 0.7692307692307693, |
|
"eval_loss": 0.18786616623401642, |
|
"eval_overall_accuracy": 0.9562171628721541, |
|
"eval_overall_f1": 0.8181818181818181, |
|
"eval_overall_precision": 0.7890410958904109, |
|
"eval_overall_recall": 0.8495575221238938, |
|
"eval_runtime": 0.9236, |
|
"eval_samples_per_second": 202.479, |
|
"eval_steps_per_second": 3.248, |
|
"step": 6466 |
|
}, |
|
{ |
|
"epoch": 62.0, |
|
"grad_norm": 0.6741280555725098, |
|
"learning_rate": 1.9e-05, |
|
"loss": 0.0385, |
|
"step": 6572 |
|
}, |
|
{ |
|
"epoch": 62.0, |
|
"eval_LOCATION_f1": 0.7972972972972973, |
|
"eval_LOCATION_number": 72, |
|
"eval_LOCATION_precision": 0.7763157894736842, |
|
"eval_LOCATION_recall": 0.8194444444444444, |
|
"eval_ORGANIZATION_f1": 0.7894736842105264, |
|
"eval_ORGANIZATION_number": 75, |
|
"eval_ORGANIZATION_precision": 0.7792207792207793, |
|
"eval_ORGANIZATION_recall": 0.8, |
|
"eval_PERSON_f1": 0.8940397350993377, |
|
"eval_PERSON_number": 143, |
|
"eval_PERSON_precision": 0.8490566037735849, |
|
"eval_PERSON_recall": 0.9440559440559441, |
|
"eval_QUANTITY_f1": 0.6792452830188679, |
|
"eval_QUANTITY_number": 23, |
|
"eval_QUANTITY_precision": 0.6, |
|
"eval_QUANTITY_recall": 0.782608695652174, |
|
"eval_TIME_f1": 0.7142857142857142, |
|
"eval_TIME_number": 26, |
|
"eval_TIME_precision": 0.6666666666666666, |
|
"eval_TIME_recall": 0.7692307692307693, |
|
"eval_loss": 0.18338263034820557, |
|
"eval_overall_accuracy": 0.9574681010758068, |
|
"eval_overall_f1": 0.8213783403656821, |
|
"eval_overall_precision": 0.7849462365591398, |
|
"eval_overall_recall": 0.8613569321533924, |
|
"eval_runtime": 0.9302, |
|
"eval_samples_per_second": 201.036, |
|
"eval_steps_per_second": 3.225, |
|
"step": 6572 |
|
}, |
|
{ |
|
"epoch": 63.0, |
|
"grad_norm": 0.2608901560306549, |
|
"learning_rate": 1.85e-05, |
|
"loss": 0.0359, |
|
"step": 6678 |
|
}, |
|
{ |
|
"epoch": 63.0, |
|
"eval_LOCATION_f1": 0.816326530612245, |
|
"eval_LOCATION_number": 72, |
|
"eval_LOCATION_precision": 0.8, |
|
"eval_LOCATION_recall": 0.8333333333333334, |
|
"eval_ORGANIZATION_f1": 0.7777777777777777, |
|
"eval_ORGANIZATION_number": 75, |
|
"eval_ORGANIZATION_precision": 0.7241379310344828, |
|
"eval_ORGANIZATION_recall": 0.84, |
|
"eval_PERSON_f1": 0.9084745762711864, |
|
"eval_PERSON_number": 143, |
|
"eval_PERSON_precision": 0.881578947368421, |
|
"eval_PERSON_recall": 0.9370629370629371, |
|
"eval_QUANTITY_f1": 0.6545454545454547, |
|
"eval_QUANTITY_number": 23, |
|
"eval_QUANTITY_precision": 0.5625, |
|
"eval_QUANTITY_recall": 0.782608695652174, |
|
"eval_TIME_f1": 0.7017543859649122, |
|
"eval_TIME_number": 26, |
|
"eval_TIME_precision": 0.6451612903225806, |
|
"eval_TIME_recall": 0.7692307692307693, |
|
"eval_loss": 0.18453986942768097, |
|
"eval_overall_accuracy": 0.9587190392794596, |
|
"eval_overall_f1": 0.8240223463687151, |
|
"eval_overall_precision": 0.7824933687002652, |
|
"eval_overall_recall": 0.8702064896755162, |
|
"eval_runtime": 0.9321, |
|
"eval_samples_per_second": 200.623, |
|
"eval_steps_per_second": 3.219, |
|
"step": 6678 |
|
}, |
|
{ |
|
"epoch": 64.0, |
|
"grad_norm": 0.7726385593414307, |
|
"learning_rate": 1.8e-05, |
|
"loss": 0.0355, |
|
"step": 6784 |
|
}, |
|
{ |
|
"epoch": 64.0, |
|
"eval_LOCATION_f1": 0.816326530612245, |
|
"eval_LOCATION_number": 72, |
|
"eval_LOCATION_precision": 0.8, |
|
"eval_LOCATION_recall": 0.8333333333333334, |
|
"eval_ORGANIZATION_f1": 0.7484662576687117, |
|
"eval_ORGANIZATION_number": 75, |
|
"eval_ORGANIZATION_precision": 0.6931818181818182, |
|
"eval_ORGANIZATION_recall": 0.8133333333333334, |
|
"eval_PERSON_f1": 0.881578947368421, |
|
"eval_PERSON_number": 143, |
|
"eval_PERSON_precision": 0.8322981366459627, |
|
"eval_PERSON_recall": 0.9370629370629371, |
|
"eval_QUANTITY_f1": 0.6792452830188679, |
|
"eval_QUANTITY_number": 23, |
|
"eval_QUANTITY_precision": 0.6, |
|
"eval_QUANTITY_recall": 0.782608695652174, |
|
"eval_TIME_f1": 0.7407407407407408, |
|
"eval_TIME_number": 26, |
|
"eval_TIME_precision": 0.7142857142857143, |
|
"eval_TIME_recall": 0.7692307692307693, |
|
"eval_loss": 0.20165307819843292, |
|
"eval_overall_accuracy": 0.9542156617463098, |
|
"eval_overall_f1": 0.812760055478502, |
|
"eval_overall_precision": 0.7670157068062827, |
|
"eval_overall_recall": 0.8643067846607669, |
|
"eval_runtime": 0.957, |
|
"eval_samples_per_second": 195.402, |
|
"eval_steps_per_second": 3.135, |
|
"step": 6784 |
|
}, |
|
{ |
|
"epoch": 65.0, |
|
"grad_norm": 0.47850877046585083, |
|
"learning_rate": 1.75e-05, |
|
"loss": 0.0338, |
|
"step": 6890 |
|
}, |
|
{ |
|
"epoch": 65.0, |
|
"eval_LOCATION_f1": 0.7972972972972973, |
|
"eval_LOCATION_number": 72, |
|
"eval_LOCATION_precision": 0.7763157894736842, |
|
"eval_LOCATION_recall": 0.8194444444444444, |
|
"eval_ORGANIZATION_f1": 0.7712418300653594, |
|
"eval_ORGANIZATION_number": 75, |
|
"eval_ORGANIZATION_precision": 0.7564102564102564, |
|
"eval_ORGANIZATION_recall": 0.7866666666666666, |
|
"eval_PERSON_f1": 0.8903654485049833, |
|
"eval_PERSON_number": 143, |
|
"eval_PERSON_precision": 0.8481012658227848, |
|
"eval_PERSON_recall": 0.9370629370629371, |
|
"eval_QUANTITY_f1": 0.7058823529411765, |
|
"eval_QUANTITY_number": 23, |
|
"eval_QUANTITY_precision": 0.6428571428571429, |
|
"eval_QUANTITY_recall": 0.782608695652174, |
|
"eval_TIME_f1": 0.7547169811320754, |
|
"eval_TIME_number": 26, |
|
"eval_TIME_precision": 0.7407407407407407, |
|
"eval_TIME_recall": 0.7692307692307693, |
|
"eval_loss": 0.1862517148256302, |
|
"eval_overall_accuracy": 0.9569677257943457, |
|
"eval_overall_f1": 0.8215297450424929, |
|
"eval_overall_precision": 0.7901907356948229, |
|
"eval_overall_recall": 0.855457227138643, |
|
"eval_runtime": 0.9305, |
|
"eval_samples_per_second": 200.976, |
|
"eval_steps_per_second": 3.224, |
|
"step": 6890 |
|
}, |
|
{ |
|
"epoch": 66.0, |
|
"grad_norm": 1.3503855466842651, |
|
"learning_rate": 1.7000000000000003e-05, |
|
"loss": 0.0376, |
|
"step": 6996 |
|
}, |
|
{ |
|
"epoch": 66.0, |
|
"eval_LOCATION_f1": 0.8219178082191781, |
|
"eval_LOCATION_number": 72, |
|
"eval_LOCATION_precision": 0.8108108108108109, |
|
"eval_LOCATION_recall": 0.8333333333333334, |
|
"eval_ORGANIZATION_f1": 0.7792207792207794, |
|
"eval_ORGANIZATION_number": 75, |
|
"eval_ORGANIZATION_precision": 0.759493670886076, |
|
"eval_ORGANIZATION_recall": 0.8, |
|
"eval_PERSON_f1": 0.8852459016393444, |
|
"eval_PERSON_number": 143, |
|
"eval_PERSON_precision": 0.8333333333333334, |
|
"eval_PERSON_recall": 0.9440559440559441, |
|
"eval_QUANTITY_f1": 0.6666666666666667, |
|
"eval_QUANTITY_number": 23, |
|
"eval_QUANTITY_precision": 0.5806451612903226, |
|
"eval_QUANTITY_recall": 0.782608695652174, |
|
"eval_TIME_f1": 0.7407407407407408, |
|
"eval_TIME_number": 26, |
|
"eval_TIME_precision": 0.7142857142857143, |
|
"eval_TIME_recall": 0.7692307692307693, |
|
"eval_loss": 0.1855112761259079, |
|
"eval_overall_accuracy": 0.9564673505128847, |
|
"eval_overall_f1": 0.8218793828892006, |
|
"eval_overall_precision": 0.7834224598930482, |
|
"eval_overall_recall": 0.8643067846607669, |
|
"eval_runtime": 0.9291, |
|
"eval_samples_per_second": 201.265, |
|
"eval_steps_per_second": 3.229, |
|
"step": 6996 |
|
}, |
|
{ |
|
"epoch": 67.0, |
|
"grad_norm": 0.09078435599803925, |
|
"learning_rate": 1.65e-05, |
|
"loss": 0.0324, |
|
"step": 7102 |
|
}, |
|
{ |
|
"epoch": 67.0, |
|
"eval_LOCATION_f1": 0.816326530612245, |
|
"eval_LOCATION_number": 72, |
|
"eval_LOCATION_precision": 0.8, |
|
"eval_LOCATION_recall": 0.8333333333333334, |
|
"eval_ORGANIZATION_f1": 0.7712418300653594, |
|
"eval_ORGANIZATION_number": 75, |
|
"eval_ORGANIZATION_precision": 0.7564102564102564, |
|
"eval_ORGANIZATION_recall": 0.7866666666666666, |
|
"eval_PERSON_f1": 0.8675496688741723, |
|
"eval_PERSON_number": 143, |
|
"eval_PERSON_precision": 0.8238993710691824, |
|
"eval_PERSON_recall": 0.916083916083916, |
|
"eval_QUANTITY_f1": 0.6666666666666667, |
|
"eval_QUANTITY_number": 23, |
|
"eval_QUANTITY_precision": 0.5806451612903226, |
|
"eval_QUANTITY_recall": 0.782608695652174, |
|
"eval_TIME_f1": 0.7272727272727274, |
|
"eval_TIME_number": 26, |
|
"eval_TIME_precision": 0.6896551724137931, |
|
"eval_TIME_recall": 0.7692307692307693, |
|
"eval_loss": 0.19535928964614868, |
|
"eval_overall_accuracy": 0.9547160370277709, |
|
"eval_overall_f1": 0.810126582278481, |
|
"eval_overall_precision": 0.7741935483870968, |
|
"eval_overall_recall": 0.8495575221238938, |
|
"eval_runtime": 0.923, |
|
"eval_samples_per_second": 202.594, |
|
"eval_steps_per_second": 3.25, |
|
"step": 7102 |
|
}, |
|
{ |
|
"epoch": 68.0, |
|
"grad_norm": 0.13197369873523712, |
|
"learning_rate": 1.6000000000000003e-05, |
|
"loss": 0.0361, |
|
"step": 7208 |
|
}, |
|
{ |
|
"epoch": 68.0, |
|
"eval_LOCATION_f1": 0.8299319727891157, |
|
"eval_LOCATION_number": 72, |
|
"eval_LOCATION_precision": 0.8133333333333334, |
|
"eval_LOCATION_recall": 0.8472222222222222, |
|
"eval_ORGANIZATION_f1": 0.7407407407407408, |
|
"eval_ORGANIZATION_number": 75, |
|
"eval_ORGANIZATION_precision": 0.6896551724137931, |
|
"eval_ORGANIZATION_recall": 0.8, |
|
"eval_PERSON_f1": 0.8770764119601329, |
|
"eval_PERSON_number": 143, |
|
"eval_PERSON_precision": 0.8354430379746836, |
|
"eval_PERSON_recall": 0.9230769230769231, |
|
"eval_QUANTITY_f1": 0.6792452830188679, |
|
"eval_QUANTITY_number": 23, |
|
"eval_QUANTITY_precision": 0.6, |
|
"eval_QUANTITY_recall": 0.782608695652174, |
|
"eval_TIME_f1": 0.7407407407407408, |
|
"eval_TIME_number": 26, |
|
"eval_TIME_precision": 0.7142857142857143, |
|
"eval_TIME_recall": 0.7692307692307693, |
|
"eval_loss": 0.2019178867340088, |
|
"eval_overall_accuracy": 0.9534650988241181, |
|
"eval_overall_f1": 0.8117154811715481, |
|
"eval_overall_precision": 0.7698412698412699, |
|
"eval_overall_recall": 0.8584070796460177, |
|
"eval_runtime": 0.9293, |
|
"eval_samples_per_second": 201.226, |
|
"eval_steps_per_second": 3.228, |
|
"step": 7208 |
|
}, |
|
{ |
|
"epoch": 69.0, |
|
"grad_norm": 0.3539793789386749, |
|
"learning_rate": 1.55e-05, |
|
"loss": 0.0329, |
|
"step": 7314 |
|
}, |
|
{ |
|
"epoch": 69.0, |
|
"eval_LOCATION_f1": 0.8243243243243243, |
|
"eval_LOCATION_number": 72, |
|
"eval_LOCATION_precision": 0.8026315789473685, |
|
"eval_LOCATION_recall": 0.8472222222222222, |
|
"eval_ORGANIZATION_f1": 0.7468354430379747, |
|
"eval_ORGANIZATION_number": 75, |
|
"eval_ORGANIZATION_precision": 0.7108433734939759, |
|
"eval_ORGANIZATION_recall": 0.7866666666666666, |
|
"eval_PERSON_f1": 0.8741721854304637, |
|
"eval_PERSON_number": 143, |
|
"eval_PERSON_precision": 0.8301886792452831, |
|
"eval_PERSON_recall": 0.9230769230769231, |
|
"eval_QUANTITY_f1": 0.72, |
|
"eval_QUANTITY_number": 23, |
|
"eval_QUANTITY_precision": 0.6666666666666666, |
|
"eval_QUANTITY_recall": 0.782608695652174, |
|
"eval_TIME_f1": 0.7547169811320754, |
|
"eval_TIME_number": 26, |
|
"eval_TIME_precision": 0.7407407407407407, |
|
"eval_TIME_recall": 0.7692307692307693, |
|
"eval_loss": 0.1934998482465744, |
|
"eval_overall_accuracy": 0.9559669752314236, |
|
"eval_overall_f1": 0.8157524613220816, |
|
"eval_overall_precision": 0.7795698924731183, |
|
"eval_overall_recall": 0.855457227138643, |
|
"eval_runtime": 0.9314, |
|
"eval_samples_per_second": 200.776, |
|
"eval_steps_per_second": 3.221, |
|
"step": 7314 |
|
}, |
|
{ |
|
"epoch": 70.0, |
|
"grad_norm": 0.4102155566215515, |
|
"learning_rate": 1.5e-05, |
|
"loss": 0.0336, |
|
"step": 7420 |
|
}, |
|
{ |
|
"epoch": 70.0, |
|
"eval_LOCATION_f1": 0.8590604026845637, |
|
"eval_LOCATION_number": 72, |
|
"eval_LOCATION_precision": 0.8311688311688312, |
|
"eval_LOCATION_recall": 0.8888888888888888, |
|
"eval_ORGANIZATION_f1": 0.7407407407407408, |
|
"eval_ORGANIZATION_number": 75, |
|
"eval_ORGANIZATION_precision": 0.6896551724137931, |
|
"eval_ORGANIZATION_recall": 0.8, |
|
"eval_PERSON_f1": 0.8844884488448846, |
|
"eval_PERSON_number": 143, |
|
"eval_PERSON_precision": 0.8375, |
|
"eval_PERSON_recall": 0.9370629370629371, |
|
"eval_QUANTITY_f1": 0.72, |
|
"eval_QUANTITY_number": 23, |
|
"eval_QUANTITY_precision": 0.6666666666666666, |
|
"eval_QUANTITY_recall": 0.782608695652174, |
|
"eval_TIME_f1": 0.7547169811320754, |
|
"eval_TIME_number": 26, |
|
"eval_TIME_precision": 0.7407407407407407, |
|
"eval_TIME_recall": 0.7692307692307693, |
|
"eval_loss": 0.18642878532409668, |
|
"eval_overall_accuracy": 0.9582186639979985, |
|
"eval_overall_f1": 0.8256624825662482, |
|
"eval_overall_precision": 0.783068783068783, |
|
"eval_overall_recall": 0.8731563421828908, |
|
"eval_runtime": 0.9273, |
|
"eval_samples_per_second": 201.662, |
|
"eval_steps_per_second": 3.235, |
|
"step": 7420 |
|
}, |
|
{ |
|
"epoch": 71.0, |
|
"grad_norm": 0.9542334675788879, |
|
"learning_rate": 1.45e-05, |
|
"loss": 0.0346, |
|
"step": 7526 |
|
}, |
|
{ |
|
"epoch": 71.0, |
|
"eval_LOCATION_f1": 0.8413793103448277, |
|
"eval_LOCATION_number": 72, |
|
"eval_LOCATION_precision": 0.8356164383561644, |
|
"eval_LOCATION_recall": 0.8472222222222222, |
|
"eval_ORGANIZATION_f1": 0.6987951807228915, |
|
"eval_ORGANIZATION_number": 75, |
|
"eval_ORGANIZATION_precision": 0.6373626373626373, |
|
"eval_ORGANIZATION_recall": 0.7733333333333333, |
|
"eval_PERSON_f1": 0.8721311475409836, |
|
"eval_PERSON_number": 143, |
|
"eval_PERSON_precision": 0.8209876543209876, |
|
"eval_PERSON_recall": 0.9300699300699301, |
|
"eval_QUANTITY_f1": 0.6923076923076923, |
|
"eval_QUANTITY_number": 23, |
|
"eval_QUANTITY_precision": 0.6206896551724138, |
|
"eval_QUANTITY_recall": 0.782608695652174, |
|
"eval_TIME_f1": 0.7547169811320754, |
|
"eval_TIME_number": 26, |
|
"eval_TIME_precision": 0.7407407407407407, |
|
"eval_TIME_recall": 0.7692307692307693, |
|
"eval_loss": 0.18929119408130646, |
|
"eval_overall_accuracy": 0.9549662246685013, |
|
"eval_overall_f1": 0.8044382801664355, |
|
"eval_overall_precision": 0.7591623036649214, |
|
"eval_overall_recall": 0.855457227138643, |
|
"eval_runtime": 0.9224, |
|
"eval_samples_per_second": 202.728, |
|
"eval_steps_per_second": 3.252, |
|
"step": 7526 |
|
}, |
|
{ |
|
"epoch": 72.0, |
|
"grad_norm": 0.808494508266449, |
|
"learning_rate": 1.4000000000000001e-05, |
|
"loss": 0.0312, |
|
"step": 7632 |
|
}, |
|
{ |
|
"epoch": 72.0, |
|
"eval_LOCATION_f1": 0.8493150684931507, |
|
"eval_LOCATION_number": 72, |
|
"eval_LOCATION_precision": 0.8378378378378378, |
|
"eval_LOCATION_recall": 0.8611111111111112, |
|
"eval_ORGANIZATION_f1": 0.7407407407407408, |
|
"eval_ORGANIZATION_number": 75, |
|
"eval_ORGANIZATION_precision": 0.6896551724137931, |
|
"eval_ORGANIZATION_recall": 0.8, |
|
"eval_PERSON_f1": 0.8903654485049833, |
|
"eval_PERSON_number": 143, |
|
"eval_PERSON_precision": 0.8481012658227848, |
|
"eval_PERSON_recall": 0.9370629370629371, |
|
"eval_QUANTITY_f1": 0.6666666666666667, |
|
"eval_QUANTITY_number": 23, |
|
"eval_QUANTITY_precision": 0.5806451612903226, |
|
"eval_QUANTITY_recall": 0.782608695652174, |
|
"eval_TIME_f1": 0.7547169811320754, |
|
"eval_TIME_number": 26, |
|
"eval_TIME_precision": 0.7407407407407407, |
|
"eval_TIME_recall": 0.7692307692307693, |
|
"eval_loss": 0.1959969848394394, |
|
"eval_overall_accuracy": 0.9569677257943457, |
|
"eval_overall_f1": 0.8212290502793296, |
|
"eval_overall_precision": 0.7798408488063661, |
|
"eval_overall_recall": 0.8672566371681416, |
|
"eval_runtime": 0.9295, |
|
"eval_samples_per_second": 201.192, |
|
"eval_steps_per_second": 3.228, |
|
"step": 7632 |
|
}, |
|
{ |
|
"epoch": 73.0, |
|
"grad_norm": 1.9524306058883667, |
|
"learning_rate": 1.3500000000000001e-05, |
|
"loss": 0.0342, |
|
"step": 7738 |
|
}, |
|
{ |
|
"epoch": 73.0, |
|
"eval_LOCATION_f1": 0.8378378378378377, |
|
"eval_LOCATION_number": 72, |
|
"eval_LOCATION_precision": 0.8157894736842105, |
|
"eval_LOCATION_recall": 0.8611111111111112, |
|
"eval_ORGANIZATION_f1": 0.7544910179640718, |
|
"eval_ORGANIZATION_number": 75, |
|
"eval_ORGANIZATION_precision": 0.6847826086956522, |
|
"eval_ORGANIZATION_recall": 0.84, |
|
"eval_PERSON_f1": 0.8800000000000001, |
|
"eval_PERSON_number": 143, |
|
"eval_PERSON_precision": 0.8407643312101911, |
|
"eval_PERSON_recall": 0.9230769230769231, |
|
"eval_QUANTITY_f1": 0.7058823529411765, |
|
"eval_QUANTITY_number": 23, |
|
"eval_QUANTITY_precision": 0.6428571428571429, |
|
"eval_QUANTITY_recall": 0.782608695652174, |
|
"eval_TIME_f1": 0.7272727272727274, |
|
"eval_TIME_number": 26, |
|
"eval_TIME_precision": 0.6896551724137931, |
|
"eval_TIME_recall": 0.7692307692307693, |
|
"eval_loss": 0.19410043954849243, |
|
"eval_overall_accuracy": 0.9554665999499625, |
|
"eval_overall_f1": 0.8183079056865463, |
|
"eval_overall_precision": 0.7722513089005235, |
|
"eval_overall_recall": 0.8702064896755162, |
|
"eval_runtime": 1.0344, |
|
"eval_samples_per_second": 180.783, |
|
"eval_steps_per_second": 2.9, |
|
"step": 7738 |
|
}, |
|
{ |
|
"epoch": 74.0, |
|
"grad_norm": 1.1691898107528687, |
|
"learning_rate": 1.3000000000000001e-05, |
|
"loss": 0.0319, |
|
"step": 7844 |
|
}, |
|
{ |
|
"epoch": 74.0, |
|
"eval_LOCATION_f1": 0.847682119205298, |
|
"eval_LOCATION_number": 72, |
|
"eval_LOCATION_precision": 0.810126582278481, |
|
"eval_LOCATION_recall": 0.8888888888888888, |
|
"eval_ORGANIZATION_f1": 0.7701863354037267, |
|
"eval_ORGANIZATION_number": 75, |
|
"eval_ORGANIZATION_precision": 0.7209302325581395, |
|
"eval_ORGANIZATION_recall": 0.8266666666666667, |
|
"eval_PERSON_f1": 0.8823529411764706, |
|
"eval_PERSON_number": 143, |
|
"eval_PERSON_precision": 0.8282208588957055, |
|
"eval_PERSON_recall": 0.9440559440559441, |
|
"eval_QUANTITY_f1": 0.6923076923076923, |
|
"eval_QUANTITY_number": 23, |
|
"eval_QUANTITY_precision": 0.6206896551724138, |
|
"eval_QUANTITY_recall": 0.782608695652174, |
|
"eval_TIME_f1": 0.7142857142857142, |
|
"eval_TIME_number": 26, |
|
"eval_TIME_precision": 0.6666666666666666, |
|
"eval_TIME_recall": 0.7692307692307693, |
|
"eval_loss": 0.1930677443742752, |
|
"eval_overall_accuracy": 0.9582186639979985, |
|
"eval_overall_f1": 0.8236914600550964, |
|
"eval_overall_precision": 0.772609819121447, |
|
"eval_overall_recall": 0.8820058997050148, |
|
"eval_runtime": 0.9301, |
|
"eval_samples_per_second": 201.064, |
|
"eval_steps_per_second": 3.226, |
|
"step": 7844 |
|
}, |
|
{ |
|
"epoch": 75.0, |
|
"grad_norm": 1.1448065042495728, |
|
"learning_rate": 1.25e-05, |
|
"loss": 0.0293, |
|
"step": 7950 |
|
}, |
|
{ |
|
"epoch": 75.0, |
|
"eval_LOCATION_f1": 0.8322147651006712, |
|
"eval_LOCATION_number": 72, |
|
"eval_LOCATION_precision": 0.8051948051948052, |
|
"eval_LOCATION_recall": 0.8611111111111112, |
|
"eval_ORGANIZATION_f1": 0.7500000000000001, |
|
"eval_ORGANIZATION_number": 75, |
|
"eval_ORGANIZATION_precision": 0.7058823529411765, |
|
"eval_ORGANIZATION_recall": 0.8, |
|
"eval_PERSON_f1": 0.8712871287128713, |
|
"eval_PERSON_number": 143, |
|
"eval_PERSON_precision": 0.825, |
|
"eval_PERSON_recall": 0.9230769230769231, |
|
"eval_QUANTITY_f1": 0.6923076923076923, |
|
"eval_QUANTITY_number": 23, |
|
"eval_QUANTITY_precision": 0.6206896551724138, |
|
"eval_QUANTITY_recall": 0.782608695652174, |
|
"eval_TIME_f1": 0.7547169811320754, |
|
"eval_TIME_number": 26, |
|
"eval_TIME_precision": 0.7407407407407407, |
|
"eval_TIME_recall": 0.7692307692307693, |
|
"eval_loss": 0.1969723254442215, |
|
"eval_overall_accuracy": 0.9552164123092319, |
|
"eval_overall_f1": 0.8145048814504882, |
|
"eval_overall_precision": 0.7724867724867724, |
|
"eval_overall_recall": 0.8613569321533924, |
|
"eval_runtime": 0.934, |
|
"eval_samples_per_second": 200.216, |
|
"eval_steps_per_second": 3.212, |
|
"step": 7950 |
|
}, |
|
{ |
|
"epoch": 76.0, |
|
"grad_norm": 0.8883477449417114, |
|
"learning_rate": 1.2e-05, |
|
"loss": 0.0311, |
|
"step": 8056 |
|
}, |
|
{ |
|
"epoch": 76.0, |
|
"eval_LOCATION_f1": 0.8400000000000001, |
|
"eval_LOCATION_number": 72, |
|
"eval_LOCATION_precision": 0.8076923076923077, |
|
"eval_LOCATION_recall": 0.875, |
|
"eval_ORGANIZATION_f1": 0.7530864197530864, |
|
"eval_ORGANIZATION_number": 75, |
|
"eval_ORGANIZATION_precision": 0.7011494252873564, |
|
"eval_ORGANIZATION_recall": 0.8133333333333334, |
|
"eval_PERSON_f1": 0.8823529411764706, |
|
"eval_PERSON_number": 143, |
|
"eval_PERSON_precision": 0.8282208588957055, |
|
"eval_PERSON_recall": 0.9440559440559441, |
|
"eval_QUANTITY_f1": 0.7058823529411765, |
|
"eval_QUANTITY_number": 23, |
|
"eval_QUANTITY_precision": 0.6428571428571429, |
|
"eval_QUANTITY_recall": 0.782608695652174, |
|
"eval_TIME_f1": 0.7777777777777779, |
|
"eval_TIME_number": 26, |
|
"eval_TIME_precision": 0.75, |
|
"eval_TIME_recall": 0.8076923076923077, |
|
"eval_loss": 0.18665479123592377, |
|
"eval_overall_accuracy": 0.9582186639979985, |
|
"eval_overall_f1": 0.8243430152143844, |
|
"eval_overall_precision": 0.7760416666666666, |
|
"eval_overall_recall": 0.8790560471976401, |
|
"eval_runtime": 0.9252, |
|
"eval_samples_per_second": 202.11, |
|
"eval_steps_per_second": 3.242, |
|
"step": 8056 |
|
}, |
|
{ |
|
"epoch": 77.0, |
|
"grad_norm": 0.35357949137687683, |
|
"learning_rate": 1.1500000000000002e-05, |
|
"loss": 0.0299, |
|
"step": 8162 |
|
}, |
|
{ |
|
"epoch": 77.0, |
|
"eval_LOCATION_f1": 0.8344370860927153, |
|
"eval_LOCATION_number": 72, |
|
"eval_LOCATION_precision": 0.7974683544303798, |
|
"eval_LOCATION_recall": 0.875, |
|
"eval_ORGANIZATION_f1": 0.7530864197530864, |
|
"eval_ORGANIZATION_number": 75, |
|
"eval_ORGANIZATION_precision": 0.7011494252873564, |
|
"eval_ORGANIZATION_recall": 0.8133333333333334, |
|
"eval_PERSON_f1": 0.8852459016393444, |
|
"eval_PERSON_number": 143, |
|
"eval_PERSON_precision": 0.8333333333333334, |
|
"eval_PERSON_recall": 0.9440559440559441, |
|
"eval_QUANTITY_f1": 0.6923076923076923, |
|
"eval_QUANTITY_number": 23, |
|
"eval_QUANTITY_precision": 0.6206896551724138, |
|
"eval_QUANTITY_recall": 0.782608695652174, |
|
"eval_TIME_f1": 0.7142857142857142, |
|
"eval_TIME_number": 26, |
|
"eval_TIME_precision": 0.6666666666666666, |
|
"eval_TIME_recall": 0.7692307692307693, |
|
"eval_loss": 0.19146093726158142, |
|
"eval_overall_accuracy": 0.9564673505128847, |
|
"eval_overall_f1": 0.8181818181818181, |
|
"eval_overall_precision": 0.7674418604651163, |
|
"eval_overall_recall": 0.8761061946902655, |
|
"eval_runtime": 0.9261, |
|
"eval_samples_per_second": 201.927, |
|
"eval_steps_per_second": 3.239, |
|
"step": 8162 |
|
}, |
|
{ |
|
"epoch": 78.0, |
|
"grad_norm": 0.7683406472206116, |
|
"learning_rate": 1.1000000000000001e-05, |
|
"loss": 0.03, |
|
"step": 8268 |
|
}, |
|
{ |
|
"epoch": 78.0, |
|
"eval_LOCATION_f1": 0.8219178082191781, |
|
"eval_LOCATION_number": 72, |
|
"eval_LOCATION_precision": 0.8108108108108109, |
|
"eval_LOCATION_recall": 0.8333333333333334, |
|
"eval_ORGANIZATION_f1": 0.7354838709677418, |
|
"eval_ORGANIZATION_number": 75, |
|
"eval_ORGANIZATION_precision": 0.7125, |
|
"eval_ORGANIZATION_recall": 0.76, |
|
"eval_PERSON_f1": 0.8844884488448846, |
|
"eval_PERSON_number": 143, |
|
"eval_PERSON_precision": 0.8375, |
|
"eval_PERSON_recall": 0.9370629370629371, |
|
"eval_QUANTITY_f1": 0.7058823529411765, |
|
"eval_QUANTITY_number": 23, |
|
"eval_QUANTITY_precision": 0.6428571428571429, |
|
"eval_QUANTITY_recall": 0.782608695652174, |
|
"eval_TIME_f1": 0.7272727272727274, |
|
"eval_TIME_number": 26, |
|
"eval_TIME_precision": 0.6896551724137931, |
|
"eval_TIME_recall": 0.7692307692307693, |
|
"eval_loss": 0.19335182011127472, |
|
"eval_overall_accuracy": 0.9569677257943457, |
|
"eval_overall_f1": 0.8140845070422535, |
|
"eval_overall_precision": 0.7789757412398922, |
|
"eval_overall_recall": 0.8525073746312685, |
|
"eval_runtime": 0.9288, |
|
"eval_samples_per_second": 201.33, |
|
"eval_steps_per_second": 3.23, |
|
"step": 8268 |
|
}, |
|
{ |
|
"epoch": 79.0, |
|
"grad_norm": 1.1292208433151245, |
|
"learning_rate": 1.05e-05, |
|
"loss": 0.0305, |
|
"step": 8374 |
|
}, |
|
{ |
|
"epoch": 79.0, |
|
"eval_LOCATION_f1": 0.816326530612245, |
|
"eval_LOCATION_number": 72, |
|
"eval_LOCATION_precision": 0.8, |
|
"eval_LOCATION_recall": 0.8333333333333334, |
|
"eval_ORGANIZATION_f1": 0.7577639751552795, |
|
"eval_ORGANIZATION_number": 75, |
|
"eval_ORGANIZATION_precision": 0.7093023255813954, |
|
"eval_ORGANIZATION_recall": 0.8133333333333334, |
|
"eval_PERSON_f1": 0.8874172185430464, |
|
"eval_PERSON_number": 143, |
|
"eval_PERSON_precision": 0.8427672955974843, |
|
"eval_PERSON_recall": 0.9370629370629371, |
|
"eval_QUANTITY_f1": 0.6923076923076923, |
|
"eval_QUANTITY_number": 23, |
|
"eval_QUANTITY_precision": 0.6206896551724138, |
|
"eval_QUANTITY_recall": 0.782608695652174, |
|
"eval_TIME_f1": 0.7272727272727274, |
|
"eval_TIME_number": 26, |
|
"eval_TIME_precision": 0.6896551724137931, |
|
"eval_TIME_recall": 0.7692307692307693, |
|
"eval_loss": 0.1943107694387436, |
|
"eval_overall_accuracy": 0.9567175381536153, |
|
"eval_overall_f1": 0.8172942817294282, |
|
"eval_overall_precision": 0.7751322751322751, |
|
"eval_overall_recall": 0.8643067846607669, |
|
"eval_runtime": 0.9335, |
|
"eval_samples_per_second": 200.331, |
|
"eval_steps_per_second": 3.214, |
|
"step": 8374 |
|
}, |
|
{ |
|
"epoch": 80.0, |
|
"grad_norm": 0.6603876948356628, |
|
"learning_rate": 1e-05, |
|
"loss": 0.0306, |
|
"step": 8480 |
|
}, |
|
{ |
|
"epoch": 80.0, |
|
"eval_LOCATION_f1": 0.8, |
|
"eval_LOCATION_number": 72, |
|
"eval_LOCATION_precision": 0.7945205479452054, |
|
"eval_LOCATION_recall": 0.8055555555555556, |
|
"eval_ORGANIZATION_f1": 0.7577639751552795, |
|
"eval_ORGANIZATION_number": 75, |
|
"eval_ORGANIZATION_precision": 0.7093023255813954, |
|
"eval_ORGANIZATION_recall": 0.8133333333333334, |
|
"eval_PERSON_f1": 0.8823529411764706, |
|
"eval_PERSON_number": 143, |
|
"eval_PERSON_precision": 0.8282208588957055, |
|
"eval_PERSON_recall": 0.9440559440559441, |
|
"eval_QUANTITY_f1": 0.7058823529411765, |
|
"eval_QUANTITY_number": 23, |
|
"eval_QUANTITY_precision": 0.6428571428571429, |
|
"eval_QUANTITY_recall": 0.782608695652174, |
|
"eval_TIME_f1": 0.7636363636363636, |
|
"eval_TIME_number": 26, |
|
"eval_TIME_precision": 0.7241379310344828, |
|
"eval_TIME_recall": 0.8076923076923077, |
|
"eval_loss": 0.19313213229179382, |
|
"eval_overall_accuracy": 0.9574681010758068, |
|
"eval_overall_f1": 0.8161559888579387, |
|
"eval_overall_precision": 0.7730870712401056, |
|
"eval_overall_recall": 0.8643067846607669, |
|
"eval_runtime": 0.9289, |
|
"eval_samples_per_second": 201.304, |
|
"eval_steps_per_second": 3.229, |
|
"step": 8480 |
|
}, |
|
{ |
|
"epoch": 81.0, |
|
"grad_norm": 0.466139554977417, |
|
"learning_rate": 9.5e-06, |
|
"loss": 0.0286, |
|
"step": 8586 |
|
}, |
|
{ |
|
"epoch": 81.0, |
|
"eval_LOCATION_f1": 0.802721088435374, |
|
"eval_LOCATION_number": 72, |
|
"eval_LOCATION_precision": 0.7866666666666666, |
|
"eval_LOCATION_recall": 0.8194444444444444, |
|
"eval_ORGANIZATION_f1": 0.7701863354037267, |
|
"eval_ORGANIZATION_number": 75, |
|
"eval_ORGANIZATION_precision": 0.7209302325581395, |
|
"eval_ORGANIZATION_recall": 0.8266666666666667, |
|
"eval_PERSON_f1": 0.8758169934640523, |
|
"eval_PERSON_number": 143, |
|
"eval_PERSON_precision": 0.8220858895705522, |
|
"eval_PERSON_recall": 0.9370629370629371, |
|
"eval_QUANTITY_f1": 0.7058823529411765, |
|
"eval_QUANTITY_number": 23, |
|
"eval_QUANTITY_precision": 0.6428571428571429, |
|
"eval_QUANTITY_recall": 0.782608695652174, |
|
"eval_TIME_f1": 0.7272727272727274, |
|
"eval_TIME_number": 26, |
|
"eval_TIME_precision": 0.6896551724137931, |
|
"eval_TIME_recall": 0.7692307692307693, |
|
"eval_loss": 0.19068394601345062, |
|
"eval_overall_accuracy": 0.955716787590693, |
|
"eval_overall_f1": 0.8138888888888888, |
|
"eval_overall_precision": 0.7690288713910761, |
|
"eval_overall_recall": 0.8643067846607669, |
|
"eval_runtime": 0.9312, |
|
"eval_samples_per_second": 200.826, |
|
"eval_steps_per_second": 3.222, |
|
"step": 8586 |
|
}, |
|
{ |
|
"epoch": 82.0, |
|
"grad_norm": 0.6404593586921692, |
|
"learning_rate": 9e-06, |
|
"loss": 0.0283, |
|
"step": 8692 |
|
}, |
|
{ |
|
"epoch": 82.0, |
|
"eval_LOCATION_f1": 0.8322147651006712, |
|
"eval_LOCATION_number": 72, |
|
"eval_LOCATION_precision": 0.8051948051948052, |
|
"eval_LOCATION_recall": 0.8611111111111112, |
|
"eval_ORGANIZATION_f1": 0.7483870967741936, |
|
"eval_ORGANIZATION_number": 75, |
|
"eval_ORGANIZATION_precision": 0.725, |
|
"eval_ORGANIZATION_recall": 0.7733333333333333, |
|
"eval_PERSON_f1": 0.8692810457516339, |
|
"eval_PERSON_number": 143, |
|
"eval_PERSON_precision": 0.8159509202453987, |
|
"eval_PERSON_recall": 0.9300699300699301, |
|
"eval_QUANTITY_f1": 0.6923076923076923, |
|
"eval_QUANTITY_number": 23, |
|
"eval_QUANTITY_precision": 0.6206896551724138, |
|
"eval_QUANTITY_recall": 0.782608695652174, |
|
"eval_TIME_f1": 0.7142857142857142, |
|
"eval_TIME_number": 26, |
|
"eval_TIME_precision": 0.6666666666666666, |
|
"eval_TIME_recall": 0.7692307692307693, |
|
"eval_loss": 0.19274306297302246, |
|
"eval_overall_accuracy": 0.957968476357268, |
|
"eval_overall_f1": 0.8105849582172702, |
|
"eval_overall_precision": 0.7678100263852242, |
|
"eval_overall_recall": 0.8584070796460177, |
|
"eval_runtime": 0.9998, |
|
"eval_samples_per_second": 187.045, |
|
"eval_steps_per_second": 3.001, |
|
"step": 8692 |
|
}, |
|
{ |
|
"epoch": 83.0, |
|
"grad_norm": 0.17559492588043213, |
|
"learning_rate": 8.500000000000002e-06, |
|
"loss": 0.0289, |
|
"step": 8798 |
|
}, |
|
{ |
|
"epoch": 83.0, |
|
"eval_LOCATION_f1": 0.8, |
|
"eval_LOCATION_number": 72, |
|
"eval_LOCATION_precision": 0.7945205479452054, |
|
"eval_LOCATION_recall": 0.8055555555555556, |
|
"eval_ORGANIZATION_f1": 0.7500000000000001, |
|
"eval_ORGANIZATION_number": 75, |
|
"eval_ORGANIZATION_precision": 0.7058823529411765, |
|
"eval_ORGANIZATION_recall": 0.8, |
|
"eval_PERSON_f1": 0.8750000000000001, |
|
"eval_PERSON_number": 143, |
|
"eval_PERSON_precision": 0.8260869565217391, |
|
"eval_PERSON_recall": 0.9300699300699301, |
|
"eval_QUANTITY_f1": 0.7058823529411765, |
|
"eval_QUANTITY_number": 23, |
|
"eval_QUANTITY_precision": 0.6428571428571429, |
|
"eval_QUANTITY_recall": 0.782608695652174, |
|
"eval_TIME_f1": 0.7272727272727274, |
|
"eval_TIME_number": 26, |
|
"eval_TIME_precision": 0.6896551724137931, |
|
"eval_TIME_recall": 0.7692307692307693, |
|
"eval_loss": 0.1927793323993683, |
|
"eval_overall_accuracy": 0.9564673505128847, |
|
"eval_overall_f1": 0.8083916083916084, |
|
"eval_overall_precision": 0.7686170212765957, |
|
"eval_overall_recall": 0.8525073746312685, |
|
"eval_runtime": 0.9268, |
|
"eval_samples_per_second": 201.759, |
|
"eval_steps_per_second": 3.237, |
|
"step": 8798 |
|
}, |
|
{ |
|
"epoch": 84.0, |
|
"grad_norm": 1.3301130533218384, |
|
"learning_rate": 8.000000000000001e-06, |
|
"loss": 0.0289, |
|
"step": 8904 |
|
}, |
|
{ |
|
"epoch": 84.0, |
|
"eval_LOCATION_f1": 0.8082191780821918, |
|
"eval_LOCATION_number": 72, |
|
"eval_LOCATION_precision": 0.7972972972972973, |
|
"eval_LOCATION_recall": 0.8194444444444444, |
|
"eval_ORGANIZATION_f1": 0.7530864197530864, |
|
"eval_ORGANIZATION_number": 75, |
|
"eval_ORGANIZATION_precision": 0.7011494252873564, |
|
"eval_ORGANIZATION_recall": 0.8133333333333334, |
|
"eval_PERSON_f1": 0.8844884488448846, |
|
"eval_PERSON_number": 143, |
|
"eval_PERSON_precision": 0.8375, |
|
"eval_PERSON_recall": 0.9370629370629371, |
|
"eval_QUANTITY_f1": 0.7058823529411765, |
|
"eval_QUANTITY_number": 23, |
|
"eval_QUANTITY_precision": 0.6428571428571429, |
|
"eval_QUANTITY_recall": 0.782608695652174, |
|
"eval_TIME_f1": 0.7636363636363636, |
|
"eval_TIME_number": 26, |
|
"eval_TIME_precision": 0.7241379310344828, |
|
"eval_TIME_recall": 0.8076923076923077, |
|
"eval_loss": 0.19638177752494812, |
|
"eval_overall_accuracy": 0.9572179134350763, |
|
"eval_overall_f1": 0.8172942817294282, |
|
"eval_overall_precision": 0.7751322751322751, |
|
"eval_overall_recall": 0.8643067846607669, |
|
"eval_runtime": 0.9332, |
|
"eval_samples_per_second": 200.396, |
|
"eval_steps_per_second": 3.215, |
|
"step": 8904 |
|
}, |
|
{ |
|
"epoch": 85.0, |
|
"grad_norm": 0.19960090517997742, |
|
"learning_rate": 7.5e-06, |
|
"loss": 0.0283, |
|
"step": 9010 |
|
}, |
|
{ |
|
"epoch": 85.0, |
|
"eval_LOCATION_f1": 0.8053691275167787, |
|
"eval_LOCATION_number": 72, |
|
"eval_LOCATION_precision": 0.7792207792207793, |
|
"eval_LOCATION_recall": 0.8333333333333334, |
|
"eval_ORGANIZATION_f1": 0.7564102564102564, |
|
"eval_ORGANIZATION_number": 75, |
|
"eval_ORGANIZATION_precision": 0.7283950617283951, |
|
"eval_ORGANIZATION_recall": 0.7866666666666666, |
|
"eval_PERSON_f1": 0.8823529411764706, |
|
"eval_PERSON_number": 143, |
|
"eval_PERSON_precision": 0.8282208588957055, |
|
"eval_PERSON_recall": 0.9440559440559441, |
|
"eval_QUANTITY_f1": 0.6923076923076923, |
|
"eval_QUANTITY_number": 23, |
|
"eval_QUANTITY_precision": 0.6206896551724138, |
|
"eval_QUANTITY_recall": 0.782608695652174, |
|
"eval_TIME_f1": 0.7407407407407408, |
|
"eval_TIME_number": 26, |
|
"eval_TIME_precision": 0.7142857142857143, |
|
"eval_TIME_recall": 0.7692307692307693, |
|
"eval_loss": 0.19612807035446167, |
|
"eval_overall_accuracy": 0.9572179134350763, |
|
"eval_overall_f1": 0.8145048814504882, |
|
"eval_overall_precision": 0.7724867724867724, |
|
"eval_overall_recall": 0.8613569321533924, |
|
"eval_runtime": 0.9383, |
|
"eval_samples_per_second": 199.303, |
|
"eval_steps_per_second": 3.197, |
|
"step": 9010 |
|
}, |
|
{ |
|
"epoch": 86.0, |
|
"grad_norm": 0.7677280306816101, |
|
"learning_rate": 7.000000000000001e-06, |
|
"loss": 0.0279, |
|
"step": 9116 |
|
}, |
|
{ |
|
"epoch": 86.0, |
|
"eval_LOCATION_f1": 0.7919463087248323, |
|
"eval_LOCATION_number": 72, |
|
"eval_LOCATION_precision": 0.7662337662337663, |
|
"eval_LOCATION_recall": 0.8194444444444444, |
|
"eval_ORGANIZATION_f1": 0.7564102564102564, |
|
"eval_ORGANIZATION_number": 75, |
|
"eval_ORGANIZATION_precision": 0.7283950617283951, |
|
"eval_ORGANIZATION_recall": 0.7866666666666666, |
|
"eval_PERSON_f1": 0.8786885245901639, |
|
"eval_PERSON_number": 143, |
|
"eval_PERSON_precision": 0.8271604938271605, |
|
"eval_PERSON_recall": 0.9370629370629371, |
|
"eval_QUANTITY_f1": 0.6923076923076923, |
|
"eval_QUANTITY_number": 23, |
|
"eval_QUANTITY_precision": 0.6206896551724138, |
|
"eval_QUANTITY_recall": 0.782608695652174, |
|
"eval_TIME_f1": 0.7272727272727274, |
|
"eval_TIME_number": 26, |
|
"eval_TIME_precision": 0.6896551724137931, |
|
"eval_TIME_recall": 0.7692307692307693, |
|
"eval_loss": 0.20059086382389069, |
|
"eval_overall_accuracy": 0.9549662246685013, |
|
"eval_overall_f1": 0.8089260808926081, |
|
"eval_overall_precision": 0.7671957671957672, |
|
"eval_overall_recall": 0.855457227138643, |
|
"eval_runtime": 0.9285, |
|
"eval_samples_per_second": 201.396, |
|
"eval_steps_per_second": 3.231, |
|
"step": 9116 |
|
}, |
|
{ |
|
"epoch": 87.0, |
|
"grad_norm": 0.65785813331604, |
|
"learning_rate": 6.5000000000000004e-06, |
|
"loss": 0.0288, |
|
"step": 9222 |
|
}, |
|
{ |
|
"epoch": 87.0, |
|
"eval_LOCATION_f1": 0.8053691275167787, |
|
"eval_LOCATION_number": 72, |
|
"eval_LOCATION_precision": 0.7792207792207793, |
|
"eval_LOCATION_recall": 0.8333333333333334, |
|
"eval_ORGANIZATION_f1": 0.7701863354037267, |
|
"eval_ORGANIZATION_number": 75, |
|
"eval_ORGANIZATION_precision": 0.7209302325581395, |
|
"eval_ORGANIZATION_recall": 0.8266666666666667, |
|
"eval_PERSON_f1": 0.8758169934640523, |
|
"eval_PERSON_number": 143, |
|
"eval_PERSON_precision": 0.8220858895705522, |
|
"eval_PERSON_recall": 0.9370629370629371, |
|
"eval_QUANTITY_f1": 0.6923076923076923, |
|
"eval_QUANTITY_number": 23, |
|
"eval_QUANTITY_precision": 0.6206896551724138, |
|
"eval_QUANTITY_recall": 0.782608695652174, |
|
"eval_TIME_f1": 0.7407407407407408, |
|
"eval_TIME_number": 26, |
|
"eval_TIME_precision": 0.7142857142857143, |
|
"eval_TIME_recall": 0.7692307692307693, |
|
"eval_loss": 0.20255452394485474, |
|
"eval_overall_accuracy": 0.9559669752314236, |
|
"eval_overall_f1": 0.8144044321329639, |
|
"eval_overall_precision": 0.7676240208877284, |
|
"eval_overall_recall": 0.8672566371681416, |
|
"eval_runtime": 0.9402, |
|
"eval_samples_per_second": 198.885, |
|
"eval_steps_per_second": 3.191, |
|
"step": 9222 |
|
}, |
|
{ |
|
"epoch": 88.0, |
|
"grad_norm": 1.4090750217437744, |
|
"learning_rate": 6e-06, |
|
"loss": 0.0275, |
|
"step": 9328 |
|
}, |
|
{ |
|
"epoch": 88.0, |
|
"eval_LOCATION_f1": 0.8026315789473685, |
|
"eval_LOCATION_number": 72, |
|
"eval_LOCATION_precision": 0.7625, |
|
"eval_LOCATION_recall": 0.8472222222222222, |
|
"eval_ORGANIZATION_f1": 0.7450980392156863, |
|
"eval_ORGANIZATION_number": 75, |
|
"eval_ORGANIZATION_precision": 0.7307692307692307, |
|
"eval_ORGANIZATION_recall": 0.76, |
|
"eval_PERSON_f1": 0.8831168831168831, |
|
"eval_PERSON_number": 143, |
|
"eval_PERSON_precision": 0.8242424242424242, |
|
"eval_PERSON_recall": 0.951048951048951, |
|
"eval_QUANTITY_f1": 0.6923076923076923, |
|
"eval_QUANTITY_number": 23, |
|
"eval_QUANTITY_precision": 0.6206896551724138, |
|
"eval_QUANTITY_recall": 0.782608695652174, |
|
"eval_TIME_f1": 0.7407407407407408, |
|
"eval_TIME_number": 26, |
|
"eval_TIME_precision": 0.7142857142857143, |
|
"eval_TIME_recall": 0.7692307692307693, |
|
"eval_loss": 0.19975264370441437, |
|
"eval_overall_accuracy": 0.9569677257943457, |
|
"eval_overall_f1": 0.812239221140473, |
|
"eval_overall_precision": 0.7684210526315789, |
|
"eval_overall_recall": 0.8613569321533924, |
|
"eval_runtime": 0.9248, |
|
"eval_samples_per_second": 202.217, |
|
"eval_steps_per_second": 3.244, |
|
"step": 9328 |
|
}, |
|
{ |
|
"epoch": 89.0, |
|
"grad_norm": 0.6550692319869995, |
|
"learning_rate": 5.500000000000001e-06, |
|
"loss": 0.0272, |
|
"step": 9434 |
|
}, |
|
{ |
|
"epoch": 89.0, |
|
"eval_LOCATION_f1": 0.8211920529801324, |
|
"eval_LOCATION_number": 72, |
|
"eval_LOCATION_precision": 0.7848101265822784, |
|
"eval_LOCATION_recall": 0.8611111111111112, |
|
"eval_ORGANIZATION_f1": 0.7515151515151515, |
|
"eval_ORGANIZATION_number": 75, |
|
"eval_ORGANIZATION_precision": 0.6888888888888889, |
|
"eval_ORGANIZATION_recall": 0.8266666666666667, |
|
"eval_PERSON_f1": 0.8794788273615636, |
|
"eval_PERSON_number": 143, |
|
"eval_PERSON_precision": 0.823170731707317, |
|
"eval_PERSON_recall": 0.9440559440559441, |
|
"eval_QUANTITY_f1": 0.7058823529411765, |
|
"eval_QUANTITY_number": 23, |
|
"eval_QUANTITY_precision": 0.6428571428571429, |
|
"eval_QUANTITY_recall": 0.782608695652174, |
|
"eval_TIME_f1": 0.7407407407407408, |
|
"eval_TIME_number": 26, |
|
"eval_TIME_precision": 0.7142857142857143, |
|
"eval_TIME_recall": 0.7692307692307693, |
|
"eval_loss": 0.19843065738677979, |
|
"eval_overall_accuracy": 0.9562171628721541, |
|
"eval_overall_f1": 0.8159340659340658, |
|
"eval_overall_precision": 0.7634961439588689, |
|
"eval_overall_recall": 0.8761061946902655, |
|
"eval_runtime": 0.9223, |
|
"eval_samples_per_second": 202.76, |
|
"eval_steps_per_second": 3.253, |
|
"step": 9434 |
|
}, |
|
{ |
|
"epoch": 90.0, |
|
"grad_norm": 1.794690489768982, |
|
"learning_rate": 5e-06, |
|
"loss": 0.0265, |
|
"step": 9540 |
|
}, |
|
{ |
|
"epoch": 90.0, |
|
"eval_LOCATION_f1": 0.8275862068965517, |
|
"eval_LOCATION_number": 72, |
|
"eval_LOCATION_precision": 0.821917808219178, |
|
"eval_LOCATION_recall": 0.8333333333333334, |
|
"eval_ORGANIZATION_f1": 0.7770700636942677, |
|
"eval_ORGANIZATION_number": 75, |
|
"eval_ORGANIZATION_precision": 0.7439024390243902, |
|
"eval_ORGANIZATION_recall": 0.8133333333333334, |
|
"eval_PERSON_f1": 0.8823529411764706, |
|
"eval_PERSON_number": 143, |
|
"eval_PERSON_precision": 0.8282208588957055, |
|
"eval_PERSON_recall": 0.9440559440559441, |
|
"eval_QUANTITY_f1": 0.6923076923076923, |
|
"eval_QUANTITY_number": 23, |
|
"eval_QUANTITY_precision": 0.6206896551724138, |
|
"eval_QUANTITY_recall": 0.782608695652174, |
|
"eval_TIME_f1": 0.7272727272727274, |
|
"eval_TIME_number": 26, |
|
"eval_TIME_precision": 0.6896551724137931, |
|
"eval_TIME_recall": 0.7692307692307693, |
|
"eval_loss": 0.20021091401576996, |
|
"eval_overall_accuracy": 0.9574681010758068, |
|
"eval_overall_f1": 0.8223776223776224, |
|
"eval_overall_precision": 0.7819148936170213, |
|
"eval_overall_recall": 0.8672566371681416, |
|
"eval_runtime": 0.9203, |
|
"eval_samples_per_second": 203.198, |
|
"eval_steps_per_second": 3.26, |
|
"step": 9540 |
|
}, |
|
{ |
|
"epoch": 91.0, |
|
"grad_norm": 0.0694357305765152, |
|
"learning_rate": 4.5e-06, |
|
"loss": 0.0258, |
|
"step": 9646 |
|
}, |
|
{ |
|
"epoch": 91.0, |
|
"eval_LOCATION_f1": 0.8187919463087249, |
|
"eval_LOCATION_number": 72, |
|
"eval_LOCATION_precision": 0.7922077922077922, |
|
"eval_LOCATION_recall": 0.8472222222222222, |
|
"eval_ORGANIZATION_f1": 0.7547169811320756, |
|
"eval_ORGANIZATION_number": 75, |
|
"eval_ORGANIZATION_precision": 0.7142857142857143, |
|
"eval_ORGANIZATION_recall": 0.8, |
|
"eval_PERSON_f1": 0.8729641693811075, |
|
"eval_PERSON_number": 143, |
|
"eval_PERSON_precision": 0.8170731707317073, |
|
"eval_PERSON_recall": 0.9370629370629371, |
|
"eval_QUANTITY_f1": 0.6923076923076923, |
|
"eval_QUANTITY_number": 23, |
|
"eval_QUANTITY_precision": 0.6206896551724138, |
|
"eval_QUANTITY_recall": 0.782608695652174, |
|
"eval_TIME_f1": 0.7407407407407408, |
|
"eval_TIME_number": 26, |
|
"eval_TIME_precision": 0.7142857142857143, |
|
"eval_TIME_recall": 0.7692307692307693, |
|
"eval_loss": 0.1959146112203598, |
|
"eval_overall_accuracy": 0.9574681010758068, |
|
"eval_overall_f1": 0.812760055478502, |
|
"eval_overall_precision": 0.7670157068062827, |
|
"eval_overall_recall": 0.8643067846607669, |
|
"eval_runtime": 0.9378, |
|
"eval_samples_per_second": 199.393, |
|
"eval_steps_per_second": 3.199, |
|
"step": 9646 |
|
}, |
|
{ |
|
"epoch": 92.0, |
|
"grad_norm": 0.7855161428451538, |
|
"learning_rate": 4.000000000000001e-06, |
|
"loss": 0.0256, |
|
"step": 9752 |
|
}, |
|
{ |
|
"epoch": 92.0, |
|
"eval_LOCATION_f1": 0.8344370860927153, |
|
"eval_LOCATION_number": 72, |
|
"eval_LOCATION_precision": 0.7974683544303798, |
|
"eval_LOCATION_recall": 0.875, |
|
"eval_ORGANIZATION_f1": 0.7625, |
|
"eval_ORGANIZATION_number": 75, |
|
"eval_ORGANIZATION_precision": 0.7176470588235294, |
|
"eval_ORGANIZATION_recall": 0.8133333333333334, |
|
"eval_PERSON_f1": 0.868421052631579, |
|
"eval_PERSON_number": 143, |
|
"eval_PERSON_precision": 0.8198757763975155, |
|
"eval_PERSON_recall": 0.9230769230769231, |
|
"eval_QUANTITY_f1": 0.7058823529411765, |
|
"eval_QUANTITY_number": 23, |
|
"eval_QUANTITY_precision": 0.6428571428571429, |
|
"eval_QUANTITY_recall": 0.782608695652174, |
|
"eval_TIME_f1": 0.7407407407407408, |
|
"eval_TIME_number": 26, |
|
"eval_TIME_precision": 0.7142857142857143, |
|
"eval_TIME_recall": 0.7692307692307693, |
|
"eval_loss": 0.20366288721561432, |
|
"eval_overall_accuracy": 0.955716787590693, |
|
"eval_overall_f1": 0.8166666666666667, |
|
"eval_overall_precision": 0.7716535433070866, |
|
"eval_overall_recall": 0.8672566371681416, |
|
"eval_runtime": 0.9223, |
|
"eval_samples_per_second": 202.758, |
|
"eval_steps_per_second": 3.253, |
|
"step": 9752 |
|
}, |
|
{ |
|
"epoch": 93.0, |
|
"grad_norm": 0.923471212387085, |
|
"learning_rate": 3.5000000000000004e-06, |
|
"loss": 0.026, |
|
"step": 9858 |
|
}, |
|
{ |
|
"epoch": 93.0, |
|
"eval_LOCATION_f1": 0.8211920529801324, |
|
"eval_LOCATION_number": 72, |
|
"eval_LOCATION_precision": 0.7848101265822784, |
|
"eval_LOCATION_recall": 0.8611111111111112, |
|
"eval_ORGANIZATION_f1": 0.779874213836478, |
|
"eval_ORGANIZATION_number": 75, |
|
"eval_ORGANIZATION_precision": 0.7380952380952381, |
|
"eval_ORGANIZATION_recall": 0.8266666666666667, |
|
"eval_PERSON_f1": 0.8712871287128713, |
|
"eval_PERSON_number": 143, |
|
"eval_PERSON_precision": 0.825, |
|
"eval_PERSON_recall": 0.9230769230769231, |
|
"eval_QUANTITY_f1": 0.6923076923076923, |
|
"eval_QUANTITY_number": 23, |
|
"eval_QUANTITY_precision": 0.6206896551724138, |
|
"eval_QUANTITY_recall": 0.782608695652174, |
|
"eval_TIME_f1": 0.7272727272727274, |
|
"eval_TIME_number": 26, |
|
"eval_TIME_precision": 0.6896551724137931, |
|
"eval_TIME_recall": 0.7692307692307693, |
|
"eval_loss": 0.20790377259254456, |
|
"eval_overall_accuracy": 0.9547160370277709, |
|
"eval_overall_f1": 0.8166666666666667, |
|
"eval_overall_precision": 0.7716535433070866, |
|
"eval_overall_recall": 0.8672566371681416, |
|
"eval_runtime": 0.9308, |
|
"eval_samples_per_second": 200.901, |
|
"eval_steps_per_second": 3.223, |
|
"step": 9858 |
|
}, |
|
{ |
|
"epoch": 94.0, |
|
"grad_norm": 0.5129814147949219, |
|
"learning_rate": 3e-06, |
|
"loss": 0.0269, |
|
"step": 9964 |
|
}, |
|
{ |
|
"epoch": 94.0, |
|
"eval_LOCATION_f1": 0.8211920529801324, |
|
"eval_LOCATION_number": 72, |
|
"eval_LOCATION_precision": 0.7848101265822784, |
|
"eval_LOCATION_recall": 0.8611111111111112, |
|
"eval_ORGANIZATION_f1": 0.7672955974842767, |
|
"eval_ORGANIZATION_number": 75, |
|
"eval_ORGANIZATION_precision": 0.7261904761904762, |
|
"eval_ORGANIZATION_recall": 0.8133333333333334, |
|
"eval_PERSON_f1": 0.868421052631579, |
|
"eval_PERSON_number": 143, |
|
"eval_PERSON_precision": 0.8198757763975155, |
|
"eval_PERSON_recall": 0.9230769230769231, |
|
"eval_QUANTITY_f1": 0.6923076923076923, |
|
"eval_QUANTITY_number": 23, |
|
"eval_QUANTITY_precision": 0.6206896551724138, |
|
"eval_QUANTITY_recall": 0.782608695652174, |
|
"eval_TIME_f1": 0.7407407407407408, |
|
"eval_TIME_number": 26, |
|
"eval_TIME_precision": 0.7142857142857143, |
|
"eval_TIME_recall": 0.7692307692307693, |
|
"eval_loss": 0.2034631371498108, |
|
"eval_overall_accuracy": 0.9552164123092319, |
|
"eval_overall_f1": 0.8138888888888888, |
|
"eval_overall_precision": 0.7690288713910761, |
|
"eval_overall_recall": 0.8643067846607669, |
|
"eval_runtime": 0.9303, |
|
"eval_samples_per_second": 201.002, |
|
"eval_steps_per_second": 3.225, |
|
"step": 9964 |
|
}, |
|
{ |
|
"epoch": 95.0, |
|
"grad_norm": 0.9843897819519043, |
|
"learning_rate": 2.5e-06, |
|
"loss": 0.0254, |
|
"step": 10070 |
|
}, |
|
{ |
|
"epoch": 95.0, |
|
"eval_LOCATION_f1": 0.8211920529801324, |
|
"eval_LOCATION_number": 72, |
|
"eval_LOCATION_precision": 0.7848101265822784, |
|
"eval_LOCATION_recall": 0.8611111111111112, |
|
"eval_ORGANIZATION_f1": 0.7625, |
|
"eval_ORGANIZATION_number": 75, |
|
"eval_ORGANIZATION_precision": 0.7176470588235294, |
|
"eval_ORGANIZATION_recall": 0.8133333333333334, |
|
"eval_PERSON_f1": 0.8721311475409836, |
|
"eval_PERSON_number": 143, |
|
"eval_PERSON_precision": 0.8209876543209876, |
|
"eval_PERSON_recall": 0.9300699300699301, |
|
"eval_QUANTITY_f1": 0.6923076923076923, |
|
"eval_QUANTITY_number": 23, |
|
"eval_QUANTITY_precision": 0.6206896551724138, |
|
"eval_QUANTITY_recall": 0.782608695652174, |
|
"eval_TIME_f1": 0.7407407407407408, |
|
"eval_TIME_number": 26, |
|
"eval_TIME_precision": 0.7142857142857143, |
|
"eval_TIME_recall": 0.7692307692307693, |
|
"eval_loss": 0.20722047984600067, |
|
"eval_overall_accuracy": 0.9549662246685013, |
|
"eval_overall_f1": 0.8144044321329639, |
|
"eval_overall_precision": 0.7676240208877284, |
|
"eval_overall_recall": 0.8672566371681416, |
|
"eval_runtime": 0.9384, |
|
"eval_samples_per_second": 199.274, |
|
"eval_steps_per_second": 3.197, |
|
"step": 10070 |
|
}, |
|
{ |
|
"epoch": 96.0, |
|
"grad_norm": 0.45156100392341614, |
|
"learning_rate": 2.0000000000000003e-06, |
|
"loss": 0.0255, |
|
"step": 10176 |
|
}, |
|
{ |
|
"epoch": 96.0, |
|
"eval_LOCATION_f1": 0.8344370860927153, |
|
"eval_LOCATION_number": 72, |
|
"eval_LOCATION_precision": 0.7974683544303798, |
|
"eval_LOCATION_recall": 0.875, |
|
"eval_ORGANIZATION_f1": 0.759493670886076, |
|
"eval_ORGANIZATION_number": 75, |
|
"eval_ORGANIZATION_precision": 0.7228915662650602, |
|
"eval_ORGANIZATION_recall": 0.8, |
|
"eval_PERSON_f1": 0.868421052631579, |
|
"eval_PERSON_number": 143, |
|
"eval_PERSON_precision": 0.8198757763975155, |
|
"eval_PERSON_recall": 0.9230769230769231, |
|
"eval_QUANTITY_f1": 0.6923076923076923, |
|
"eval_QUANTITY_number": 23, |
|
"eval_QUANTITY_precision": 0.6206896551724138, |
|
"eval_QUANTITY_recall": 0.782608695652174, |
|
"eval_TIME_f1": 0.7407407407407408, |
|
"eval_TIME_number": 26, |
|
"eval_TIME_precision": 0.7142857142857143, |
|
"eval_TIME_recall": 0.7692307692307693, |
|
"eval_loss": 0.20072737336158752, |
|
"eval_overall_accuracy": 0.9554665999499625, |
|
"eval_overall_f1": 0.8150208623087621, |
|
"eval_overall_precision": 0.7710526315789473, |
|
"eval_overall_recall": 0.8643067846607669, |
|
"eval_runtime": 0.93, |
|
"eval_samples_per_second": 201.077, |
|
"eval_steps_per_second": 3.226, |
|
"step": 10176 |
|
}, |
|
{ |
|
"epoch": 97.0, |
|
"grad_norm": 0.905977725982666, |
|
"learning_rate": 1.5e-06, |
|
"loss": 0.0248, |
|
"step": 10282 |
|
}, |
|
{ |
|
"epoch": 97.0, |
|
"eval_LOCATION_f1": 0.8211920529801324, |
|
"eval_LOCATION_number": 72, |
|
"eval_LOCATION_precision": 0.7848101265822784, |
|
"eval_LOCATION_recall": 0.8611111111111112, |
|
"eval_ORGANIZATION_f1": 0.7612903225806452, |
|
"eval_ORGANIZATION_number": 75, |
|
"eval_ORGANIZATION_precision": 0.7375, |
|
"eval_ORGANIZATION_recall": 0.7866666666666666, |
|
"eval_PERSON_f1": 0.8721311475409836, |
|
"eval_PERSON_number": 143, |
|
"eval_PERSON_precision": 0.8209876543209876, |
|
"eval_PERSON_recall": 0.9300699300699301, |
|
"eval_QUANTITY_f1": 0.6923076923076923, |
|
"eval_QUANTITY_number": 23, |
|
"eval_QUANTITY_precision": 0.6206896551724138, |
|
"eval_QUANTITY_recall": 0.782608695652174, |
|
"eval_TIME_f1": 0.7407407407407408, |
|
"eval_TIME_number": 26, |
|
"eval_TIME_precision": 0.7142857142857143, |
|
"eval_TIME_recall": 0.7692307692307693, |
|
"eval_loss": 0.201884463429451, |
|
"eval_overall_accuracy": 0.955716787590693, |
|
"eval_overall_f1": 0.8145048814504882, |
|
"eval_overall_precision": 0.7724867724867724, |
|
"eval_overall_recall": 0.8613569321533924, |
|
"eval_runtime": 0.9411, |
|
"eval_samples_per_second": 198.713, |
|
"eval_steps_per_second": 3.188, |
|
"step": 10282 |
|
}, |
|
{ |
|
"epoch": 98.0, |
|
"grad_norm": 0.701413631439209, |
|
"learning_rate": 1.0000000000000002e-06, |
|
"loss": 0.0258, |
|
"step": 10388 |
|
}, |
|
{ |
|
"epoch": 98.0, |
|
"eval_LOCATION_f1": 0.8211920529801324, |
|
"eval_LOCATION_number": 72, |
|
"eval_LOCATION_precision": 0.7848101265822784, |
|
"eval_LOCATION_recall": 0.8611111111111112, |
|
"eval_ORGANIZATION_f1": 0.759493670886076, |
|
"eval_ORGANIZATION_number": 75, |
|
"eval_ORGANIZATION_precision": 0.7228915662650602, |
|
"eval_ORGANIZATION_recall": 0.8, |
|
"eval_PERSON_f1": 0.868421052631579, |
|
"eval_PERSON_number": 143, |
|
"eval_PERSON_precision": 0.8198757763975155, |
|
"eval_PERSON_recall": 0.9230769230769231, |
|
"eval_QUANTITY_f1": 0.6923076923076923, |
|
"eval_QUANTITY_number": 23, |
|
"eval_QUANTITY_precision": 0.6206896551724138, |
|
"eval_QUANTITY_recall": 0.782608695652174, |
|
"eval_TIME_f1": 0.7407407407407408, |
|
"eval_TIME_number": 26, |
|
"eval_TIME_precision": 0.7142857142857143, |
|
"eval_TIME_recall": 0.7692307692307693, |
|
"eval_loss": 0.20242148637771606, |
|
"eval_overall_accuracy": 0.9554665999499625, |
|
"eval_overall_f1": 0.812239221140473, |
|
"eval_overall_precision": 0.7684210526315789, |
|
"eval_overall_recall": 0.8613569321533924, |
|
"eval_runtime": 0.9222, |
|
"eval_samples_per_second": 202.767, |
|
"eval_steps_per_second": 3.253, |
|
"step": 10388 |
|
}, |
|
{ |
|
"epoch": 99.0, |
|
"grad_norm": 0.5330938696861267, |
|
"learning_rate": 5.000000000000001e-07, |
|
"loss": 0.0251, |
|
"step": 10494 |
|
}, |
|
{ |
|
"epoch": 99.0, |
|
"eval_LOCATION_f1": 0.8211920529801324, |
|
"eval_LOCATION_number": 72, |
|
"eval_LOCATION_precision": 0.7848101265822784, |
|
"eval_LOCATION_recall": 0.8611111111111112, |
|
"eval_ORGANIZATION_f1": 0.7721518987341773, |
|
"eval_ORGANIZATION_number": 75, |
|
"eval_ORGANIZATION_precision": 0.7349397590361446, |
|
"eval_ORGANIZATION_recall": 0.8133333333333334, |
|
"eval_PERSON_f1": 0.8721311475409836, |
|
"eval_PERSON_number": 143, |
|
"eval_PERSON_precision": 0.8209876543209876, |
|
"eval_PERSON_recall": 0.9300699300699301, |
|
"eval_QUANTITY_f1": 0.6923076923076923, |
|
"eval_QUANTITY_number": 23, |
|
"eval_QUANTITY_precision": 0.6206896551724138, |
|
"eval_QUANTITY_recall": 0.782608695652174, |
|
"eval_TIME_f1": 0.7407407407407408, |
|
"eval_TIME_number": 26, |
|
"eval_TIME_precision": 0.7142857142857143, |
|
"eval_TIME_recall": 0.7692307692307693, |
|
"eval_loss": 0.2052735686302185, |
|
"eval_overall_accuracy": 0.9559669752314236, |
|
"eval_overall_f1": 0.8166666666666667, |
|
"eval_overall_precision": 0.7716535433070866, |
|
"eval_overall_recall": 0.8672566371681416, |
|
"eval_runtime": 0.9322, |
|
"eval_samples_per_second": 200.61, |
|
"eval_steps_per_second": 3.218, |
|
"step": 10494 |
|
}, |
|
{ |
|
"epoch": 100.0, |
|
"grad_norm": 0.6201446652412415, |
|
"learning_rate": 0.0, |
|
"loss": 0.0255, |
|
"step": 10600 |
|
}, |
|
{ |
|
"epoch": 100.0, |
|
"eval_LOCATION_f1": 0.8133333333333332, |
|
"eval_LOCATION_number": 72, |
|
"eval_LOCATION_precision": 0.782051282051282, |
|
"eval_LOCATION_recall": 0.8472222222222222, |
|
"eval_ORGANIZATION_f1": 0.7643312101910827, |
|
"eval_ORGANIZATION_number": 75, |
|
"eval_ORGANIZATION_precision": 0.7317073170731707, |
|
"eval_ORGANIZATION_recall": 0.8, |
|
"eval_PERSON_f1": 0.8721311475409836, |
|
"eval_PERSON_number": 143, |
|
"eval_PERSON_precision": 0.8209876543209876, |
|
"eval_PERSON_recall": 0.9300699300699301, |
|
"eval_QUANTITY_f1": 0.6923076923076923, |
|
"eval_QUANTITY_number": 23, |
|
"eval_QUANTITY_precision": 0.6206896551724138, |
|
"eval_QUANTITY_recall": 0.782608695652174, |
|
"eval_TIME_f1": 0.7407407407407408, |
|
"eval_TIME_number": 26, |
|
"eval_TIME_precision": 0.7142857142857143, |
|
"eval_TIME_recall": 0.7692307692307693, |
|
"eval_loss": 0.20351509749889374, |
|
"eval_overall_accuracy": 0.9554665999499625, |
|
"eval_overall_f1": 0.8133704735376045, |
|
"eval_overall_precision": 0.7704485488126649, |
|
"eval_overall_recall": 0.8613569321533924, |
|
"eval_runtime": 0.9365, |
|
"eval_samples_per_second": 199.684, |
|
"eval_steps_per_second": 3.203, |
|
"step": 10600 |
|
}, |
|
{ |
|
"epoch": 100.0, |
|
"step": 10600, |
|
"total_flos": 5023623771566022.0, |
|
"train_loss": 0.07431833881252217, |
|
"train_runtime": 1320.4476, |
|
"train_samples_per_second": 127.76, |
|
"train_steps_per_second": 8.028 |
|
} |
|
], |
|
"logging_steps": 500, |
|
"max_steps": 10600, |
|
"num_input_tokens_seen": 0, |
|
"num_train_epochs": 100, |
|
"save_steps": 500, |
|
"total_flos": 5023623771566022.0, |
|
"train_batch_size": 16, |
|
"trial_name": null, |
|
"trial_params": null |
|
} |
|
|