|
{ |
|
"best_metric": null, |
|
"best_model_checkpoint": null, |
|
"epoch": 100.0, |
|
"eval_steps": 500, |
|
"global_step": 10600, |
|
"is_hyper_param_search": false, |
|
"is_local_process_zero": true, |
|
"is_world_process_zero": true, |
|
"log_history": [ |
|
{ |
|
"epoch": 1.0, |
|
"grad_norm": 1.1115612983703613, |
|
"learning_rate": 4.9500000000000004e-05, |
|
"loss": 0.9255, |
|
"step": 106 |
|
}, |
|
{ |
|
"epoch": 1.0, |
|
"eval_LOCATION_f1": 0.0, |
|
"eval_LOCATION_number": 69, |
|
"eval_LOCATION_precision": 0.0, |
|
"eval_LOCATION_recall": 0.0, |
|
"eval_ORGANIZATION_f1": 0.0, |
|
"eval_ORGANIZATION_number": 58, |
|
"eval_ORGANIZATION_precision": 0.0, |
|
"eval_ORGANIZATION_recall": 0.0, |
|
"eval_PERSON_f1": 0.012820512820512818, |
|
"eval_PERSON_number": 152, |
|
"eval_PERSON_precision": 0.25, |
|
"eval_PERSON_recall": 0.006578947368421052, |
|
"eval_QUANTITY_f1": 0.0, |
|
"eval_QUANTITY_number": 30, |
|
"eval_QUANTITY_precision": 0.0, |
|
"eval_QUANTITY_recall": 0.0, |
|
"eval_TIME_f1": 0.0, |
|
"eval_TIME_number": 29, |
|
"eval_TIME_precision": 0.0, |
|
"eval_TIME_recall": 0.0, |
|
"eval_loss": 0.6139789819717407, |
|
"eval_overall_accuracy": 0.8402048655569783, |
|
"eval_overall_f1": 0.005847953216374269, |
|
"eval_overall_precision": 0.25, |
|
"eval_overall_recall": 0.0029585798816568047, |
|
"eval_runtime": 0.288, |
|
"eval_samples_per_second": 649.255, |
|
"eval_steps_per_second": 10.416, |
|
"step": 106 |
|
}, |
|
{ |
|
"epoch": 2.0, |
|
"grad_norm": 1.1083379983901978, |
|
"learning_rate": 4.9e-05, |
|
"loss": 0.5503, |
|
"step": 212 |
|
}, |
|
{ |
|
"epoch": 2.0, |
|
"eval_LOCATION_f1": 0.09523809523809525, |
|
"eval_LOCATION_number": 69, |
|
"eval_LOCATION_precision": 0.26666666666666666, |
|
"eval_LOCATION_recall": 0.057971014492753624, |
|
"eval_ORGANIZATION_f1": 0.0, |
|
"eval_ORGANIZATION_number": 58, |
|
"eval_ORGANIZATION_precision": 0.0, |
|
"eval_ORGANIZATION_recall": 0.0, |
|
"eval_PERSON_f1": 0.5272727272727272, |
|
"eval_PERSON_number": 152, |
|
"eval_PERSON_precision": 0.4887640449438202, |
|
"eval_PERSON_recall": 0.5723684210526315, |
|
"eval_QUANTITY_f1": 0.0, |
|
"eval_QUANTITY_number": 30, |
|
"eval_QUANTITY_precision": 0.0, |
|
"eval_QUANTITY_recall": 0.0, |
|
"eval_TIME_f1": 0.4, |
|
"eval_TIME_number": 29, |
|
"eval_TIME_precision": 0.5625, |
|
"eval_TIME_recall": 0.3103448275862069, |
|
"eval_loss": 0.3994744122028351, |
|
"eval_overall_accuracy": 0.8855313700384123, |
|
"eval_overall_f1": 0.35714285714285715, |
|
"eval_overall_precision": 0.45045045045045046, |
|
"eval_overall_recall": 0.2958579881656805, |
|
"eval_runtime": 0.2908, |
|
"eval_samples_per_second": 642.974, |
|
"eval_steps_per_second": 10.315, |
|
"step": 212 |
|
}, |
|
{ |
|
"epoch": 3.0, |
|
"grad_norm": 1.8157479763031006, |
|
"learning_rate": 4.85e-05, |
|
"loss": 0.3808, |
|
"step": 318 |
|
}, |
|
{ |
|
"epoch": 3.0, |
|
"eval_LOCATION_f1": 0.5454545454545455, |
|
"eval_LOCATION_number": 69, |
|
"eval_LOCATION_precision": 0.49411764705882355, |
|
"eval_LOCATION_recall": 0.6086956521739131, |
|
"eval_ORGANIZATION_f1": 0.2978723404255319, |
|
"eval_ORGANIZATION_number": 58, |
|
"eval_ORGANIZATION_precision": 0.3888888888888889, |
|
"eval_ORGANIZATION_recall": 0.2413793103448276, |
|
"eval_PERSON_f1": 0.735632183908046, |
|
"eval_PERSON_number": 152, |
|
"eval_PERSON_precision": 0.6530612244897959, |
|
"eval_PERSON_recall": 0.8421052631578947, |
|
"eval_QUANTITY_f1": 0.28571428571428564, |
|
"eval_QUANTITY_number": 30, |
|
"eval_QUANTITY_precision": 0.2727272727272727, |
|
"eval_QUANTITY_recall": 0.3, |
|
"eval_TIME_f1": 0.6785714285714286, |
|
"eval_TIME_number": 29, |
|
"eval_TIME_precision": 0.7037037037037037, |
|
"eval_TIME_recall": 0.6551724137931034, |
|
"eval_loss": 0.28895071148872375, |
|
"eval_overall_accuracy": 0.9267605633802817, |
|
"eval_overall_f1": 0.5930069930069929, |
|
"eval_overall_precision": 0.5623342175066313, |
|
"eval_overall_recall": 0.6272189349112426, |
|
"eval_runtime": 0.2887, |
|
"eval_samples_per_second": 647.772, |
|
"eval_steps_per_second": 10.392, |
|
"step": 318 |
|
}, |
|
{ |
|
"epoch": 4.0, |
|
"grad_norm": 1.4652637243270874, |
|
"learning_rate": 4.8e-05, |
|
"loss": 0.2833, |
|
"step": 424 |
|
}, |
|
{ |
|
"epoch": 4.0, |
|
"eval_LOCATION_f1": 0.6455696202531644, |
|
"eval_LOCATION_number": 69, |
|
"eval_LOCATION_precision": 0.5730337078651685, |
|
"eval_LOCATION_recall": 0.7391304347826086, |
|
"eval_ORGANIZATION_f1": 0.4642857142857143, |
|
"eval_ORGANIZATION_number": 58, |
|
"eval_ORGANIZATION_precision": 0.48148148148148145, |
|
"eval_ORGANIZATION_recall": 0.4482758620689655, |
|
"eval_PERSON_f1": 0.7904191616766467, |
|
"eval_PERSON_number": 152, |
|
"eval_PERSON_precision": 0.7252747252747253, |
|
"eval_PERSON_recall": 0.868421052631579, |
|
"eval_QUANTITY_f1": 0.47058823529411764, |
|
"eval_QUANTITY_number": 30, |
|
"eval_QUANTITY_precision": 0.42105263157894735, |
|
"eval_QUANTITY_recall": 0.5333333333333333, |
|
"eval_TIME_f1": 0.8275862068965517, |
|
"eval_TIME_number": 29, |
|
"eval_TIME_precision": 0.8275862068965517, |
|
"eval_TIME_recall": 0.8275862068965517, |
|
"eval_loss": 0.21562312543392181, |
|
"eval_overall_accuracy": 0.9405889884763124, |
|
"eval_overall_f1": 0.6821917808219178, |
|
"eval_overall_precision": 0.6352040816326531, |
|
"eval_overall_recall": 0.7366863905325444, |
|
"eval_runtime": 0.2884, |
|
"eval_samples_per_second": 648.345, |
|
"eval_steps_per_second": 10.401, |
|
"step": 424 |
|
}, |
|
{ |
|
"epoch": 5.0, |
|
"grad_norm": 1.5371237993240356, |
|
"learning_rate": 4.75e-05, |
|
"loss": 0.2213, |
|
"step": 530 |
|
}, |
|
{ |
|
"epoch": 5.0, |
|
"eval_LOCATION_f1": 0.725, |
|
"eval_LOCATION_number": 69, |
|
"eval_LOCATION_precision": 0.6373626373626373, |
|
"eval_LOCATION_recall": 0.8405797101449275, |
|
"eval_ORGANIZATION_f1": 0.5263157894736843, |
|
"eval_ORGANIZATION_number": 58, |
|
"eval_ORGANIZATION_precision": 0.5357142857142857, |
|
"eval_ORGANIZATION_recall": 0.5172413793103449, |
|
"eval_PERSON_f1": 0.8012048192771084, |
|
"eval_PERSON_number": 152, |
|
"eval_PERSON_precision": 0.7388888888888889, |
|
"eval_PERSON_recall": 0.875, |
|
"eval_QUANTITY_f1": 0.5333333333333333, |
|
"eval_QUANTITY_number": 30, |
|
"eval_QUANTITY_precision": 0.4444444444444444, |
|
"eval_QUANTITY_recall": 0.6666666666666666, |
|
"eval_TIME_f1": 0.8275862068965517, |
|
"eval_TIME_number": 29, |
|
"eval_TIME_precision": 0.8275862068965517, |
|
"eval_TIME_recall": 0.8275862068965517, |
|
"eval_loss": 0.18281985819339752, |
|
"eval_overall_accuracy": 0.9434058898847631, |
|
"eval_overall_f1": 0.7171853856562923, |
|
"eval_overall_precision": 0.6608478802992519, |
|
"eval_overall_recall": 0.7840236686390533, |
|
"eval_runtime": 0.2945, |
|
"eval_samples_per_second": 634.984, |
|
"eval_steps_per_second": 10.187, |
|
"step": 530 |
|
}, |
|
{ |
|
"epoch": 6.0, |
|
"grad_norm": 1.388359546661377, |
|
"learning_rate": 4.7e-05, |
|
"loss": 0.1845, |
|
"step": 636 |
|
}, |
|
{ |
|
"epoch": 6.0, |
|
"eval_LOCATION_f1": 0.7721518987341773, |
|
"eval_LOCATION_number": 69, |
|
"eval_LOCATION_precision": 0.6853932584269663, |
|
"eval_LOCATION_recall": 0.8840579710144928, |
|
"eval_ORGANIZATION_f1": 0.5757575757575758, |
|
"eval_ORGANIZATION_number": 58, |
|
"eval_ORGANIZATION_precision": 0.5135135135135135, |
|
"eval_ORGANIZATION_recall": 0.6551724137931034, |
|
"eval_PERSON_f1": 0.8192771084337349, |
|
"eval_PERSON_number": 152, |
|
"eval_PERSON_precision": 0.7555555555555555, |
|
"eval_PERSON_recall": 0.8947368421052632, |
|
"eval_QUANTITY_f1": 0.5714285714285715, |
|
"eval_QUANTITY_number": 30, |
|
"eval_QUANTITY_precision": 0.5, |
|
"eval_QUANTITY_recall": 0.6666666666666666, |
|
"eval_TIME_f1": 0.8333333333333334, |
|
"eval_TIME_number": 29, |
|
"eval_TIME_precision": 0.8064516129032258, |
|
"eval_TIME_recall": 0.8620689655172413, |
|
"eval_loss": 0.1697721779346466, |
|
"eval_overall_accuracy": 0.9467349551856594, |
|
"eval_overall_f1": 0.7446808510638298, |
|
"eval_overall_precision": 0.6763285024154589, |
|
"eval_overall_recall": 0.8284023668639053, |
|
"eval_runtime": 0.2919, |
|
"eval_samples_per_second": 640.647, |
|
"eval_steps_per_second": 10.278, |
|
"step": 636 |
|
}, |
|
{ |
|
"epoch": 7.0, |
|
"grad_norm": 0.574262261390686, |
|
"learning_rate": 4.6500000000000005e-05, |
|
"loss": 0.17, |
|
"step": 742 |
|
}, |
|
{ |
|
"epoch": 7.0, |
|
"eval_LOCATION_f1": 0.8026315789473685, |
|
"eval_LOCATION_number": 69, |
|
"eval_LOCATION_precision": 0.7349397590361446, |
|
"eval_LOCATION_recall": 0.8840579710144928, |
|
"eval_ORGANIZATION_f1": 0.6016260162601627, |
|
"eval_ORGANIZATION_number": 58, |
|
"eval_ORGANIZATION_precision": 0.5692307692307692, |
|
"eval_ORGANIZATION_recall": 0.6379310344827587, |
|
"eval_PERSON_f1": 0.8246153846153845, |
|
"eval_PERSON_number": 152, |
|
"eval_PERSON_precision": 0.7745664739884393, |
|
"eval_PERSON_recall": 0.881578947368421, |
|
"eval_QUANTITY_f1": 0.7164179104477612, |
|
"eval_QUANTITY_number": 30, |
|
"eval_QUANTITY_precision": 0.6486486486486487, |
|
"eval_QUANTITY_recall": 0.8, |
|
"eval_TIME_f1": 0.847457627118644, |
|
"eval_TIME_number": 29, |
|
"eval_TIME_precision": 0.8333333333333334, |
|
"eval_TIME_recall": 0.8620689655172413, |
|
"eval_loss": 0.1523420363664627, |
|
"eval_overall_accuracy": 0.9510883482714468, |
|
"eval_overall_f1": 0.7741046831955923, |
|
"eval_overall_precision": 0.7242268041237113, |
|
"eval_overall_recall": 0.8313609467455622, |
|
"eval_runtime": 0.292, |
|
"eval_samples_per_second": 640.421, |
|
"eval_steps_per_second": 10.274, |
|
"step": 742 |
|
}, |
|
{ |
|
"epoch": 8.0, |
|
"grad_norm": 0.5678428411483765, |
|
"learning_rate": 4.600000000000001e-05, |
|
"loss": 0.1552, |
|
"step": 848 |
|
}, |
|
{ |
|
"epoch": 8.0, |
|
"eval_LOCATION_f1": 0.8266666666666668, |
|
"eval_LOCATION_number": 69, |
|
"eval_LOCATION_precision": 0.7654320987654321, |
|
"eval_LOCATION_recall": 0.8985507246376812, |
|
"eval_ORGANIZATION_f1": 0.5891472868217055, |
|
"eval_ORGANIZATION_number": 58, |
|
"eval_ORGANIZATION_precision": 0.5352112676056338, |
|
"eval_ORGANIZATION_recall": 0.6551724137931034, |
|
"eval_PERSON_f1": 0.8307692307692307, |
|
"eval_PERSON_number": 152, |
|
"eval_PERSON_precision": 0.7803468208092486, |
|
"eval_PERSON_recall": 0.8881578947368421, |
|
"eval_QUANTITY_f1": 0.7272727272727272, |
|
"eval_QUANTITY_number": 30, |
|
"eval_QUANTITY_precision": 0.6666666666666666, |
|
"eval_QUANTITY_recall": 0.8, |
|
"eval_TIME_f1": 0.8064516129032258, |
|
"eval_TIME_number": 29, |
|
"eval_TIME_precision": 0.7575757575757576, |
|
"eval_TIME_recall": 0.8620689655172413, |
|
"eval_loss": 0.14812210202217102, |
|
"eval_overall_accuracy": 0.9518565941101153, |
|
"eval_overall_f1": 0.7759562841530055, |
|
"eval_overall_precision": 0.7208121827411168, |
|
"eval_overall_recall": 0.8402366863905325, |
|
"eval_runtime": 0.2864, |
|
"eval_samples_per_second": 652.864, |
|
"eval_steps_per_second": 10.474, |
|
"step": 848 |
|
}, |
|
{ |
|
"epoch": 9.0, |
|
"grad_norm": 1.5933927297592163, |
|
"learning_rate": 4.55e-05, |
|
"loss": 0.1486, |
|
"step": 954 |
|
}, |
|
{ |
|
"epoch": 9.0, |
|
"eval_LOCATION_f1": 0.8299319727891156, |
|
"eval_LOCATION_number": 69, |
|
"eval_LOCATION_precision": 0.782051282051282, |
|
"eval_LOCATION_recall": 0.8840579710144928, |
|
"eval_ORGANIZATION_f1": 0.5853658536585366, |
|
"eval_ORGANIZATION_number": 58, |
|
"eval_ORGANIZATION_precision": 0.5538461538461539, |
|
"eval_ORGANIZATION_recall": 0.6206896551724138, |
|
"eval_PERSON_f1": 0.8427672955974843, |
|
"eval_PERSON_number": 152, |
|
"eval_PERSON_precision": 0.8072289156626506, |
|
"eval_PERSON_recall": 0.881578947368421, |
|
"eval_QUANTITY_f1": 0.7575757575757577, |
|
"eval_QUANTITY_number": 30, |
|
"eval_QUANTITY_precision": 0.6944444444444444, |
|
"eval_QUANTITY_recall": 0.8333333333333334, |
|
"eval_TIME_f1": 0.8196721311475409, |
|
"eval_TIME_number": 29, |
|
"eval_TIME_precision": 0.78125, |
|
"eval_TIME_recall": 0.8620689655172413, |
|
"eval_loss": 0.1388072818517685, |
|
"eval_overall_accuracy": 0.9544174135723431, |
|
"eval_overall_f1": 0.7860139860139861, |
|
"eval_overall_precision": 0.7453580901856764, |
|
"eval_overall_recall": 0.8313609467455622, |
|
"eval_runtime": 0.2922, |
|
"eval_samples_per_second": 640.03, |
|
"eval_steps_per_second": 10.268, |
|
"step": 954 |
|
}, |
|
{ |
|
"epoch": 10.0, |
|
"grad_norm": 1.51088547706604, |
|
"learning_rate": 4.5e-05, |
|
"loss": 0.1369, |
|
"step": 1060 |
|
}, |
|
{ |
|
"epoch": 10.0, |
|
"eval_LOCATION_f1": 0.8243243243243245, |
|
"eval_LOCATION_number": 69, |
|
"eval_LOCATION_precision": 0.7721518987341772, |
|
"eval_LOCATION_recall": 0.8840579710144928, |
|
"eval_ORGANIZATION_f1": 0.6141732283464567, |
|
"eval_ORGANIZATION_number": 58, |
|
"eval_ORGANIZATION_precision": 0.5652173913043478, |
|
"eval_ORGANIZATION_recall": 0.6724137931034483, |
|
"eval_PERSON_f1": 0.8348909657320872, |
|
"eval_PERSON_number": 152, |
|
"eval_PERSON_precision": 0.7928994082840237, |
|
"eval_PERSON_recall": 0.881578947368421, |
|
"eval_QUANTITY_f1": 0.6956521739130435, |
|
"eval_QUANTITY_number": 30, |
|
"eval_QUANTITY_precision": 0.6153846153846154, |
|
"eval_QUANTITY_recall": 0.8, |
|
"eval_TIME_f1": 0.8253968253968255, |
|
"eval_TIME_number": 29, |
|
"eval_TIME_precision": 0.7647058823529411, |
|
"eval_TIME_recall": 0.896551724137931, |
|
"eval_loss": 0.13908080756664276, |
|
"eval_overall_accuracy": 0.9549295774647887, |
|
"eval_overall_f1": 0.7802197802197802, |
|
"eval_overall_precision": 0.7282051282051282, |
|
"eval_overall_recall": 0.8402366863905325, |
|
"eval_runtime": 0.2918, |
|
"eval_samples_per_second": 640.865, |
|
"eval_steps_per_second": 10.281, |
|
"step": 1060 |
|
}, |
|
{ |
|
"epoch": 11.0, |
|
"grad_norm": 1.4912283420562744, |
|
"learning_rate": 4.4500000000000004e-05, |
|
"loss": 0.132, |
|
"step": 1166 |
|
}, |
|
{ |
|
"epoch": 11.0, |
|
"eval_LOCATION_f1": 0.8456375838926175, |
|
"eval_LOCATION_number": 69, |
|
"eval_LOCATION_precision": 0.7875, |
|
"eval_LOCATION_recall": 0.9130434782608695, |
|
"eval_ORGANIZATION_f1": 0.6299212598425198, |
|
"eval_ORGANIZATION_number": 58, |
|
"eval_ORGANIZATION_precision": 0.5797101449275363, |
|
"eval_ORGANIZATION_recall": 0.6896551724137931, |
|
"eval_PERSON_f1": 0.8473520249221184, |
|
"eval_PERSON_number": 152, |
|
"eval_PERSON_precision": 0.8047337278106509, |
|
"eval_PERSON_recall": 0.8947368421052632, |
|
"eval_QUANTITY_f1": 0.7352941176470588, |
|
"eval_QUANTITY_number": 30, |
|
"eval_QUANTITY_precision": 0.6578947368421053, |
|
"eval_QUANTITY_recall": 0.8333333333333334, |
|
"eval_TIME_f1": 0.7812500000000001, |
|
"eval_TIME_number": 29, |
|
"eval_TIME_precision": 0.7142857142857143, |
|
"eval_TIME_recall": 0.8620689655172413, |
|
"eval_loss": 0.14170250296592712, |
|
"eval_overall_accuracy": 0.953393085787452, |
|
"eval_overall_f1": 0.7928669410150891, |
|
"eval_overall_precision": 0.7391304347826086, |
|
"eval_overall_recall": 0.8550295857988166, |
|
"eval_runtime": 0.2921, |
|
"eval_samples_per_second": 640.286, |
|
"eval_steps_per_second": 10.272, |
|
"step": 1166 |
|
}, |
|
{ |
|
"epoch": 12.0, |
|
"grad_norm": 2.726284980773926, |
|
"learning_rate": 4.4000000000000006e-05, |
|
"loss": 0.1268, |
|
"step": 1272 |
|
}, |
|
{ |
|
"epoch": 12.0, |
|
"eval_LOCATION_f1": 0.8378378378378378, |
|
"eval_LOCATION_number": 69, |
|
"eval_LOCATION_precision": 0.7848101265822784, |
|
"eval_LOCATION_recall": 0.8985507246376812, |
|
"eval_ORGANIZATION_f1": 0.6140350877192983, |
|
"eval_ORGANIZATION_number": 58, |
|
"eval_ORGANIZATION_precision": 0.625, |
|
"eval_ORGANIZATION_recall": 0.603448275862069, |
|
"eval_PERSON_f1": 0.8517350157728707, |
|
"eval_PERSON_number": 152, |
|
"eval_PERSON_precision": 0.8181818181818182, |
|
"eval_PERSON_recall": 0.8881578947368421, |
|
"eval_QUANTITY_f1": 0.7878787878787877, |
|
"eval_QUANTITY_number": 30, |
|
"eval_QUANTITY_precision": 0.7222222222222222, |
|
"eval_QUANTITY_recall": 0.8666666666666667, |
|
"eval_TIME_f1": 0.8196721311475409, |
|
"eval_TIME_number": 29, |
|
"eval_TIME_precision": 0.78125, |
|
"eval_TIME_recall": 0.8620689655172413, |
|
"eval_loss": 0.13159815967082977, |
|
"eval_overall_accuracy": 0.9577464788732394, |
|
"eval_overall_f1": 0.8016997167138811, |
|
"eval_overall_precision": 0.7690217391304348, |
|
"eval_overall_recall": 0.8372781065088757, |
|
"eval_runtime": 0.2918, |
|
"eval_samples_per_second": 640.768, |
|
"eval_steps_per_second": 10.28, |
|
"step": 1272 |
|
}, |
|
{ |
|
"epoch": 13.0, |
|
"grad_norm": 0.7623488903045654, |
|
"learning_rate": 4.35e-05, |
|
"loss": 0.1206, |
|
"step": 1378 |
|
}, |
|
{ |
|
"epoch": 13.0, |
|
"eval_LOCATION_f1": 0.8571428571428572, |
|
"eval_LOCATION_number": 69, |
|
"eval_LOCATION_precision": 0.8076923076923077, |
|
"eval_LOCATION_recall": 0.9130434782608695, |
|
"eval_ORGANIZATION_f1": 0.6115702479338844, |
|
"eval_ORGANIZATION_number": 58, |
|
"eval_ORGANIZATION_precision": 0.5873015873015873, |
|
"eval_ORGANIZATION_recall": 0.6379310344827587, |
|
"eval_PERSON_f1": 0.8526645768025078, |
|
"eval_PERSON_number": 152, |
|
"eval_PERSON_precision": 0.8143712574850299, |
|
"eval_PERSON_recall": 0.8947368421052632, |
|
"eval_QUANTITY_f1": 0.746268656716418, |
|
"eval_QUANTITY_number": 30, |
|
"eval_QUANTITY_precision": 0.6756756756756757, |
|
"eval_QUANTITY_recall": 0.8333333333333334, |
|
"eval_TIME_f1": 0.8333333333333334, |
|
"eval_TIME_number": 29, |
|
"eval_TIME_precision": 0.8064516129032258, |
|
"eval_TIME_recall": 0.8620689655172413, |
|
"eval_loss": 0.13245752453804016, |
|
"eval_overall_accuracy": 0.9574903969270167, |
|
"eval_overall_f1": 0.8011204481792716, |
|
"eval_overall_precision": 0.7606382978723404, |
|
"eval_overall_recall": 0.8461538461538461, |
|
"eval_runtime": 0.2913, |
|
"eval_samples_per_second": 641.931, |
|
"eval_steps_per_second": 10.298, |
|
"step": 1378 |
|
}, |
|
{ |
|
"epoch": 14.0, |
|
"grad_norm": 3.348172664642334, |
|
"learning_rate": 4.3e-05, |
|
"loss": 0.1186, |
|
"step": 1484 |
|
}, |
|
{ |
|
"epoch": 14.0, |
|
"eval_LOCATION_f1": 0.8551724137931034, |
|
"eval_LOCATION_number": 69, |
|
"eval_LOCATION_precision": 0.8157894736842105, |
|
"eval_LOCATION_recall": 0.8985507246376812, |
|
"eval_ORGANIZATION_f1": 0.7299270072992702, |
|
"eval_ORGANIZATION_number": 58, |
|
"eval_ORGANIZATION_precision": 0.6329113924050633, |
|
"eval_ORGANIZATION_recall": 0.8620689655172413, |
|
"eval_PERSON_f1": 0.8500000000000001, |
|
"eval_PERSON_number": 152, |
|
"eval_PERSON_precision": 0.8095238095238095, |
|
"eval_PERSON_recall": 0.8947368421052632, |
|
"eval_QUANTITY_f1": 0.7352941176470588, |
|
"eval_QUANTITY_number": 30, |
|
"eval_QUANTITY_precision": 0.6578947368421053, |
|
"eval_QUANTITY_recall": 0.8333333333333334, |
|
"eval_TIME_f1": 0.8253968253968255, |
|
"eval_TIME_number": 29, |
|
"eval_TIME_precision": 0.7647058823529411, |
|
"eval_TIME_recall": 0.896551724137931, |
|
"eval_loss": 0.13963258266448975, |
|
"eval_overall_accuracy": 0.9577464788732394, |
|
"eval_overall_f1": 0.8158253751705321, |
|
"eval_overall_precision": 0.7569620253164557, |
|
"eval_overall_recall": 0.8846153846153846, |
|
"eval_runtime": 0.2864, |
|
"eval_samples_per_second": 652.876, |
|
"eval_steps_per_second": 10.474, |
|
"step": 1484 |
|
}, |
|
{ |
|
"epoch": 15.0, |
|
"grad_norm": 1.2007865905761719, |
|
"learning_rate": 4.25e-05, |
|
"loss": 0.1141, |
|
"step": 1590 |
|
}, |
|
{ |
|
"epoch": 15.0, |
|
"eval_LOCATION_f1": 0.8611111111111112, |
|
"eval_LOCATION_number": 69, |
|
"eval_LOCATION_precision": 0.8266666666666667, |
|
"eval_LOCATION_recall": 0.8985507246376812, |
|
"eval_ORGANIZATION_f1": 0.6333333333333333, |
|
"eval_ORGANIZATION_number": 58, |
|
"eval_ORGANIZATION_precision": 0.6129032258064516, |
|
"eval_ORGANIZATION_recall": 0.6551724137931034, |
|
"eval_PERSON_f1": 0.8481012658227848, |
|
"eval_PERSON_number": 152, |
|
"eval_PERSON_precision": 0.8170731707317073, |
|
"eval_PERSON_recall": 0.881578947368421, |
|
"eval_QUANTITY_f1": 0.7575757575757577, |
|
"eval_QUANTITY_number": 30, |
|
"eval_QUANTITY_precision": 0.6944444444444444, |
|
"eval_QUANTITY_recall": 0.8333333333333334, |
|
"eval_TIME_f1": 0.8064516129032258, |
|
"eval_TIME_number": 29, |
|
"eval_TIME_precision": 0.7575757575757576, |
|
"eval_TIME_recall": 0.8620689655172413, |
|
"eval_loss": 0.1281883716583252, |
|
"eval_overall_accuracy": 0.9582586427656851, |
|
"eval_overall_f1": 0.8022598870056498, |
|
"eval_overall_precision": 0.7675675675675676, |
|
"eval_overall_recall": 0.8402366863905325, |
|
"eval_runtime": 0.2866, |
|
"eval_samples_per_second": 652.52, |
|
"eval_steps_per_second": 10.468, |
|
"step": 1590 |
|
}, |
|
{ |
|
"epoch": 16.0, |
|
"grad_norm": 0.8597108721733093, |
|
"learning_rate": 4.2e-05, |
|
"loss": 0.1083, |
|
"step": 1696 |
|
}, |
|
{ |
|
"epoch": 16.0, |
|
"eval_LOCATION_f1": 0.8571428571428572, |
|
"eval_LOCATION_number": 69, |
|
"eval_LOCATION_precision": 0.8076923076923077, |
|
"eval_LOCATION_recall": 0.9130434782608695, |
|
"eval_ORGANIZATION_f1": 0.7131782945736435, |
|
"eval_ORGANIZATION_number": 58, |
|
"eval_ORGANIZATION_precision": 0.647887323943662, |
|
"eval_ORGANIZATION_recall": 0.7931034482758621, |
|
"eval_PERSON_f1": 0.8526645768025078, |
|
"eval_PERSON_number": 152, |
|
"eval_PERSON_precision": 0.8143712574850299, |
|
"eval_PERSON_recall": 0.8947368421052632, |
|
"eval_QUANTITY_f1": 0.7272727272727272, |
|
"eval_QUANTITY_number": 30, |
|
"eval_QUANTITY_precision": 0.6666666666666666, |
|
"eval_QUANTITY_recall": 0.8, |
|
"eval_TIME_f1": 0.8253968253968255, |
|
"eval_TIME_number": 29, |
|
"eval_TIME_precision": 0.7647058823529411, |
|
"eval_TIME_recall": 0.896551724137931, |
|
"eval_loss": 0.1355670541524887, |
|
"eval_overall_accuracy": 0.9577464788732394, |
|
"eval_overall_f1": 0.8149171270718233, |
|
"eval_overall_precision": 0.7642487046632125, |
|
"eval_overall_recall": 0.8727810650887574, |
|
"eval_runtime": 0.2918, |
|
"eval_samples_per_second": 640.866, |
|
"eval_steps_per_second": 10.281, |
|
"step": 1696 |
|
}, |
|
{ |
|
"epoch": 17.0, |
|
"grad_norm": 0.9207751154899597, |
|
"learning_rate": 4.15e-05, |
|
"loss": 0.1106, |
|
"step": 1802 |
|
}, |
|
{ |
|
"epoch": 17.0, |
|
"eval_LOCATION_f1": 0.8767123287671235, |
|
"eval_LOCATION_number": 69, |
|
"eval_LOCATION_precision": 0.8311688311688312, |
|
"eval_LOCATION_recall": 0.927536231884058, |
|
"eval_ORGANIZATION_f1": 0.6612903225806452, |
|
"eval_ORGANIZATION_number": 58, |
|
"eval_ORGANIZATION_precision": 0.6212121212121212, |
|
"eval_ORGANIZATION_recall": 0.7068965517241379, |
|
"eval_PERSON_f1": 0.8517350157728707, |
|
"eval_PERSON_number": 152, |
|
"eval_PERSON_precision": 0.8181818181818182, |
|
"eval_PERSON_recall": 0.8881578947368421, |
|
"eval_QUANTITY_f1": 0.7352941176470588, |
|
"eval_QUANTITY_number": 30, |
|
"eval_QUANTITY_precision": 0.6578947368421053, |
|
"eval_QUANTITY_recall": 0.8333333333333334, |
|
"eval_TIME_f1": 0.8064516129032258, |
|
"eval_TIME_number": 29, |
|
"eval_TIME_precision": 0.7575757575757576, |
|
"eval_TIME_recall": 0.8620689655172413, |
|
"eval_loss": 0.1327420026063919, |
|
"eval_overall_accuracy": 0.9585147247119078, |
|
"eval_overall_f1": 0.8089260808926082, |
|
"eval_overall_precision": 0.7651715039577837, |
|
"eval_overall_recall": 0.8579881656804734, |
|
"eval_runtime": 0.2911, |
|
"eval_samples_per_second": 642.326, |
|
"eval_steps_per_second": 10.305, |
|
"step": 1802 |
|
}, |
|
{ |
|
"epoch": 18.0, |
|
"grad_norm": 2.323946952819824, |
|
"learning_rate": 4.1e-05, |
|
"loss": 0.1053, |
|
"step": 1908 |
|
}, |
|
{ |
|
"epoch": 18.0, |
|
"eval_LOCATION_f1": 0.8648648648648648, |
|
"eval_LOCATION_number": 69, |
|
"eval_LOCATION_precision": 0.810126582278481, |
|
"eval_LOCATION_recall": 0.927536231884058, |
|
"eval_ORGANIZATION_f1": 0.6611570247933884, |
|
"eval_ORGANIZATION_number": 58, |
|
"eval_ORGANIZATION_precision": 0.6349206349206349, |
|
"eval_ORGANIZATION_recall": 0.6896551724137931, |
|
"eval_PERSON_f1": 0.8500000000000001, |
|
"eval_PERSON_number": 152, |
|
"eval_PERSON_precision": 0.8095238095238095, |
|
"eval_PERSON_recall": 0.8947368421052632, |
|
"eval_QUANTITY_f1": 0.7246376811594204, |
|
"eval_QUANTITY_number": 30, |
|
"eval_QUANTITY_precision": 0.6410256410256411, |
|
"eval_QUANTITY_recall": 0.8333333333333334, |
|
"eval_TIME_f1": 0.7936507936507937, |
|
"eval_TIME_number": 29, |
|
"eval_TIME_precision": 0.7352941176470589, |
|
"eval_TIME_recall": 0.8620689655172413, |
|
"eval_loss": 0.1359253227710724, |
|
"eval_overall_accuracy": 0.9580025608194622, |
|
"eval_overall_f1": 0.8044382801664354, |
|
"eval_overall_precision": 0.7571801566579635, |
|
"eval_overall_recall": 0.8579881656804734, |
|
"eval_runtime": 0.2865, |
|
"eval_samples_per_second": 652.807, |
|
"eval_steps_per_second": 10.473, |
|
"step": 1908 |
|
}, |
|
{ |
|
"epoch": 19.0, |
|
"grad_norm": 24.915828704833984, |
|
"learning_rate": 4.05e-05, |
|
"loss": 0.1089, |
|
"step": 2014 |
|
}, |
|
{ |
|
"epoch": 19.0, |
|
"eval_LOCATION_f1": 0.8450704225352113, |
|
"eval_LOCATION_number": 69, |
|
"eval_LOCATION_precision": 0.821917808219178, |
|
"eval_LOCATION_recall": 0.8695652173913043, |
|
"eval_ORGANIZATION_f1": 0.584070796460177, |
|
"eval_ORGANIZATION_number": 58, |
|
"eval_ORGANIZATION_precision": 0.6, |
|
"eval_ORGANIZATION_recall": 0.5689655172413793, |
|
"eval_PERSON_f1": 0.8471337579617835, |
|
"eval_PERSON_number": 152, |
|
"eval_PERSON_precision": 0.8209876543209876, |
|
"eval_PERSON_recall": 0.875, |
|
"eval_QUANTITY_f1": 0.8, |
|
"eval_QUANTITY_number": 30, |
|
"eval_QUANTITY_precision": 0.7428571428571429, |
|
"eval_QUANTITY_recall": 0.8666666666666667, |
|
"eval_TIME_f1": 0.8813559322033899, |
|
"eval_TIME_number": 29, |
|
"eval_TIME_precision": 0.8666666666666667, |
|
"eval_TIME_recall": 0.896551724137931, |
|
"eval_loss": 0.12435611337423325, |
|
"eval_overall_accuracy": 0.9595390524967989, |
|
"eval_overall_f1": 0.8023088023088024, |
|
"eval_overall_precision": 0.7830985915492957, |
|
"eval_overall_recall": 0.8224852071005917, |
|
"eval_runtime": 0.2922, |
|
"eval_samples_per_second": 640.081, |
|
"eval_steps_per_second": 10.269, |
|
"step": 2014 |
|
}, |
|
{ |
|
"epoch": 20.0, |
|
"grad_norm": 0.8912884593009949, |
|
"learning_rate": 4e-05, |
|
"loss": 0.1046, |
|
"step": 2120 |
|
}, |
|
{ |
|
"epoch": 20.0, |
|
"eval_LOCATION_f1": 0.863013698630137, |
|
"eval_LOCATION_number": 69, |
|
"eval_LOCATION_precision": 0.8181818181818182, |
|
"eval_LOCATION_recall": 0.9130434782608695, |
|
"eval_ORGANIZATION_f1": 0.6779661016949153, |
|
"eval_ORGANIZATION_number": 58, |
|
"eval_ORGANIZATION_precision": 0.6666666666666666, |
|
"eval_ORGANIZATION_recall": 0.6896551724137931, |
|
"eval_PERSON_f1": 0.85625, |
|
"eval_PERSON_number": 152, |
|
"eval_PERSON_precision": 0.8154761904761905, |
|
"eval_PERSON_recall": 0.9013157894736842, |
|
"eval_QUANTITY_f1": 0.7575757575757577, |
|
"eval_QUANTITY_number": 30, |
|
"eval_QUANTITY_precision": 0.6944444444444444, |
|
"eval_QUANTITY_recall": 0.8333333333333334, |
|
"eval_TIME_f1": 0.7741935483870968, |
|
"eval_TIME_number": 29, |
|
"eval_TIME_precision": 0.7272727272727273, |
|
"eval_TIME_recall": 0.8275862068965517, |
|
"eval_loss": 0.12911909818649292, |
|
"eval_overall_accuracy": 0.9600512163892445, |
|
"eval_overall_f1": 0.8117977528089887, |
|
"eval_overall_precision": 0.7727272727272727, |
|
"eval_overall_recall": 0.8550295857988166, |
|
"eval_runtime": 0.2932, |
|
"eval_samples_per_second": 637.792, |
|
"eval_steps_per_second": 10.232, |
|
"step": 2120 |
|
}, |
|
{ |
|
"epoch": 21.0, |
|
"grad_norm": 0.48920294642448425, |
|
"learning_rate": 3.9500000000000005e-05, |
|
"loss": 0.0965, |
|
"step": 2226 |
|
}, |
|
{ |
|
"epoch": 21.0, |
|
"eval_LOCATION_f1": 0.84, |
|
"eval_LOCATION_number": 69, |
|
"eval_LOCATION_precision": 0.7777777777777778, |
|
"eval_LOCATION_recall": 0.9130434782608695, |
|
"eval_ORGANIZATION_f1": 0.7424242424242424, |
|
"eval_ORGANIZATION_number": 58, |
|
"eval_ORGANIZATION_precision": 0.6621621621621622, |
|
"eval_ORGANIZATION_recall": 0.8448275862068966, |
|
"eval_PERSON_f1": 0.875, |
|
"eval_PERSON_number": 152, |
|
"eval_PERSON_precision": 0.8333333333333334, |
|
"eval_PERSON_recall": 0.9210526315789473, |
|
"eval_QUANTITY_f1": 0.7575757575757577, |
|
"eval_QUANTITY_number": 30, |
|
"eval_QUANTITY_precision": 0.6944444444444444, |
|
"eval_QUANTITY_recall": 0.8333333333333334, |
|
"eval_TIME_f1": 0.7741935483870968, |
|
"eval_TIME_number": 29, |
|
"eval_TIME_precision": 0.7272727272727273, |
|
"eval_TIME_recall": 0.8275862068965517, |
|
"eval_loss": 0.1389300525188446, |
|
"eval_overall_accuracy": 0.9572343149807938, |
|
"eval_overall_f1": 0.8246575342465754, |
|
"eval_overall_precision": 0.7678571428571429, |
|
"eval_overall_recall": 0.8905325443786982, |
|
"eval_runtime": 0.2936, |
|
"eval_samples_per_second": 637.017, |
|
"eval_steps_per_second": 10.22, |
|
"step": 2226 |
|
}, |
|
{ |
|
"epoch": 22.0, |
|
"grad_norm": 1.2225427627563477, |
|
"learning_rate": 3.9000000000000006e-05, |
|
"loss": 0.0958, |
|
"step": 2332 |
|
}, |
|
{ |
|
"epoch": 22.0, |
|
"eval_LOCATION_f1": 0.870748299319728, |
|
"eval_LOCATION_number": 69, |
|
"eval_LOCATION_precision": 0.8205128205128205, |
|
"eval_LOCATION_recall": 0.927536231884058, |
|
"eval_ORGANIZATION_f1": 0.7633587786259542, |
|
"eval_ORGANIZATION_number": 58, |
|
"eval_ORGANIZATION_precision": 0.684931506849315, |
|
"eval_ORGANIZATION_recall": 0.8620689655172413, |
|
"eval_PERSON_f1": 0.8544303797468354, |
|
"eval_PERSON_number": 152, |
|
"eval_PERSON_precision": 0.823170731707317, |
|
"eval_PERSON_recall": 0.8881578947368421, |
|
"eval_QUANTITY_f1": 0.78125, |
|
"eval_QUANTITY_number": 30, |
|
"eval_QUANTITY_precision": 0.7352941176470589, |
|
"eval_QUANTITY_recall": 0.8333333333333334, |
|
"eval_TIME_f1": 0.8333333333333334, |
|
"eval_TIME_number": 29, |
|
"eval_TIME_precision": 0.8064516129032258, |
|
"eval_TIME_recall": 0.8620689655172413, |
|
"eval_loss": 0.1278899759054184, |
|
"eval_overall_accuracy": 0.9618437900128041, |
|
"eval_overall_f1": 0.8328690807799444, |
|
"eval_overall_precision": 0.7868421052631579, |
|
"eval_overall_recall": 0.8846153846153846, |
|
"eval_runtime": 0.2942, |
|
"eval_samples_per_second": 635.574, |
|
"eval_steps_per_second": 10.196, |
|
"step": 2332 |
|
}, |
|
{ |
|
"epoch": 23.0, |
|
"grad_norm": 0.5433982014656067, |
|
"learning_rate": 3.85e-05, |
|
"loss": 0.0929, |
|
"step": 2438 |
|
}, |
|
{ |
|
"epoch": 23.0, |
|
"eval_LOCATION_f1": 0.8591549295774648, |
|
"eval_LOCATION_number": 69, |
|
"eval_LOCATION_precision": 0.8356164383561644, |
|
"eval_LOCATION_recall": 0.8840579710144928, |
|
"eval_ORGANIZATION_f1": 0.6499999999999999, |
|
"eval_ORGANIZATION_number": 58, |
|
"eval_ORGANIZATION_precision": 0.6290322580645161, |
|
"eval_ORGANIZATION_recall": 0.6724137931034483, |
|
"eval_PERSON_f1": 0.8616352201257862, |
|
"eval_PERSON_number": 152, |
|
"eval_PERSON_precision": 0.8253012048192772, |
|
"eval_PERSON_recall": 0.9013157894736842, |
|
"eval_QUANTITY_f1": 0.7936507936507938, |
|
"eval_QUANTITY_number": 30, |
|
"eval_QUANTITY_precision": 0.7575757575757576, |
|
"eval_QUANTITY_recall": 0.8333333333333334, |
|
"eval_TIME_f1": 0.847457627118644, |
|
"eval_TIME_number": 29, |
|
"eval_TIME_precision": 0.8333333333333334, |
|
"eval_TIME_recall": 0.8620689655172413, |
|
"eval_loss": 0.12278664112091064, |
|
"eval_overall_accuracy": 0.9628681177976952, |
|
"eval_overall_f1": 0.8176638176638177, |
|
"eval_overall_precision": 0.7884615384615384, |
|
"eval_overall_recall": 0.849112426035503, |
|
"eval_runtime": 0.2929, |
|
"eval_samples_per_second": 638.552, |
|
"eval_steps_per_second": 10.244, |
|
"step": 2438 |
|
}, |
|
{ |
|
"epoch": 24.0, |
|
"grad_norm": 1.4073636531829834, |
|
"learning_rate": 3.8e-05, |
|
"loss": 0.0934, |
|
"step": 2544 |
|
}, |
|
{ |
|
"epoch": 24.0, |
|
"eval_LOCATION_f1": 0.8648648648648648, |
|
"eval_LOCATION_number": 69, |
|
"eval_LOCATION_precision": 0.810126582278481, |
|
"eval_LOCATION_recall": 0.927536231884058, |
|
"eval_ORGANIZATION_f1": 0.746268656716418, |
|
"eval_ORGANIZATION_number": 58, |
|
"eval_ORGANIZATION_precision": 0.6578947368421053, |
|
"eval_ORGANIZATION_recall": 0.8620689655172413, |
|
"eval_PERSON_f1": 0.8509316770186336, |
|
"eval_PERSON_number": 152, |
|
"eval_PERSON_precision": 0.8058823529411765, |
|
"eval_PERSON_recall": 0.9013157894736842, |
|
"eval_QUANTITY_f1": 0.8125, |
|
"eval_QUANTITY_number": 30, |
|
"eval_QUANTITY_precision": 0.7647058823529411, |
|
"eval_QUANTITY_recall": 0.8666666666666667, |
|
"eval_TIME_f1": 0.8196721311475409, |
|
"eval_TIME_number": 29, |
|
"eval_TIME_precision": 0.78125, |
|
"eval_TIME_recall": 0.8620689655172413, |
|
"eval_loss": 0.13569365441799164, |
|
"eval_overall_accuracy": 0.9595390524967989, |
|
"eval_overall_f1": 0.8285322359396433, |
|
"eval_overall_precision": 0.7723785166240409, |
|
"eval_overall_recall": 0.893491124260355, |
|
"eval_runtime": 0.2923, |
|
"eval_samples_per_second": 639.683, |
|
"eval_steps_per_second": 10.262, |
|
"step": 2544 |
|
}, |
|
{ |
|
"epoch": 25.0, |
|
"grad_norm": 2.3010127544403076, |
|
"learning_rate": 3.7500000000000003e-05, |
|
"loss": 0.0887, |
|
"step": 2650 |
|
}, |
|
{ |
|
"epoch": 25.0, |
|
"eval_LOCATION_f1": 0.8435374149659864, |
|
"eval_LOCATION_number": 69, |
|
"eval_LOCATION_precision": 0.7948717948717948, |
|
"eval_LOCATION_recall": 0.8985507246376812, |
|
"eval_ORGANIZATION_f1": 0.7166666666666668, |
|
"eval_ORGANIZATION_number": 58, |
|
"eval_ORGANIZATION_precision": 0.6935483870967742, |
|
"eval_ORGANIZATION_recall": 0.7413793103448276, |
|
"eval_PERSON_f1": 0.8535031847133758, |
|
"eval_PERSON_number": 152, |
|
"eval_PERSON_precision": 0.8271604938271605, |
|
"eval_PERSON_recall": 0.881578947368421, |
|
"eval_QUANTITY_f1": 0.8125, |
|
"eval_QUANTITY_number": 30, |
|
"eval_QUANTITY_precision": 0.7647058823529411, |
|
"eval_QUANTITY_recall": 0.8666666666666667, |
|
"eval_TIME_f1": 0.7999999999999999, |
|
"eval_TIME_number": 29, |
|
"eval_TIME_precision": 0.7741935483870968, |
|
"eval_TIME_recall": 0.8275862068965517, |
|
"eval_loss": 0.12316982448101044, |
|
"eval_overall_accuracy": 0.9615877080665813, |
|
"eval_overall_f1": 0.8198581560283689, |
|
"eval_overall_precision": 0.7874659400544959, |
|
"eval_overall_recall": 0.8550295857988166, |
|
"eval_runtime": 0.2928, |
|
"eval_samples_per_second": 638.601, |
|
"eval_steps_per_second": 10.245, |
|
"step": 2650 |
|
}, |
|
{ |
|
"epoch": 26.0, |
|
"grad_norm": 1.5638922452926636, |
|
"learning_rate": 3.7e-05, |
|
"loss": 0.1025, |
|
"step": 2756 |
|
}, |
|
{ |
|
"epoch": 26.0, |
|
"eval_LOCATION_f1": 0.870748299319728, |
|
"eval_LOCATION_number": 69, |
|
"eval_LOCATION_precision": 0.8205128205128205, |
|
"eval_LOCATION_recall": 0.927536231884058, |
|
"eval_ORGANIZATION_f1": 0.7716535433070866, |
|
"eval_ORGANIZATION_number": 58, |
|
"eval_ORGANIZATION_precision": 0.7101449275362319, |
|
"eval_ORGANIZATION_recall": 0.8448275862068966, |
|
"eval_PERSON_f1": 0.8616352201257862, |
|
"eval_PERSON_number": 152, |
|
"eval_PERSON_precision": 0.8253012048192772, |
|
"eval_PERSON_recall": 0.9013157894736842, |
|
"eval_QUANTITY_f1": 0.7384615384615385, |
|
"eval_QUANTITY_number": 30, |
|
"eval_QUANTITY_precision": 0.6857142857142857, |
|
"eval_QUANTITY_recall": 0.8, |
|
"eval_TIME_f1": 0.7999999999999999, |
|
"eval_TIME_number": 29, |
|
"eval_TIME_precision": 0.7741935483870968, |
|
"eval_TIME_recall": 0.8275862068965517, |
|
"eval_loss": 0.1349707692861557, |
|
"eval_overall_accuracy": 0.9618437900128041, |
|
"eval_overall_f1": 0.8312412831241283, |
|
"eval_overall_precision": 0.7862796833773087, |
|
"eval_overall_recall": 0.8816568047337278, |
|
"eval_runtime": 0.2929, |
|
"eval_samples_per_second": 638.525, |
|
"eval_steps_per_second": 10.244, |
|
"step": 2756 |
|
}, |
|
{ |
|
"epoch": 27.0, |
|
"grad_norm": 1.3527199029922485, |
|
"learning_rate": 3.65e-05, |
|
"loss": 0.0868, |
|
"step": 2862 |
|
}, |
|
{ |
|
"epoch": 27.0, |
|
"eval_LOCATION_f1": 0.8648648648648648, |
|
"eval_LOCATION_number": 69, |
|
"eval_LOCATION_precision": 0.810126582278481, |
|
"eval_LOCATION_recall": 0.927536231884058, |
|
"eval_ORGANIZATION_f1": 0.7777777777777778, |
|
"eval_ORGANIZATION_number": 58, |
|
"eval_ORGANIZATION_precision": 0.7205882352941176, |
|
"eval_ORGANIZATION_recall": 0.8448275862068966, |
|
"eval_PERSON_f1": 0.860759493670886, |
|
"eval_PERSON_number": 152, |
|
"eval_PERSON_precision": 0.8292682926829268, |
|
"eval_PERSON_recall": 0.8947368421052632, |
|
"eval_QUANTITY_f1": 0.7761194029850748, |
|
"eval_QUANTITY_number": 30, |
|
"eval_QUANTITY_precision": 0.7027027027027027, |
|
"eval_QUANTITY_recall": 0.8666666666666667, |
|
"eval_TIME_f1": 0.7868852459016394, |
|
"eval_TIME_number": 29, |
|
"eval_TIME_precision": 0.75, |
|
"eval_TIME_recall": 0.8275862068965517, |
|
"eval_loss": 0.1333594173192978, |
|
"eval_overall_accuracy": 0.9613316261203585, |
|
"eval_overall_f1": 0.8328690807799444, |
|
"eval_overall_precision": 0.7868421052631579, |
|
"eval_overall_recall": 0.8846153846153846, |
|
"eval_runtime": 0.2923, |
|
"eval_samples_per_second": 639.845, |
|
"eval_steps_per_second": 10.265, |
|
"step": 2862 |
|
}, |
|
{ |
|
"epoch": 28.0, |
|
"grad_norm": 2.2402167320251465, |
|
"learning_rate": 3.6e-05, |
|
"loss": 0.0836, |
|
"step": 2968 |
|
}, |
|
{ |
|
"epoch": 28.0, |
|
"eval_LOCATION_f1": 0.8767123287671235, |
|
"eval_LOCATION_number": 69, |
|
"eval_LOCATION_precision": 0.8311688311688312, |
|
"eval_LOCATION_recall": 0.927536231884058, |
|
"eval_ORGANIZATION_f1": 0.7258064516129032, |
|
"eval_ORGANIZATION_number": 58, |
|
"eval_ORGANIZATION_precision": 0.6818181818181818, |
|
"eval_ORGANIZATION_recall": 0.7758620689655172, |
|
"eval_PERSON_f1": 0.8616352201257862, |
|
"eval_PERSON_number": 152, |
|
"eval_PERSON_precision": 0.8253012048192772, |
|
"eval_PERSON_recall": 0.9013157894736842, |
|
"eval_QUANTITY_f1": 0.7575757575757577, |
|
"eval_QUANTITY_number": 30, |
|
"eval_QUANTITY_precision": 0.6944444444444444, |
|
"eval_QUANTITY_recall": 0.8333333333333334, |
|
"eval_TIME_f1": 0.7419354838709677, |
|
"eval_TIME_number": 29, |
|
"eval_TIME_precision": 0.696969696969697, |
|
"eval_TIME_recall": 0.7931034482758621, |
|
"eval_loss": 0.1318032443523407, |
|
"eval_overall_accuracy": 0.9620998719590269, |
|
"eval_overall_f1": 0.8212290502793296, |
|
"eval_overall_precision": 0.7777777777777778, |
|
"eval_overall_recall": 0.8698224852071006, |
|
"eval_runtime": 0.2923, |
|
"eval_samples_per_second": 639.756, |
|
"eval_steps_per_second": 10.263, |
|
"step": 2968 |
|
}, |
|
{ |
|
"epoch": 29.0, |
|
"grad_norm": 1.1857041120529175, |
|
"learning_rate": 3.55e-05, |
|
"loss": 0.0791, |
|
"step": 3074 |
|
}, |
|
{ |
|
"epoch": 29.0, |
|
"eval_LOCATION_f1": 0.8513513513513514, |
|
"eval_LOCATION_number": 69, |
|
"eval_LOCATION_precision": 0.7974683544303798, |
|
"eval_LOCATION_recall": 0.9130434782608695, |
|
"eval_ORGANIZATION_f1": 0.746031746031746, |
|
"eval_ORGANIZATION_number": 58, |
|
"eval_ORGANIZATION_precision": 0.6911764705882353, |
|
"eval_ORGANIZATION_recall": 0.8103448275862069, |
|
"eval_PERSON_f1": 0.85625, |
|
"eval_PERSON_number": 152, |
|
"eval_PERSON_precision": 0.8154761904761905, |
|
"eval_PERSON_recall": 0.9013157894736842, |
|
"eval_QUANTITY_f1": 0.7936507936507938, |
|
"eval_QUANTITY_number": 30, |
|
"eval_QUANTITY_precision": 0.7575757575757576, |
|
"eval_QUANTITY_recall": 0.8333333333333334, |
|
"eval_TIME_f1": 0.7999999999999999, |
|
"eval_TIME_number": 29, |
|
"eval_TIME_precision": 0.7741935483870968, |
|
"eval_TIME_recall": 0.8275862068965517, |
|
"eval_loss": 0.13442517817020416, |
|
"eval_overall_accuracy": 0.9618437900128041, |
|
"eval_overall_f1": 0.8256624825662484, |
|
"eval_overall_precision": 0.7810026385224275, |
|
"eval_overall_recall": 0.8757396449704142, |
|
"eval_runtime": 0.2926, |
|
"eval_samples_per_second": 639.174, |
|
"eval_steps_per_second": 10.254, |
|
"step": 3074 |
|
}, |
|
{ |
|
"epoch": 30.0, |
|
"grad_norm": 0.6588788032531738, |
|
"learning_rate": 3.5e-05, |
|
"loss": 0.0792, |
|
"step": 3180 |
|
}, |
|
{ |
|
"epoch": 30.0, |
|
"eval_LOCATION_f1": 0.870748299319728, |
|
"eval_LOCATION_number": 69, |
|
"eval_LOCATION_precision": 0.8205128205128205, |
|
"eval_LOCATION_recall": 0.927536231884058, |
|
"eval_ORGANIZATION_f1": 0.7058823529411765, |
|
"eval_ORGANIZATION_number": 58, |
|
"eval_ORGANIZATION_precision": 0.6885245901639344, |
|
"eval_ORGANIZATION_recall": 0.7241379310344828, |
|
"eval_PERSON_f1": 0.8643533123028391, |
|
"eval_PERSON_number": 152, |
|
"eval_PERSON_precision": 0.8303030303030303, |
|
"eval_PERSON_recall": 0.9013157894736842, |
|
"eval_QUANTITY_f1": 0.7936507936507938, |
|
"eval_QUANTITY_number": 30, |
|
"eval_QUANTITY_precision": 0.7575757575757576, |
|
"eval_QUANTITY_recall": 0.8333333333333334, |
|
"eval_TIME_f1": 0.847457627118644, |
|
"eval_TIME_number": 29, |
|
"eval_TIME_precision": 0.8333333333333334, |
|
"eval_TIME_recall": 0.8620689655172413, |
|
"eval_loss": 0.12328661233186722, |
|
"eval_overall_accuracy": 0.9651728553137003, |
|
"eval_overall_f1": 0.8312056737588652, |
|
"eval_overall_precision": 0.7983651226158038, |
|
"eval_overall_recall": 0.8668639053254438, |
|
"eval_runtime": 0.287, |
|
"eval_samples_per_second": 651.586, |
|
"eval_steps_per_second": 10.453, |
|
"step": 3180 |
|
}, |
|
{ |
|
"epoch": 31.0, |
|
"grad_norm": 0.4727123975753784, |
|
"learning_rate": 3.45e-05, |
|
"loss": 0.0772, |
|
"step": 3286 |
|
}, |
|
{ |
|
"epoch": 31.0, |
|
"eval_LOCATION_f1": 0.870748299319728, |
|
"eval_LOCATION_number": 69, |
|
"eval_LOCATION_precision": 0.8205128205128205, |
|
"eval_LOCATION_recall": 0.927536231884058, |
|
"eval_ORGANIZATION_f1": 0.7317073170731708, |
|
"eval_ORGANIZATION_number": 58, |
|
"eval_ORGANIZATION_precision": 0.6923076923076923, |
|
"eval_ORGANIZATION_recall": 0.7758620689655172, |
|
"eval_PERSON_f1": 0.8652037617554859, |
|
"eval_PERSON_number": 152, |
|
"eval_PERSON_precision": 0.8263473053892215, |
|
"eval_PERSON_recall": 0.9078947368421053, |
|
"eval_QUANTITY_f1": 0.7936507936507938, |
|
"eval_QUANTITY_number": 30, |
|
"eval_QUANTITY_precision": 0.7575757575757576, |
|
"eval_QUANTITY_recall": 0.8333333333333334, |
|
"eval_TIME_f1": 0.8135593220338982, |
|
"eval_TIME_number": 29, |
|
"eval_TIME_precision": 0.8, |
|
"eval_TIME_recall": 0.8275862068965517, |
|
"eval_loss": 0.1277562379837036, |
|
"eval_overall_accuracy": 0.9646606914212548, |
|
"eval_overall_f1": 0.8326300984528833, |
|
"eval_overall_precision": 0.7935656836461126, |
|
"eval_overall_recall": 0.8757396449704142, |
|
"eval_runtime": 0.2916, |
|
"eval_samples_per_second": 641.192, |
|
"eval_steps_per_second": 10.287, |
|
"step": 3286 |
|
}, |
|
{ |
|
"epoch": 32.0, |
|
"grad_norm": 0.8663144111633301, |
|
"learning_rate": 3.4000000000000007e-05, |
|
"loss": 0.0766, |
|
"step": 3392 |
|
}, |
|
{ |
|
"epoch": 32.0, |
|
"eval_LOCATION_f1": 0.870748299319728, |
|
"eval_LOCATION_number": 69, |
|
"eval_LOCATION_precision": 0.8205128205128205, |
|
"eval_LOCATION_recall": 0.927536231884058, |
|
"eval_ORGANIZATION_f1": 0.7244094488188977, |
|
"eval_ORGANIZATION_number": 58, |
|
"eval_ORGANIZATION_precision": 0.6666666666666666, |
|
"eval_ORGANIZATION_recall": 0.7931034482758621, |
|
"eval_PERSON_f1": 0.8544303797468354, |
|
"eval_PERSON_number": 152, |
|
"eval_PERSON_precision": 0.823170731707317, |
|
"eval_PERSON_recall": 0.8881578947368421, |
|
"eval_QUANTITY_f1": 0.7936507936507938, |
|
"eval_QUANTITY_number": 30, |
|
"eval_QUANTITY_precision": 0.7575757575757576, |
|
"eval_QUANTITY_recall": 0.8333333333333334, |
|
"eval_TIME_f1": 0.8135593220338982, |
|
"eval_TIME_number": 29, |
|
"eval_TIME_precision": 0.8, |
|
"eval_TIME_recall": 0.8275862068965517, |
|
"eval_loss": 0.12748569250106812, |
|
"eval_overall_accuracy": 0.9638924455825865, |
|
"eval_overall_f1": 0.8258426966292135, |
|
"eval_overall_precision": 0.786096256684492, |
|
"eval_overall_recall": 0.8698224852071006, |
|
"eval_runtime": 0.287, |
|
"eval_samples_per_second": 651.573, |
|
"eval_steps_per_second": 10.453, |
|
"step": 3392 |
|
}, |
|
{ |
|
"epoch": 33.0, |
|
"grad_norm": 0.6088622808456421, |
|
"learning_rate": 3.35e-05, |
|
"loss": 0.0746, |
|
"step": 3498 |
|
}, |
|
{ |
|
"epoch": 33.0, |
|
"eval_LOCATION_f1": 0.8648648648648648, |
|
"eval_LOCATION_number": 69, |
|
"eval_LOCATION_precision": 0.810126582278481, |
|
"eval_LOCATION_recall": 0.927536231884058, |
|
"eval_ORGANIZATION_f1": 0.7401574803149606, |
|
"eval_ORGANIZATION_number": 58, |
|
"eval_ORGANIZATION_precision": 0.6811594202898551, |
|
"eval_ORGANIZATION_recall": 0.8103448275862069, |
|
"eval_PERSON_f1": 0.8507936507936509, |
|
"eval_PERSON_number": 152, |
|
"eval_PERSON_precision": 0.8220858895705522, |
|
"eval_PERSON_recall": 0.881578947368421, |
|
"eval_QUANTITY_f1": 0.8253968253968254, |
|
"eval_QUANTITY_number": 30, |
|
"eval_QUANTITY_precision": 0.7878787878787878, |
|
"eval_QUANTITY_recall": 0.8666666666666667, |
|
"eval_TIME_f1": 0.8135593220338982, |
|
"eval_TIME_number": 29, |
|
"eval_TIME_precision": 0.8, |
|
"eval_TIME_recall": 0.8275862068965517, |
|
"eval_loss": 0.13140520453453064, |
|
"eval_overall_accuracy": 0.9636363636363636, |
|
"eval_overall_f1": 0.8286516853932584, |
|
"eval_overall_precision": 0.7887700534759359, |
|
"eval_overall_recall": 0.8727810650887574, |
|
"eval_runtime": 0.293, |
|
"eval_samples_per_second": 638.168, |
|
"eval_steps_per_second": 10.238, |
|
"step": 3498 |
|
}, |
|
{ |
|
"epoch": 34.0, |
|
"grad_norm": 1.8929836750030518, |
|
"learning_rate": 3.3e-05, |
|
"loss": 0.072, |
|
"step": 3604 |
|
}, |
|
{ |
|
"epoch": 34.0, |
|
"eval_LOCATION_f1": 0.8648648648648648, |
|
"eval_LOCATION_number": 69, |
|
"eval_LOCATION_precision": 0.810126582278481, |
|
"eval_LOCATION_recall": 0.927536231884058, |
|
"eval_ORGANIZATION_f1": 0.7559055118110236, |
|
"eval_ORGANIZATION_number": 58, |
|
"eval_ORGANIZATION_precision": 0.6956521739130435, |
|
"eval_ORGANIZATION_recall": 0.8275862068965517, |
|
"eval_PERSON_f1": 0.8626198083067094, |
|
"eval_PERSON_number": 152, |
|
"eval_PERSON_precision": 0.8385093167701864, |
|
"eval_PERSON_recall": 0.8881578947368421, |
|
"eval_QUANTITY_f1": 0.8253968253968254, |
|
"eval_QUANTITY_number": 30, |
|
"eval_QUANTITY_precision": 0.7878787878787878, |
|
"eval_QUANTITY_recall": 0.8666666666666667, |
|
"eval_TIME_f1": 0.8135593220338982, |
|
"eval_TIME_number": 29, |
|
"eval_TIME_precision": 0.8, |
|
"eval_TIME_recall": 0.8275862068965517, |
|
"eval_loss": 0.13353487849235535, |
|
"eval_overall_accuracy": 0.9638924455825865, |
|
"eval_overall_f1": 0.8366197183098592, |
|
"eval_overall_precision": 0.7983870967741935, |
|
"eval_overall_recall": 0.878698224852071, |
|
"eval_runtime": 0.293, |
|
"eval_samples_per_second": 638.242, |
|
"eval_steps_per_second": 10.239, |
|
"step": 3604 |
|
}, |
|
{ |
|
"epoch": 35.0, |
|
"grad_norm": 1.197149634361267, |
|
"learning_rate": 3.2500000000000004e-05, |
|
"loss": 0.0712, |
|
"step": 3710 |
|
}, |
|
{ |
|
"epoch": 35.0, |
|
"eval_LOCATION_f1": 0.8648648648648648, |
|
"eval_LOCATION_number": 69, |
|
"eval_LOCATION_precision": 0.810126582278481, |
|
"eval_LOCATION_recall": 0.927536231884058, |
|
"eval_ORGANIZATION_f1": 0.7377049180327868, |
|
"eval_ORGANIZATION_number": 58, |
|
"eval_ORGANIZATION_precision": 0.703125, |
|
"eval_ORGANIZATION_recall": 0.7758620689655172, |
|
"eval_PERSON_f1": 0.8625, |
|
"eval_PERSON_number": 152, |
|
"eval_PERSON_precision": 0.8214285714285714, |
|
"eval_PERSON_recall": 0.9078947368421053, |
|
"eval_QUANTITY_f1": 0.8, |
|
"eval_QUANTITY_number": 30, |
|
"eval_QUANTITY_precision": 0.7428571428571429, |
|
"eval_QUANTITY_recall": 0.8666666666666667, |
|
"eval_TIME_f1": 0.847457627118644, |
|
"eval_TIME_number": 29, |
|
"eval_TIME_precision": 0.8333333333333334, |
|
"eval_TIME_recall": 0.8620689655172413, |
|
"eval_loss": 0.13137878477573395, |
|
"eval_overall_accuracy": 0.9638924455825865, |
|
"eval_overall_f1": 0.8347338935574229, |
|
"eval_overall_precision": 0.7925531914893617, |
|
"eval_overall_recall": 0.8816568047337278, |
|
"eval_runtime": 0.2864, |
|
"eval_samples_per_second": 652.975, |
|
"eval_steps_per_second": 10.476, |
|
"step": 3710 |
|
}, |
|
{ |
|
"epoch": 36.0, |
|
"grad_norm": 0.49242687225341797, |
|
"learning_rate": 3.2000000000000005e-05, |
|
"loss": 0.0702, |
|
"step": 3816 |
|
}, |
|
{ |
|
"epoch": 36.0, |
|
"eval_LOCATION_f1": 0.8611111111111112, |
|
"eval_LOCATION_number": 69, |
|
"eval_LOCATION_precision": 0.8266666666666667, |
|
"eval_LOCATION_recall": 0.8985507246376812, |
|
"eval_ORGANIZATION_f1": 0.7230769230769231, |
|
"eval_ORGANIZATION_number": 58, |
|
"eval_ORGANIZATION_precision": 0.6527777777777778, |
|
"eval_ORGANIZATION_recall": 0.8103448275862069, |
|
"eval_PERSON_f1": 0.8626198083067094, |
|
"eval_PERSON_number": 152, |
|
"eval_PERSON_precision": 0.8385093167701864, |
|
"eval_PERSON_recall": 0.8881578947368421, |
|
"eval_QUANTITY_f1": 0.8253968253968254, |
|
"eval_QUANTITY_number": 30, |
|
"eval_QUANTITY_precision": 0.7878787878787878, |
|
"eval_QUANTITY_recall": 0.8666666666666667, |
|
"eval_TIME_f1": 0.8135593220338982, |
|
"eval_TIME_number": 29, |
|
"eval_TIME_precision": 0.8, |
|
"eval_TIME_recall": 0.8275862068965517, |
|
"eval_loss": 0.13032355904579163, |
|
"eval_overall_accuracy": 0.9641485275288092, |
|
"eval_overall_f1": 0.8293370944992947, |
|
"eval_overall_precision": 0.7924528301886793, |
|
"eval_overall_recall": 0.8698224852071006, |
|
"eval_runtime": 0.2939, |
|
"eval_samples_per_second": 636.252, |
|
"eval_steps_per_second": 10.207, |
|
"step": 3816 |
|
}, |
|
{ |
|
"epoch": 37.0, |
|
"grad_norm": 2.0146589279174805, |
|
"learning_rate": 3.15e-05, |
|
"loss": 0.0695, |
|
"step": 3922 |
|
}, |
|
{ |
|
"epoch": 37.0, |
|
"eval_LOCATION_f1": 0.882758620689655, |
|
"eval_LOCATION_number": 69, |
|
"eval_LOCATION_precision": 0.8421052631578947, |
|
"eval_LOCATION_recall": 0.927536231884058, |
|
"eval_ORGANIZATION_f1": 0.7580645161290323, |
|
"eval_ORGANIZATION_number": 58, |
|
"eval_ORGANIZATION_precision": 0.7121212121212122, |
|
"eval_ORGANIZATION_recall": 0.8103448275862069, |
|
"eval_PERSON_f1": 0.8616352201257862, |
|
"eval_PERSON_number": 152, |
|
"eval_PERSON_precision": 0.8253012048192772, |
|
"eval_PERSON_recall": 0.9013157894736842, |
|
"eval_QUANTITY_f1": 0.7936507936507938, |
|
"eval_QUANTITY_number": 30, |
|
"eval_QUANTITY_precision": 0.7575757575757576, |
|
"eval_QUANTITY_recall": 0.8333333333333334, |
|
"eval_TIME_f1": 0.847457627118644, |
|
"eval_TIME_number": 29, |
|
"eval_TIME_precision": 0.8333333333333334, |
|
"eval_TIME_recall": 0.8620689655172413, |
|
"eval_loss": 0.12965013086795807, |
|
"eval_overall_accuracy": 0.9649167733674776, |
|
"eval_overall_f1": 0.840620592383639, |
|
"eval_overall_precision": 0.8032345013477089, |
|
"eval_overall_recall": 0.8816568047337278, |
|
"eval_runtime": 0.2929, |
|
"eval_samples_per_second": 638.49, |
|
"eval_steps_per_second": 10.243, |
|
"step": 3922 |
|
}, |
|
{ |
|
"epoch": 38.0, |
|
"grad_norm": 0.8112408518791199, |
|
"learning_rate": 3.1e-05, |
|
"loss": 0.0674, |
|
"step": 4028 |
|
}, |
|
{ |
|
"epoch": 38.0, |
|
"eval_LOCATION_f1": 0.8767123287671235, |
|
"eval_LOCATION_number": 69, |
|
"eval_LOCATION_precision": 0.8311688311688312, |
|
"eval_LOCATION_recall": 0.927536231884058, |
|
"eval_ORGANIZATION_f1": 0.7419354838709677, |
|
"eval_ORGANIZATION_number": 58, |
|
"eval_ORGANIZATION_precision": 0.696969696969697, |
|
"eval_ORGANIZATION_recall": 0.7931034482758621, |
|
"eval_PERSON_f1": 0.8706624605678233, |
|
"eval_PERSON_number": 152, |
|
"eval_PERSON_precision": 0.8363636363636363, |
|
"eval_PERSON_recall": 0.9078947368421053, |
|
"eval_QUANTITY_f1": 0.7536231884057971, |
|
"eval_QUANTITY_number": 30, |
|
"eval_QUANTITY_precision": 0.6666666666666666, |
|
"eval_QUANTITY_recall": 0.8666666666666667, |
|
"eval_TIME_f1": 0.847457627118644, |
|
"eval_TIME_number": 29, |
|
"eval_TIME_precision": 0.8333333333333334, |
|
"eval_TIME_recall": 0.8620689655172413, |
|
"eval_loss": 0.1362360268831253, |
|
"eval_overall_accuracy": 0.9638924455825865, |
|
"eval_overall_f1": 0.8363636363636363, |
|
"eval_overall_precision": 0.7931034482758621, |
|
"eval_overall_recall": 0.8846153846153846, |
|
"eval_runtime": 0.2929, |
|
"eval_samples_per_second": 638.407, |
|
"eval_steps_per_second": 10.242, |
|
"step": 4028 |
|
}, |
|
{ |
|
"epoch": 39.0, |
|
"grad_norm": 0.4772998094558716, |
|
"learning_rate": 3.05e-05, |
|
"loss": 0.0653, |
|
"step": 4134 |
|
}, |
|
{ |
|
"epoch": 39.0, |
|
"eval_LOCATION_f1": 0.8767123287671235, |
|
"eval_LOCATION_number": 69, |
|
"eval_LOCATION_precision": 0.8311688311688312, |
|
"eval_LOCATION_recall": 0.927536231884058, |
|
"eval_ORGANIZATION_f1": 0.6942148760330579, |
|
"eval_ORGANIZATION_number": 58, |
|
"eval_ORGANIZATION_precision": 0.6666666666666666, |
|
"eval_ORGANIZATION_recall": 0.7241379310344828, |
|
"eval_PERSON_f1": 0.8580441640378549, |
|
"eval_PERSON_number": 152, |
|
"eval_PERSON_precision": 0.8242424242424242, |
|
"eval_PERSON_recall": 0.8947368421052632, |
|
"eval_QUANTITY_f1": 0.7936507936507938, |
|
"eval_QUANTITY_number": 30, |
|
"eval_QUANTITY_precision": 0.7575757575757576, |
|
"eval_QUANTITY_recall": 0.8333333333333334, |
|
"eval_TIME_f1": 0.847457627118644, |
|
"eval_TIME_number": 29, |
|
"eval_TIME_precision": 0.8333333333333334, |
|
"eval_TIME_recall": 0.8620689655172413, |
|
"eval_loss": 0.12953267991542816, |
|
"eval_overall_accuracy": 0.964404609475032, |
|
"eval_overall_f1": 0.8271954674220963, |
|
"eval_overall_precision": 0.7934782608695652, |
|
"eval_overall_recall": 0.863905325443787, |
|
"eval_runtime": 0.2928, |
|
"eval_samples_per_second": 638.701, |
|
"eval_steps_per_second": 10.247, |
|
"step": 4134 |
|
}, |
|
{ |
|
"epoch": 40.0, |
|
"grad_norm": 1.1962645053863525, |
|
"learning_rate": 3e-05, |
|
"loss": 0.0637, |
|
"step": 4240 |
|
}, |
|
{ |
|
"epoch": 40.0, |
|
"eval_LOCATION_f1": 0.8533333333333333, |
|
"eval_LOCATION_number": 69, |
|
"eval_LOCATION_precision": 0.7901234567901234, |
|
"eval_LOCATION_recall": 0.927536231884058, |
|
"eval_ORGANIZATION_f1": 0.7258064516129032, |
|
"eval_ORGANIZATION_number": 58, |
|
"eval_ORGANIZATION_precision": 0.6818181818181818, |
|
"eval_ORGANIZATION_recall": 0.7758620689655172, |
|
"eval_PERSON_f1": 0.8761904761904762, |
|
"eval_PERSON_number": 152, |
|
"eval_PERSON_precision": 0.8466257668711656, |
|
"eval_PERSON_recall": 0.9078947368421053, |
|
"eval_QUANTITY_f1": 0.8125, |
|
"eval_QUANTITY_number": 30, |
|
"eval_QUANTITY_precision": 0.7647058823529411, |
|
"eval_QUANTITY_recall": 0.8666666666666667, |
|
"eval_TIME_f1": 0.7999999999999999, |
|
"eval_TIME_number": 29, |
|
"eval_TIME_precision": 0.7741935483870968, |
|
"eval_TIME_recall": 0.8275862068965517, |
|
"eval_loss": 0.13492895662784576, |
|
"eval_overall_accuracy": 0.9638924455825865, |
|
"eval_overall_f1": 0.8330995792426368, |
|
"eval_overall_precision": 0.792, |
|
"eval_overall_recall": 0.878698224852071, |
|
"eval_runtime": 0.2867, |
|
"eval_samples_per_second": 652.21, |
|
"eval_steps_per_second": 10.463, |
|
"step": 4240 |
|
}, |
|
{ |
|
"epoch": 41.0, |
|
"grad_norm": 0.6804232597351074, |
|
"learning_rate": 2.95e-05, |
|
"loss": 0.0634, |
|
"step": 4346 |
|
}, |
|
{ |
|
"epoch": 41.0, |
|
"eval_LOCATION_f1": 0.8749999999999999, |
|
"eval_LOCATION_number": 69, |
|
"eval_LOCATION_precision": 0.84, |
|
"eval_LOCATION_recall": 0.9130434782608695, |
|
"eval_ORGANIZATION_f1": 0.7619047619047619, |
|
"eval_ORGANIZATION_number": 58, |
|
"eval_ORGANIZATION_precision": 0.7058823529411765, |
|
"eval_ORGANIZATION_recall": 0.8275862068965517, |
|
"eval_PERSON_f1": 0.8742138364779874, |
|
"eval_PERSON_number": 152, |
|
"eval_PERSON_precision": 0.8373493975903614, |
|
"eval_PERSON_recall": 0.9144736842105263, |
|
"eval_QUANTITY_f1": 0.7936507936507938, |
|
"eval_QUANTITY_number": 30, |
|
"eval_QUANTITY_precision": 0.7575757575757576, |
|
"eval_QUANTITY_recall": 0.8333333333333334, |
|
"eval_TIME_f1": 0.7999999999999999, |
|
"eval_TIME_number": 29, |
|
"eval_TIME_precision": 0.7741935483870968, |
|
"eval_TIME_recall": 0.8275862068965517, |
|
"eval_loss": 0.1353294402360916, |
|
"eval_overall_accuracy": 0.9651728553137003, |
|
"eval_overall_f1": 0.8410689170182841, |
|
"eval_overall_precision": 0.8016085790884718, |
|
"eval_overall_recall": 0.8846153846153846, |
|
"eval_runtime": 0.2941, |
|
"eval_samples_per_second": 635.842, |
|
"eval_steps_per_second": 10.201, |
|
"step": 4346 |
|
}, |
|
{ |
|
"epoch": 42.0, |
|
"grad_norm": 1.3958626985549927, |
|
"learning_rate": 2.9e-05, |
|
"loss": 0.0622, |
|
"step": 4452 |
|
}, |
|
{ |
|
"epoch": 42.0, |
|
"eval_LOCATION_f1": 0.8767123287671235, |
|
"eval_LOCATION_number": 69, |
|
"eval_LOCATION_precision": 0.8311688311688312, |
|
"eval_LOCATION_recall": 0.927536231884058, |
|
"eval_ORGANIZATION_f1": 0.7154471544715447, |
|
"eval_ORGANIZATION_number": 58, |
|
"eval_ORGANIZATION_precision": 0.676923076923077, |
|
"eval_ORGANIZATION_recall": 0.7586206896551724, |
|
"eval_PERSON_f1": 0.8769716088328074, |
|
"eval_PERSON_number": 152, |
|
"eval_PERSON_precision": 0.8424242424242424, |
|
"eval_PERSON_recall": 0.9144736842105263, |
|
"eval_QUANTITY_f1": 0.78125, |
|
"eval_QUANTITY_number": 30, |
|
"eval_QUANTITY_precision": 0.7352941176470589, |
|
"eval_QUANTITY_recall": 0.8333333333333334, |
|
"eval_TIME_f1": 0.847457627118644, |
|
"eval_TIME_number": 29, |
|
"eval_TIME_precision": 0.8333333333333334, |
|
"eval_TIME_recall": 0.8620689655172413, |
|
"eval_loss": 0.13502123951911926, |
|
"eval_overall_accuracy": 0.9649167733674776, |
|
"eval_overall_f1": 0.8377997179125528, |
|
"eval_overall_precision": 0.8005390835579514, |
|
"eval_overall_recall": 0.878698224852071, |
|
"eval_runtime": 0.2888, |
|
"eval_samples_per_second": 647.481, |
|
"eval_steps_per_second": 10.387, |
|
"step": 4452 |
|
}, |
|
{ |
|
"epoch": 43.0, |
|
"grad_norm": 1.7736326456069946, |
|
"learning_rate": 2.8499999999999998e-05, |
|
"loss": 0.0616, |
|
"step": 4558 |
|
}, |
|
{ |
|
"epoch": 43.0, |
|
"eval_LOCATION_f1": 0.882758620689655, |
|
"eval_LOCATION_number": 69, |
|
"eval_LOCATION_precision": 0.8421052631578947, |
|
"eval_LOCATION_recall": 0.927536231884058, |
|
"eval_ORGANIZATION_f1": 0.752, |
|
"eval_ORGANIZATION_number": 58, |
|
"eval_ORGANIZATION_precision": 0.7014925373134329, |
|
"eval_ORGANIZATION_recall": 0.8103448275862069, |
|
"eval_PERSON_f1": 0.8742138364779874, |
|
"eval_PERSON_number": 152, |
|
"eval_PERSON_precision": 0.8373493975903614, |
|
"eval_PERSON_recall": 0.9144736842105263, |
|
"eval_QUANTITY_f1": 0.8125, |
|
"eval_QUANTITY_number": 30, |
|
"eval_QUANTITY_precision": 0.7647058823529411, |
|
"eval_QUANTITY_recall": 0.8666666666666667, |
|
"eval_TIME_f1": 0.8333333333333334, |
|
"eval_TIME_number": 29, |
|
"eval_TIME_precision": 0.8064516129032258, |
|
"eval_TIME_recall": 0.8620689655172413, |
|
"eval_loss": 0.1341027021408081, |
|
"eval_overall_accuracy": 0.9654289372599232, |
|
"eval_overall_f1": 0.8455056179775281, |
|
"eval_overall_precision": 0.8048128342245989, |
|
"eval_overall_recall": 0.8905325443786982, |
|
"eval_runtime": 0.2927, |
|
"eval_samples_per_second": 638.914, |
|
"eval_steps_per_second": 10.25, |
|
"step": 4558 |
|
}, |
|
{ |
|
"epoch": 44.0, |
|
"grad_norm": 4.0435028076171875, |
|
"learning_rate": 2.8000000000000003e-05, |
|
"loss": 0.0603, |
|
"step": 4664 |
|
}, |
|
{ |
|
"epoch": 44.0, |
|
"eval_LOCATION_f1": 0.8476821192052981, |
|
"eval_LOCATION_number": 69, |
|
"eval_LOCATION_precision": 0.7804878048780488, |
|
"eval_LOCATION_recall": 0.927536231884058, |
|
"eval_ORGANIZATION_f1": 0.7286821705426356, |
|
"eval_ORGANIZATION_number": 58, |
|
"eval_ORGANIZATION_precision": 0.6619718309859155, |
|
"eval_ORGANIZATION_recall": 0.8103448275862069, |
|
"eval_PERSON_f1": 0.8714733542319749, |
|
"eval_PERSON_number": 152, |
|
"eval_PERSON_precision": 0.8323353293413174, |
|
"eval_PERSON_recall": 0.9144736842105263, |
|
"eval_QUANTITY_f1": 0.78125, |
|
"eval_QUANTITY_number": 30, |
|
"eval_QUANTITY_precision": 0.7352941176470589, |
|
"eval_QUANTITY_recall": 0.8333333333333334, |
|
"eval_TIME_f1": 0.847457627118644, |
|
"eval_TIME_number": 29, |
|
"eval_TIME_precision": 0.8333333333333334, |
|
"eval_TIME_recall": 0.8620689655172413, |
|
"eval_loss": 0.14106552302837372, |
|
"eval_overall_accuracy": 0.9628681177976952, |
|
"eval_overall_f1": 0.8310249307479224, |
|
"eval_overall_precision": 0.78125, |
|
"eval_overall_recall": 0.8875739644970414, |
|
"eval_runtime": 0.2883, |
|
"eval_samples_per_second": 648.632, |
|
"eval_steps_per_second": 10.406, |
|
"step": 4664 |
|
}, |
|
{ |
|
"epoch": 45.0, |
|
"grad_norm": 1.2470722198486328, |
|
"learning_rate": 2.7500000000000004e-05, |
|
"loss": 0.0597, |
|
"step": 4770 |
|
}, |
|
{ |
|
"epoch": 45.0, |
|
"eval_LOCATION_f1": 0.870748299319728, |
|
"eval_LOCATION_number": 69, |
|
"eval_LOCATION_precision": 0.8205128205128205, |
|
"eval_LOCATION_recall": 0.927536231884058, |
|
"eval_ORGANIZATION_f1": 0.7286821705426356, |
|
"eval_ORGANIZATION_number": 58, |
|
"eval_ORGANIZATION_precision": 0.6619718309859155, |
|
"eval_ORGANIZATION_recall": 0.8103448275862069, |
|
"eval_PERSON_f1": 0.8652037617554859, |
|
"eval_PERSON_number": 152, |
|
"eval_PERSON_precision": 0.8263473053892215, |
|
"eval_PERSON_recall": 0.9078947368421053, |
|
"eval_QUANTITY_f1": 0.7352941176470588, |
|
"eval_QUANTITY_number": 30, |
|
"eval_QUANTITY_precision": 0.6578947368421053, |
|
"eval_QUANTITY_recall": 0.8333333333333334, |
|
"eval_TIME_f1": 0.7999999999999999, |
|
"eval_TIME_number": 29, |
|
"eval_TIME_precision": 0.7741935483870968, |
|
"eval_TIME_recall": 0.8275862068965517, |
|
"eval_loss": 0.14016938209533691, |
|
"eval_overall_accuracy": 0.9620998719590269, |
|
"eval_overall_f1": 0.8243430152143846, |
|
"eval_overall_precision": 0.7740259740259741, |
|
"eval_overall_recall": 0.8816568047337278, |
|
"eval_runtime": 0.2928, |
|
"eval_samples_per_second": 638.618, |
|
"eval_steps_per_second": 10.245, |
|
"step": 4770 |
|
}, |
|
{ |
|
"epoch": 46.0, |
|
"grad_norm": 0.7653511762619019, |
|
"learning_rate": 2.7000000000000002e-05, |
|
"loss": 0.059, |
|
"step": 4876 |
|
}, |
|
{ |
|
"epoch": 46.0, |
|
"eval_LOCATION_f1": 0.8767123287671235, |
|
"eval_LOCATION_number": 69, |
|
"eval_LOCATION_precision": 0.8311688311688312, |
|
"eval_LOCATION_recall": 0.927536231884058, |
|
"eval_ORGANIZATION_f1": 0.736, |
|
"eval_ORGANIZATION_number": 58, |
|
"eval_ORGANIZATION_precision": 0.6865671641791045, |
|
"eval_ORGANIZATION_recall": 0.7931034482758621, |
|
"eval_PERSON_f1": 0.8670886075949367, |
|
"eval_PERSON_number": 152, |
|
"eval_PERSON_precision": 0.8353658536585366, |
|
"eval_PERSON_recall": 0.9013157894736842, |
|
"eval_QUANTITY_f1": 0.78125, |
|
"eval_QUANTITY_number": 30, |
|
"eval_QUANTITY_precision": 0.7352941176470589, |
|
"eval_QUANTITY_recall": 0.8333333333333334, |
|
"eval_TIME_f1": 0.7999999999999999, |
|
"eval_TIME_number": 29, |
|
"eval_TIME_precision": 0.7741935483870968, |
|
"eval_TIME_recall": 0.8275862068965517, |
|
"eval_loss": 0.13417667150497437, |
|
"eval_overall_accuracy": 0.9649167733674776, |
|
"eval_overall_f1": 0.8326300984528833, |
|
"eval_overall_precision": 0.7935656836461126, |
|
"eval_overall_recall": 0.8757396449704142, |
|
"eval_runtime": 0.2925, |
|
"eval_samples_per_second": 639.217, |
|
"eval_steps_per_second": 10.255, |
|
"step": 4876 |
|
}, |
|
{ |
|
"epoch": 47.0, |
|
"grad_norm": 1.0474615097045898, |
|
"learning_rate": 2.6500000000000004e-05, |
|
"loss": 0.0574, |
|
"step": 4982 |
|
}, |
|
{ |
|
"epoch": 47.0, |
|
"eval_LOCATION_f1": 0.8767123287671235, |
|
"eval_LOCATION_number": 69, |
|
"eval_LOCATION_precision": 0.8311688311688312, |
|
"eval_LOCATION_recall": 0.927536231884058, |
|
"eval_ORGANIZATION_f1": 0.736, |
|
"eval_ORGANIZATION_number": 58, |
|
"eval_ORGANIZATION_precision": 0.6865671641791045, |
|
"eval_ORGANIZATION_recall": 0.7931034482758621, |
|
"eval_PERSON_f1": 0.860759493670886, |
|
"eval_PERSON_number": 152, |
|
"eval_PERSON_precision": 0.8292682926829268, |
|
"eval_PERSON_recall": 0.8947368421052632, |
|
"eval_QUANTITY_f1": 0.7575757575757577, |
|
"eval_QUANTITY_number": 30, |
|
"eval_QUANTITY_precision": 0.6944444444444444, |
|
"eval_QUANTITY_recall": 0.8333333333333334, |
|
"eval_TIME_f1": 0.7796610169491527, |
|
"eval_TIME_number": 29, |
|
"eval_TIME_precision": 0.7666666666666667, |
|
"eval_TIME_recall": 0.7931034482758621, |
|
"eval_loss": 0.13553491234779358, |
|
"eval_overall_accuracy": 0.9638924455825865, |
|
"eval_overall_f1": 0.8258426966292135, |
|
"eval_overall_precision": 0.786096256684492, |
|
"eval_overall_recall": 0.8698224852071006, |
|
"eval_runtime": 0.2928, |
|
"eval_samples_per_second": 638.657, |
|
"eval_steps_per_second": 10.246, |
|
"step": 4982 |
|
}, |
|
{ |
|
"epoch": 48.0, |
|
"grad_norm": 1.1858253479003906, |
|
"learning_rate": 2.6000000000000002e-05, |
|
"loss": 0.0581, |
|
"step": 5088 |
|
}, |
|
{ |
|
"epoch": 48.0, |
|
"eval_LOCATION_f1": 0.8767123287671235, |
|
"eval_LOCATION_number": 69, |
|
"eval_LOCATION_precision": 0.8311688311688312, |
|
"eval_LOCATION_recall": 0.927536231884058, |
|
"eval_ORGANIZATION_f1": 0.7377049180327868, |
|
"eval_ORGANIZATION_number": 58, |
|
"eval_ORGANIZATION_precision": 0.703125, |
|
"eval_ORGANIZATION_recall": 0.7758620689655172, |
|
"eval_PERSON_f1": 0.8670886075949367, |
|
"eval_PERSON_number": 152, |
|
"eval_PERSON_precision": 0.8353658536585366, |
|
"eval_PERSON_recall": 0.9013157894736842, |
|
"eval_QUANTITY_f1": 0.78125, |
|
"eval_QUANTITY_number": 30, |
|
"eval_QUANTITY_precision": 0.7352941176470589, |
|
"eval_QUANTITY_recall": 0.8333333333333334, |
|
"eval_TIME_f1": 0.8666666666666666, |
|
"eval_TIME_number": 29, |
|
"eval_TIME_precision": 0.8387096774193549, |
|
"eval_TIME_recall": 0.896551724137931, |
|
"eval_loss": 0.13520203530788422, |
|
"eval_overall_accuracy": 0.9659411011523688, |
|
"eval_overall_f1": 0.8389830508474576, |
|
"eval_overall_precision": 0.8027027027027027, |
|
"eval_overall_recall": 0.878698224852071, |
|
"eval_runtime": 0.2932, |
|
"eval_samples_per_second": 637.868, |
|
"eval_steps_per_second": 10.233, |
|
"step": 5088 |
|
}, |
|
{ |
|
"epoch": 49.0, |
|
"grad_norm": 0.4307897090911865, |
|
"learning_rate": 2.5500000000000003e-05, |
|
"loss": 0.0561, |
|
"step": 5194 |
|
}, |
|
{ |
|
"epoch": 49.0, |
|
"eval_LOCATION_f1": 0.882758620689655, |
|
"eval_LOCATION_number": 69, |
|
"eval_LOCATION_precision": 0.8421052631578947, |
|
"eval_LOCATION_recall": 0.927536231884058, |
|
"eval_ORGANIZATION_f1": 0.7301587301587301, |
|
"eval_ORGANIZATION_number": 58, |
|
"eval_ORGANIZATION_precision": 0.6764705882352942, |
|
"eval_ORGANIZATION_recall": 0.7931034482758621, |
|
"eval_PERSON_f1": 0.8679245283018868, |
|
"eval_PERSON_number": 152, |
|
"eval_PERSON_precision": 0.8313253012048193, |
|
"eval_PERSON_recall": 0.9078947368421053, |
|
"eval_QUANTITY_f1": 0.78125, |
|
"eval_QUANTITY_number": 30, |
|
"eval_QUANTITY_precision": 0.7352941176470589, |
|
"eval_QUANTITY_recall": 0.8333333333333334, |
|
"eval_TIME_f1": 0.8813559322033899, |
|
"eval_TIME_number": 29, |
|
"eval_TIME_precision": 0.8666666666666667, |
|
"eval_TIME_recall": 0.896551724137931, |
|
"eval_loss": 0.13861991465091705, |
|
"eval_overall_accuracy": 0.9649167733674776, |
|
"eval_overall_f1": 0.8398876404494382, |
|
"eval_overall_precision": 0.7994652406417112, |
|
"eval_overall_recall": 0.8846153846153846, |
|
"eval_runtime": 0.2889, |
|
"eval_samples_per_second": 647.316, |
|
"eval_steps_per_second": 10.385, |
|
"step": 5194 |
|
}, |
|
{ |
|
"epoch": 50.0, |
|
"grad_norm": 0.8664003014564514, |
|
"learning_rate": 2.5e-05, |
|
"loss": 0.0544, |
|
"step": 5300 |
|
}, |
|
{ |
|
"epoch": 50.0, |
|
"eval_LOCATION_f1": 0.8749999999999999, |
|
"eval_LOCATION_number": 69, |
|
"eval_LOCATION_precision": 0.84, |
|
"eval_LOCATION_recall": 0.9130434782608695, |
|
"eval_ORGANIZATION_f1": 0.736, |
|
"eval_ORGANIZATION_number": 58, |
|
"eval_ORGANIZATION_precision": 0.6865671641791045, |
|
"eval_ORGANIZATION_recall": 0.7931034482758621, |
|
"eval_PERSON_f1": 0.8471337579617835, |
|
"eval_PERSON_number": 152, |
|
"eval_PERSON_precision": 0.8209876543209876, |
|
"eval_PERSON_recall": 0.875, |
|
"eval_QUANTITY_f1": 0.7936507936507938, |
|
"eval_QUANTITY_number": 30, |
|
"eval_QUANTITY_precision": 0.7575757575757576, |
|
"eval_QUANTITY_recall": 0.8333333333333334, |
|
"eval_TIME_f1": 0.8813559322033899, |
|
"eval_TIME_number": 29, |
|
"eval_TIME_precision": 0.8666666666666667, |
|
"eval_TIME_recall": 0.896551724137931, |
|
"eval_loss": 0.13451269268989563, |
|
"eval_overall_accuracy": 0.9651728553137003, |
|
"eval_overall_f1": 0.8312056737588652, |
|
"eval_overall_precision": 0.7983651226158038, |
|
"eval_overall_recall": 0.8668639053254438, |
|
"eval_runtime": 0.2869, |
|
"eval_samples_per_second": 651.752, |
|
"eval_steps_per_second": 10.456, |
|
"step": 5300 |
|
}, |
|
{ |
|
"epoch": 51.0, |
|
"grad_norm": 3.4700815677642822, |
|
"learning_rate": 2.45e-05, |
|
"loss": 0.0534, |
|
"step": 5406 |
|
}, |
|
{ |
|
"epoch": 51.0, |
|
"eval_LOCATION_f1": 0.8767123287671235, |
|
"eval_LOCATION_number": 69, |
|
"eval_LOCATION_precision": 0.8311688311688312, |
|
"eval_LOCATION_recall": 0.927536231884058, |
|
"eval_ORGANIZATION_f1": 0.7692307692307692, |
|
"eval_ORGANIZATION_number": 58, |
|
"eval_ORGANIZATION_precision": 0.6944444444444444, |
|
"eval_ORGANIZATION_recall": 0.8620689655172413, |
|
"eval_PERSON_f1": 0.8634920634920634, |
|
"eval_PERSON_number": 152, |
|
"eval_PERSON_precision": 0.8343558282208589, |
|
"eval_PERSON_recall": 0.8947368421052632, |
|
"eval_QUANTITY_f1": 0.7936507936507938, |
|
"eval_QUANTITY_number": 30, |
|
"eval_QUANTITY_precision": 0.7575757575757576, |
|
"eval_QUANTITY_recall": 0.8333333333333334, |
|
"eval_TIME_f1": 0.847457627118644, |
|
"eval_TIME_number": 29, |
|
"eval_TIME_precision": 0.8333333333333334, |
|
"eval_TIME_recall": 0.8620689655172413, |
|
"eval_loss": 0.13688045740127563, |
|
"eval_overall_accuracy": 0.9651728553137003, |
|
"eval_overall_f1": 0.841514726507714, |
|
"eval_overall_precision": 0.8, |
|
"eval_overall_recall": 0.8875739644970414, |
|
"eval_runtime": 0.2922, |
|
"eval_samples_per_second": 640.064, |
|
"eval_steps_per_second": 10.268, |
|
"step": 5406 |
|
}, |
|
{ |
|
"epoch": 52.0, |
|
"grad_norm": 1.2102717161178589, |
|
"learning_rate": 2.4e-05, |
|
"loss": 0.0521, |
|
"step": 5512 |
|
}, |
|
{ |
|
"epoch": 52.0, |
|
"eval_LOCATION_f1": 0.8648648648648648, |
|
"eval_LOCATION_number": 69, |
|
"eval_LOCATION_precision": 0.810126582278481, |
|
"eval_LOCATION_recall": 0.927536231884058, |
|
"eval_ORGANIZATION_f1": 0.7669172932330827, |
|
"eval_ORGANIZATION_number": 58, |
|
"eval_ORGANIZATION_precision": 0.68, |
|
"eval_ORGANIZATION_recall": 0.8793103448275862, |
|
"eval_PERSON_f1": 0.8643533123028391, |
|
"eval_PERSON_number": 152, |
|
"eval_PERSON_precision": 0.8303030303030303, |
|
"eval_PERSON_recall": 0.9013157894736842, |
|
"eval_QUANTITY_f1": 0.78125, |
|
"eval_QUANTITY_number": 30, |
|
"eval_QUANTITY_precision": 0.7352941176470589, |
|
"eval_QUANTITY_recall": 0.8333333333333334, |
|
"eval_TIME_f1": 0.7999999999999999, |
|
"eval_TIME_number": 29, |
|
"eval_TIME_precision": 0.7741935483870968, |
|
"eval_TIME_recall": 0.8275862068965517, |
|
"eval_loss": 0.14608342945575714, |
|
"eval_overall_accuracy": 0.9628681177976952, |
|
"eval_overall_f1": 0.8337950138504154, |
|
"eval_overall_precision": 0.7838541666666666, |
|
"eval_overall_recall": 0.8905325443786982, |
|
"eval_runtime": 0.2926, |
|
"eval_samples_per_second": 639.189, |
|
"eval_steps_per_second": 10.254, |
|
"step": 5512 |
|
}, |
|
{ |
|
"epoch": 53.0, |
|
"grad_norm": 1.385406732559204, |
|
"learning_rate": 2.35e-05, |
|
"loss": 0.0524, |
|
"step": 5618 |
|
}, |
|
{ |
|
"epoch": 53.0, |
|
"eval_LOCATION_f1": 0.870748299319728, |
|
"eval_LOCATION_number": 69, |
|
"eval_LOCATION_precision": 0.8205128205128205, |
|
"eval_LOCATION_recall": 0.927536231884058, |
|
"eval_ORGANIZATION_f1": 0.768, |
|
"eval_ORGANIZATION_number": 58, |
|
"eval_ORGANIZATION_precision": 0.7164179104477612, |
|
"eval_ORGANIZATION_recall": 0.8275862068965517, |
|
"eval_PERSON_f1": 0.8670886075949367, |
|
"eval_PERSON_number": 152, |
|
"eval_PERSON_precision": 0.8353658536585366, |
|
"eval_PERSON_recall": 0.9013157894736842, |
|
"eval_QUANTITY_f1": 0.7936507936507938, |
|
"eval_QUANTITY_number": 30, |
|
"eval_QUANTITY_precision": 0.7575757575757576, |
|
"eval_QUANTITY_recall": 0.8333333333333334, |
|
"eval_TIME_f1": 0.8333333333333334, |
|
"eval_TIME_number": 29, |
|
"eval_TIME_precision": 0.8064516129032258, |
|
"eval_TIME_recall": 0.8620689655172413, |
|
"eval_loss": 0.1376073956489563, |
|
"eval_overall_accuracy": 0.9656850192061459, |
|
"eval_overall_f1": 0.8410689170182841, |
|
"eval_overall_precision": 0.8016085790884718, |
|
"eval_overall_recall": 0.8846153846153846, |
|
"eval_runtime": 0.2926, |
|
"eval_samples_per_second": 639.014, |
|
"eval_steps_per_second": 10.252, |
|
"step": 5618 |
|
}, |
|
{ |
|
"epoch": 54.0, |
|
"grad_norm": 0.37542441487312317, |
|
"learning_rate": 2.3000000000000003e-05, |
|
"loss": 0.0494, |
|
"step": 5724 |
|
}, |
|
{ |
|
"epoch": 54.0, |
|
"eval_LOCATION_f1": 0.882758620689655, |
|
"eval_LOCATION_number": 69, |
|
"eval_LOCATION_precision": 0.8421052631578947, |
|
"eval_LOCATION_recall": 0.927536231884058, |
|
"eval_ORGANIZATION_f1": 0.7401574803149606, |
|
"eval_ORGANIZATION_number": 58, |
|
"eval_ORGANIZATION_precision": 0.6811594202898551, |
|
"eval_ORGANIZATION_recall": 0.8103448275862069, |
|
"eval_PERSON_f1": 0.8670886075949367, |
|
"eval_PERSON_number": 152, |
|
"eval_PERSON_precision": 0.8353658536585366, |
|
"eval_PERSON_recall": 0.9013157894736842, |
|
"eval_QUANTITY_f1": 0.8125, |
|
"eval_QUANTITY_number": 30, |
|
"eval_QUANTITY_precision": 0.7647058823529411, |
|
"eval_QUANTITY_recall": 0.8666666666666667, |
|
"eval_TIME_f1": 0.8333333333333334, |
|
"eval_TIME_number": 29, |
|
"eval_TIME_precision": 0.8064516129032258, |
|
"eval_TIME_recall": 0.8620689655172413, |
|
"eval_loss": 0.14096996188163757, |
|
"eval_overall_accuracy": 0.9659411011523688, |
|
"eval_overall_f1": 0.8398876404494382, |
|
"eval_overall_precision": 0.7994652406417112, |
|
"eval_overall_recall": 0.8846153846153846, |
|
"eval_runtime": 0.2945, |
|
"eval_samples_per_second": 635.027, |
|
"eval_steps_per_second": 10.188, |
|
"step": 5724 |
|
}, |
|
{ |
|
"epoch": 55.0, |
|
"grad_norm": 2.3441622257232666, |
|
"learning_rate": 2.25e-05, |
|
"loss": 0.0516, |
|
"step": 5830 |
|
}, |
|
{ |
|
"epoch": 55.0, |
|
"eval_LOCATION_f1": 0.882758620689655, |
|
"eval_LOCATION_number": 69, |
|
"eval_LOCATION_precision": 0.8421052631578947, |
|
"eval_LOCATION_recall": 0.927536231884058, |
|
"eval_ORGANIZATION_f1": 0.7559055118110236, |
|
"eval_ORGANIZATION_number": 58, |
|
"eval_ORGANIZATION_precision": 0.6956521739130435, |
|
"eval_ORGANIZATION_recall": 0.8275862068965517, |
|
"eval_PERSON_f1": 0.8670886075949367, |
|
"eval_PERSON_number": 152, |
|
"eval_PERSON_precision": 0.8353658536585366, |
|
"eval_PERSON_recall": 0.9013157894736842, |
|
"eval_QUANTITY_f1": 0.8125, |
|
"eval_QUANTITY_number": 30, |
|
"eval_QUANTITY_precision": 0.7647058823529411, |
|
"eval_QUANTITY_recall": 0.8666666666666667, |
|
"eval_TIME_f1": 0.8666666666666666, |
|
"eval_TIME_number": 29, |
|
"eval_TIME_precision": 0.8387096774193549, |
|
"eval_TIME_recall": 0.896551724137931, |
|
"eval_loss": 0.13822495937347412, |
|
"eval_overall_accuracy": 0.9659411011523688, |
|
"eval_overall_f1": 0.8455056179775281, |
|
"eval_overall_precision": 0.8048128342245989, |
|
"eval_overall_recall": 0.8905325443786982, |
|
"eval_runtime": 0.2928, |
|
"eval_samples_per_second": 638.657, |
|
"eval_steps_per_second": 10.246, |
|
"step": 5830 |
|
}, |
|
{ |
|
"epoch": 56.0, |
|
"grad_norm": 0.9206390976905823, |
|
"learning_rate": 2.2000000000000003e-05, |
|
"loss": 0.0497, |
|
"step": 5936 |
|
}, |
|
{ |
|
"epoch": 56.0, |
|
"eval_LOCATION_f1": 0.8767123287671235, |
|
"eval_LOCATION_number": 69, |
|
"eval_LOCATION_precision": 0.8311688311688312, |
|
"eval_LOCATION_recall": 0.927536231884058, |
|
"eval_ORGANIZATION_f1": 0.7200000000000001, |
|
"eval_ORGANIZATION_number": 58, |
|
"eval_ORGANIZATION_precision": 0.6716417910447762, |
|
"eval_ORGANIZATION_recall": 0.7758620689655172, |
|
"eval_PERSON_f1": 0.8571428571428571, |
|
"eval_PERSON_number": 152, |
|
"eval_PERSON_precision": 0.8282208588957055, |
|
"eval_PERSON_recall": 0.8881578947368421, |
|
"eval_QUANTITY_f1": 0.8125, |
|
"eval_QUANTITY_number": 30, |
|
"eval_QUANTITY_precision": 0.7647058823529411, |
|
"eval_QUANTITY_recall": 0.8666666666666667, |
|
"eval_TIME_f1": 0.8666666666666666, |
|
"eval_TIME_number": 29, |
|
"eval_TIME_precision": 0.8387096774193549, |
|
"eval_TIME_recall": 0.896551724137931, |
|
"eval_loss": 0.13933928310871124, |
|
"eval_overall_accuracy": 0.9654289372599232, |
|
"eval_overall_f1": 0.8338028169014083, |
|
"eval_overall_precision": 0.7956989247311828, |
|
"eval_overall_recall": 0.8757396449704142, |
|
"eval_runtime": 0.293, |
|
"eval_samples_per_second": 638.123, |
|
"eval_steps_per_second": 10.237, |
|
"step": 5936 |
|
}, |
|
{ |
|
"epoch": 57.0, |
|
"grad_norm": 0.8336784839630127, |
|
"learning_rate": 2.15e-05, |
|
"loss": 0.048, |
|
"step": 6042 |
|
}, |
|
{ |
|
"epoch": 57.0, |
|
"eval_LOCATION_f1": 0.8648648648648648, |
|
"eval_LOCATION_number": 69, |
|
"eval_LOCATION_precision": 0.810126582278481, |
|
"eval_LOCATION_recall": 0.927536231884058, |
|
"eval_ORGANIZATION_f1": 0.752, |
|
"eval_ORGANIZATION_number": 58, |
|
"eval_ORGANIZATION_precision": 0.7014925373134329, |
|
"eval_ORGANIZATION_recall": 0.8103448275862069, |
|
"eval_PERSON_f1": 0.8580441640378549, |
|
"eval_PERSON_number": 152, |
|
"eval_PERSON_precision": 0.8242424242424242, |
|
"eval_PERSON_recall": 0.8947368421052632, |
|
"eval_QUANTITY_f1": 0.8125, |
|
"eval_QUANTITY_number": 30, |
|
"eval_QUANTITY_precision": 0.7647058823529411, |
|
"eval_QUANTITY_recall": 0.8666666666666667, |
|
"eval_TIME_f1": 0.8333333333333334, |
|
"eval_TIME_number": 29, |
|
"eval_TIME_precision": 0.8064516129032258, |
|
"eval_TIME_recall": 0.8620689655172413, |
|
"eval_loss": 0.14417044818401337, |
|
"eval_overall_accuracy": 0.9649167733674776, |
|
"eval_overall_f1": 0.8347338935574229, |
|
"eval_overall_precision": 0.7925531914893617, |
|
"eval_overall_recall": 0.8816568047337278, |
|
"eval_runtime": 0.2919, |
|
"eval_samples_per_second": 640.597, |
|
"eval_steps_per_second": 10.277, |
|
"step": 6042 |
|
}, |
|
{ |
|
"epoch": 58.0, |
|
"grad_norm": 1.4807782173156738, |
|
"learning_rate": 2.1e-05, |
|
"loss": 0.0474, |
|
"step": 6148 |
|
}, |
|
{ |
|
"epoch": 58.0, |
|
"eval_LOCATION_f1": 0.8767123287671235, |
|
"eval_LOCATION_number": 69, |
|
"eval_LOCATION_precision": 0.8311688311688312, |
|
"eval_LOCATION_recall": 0.927536231884058, |
|
"eval_ORGANIZATION_f1": 0.7480916030534351, |
|
"eval_ORGANIZATION_number": 58, |
|
"eval_ORGANIZATION_precision": 0.6712328767123288, |
|
"eval_ORGANIZATION_recall": 0.8448275862068966, |
|
"eval_PERSON_f1": 0.8589341692789968, |
|
"eval_PERSON_number": 152, |
|
"eval_PERSON_precision": 0.8203592814371258, |
|
"eval_PERSON_recall": 0.9013157894736842, |
|
"eval_QUANTITY_f1": 0.7936507936507938, |
|
"eval_QUANTITY_number": 30, |
|
"eval_QUANTITY_precision": 0.7575757575757576, |
|
"eval_QUANTITY_recall": 0.8333333333333334, |
|
"eval_TIME_f1": 0.8666666666666666, |
|
"eval_TIME_number": 29, |
|
"eval_TIME_precision": 0.8387096774193549, |
|
"eval_TIME_recall": 0.896551724137931, |
|
"eval_loss": 0.14203424751758575, |
|
"eval_overall_accuracy": 0.9646606914212548, |
|
"eval_overall_f1": 0.8372739916550764, |
|
"eval_overall_precision": 0.7900262467191601, |
|
"eval_overall_recall": 0.8905325443786982, |
|
"eval_runtime": 0.2926, |
|
"eval_samples_per_second": 639.123, |
|
"eval_steps_per_second": 10.253, |
|
"step": 6148 |
|
}, |
|
{ |
|
"epoch": 59.0, |
|
"grad_norm": 1.1692790985107422, |
|
"learning_rate": 2.05e-05, |
|
"loss": 0.0447, |
|
"step": 6254 |
|
}, |
|
{ |
|
"epoch": 59.0, |
|
"eval_LOCATION_f1": 0.8767123287671235, |
|
"eval_LOCATION_number": 69, |
|
"eval_LOCATION_precision": 0.8311688311688312, |
|
"eval_LOCATION_recall": 0.927536231884058, |
|
"eval_ORGANIZATION_f1": 0.75, |
|
"eval_ORGANIZATION_number": 58, |
|
"eval_ORGANIZATION_precision": 0.6857142857142857, |
|
"eval_ORGANIZATION_recall": 0.8275862068965517, |
|
"eval_PERSON_f1": 0.8643533123028391, |
|
"eval_PERSON_number": 152, |
|
"eval_PERSON_precision": 0.8303030303030303, |
|
"eval_PERSON_recall": 0.9013157894736842, |
|
"eval_QUANTITY_f1": 0.78125, |
|
"eval_QUANTITY_number": 30, |
|
"eval_QUANTITY_precision": 0.7352941176470589, |
|
"eval_QUANTITY_recall": 0.8333333333333334, |
|
"eval_TIME_f1": 0.8333333333333334, |
|
"eval_TIME_number": 29, |
|
"eval_TIME_precision": 0.8064516129032258, |
|
"eval_TIME_recall": 0.8620689655172413, |
|
"eval_loss": 0.1469813734292984, |
|
"eval_overall_accuracy": 0.9646606914212548, |
|
"eval_overall_f1": 0.8363636363636363, |
|
"eval_overall_precision": 0.7931034482758621, |
|
"eval_overall_recall": 0.8846153846153846, |
|
"eval_runtime": 0.293, |
|
"eval_samples_per_second": 638.282, |
|
"eval_steps_per_second": 10.24, |
|
"step": 6254 |
|
}, |
|
{ |
|
"epoch": 60.0, |
|
"grad_norm": 0.8121991157531738, |
|
"learning_rate": 2e-05, |
|
"loss": 0.045, |
|
"step": 6360 |
|
}, |
|
{ |
|
"epoch": 60.0, |
|
"eval_LOCATION_f1": 0.870748299319728, |
|
"eval_LOCATION_number": 69, |
|
"eval_LOCATION_precision": 0.8205128205128205, |
|
"eval_LOCATION_recall": 0.927536231884058, |
|
"eval_ORGANIZATION_f1": 0.7301587301587301, |
|
"eval_ORGANIZATION_number": 58, |
|
"eval_ORGANIZATION_precision": 0.6764705882352942, |
|
"eval_ORGANIZATION_recall": 0.7931034482758621, |
|
"eval_PERSON_f1": 0.860759493670886, |
|
"eval_PERSON_number": 152, |
|
"eval_PERSON_precision": 0.8292682926829268, |
|
"eval_PERSON_recall": 0.8947368421052632, |
|
"eval_QUANTITY_f1": 0.8125, |
|
"eval_QUANTITY_number": 30, |
|
"eval_QUANTITY_precision": 0.7647058823529411, |
|
"eval_QUANTITY_recall": 0.8666666666666667, |
|
"eval_TIME_f1": 0.8333333333333334, |
|
"eval_TIME_number": 29, |
|
"eval_TIME_precision": 0.8064516129032258, |
|
"eval_TIME_recall": 0.8620689655172413, |
|
"eval_loss": 0.14526785910129547, |
|
"eval_overall_accuracy": 0.9649167733674776, |
|
"eval_overall_f1": 0.8330995792426368, |
|
"eval_overall_precision": 0.792, |
|
"eval_overall_recall": 0.878698224852071, |
|
"eval_runtime": 0.2933, |
|
"eval_samples_per_second": 637.529, |
|
"eval_steps_per_second": 10.228, |
|
"step": 6360 |
|
}, |
|
{ |
|
"epoch": 61.0, |
|
"grad_norm": 0.9558350443840027, |
|
"learning_rate": 1.9500000000000003e-05, |
|
"loss": 0.0441, |
|
"step": 6466 |
|
}, |
|
{ |
|
"epoch": 61.0, |
|
"eval_LOCATION_f1": 0.8749999999999999, |
|
"eval_LOCATION_number": 69, |
|
"eval_LOCATION_precision": 0.84, |
|
"eval_LOCATION_recall": 0.9130434782608695, |
|
"eval_ORGANIZATION_f1": 0.7244094488188977, |
|
"eval_ORGANIZATION_number": 58, |
|
"eval_ORGANIZATION_precision": 0.6666666666666666, |
|
"eval_ORGANIZATION_recall": 0.7931034482758621, |
|
"eval_PERSON_f1": 0.8634920634920634, |
|
"eval_PERSON_number": 152, |
|
"eval_PERSON_precision": 0.8343558282208589, |
|
"eval_PERSON_recall": 0.8947368421052632, |
|
"eval_QUANTITY_f1": 0.7936507936507938, |
|
"eval_QUANTITY_number": 30, |
|
"eval_QUANTITY_precision": 0.7575757575757576, |
|
"eval_QUANTITY_recall": 0.8333333333333334, |
|
"eval_TIME_f1": 0.8666666666666666, |
|
"eval_TIME_number": 29, |
|
"eval_TIME_precision": 0.8387096774193549, |
|
"eval_TIME_recall": 0.896551724137931, |
|
"eval_loss": 0.1430891752243042, |
|
"eval_overall_accuracy": 0.9649167733674776, |
|
"eval_overall_f1": 0.8349788434414668, |
|
"eval_overall_precision": 0.7978436657681941, |
|
"eval_overall_recall": 0.8757396449704142, |
|
"eval_runtime": 0.286, |
|
"eval_samples_per_second": 653.776, |
|
"eval_steps_per_second": 10.488, |
|
"step": 6466 |
|
}, |
|
{ |
|
"epoch": 62.0, |
|
"grad_norm": 1.2547602653503418, |
|
"learning_rate": 1.9e-05, |
|
"loss": 0.0474, |
|
"step": 6572 |
|
}, |
|
{ |
|
"epoch": 62.0, |
|
"eval_LOCATION_f1": 0.8767123287671235, |
|
"eval_LOCATION_number": 69, |
|
"eval_LOCATION_precision": 0.8311688311688312, |
|
"eval_LOCATION_recall": 0.927536231884058, |
|
"eval_ORGANIZATION_f1": 0.71875, |
|
"eval_ORGANIZATION_number": 58, |
|
"eval_ORGANIZATION_precision": 0.6571428571428571, |
|
"eval_ORGANIZATION_recall": 0.7931034482758621, |
|
"eval_PERSON_f1": 0.8616352201257862, |
|
"eval_PERSON_number": 152, |
|
"eval_PERSON_precision": 0.8253012048192772, |
|
"eval_PERSON_recall": 0.9013157894736842, |
|
"eval_QUANTITY_f1": 0.7936507936507938, |
|
"eval_QUANTITY_number": 30, |
|
"eval_QUANTITY_precision": 0.7575757575757576, |
|
"eval_QUANTITY_recall": 0.8333333333333334, |
|
"eval_TIME_f1": 0.8333333333333334, |
|
"eval_TIME_number": 29, |
|
"eval_TIME_precision": 0.8064516129032258, |
|
"eval_TIME_recall": 0.8620689655172413, |
|
"eval_loss": 0.1453644037246704, |
|
"eval_overall_accuracy": 0.9646606914212548, |
|
"eval_overall_f1": 0.8307692307692308, |
|
"eval_overall_precision": 0.7877984084880637, |
|
"eval_overall_recall": 0.878698224852071, |
|
"eval_runtime": 0.286, |
|
"eval_samples_per_second": 653.787, |
|
"eval_steps_per_second": 10.489, |
|
"step": 6572 |
|
}, |
|
{ |
|
"epoch": 63.0, |
|
"grad_norm": 0.2882705628871918, |
|
"learning_rate": 1.85e-05, |
|
"loss": 0.0441, |
|
"step": 6678 |
|
}, |
|
{ |
|
"epoch": 63.0, |
|
"eval_LOCATION_f1": 0.8767123287671235, |
|
"eval_LOCATION_number": 69, |
|
"eval_LOCATION_precision": 0.8311688311688312, |
|
"eval_LOCATION_recall": 0.927536231884058, |
|
"eval_ORGANIZATION_f1": 0.7258064516129032, |
|
"eval_ORGANIZATION_number": 58, |
|
"eval_ORGANIZATION_precision": 0.6818181818181818, |
|
"eval_ORGANIZATION_recall": 0.7758620689655172, |
|
"eval_PERSON_f1": 0.8706624605678233, |
|
"eval_PERSON_number": 152, |
|
"eval_PERSON_precision": 0.8363636363636363, |
|
"eval_PERSON_recall": 0.9078947368421053, |
|
"eval_QUANTITY_f1": 0.78125, |
|
"eval_QUANTITY_number": 30, |
|
"eval_QUANTITY_precision": 0.7352941176470589, |
|
"eval_QUANTITY_recall": 0.8333333333333334, |
|
"eval_TIME_f1": 0.8666666666666666, |
|
"eval_TIME_number": 29, |
|
"eval_TIME_precision": 0.8387096774193549, |
|
"eval_TIME_recall": 0.896551724137931, |
|
"eval_loss": 0.14318965375423431, |
|
"eval_overall_accuracy": 0.9651728553137003, |
|
"eval_overall_f1": 0.8382559774964837, |
|
"eval_overall_precision": 0.7989276139410187, |
|
"eval_overall_recall": 0.8816568047337278, |
|
"eval_runtime": 0.2869, |
|
"eval_samples_per_second": 651.819, |
|
"eval_steps_per_second": 10.457, |
|
"step": 6678 |
|
}, |
|
{ |
|
"epoch": 64.0, |
|
"grad_norm": 1.046625018119812, |
|
"learning_rate": 1.8e-05, |
|
"loss": 0.0449, |
|
"step": 6784 |
|
}, |
|
{ |
|
"epoch": 64.0, |
|
"eval_LOCATION_f1": 0.8590604026845639, |
|
"eval_LOCATION_number": 69, |
|
"eval_LOCATION_precision": 0.8, |
|
"eval_LOCATION_recall": 0.927536231884058, |
|
"eval_ORGANIZATION_f1": 0.7034482758620689, |
|
"eval_ORGANIZATION_number": 58, |
|
"eval_ORGANIZATION_precision": 0.5862068965517241, |
|
"eval_ORGANIZATION_recall": 0.8793103448275862, |
|
"eval_PERSON_f1": 0.8598130841121495, |
|
"eval_PERSON_number": 152, |
|
"eval_PERSON_precision": 0.8165680473372781, |
|
"eval_PERSON_recall": 0.9078947368421053, |
|
"eval_QUANTITY_f1": 0.7575757575757577, |
|
"eval_QUANTITY_number": 30, |
|
"eval_QUANTITY_precision": 0.6944444444444444, |
|
"eval_QUANTITY_recall": 0.8333333333333334, |
|
"eval_TIME_f1": 0.8333333333333334, |
|
"eval_TIME_number": 29, |
|
"eval_TIME_precision": 0.8064516129032258, |
|
"eval_TIME_recall": 0.8620689655172413, |
|
"eval_loss": 0.16219820082187653, |
|
"eval_overall_accuracy": 0.9590268886043534, |
|
"eval_overall_f1": 0.8178137651821863, |
|
"eval_overall_precision": 0.7518610421836228, |
|
"eval_overall_recall": 0.8964497041420119, |
|
"eval_runtime": 0.2859, |
|
"eval_samples_per_second": 654.058, |
|
"eval_steps_per_second": 10.493, |
|
"step": 6784 |
|
}, |
|
{ |
|
"epoch": 65.0, |
|
"grad_norm": 1.8243094682693481, |
|
"learning_rate": 1.75e-05, |
|
"loss": 0.0452, |
|
"step": 6890 |
|
}, |
|
{ |
|
"epoch": 65.0, |
|
"eval_LOCATION_f1": 0.882758620689655, |
|
"eval_LOCATION_number": 69, |
|
"eval_LOCATION_precision": 0.8421052631578947, |
|
"eval_LOCATION_recall": 0.927536231884058, |
|
"eval_ORGANIZATION_f1": 0.7424242424242424, |
|
"eval_ORGANIZATION_number": 58, |
|
"eval_ORGANIZATION_precision": 0.6621621621621622, |
|
"eval_ORGANIZATION_recall": 0.8448275862068966, |
|
"eval_PERSON_f1": 0.85625, |
|
"eval_PERSON_number": 152, |
|
"eval_PERSON_precision": 0.8154761904761905, |
|
"eval_PERSON_recall": 0.9013157894736842, |
|
"eval_QUANTITY_f1": 0.78125, |
|
"eval_QUANTITY_number": 30, |
|
"eval_QUANTITY_precision": 0.7352941176470589, |
|
"eval_QUANTITY_recall": 0.8333333333333334, |
|
"eval_TIME_f1": 0.8666666666666666, |
|
"eval_TIME_number": 29, |
|
"eval_TIME_precision": 0.8387096774193549, |
|
"eval_TIME_recall": 0.896551724137931, |
|
"eval_loss": 0.14889490604400635, |
|
"eval_overall_accuracy": 0.9638924455825865, |
|
"eval_overall_f1": 0.8349514563106797, |
|
"eval_overall_precision": 0.7859007832898173, |
|
"eval_overall_recall": 0.8905325443786982, |
|
"eval_runtime": 0.2885, |
|
"eval_samples_per_second": 648.163, |
|
"eval_steps_per_second": 10.398, |
|
"step": 6890 |
|
}, |
|
{ |
|
"epoch": 66.0, |
|
"grad_norm": 0.7773322463035583, |
|
"learning_rate": 1.7000000000000003e-05, |
|
"loss": 0.0418, |
|
"step": 6996 |
|
}, |
|
{ |
|
"epoch": 66.0, |
|
"eval_LOCATION_f1": 0.8767123287671235, |
|
"eval_LOCATION_number": 69, |
|
"eval_LOCATION_precision": 0.8311688311688312, |
|
"eval_LOCATION_recall": 0.927536231884058, |
|
"eval_ORGANIZATION_f1": 0.7480916030534351, |
|
"eval_ORGANIZATION_number": 58, |
|
"eval_ORGANIZATION_precision": 0.6712328767123288, |
|
"eval_ORGANIZATION_recall": 0.8448275862068966, |
|
"eval_PERSON_f1": 0.8625, |
|
"eval_PERSON_number": 152, |
|
"eval_PERSON_precision": 0.8214285714285714, |
|
"eval_PERSON_recall": 0.9078947368421053, |
|
"eval_QUANTITY_f1": 0.78125, |
|
"eval_QUANTITY_number": 30, |
|
"eval_QUANTITY_precision": 0.7352941176470589, |
|
"eval_QUANTITY_recall": 0.8333333333333334, |
|
"eval_TIME_f1": 0.8333333333333334, |
|
"eval_TIME_number": 29, |
|
"eval_TIME_precision": 0.8064516129032258, |
|
"eval_TIME_recall": 0.8620689655172413, |
|
"eval_loss": 0.15430662035942078, |
|
"eval_overall_accuracy": 0.9638924455825865, |
|
"eval_overall_f1": 0.8349514563106797, |
|
"eval_overall_precision": 0.7859007832898173, |
|
"eval_overall_recall": 0.8905325443786982, |
|
"eval_runtime": 0.2923, |
|
"eval_samples_per_second": 639.682, |
|
"eval_steps_per_second": 10.262, |
|
"step": 6996 |
|
}, |
|
{ |
|
"epoch": 67.0, |
|
"grad_norm": 0.9151946306228638, |
|
"learning_rate": 1.65e-05, |
|
"loss": 0.0421, |
|
"step": 7102 |
|
}, |
|
{ |
|
"epoch": 67.0, |
|
"eval_LOCATION_f1": 0.870748299319728, |
|
"eval_LOCATION_number": 69, |
|
"eval_LOCATION_precision": 0.8205128205128205, |
|
"eval_LOCATION_recall": 0.927536231884058, |
|
"eval_ORGANIZATION_f1": 0.7538461538461538, |
|
"eval_ORGANIZATION_number": 58, |
|
"eval_ORGANIZATION_precision": 0.6805555555555556, |
|
"eval_ORGANIZATION_recall": 0.8448275862068966, |
|
"eval_PERSON_f1": 0.8589341692789968, |
|
"eval_PERSON_number": 152, |
|
"eval_PERSON_precision": 0.8203592814371258, |
|
"eval_PERSON_recall": 0.9013157894736842, |
|
"eval_QUANTITY_f1": 0.7692307692307692, |
|
"eval_QUANTITY_number": 30, |
|
"eval_QUANTITY_precision": 0.7142857142857143, |
|
"eval_QUANTITY_recall": 0.8333333333333334, |
|
"eval_TIME_f1": 0.8333333333333334, |
|
"eval_TIME_number": 29, |
|
"eval_TIME_precision": 0.8064516129032258, |
|
"eval_TIME_recall": 0.8620689655172413, |
|
"eval_loss": 0.15378881990909576, |
|
"eval_overall_accuracy": 0.963124199743918, |
|
"eval_overall_f1": 0.8321775312066575, |
|
"eval_overall_precision": 0.783289817232376, |
|
"eval_overall_recall": 0.8875739644970414, |
|
"eval_runtime": 0.2921, |
|
"eval_samples_per_second": 640.251, |
|
"eval_steps_per_second": 10.271, |
|
"step": 7102 |
|
}, |
|
{ |
|
"epoch": 68.0, |
|
"grad_norm": 0.4768742322921753, |
|
"learning_rate": 1.6000000000000003e-05, |
|
"loss": 0.041, |
|
"step": 7208 |
|
}, |
|
{ |
|
"epoch": 68.0, |
|
"eval_LOCATION_f1": 0.8767123287671235, |
|
"eval_LOCATION_number": 69, |
|
"eval_LOCATION_precision": 0.8311688311688312, |
|
"eval_LOCATION_recall": 0.927536231884058, |
|
"eval_ORGANIZATION_f1": 0.7518796992481203, |
|
"eval_ORGANIZATION_number": 58, |
|
"eval_ORGANIZATION_precision": 0.6666666666666666, |
|
"eval_ORGANIZATION_recall": 0.8620689655172413, |
|
"eval_PERSON_f1": 0.8580441640378549, |
|
"eval_PERSON_number": 152, |
|
"eval_PERSON_precision": 0.8242424242424242, |
|
"eval_PERSON_recall": 0.8947368421052632, |
|
"eval_QUANTITY_f1": 0.7384615384615385, |
|
"eval_QUANTITY_number": 30, |
|
"eval_QUANTITY_precision": 0.6857142857142857, |
|
"eval_QUANTITY_recall": 0.8, |
|
"eval_TIME_f1": 0.8333333333333334, |
|
"eval_TIME_number": 29, |
|
"eval_TIME_precision": 0.8064516129032258, |
|
"eval_TIME_recall": 0.8620689655172413, |
|
"eval_loss": 0.15490765869617462, |
|
"eval_overall_accuracy": 0.9626120358514725, |
|
"eval_overall_f1": 0.8294036061026352, |
|
"eval_overall_precision": 0.7806788511749347, |
|
"eval_overall_recall": 0.8846153846153846, |
|
"eval_runtime": 0.2858, |
|
"eval_samples_per_second": 654.293, |
|
"eval_steps_per_second": 10.497, |
|
"step": 7208 |
|
}, |
|
{ |
|
"epoch": 69.0, |
|
"grad_norm": 1.6758042573928833, |
|
"learning_rate": 1.55e-05, |
|
"loss": 0.0411, |
|
"step": 7314 |
|
}, |
|
{ |
|
"epoch": 69.0, |
|
"eval_LOCATION_f1": 0.882758620689655, |
|
"eval_LOCATION_number": 69, |
|
"eval_LOCATION_precision": 0.8421052631578947, |
|
"eval_LOCATION_recall": 0.927536231884058, |
|
"eval_ORGANIZATION_f1": 0.7401574803149606, |
|
"eval_ORGANIZATION_number": 58, |
|
"eval_ORGANIZATION_precision": 0.6811594202898551, |
|
"eval_ORGANIZATION_recall": 0.8103448275862069, |
|
"eval_PERSON_f1": 0.8553459119496855, |
|
"eval_PERSON_number": 152, |
|
"eval_PERSON_precision": 0.8192771084337349, |
|
"eval_PERSON_recall": 0.8947368421052632, |
|
"eval_QUANTITY_f1": 0.78125, |
|
"eval_QUANTITY_number": 30, |
|
"eval_QUANTITY_precision": 0.7352941176470589, |
|
"eval_QUANTITY_recall": 0.8333333333333334, |
|
"eval_TIME_f1": 0.8666666666666666, |
|
"eval_TIME_number": 29, |
|
"eval_TIME_precision": 0.8387096774193549, |
|
"eval_TIME_recall": 0.896551724137931, |
|
"eval_loss": 0.15107131004333496, |
|
"eval_overall_accuracy": 0.9651728553137003, |
|
"eval_overall_f1": 0.8347338935574229, |
|
"eval_overall_precision": 0.7925531914893617, |
|
"eval_overall_recall": 0.8816568047337278, |
|
"eval_runtime": 0.2937, |
|
"eval_samples_per_second": 636.611, |
|
"eval_steps_per_second": 10.213, |
|
"step": 7314 |
|
}, |
|
{ |
|
"epoch": 70.0, |
|
"grad_norm": 1.7515956163406372, |
|
"learning_rate": 1.5e-05, |
|
"loss": 0.0414, |
|
"step": 7420 |
|
}, |
|
{ |
|
"epoch": 70.0, |
|
"eval_LOCATION_f1": 0.870748299319728, |
|
"eval_LOCATION_number": 69, |
|
"eval_LOCATION_precision": 0.8205128205128205, |
|
"eval_LOCATION_recall": 0.927536231884058, |
|
"eval_ORGANIZATION_f1": 0.7301587301587301, |
|
"eval_ORGANIZATION_number": 58, |
|
"eval_ORGANIZATION_precision": 0.6764705882352942, |
|
"eval_ORGANIZATION_recall": 0.7931034482758621, |
|
"eval_PERSON_f1": 0.8625, |
|
"eval_PERSON_number": 152, |
|
"eval_PERSON_precision": 0.8214285714285714, |
|
"eval_PERSON_recall": 0.9078947368421053, |
|
"eval_QUANTITY_f1": 0.746268656716418, |
|
"eval_QUANTITY_number": 30, |
|
"eval_QUANTITY_precision": 0.6756756756756757, |
|
"eval_QUANTITY_recall": 0.8333333333333334, |
|
"eval_TIME_f1": 0.7999999999999999, |
|
"eval_TIME_number": 29, |
|
"eval_TIME_precision": 0.7741935483870968, |
|
"eval_TIME_recall": 0.8275862068965517, |
|
"eval_loss": 0.15384884178638458, |
|
"eval_overall_accuracy": 0.963124199743918, |
|
"eval_overall_f1": 0.8250000000000001, |
|
"eval_overall_precision": 0.7774869109947644, |
|
"eval_overall_recall": 0.878698224852071, |
|
"eval_runtime": 0.2872, |
|
"eval_samples_per_second": 651.192, |
|
"eval_steps_per_second": 10.447, |
|
"step": 7420 |
|
}, |
|
{ |
|
"epoch": 71.0, |
|
"grad_norm": 1.0327603816986084, |
|
"learning_rate": 1.45e-05, |
|
"loss": 0.0407, |
|
"step": 7526 |
|
}, |
|
{ |
|
"epoch": 71.0, |
|
"eval_LOCATION_f1": 0.8767123287671235, |
|
"eval_LOCATION_number": 69, |
|
"eval_LOCATION_precision": 0.8311688311688312, |
|
"eval_LOCATION_recall": 0.927536231884058, |
|
"eval_ORGANIZATION_f1": 0.7384615384615385, |
|
"eval_ORGANIZATION_number": 58, |
|
"eval_ORGANIZATION_precision": 0.6666666666666666, |
|
"eval_ORGANIZATION_recall": 0.8275862068965517, |
|
"eval_PERSON_f1": 0.8634920634920634, |
|
"eval_PERSON_number": 152, |
|
"eval_PERSON_precision": 0.8343558282208589, |
|
"eval_PERSON_recall": 0.8947368421052632, |
|
"eval_QUANTITY_f1": 0.7936507936507938, |
|
"eval_QUANTITY_number": 30, |
|
"eval_QUANTITY_precision": 0.7575757575757576, |
|
"eval_QUANTITY_recall": 0.8333333333333334, |
|
"eval_TIME_f1": 0.8666666666666666, |
|
"eval_TIME_number": 29, |
|
"eval_TIME_precision": 0.8387096774193549, |
|
"eval_TIME_recall": 0.896551724137931, |
|
"eval_loss": 0.1484140008687973, |
|
"eval_overall_accuracy": 0.9649167733674776, |
|
"eval_overall_f1": 0.8375350140056023, |
|
"eval_overall_precision": 0.7952127659574468, |
|
"eval_overall_recall": 0.8846153846153846, |
|
"eval_runtime": 0.2923, |
|
"eval_samples_per_second": 639.759, |
|
"eval_steps_per_second": 10.264, |
|
"step": 7526 |
|
}, |
|
{ |
|
"epoch": 72.0, |
|
"grad_norm": 1.021155595779419, |
|
"learning_rate": 1.4000000000000001e-05, |
|
"loss": 0.0395, |
|
"step": 7632 |
|
}, |
|
{ |
|
"epoch": 72.0, |
|
"eval_LOCATION_f1": 0.8749999999999999, |
|
"eval_LOCATION_number": 69, |
|
"eval_LOCATION_precision": 0.84, |
|
"eval_LOCATION_recall": 0.9130434782608695, |
|
"eval_ORGANIZATION_f1": 0.7419354838709677, |
|
"eval_ORGANIZATION_number": 58, |
|
"eval_ORGANIZATION_precision": 0.696969696969697, |
|
"eval_ORGANIZATION_recall": 0.7931034482758621, |
|
"eval_PERSON_f1": 0.8634920634920634, |
|
"eval_PERSON_number": 152, |
|
"eval_PERSON_precision": 0.8343558282208589, |
|
"eval_PERSON_recall": 0.8947368421052632, |
|
"eval_QUANTITY_f1": 0.7936507936507938, |
|
"eval_QUANTITY_number": 30, |
|
"eval_QUANTITY_precision": 0.7575757575757576, |
|
"eval_QUANTITY_recall": 0.8333333333333334, |
|
"eval_TIME_f1": 0.8666666666666666, |
|
"eval_TIME_number": 29, |
|
"eval_TIME_precision": 0.8387096774193549, |
|
"eval_TIME_recall": 0.896551724137931, |
|
"eval_loss": 0.14668720960617065, |
|
"eval_overall_accuracy": 0.9649167733674776, |
|
"eval_overall_f1": 0.8385269121813032, |
|
"eval_overall_precision": 0.8043478260869565, |
|
"eval_overall_recall": 0.8757396449704142, |
|
"eval_runtime": 0.2936, |
|
"eval_samples_per_second": 636.931, |
|
"eval_steps_per_second": 10.218, |
|
"step": 7632 |
|
}, |
|
{ |
|
"epoch": 73.0, |
|
"grad_norm": 0.8261666893959045, |
|
"learning_rate": 1.3500000000000001e-05, |
|
"loss": 0.0388, |
|
"step": 7738 |
|
}, |
|
{ |
|
"epoch": 73.0, |
|
"eval_LOCATION_f1": 0.8767123287671235, |
|
"eval_LOCATION_number": 69, |
|
"eval_LOCATION_precision": 0.8311688311688312, |
|
"eval_LOCATION_recall": 0.927536231884058, |
|
"eval_ORGANIZATION_f1": 0.7441860465116279, |
|
"eval_ORGANIZATION_number": 58, |
|
"eval_ORGANIZATION_precision": 0.676056338028169, |
|
"eval_ORGANIZATION_recall": 0.8275862068965517, |
|
"eval_PERSON_f1": 0.8634920634920634, |
|
"eval_PERSON_number": 152, |
|
"eval_PERSON_precision": 0.8343558282208589, |
|
"eval_PERSON_recall": 0.8947368421052632, |
|
"eval_QUANTITY_f1": 0.7936507936507938, |
|
"eval_QUANTITY_number": 30, |
|
"eval_QUANTITY_precision": 0.7575757575757576, |
|
"eval_QUANTITY_recall": 0.8333333333333334, |
|
"eval_TIME_f1": 0.8666666666666666, |
|
"eval_TIME_number": 29, |
|
"eval_TIME_precision": 0.8387096774193549, |
|
"eval_TIME_recall": 0.896551724137931, |
|
"eval_loss": 0.14678049087524414, |
|
"eval_overall_accuracy": 0.9651728553137003, |
|
"eval_overall_f1": 0.8387096774193548, |
|
"eval_overall_precision": 0.7973333333333333, |
|
"eval_overall_recall": 0.8846153846153846, |
|
"eval_runtime": 0.2943, |
|
"eval_samples_per_second": 635.507, |
|
"eval_steps_per_second": 10.195, |
|
"step": 7738 |
|
}, |
|
{ |
|
"epoch": 74.0, |
|
"grad_norm": 1.6623172760009766, |
|
"learning_rate": 1.3000000000000001e-05, |
|
"loss": 0.0401, |
|
"step": 7844 |
|
}, |
|
{ |
|
"epoch": 74.0, |
|
"eval_LOCATION_f1": 0.8767123287671235, |
|
"eval_LOCATION_number": 69, |
|
"eval_LOCATION_precision": 0.8311688311688312, |
|
"eval_LOCATION_recall": 0.927536231884058, |
|
"eval_ORGANIZATION_f1": 0.7441860465116279, |
|
"eval_ORGANIZATION_number": 58, |
|
"eval_ORGANIZATION_precision": 0.676056338028169, |
|
"eval_ORGANIZATION_recall": 0.8275862068965517, |
|
"eval_PERSON_f1": 0.8634920634920634, |
|
"eval_PERSON_number": 152, |
|
"eval_PERSON_precision": 0.8343558282208589, |
|
"eval_PERSON_recall": 0.8947368421052632, |
|
"eval_QUANTITY_f1": 0.7692307692307692, |
|
"eval_QUANTITY_number": 30, |
|
"eval_QUANTITY_precision": 0.7142857142857143, |
|
"eval_QUANTITY_recall": 0.8333333333333334, |
|
"eval_TIME_f1": 0.8666666666666666, |
|
"eval_TIME_number": 29, |
|
"eval_TIME_precision": 0.8387096774193549, |
|
"eval_TIME_recall": 0.896551724137931, |
|
"eval_loss": 0.15321803092956543, |
|
"eval_overall_accuracy": 0.9646606914212548, |
|
"eval_overall_f1": 0.8363636363636363, |
|
"eval_overall_precision": 0.7931034482758621, |
|
"eval_overall_recall": 0.8846153846153846, |
|
"eval_runtime": 0.2923, |
|
"eval_samples_per_second": 639.734, |
|
"eval_steps_per_second": 10.263, |
|
"step": 7844 |
|
}, |
|
{ |
|
"epoch": 75.0, |
|
"grad_norm": 0.745629608631134, |
|
"learning_rate": 1.25e-05, |
|
"loss": 0.0376, |
|
"step": 7950 |
|
}, |
|
{ |
|
"epoch": 75.0, |
|
"eval_LOCATION_f1": 0.870748299319728, |
|
"eval_LOCATION_number": 69, |
|
"eval_LOCATION_precision": 0.8205128205128205, |
|
"eval_LOCATION_recall": 0.927536231884058, |
|
"eval_ORGANIZATION_f1": 0.71875, |
|
"eval_ORGANIZATION_number": 58, |
|
"eval_ORGANIZATION_precision": 0.6571428571428571, |
|
"eval_ORGANIZATION_recall": 0.7931034482758621, |
|
"eval_PERSON_f1": 0.860759493670886, |
|
"eval_PERSON_number": 152, |
|
"eval_PERSON_precision": 0.8292682926829268, |
|
"eval_PERSON_recall": 0.8947368421052632, |
|
"eval_QUANTITY_f1": 0.7692307692307692, |
|
"eval_QUANTITY_number": 30, |
|
"eval_QUANTITY_precision": 0.7142857142857143, |
|
"eval_QUANTITY_recall": 0.8333333333333334, |
|
"eval_TIME_f1": 0.8666666666666666, |
|
"eval_TIME_number": 29, |
|
"eval_TIME_precision": 0.8387096774193549, |
|
"eval_TIME_recall": 0.896551724137931, |
|
"eval_loss": 0.15535052120685577, |
|
"eval_overall_accuracy": 0.9636363636363636, |
|
"eval_overall_f1": 0.829608938547486, |
|
"eval_overall_precision": 0.7857142857142857, |
|
"eval_overall_recall": 0.878698224852071, |
|
"eval_runtime": 0.2924, |
|
"eval_samples_per_second": 639.471, |
|
"eval_steps_per_second": 10.259, |
|
"step": 7950 |
|
}, |
|
{ |
|
"epoch": 76.0, |
|
"grad_norm": 1.3148008584976196, |
|
"learning_rate": 1.2e-05, |
|
"loss": 0.0389, |
|
"step": 8056 |
|
}, |
|
{ |
|
"epoch": 76.0, |
|
"eval_LOCATION_f1": 0.8648648648648648, |
|
"eval_LOCATION_number": 69, |
|
"eval_LOCATION_precision": 0.810126582278481, |
|
"eval_LOCATION_recall": 0.927536231884058, |
|
"eval_ORGANIZATION_f1": 0.7480916030534351, |
|
"eval_ORGANIZATION_number": 58, |
|
"eval_ORGANIZATION_precision": 0.6712328767123288, |
|
"eval_ORGANIZATION_recall": 0.8448275862068966, |
|
"eval_PERSON_f1": 0.8634920634920634, |
|
"eval_PERSON_number": 152, |
|
"eval_PERSON_precision": 0.8343558282208589, |
|
"eval_PERSON_recall": 0.8947368421052632, |
|
"eval_QUANTITY_f1": 0.7500000000000001, |
|
"eval_QUANTITY_number": 30, |
|
"eval_QUANTITY_precision": 0.7058823529411765, |
|
"eval_QUANTITY_recall": 0.8, |
|
"eval_TIME_f1": 0.8666666666666666, |
|
"eval_TIME_number": 29, |
|
"eval_TIME_precision": 0.8387096774193549, |
|
"eval_TIME_recall": 0.896551724137931, |
|
"eval_loss": 0.15534979104995728, |
|
"eval_overall_accuracy": 0.963124199743918, |
|
"eval_overall_f1": 0.8328690807799444, |
|
"eval_overall_precision": 0.7868421052631579, |
|
"eval_overall_recall": 0.8846153846153846, |
|
"eval_runtime": 0.2928, |
|
"eval_samples_per_second": 638.704, |
|
"eval_steps_per_second": 10.247, |
|
"step": 8056 |
|
}, |
|
{ |
|
"epoch": 77.0, |
|
"grad_norm": 0.5751745104789734, |
|
"learning_rate": 1.1500000000000002e-05, |
|
"loss": 0.0385, |
|
"step": 8162 |
|
}, |
|
{ |
|
"epoch": 77.0, |
|
"eval_LOCATION_f1": 0.8767123287671235, |
|
"eval_LOCATION_number": 69, |
|
"eval_LOCATION_precision": 0.8311688311688312, |
|
"eval_LOCATION_recall": 0.927536231884058, |
|
"eval_ORGANIZATION_f1": 0.7538461538461538, |
|
"eval_ORGANIZATION_number": 58, |
|
"eval_ORGANIZATION_precision": 0.6805555555555556, |
|
"eval_ORGANIZATION_recall": 0.8448275862068966, |
|
"eval_PERSON_f1": 0.8634920634920634, |
|
"eval_PERSON_number": 152, |
|
"eval_PERSON_precision": 0.8343558282208589, |
|
"eval_PERSON_recall": 0.8947368421052632, |
|
"eval_QUANTITY_f1": 0.7384615384615385, |
|
"eval_QUANTITY_number": 30, |
|
"eval_QUANTITY_precision": 0.6857142857142857, |
|
"eval_QUANTITY_recall": 0.8, |
|
"eval_TIME_f1": 0.8666666666666666, |
|
"eval_TIME_number": 29, |
|
"eval_TIME_precision": 0.8387096774193549, |
|
"eval_TIME_recall": 0.896551724137931, |
|
"eval_loss": 0.1525815725326538, |
|
"eval_overall_accuracy": 0.964404609475032, |
|
"eval_overall_f1": 0.835195530726257, |
|
"eval_overall_precision": 0.791005291005291, |
|
"eval_overall_recall": 0.8846153846153846, |
|
"eval_runtime": 0.2918, |
|
"eval_samples_per_second": 640.799, |
|
"eval_steps_per_second": 10.28, |
|
"step": 8162 |
|
}, |
|
{ |
|
"epoch": 78.0, |
|
"grad_norm": 1.434624195098877, |
|
"learning_rate": 1.1000000000000001e-05, |
|
"loss": 0.0375, |
|
"step": 8268 |
|
}, |
|
{ |
|
"epoch": 78.0, |
|
"eval_LOCATION_f1": 0.882758620689655, |
|
"eval_LOCATION_number": 69, |
|
"eval_LOCATION_precision": 0.8421052631578947, |
|
"eval_LOCATION_recall": 0.927536231884058, |
|
"eval_ORGANIZATION_f1": 0.7286821705426356, |
|
"eval_ORGANIZATION_number": 58, |
|
"eval_ORGANIZATION_precision": 0.6619718309859155, |
|
"eval_ORGANIZATION_recall": 0.8103448275862069, |
|
"eval_PERSON_f1": 0.8580441640378549, |
|
"eval_PERSON_number": 152, |
|
"eval_PERSON_precision": 0.8242424242424242, |
|
"eval_PERSON_recall": 0.8947368421052632, |
|
"eval_QUANTITY_f1": 0.7384615384615385, |
|
"eval_QUANTITY_number": 30, |
|
"eval_QUANTITY_precision": 0.6857142857142857, |
|
"eval_QUANTITY_recall": 0.8, |
|
"eval_TIME_f1": 0.8666666666666666, |
|
"eval_TIME_number": 29, |
|
"eval_TIME_precision": 0.8387096774193549, |
|
"eval_TIME_recall": 0.896551724137931, |
|
"eval_loss": 0.15279057621955872, |
|
"eval_overall_accuracy": 0.9638924455825865, |
|
"eval_overall_f1": 0.829608938547486, |
|
"eval_overall_precision": 0.7857142857142857, |
|
"eval_overall_recall": 0.878698224852071, |
|
"eval_runtime": 0.2926, |
|
"eval_samples_per_second": 639.034, |
|
"eval_steps_per_second": 10.252, |
|
"step": 8268 |
|
}, |
|
{ |
|
"epoch": 79.0, |
|
"grad_norm": 0.7510130405426025, |
|
"learning_rate": 1.05e-05, |
|
"loss": 0.0373, |
|
"step": 8374 |
|
}, |
|
{ |
|
"epoch": 79.0, |
|
"eval_LOCATION_f1": 0.8767123287671235, |
|
"eval_LOCATION_number": 69, |
|
"eval_LOCATION_precision": 0.8311688311688312, |
|
"eval_LOCATION_recall": 0.927536231884058, |
|
"eval_ORGANIZATION_f1": 0.7244094488188977, |
|
"eval_ORGANIZATION_number": 58, |
|
"eval_ORGANIZATION_precision": 0.6666666666666666, |
|
"eval_ORGANIZATION_recall": 0.7931034482758621, |
|
"eval_PERSON_f1": 0.860759493670886, |
|
"eval_PERSON_number": 152, |
|
"eval_PERSON_precision": 0.8292682926829268, |
|
"eval_PERSON_recall": 0.8947368421052632, |
|
"eval_QUANTITY_f1": 0.78125, |
|
"eval_QUANTITY_number": 30, |
|
"eval_QUANTITY_precision": 0.7352941176470589, |
|
"eval_QUANTITY_recall": 0.8333333333333334, |
|
"eval_TIME_f1": 0.8666666666666666, |
|
"eval_TIME_number": 29, |
|
"eval_TIME_precision": 0.8387096774193549, |
|
"eval_TIME_recall": 0.896551724137931, |
|
"eval_loss": 0.1517334133386612, |
|
"eval_overall_accuracy": 0.964404609475032, |
|
"eval_overall_f1": 0.8330995792426368, |
|
"eval_overall_precision": 0.792, |
|
"eval_overall_recall": 0.878698224852071, |
|
"eval_runtime": 0.2862, |
|
"eval_samples_per_second": 653.312, |
|
"eval_steps_per_second": 10.481, |
|
"step": 8374 |
|
}, |
|
{ |
|
"epoch": 80.0, |
|
"grad_norm": 0.686745822429657, |
|
"learning_rate": 1e-05, |
|
"loss": 0.0375, |
|
"step": 8480 |
|
}, |
|
{ |
|
"epoch": 80.0, |
|
"eval_LOCATION_f1": 0.870748299319728, |
|
"eval_LOCATION_number": 69, |
|
"eval_LOCATION_precision": 0.8205128205128205, |
|
"eval_LOCATION_recall": 0.927536231884058, |
|
"eval_ORGANIZATION_f1": 0.7401574803149606, |
|
"eval_ORGANIZATION_number": 58, |
|
"eval_ORGANIZATION_precision": 0.6811594202898551, |
|
"eval_ORGANIZATION_recall": 0.8103448275862069, |
|
"eval_PERSON_f1": 0.8553459119496855, |
|
"eval_PERSON_number": 152, |
|
"eval_PERSON_precision": 0.8192771084337349, |
|
"eval_PERSON_recall": 0.8947368421052632, |
|
"eval_QUANTITY_f1": 0.7500000000000001, |
|
"eval_QUANTITY_number": 30, |
|
"eval_QUANTITY_precision": 0.7058823529411765, |
|
"eval_QUANTITY_recall": 0.8, |
|
"eval_TIME_f1": 0.8666666666666666, |
|
"eval_TIME_number": 29, |
|
"eval_TIME_precision": 0.8387096774193549, |
|
"eval_TIME_recall": 0.896551724137931, |
|
"eval_loss": 0.15770980715751648, |
|
"eval_overall_accuracy": 0.9638924455825865, |
|
"eval_overall_f1": 0.829608938547486, |
|
"eval_overall_precision": 0.7857142857142857, |
|
"eval_overall_recall": 0.878698224852071, |
|
"eval_runtime": 0.2918, |
|
"eval_samples_per_second": 640.906, |
|
"eval_steps_per_second": 10.282, |
|
"step": 8480 |
|
}, |
|
{ |
|
"epoch": 81.0, |
|
"grad_norm": 2.2296547889709473, |
|
"learning_rate": 9.5e-06, |
|
"loss": 0.0371, |
|
"step": 8586 |
|
}, |
|
{ |
|
"epoch": 81.0, |
|
"eval_LOCATION_f1": 0.870748299319728, |
|
"eval_LOCATION_number": 69, |
|
"eval_LOCATION_precision": 0.8205128205128205, |
|
"eval_LOCATION_recall": 0.927536231884058, |
|
"eval_ORGANIZATION_f1": 0.7384615384615385, |
|
"eval_ORGANIZATION_number": 58, |
|
"eval_ORGANIZATION_precision": 0.6666666666666666, |
|
"eval_ORGANIZATION_recall": 0.8275862068965517, |
|
"eval_PERSON_f1": 0.8580441640378549, |
|
"eval_PERSON_number": 152, |
|
"eval_PERSON_precision": 0.8242424242424242, |
|
"eval_PERSON_recall": 0.8947368421052632, |
|
"eval_QUANTITY_f1": 0.7692307692307692, |
|
"eval_QUANTITY_number": 30, |
|
"eval_QUANTITY_precision": 0.7142857142857143, |
|
"eval_QUANTITY_recall": 0.8333333333333334, |
|
"eval_TIME_f1": 0.8666666666666666, |
|
"eval_TIME_number": 29, |
|
"eval_TIME_precision": 0.8387096774193549, |
|
"eval_TIME_recall": 0.896551724137931, |
|
"eval_loss": 0.1602996438741684, |
|
"eval_overall_accuracy": 0.963124199743918, |
|
"eval_overall_f1": 0.8317107093184978, |
|
"eval_overall_precision": 0.7847769028871391, |
|
"eval_overall_recall": 0.8846153846153846, |
|
"eval_runtime": 0.2862, |
|
"eval_samples_per_second": 653.41, |
|
"eval_steps_per_second": 10.483, |
|
"step": 8586 |
|
}, |
|
{ |
|
"epoch": 82.0, |
|
"grad_norm": 1.0859251022338867, |
|
"learning_rate": 9e-06, |
|
"loss": 0.0364, |
|
"step": 8692 |
|
}, |
|
{ |
|
"epoch": 82.0, |
|
"eval_LOCATION_f1": 0.870748299319728, |
|
"eval_LOCATION_number": 69, |
|
"eval_LOCATION_precision": 0.8205128205128205, |
|
"eval_LOCATION_recall": 0.927536231884058, |
|
"eval_ORGANIZATION_f1": 0.7441860465116279, |
|
"eval_ORGANIZATION_number": 58, |
|
"eval_ORGANIZATION_precision": 0.676056338028169, |
|
"eval_ORGANIZATION_recall": 0.8275862068965517, |
|
"eval_PERSON_f1": 0.8580441640378549, |
|
"eval_PERSON_number": 152, |
|
"eval_PERSON_precision": 0.8242424242424242, |
|
"eval_PERSON_recall": 0.8947368421052632, |
|
"eval_QUANTITY_f1": 0.7692307692307692, |
|
"eval_QUANTITY_number": 30, |
|
"eval_QUANTITY_precision": 0.7142857142857143, |
|
"eval_QUANTITY_recall": 0.8333333333333334, |
|
"eval_TIME_f1": 0.8666666666666666, |
|
"eval_TIME_number": 29, |
|
"eval_TIME_precision": 0.8387096774193549, |
|
"eval_TIME_recall": 0.896551724137931, |
|
"eval_loss": 0.15970273315906525, |
|
"eval_overall_accuracy": 0.9633802816901409, |
|
"eval_overall_f1": 0.8328690807799444, |
|
"eval_overall_precision": 0.7868421052631579, |
|
"eval_overall_recall": 0.8846153846153846, |
|
"eval_runtime": 0.2856, |
|
"eval_samples_per_second": 654.808, |
|
"eval_steps_per_second": 10.505, |
|
"step": 8692 |
|
}, |
|
{ |
|
"epoch": 83.0, |
|
"grad_norm": 0.759631872177124, |
|
"learning_rate": 8.500000000000002e-06, |
|
"loss": 0.0355, |
|
"step": 8798 |
|
}, |
|
{ |
|
"epoch": 83.0, |
|
"eval_LOCATION_f1": 0.870748299319728, |
|
"eval_LOCATION_number": 69, |
|
"eval_LOCATION_precision": 0.8205128205128205, |
|
"eval_LOCATION_recall": 0.927536231884058, |
|
"eval_ORGANIZATION_f1": 0.71875, |
|
"eval_ORGANIZATION_number": 58, |
|
"eval_ORGANIZATION_precision": 0.6571428571428571, |
|
"eval_ORGANIZATION_recall": 0.7931034482758621, |
|
"eval_PERSON_f1": 0.8580441640378549, |
|
"eval_PERSON_number": 152, |
|
"eval_PERSON_precision": 0.8242424242424242, |
|
"eval_PERSON_recall": 0.8947368421052632, |
|
"eval_QUANTITY_f1": 0.7692307692307692, |
|
"eval_QUANTITY_number": 30, |
|
"eval_QUANTITY_precision": 0.7142857142857143, |
|
"eval_QUANTITY_recall": 0.8333333333333334, |
|
"eval_TIME_f1": 0.8666666666666666, |
|
"eval_TIME_number": 29, |
|
"eval_TIME_precision": 0.8387096774193549, |
|
"eval_TIME_recall": 0.896551724137931, |
|
"eval_loss": 0.15819035470485687, |
|
"eval_overall_accuracy": 0.963124199743918, |
|
"eval_overall_f1": 0.8284518828451882, |
|
"eval_overall_precision": 0.783641160949868, |
|
"eval_overall_recall": 0.878698224852071, |
|
"eval_runtime": 0.2921, |
|
"eval_samples_per_second": 640.257, |
|
"eval_steps_per_second": 10.271, |
|
"step": 8798 |
|
}, |
|
{ |
|
"epoch": 84.0, |
|
"grad_norm": 3.2821595668792725, |
|
"learning_rate": 8.000000000000001e-06, |
|
"loss": 0.0352, |
|
"step": 8904 |
|
}, |
|
{ |
|
"epoch": 84.0, |
|
"eval_LOCATION_f1": 0.8648648648648648, |
|
"eval_LOCATION_number": 69, |
|
"eval_LOCATION_precision": 0.810126582278481, |
|
"eval_LOCATION_recall": 0.927536231884058, |
|
"eval_ORGANIZATION_f1": 0.7175572519083969, |
|
"eval_ORGANIZATION_number": 58, |
|
"eval_ORGANIZATION_precision": 0.6438356164383562, |
|
"eval_ORGANIZATION_recall": 0.8103448275862069, |
|
"eval_PERSON_f1": 0.8580441640378549, |
|
"eval_PERSON_number": 152, |
|
"eval_PERSON_precision": 0.8242424242424242, |
|
"eval_PERSON_recall": 0.8947368421052632, |
|
"eval_QUANTITY_f1": 0.7384615384615385, |
|
"eval_QUANTITY_number": 30, |
|
"eval_QUANTITY_precision": 0.6857142857142857, |
|
"eval_QUANTITY_recall": 0.8, |
|
"eval_TIME_f1": 0.8333333333333334, |
|
"eval_TIME_number": 29, |
|
"eval_TIME_precision": 0.8064516129032258, |
|
"eval_TIME_recall": 0.8620689655172413, |
|
"eval_loss": 0.1597450226545334, |
|
"eval_overall_accuracy": 0.9620998719590269, |
|
"eval_overall_f1": 0.8210818307905687, |
|
"eval_overall_precision": 0.7728459530026109, |
|
"eval_overall_recall": 0.8757396449704142, |
|
"eval_runtime": 0.2916, |
|
"eval_samples_per_second": 641.288, |
|
"eval_steps_per_second": 10.288, |
|
"step": 8904 |
|
}, |
|
{ |
|
"epoch": 85.0, |
|
"grad_norm": 1.4578148126602173, |
|
"learning_rate": 7.5e-06, |
|
"loss": 0.0351, |
|
"step": 9010 |
|
}, |
|
{ |
|
"epoch": 85.0, |
|
"eval_LOCATION_f1": 0.8767123287671235, |
|
"eval_LOCATION_number": 69, |
|
"eval_LOCATION_precision": 0.8311688311688312, |
|
"eval_LOCATION_recall": 0.927536231884058, |
|
"eval_ORGANIZATION_f1": 0.71875, |
|
"eval_ORGANIZATION_number": 58, |
|
"eval_ORGANIZATION_precision": 0.6571428571428571, |
|
"eval_ORGANIZATION_recall": 0.7931034482758621, |
|
"eval_PERSON_f1": 0.8634920634920634, |
|
"eval_PERSON_number": 152, |
|
"eval_PERSON_precision": 0.8343558282208589, |
|
"eval_PERSON_recall": 0.8947368421052632, |
|
"eval_QUANTITY_f1": 0.7692307692307692, |
|
"eval_QUANTITY_number": 30, |
|
"eval_QUANTITY_precision": 0.7142857142857143, |
|
"eval_QUANTITY_recall": 0.8333333333333334, |
|
"eval_TIME_f1": 0.8666666666666666, |
|
"eval_TIME_number": 29, |
|
"eval_TIME_precision": 0.8387096774193549, |
|
"eval_TIME_recall": 0.896551724137931, |
|
"eval_loss": 0.15464067459106445, |
|
"eval_overall_accuracy": 0.9638924455825865, |
|
"eval_overall_f1": 0.8319327731092437, |
|
"eval_overall_precision": 0.7898936170212766, |
|
"eval_overall_recall": 0.878698224852071, |
|
"eval_runtime": 0.291, |
|
"eval_samples_per_second": 642.532, |
|
"eval_steps_per_second": 10.308, |
|
"step": 9010 |
|
}, |
|
{ |
|
"epoch": 86.0, |
|
"grad_norm": 3.6410322189331055, |
|
"learning_rate": 7.000000000000001e-06, |
|
"loss": 0.0358, |
|
"step": 9116 |
|
}, |
|
{ |
|
"epoch": 86.0, |
|
"eval_LOCATION_f1": 0.882758620689655, |
|
"eval_LOCATION_number": 69, |
|
"eval_LOCATION_precision": 0.8421052631578947, |
|
"eval_LOCATION_recall": 0.927536231884058, |
|
"eval_ORGANIZATION_f1": 0.7131782945736435, |
|
"eval_ORGANIZATION_number": 58, |
|
"eval_ORGANIZATION_precision": 0.647887323943662, |
|
"eval_ORGANIZATION_recall": 0.7931034482758621, |
|
"eval_PERSON_f1": 0.8634920634920634, |
|
"eval_PERSON_number": 152, |
|
"eval_PERSON_precision": 0.8343558282208589, |
|
"eval_PERSON_recall": 0.8947368421052632, |
|
"eval_QUANTITY_f1": 0.7692307692307692, |
|
"eval_QUANTITY_number": 30, |
|
"eval_QUANTITY_precision": 0.7142857142857143, |
|
"eval_QUANTITY_recall": 0.8333333333333334, |
|
"eval_TIME_f1": 0.8666666666666666, |
|
"eval_TIME_number": 29, |
|
"eval_TIME_precision": 0.8387096774193549, |
|
"eval_TIME_recall": 0.896551724137931, |
|
"eval_loss": 0.15458884835243225, |
|
"eval_overall_accuracy": 0.9638924455825865, |
|
"eval_overall_f1": 0.8319327731092437, |
|
"eval_overall_precision": 0.7898936170212766, |
|
"eval_overall_recall": 0.878698224852071, |
|
"eval_runtime": 0.2879, |
|
"eval_samples_per_second": 649.619, |
|
"eval_steps_per_second": 10.422, |
|
"step": 9116 |
|
}, |
|
{ |
|
"epoch": 87.0, |
|
"grad_norm": 0.8341395854949951, |
|
"learning_rate": 6.5000000000000004e-06, |
|
"loss": 0.0359, |
|
"step": 9222 |
|
}, |
|
{ |
|
"epoch": 87.0, |
|
"eval_LOCATION_f1": 0.8767123287671235, |
|
"eval_LOCATION_number": 69, |
|
"eval_LOCATION_precision": 0.8311688311688312, |
|
"eval_LOCATION_recall": 0.927536231884058, |
|
"eval_ORGANIZATION_f1": 0.7175572519083969, |
|
"eval_ORGANIZATION_number": 58, |
|
"eval_ORGANIZATION_precision": 0.6438356164383562, |
|
"eval_ORGANIZATION_recall": 0.8103448275862069, |
|
"eval_PERSON_f1": 0.860759493670886, |
|
"eval_PERSON_number": 152, |
|
"eval_PERSON_precision": 0.8292682926829268, |
|
"eval_PERSON_recall": 0.8947368421052632, |
|
"eval_QUANTITY_f1": 0.78125, |
|
"eval_QUANTITY_number": 30, |
|
"eval_QUANTITY_precision": 0.7352941176470589, |
|
"eval_QUANTITY_recall": 0.8333333333333334, |
|
"eval_TIME_f1": 0.8666666666666666, |
|
"eval_TIME_number": 29, |
|
"eval_TIME_precision": 0.8387096774193549, |
|
"eval_TIME_recall": 0.896551724137931, |
|
"eval_loss": 0.15657885372638702, |
|
"eval_overall_accuracy": 0.9638924455825865, |
|
"eval_overall_f1": 0.8312412831241283, |
|
"eval_overall_precision": 0.7862796833773087, |
|
"eval_overall_recall": 0.8816568047337278, |
|
"eval_runtime": 0.2923, |
|
"eval_samples_per_second": 639.721, |
|
"eval_steps_per_second": 10.263, |
|
"step": 9222 |
|
}, |
|
{ |
|
"epoch": 88.0, |
|
"grad_norm": 2.221242904663086, |
|
"learning_rate": 6e-06, |
|
"loss": 0.0338, |
|
"step": 9328 |
|
}, |
|
{ |
|
"epoch": 88.0, |
|
"eval_LOCATION_f1": 0.8767123287671235, |
|
"eval_LOCATION_number": 69, |
|
"eval_LOCATION_precision": 0.8311688311688312, |
|
"eval_LOCATION_recall": 0.927536231884058, |
|
"eval_ORGANIZATION_f1": 0.7086614173228347, |
|
"eval_ORGANIZATION_number": 58, |
|
"eval_ORGANIZATION_precision": 0.6521739130434783, |
|
"eval_ORGANIZATION_recall": 0.7758620689655172, |
|
"eval_PERSON_f1": 0.860759493670886, |
|
"eval_PERSON_number": 152, |
|
"eval_PERSON_precision": 0.8292682926829268, |
|
"eval_PERSON_recall": 0.8947368421052632, |
|
"eval_QUANTITY_f1": 0.78125, |
|
"eval_QUANTITY_number": 30, |
|
"eval_QUANTITY_precision": 0.7352941176470589, |
|
"eval_QUANTITY_recall": 0.8333333333333334, |
|
"eval_TIME_f1": 0.8666666666666666, |
|
"eval_TIME_number": 29, |
|
"eval_TIME_precision": 0.8387096774193549, |
|
"eval_TIME_recall": 0.896551724137931, |
|
"eval_loss": 0.15500542521476746, |
|
"eval_overall_accuracy": 0.9641485275288092, |
|
"eval_overall_f1": 0.8302945301542777, |
|
"eval_overall_precision": 0.7893333333333333, |
|
"eval_overall_recall": 0.8757396449704142, |
|
"eval_runtime": 0.2854, |
|
"eval_samples_per_second": 655.275, |
|
"eval_steps_per_second": 10.512, |
|
"step": 9328 |
|
}, |
|
{ |
|
"epoch": 89.0, |
|
"grad_norm": 0.7178964018821716, |
|
"learning_rate": 5.500000000000001e-06, |
|
"loss": 0.0324, |
|
"step": 9434 |
|
}, |
|
{ |
|
"epoch": 89.0, |
|
"eval_LOCATION_f1": 0.870748299319728, |
|
"eval_LOCATION_number": 69, |
|
"eval_LOCATION_precision": 0.8205128205128205, |
|
"eval_LOCATION_recall": 0.927536231884058, |
|
"eval_ORGANIZATION_f1": 0.703125, |
|
"eval_ORGANIZATION_number": 58, |
|
"eval_ORGANIZATION_precision": 0.6428571428571429, |
|
"eval_ORGANIZATION_recall": 0.7758620689655172, |
|
"eval_PERSON_f1": 0.8580441640378549, |
|
"eval_PERSON_number": 152, |
|
"eval_PERSON_precision": 0.8242424242424242, |
|
"eval_PERSON_recall": 0.8947368421052632, |
|
"eval_QUANTITY_f1": 0.7692307692307692, |
|
"eval_QUANTITY_number": 30, |
|
"eval_QUANTITY_precision": 0.7142857142857143, |
|
"eval_QUANTITY_recall": 0.8333333333333334, |
|
"eval_TIME_f1": 0.8666666666666666, |
|
"eval_TIME_number": 29, |
|
"eval_TIME_precision": 0.8387096774193549, |
|
"eval_TIME_recall": 0.896551724137931, |
|
"eval_loss": 0.15786349773406982, |
|
"eval_overall_accuracy": 0.9633802816901409, |
|
"eval_overall_f1": 0.8256624825662484, |
|
"eval_overall_precision": 0.7810026385224275, |
|
"eval_overall_recall": 0.8757396449704142, |
|
"eval_runtime": 0.2857, |
|
"eval_samples_per_second": 654.47, |
|
"eval_steps_per_second": 10.5, |
|
"step": 9434 |
|
}, |
|
{ |
|
"epoch": 90.0, |
|
"grad_norm": 1.6527904272079468, |
|
"learning_rate": 5e-06, |
|
"loss": 0.034, |
|
"step": 9540 |
|
}, |
|
{ |
|
"epoch": 90.0, |
|
"eval_LOCATION_f1": 0.8571428571428572, |
|
"eval_LOCATION_number": 69, |
|
"eval_LOCATION_precision": 0.8076923076923077, |
|
"eval_LOCATION_recall": 0.9130434782608695, |
|
"eval_ORGANIZATION_f1": 0.71875, |
|
"eval_ORGANIZATION_number": 58, |
|
"eval_ORGANIZATION_precision": 0.6571428571428571, |
|
"eval_ORGANIZATION_recall": 0.7931034482758621, |
|
"eval_PERSON_f1": 0.8580441640378549, |
|
"eval_PERSON_number": 152, |
|
"eval_PERSON_precision": 0.8242424242424242, |
|
"eval_PERSON_recall": 0.8947368421052632, |
|
"eval_QUANTITY_f1": 0.78125, |
|
"eval_QUANTITY_number": 30, |
|
"eval_QUANTITY_precision": 0.7352941176470589, |
|
"eval_QUANTITY_recall": 0.8333333333333334, |
|
"eval_TIME_f1": 0.8666666666666666, |
|
"eval_TIME_number": 29, |
|
"eval_TIME_precision": 0.8387096774193549, |
|
"eval_TIME_recall": 0.896551724137931, |
|
"eval_loss": 0.15783792734146118, |
|
"eval_overall_accuracy": 0.9638924455825865, |
|
"eval_overall_f1": 0.8268156424581006, |
|
"eval_overall_precision": 0.783068783068783, |
|
"eval_overall_recall": 0.8757396449704142, |
|
"eval_runtime": 0.2925, |
|
"eval_samples_per_second": 639.316, |
|
"eval_steps_per_second": 10.256, |
|
"step": 9540 |
|
}, |
|
{ |
|
"epoch": 91.0, |
|
"grad_norm": 1.0714702606201172, |
|
"learning_rate": 4.5e-06, |
|
"loss": 0.0353, |
|
"step": 9646 |
|
}, |
|
{ |
|
"epoch": 91.0, |
|
"eval_LOCATION_f1": 0.8571428571428572, |
|
"eval_LOCATION_number": 69, |
|
"eval_LOCATION_precision": 0.8076923076923077, |
|
"eval_LOCATION_recall": 0.9130434782608695, |
|
"eval_ORGANIZATION_f1": 0.7343749999999999, |
|
"eval_ORGANIZATION_number": 58, |
|
"eval_ORGANIZATION_precision": 0.6714285714285714, |
|
"eval_ORGANIZATION_recall": 0.8103448275862069, |
|
"eval_PERSON_f1": 0.860759493670886, |
|
"eval_PERSON_number": 152, |
|
"eval_PERSON_precision": 0.8292682926829268, |
|
"eval_PERSON_recall": 0.8947368421052632, |
|
"eval_QUANTITY_f1": 0.7692307692307692, |
|
"eval_QUANTITY_number": 30, |
|
"eval_QUANTITY_precision": 0.7142857142857143, |
|
"eval_QUANTITY_recall": 0.8333333333333334, |
|
"eval_TIME_f1": 0.8666666666666666, |
|
"eval_TIME_number": 29, |
|
"eval_TIME_precision": 0.8387096774193549, |
|
"eval_TIME_recall": 0.896551724137931, |
|
"eval_loss": 0.15797153115272522, |
|
"eval_overall_accuracy": 0.9638924455825865, |
|
"eval_overall_f1": 0.829608938547486, |
|
"eval_overall_precision": 0.7857142857142857, |
|
"eval_overall_recall": 0.878698224852071, |
|
"eval_runtime": 0.286, |
|
"eval_samples_per_second": 653.836, |
|
"eval_steps_per_second": 10.489, |
|
"step": 9646 |
|
}, |
|
{ |
|
"epoch": 92.0, |
|
"grad_norm": 1.2929750680923462, |
|
"learning_rate": 4.000000000000001e-06, |
|
"loss": 0.0325, |
|
"step": 9752 |
|
}, |
|
{ |
|
"epoch": 92.0, |
|
"eval_LOCATION_f1": 0.870748299319728, |
|
"eval_LOCATION_number": 69, |
|
"eval_LOCATION_precision": 0.8205128205128205, |
|
"eval_LOCATION_recall": 0.927536231884058, |
|
"eval_ORGANIZATION_f1": 0.71875, |
|
"eval_ORGANIZATION_number": 58, |
|
"eval_ORGANIZATION_precision": 0.6571428571428571, |
|
"eval_ORGANIZATION_recall": 0.7931034482758621, |
|
"eval_PERSON_f1": 0.860759493670886, |
|
"eval_PERSON_number": 152, |
|
"eval_PERSON_precision": 0.8292682926829268, |
|
"eval_PERSON_recall": 0.8947368421052632, |
|
"eval_QUANTITY_f1": 0.78125, |
|
"eval_QUANTITY_number": 30, |
|
"eval_QUANTITY_precision": 0.7352941176470589, |
|
"eval_QUANTITY_recall": 0.8333333333333334, |
|
"eval_TIME_f1": 0.8666666666666666, |
|
"eval_TIME_number": 29, |
|
"eval_TIME_precision": 0.8387096774193549, |
|
"eval_TIME_recall": 0.896551724137931, |
|
"eval_loss": 0.15651264786720276, |
|
"eval_overall_accuracy": 0.9638924455825865, |
|
"eval_overall_f1": 0.8307692307692308, |
|
"eval_overall_precision": 0.7877984084880637, |
|
"eval_overall_recall": 0.878698224852071, |
|
"eval_runtime": 0.2929, |
|
"eval_samples_per_second": 638.474, |
|
"eval_steps_per_second": 10.243, |
|
"step": 9752 |
|
}, |
|
{ |
|
"epoch": 93.0, |
|
"grad_norm": 0.8345323801040649, |
|
"learning_rate": 3.5000000000000004e-06, |
|
"loss": 0.0344, |
|
"step": 9858 |
|
}, |
|
{ |
|
"epoch": 93.0, |
|
"eval_LOCATION_f1": 0.870748299319728, |
|
"eval_LOCATION_number": 69, |
|
"eval_LOCATION_precision": 0.8205128205128205, |
|
"eval_LOCATION_recall": 0.927536231884058, |
|
"eval_ORGANIZATION_f1": 0.7343749999999999, |
|
"eval_ORGANIZATION_number": 58, |
|
"eval_ORGANIZATION_precision": 0.6714285714285714, |
|
"eval_ORGANIZATION_recall": 0.8103448275862069, |
|
"eval_PERSON_f1": 0.8580441640378549, |
|
"eval_PERSON_number": 152, |
|
"eval_PERSON_precision": 0.8242424242424242, |
|
"eval_PERSON_recall": 0.8947368421052632, |
|
"eval_QUANTITY_f1": 0.7384615384615385, |
|
"eval_QUANTITY_number": 30, |
|
"eval_QUANTITY_precision": 0.6857142857142857, |
|
"eval_QUANTITY_recall": 0.8, |
|
"eval_TIME_f1": 0.8666666666666666, |
|
"eval_TIME_number": 29, |
|
"eval_TIME_precision": 0.8387096774193549, |
|
"eval_TIME_recall": 0.896551724137931, |
|
"eval_loss": 0.1590217500925064, |
|
"eval_overall_accuracy": 0.9638924455825865, |
|
"eval_overall_f1": 0.8284518828451882, |
|
"eval_overall_precision": 0.783641160949868, |
|
"eval_overall_recall": 0.878698224852071, |
|
"eval_runtime": 0.2919, |
|
"eval_samples_per_second": 640.648, |
|
"eval_steps_per_second": 10.278, |
|
"step": 9858 |
|
}, |
|
{ |
|
"epoch": 94.0, |
|
"grad_norm": 0.6701174974441528, |
|
"learning_rate": 3e-06, |
|
"loss": 0.0336, |
|
"step": 9964 |
|
}, |
|
{ |
|
"epoch": 94.0, |
|
"eval_LOCATION_f1": 0.8571428571428572, |
|
"eval_LOCATION_number": 69, |
|
"eval_LOCATION_precision": 0.8076923076923077, |
|
"eval_LOCATION_recall": 0.9130434782608695, |
|
"eval_ORGANIZATION_f1": 0.7286821705426356, |
|
"eval_ORGANIZATION_number": 58, |
|
"eval_ORGANIZATION_precision": 0.6619718309859155, |
|
"eval_ORGANIZATION_recall": 0.8103448275862069, |
|
"eval_PERSON_f1": 0.8580441640378549, |
|
"eval_PERSON_number": 152, |
|
"eval_PERSON_precision": 0.8242424242424242, |
|
"eval_PERSON_recall": 0.8947368421052632, |
|
"eval_QUANTITY_f1": 0.7500000000000001, |
|
"eval_QUANTITY_number": 30, |
|
"eval_QUANTITY_precision": 0.7058823529411765, |
|
"eval_QUANTITY_recall": 0.8, |
|
"eval_TIME_f1": 0.8666666666666666, |
|
"eval_TIME_number": 29, |
|
"eval_TIME_precision": 0.8387096774193549, |
|
"eval_TIME_recall": 0.896551724137931, |
|
"eval_loss": 0.1604832261800766, |
|
"eval_overall_accuracy": 0.9633802816901409, |
|
"eval_overall_f1": 0.8256624825662484, |
|
"eval_overall_precision": 0.7810026385224275, |
|
"eval_overall_recall": 0.8757396449704142, |
|
"eval_runtime": 0.2864, |
|
"eval_samples_per_second": 652.822, |
|
"eval_steps_per_second": 10.473, |
|
"step": 9964 |
|
}, |
|
{ |
|
"epoch": 95.0, |
|
"grad_norm": 0.5713714361190796, |
|
"learning_rate": 2.5e-06, |
|
"loss": 0.0337, |
|
"step": 10070 |
|
}, |
|
{ |
|
"epoch": 95.0, |
|
"eval_LOCATION_f1": 0.870748299319728, |
|
"eval_LOCATION_number": 69, |
|
"eval_LOCATION_precision": 0.8205128205128205, |
|
"eval_LOCATION_recall": 0.927536231884058, |
|
"eval_ORGANIZATION_f1": 0.7244094488188977, |
|
"eval_ORGANIZATION_number": 58, |
|
"eval_ORGANIZATION_precision": 0.6666666666666666, |
|
"eval_ORGANIZATION_recall": 0.7931034482758621, |
|
"eval_PERSON_f1": 0.8580441640378549, |
|
"eval_PERSON_number": 152, |
|
"eval_PERSON_precision": 0.8242424242424242, |
|
"eval_PERSON_recall": 0.8947368421052632, |
|
"eval_QUANTITY_f1": 0.7692307692307692, |
|
"eval_QUANTITY_number": 30, |
|
"eval_QUANTITY_precision": 0.7142857142857143, |
|
"eval_QUANTITY_recall": 0.8333333333333334, |
|
"eval_TIME_f1": 0.8666666666666666, |
|
"eval_TIME_number": 29, |
|
"eval_TIME_precision": 0.8387096774193549, |
|
"eval_TIME_recall": 0.896551724137931, |
|
"eval_loss": 0.16034719347953796, |
|
"eval_overall_accuracy": 0.9638924455825865, |
|
"eval_overall_f1": 0.829608938547486, |
|
"eval_overall_precision": 0.7857142857142857, |
|
"eval_overall_recall": 0.878698224852071, |
|
"eval_runtime": 0.2857, |
|
"eval_samples_per_second": 654.607, |
|
"eval_steps_per_second": 10.502, |
|
"step": 10070 |
|
}, |
|
{ |
|
"epoch": 96.0, |
|
"grad_norm": 1.4332071542739868, |
|
"learning_rate": 2.0000000000000003e-06, |
|
"loss": 0.0326, |
|
"step": 10176 |
|
}, |
|
{ |
|
"epoch": 96.0, |
|
"eval_LOCATION_f1": 0.870748299319728, |
|
"eval_LOCATION_number": 69, |
|
"eval_LOCATION_precision": 0.8205128205128205, |
|
"eval_LOCATION_recall": 0.927536231884058, |
|
"eval_ORGANIZATION_f1": 0.703125, |
|
"eval_ORGANIZATION_number": 58, |
|
"eval_ORGANIZATION_precision": 0.6428571428571429, |
|
"eval_ORGANIZATION_recall": 0.7758620689655172, |
|
"eval_PERSON_f1": 0.8580441640378549, |
|
"eval_PERSON_number": 152, |
|
"eval_PERSON_precision": 0.8242424242424242, |
|
"eval_PERSON_recall": 0.8947368421052632, |
|
"eval_QUANTITY_f1": 0.7692307692307692, |
|
"eval_QUANTITY_number": 30, |
|
"eval_QUANTITY_precision": 0.7142857142857143, |
|
"eval_QUANTITY_recall": 0.8333333333333334, |
|
"eval_TIME_f1": 0.8666666666666666, |
|
"eval_TIME_number": 29, |
|
"eval_TIME_precision": 0.8387096774193549, |
|
"eval_TIME_recall": 0.896551724137931, |
|
"eval_loss": 0.1593874990940094, |
|
"eval_overall_accuracy": 0.9633802816901409, |
|
"eval_overall_f1": 0.8256624825662484, |
|
"eval_overall_precision": 0.7810026385224275, |
|
"eval_overall_recall": 0.8757396449704142, |
|
"eval_runtime": 0.2921, |
|
"eval_samples_per_second": 640.143, |
|
"eval_steps_per_second": 10.27, |
|
"step": 10176 |
|
}, |
|
{ |
|
"epoch": 97.0, |
|
"grad_norm": 1.3420923948287964, |
|
"learning_rate": 1.5e-06, |
|
"loss": 0.0352, |
|
"step": 10282 |
|
}, |
|
{ |
|
"epoch": 97.0, |
|
"eval_LOCATION_f1": 0.8767123287671235, |
|
"eval_LOCATION_number": 69, |
|
"eval_LOCATION_precision": 0.8311688311688312, |
|
"eval_LOCATION_recall": 0.927536231884058, |
|
"eval_ORGANIZATION_f1": 0.7244094488188977, |
|
"eval_ORGANIZATION_number": 58, |
|
"eval_ORGANIZATION_precision": 0.6666666666666666, |
|
"eval_ORGANIZATION_recall": 0.7931034482758621, |
|
"eval_PERSON_f1": 0.8580441640378549, |
|
"eval_PERSON_number": 152, |
|
"eval_PERSON_precision": 0.8242424242424242, |
|
"eval_PERSON_recall": 0.8947368421052632, |
|
"eval_QUANTITY_f1": 0.7692307692307692, |
|
"eval_QUANTITY_number": 30, |
|
"eval_QUANTITY_precision": 0.7142857142857143, |
|
"eval_QUANTITY_recall": 0.8333333333333334, |
|
"eval_TIME_f1": 0.8666666666666666, |
|
"eval_TIME_number": 29, |
|
"eval_TIME_precision": 0.8387096774193549, |
|
"eval_TIME_recall": 0.896551724137931, |
|
"eval_loss": 0.15942679345607758, |
|
"eval_overall_accuracy": 0.9641485275288092, |
|
"eval_overall_f1": 0.8307692307692308, |
|
"eval_overall_precision": 0.7877984084880637, |
|
"eval_overall_recall": 0.878698224852071, |
|
"eval_runtime": 0.2927, |
|
"eval_samples_per_second": 638.801, |
|
"eval_steps_per_second": 10.248, |
|
"step": 10282 |
|
}, |
|
{ |
|
"epoch": 98.0, |
|
"grad_norm": 2.652052402496338, |
|
"learning_rate": 1.0000000000000002e-06, |
|
"loss": 0.0329, |
|
"step": 10388 |
|
}, |
|
{ |
|
"epoch": 98.0, |
|
"eval_LOCATION_f1": 0.8767123287671235, |
|
"eval_LOCATION_number": 69, |
|
"eval_LOCATION_precision": 0.8311688311688312, |
|
"eval_LOCATION_recall": 0.927536231884058, |
|
"eval_ORGANIZATION_f1": 0.7343749999999999, |
|
"eval_ORGANIZATION_number": 58, |
|
"eval_ORGANIZATION_precision": 0.6714285714285714, |
|
"eval_ORGANIZATION_recall": 0.8103448275862069, |
|
"eval_PERSON_f1": 0.860759493670886, |
|
"eval_PERSON_number": 152, |
|
"eval_PERSON_precision": 0.8292682926829268, |
|
"eval_PERSON_recall": 0.8947368421052632, |
|
"eval_QUANTITY_f1": 0.7384615384615385, |
|
"eval_QUANTITY_number": 30, |
|
"eval_QUANTITY_precision": 0.6857142857142857, |
|
"eval_QUANTITY_recall": 0.8, |
|
"eval_TIME_f1": 0.8666666666666666, |
|
"eval_TIME_number": 29, |
|
"eval_TIME_precision": 0.8387096774193549, |
|
"eval_TIME_recall": 0.896551724137931, |
|
"eval_loss": 0.1578895002603531, |
|
"eval_overall_accuracy": 0.9638924455825865, |
|
"eval_overall_f1": 0.8307692307692308, |
|
"eval_overall_precision": 0.7877984084880637, |
|
"eval_overall_recall": 0.878698224852071, |
|
"eval_runtime": 0.2858, |
|
"eval_samples_per_second": 654.385, |
|
"eval_steps_per_second": 10.498, |
|
"step": 10388 |
|
}, |
|
{ |
|
"epoch": 99.0, |
|
"grad_norm": 1.3167122602462769, |
|
"learning_rate": 5.000000000000001e-07, |
|
"loss": 0.0321, |
|
"step": 10494 |
|
}, |
|
{ |
|
"epoch": 99.0, |
|
"eval_LOCATION_f1": 0.870748299319728, |
|
"eval_LOCATION_number": 69, |
|
"eval_LOCATION_precision": 0.8205128205128205, |
|
"eval_LOCATION_recall": 0.927536231884058, |
|
"eval_ORGANIZATION_f1": 0.75, |
|
"eval_ORGANIZATION_number": 58, |
|
"eval_ORGANIZATION_precision": 0.6857142857142857, |
|
"eval_ORGANIZATION_recall": 0.8275862068965517, |
|
"eval_PERSON_f1": 0.860759493670886, |
|
"eval_PERSON_number": 152, |
|
"eval_PERSON_precision": 0.8292682926829268, |
|
"eval_PERSON_recall": 0.8947368421052632, |
|
"eval_QUANTITY_f1": 0.7384615384615385, |
|
"eval_QUANTITY_number": 30, |
|
"eval_QUANTITY_precision": 0.6857142857142857, |
|
"eval_QUANTITY_recall": 0.8, |
|
"eval_TIME_f1": 0.8666666666666666, |
|
"eval_TIME_number": 29, |
|
"eval_TIME_precision": 0.8387096774193549, |
|
"eval_TIME_recall": 0.896551724137931, |
|
"eval_loss": 0.15904921293258667, |
|
"eval_overall_accuracy": 0.9641485275288092, |
|
"eval_overall_f1": 0.8324022346368716, |
|
"eval_overall_precision": 0.7883597883597884, |
|
"eval_overall_recall": 0.8816568047337278, |
|
"eval_runtime": 0.293, |
|
"eval_samples_per_second": 638.168, |
|
"eval_steps_per_second": 10.238, |
|
"step": 10494 |
|
}, |
|
{ |
|
"epoch": 100.0, |
|
"grad_norm": 0.26482483744621277, |
|
"learning_rate": 0.0, |
|
"loss": 0.0322, |
|
"step": 10600 |
|
}, |
|
{ |
|
"epoch": 100.0, |
|
"eval_LOCATION_f1": 0.870748299319728, |
|
"eval_LOCATION_number": 69, |
|
"eval_LOCATION_precision": 0.8205128205128205, |
|
"eval_LOCATION_recall": 0.927536231884058, |
|
"eval_ORGANIZATION_f1": 0.7343749999999999, |
|
"eval_ORGANIZATION_number": 58, |
|
"eval_ORGANIZATION_precision": 0.6714285714285714, |
|
"eval_ORGANIZATION_recall": 0.8103448275862069, |
|
"eval_PERSON_f1": 0.8580441640378549, |
|
"eval_PERSON_number": 152, |
|
"eval_PERSON_precision": 0.8242424242424242, |
|
"eval_PERSON_recall": 0.8947368421052632, |
|
"eval_QUANTITY_f1": 0.7384615384615385, |
|
"eval_QUANTITY_number": 30, |
|
"eval_QUANTITY_precision": 0.6857142857142857, |
|
"eval_QUANTITY_recall": 0.8, |
|
"eval_TIME_f1": 0.8666666666666666, |
|
"eval_TIME_number": 29, |
|
"eval_TIME_precision": 0.8387096774193549, |
|
"eval_TIME_recall": 0.896551724137931, |
|
"eval_loss": 0.1596968173980713, |
|
"eval_overall_accuracy": 0.9638924455825865, |
|
"eval_overall_f1": 0.8284518828451882, |
|
"eval_overall_precision": 0.783641160949868, |
|
"eval_overall_recall": 0.878698224852071, |
|
"eval_runtime": 0.2913, |
|
"eval_samples_per_second": 641.846, |
|
"eval_steps_per_second": 10.297, |
|
"step": 10600 |
|
}, |
|
{ |
|
"epoch": 100.0, |
|
"step": 10600, |
|
"total_flos": 4535639530574946.0, |
|
"train_loss": 0.08503569045156803, |
|
"train_runtime": 606.7172, |
|
"train_samples_per_second": 278.054, |
|
"train_steps_per_second": 17.471 |
|
} |
|
], |
|
"logging_steps": 500, |
|
"max_steps": 10600, |
|
"num_input_tokens_seen": 0, |
|
"num_train_epochs": 100, |
|
"save_steps": 500, |
|
"total_flos": 4535639530574946.0, |
|
"train_batch_size": 16, |
|
"trial_name": null, |
|
"trial_params": null |
|
} |
|
|