|
{ |
|
"best_metric": null, |
|
"best_model_checkpoint": null, |
|
"epoch": 100.0, |
|
"eval_steps": 500, |
|
"global_step": 10600, |
|
"is_hyper_param_search": false, |
|
"is_local_process_zero": true, |
|
"is_world_process_zero": true, |
|
"log_history": [ |
|
{ |
|
"epoch": 1.0, |
|
"grad_norm": 2.184743642807007, |
|
"learning_rate": 4.9500000000000004e-05, |
|
"loss": 0.9441, |
|
"step": 106 |
|
}, |
|
{ |
|
"epoch": 1.0, |
|
"eval_LOCATION_f1": 0.0, |
|
"eval_LOCATION_number": 71, |
|
"eval_LOCATION_precision": 0.0, |
|
"eval_LOCATION_recall": 0.0, |
|
"eval_ORGANIZATION_f1": 0.0, |
|
"eval_ORGANIZATION_number": 65, |
|
"eval_ORGANIZATION_precision": 0.0, |
|
"eval_ORGANIZATION_recall": 0.0, |
|
"eval_PERSON_f1": 0.013071895424836602, |
|
"eval_PERSON_number": 150, |
|
"eval_PERSON_precision": 0.3333333333333333, |
|
"eval_PERSON_recall": 0.006666666666666667, |
|
"eval_QUANTITY_f1": 0.0, |
|
"eval_QUANTITY_number": 33, |
|
"eval_QUANTITY_precision": 0.0, |
|
"eval_QUANTITY_recall": 0.0, |
|
"eval_TIME_f1": 0.0, |
|
"eval_TIME_number": 28, |
|
"eval_TIME_precision": 0.0, |
|
"eval_TIME_recall": 0.0, |
|
"eval_loss": 0.6184682846069336, |
|
"eval_overall_accuracy": 0.8414161008729389, |
|
"eval_overall_f1": 0.005714285714285714, |
|
"eval_overall_precision": 0.3333333333333333, |
|
"eval_overall_recall": 0.002881844380403458, |
|
"eval_runtime": 0.3392, |
|
"eval_samples_per_second": 551.333, |
|
"eval_steps_per_second": 8.845, |
|
"step": 106 |
|
}, |
|
{ |
|
"epoch": 2.0, |
|
"grad_norm": 1.0305746793746948, |
|
"learning_rate": 4.9e-05, |
|
"loss": 0.5645, |
|
"step": 212 |
|
}, |
|
{ |
|
"epoch": 2.0, |
|
"eval_LOCATION_f1": 0.22916666666666669, |
|
"eval_LOCATION_number": 71, |
|
"eval_LOCATION_precision": 0.44, |
|
"eval_LOCATION_recall": 0.15492957746478872, |
|
"eval_ORGANIZATION_f1": 0.04, |
|
"eval_ORGANIZATION_number": 65, |
|
"eval_ORGANIZATION_precision": 0.05714285714285714, |
|
"eval_ORGANIZATION_recall": 0.03076923076923077, |
|
"eval_PERSON_f1": 0.5449438202247192, |
|
"eval_PERSON_number": 150, |
|
"eval_PERSON_precision": 0.470873786407767, |
|
"eval_PERSON_recall": 0.6466666666666666, |
|
"eval_QUANTITY_f1": 0.0, |
|
"eval_QUANTITY_number": 33, |
|
"eval_QUANTITY_precision": 0.0, |
|
"eval_QUANTITY_recall": 0.0, |
|
"eval_TIME_f1": 0.43478260869565216, |
|
"eval_TIME_number": 28, |
|
"eval_TIME_precision": 0.5555555555555556, |
|
"eval_TIME_recall": 0.35714285714285715, |
|
"eval_loss": 0.41943466663360596, |
|
"eval_overall_accuracy": 0.8877303588748787, |
|
"eval_overall_f1": 0.3803486529318542, |
|
"eval_overall_precision": 0.4225352112676056, |
|
"eval_overall_recall": 0.345821325648415, |
|
"eval_runtime": 0.3288, |
|
"eval_samples_per_second": 568.708, |
|
"eval_steps_per_second": 9.124, |
|
"step": 212 |
|
}, |
|
{ |
|
"epoch": 3.0, |
|
"grad_norm": 1.2039958238601685, |
|
"learning_rate": 4.85e-05, |
|
"loss": 0.3968, |
|
"step": 318 |
|
}, |
|
{ |
|
"epoch": 3.0, |
|
"eval_LOCATION_f1": 0.5153374233128835, |
|
"eval_LOCATION_number": 71, |
|
"eval_LOCATION_precision": 0.45652173913043476, |
|
"eval_LOCATION_recall": 0.5915492957746479, |
|
"eval_ORGANIZATION_f1": 0.3278688524590164, |
|
"eval_ORGANIZATION_number": 65, |
|
"eval_ORGANIZATION_precision": 0.3508771929824561, |
|
"eval_ORGANIZATION_recall": 0.3076923076923077, |
|
"eval_PERSON_f1": 0.6829268292682927, |
|
"eval_PERSON_number": 150, |
|
"eval_PERSON_precision": 0.5753424657534246, |
|
"eval_PERSON_recall": 0.84, |
|
"eval_QUANTITY_f1": 0.1846153846153846, |
|
"eval_QUANTITY_number": 33, |
|
"eval_QUANTITY_precision": 0.1875, |
|
"eval_QUANTITY_recall": 0.18181818181818182, |
|
"eval_TIME_f1": 0.8076923076923077, |
|
"eval_TIME_number": 28, |
|
"eval_TIME_precision": 0.875, |
|
"eval_TIME_recall": 0.75, |
|
"eval_loss": 0.30941861867904663, |
|
"eval_overall_accuracy": 0.9202230843840931, |
|
"eval_overall_f1": 0.5577172503242542, |
|
"eval_overall_precision": 0.5070754716981132, |
|
"eval_overall_recall": 0.6195965417867435, |
|
"eval_runtime": 0.3381, |
|
"eval_samples_per_second": 553.069, |
|
"eval_steps_per_second": 8.873, |
|
"step": 318 |
|
}, |
|
{ |
|
"epoch": 4.0, |
|
"grad_norm": 4.7056145668029785, |
|
"learning_rate": 4.8e-05, |
|
"loss": 0.2937, |
|
"step": 424 |
|
}, |
|
{ |
|
"epoch": 4.0, |
|
"eval_LOCATION_f1": 0.5465116279069767, |
|
"eval_LOCATION_number": 71, |
|
"eval_LOCATION_precision": 0.46534653465346537, |
|
"eval_LOCATION_recall": 0.6619718309859155, |
|
"eval_ORGANIZATION_f1": 0.4878048780487805, |
|
"eval_ORGANIZATION_number": 65, |
|
"eval_ORGANIZATION_precision": 0.5172413793103449, |
|
"eval_ORGANIZATION_recall": 0.46153846153846156, |
|
"eval_PERSON_f1": 0.8036809815950918, |
|
"eval_PERSON_number": 150, |
|
"eval_PERSON_precision": 0.7443181818181818, |
|
"eval_PERSON_recall": 0.8733333333333333, |
|
"eval_QUANTITY_f1": 0.47368421052631576, |
|
"eval_QUANTITY_number": 33, |
|
"eval_QUANTITY_precision": 0.4186046511627907, |
|
"eval_QUANTITY_recall": 0.5454545454545454, |
|
"eval_TIME_f1": 0.8363636363636364, |
|
"eval_TIME_number": 28, |
|
"eval_TIME_precision": 0.8518518518518519, |
|
"eval_TIME_recall": 0.8214285714285714, |
|
"eval_loss": 0.2222605049610138, |
|
"eval_overall_accuracy": 0.9369544131910766, |
|
"eval_overall_f1": 0.6622340425531915, |
|
"eval_overall_precision": 0.6148148148148148, |
|
"eval_overall_recall": 0.7175792507204611, |
|
"eval_runtime": 0.3282, |
|
"eval_samples_per_second": 569.698, |
|
"eval_steps_per_second": 9.14, |
|
"step": 424 |
|
}, |
|
{ |
|
"epoch": 5.0, |
|
"grad_norm": 1.303191900253296, |
|
"learning_rate": 4.75e-05, |
|
"loss": 0.2294, |
|
"step": 530 |
|
}, |
|
{ |
|
"epoch": 5.0, |
|
"eval_LOCATION_f1": 0.6496815286624205, |
|
"eval_LOCATION_number": 71, |
|
"eval_LOCATION_precision": 0.5930232558139535, |
|
"eval_LOCATION_recall": 0.7183098591549296, |
|
"eval_ORGANIZATION_f1": 0.562962962962963, |
|
"eval_ORGANIZATION_number": 65, |
|
"eval_ORGANIZATION_precision": 0.5428571428571428, |
|
"eval_ORGANIZATION_recall": 0.5846153846153846, |
|
"eval_PERSON_f1": 0.8176100628930819, |
|
"eval_PERSON_number": 150, |
|
"eval_PERSON_precision": 0.7738095238095238, |
|
"eval_PERSON_recall": 0.8666666666666667, |
|
"eval_QUANTITY_f1": 0.5316455696202532, |
|
"eval_QUANTITY_number": 33, |
|
"eval_QUANTITY_precision": 0.45652173913043476, |
|
"eval_QUANTITY_recall": 0.6363636363636364, |
|
"eval_TIME_f1": 0.888888888888889, |
|
"eval_TIME_number": 28, |
|
"eval_TIME_precision": 0.9230769230769231, |
|
"eval_TIME_recall": 0.8571428571428571, |
|
"eval_loss": 0.18041133880615234, |
|
"eval_overall_accuracy": 0.9427740058195926, |
|
"eval_overall_f1": 0.7106325706594886, |
|
"eval_overall_precision": 0.6666666666666666, |
|
"eval_overall_recall": 0.760806916426513, |
|
"eval_runtime": 0.3291, |
|
"eval_samples_per_second": 568.165, |
|
"eval_steps_per_second": 9.115, |
|
"step": 530 |
|
}, |
|
{ |
|
"epoch": 6.0, |
|
"grad_norm": 1.6567788124084473, |
|
"learning_rate": 4.7e-05, |
|
"loss": 0.1955, |
|
"step": 636 |
|
}, |
|
{ |
|
"epoch": 6.0, |
|
"eval_LOCATION_f1": 0.7052023121387284, |
|
"eval_LOCATION_number": 71, |
|
"eval_LOCATION_precision": 0.5980392156862745, |
|
"eval_LOCATION_recall": 0.8591549295774648, |
|
"eval_ORGANIZATION_f1": 0.5903614457831325, |
|
"eval_ORGANIZATION_number": 65, |
|
"eval_ORGANIZATION_precision": 0.48514851485148514, |
|
"eval_ORGANIZATION_recall": 0.7538461538461538, |
|
"eval_PERSON_f1": 0.8109756097560976, |
|
"eval_PERSON_number": 150, |
|
"eval_PERSON_precision": 0.7471910112359551, |
|
"eval_PERSON_recall": 0.8866666666666667, |
|
"eval_QUANTITY_f1": 0.5517241379310345, |
|
"eval_QUANTITY_number": 33, |
|
"eval_QUANTITY_precision": 0.4444444444444444, |
|
"eval_QUANTITY_recall": 0.7272727272727273, |
|
"eval_TIME_f1": 0.793103448275862, |
|
"eval_TIME_number": 28, |
|
"eval_TIME_precision": 0.7666666666666667, |
|
"eval_TIME_recall": 0.8214285714285714, |
|
"eval_loss": 0.19565138220787048, |
|
"eval_overall_accuracy": 0.9396217264791464, |
|
"eval_overall_f1": 0.7142857142857143, |
|
"eval_overall_precision": 0.6236559139784946, |
|
"eval_overall_recall": 0.8357348703170029, |
|
"eval_runtime": 0.3291, |
|
"eval_samples_per_second": 568.21, |
|
"eval_steps_per_second": 9.116, |
|
"step": 636 |
|
}, |
|
{ |
|
"epoch": 7.0, |
|
"grad_norm": 2.8131422996520996, |
|
"learning_rate": 4.6500000000000005e-05, |
|
"loss": 0.1799, |
|
"step": 742 |
|
}, |
|
{ |
|
"epoch": 7.0, |
|
"eval_LOCATION_f1": 0.7374999999999999, |
|
"eval_LOCATION_number": 71, |
|
"eval_LOCATION_precision": 0.6629213483146067, |
|
"eval_LOCATION_recall": 0.8309859154929577, |
|
"eval_ORGANIZATION_f1": 0.6482758620689656, |
|
"eval_ORGANIZATION_number": 65, |
|
"eval_ORGANIZATION_precision": 0.5875, |
|
"eval_ORGANIZATION_recall": 0.7230769230769231, |
|
"eval_PERSON_f1": 0.81875, |
|
"eval_PERSON_number": 150, |
|
"eval_PERSON_precision": 0.7705882352941177, |
|
"eval_PERSON_recall": 0.8733333333333333, |
|
"eval_QUANTITY_f1": 0.6585365853658536, |
|
"eval_QUANTITY_number": 33, |
|
"eval_QUANTITY_precision": 0.5510204081632653, |
|
"eval_QUANTITY_recall": 0.8181818181818182, |
|
"eval_TIME_f1": 0.8275862068965518, |
|
"eval_TIME_number": 28, |
|
"eval_TIME_precision": 0.8, |
|
"eval_TIME_recall": 0.8571428571428571, |
|
"eval_loss": 0.16057299077510834, |
|
"eval_overall_accuracy": 0.9468962172647915, |
|
"eval_overall_f1": 0.7529411764705883, |
|
"eval_overall_precision": 0.6889952153110048, |
|
"eval_overall_recall": 0.829971181556196, |
|
"eval_runtime": 0.3295, |
|
"eval_samples_per_second": 567.569, |
|
"eval_steps_per_second": 9.105, |
|
"step": 742 |
|
}, |
|
{ |
|
"epoch": 8.0, |
|
"grad_norm": 0.7265537977218628, |
|
"learning_rate": 4.600000000000001e-05, |
|
"loss": 0.1628, |
|
"step": 848 |
|
}, |
|
{ |
|
"epoch": 8.0, |
|
"eval_LOCATION_f1": 0.7349397590361445, |
|
"eval_LOCATION_number": 71, |
|
"eval_LOCATION_precision": 0.6421052631578947, |
|
"eval_LOCATION_recall": 0.8591549295774648, |
|
"eval_ORGANIZATION_f1": 0.6451612903225806, |
|
"eval_ORGANIZATION_number": 65, |
|
"eval_ORGANIZATION_precision": 0.5555555555555556, |
|
"eval_ORGANIZATION_recall": 0.7692307692307693, |
|
"eval_PERSON_f1": 0.8275862068965518, |
|
"eval_PERSON_number": 150, |
|
"eval_PERSON_precision": 0.7810650887573964, |
|
"eval_PERSON_recall": 0.88, |
|
"eval_QUANTITY_f1": 0.6923076923076923, |
|
"eval_QUANTITY_number": 33, |
|
"eval_QUANTITY_precision": 0.6, |
|
"eval_QUANTITY_recall": 0.8181818181818182, |
|
"eval_TIME_f1": 0.8421052631578947, |
|
"eval_TIME_number": 28, |
|
"eval_TIME_precision": 0.8275862068965517, |
|
"eval_TIME_recall": 0.8571428571428571, |
|
"eval_loss": 0.15270720422267914, |
|
"eval_overall_accuracy": 0.9510184287099903, |
|
"eval_overall_f1": 0.7587096774193549, |
|
"eval_overall_precision": 0.6869158878504673, |
|
"eval_overall_recall": 0.8472622478386167, |
|
"eval_runtime": 0.3291, |
|
"eval_samples_per_second": 568.147, |
|
"eval_steps_per_second": 9.115, |
|
"step": 848 |
|
}, |
|
{ |
|
"epoch": 9.0, |
|
"grad_norm": 1.15663743019104, |
|
"learning_rate": 4.55e-05, |
|
"loss": 0.1528, |
|
"step": 954 |
|
}, |
|
{ |
|
"epoch": 9.0, |
|
"eval_LOCATION_f1": 0.7564102564102564, |
|
"eval_LOCATION_number": 71, |
|
"eval_LOCATION_precision": 0.6941176470588235, |
|
"eval_LOCATION_recall": 0.8309859154929577, |
|
"eval_ORGANIZATION_f1": 0.6351351351351351, |
|
"eval_ORGANIZATION_number": 65, |
|
"eval_ORGANIZATION_precision": 0.5662650602409639, |
|
"eval_ORGANIZATION_recall": 0.7230769230769231, |
|
"eval_PERSON_f1": 0.8397435897435898, |
|
"eval_PERSON_number": 150, |
|
"eval_PERSON_precision": 0.808641975308642, |
|
"eval_PERSON_recall": 0.8733333333333333, |
|
"eval_QUANTITY_f1": 0.7200000000000001, |
|
"eval_QUANTITY_number": 33, |
|
"eval_QUANTITY_precision": 0.6428571428571429, |
|
"eval_QUANTITY_recall": 0.8181818181818182, |
|
"eval_TIME_f1": 0.8771929824561403, |
|
"eval_TIME_number": 28, |
|
"eval_TIME_precision": 0.8620689655172413, |
|
"eval_TIME_recall": 0.8928571428571429, |
|
"eval_loss": 0.14164027571678162, |
|
"eval_overall_accuracy": 0.9522308438409312, |
|
"eval_overall_f1": 0.7727272727272728, |
|
"eval_overall_precision": 0.7206982543640897, |
|
"eval_overall_recall": 0.8328530259365994, |
|
"eval_runtime": 0.3351, |
|
"eval_samples_per_second": 558.073, |
|
"eval_steps_per_second": 8.953, |
|
"step": 954 |
|
}, |
|
{ |
|
"epoch": 10.0, |
|
"grad_norm": 1.8798385858535767, |
|
"learning_rate": 4.5e-05, |
|
"loss": 0.1466, |
|
"step": 1060 |
|
}, |
|
{ |
|
"epoch": 10.0, |
|
"eval_LOCATION_f1": 0.7307692307692307, |
|
"eval_LOCATION_number": 71, |
|
"eval_LOCATION_precision": 0.6705882352941176, |
|
"eval_LOCATION_recall": 0.8028169014084507, |
|
"eval_ORGANIZATION_f1": 0.625, |
|
"eval_ORGANIZATION_number": 65, |
|
"eval_ORGANIZATION_precision": 0.569620253164557, |
|
"eval_ORGANIZATION_recall": 0.6923076923076923, |
|
"eval_PERSON_f1": 0.8387096774193549, |
|
"eval_PERSON_number": 150, |
|
"eval_PERSON_precision": 0.8125, |
|
"eval_PERSON_recall": 0.8666666666666667, |
|
"eval_QUANTITY_f1": 0.736842105263158, |
|
"eval_QUANTITY_number": 33, |
|
"eval_QUANTITY_precision": 0.6511627906976745, |
|
"eval_QUANTITY_recall": 0.8484848484848485, |
|
"eval_TIME_f1": 0.8620689655172413, |
|
"eval_TIME_number": 28, |
|
"eval_TIME_precision": 0.8333333333333334, |
|
"eval_TIME_recall": 0.8928571428571429, |
|
"eval_loss": 0.14073340594768524, |
|
"eval_overall_accuracy": 0.9522308438409312, |
|
"eval_overall_f1": 0.7661290322580645, |
|
"eval_overall_precision": 0.7178841309823678, |
|
"eval_overall_recall": 0.8213256484149856, |
|
"eval_runtime": 0.3345, |
|
"eval_samples_per_second": 559.032, |
|
"eval_steps_per_second": 8.968, |
|
"step": 1060 |
|
}, |
|
{ |
|
"epoch": 11.0, |
|
"grad_norm": 0.9395531415939331, |
|
"learning_rate": 4.4500000000000004e-05, |
|
"loss": 0.138, |
|
"step": 1166 |
|
}, |
|
{ |
|
"epoch": 11.0, |
|
"eval_LOCATION_f1": 0.775, |
|
"eval_LOCATION_number": 71, |
|
"eval_LOCATION_precision": 0.6966292134831461, |
|
"eval_LOCATION_recall": 0.8732394366197183, |
|
"eval_ORGANIZATION_f1": 0.6666666666666666, |
|
"eval_ORGANIZATION_number": 65, |
|
"eval_ORGANIZATION_precision": 0.5975609756097561, |
|
"eval_ORGANIZATION_recall": 0.7538461538461538, |
|
"eval_PERSON_f1": 0.8360128617363344, |
|
"eval_PERSON_number": 150, |
|
"eval_PERSON_precision": 0.8074534161490683, |
|
"eval_PERSON_recall": 0.8666666666666667, |
|
"eval_QUANTITY_f1": 0.736842105263158, |
|
"eval_QUANTITY_number": 33, |
|
"eval_QUANTITY_precision": 0.6511627906976745, |
|
"eval_QUANTITY_recall": 0.8484848484848485, |
|
"eval_TIME_f1": 0.8620689655172413, |
|
"eval_TIME_number": 28, |
|
"eval_TIME_precision": 0.8333333333333334, |
|
"eval_TIME_recall": 0.8928571428571429, |
|
"eval_loss": 0.14058995246887207, |
|
"eval_overall_accuracy": 0.9536857419980601, |
|
"eval_overall_f1": 0.7819148936170213, |
|
"eval_overall_precision": 0.725925925925926, |
|
"eval_overall_recall": 0.8472622478386167, |
|
"eval_runtime": 0.3303, |
|
"eval_samples_per_second": 566.135, |
|
"eval_steps_per_second": 9.082, |
|
"step": 1166 |
|
}, |
|
{ |
|
"epoch": 12.0, |
|
"grad_norm": 1.2153416872024536, |
|
"learning_rate": 4.4000000000000006e-05, |
|
"loss": 0.1314, |
|
"step": 1272 |
|
}, |
|
{ |
|
"epoch": 12.0, |
|
"eval_LOCATION_f1": 0.775, |
|
"eval_LOCATION_number": 71, |
|
"eval_LOCATION_precision": 0.6966292134831461, |
|
"eval_LOCATION_recall": 0.8732394366197183, |
|
"eval_ORGANIZATION_f1": 0.6578947368421053, |
|
"eval_ORGANIZATION_number": 65, |
|
"eval_ORGANIZATION_precision": 0.5747126436781609, |
|
"eval_ORGANIZATION_recall": 0.7692307692307693, |
|
"eval_PERSON_f1": 0.8407643312101911, |
|
"eval_PERSON_number": 150, |
|
"eval_PERSON_precision": 0.8048780487804879, |
|
"eval_PERSON_recall": 0.88, |
|
"eval_QUANTITY_f1": 0.736842105263158, |
|
"eval_QUANTITY_number": 33, |
|
"eval_QUANTITY_precision": 0.6511627906976745, |
|
"eval_QUANTITY_recall": 0.8484848484848485, |
|
"eval_TIME_f1": 0.7999999999999999, |
|
"eval_TIME_number": 28, |
|
"eval_TIME_precision": 0.75, |
|
"eval_TIME_recall": 0.8571428571428571, |
|
"eval_loss": 0.14196860790252686, |
|
"eval_overall_accuracy": 0.953443258971872, |
|
"eval_overall_f1": 0.7769028871391075, |
|
"eval_overall_precision": 0.7132530120481928, |
|
"eval_overall_recall": 0.8530259365994236, |
|
"eval_runtime": 0.3295, |
|
"eval_samples_per_second": 567.586, |
|
"eval_steps_per_second": 9.106, |
|
"step": 1272 |
|
}, |
|
{ |
|
"epoch": 13.0, |
|
"grad_norm": 0.6423377990722656, |
|
"learning_rate": 4.35e-05, |
|
"loss": 0.1285, |
|
"step": 1378 |
|
}, |
|
{ |
|
"epoch": 13.0, |
|
"eval_LOCATION_f1": 0.7261146496815286, |
|
"eval_LOCATION_number": 71, |
|
"eval_LOCATION_precision": 0.6627906976744186, |
|
"eval_LOCATION_recall": 0.8028169014084507, |
|
"eval_ORGANIZATION_f1": 0.6493506493506495, |
|
"eval_ORGANIZATION_number": 65, |
|
"eval_ORGANIZATION_precision": 0.5617977528089888, |
|
"eval_ORGANIZATION_recall": 0.7692307692307693, |
|
"eval_PERSON_f1": 0.8461538461538461, |
|
"eval_PERSON_number": 150, |
|
"eval_PERSON_precision": 0.8148148148148148, |
|
"eval_PERSON_recall": 0.88, |
|
"eval_QUANTITY_f1": 0.7466666666666666, |
|
"eval_QUANTITY_number": 33, |
|
"eval_QUANTITY_precision": 0.6666666666666666, |
|
"eval_QUANTITY_recall": 0.8484848484848485, |
|
"eval_TIME_f1": 0.9090909090909091, |
|
"eval_TIME_number": 28, |
|
"eval_TIME_precision": 0.9259259259259259, |
|
"eval_TIME_recall": 0.8928571428571429, |
|
"eval_loss": 0.13416315615177155, |
|
"eval_overall_accuracy": 0.954898157129001, |
|
"eval_overall_f1": 0.7755644090305446, |
|
"eval_overall_precision": 0.7192118226600985, |
|
"eval_overall_recall": 0.8414985590778098, |
|
"eval_runtime": 0.3353, |
|
"eval_samples_per_second": 557.743, |
|
"eval_steps_per_second": 8.948, |
|
"step": 1378 |
|
}, |
|
{ |
|
"epoch": 14.0, |
|
"grad_norm": 3.325246572494507, |
|
"learning_rate": 4.3e-05, |
|
"loss": 0.1301, |
|
"step": 1484 |
|
}, |
|
{ |
|
"epoch": 14.0, |
|
"eval_LOCATION_f1": 0.7792207792207793, |
|
"eval_LOCATION_number": 71, |
|
"eval_LOCATION_precision": 0.7228915662650602, |
|
"eval_LOCATION_recall": 0.8450704225352113, |
|
"eval_ORGANIZATION_f1": 0.5915492957746479, |
|
"eval_ORGANIZATION_number": 65, |
|
"eval_ORGANIZATION_precision": 0.5454545454545454, |
|
"eval_ORGANIZATION_recall": 0.6461538461538462, |
|
"eval_PERSON_f1": 0.8488745980707395, |
|
"eval_PERSON_number": 150, |
|
"eval_PERSON_precision": 0.8198757763975155, |
|
"eval_PERSON_recall": 0.88, |
|
"eval_QUANTITY_f1": 0.7777777777777778, |
|
"eval_QUANTITY_number": 33, |
|
"eval_QUANTITY_precision": 0.717948717948718, |
|
"eval_QUANTITY_recall": 0.8484848484848485, |
|
"eval_TIME_f1": 0.8620689655172413, |
|
"eval_TIME_number": 28, |
|
"eval_TIME_precision": 0.8333333333333334, |
|
"eval_TIME_recall": 0.8928571428571429, |
|
"eval_loss": 0.12784981727600098, |
|
"eval_overall_accuracy": 0.95635305528613, |
|
"eval_overall_f1": 0.778833107191316, |
|
"eval_overall_precision": 0.735897435897436, |
|
"eval_overall_recall": 0.8270893371757925, |
|
"eval_runtime": 0.3291, |
|
"eval_samples_per_second": 568.237, |
|
"eval_steps_per_second": 9.116, |
|
"step": 1484 |
|
}, |
|
{ |
|
"epoch": 15.0, |
|
"grad_norm": 1.1983723640441895, |
|
"learning_rate": 4.25e-05, |
|
"loss": 0.1197, |
|
"step": 1590 |
|
}, |
|
{ |
|
"epoch": 15.0, |
|
"eval_LOCATION_f1": 0.779874213836478, |
|
"eval_LOCATION_number": 71, |
|
"eval_LOCATION_precision": 0.7045454545454546, |
|
"eval_LOCATION_recall": 0.8732394366197183, |
|
"eval_ORGANIZATION_f1": 0.7012987012987013, |
|
"eval_ORGANIZATION_number": 65, |
|
"eval_ORGANIZATION_precision": 0.6067415730337079, |
|
"eval_ORGANIZATION_recall": 0.8307692307692308, |
|
"eval_PERSON_f1": 0.8471337579617835, |
|
"eval_PERSON_number": 150, |
|
"eval_PERSON_precision": 0.8109756097560976, |
|
"eval_PERSON_recall": 0.8866666666666667, |
|
"eval_QUANTITY_f1": 0.7012987012987013, |
|
"eval_QUANTITY_number": 33, |
|
"eval_QUANTITY_precision": 0.6136363636363636, |
|
"eval_QUANTITY_recall": 0.8181818181818182, |
|
"eval_TIME_f1": 0.8275862068965518, |
|
"eval_TIME_number": 28, |
|
"eval_TIME_precision": 0.8, |
|
"eval_TIME_recall": 0.8571428571428571, |
|
"eval_loss": 0.1395217925310135, |
|
"eval_overall_accuracy": 0.9539282250242483, |
|
"eval_overall_f1": 0.7874015748031495, |
|
"eval_overall_precision": 0.7228915662650602, |
|
"eval_overall_recall": 0.8645533141210374, |
|
"eval_runtime": 0.3284, |
|
"eval_samples_per_second": 569.403, |
|
"eval_steps_per_second": 9.135, |
|
"step": 1590 |
|
}, |
|
{ |
|
"epoch": 16.0, |
|
"grad_norm": 2.9908885955810547, |
|
"learning_rate": 4.2e-05, |
|
"loss": 0.1147, |
|
"step": 1696 |
|
}, |
|
{ |
|
"epoch": 16.0, |
|
"eval_LOCATION_f1": 0.8, |
|
"eval_LOCATION_number": 71, |
|
"eval_LOCATION_precision": 0.7380952380952381, |
|
"eval_LOCATION_recall": 0.8732394366197183, |
|
"eval_ORGANIZATION_f1": 0.6853146853146853, |
|
"eval_ORGANIZATION_number": 65, |
|
"eval_ORGANIZATION_precision": 0.6282051282051282, |
|
"eval_ORGANIZATION_recall": 0.7538461538461538, |
|
"eval_PERSON_f1": 0.8461538461538461, |
|
"eval_PERSON_number": 150, |
|
"eval_PERSON_precision": 0.8148148148148148, |
|
"eval_PERSON_recall": 0.88, |
|
"eval_QUANTITY_f1": 0.7088607594936709, |
|
"eval_QUANTITY_number": 33, |
|
"eval_QUANTITY_precision": 0.6086956521739131, |
|
"eval_QUANTITY_recall": 0.8484848484848485, |
|
"eval_TIME_f1": 0.7999999999999999, |
|
"eval_TIME_number": 28, |
|
"eval_TIME_precision": 0.75, |
|
"eval_TIME_recall": 0.8571428571428571, |
|
"eval_loss": 0.13548891246318817, |
|
"eval_overall_accuracy": 0.9556256062075654, |
|
"eval_overall_f1": 0.787716955941255, |
|
"eval_overall_precision": 0.7338308457711443, |
|
"eval_overall_recall": 0.8501440922190202, |
|
"eval_runtime": 0.3343, |
|
"eval_samples_per_second": 559.383, |
|
"eval_steps_per_second": 8.974, |
|
"step": 1696 |
|
}, |
|
{ |
|
"epoch": 17.0, |
|
"grad_norm": 0.7757030129432678, |
|
"learning_rate": 4.15e-05, |
|
"loss": 0.1134, |
|
"step": 1802 |
|
}, |
|
{ |
|
"epoch": 17.0, |
|
"eval_LOCATION_f1": 0.7922077922077921, |
|
"eval_LOCATION_number": 71, |
|
"eval_LOCATION_precision": 0.7349397590361446, |
|
"eval_LOCATION_recall": 0.8591549295774648, |
|
"eval_ORGANIZATION_f1": 0.6618705035971223, |
|
"eval_ORGANIZATION_number": 65, |
|
"eval_ORGANIZATION_precision": 0.6216216216216216, |
|
"eval_ORGANIZATION_recall": 0.7076923076923077, |
|
"eval_PERSON_f1": 0.8498402555910542, |
|
"eval_PERSON_number": 150, |
|
"eval_PERSON_precision": 0.8159509202453987, |
|
"eval_PERSON_recall": 0.8866666666666667, |
|
"eval_QUANTITY_f1": 0.7105263157894738, |
|
"eval_QUANTITY_number": 33, |
|
"eval_QUANTITY_precision": 0.627906976744186, |
|
"eval_QUANTITY_recall": 0.8181818181818182, |
|
"eval_TIME_f1": 0.8421052631578947, |
|
"eval_TIME_number": 28, |
|
"eval_TIME_precision": 0.8275862068965517, |
|
"eval_TIME_recall": 0.8571428571428571, |
|
"eval_loss": 0.12935349345207214, |
|
"eval_overall_accuracy": 0.95635305528613, |
|
"eval_overall_f1": 0.7875507442489851, |
|
"eval_overall_precision": 0.7423469387755102, |
|
"eval_overall_recall": 0.8386167146974063, |
|
"eval_runtime": 0.3301, |
|
"eval_samples_per_second": 566.53, |
|
"eval_steps_per_second": 9.089, |
|
"step": 1802 |
|
}, |
|
{ |
|
"epoch": 18.0, |
|
"grad_norm": 1.1819586753845215, |
|
"learning_rate": 4.1e-05, |
|
"loss": 0.1103, |
|
"step": 1908 |
|
}, |
|
{ |
|
"epoch": 18.0, |
|
"eval_LOCATION_f1": 0.8, |
|
"eval_LOCATION_number": 71, |
|
"eval_LOCATION_precision": 0.7380952380952381, |
|
"eval_LOCATION_recall": 0.8732394366197183, |
|
"eval_ORGANIZATION_f1": 0.7162162162162162, |
|
"eval_ORGANIZATION_number": 65, |
|
"eval_ORGANIZATION_precision": 0.6385542168674698, |
|
"eval_ORGANIZATION_recall": 0.8153846153846154, |
|
"eval_PERSON_f1": 0.8507936507936508, |
|
"eval_PERSON_number": 150, |
|
"eval_PERSON_precision": 0.8121212121212121, |
|
"eval_PERSON_recall": 0.8933333333333333, |
|
"eval_QUANTITY_f1": 0.736842105263158, |
|
"eval_QUANTITY_number": 33, |
|
"eval_QUANTITY_precision": 0.6511627906976745, |
|
"eval_QUANTITY_recall": 0.8484848484848485, |
|
"eval_TIME_f1": 0.8421052631578947, |
|
"eval_TIME_number": 28, |
|
"eval_TIME_precision": 0.8275862068965517, |
|
"eval_TIME_recall": 0.8571428571428571, |
|
"eval_loss": 0.13496747612953186, |
|
"eval_overall_accuracy": 0.9568380213385063, |
|
"eval_overall_f1": 0.8015978695073236, |
|
"eval_overall_precision": 0.745049504950495, |
|
"eval_overall_recall": 0.8674351585014409, |
|
"eval_runtime": 0.3289, |
|
"eval_samples_per_second": 568.537, |
|
"eval_steps_per_second": 9.121, |
|
"step": 1908 |
|
}, |
|
{ |
|
"epoch": 19.0, |
|
"grad_norm": 1.253257393836975, |
|
"learning_rate": 4.05e-05, |
|
"loss": 0.1078, |
|
"step": 2014 |
|
}, |
|
{ |
|
"epoch": 19.0, |
|
"eval_LOCATION_f1": 0.7973856209150327, |
|
"eval_LOCATION_number": 71, |
|
"eval_LOCATION_precision": 0.7439024390243902, |
|
"eval_LOCATION_recall": 0.8591549295774648, |
|
"eval_ORGANIZATION_f1": 0.7162162162162162, |
|
"eval_ORGANIZATION_number": 65, |
|
"eval_ORGANIZATION_precision": 0.6385542168674698, |
|
"eval_ORGANIZATION_recall": 0.8153846153846154, |
|
"eval_PERSON_f1": 0.8498402555910542, |
|
"eval_PERSON_number": 150, |
|
"eval_PERSON_precision": 0.8159509202453987, |
|
"eval_PERSON_recall": 0.8866666666666667, |
|
"eval_QUANTITY_f1": 0.7200000000000001, |
|
"eval_QUANTITY_number": 33, |
|
"eval_QUANTITY_precision": 0.6428571428571429, |
|
"eval_QUANTITY_recall": 0.8181818181818182, |
|
"eval_TIME_f1": 0.8571428571428571, |
|
"eval_TIME_number": 28, |
|
"eval_TIME_precision": 0.8571428571428571, |
|
"eval_TIME_recall": 0.8571428571428571, |
|
"eval_loss": 0.13079425692558289, |
|
"eval_overall_accuracy": 0.957807953443259, |
|
"eval_overall_f1": 0.7999999999999999, |
|
"eval_overall_precision": 0.7487437185929648, |
|
"eval_overall_recall": 0.8587896253602305, |
|
"eval_runtime": 0.3341, |
|
"eval_samples_per_second": 559.714, |
|
"eval_steps_per_second": 8.979, |
|
"step": 2014 |
|
}, |
|
{ |
|
"epoch": 20.0, |
|
"grad_norm": 1.522292137145996, |
|
"learning_rate": 4e-05, |
|
"loss": 0.1051, |
|
"step": 2120 |
|
}, |
|
{ |
|
"epoch": 20.0, |
|
"eval_LOCATION_f1": 0.7948717948717949, |
|
"eval_LOCATION_number": 71, |
|
"eval_LOCATION_precision": 0.7294117647058823, |
|
"eval_LOCATION_recall": 0.8732394366197183, |
|
"eval_ORGANIZATION_f1": 0.6814814814814816, |
|
"eval_ORGANIZATION_number": 65, |
|
"eval_ORGANIZATION_precision": 0.6571428571428571, |
|
"eval_ORGANIZATION_recall": 0.7076923076923077, |
|
"eval_PERSON_f1": 0.858974358974359, |
|
"eval_PERSON_number": 150, |
|
"eval_PERSON_precision": 0.8271604938271605, |
|
"eval_PERSON_recall": 0.8933333333333333, |
|
"eval_QUANTITY_f1": 0.7777777777777778, |
|
"eval_QUANTITY_number": 33, |
|
"eval_QUANTITY_precision": 0.717948717948718, |
|
"eval_QUANTITY_recall": 0.8484848484848485, |
|
"eval_TIME_f1": 0.8727272727272727, |
|
"eval_TIME_number": 28, |
|
"eval_TIME_precision": 0.8888888888888888, |
|
"eval_TIME_recall": 0.8571428571428571, |
|
"eval_loss": 0.12830358743667603, |
|
"eval_overall_accuracy": 0.9587778855480117, |
|
"eval_overall_f1": 0.8054794520547945, |
|
"eval_overall_precision": 0.7676240208877284, |
|
"eval_overall_recall": 0.8472622478386167, |
|
"eval_runtime": 0.3284, |
|
"eval_samples_per_second": 569.369, |
|
"eval_steps_per_second": 9.134, |
|
"step": 2120 |
|
}, |
|
{ |
|
"epoch": 21.0, |
|
"grad_norm": 1.3046311140060425, |
|
"learning_rate": 3.9500000000000005e-05, |
|
"loss": 0.1013, |
|
"step": 2226 |
|
}, |
|
{ |
|
"epoch": 21.0, |
|
"eval_LOCATION_f1": 0.8, |
|
"eval_LOCATION_number": 71, |
|
"eval_LOCATION_precision": 0.7380952380952381, |
|
"eval_LOCATION_recall": 0.8732394366197183, |
|
"eval_ORGANIZATION_f1": 0.7210884353741497, |
|
"eval_ORGANIZATION_number": 65, |
|
"eval_ORGANIZATION_precision": 0.6463414634146342, |
|
"eval_ORGANIZATION_recall": 0.8153846153846154, |
|
"eval_PERSON_f1": 0.8507936507936508, |
|
"eval_PERSON_number": 150, |
|
"eval_PERSON_precision": 0.8121212121212121, |
|
"eval_PERSON_recall": 0.8933333333333333, |
|
"eval_QUANTITY_f1": 0.736842105263158, |
|
"eval_QUANTITY_number": 33, |
|
"eval_QUANTITY_precision": 0.6511627906976745, |
|
"eval_QUANTITY_recall": 0.8484848484848485, |
|
"eval_TIME_f1": 0.8727272727272727, |
|
"eval_TIME_number": 28, |
|
"eval_TIME_precision": 0.8888888888888888, |
|
"eval_TIME_recall": 0.8571428571428571, |
|
"eval_loss": 0.1330733597278595, |
|
"eval_overall_accuracy": 0.9585354025218235, |
|
"eval_overall_f1": 0.8048128342245989, |
|
"eval_overall_precision": 0.7506234413965087, |
|
"eval_overall_recall": 0.8674351585014409, |
|
"eval_runtime": 0.335, |
|
"eval_samples_per_second": 558.137, |
|
"eval_steps_per_second": 8.954, |
|
"step": 2226 |
|
}, |
|
{ |
|
"epoch": 22.0, |
|
"grad_norm": 1.648231863975525, |
|
"learning_rate": 3.9000000000000006e-05, |
|
"loss": 0.1015, |
|
"step": 2332 |
|
}, |
|
{ |
|
"epoch": 22.0, |
|
"eval_LOCATION_f1": 0.7625, |
|
"eval_LOCATION_number": 71, |
|
"eval_LOCATION_precision": 0.6853932584269663, |
|
"eval_LOCATION_recall": 0.8591549295774648, |
|
"eval_ORGANIZATION_f1": 0.7044025157232704, |
|
"eval_ORGANIZATION_number": 65, |
|
"eval_ORGANIZATION_precision": 0.5957446808510638, |
|
"eval_ORGANIZATION_recall": 0.8615384615384616, |
|
"eval_PERSON_f1": 0.8481012658227848, |
|
"eval_PERSON_number": 150, |
|
"eval_PERSON_precision": 0.8072289156626506, |
|
"eval_PERSON_recall": 0.8933333333333333, |
|
"eval_QUANTITY_f1": 0.736842105263158, |
|
"eval_QUANTITY_number": 33, |
|
"eval_QUANTITY_precision": 0.6511627906976745, |
|
"eval_QUANTITY_recall": 0.8484848484848485, |
|
"eval_TIME_f1": 0.8571428571428571, |
|
"eval_TIME_number": 28, |
|
"eval_TIME_precision": 0.8571428571428571, |
|
"eval_TIME_recall": 0.8571428571428571, |
|
"eval_loss": 0.1461816430091858, |
|
"eval_overall_accuracy": 0.9529582929194956, |
|
"eval_overall_f1": 0.7900912646675358, |
|
"eval_overall_precision": 0.7214285714285714, |
|
"eval_overall_recall": 0.8731988472622478, |
|
"eval_runtime": 0.3294, |
|
"eval_samples_per_second": 567.654, |
|
"eval_steps_per_second": 9.107, |
|
"step": 2332 |
|
}, |
|
{ |
|
"epoch": 23.0, |
|
"grad_norm": 1.236881136894226, |
|
"learning_rate": 3.85e-05, |
|
"loss": 0.0952, |
|
"step": 2438 |
|
}, |
|
{ |
|
"epoch": 23.0, |
|
"eval_LOCATION_f1": 0.8157894736842104, |
|
"eval_LOCATION_number": 71, |
|
"eval_LOCATION_precision": 0.7654320987654321, |
|
"eval_LOCATION_recall": 0.8732394366197183, |
|
"eval_ORGANIZATION_f1": 0.7375886524822695, |
|
"eval_ORGANIZATION_number": 65, |
|
"eval_ORGANIZATION_precision": 0.6842105263157895, |
|
"eval_ORGANIZATION_recall": 0.8, |
|
"eval_PERSON_f1": 0.8525641025641025, |
|
"eval_PERSON_number": 150, |
|
"eval_PERSON_precision": 0.8209876543209876, |
|
"eval_PERSON_recall": 0.8866666666666667, |
|
"eval_QUANTITY_f1": 0.7777777777777778, |
|
"eval_QUANTITY_number": 33, |
|
"eval_QUANTITY_precision": 0.717948717948718, |
|
"eval_QUANTITY_recall": 0.8484848484848485, |
|
"eval_TIME_f1": 0.888888888888889, |
|
"eval_TIME_number": 28, |
|
"eval_TIME_precision": 0.9230769230769231, |
|
"eval_TIME_recall": 0.8571428571428571, |
|
"eval_loss": 0.12616348266601562, |
|
"eval_overall_accuracy": 0.9612027158098934, |
|
"eval_overall_f1": 0.8180574555403557, |
|
"eval_overall_precision": 0.7786458333333334, |
|
"eval_overall_recall": 0.861671469740634, |
|
"eval_runtime": 0.3359, |
|
"eval_samples_per_second": 556.671, |
|
"eval_steps_per_second": 8.931, |
|
"step": 2438 |
|
}, |
|
{ |
|
"epoch": 24.0, |
|
"grad_norm": 1.727121353149414, |
|
"learning_rate": 3.8e-05, |
|
"loss": 0.0957, |
|
"step": 2544 |
|
}, |
|
{ |
|
"epoch": 24.0, |
|
"eval_LOCATION_f1": 0.7870967741935485, |
|
"eval_LOCATION_number": 71, |
|
"eval_LOCATION_precision": 0.7261904761904762, |
|
"eval_LOCATION_recall": 0.8591549295774648, |
|
"eval_ORGANIZATION_f1": 0.7105263157894737, |
|
"eval_ORGANIZATION_number": 65, |
|
"eval_ORGANIZATION_precision": 0.6206896551724138, |
|
"eval_ORGANIZATION_recall": 0.8307692307692308, |
|
"eval_PERSON_f1": 0.8454258675078864, |
|
"eval_PERSON_number": 150, |
|
"eval_PERSON_precision": 0.8023952095808383, |
|
"eval_PERSON_recall": 0.8933333333333333, |
|
"eval_QUANTITY_f1": 0.736842105263158, |
|
"eval_QUANTITY_number": 33, |
|
"eval_QUANTITY_precision": 0.6511627906976745, |
|
"eval_QUANTITY_recall": 0.8484848484848485, |
|
"eval_TIME_f1": 0.8571428571428571, |
|
"eval_TIME_number": 28, |
|
"eval_TIME_precision": 0.8571428571428571, |
|
"eval_TIME_recall": 0.8571428571428571, |
|
"eval_loss": 0.14105214178562164, |
|
"eval_overall_accuracy": 0.9556256062075654, |
|
"eval_overall_f1": 0.7962962962962963, |
|
"eval_overall_precision": 0.7359413202933985, |
|
"eval_overall_recall": 0.8674351585014409, |
|
"eval_runtime": 0.3291, |
|
"eval_samples_per_second": 568.152, |
|
"eval_steps_per_second": 9.115, |
|
"step": 2544 |
|
}, |
|
{ |
|
"epoch": 25.0, |
|
"grad_norm": 1.6316332817077637, |
|
"learning_rate": 3.7500000000000003e-05, |
|
"loss": 0.0913, |
|
"step": 2650 |
|
}, |
|
{ |
|
"epoch": 25.0, |
|
"eval_LOCATION_f1": 0.8104575163398693, |
|
"eval_LOCATION_number": 71, |
|
"eval_LOCATION_precision": 0.7560975609756098, |
|
"eval_LOCATION_recall": 0.8732394366197183, |
|
"eval_ORGANIZATION_f1": 0.7534246575342466, |
|
"eval_ORGANIZATION_number": 65, |
|
"eval_ORGANIZATION_precision": 0.6790123456790124, |
|
"eval_ORGANIZATION_recall": 0.8461538461538461, |
|
"eval_PERSON_f1": 0.8544303797468354, |
|
"eval_PERSON_number": 150, |
|
"eval_PERSON_precision": 0.8132530120481928, |
|
"eval_PERSON_recall": 0.9, |
|
"eval_QUANTITY_f1": 0.7272727272727273, |
|
"eval_QUANTITY_number": 33, |
|
"eval_QUANTITY_precision": 0.6363636363636364, |
|
"eval_QUANTITY_recall": 0.8484848484848485, |
|
"eval_TIME_f1": 0.8421052631578947, |
|
"eval_TIME_number": 28, |
|
"eval_TIME_precision": 0.8275862068965517, |
|
"eval_TIME_recall": 0.8571428571428571, |
|
"eval_loss": 0.13811782002449036, |
|
"eval_overall_accuracy": 0.9582929194956353, |
|
"eval_overall_f1": 0.8117489986648865, |
|
"eval_overall_precision": 0.7562189054726368, |
|
"eval_overall_recall": 0.8760806916426513, |
|
"eval_runtime": 0.3289, |
|
"eval_samples_per_second": 568.489, |
|
"eval_steps_per_second": 9.12, |
|
"step": 2650 |
|
}, |
|
{ |
|
"epoch": 26.0, |
|
"grad_norm": 0.5518941879272461, |
|
"learning_rate": 3.7e-05, |
|
"loss": 0.091, |
|
"step": 2756 |
|
}, |
|
{ |
|
"epoch": 26.0, |
|
"eval_LOCATION_f1": 0.782051282051282, |
|
"eval_LOCATION_number": 71, |
|
"eval_LOCATION_precision": 0.7176470588235294, |
|
"eval_LOCATION_recall": 0.8591549295774648, |
|
"eval_ORGANIZATION_f1": 0.7361111111111112, |
|
"eval_ORGANIZATION_number": 65, |
|
"eval_ORGANIZATION_precision": 0.6708860759493671, |
|
"eval_ORGANIZATION_recall": 0.8153846153846154, |
|
"eval_PERSON_f1": 0.8643533123028392, |
|
"eval_PERSON_number": 150, |
|
"eval_PERSON_precision": 0.8203592814371258, |
|
"eval_PERSON_recall": 0.9133333333333333, |
|
"eval_QUANTITY_f1": 0.7179487179487178, |
|
"eval_QUANTITY_number": 33, |
|
"eval_QUANTITY_precision": 0.6222222222222222, |
|
"eval_QUANTITY_recall": 0.8484848484848485, |
|
"eval_TIME_f1": 0.8727272727272727, |
|
"eval_TIME_number": 28, |
|
"eval_TIME_precision": 0.8888888888888888, |
|
"eval_TIME_recall": 0.8571428571428571, |
|
"eval_loss": 0.13771426677703857, |
|
"eval_overall_accuracy": 0.9575654704170709, |
|
"eval_overall_f1": 0.808, |
|
"eval_overall_precision": 0.7518610421836228, |
|
"eval_overall_recall": 0.8731988472622478, |
|
"eval_runtime": 0.3343, |
|
"eval_samples_per_second": 559.442, |
|
"eval_steps_per_second": 8.975, |
|
"step": 2756 |
|
}, |
|
{ |
|
"epoch": 27.0, |
|
"grad_norm": 1.4636467695236206, |
|
"learning_rate": 3.65e-05, |
|
"loss": 0.0902, |
|
"step": 2862 |
|
}, |
|
{ |
|
"epoch": 27.0, |
|
"eval_LOCATION_f1": 0.7770700636942676, |
|
"eval_LOCATION_number": 71, |
|
"eval_LOCATION_precision": 0.7093023255813954, |
|
"eval_LOCATION_recall": 0.8591549295774648, |
|
"eval_ORGANIZATION_f1": 0.7248322147651007, |
|
"eval_ORGANIZATION_number": 65, |
|
"eval_ORGANIZATION_precision": 0.6428571428571429, |
|
"eval_ORGANIZATION_recall": 0.8307692307692308, |
|
"eval_PERSON_f1": 0.8517350157728706, |
|
"eval_PERSON_number": 150, |
|
"eval_PERSON_precision": 0.8083832335329342, |
|
"eval_PERSON_recall": 0.9, |
|
"eval_QUANTITY_f1": 0.6582278481012658, |
|
"eval_QUANTITY_number": 33, |
|
"eval_QUANTITY_precision": 0.5652173913043478, |
|
"eval_QUANTITY_recall": 0.7878787878787878, |
|
"eval_TIME_f1": 0.8275862068965518, |
|
"eval_TIME_number": 28, |
|
"eval_TIME_precision": 0.8, |
|
"eval_TIME_recall": 0.8571428571428571, |
|
"eval_loss": 0.14399109780788422, |
|
"eval_overall_accuracy": 0.9546556741028128, |
|
"eval_overall_f1": 0.7894736842105263, |
|
"eval_overall_precision": 0.7263922518159807, |
|
"eval_overall_recall": 0.8645533141210374, |
|
"eval_runtime": 0.3358, |
|
"eval_samples_per_second": 556.812, |
|
"eval_steps_per_second": 8.933, |
|
"step": 2862 |
|
}, |
|
{ |
|
"epoch": 28.0, |
|
"grad_norm": 1.3473738431930542, |
|
"learning_rate": 3.6e-05, |
|
"loss": 0.087, |
|
"step": 2968 |
|
}, |
|
{ |
|
"epoch": 28.0, |
|
"eval_LOCATION_f1": 0.794701986754967, |
|
"eval_LOCATION_number": 71, |
|
"eval_LOCATION_precision": 0.75, |
|
"eval_LOCATION_recall": 0.8450704225352113, |
|
"eval_ORGANIZATION_f1": 0.7142857142857143, |
|
"eval_ORGANIZATION_number": 65, |
|
"eval_ORGANIZATION_precision": 0.6179775280898876, |
|
"eval_ORGANIZATION_recall": 0.8461538461538461, |
|
"eval_PERSON_f1": 0.8626198083067093, |
|
"eval_PERSON_number": 150, |
|
"eval_PERSON_precision": 0.8282208588957055, |
|
"eval_PERSON_recall": 0.9, |
|
"eval_QUANTITY_f1": 0.7777777777777778, |
|
"eval_QUANTITY_number": 33, |
|
"eval_QUANTITY_precision": 0.717948717948718, |
|
"eval_QUANTITY_recall": 0.8484848484848485, |
|
"eval_TIME_f1": 0.888888888888889, |
|
"eval_TIME_number": 28, |
|
"eval_TIME_precision": 0.9230769230769231, |
|
"eval_TIME_recall": 0.8571428571428571, |
|
"eval_loss": 0.1355486363172531, |
|
"eval_overall_accuracy": 0.9582929194956353, |
|
"eval_overall_f1": 0.8118279569892473, |
|
"eval_overall_precision": 0.760705289672544, |
|
"eval_overall_recall": 0.8703170028818443, |
|
"eval_runtime": 0.3366, |
|
"eval_samples_per_second": 555.494, |
|
"eval_steps_per_second": 8.912, |
|
"step": 2968 |
|
}, |
|
{ |
|
"epoch": 29.0, |
|
"grad_norm": 0.5319921970367432, |
|
"learning_rate": 3.55e-05, |
|
"loss": 0.0849, |
|
"step": 3074 |
|
}, |
|
{ |
|
"epoch": 29.0, |
|
"eval_LOCATION_f1": 0.7922077922077921, |
|
"eval_LOCATION_number": 71, |
|
"eval_LOCATION_precision": 0.7349397590361446, |
|
"eval_LOCATION_recall": 0.8591549295774648, |
|
"eval_ORGANIZATION_f1": 0.6923076923076923, |
|
"eval_ORGANIZATION_number": 65, |
|
"eval_ORGANIZATION_precision": 0.5934065934065934, |
|
"eval_ORGANIZATION_recall": 0.8307692307692308, |
|
"eval_PERSON_f1": 0.8507936507936508, |
|
"eval_PERSON_number": 150, |
|
"eval_PERSON_precision": 0.8121212121212121, |
|
"eval_PERSON_recall": 0.8933333333333333, |
|
"eval_QUANTITY_f1": 0.7500000000000001, |
|
"eval_QUANTITY_number": 33, |
|
"eval_QUANTITY_precision": 0.6923076923076923, |
|
"eval_QUANTITY_recall": 0.8181818181818182, |
|
"eval_TIME_f1": 0.888888888888889, |
|
"eval_TIME_number": 28, |
|
"eval_TIME_precision": 0.9230769230769231, |
|
"eval_TIME_recall": 0.8571428571428571, |
|
"eval_loss": 0.13350827991962433, |
|
"eval_overall_accuracy": 0.9585354025218235, |
|
"eval_overall_f1": 0.7989347536617842, |
|
"eval_overall_precision": 0.7425742574257426, |
|
"eval_overall_recall": 0.8645533141210374, |
|
"eval_runtime": 0.3368, |
|
"eval_samples_per_second": 555.248, |
|
"eval_steps_per_second": 8.908, |
|
"step": 3074 |
|
}, |
|
{ |
|
"epoch": 30.0, |
|
"grad_norm": 1.0683906078338623, |
|
"learning_rate": 3.5e-05, |
|
"loss": 0.0815, |
|
"step": 3180 |
|
}, |
|
{ |
|
"epoch": 30.0, |
|
"eval_LOCATION_f1": 0.7973856209150327, |
|
"eval_LOCATION_number": 71, |
|
"eval_LOCATION_precision": 0.7439024390243902, |
|
"eval_LOCATION_recall": 0.8591549295774648, |
|
"eval_ORGANIZATION_f1": 0.7310344827586207, |
|
"eval_ORGANIZATION_number": 65, |
|
"eval_ORGANIZATION_precision": 0.6625, |
|
"eval_ORGANIZATION_recall": 0.8153846153846154, |
|
"eval_PERSON_f1": 0.8717948717948718, |
|
"eval_PERSON_number": 150, |
|
"eval_PERSON_precision": 0.8395061728395061, |
|
"eval_PERSON_recall": 0.9066666666666666, |
|
"eval_QUANTITY_f1": 0.7567567567567567, |
|
"eval_QUANTITY_number": 33, |
|
"eval_QUANTITY_precision": 0.6829268292682927, |
|
"eval_QUANTITY_recall": 0.8484848484848485, |
|
"eval_TIME_f1": 0.888888888888889, |
|
"eval_TIME_number": 28, |
|
"eval_TIME_precision": 0.9230769230769231, |
|
"eval_TIME_recall": 0.8571428571428571, |
|
"eval_loss": 0.13375303149223328, |
|
"eval_overall_accuracy": 0.9612027158098934, |
|
"eval_overall_f1": 0.8184281842818427, |
|
"eval_overall_precision": 0.7723785166240409, |
|
"eval_overall_recall": 0.8703170028818443, |
|
"eval_runtime": 0.3368, |
|
"eval_samples_per_second": 555.175, |
|
"eval_steps_per_second": 8.907, |
|
"step": 3180 |
|
}, |
|
{ |
|
"epoch": 31.0, |
|
"grad_norm": 0.8525239825248718, |
|
"learning_rate": 3.45e-05, |
|
"loss": 0.0838, |
|
"step": 3286 |
|
}, |
|
{ |
|
"epoch": 31.0, |
|
"eval_LOCATION_f1": 0.782051282051282, |
|
"eval_LOCATION_number": 71, |
|
"eval_LOCATION_precision": 0.7176470588235294, |
|
"eval_LOCATION_recall": 0.8591549295774648, |
|
"eval_ORGANIZATION_f1": 0.7333333333333334, |
|
"eval_ORGANIZATION_number": 65, |
|
"eval_ORGANIZATION_precision": 0.6470588235294118, |
|
"eval_ORGANIZATION_recall": 0.8461538461538461, |
|
"eval_PERSON_f1": 0.8670886075949367, |
|
"eval_PERSON_number": 150, |
|
"eval_PERSON_precision": 0.8253012048192772, |
|
"eval_PERSON_recall": 0.9133333333333333, |
|
"eval_QUANTITY_f1": 0.7567567567567567, |
|
"eval_QUANTITY_number": 33, |
|
"eval_QUANTITY_precision": 0.6829268292682927, |
|
"eval_QUANTITY_recall": 0.8484848484848485, |
|
"eval_TIME_f1": 0.888888888888889, |
|
"eval_TIME_number": 28, |
|
"eval_TIME_precision": 0.9230769230769231, |
|
"eval_TIME_recall": 0.8571428571428571, |
|
"eval_loss": 0.13723136484622955, |
|
"eval_overall_accuracy": 0.9587778855480117, |
|
"eval_overall_f1": 0.8133333333333335, |
|
"eval_overall_precision": 0.7568238213399504, |
|
"eval_overall_recall": 0.8789625360230547, |
|
"eval_runtime": 0.334, |
|
"eval_samples_per_second": 559.823, |
|
"eval_steps_per_second": 8.981, |
|
"step": 3286 |
|
}, |
|
{ |
|
"epoch": 32.0, |
|
"grad_norm": 1.4616408348083496, |
|
"learning_rate": 3.4000000000000007e-05, |
|
"loss": 0.076, |
|
"step": 3392 |
|
}, |
|
{ |
|
"epoch": 32.0, |
|
"eval_LOCATION_f1": 0.7770700636942676, |
|
"eval_LOCATION_number": 71, |
|
"eval_LOCATION_precision": 0.7093023255813954, |
|
"eval_LOCATION_recall": 0.8591549295774648, |
|
"eval_ORGANIZATION_f1": 0.708860759493671, |
|
"eval_ORGANIZATION_number": 65, |
|
"eval_ORGANIZATION_precision": 0.6021505376344086, |
|
"eval_ORGANIZATION_recall": 0.8615384615384616, |
|
"eval_PERSON_f1": 0.8643533123028392, |
|
"eval_PERSON_number": 150, |
|
"eval_PERSON_precision": 0.8203592814371258, |
|
"eval_PERSON_recall": 0.9133333333333333, |
|
"eval_QUANTITY_f1": 0.7088607594936709, |
|
"eval_QUANTITY_number": 33, |
|
"eval_QUANTITY_precision": 0.6086956521739131, |
|
"eval_QUANTITY_recall": 0.8484848484848485, |
|
"eval_TIME_f1": 0.8727272727272727, |
|
"eval_TIME_number": 28, |
|
"eval_TIME_precision": 0.8888888888888888, |
|
"eval_TIME_recall": 0.8571428571428571, |
|
"eval_loss": 0.1504770815372467, |
|
"eval_overall_accuracy": 0.954898157129001, |
|
"eval_overall_f1": 0.7989556135770235, |
|
"eval_overall_precision": 0.7303102625298329, |
|
"eval_overall_recall": 0.8818443804034583, |
|
"eval_runtime": 0.3282, |
|
"eval_samples_per_second": 569.822, |
|
"eval_steps_per_second": 9.142, |
|
"step": 3392 |
|
}, |
|
{ |
|
"epoch": 33.0, |
|
"grad_norm": 2.1258466243743896, |
|
"learning_rate": 3.35e-05, |
|
"loss": 0.0775, |
|
"step": 3498 |
|
}, |
|
{ |
|
"epoch": 33.0, |
|
"eval_LOCATION_f1": 0.8104575163398693, |
|
"eval_LOCATION_number": 71, |
|
"eval_LOCATION_precision": 0.7560975609756098, |
|
"eval_LOCATION_recall": 0.8732394366197183, |
|
"eval_ORGANIZATION_f1": 0.72992700729927, |
|
"eval_ORGANIZATION_number": 65, |
|
"eval_ORGANIZATION_precision": 0.6944444444444444, |
|
"eval_ORGANIZATION_recall": 0.7692307692307693, |
|
"eval_PERSON_f1": 0.8717948717948718, |
|
"eval_PERSON_number": 150, |
|
"eval_PERSON_precision": 0.8395061728395061, |
|
"eval_PERSON_recall": 0.9066666666666666, |
|
"eval_QUANTITY_f1": 0.8000000000000002, |
|
"eval_QUANTITY_number": 33, |
|
"eval_QUANTITY_precision": 0.7567567567567568, |
|
"eval_QUANTITY_recall": 0.8484848484848485, |
|
"eval_TIME_f1": 0.888888888888889, |
|
"eval_TIME_number": 28, |
|
"eval_TIME_precision": 0.9230769230769231, |
|
"eval_TIME_recall": 0.8571428571428571, |
|
"eval_loss": 0.13078542053699493, |
|
"eval_overall_accuracy": 0.9633850630455868, |
|
"eval_overall_f1": 0.8264462809917356, |
|
"eval_overall_precision": 0.7915567282321899, |
|
"eval_overall_recall": 0.8645533141210374, |
|
"eval_runtime": 0.3348, |
|
"eval_samples_per_second": 558.49, |
|
"eval_steps_per_second": 8.96, |
|
"step": 3498 |
|
}, |
|
{ |
|
"epoch": 34.0, |
|
"grad_norm": 1.6660958528518677, |
|
"learning_rate": 3.3e-05, |
|
"loss": 0.0768, |
|
"step": 3604 |
|
}, |
|
{ |
|
"epoch": 34.0, |
|
"eval_LOCATION_f1": 0.8104575163398693, |
|
"eval_LOCATION_number": 71, |
|
"eval_LOCATION_precision": 0.7560975609756098, |
|
"eval_LOCATION_recall": 0.8732394366197183, |
|
"eval_ORGANIZATION_f1": 0.7516778523489933, |
|
"eval_ORGANIZATION_number": 65, |
|
"eval_ORGANIZATION_precision": 0.6666666666666666, |
|
"eval_ORGANIZATION_recall": 0.8615384615384616, |
|
"eval_PERSON_f1": 0.8681672025723473, |
|
"eval_PERSON_number": 150, |
|
"eval_PERSON_precision": 0.8385093167701864, |
|
"eval_PERSON_recall": 0.9, |
|
"eval_QUANTITY_f1": 0.7777777777777778, |
|
"eval_QUANTITY_number": 33, |
|
"eval_QUANTITY_precision": 0.717948717948718, |
|
"eval_QUANTITY_recall": 0.8484848484848485, |
|
"eval_TIME_f1": 0.888888888888889, |
|
"eval_TIME_number": 28, |
|
"eval_TIME_precision": 0.9230769230769231, |
|
"eval_TIME_recall": 0.8571428571428571, |
|
"eval_loss": 0.13354364037513733, |
|
"eval_overall_accuracy": 0.9612027158098934, |
|
"eval_overall_f1": 0.8254397834912043, |
|
"eval_overall_precision": 0.7780612244897959, |
|
"eval_overall_recall": 0.8789625360230547, |
|
"eval_runtime": 0.3339, |
|
"eval_samples_per_second": 560.029, |
|
"eval_steps_per_second": 8.984, |
|
"step": 3604 |
|
}, |
|
{ |
|
"epoch": 35.0, |
|
"grad_norm": 0.7892407774925232, |
|
"learning_rate": 3.2500000000000004e-05, |
|
"loss": 0.0746, |
|
"step": 3710 |
|
}, |
|
{ |
|
"epoch": 35.0, |
|
"eval_LOCATION_f1": 0.7870967741935485, |
|
"eval_LOCATION_number": 71, |
|
"eval_LOCATION_precision": 0.7261904761904762, |
|
"eval_LOCATION_recall": 0.8591549295774648, |
|
"eval_ORGANIZATION_f1": 0.7549668874172185, |
|
"eval_ORGANIZATION_number": 65, |
|
"eval_ORGANIZATION_precision": 0.6627906976744186, |
|
"eval_ORGANIZATION_recall": 0.8769230769230769, |
|
"eval_PERSON_f1": 0.8745980707395499, |
|
"eval_PERSON_number": 150, |
|
"eval_PERSON_precision": 0.84472049689441, |
|
"eval_PERSON_recall": 0.9066666666666666, |
|
"eval_QUANTITY_f1": 0.7671232876712328, |
|
"eval_QUANTITY_number": 33, |
|
"eval_QUANTITY_precision": 0.7, |
|
"eval_QUANTITY_recall": 0.8484848484848485, |
|
"eval_TIME_f1": 0.888888888888889, |
|
"eval_TIME_number": 28, |
|
"eval_TIME_precision": 0.9230769230769231, |
|
"eval_TIME_recall": 0.8571428571428571, |
|
"eval_loss": 0.1393873244524002, |
|
"eval_overall_accuracy": 0.9587778855480117, |
|
"eval_overall_f1": 0.8225806451612904, |
|
"eval_overall_precision": 0.7707808564231738, |
|
"eval_overall_recall": 0.8818443804034583, |
|
"eval_runtime": 0.3337, |
|
"eval_samples_per_second": 560.376, |
|
"eval_steps_per_second": 8.99, |
|
"step": 3710 |
|
}, |
|
{ |
|
"epoch": 36.0, |
|
"grad_norm": 1.38412344455719, |
|
"learning_rate": 3.2000000000000005e-05, |
|
"loss": 0.0724, |
|
"step": 3816 |
|
}, |
|
{ |
|
"epoch": 36.0, |
|
"eval_LOCATION_f1": 0.7948717948717949, |
|
"eval_LOCATION_number": 71, |
|
"eval_LOCATION_precision": 0.7294117647058823, |
|
"eval_LOCATION_recall": 0.8732394366197183, |
|
"eval_ORGANIZATION_f1": 0.7051282051282052, |
|
"eval_ORGANIZATION_number": 65, |
|
"eval_ORGANIZATION_precision": 0.6043956043956044, |
|
"eval_ORGANIZATION_recall": 0.8461538461538461, |
|
"eval_PERSON_f1": 0.8589341692789968, |
|
"eval_PERSON_number": 150, |
|
"eval_PERSON_precision": 0.8106508875739645, |
|
"eval_PERSON_recall": 0.9133333333333333, |
|
"eval_QUANTITY_f1": 0.8169014084507042, |
|
"eval_QUANTITY_number": 33, |
|
"eval_QUANTITY_precision": 0.7631578947368421, |
|
"eval_QUANTITY_recall": 0.8787878787878788, |
|
"eval_TIME_f1": 0.8727272727272727, |
|
"eval_TIME_number": 28, |
|
"eval_TIME_precision": 0.8888888888888888, |
|
"eval_TIME_recall": 0.8571428571428571, |
|
"eval_loss": 0.14194774627685547, |
|
"eval_overall_accuracy": 0.957807953443259, |
|
"eval_overall_f1": 0.8110964332892999, |
|
"eval_overall_precision": 0.748780487804878, |
|
"eval_overall_recall": 0.8847262247838616, |
|
"eval_runtime": 0.3344, |
|
"eval_samples_per_second": 559.292, |
|
"eval_steps_per_second": 8.973, |
|
"step": 3816 |
|
}, |
|
{ |
|
"epoch": 37.0, |
|
"grad_norm": 1.6571606397628784, |
|
"learning_rate": 3.15e-05, |
|
"loss": 0.0703, |
|
"step": 3922 |
|
}, |
|
{ |
|
"epoch": 37.0, |
|
"eval_LOCATION_f1": 0.7672955974842768, |
|
"eval_LOCATION_number": 71, |
|
"eval_LOCATION_precision": 0.6931818181818182, |
|
"eval_LOCATION_recall": 0.8591549295774648, |
|
"eval_ORGANIZATION_f1": 0.708860759493671, |
|
"eval_ORGANIZATION_number": 65, |
|
"eval_ORGANIZATION_precision": 0.6021505376344086, |
|
"eval_ORGANIZATION_recall": 0.8615384615384616, |
|
"eval_PERSON_f1": 0.8698412698412699, |
|
"eval_PERSON_number": 150, |
|
"eval_PERSON_precision": 0.8303030303030303, |
|
"eval_PERSON_recall": 0.9133333333333333, |
|
"eval_QUANTITY_f1": 0.6923076923076923, |
|
"eval_QUANTITY_number": 33, |
|
"eval_QUANTITY_precision": 0.6, |
|
"eval_QUANTITY_recall": 0.8181818181818182, |
|
"eval_TIME_f1": 0.8727272727272727, |
|
"eval_TIME_number": 28, |
|
"eval_TIME_precision": 0.8888888888888888, |
|
"eval_TIME_recall": 0.8571428571428571, |
|
"eval_loss": 0.15663577616214752, |
|
"eval_overall_accuracy": 0.9517458777885548, |
|
"eval_overall_f1": 0.7973856209150326, |
|
"eval_overall_precision": 0.7296650717703349, |
|
"eval_overall_recall": 0.8789625360230547, |
|
"eval_runtime": 0.3366, |
|
"eval_samples_per_second": 555.525, |
|
"eval_steps_per_second": 8.912, |
|
"step": 3922 |
|
}, |
|
{ |
|
"epoch": 38.0, |
|
"grad_norm": 0.8099401593208313, |
|
"learning_rate": 3.1e-05, |
|
"loss": 0.07, |
|
"step": 4028 |
|
}, |
|
{ |
|
"epoch": 38.0, |
|
"eval_LOCATION_f1": 0.7770700636942676, |
|
"eval_LOCATION_number": 71, |
|
"eval_LOCATION_precision": 0.7093023255813954, |
|
"eval_LOCATION_recall": 0.8591549295774648, |
|
"eval_ORGANIZATION_f1": 0.7432432432432433, |
|
"eval_ORGANIZATION_number": 65, |
|
"eval_ORGANIZATION_precision": 0.6626506024096386, |
|
"eval_ORGANIZATION_recall": 0.8461538461538461, |
|
"eval_PERSON_f1": 0.8789808917197452, |
|
"eval_PERSON_number": 150, |
|
"eval_PERSON_precision": 0.8414634146341463, |
|
"eval_PERSON_recall": 0.92, |
|
"eval_QUANTITY_f1": 0.6835443037974683, |
|
"eval_QUANTITY_number": 33, |
|
"eval_QUANTITY_precision": 0.5869565217391305, |
|
"eval_QUANTITY_recall": 0.8181818181818182, |
|
"eval_TIME_f1": 0.8571428571428571, |
|
"eval_TIME_number": 28, |
|
"eval_TIME_precision": 0.8571428571428571, |
|
"eval_TIME_recall": 0.8571428571428571, |
|
"eval_loss": 0.14580821990966797, |
|
"eval_overall_accuracy": 0.9570805043646945, |
|
"eval_overall_f1": 0.8090185676392573, |
|
"eval_overall_precision": 0.7493857493857494, |
|
"eval_overall_recall": 0.8789625360230547, |
|
"eval_runtime": 0.3346, |
|
"eval_samples_per_second": 558.844, |
|
"eval_steps_per_second": 8.965, |
|
"step": 4028 |
|
}, |
|
{ |
|
"epoch": 39.0, |
|
"grad_norm": 1.7465280294418335, |
|
"learning_rate": 3.05e-05, |
|
"loss": 0.0688, |
|
"step": 4134 |
|
}, |
|
{ |
|
"epoch": 39.0, |
|
"eval_LOCATION_f1": 0.7721518987341772, |
|
"eval_LOCATION_number": 71, |
|
"eval_LOCATION_precision": 0.7011494252873564, |
|
"eval_LOCATION_recall": 0.8591549295774648, |
|
"eval_ORGANIZATION_f1": 0.713375796178344, |
|
"eval_ORGANIZATION_number": 65, |
|
"eval_ORGANIZATION_precision": 0.6086956521739131, |
|
"eval_ORGANIZATION_recall": 0.8615384615384616, |
|
"eval_PERSON_f1": 0.8789808917197452, |
|
"eval_PERSON_number": 150, |
|
"eval_PERSON_precision": 0.8414634146341463, |
|
"eval_PERSON_recall": 0.92, |
|
"eval_QUANTITY_f1": 0.8055555555555556, |
|
"eval_QUANTITY_number": 33, |
|
"eval_QUANTITY_precision": 0.7435897435897436, |
|
"eval_QUANTITY_recall": 0.8787878787878788, |
|
"eval_TIME_f1": 0.888888888888889, |
|
"eval_TIME_number": 28, |
|
"eval_TIME_precision": 0.9230769230769231, |
|
"eval_TIME_recall": 0.8571428571428571, |
|
"eval_loss": 0.14488695561885834, |
|
"eval_overall_accuracy": 0.9582929194956353, |
|
"eval_overall_f1": 0.8158940397350992, |
|
"eval_overall_precision": 0.7549019607843137, |
|
"eval_overall_recall": 0.8876080691642652, |
|
"eval_runtime": 0.3336, |
|
"eval_samples_per_second": 560.471, |
|
"eval_steps_per_second": 8.992, |
|
"step": 4134 |
|
}, |
|
{ |
|
"epoch": 40.0, |
|
"grad_norm": 0.8754693269729614, |
|
"learning_rate": 3e-05, |
|
"loss": 0.0691, |
|
"step": 4240 |
|
}, |
|
{ |
|
"epoch": 40.0, |
|
"eval_LOCATION_f1": 0.8, |
|
"eval_LOCATION_number": 71, |
|
"eval_LOCATION_precision": 0.7380952380952381, |
|
"eval_LOCATION_recall": 0.8732394366197183, |
|
"eval_ORGANIZATION_f1": 0.7448275862068966, |
|
"eval_ORGANIZATION_number": 65, |
|
"eval_ORGANIZATION_precision": 0.675, |
|
"eval_ORGANIZATION_recall": 0.8307692307692308, |
|
"eval_PERSON_f1": 0.8789808917197452, |
|
"eval_PERSON_number": 150, |
|
"eval_PERSON_precision": 0.8414634146341463, |
|
"eval_PERSON_recall": 0.92, |
|
"eval_QUANTITY_f1": 0.7887323943661972, |
|
"eval_QUANTITY_number": 33, |
|
"eval_QUANTITY_precision": 0.7368421052631579, |
|
"eval_QUANTITY_recall": 0.8484848484848485, |
|
"eval_TIME_f1": 0.888888888888889, |
|
"eval_TIME_number": 28, |
|
"eval_TIME_precision": 0.9230769230769231, |
|
"eval_TIME_recall": 0.8571428571428571, |
|
"eval_loss": 0.13563859462738037, |
|
"eval_overall_accuracy": 0.9614451988360815, |
|
"eval_overall_f1": 0.8281461434370772, |
|
"eval_overall_precision": 0.7806122448979592, |
|
"eval_overall_recall": 0.8818443804034583, |
|
"eval_runtime": 0.3295, |
|
"eval_samples_per_second": 567.559, |
|
"eval_steps_per_second": 9.105, |
|
"step": 4240 |
|
}, |
|
{ |
|
"epoch": 41.0, |
|
"grad_norm": 0.3340809941291809, |
|
"learning_rate": 2.95e-05, |
|
"loss": 0.0673, |
|
"step": 4346 |
|
}, |
|
{ |
|
"epoch": 41.0, |
|
"eval_LOCATION_f1": 0.7721518987341772, |
|
"eval_LOCATION_number": 71, |
|
"eval_LOCATION_precision": 0.7011494252873564, |
|
"eval_LOCATION_recall": 0.8591549295774648, |
|
"eval_ORGANIZATION_f1": 0.6962025316455697, |
|
"eval_ORGANIZATION_number": 65, |
|
"eval_ORGANIZATION_precision": 0.5913978494623656, |
|
"eval_ORGANIZATION_recall": 0.8461538461538461, |
|
"eval_PERSON_f1": 0.8698412698412699, |
|
"eval_PERSON_number": 150, |
|
"eval_PERSON_precision": 0.8303030303030303, |
|
"eval_PERSON_recall": 0.9133333333333333, |
|
"eval_QUANTITY_f1": 0.7012987012987013, |
|
"eval_QUANTITY_number": 33, |
|
"eval_QUANTITY_precision": 0.6136363636363636, |
|
"eval_QUANTITY_recall": 0.8181818181818182, |
|
"eval_TIME_f1": 0.8571428571428571, |
|
"eval_TIME_number": 28, |
|
"eval_TIME_precision": 0.8571428571428571, |
|
"eval_TIME_recall": 0.8571428571428571, |
|
"eval_loss": 0.15314164757728577, |
|
"eval_overall_accuracy": 0.9539282250242483, |
|
"eval_overall_f1": 0.7958115183246073, |
|
"eval_overall_precision": 0.7290167865707434, |
|
"eval_overall_recall": 0.8760806916426513, |
|
"eval_runtime": 0.3349, |
|
"eval_samples_per_second": 558.392, |
|
"eval_steps_per_second": 8.958, |
|
"step": 4346 |
|
}, |
|
{ |
|
"epoch": 42.0, |
|
"grad_norm": 0.9933107495307922, |
|
"learning_rate": 2.9e-05, |
|
"loss": 0.0663, |
|
"step": 4452 |
|
}, |
|
{ |
|
"epoch": 42.0, |
|
"eval_LOCATION_f1": 0.8, |
|
"eval_LOCATION_number": 71, |
|
"eval_LOCATION_precision": 0.7380952380952381, |
|
"eval_LOCATION_recall": 0.8732394366197183, |
|
"eval_ORGANIZATION_f1": 0.7320261437908497, |
|
"eval_ORGANIZATION_number": 65, |
|
"eval_ORGANIZATION_precision": 0.6363636363636364, |
|
"eval_ORGANIZATION_recall": 0.8615384615384616, |
|
"eval_PERSON_f1": 0.8653846153846153, |
|
"eval_PERSON_number": 150, |
|
"eval_PERSON_precision": 0.8333333333333334, |
|
"eval_PERSON_recall": 0.9, |
|
"eval_QUANTITY_f1": 0.7466666666666666, |
|
"eval_QUANTITY_number": 33, |
|
"eval_QUANTITY_precision": 0.6666666666666666, |
|
"eval_QUANTITY_recall": 0.8484848484848485, |
|
"eval_TIME_f1": 0.888888888888889, |
|
"eval_TIME_number": 28, |
|
"eval_TIME_precision": 0.9230769230769231, |
|
"eval_TIME_recall": 0.8571428571428571, |
|
"eval_loss": 0.1424974650144577, |
|
"eval_overall_accuracy": 0.9580504364694471, |
|
"eval_overall_f1": 0.8144192256341789, |
|
"eval_overall_precision": 0.7587064676616916, |
|
"eval_overall_recall": 0.8789625360230547, |
|
"eval_runtime": 0.3341, |
|
"eval_samples_per_second": 559.709, |
|
"eval_steps_per_second": 8.979, |
|
"step": 4452 |
|
}, |
|
{ |
|
"epoch": 43.0, |
|
"grad_norm": 0.6678488254547119, |
|
"learning_rate": 2.8499999999999998e-05, |
|
"loss": 0.0639, |
|
"step": 4558 |
|
}, |
|
{ |
|
"epoch": 43.0, |
|
"eval_LOCATION_f1": 0.7948717948717949, |
|
"eval_LOCATION_number": 71, |
|
"eval_LOCATION_precision": 0.7294117647058823, |
|
"eval_LOCATION_recall": 0.8732394366197183, |
|
"eval_ORGANIZATION_f1": 0.7285714285714285, |
|
"eval_ORGANIZATION_number": 65, |
|
"eval_ORGANIZATION_precision": 0.68, |
|
"eval_ORGANIZATION_recall": 0.7846153846153846, |
|
"eval_PERSON_f1": 0.8562300319488818, |
|
"eval_PERSON_number": 150, |
|
"eval_PERSON_precision": 0.8220858895705522, |
|
"eval_PERSON_recall": 0.8933333333333333, |
|
"eval_QUANTITY_f1": 0.7671232876712328, |
|
"eval_QUANTITY_number": 33, |
|
"eval_QUANTITY_precision": 0.7, |
|
"eval_QUANTITY_recall": 0.8484848484848485, |
|
"eval_TIME_f1": 0.8727272727272727, |
|
"eval_TIME_number": 28, |
|
"eval_TIME_precision": 0.8888888888888888, |
|
"eval_TIME_recall": 0.8571428571428571, |
|
"eval_loss": 0.1413319855928421, |
|
"eval_overall_accuracy": 0.9592628516003879, |
|
"eval_overall_f1": 0.8113975576662144, |
|
"eval_overall_precision": 0.7666666666666667, |
|
"eval_overall_recall": 0.861671469740634, |
|
"eval_runtime": 0.3285, |
|
"eval_samples_per_second": 569.242, |
|
"eval_steps_per_second": 9.132, |
|
"step": 4558 |
|
}, |
|
{ |
|
"epoch": 44.0, |
|
"grad_norm": 0.8438284993171692, |
|
"learning_rate": 2.8000000000000003e-05, |
|
"loss": 0.064, |
|
"step": 4664 |
|
}, |
|
{ |
|
"epoch": 44.0, |
|
"eval_LOCATION_f1": 0.8104575163398693, |
|
"eval_LOCATION_number": 71, |
|
"eval_LOCATION_precision": 0.7560975609756098, |
|
"eval_LOCATION_recall": 0.8732394366197183, |
|
"eval_ORGANIZATION_f1": 0.7152317880794703, |
|
"eval_ORGANIZATION_number": 65, |
|
"eval_ORGANIZATION_precision": 0.627906976744186, |
|
"eval_ORGANIZATION_recall": 0.8307692307692308, |
|
"eval_PERSON_f1": 0.8698412698412699, |
|
"eval_PERSON_number": 150, |
|
"eval_PERSON_precision": 0.8303030303030303, |
|
"eval_PERSON_recall": 0.9133333333333333, |
|
"eval_QUANTITY_f1": 0.7777777777777778, |
|
"eval_QUANTITY_number": 33, |
|
"eval_QUANTITY_precision": 0.717948717948718, |
|
"eval_QUANTITY_recall": 0.8484848484848485, |
|
"eval_TIME_f1": 0.888888888888889, |
|
"eval_TIME_number": 28, |
|
"eval_TIME_precision": 0.9230769230769231, |
|
"eval_TIME_recall": 0.8571428571428571, |
|
"eval_loss": 0.14022959768772125, |
|
"eval_overall_accuracy": 0.9604752667313288, |
|
"eval_overall_f1": 0.8187919463087249, |
|
"eval_overall_precision": 0.7663316582914573, |
|
"eval_overall_recall": 0.8789625360230547, |
|
"eval_runtime": 0.3337, |
|
"eval_samples_per_second": 560.437, |
|
"eval_steps_per_second": 8.991, |
|
"step": 4664 |
|
}, |
|
{ |
|
"epoch": 45.0, |
|
"grad_norm": 3.699862241744995, |
|
"learning_rate": 2.7500000000000004e-05, |
|
"loss": 0.0615, |
|
"step": 4770 |
|
}, |
|
{ |
|
"epoch": 45.0, |
|
"eval_LOCATION_f1": 0.7721518987341772, |
|
"eval_LOCATION_number": 71, |
|
"eval_LOCATION_precision": 0.7011494252873564, |
|
"eval_LOCATION_recall": 0.8591549295774648, |
|
"eval_ORGANIZATION_f1": 0.7189542483660131, |
|
"eval_ORGANIZATION_number": 65, |
|
"eval_ORGANIZATION_precision": 0.625, |
|
"eval_ORGANIZATION_recall": 0.8461538461538461, |
|
"eval_PERSON_f1": 0.8782051282051282, |
|
"eval_PERSON_number": 150, |
|
"eval_PERSON_precision": 0.845679012345679, |
|
"eval_PERSON_recall": 0.9133333333333333, |
|
"eval_QUANTITY_f1": 0.6923076923076923, |
|
"eval_QUANTITY_number": 33, |
|
"eval_QUANTITY_precision": 0.6, |
|
"eval_QUANTITY_recall": 0.8181818181818182, |
|
"eval_TIME_f1": 0.8727272727272727, |
|
"eval_TIME_number": 28, |
|
"eval_TIME_precision": 0.8888888888888888, |
|
"eval_TIME_recall": 0.8571428571428571, |
|
"eval_loss": 0.15338602662086487, |
|
"eval_overall_accuracy": 0.9553831231813773, |
|
"eval_overall_f1": 0.8042328042328041, |
|
"eval_overall_precision": 0.7432762836185819, |
|
"eval_overall_recall": 0.8760806916426513, |
|
"eval_runtime": 0.329, |
|
"eval_samples_per_second": 568.326, |
|
"eval_steps_per_second": 9.118, |
|
"step": 4770 |
|
}, |
|
{ |
|
"epoch": 46.0, |
|
"grad_norm": 0.7766585946083069, |
|
"learning_rate": 2.7000000000000002e-05, |
|
"loss": 0.0614, |
|
"step": 4876 |
|
}, |
|
{ |
|
"epoch": 46.0, |
|
"eval_LOCATION_f1": 0.8104575163398693, |
|
"eval_LOCATION_number": 71, |
|
"eval_LOCATION_precision": 0.7560975609756098, |
|
"eval_LOCATION_recall": 0.8732394366197183, |
|
"eval_ORGANIZATION_f1": 0.7236842105263158, |
|
"eval_ORGANIZATION_number": 65, |
|
"eval_ORGANIZATION_precision": 0.632183908045977, |
|
"eval_ORGANIZATION_recall": 0.8461538461538461, |
|
"eval_PERSON_f1": 0.8717948717948718, |
|
"eval_PERSON_number": 150, |
|
"eval_PERSON_precision": 0.8395061728395061, |
|
"eval_PERSON_recall": 0.9066666666666666, |
|
"eval_QUANTITY_f1": 0.7887323943661972, |
|
"eval_QUANTITY_number": 33, |
|
"eval_QUANTITY_precision": 0.7368421052631579, |
|
"eval_QUANTITY_recall": 0.8484848484848485, |
|
"eval_TIME_f1": 0.888888888888889, |
|
"eval_TIME_number": 28, |
|
"eval_TIME_precision": 0.9230769230769231, |
|
"eval_TIME_recall": 0.8571428571428571, |
|
"eval_loss": 0.14268124103546143, |
|
"eval_overall_accuracy": 0.9612027158098934, |
|
"eval_overall_f1": 0.8221024258760108, |
|
"eval_overall_precision": 0.7721518987341772, |
|
"eval_overall_recall": 0.8789625360230547, |
|
"eval_runtime": 0.3343, |
|
"eval_samples_per_second": 559.326, |
|
"eval_steps_per_second": 8.973, |
|
"step": 4876 |
|
}, |
|
{ |
|
"epoch": 47.0, |
|
"grad_norm": 1.664536476135254, |
|
"learning_rate": 2.6500000000000004e-05, |
|
"loss": 0.0595, |
|
"step": 4982 |
|
}, |
|
{ |
|
"epoch": 47.0, |
|
"eval_LOCATION_f1": 0.7924528301886792, |
|
"eval_LOCATION_number": 71, |
|
"eval_LOCATION_precision": 0.7159090909090909, |
|
"eval_LOCATION_recall": 0.8873239436619719, |
|
"eval_ORGANIZATION_f1": 0.7320261437908497, |
|
"eval_ORGANIZATION_number": 65, |
|
"eval_ORGANIZATION_precision": 0.6363636363636364, |
|
"eval_ORGANIZATION_recall": 0.8615384615384616, |
|
"eval_PERSON_f1": 0.8761904761904761, |
|
"eval_PERSON_number": 150, |
|
"eval_PERSON_precision": 0.8363636363636363, |
|
"eval_PERSON_recall": 0.92, |
|
"eval_QUANTITY_f1": 0.7671232876712328, |
|
"eval_QUANTITY_number": 33, |
|
"eval_QUANTITY_precision": 0.7, |
|
"eval_QUANTITY_recall": 0.8484848484848485, |
|
"eval_TIME_f1": 0.8571428571428571, |
|
"eval_TIME_number": 28, |
|
"eval_TIME_precision": 0.8571428571428571, |
|
"eval_TIME_recall": 0.8571428571428571, |
|
"eval_loss": 0.154044508934021, |
|
"eval_overall_accuracy": 0.9573229873908826, |
|
"eval_overall_f1": 0.8174603174603176, |
|
"eval_overall_precision": 0.7555012224938875, |
|
"eval_overall_recall": 0.8904899135446686, |
|
"eval_runtime": 0.3363, |
|
"eval_samples_per_second": 555.98, |
|
"eval_steps_per_second": 8.919, |
|
"step": 4982 |
|
}, |
|
{ |
|
"epoch": 48.0, |
|
"grad_norm": 1.3004956245422363, |
|
"learning_rate": 2.6000000000000002e-05, |
|
"loss": 0.0594, |
|
"step": 5088 |
|
}, |
|
{ |
|
"epoch": 48.0, |
|
"eval_LOCATION_f1": 0.7974683544303797, |
|
"eval_LOCATION_number": 71, |
|
"eval_LOCATION_precision": 0.7241379310344828, |
|
"eval_LOCATION_recall": 0.8873239436619719, |
|
"eval_ORGANIZATION_f1": 0.7189542483660131, |
|
"eval_ORGANIZATION_number": 65, |
|
"eval_ORGANIZATION_precision": 0.625, |
|
"eval_ORGANIZATION_recall": 0.8461538461538461, |
|
"eval_PERSON_f1": 0.8690095846645367, |
|
"eval_PERSON_number": 150, |
|
"eval_PERSON_precision": 0.8343558282208589, |
|
"eval_PERSON_recall": 0.9066666666666666, |
|
"eval_QUANTITY_f1": 0.7837837837837839, |
|
"eval_QUANTITY_number": 33, |
|
"eval_QUANTITY_precision": 0.7073170731707317, |
|
"eval_QUANTITY_recall": 0.8787878787878788, |
|
"eval_TIME_f1": 0.8727272727272727, |
|
"eval_TIME_number": 28, |
|
"eval_TIME_precision": 0.8888888888888888, |
|
"eval_TIME_recall": 0.8571428571428571, |
|
"eval_loss": 0.1491357684135437, |
|
"eval_overall_accuracy": 0.9587778855480117, |
|
"eval_overall_f1": 0.8154050464807437, |
|
"eval_overall_precision": 0.7561576354679803, |
|
"eval_overall_recall": 0.8847262247838616, |
|
"eval_runtime": 0.3302, |
|
"eval_samples_per_second": 566.352, |
|
"eval_steps_per_second": 9.086, |
|
"step": 5088 |
|
}, |
|
{ |
|
"epoch": 49.0, |
|
"grad_norm": 1.524907112121582, |
|
"learning_rate": 2.5500000000000003e-05, |
|
"loss": 0.0579, |
|
"step": 5194 |
|
}, |
|
{ |
|
"epoch": 49.0, |
|
"eval_LOCATION_f1": 0.7974683544303797, |
|
"eval_LOCATION_number": 71, |
|
"eval_LOCATION_precision": 0.7241379310344828, |
|
"eval_LOCATION_recall": 0.8873239436619719, |
|
"eval_ORGANIZATION_f1": 0.697986577181208, |
|
"eval_ORGANIZATION_number": 65, |
|
"eval_ORGANIZATION_precision": 0.6190476190476191, |
|
"eval_ORGANIZATION_recall": 0.8, |
|
"eval_PERSON_f1": 0.8726114649681529, |
|
"eval_PERSON_number": 150, |
|
"eval_PERSON_precision": 0.8353658536585366, |
|
"eval_PERSON_recall": 0.9133333333333333, |
|
"eval_QUANTITY_f1": 0.7466666666666666, |
|
"eval_QUANTITY_number": 33, |
|
"eval_QUANTITY_precision": 0.6666666666666666, |
|
"eval_QUANTITY_recall": 0.8484848484848485, |
|
"eval_TIME_f1": 0.8727272727272727, |
|
"eval_TIME_number": 28, |
|
"eval_TIME_precision": 0.8888888888888888, |
|
"eval_TIME_recall": 0.8571428571428571, |
|
"eval_loss": 0.14881013333797455, |
|
"eval_overall_accuracy": 0.957807953443259, |
|
"eval_overall_f1": 0.8095872170439414, |
|
"eval_overall_precision": 0.7524752475247525, |
|
"eval_overall_recall": 0.8760806916426513, |
|
"eval_runtime": 0.3347, |
|
"eval_samples_per_second": 558.754, |
|
"eval_steps_per_second": 8.964, |
|
"step": 5194 |
|
}, |
|
{ |
|
"epoch": 50.0, |
|
"grad_norm": 1.4106496572494507, |
|
"learning_rate": 2.5e-05, |
|
"loss": 0.0561, |
|
"step": 5300 |
|
}, |
|
{ |
|
"epoch": 50.0, |
|
"eval_LOCATION_f1": 0.8051948051948051, |
|
"eval_LOCATION_number": 71, |
|
"eval_LOCATION_precision": 0.7469879518072289, |
|
"eval_LOCATION_recall": 0.8732394366197183, |
|
"eval_ORGANIZATION_f1": 0.6933333333333334, |
|
"eval_ORGANIZATION_number": 65, |
|
"eval_ORGANIZATION_precision": 0.611764705882353, |
|
"eval_ORGANIZATION_recall": 0.8, |
|
"eval_PERSON_f1": 0.8717948717948718, |
|
"eval_PERSON_number": 150, |
|
"eval_PERSON_precision": 0.8395061728395061, |
|
"eval_PERSON_recall": 0.9066666666666666, |
|
"eval_QUANTITY_f1": 0.7887323943661972, |
|
"eval_QUANTITY_number": 33, |
|
"eval_QUANTITY_precision": 0.7368421052631579, |
|
"eval_QUANTITY_recall": 0.8484848484848485, |
|
"eval_TIME_f1": 0.888888888888889, |
|
"eval_TIME_number": 28, |
|
"eval_TIME_precision": 0.9230769230769231, |
|
"eval_TIME_recall": 0.8571428571428571, |
|
"eval_loss": 0.1435040831565857, |
|
"eval_overall_accuracy": 0.9604752667313288, |
|
"eval_overall_f1": 0.8151147098515519, |
|
"eval_overall_precision": 0.766497461928934, |
|
"eval_overall_recall": 0.8703170028818443, |
|
"eval_runtime": 0.3346, |
|
"eval_samples_per_second": 558.815, |
|
"eval_steps_per_second": 8.965, |
|
"step": 5300 |
|
}, |
|
{ |
|
"epoch": 51.0, |
|
"grad_norm": 0.9782974123954773, |
|
"learning_rate": 2.45e-05, |
|
"loss": 0.056, |
|
"step": 5406 |
|
}, |
|
{ |
|
"epoch": 51.0, |
|
"eval_LOCATION_f1": 0.7924528301886792, |
|
"eval_LOCATION_number": 71, |
|
"eval_LOCATION_precision": 0.7159090909090909, |
|
"eval_LOCATION_recall": 0.8873239436619719, |
|
"eval_ORGANIZATION_f1": 0.6891891891891891, |
|
"eval_ORGANIZATION_number": 65, |
|
"eval_ORGANIZATION_precision": 0.6144578313253012, |
|
"eval_ORGANIZATION_recall": 0.7846153846153846, |
|
"eval_PERSON_f1": 0.8670886075949367, |
|
"eval_PERSON_number": 150, |
|
"eval_PERSON_precision": 0.8253012048192772, |
|
"eval_PERSON_recall": 0.9133333333333333, |
|
"eval_QUANTITY_f1": 0.7777777777777778, |
|
"eval_QUANTITY_number": 33, |
|
"eval_QUANTITY_precision": 0.717948717948718, |
|
"eval_QUANTITY_recall": 0.8484848484848485, |
|
"eval_TIME_f1": 0.8727272727272727, |
|
"eval_TIME_number": 28, |
|
"eval_TIME_precision": 0.8888888888888888, |
|
"eval_TIME_recall": 0.8571428571428571, |
|
"eval_loss": 0.15163768827915192, |
|
"eval_overall_accuracy": 0.9573229873908826, |
|
"eval_overall_f1": 0.808, |
|
"eval_overall_precision": 0.7518610421836228, |
|
"eval_overall_recall": 0.8731988472622478, |
|
"eval_runtime": 0.3285, |
|
"eval_samples_per_second": 569.298, |
|
"eval_steps_per_second": 9.133, |
|
"step": 5406 |
|
}, |
|
{ |
|
"epoch": 52.0, |
|
"grad_norm": 0.8598395586013794, |
|
"learning_rate": 2.4e-05, |
|
"loss": 0.0547, |
|
"step": 5512 |
|
}, |
|
{ |
|
"epoch": 52.0, |
|
"eval_LOCATION_f1": 0.8051948051948051, |
|
"eval_LOCATION_number": 71, |
|
"eval_LOCATION_precision": 0.7469879518072289, |
|
"eval_LOCATION_recall": 0.8732394366197183, |
|
"eval_ORGANIZATION_f1": 0.7019867549668873, |
|
"eval_ORGANIZATION_number": 65, |
|
"eval_ORGANIZATION_precision": 0.6162790697674418, |
|
"eval_ORGANIZATION_recall": 0.8153846153846154, |
|
"eval_PERSON_f1": 0.870967741935484, |
|
"eval_PERSON_number": 150, |
|
"eval_PERSON_precision": 0.84375, |
|
"eval_PERSON_recall": 0.9, |
|
"eval_QUANTITY_f1": 0.7297297297297297, |
|
"eval_QUANTITY_number": 33, |
|
"eval_QUANTITY_precision": 0.6585365853658537, |
|
"eval_QUANTITY_recall": 0.8181818181818182, |
|
"eval_TIME_f1": 0.8727272727272727, |
|
"eval_TIME_number": 28, |
|
"eval_TIME_precision": 0.8888888888888888, |
|
"eval_TIME_recall": 0.8571428571428571, |
|
"eval_loss": 0.15105435252189636, |
|
"eval_overall_accuracy": 0.9587778855480117, |
|
"eval_overall_f1": 0.8091397849462366, |
|
"eval_overall_precision": 0.7581863979848866, |
|
"eval_overall_recall": 0.8674351585014409, |
|
"eval_runtime": 0.3341, |
|
"eval_samples_per_second": 559.773, |
|
"eval_steps_per_second": 8.98, |
|
"step": 5512 |
|
}, |
|
{ |
|
"epoch": 53.0, |
|
"grad_norm": 1.4993176460266113, |
|
"learning_rate": 2.35e-05, |
|
"loss": 0.0534, |
|
"step": 5618 |
|
}, |
|
{ |
|
"epoch": 53.0, |
|
"eval_LOCATION_f1": 0.7974683544303797, |
|
"eval_LOCATION_number": 71, |
|
"eval_LOCATION_precision": 0.7241379310344828, |
|
"eval_LOCATION_recall": 0.8873239436619719, |
|
"eval_ORGANIZATION_f1": 0.713375796178344, |
|
"eval_ORGANIZATION_number": 65, |
|
"eval_ORGANIZATION_precision": 0.6086956521739131, |
|
"eval_ORGANIZATION_recall": 0.8615384615384616, |
|
"eval_PERSON_f1": 0.8670886075949367, |
|
"eval_PERSON_number": 150, |
|
"eval_PERSON_precision": 0.8253012048192772, |
|
"eval_PERSON_recall": 0.9133333333333333, |
|
"eval_QUANTITY_f1": 0.7200000000000001, |
|
"eval_QUANTITY_number": 33, |
|
"eval_QUANTITY_precision": 0.6428571428571429, |
|
"eval_QUANTITY_recall": 0.8181818181818182, |
|
"eval_TIME_f1": 0.8727272727272727, |
|
"eval_TIME_number": 28, |
|
"eval_TIME_precision": 0.8888888888888888, |
|
"eval_TIME_recall": 0.8571428571428571, |
|
"eval_loss": 0.16154761612415314, |
|
"eval_overall_accuracy": 0.9553831231813773, |
|
"eval_overall_f1": 0.8068331143232589, |
|
"eval_overall_precision": 0.7415458937198067, |
|
"eval_overall_recall": 0.8847262247838616, |
|
"eval_runtime": 0.3295, |
|
"eval_samples_per_second": 567.521, |
|
"eval_steps_per_second": 9.105, |
|
"step": 5618 |
|
}, |
|
{ |
|
"epoch": 54.0, |
|
"grad_norm": 1.0407500267028809, |
|
"learning_rate": 2.3000000000000003e-05, |
|
"loss": 0.0526, |
|
"step": 5724 |
|
}, |
|
{ |
|
"epoch": 54.0, |
|
"eval_LOCATION_f1": 0.8, |
|
"eval_LOCATION_number": 71, |
|
"eval_LOCATION_precision": 0.7380952380952381, |
|
"eval_LOCATION_recall": 0.8732394366197183, |
|
"eval_ORGANIZATION_f1": 0.6967741935483871, |
|
"eval_ORGANIZATION_number": 65, |
|
"eval_ORGANIZATION_precision": 0.6, |
|
"eval_ORGANIZATION_recall": 0.8307692307692308, |
|
"eval_PERSON_f1": 0.8717948717948718, |
|
"eval_PERSON_number": 150, |
|
"eval_PERSON_precision": 0.8395061728395061, |
|
"eval_PERSON_recall": 0.9066666666666666, |
|
"eval_QUANTITY_f1": 0.8055555555555556, |
|
"eval_QUANTITY_number": 33, |
|
"eval_QUANTITY_precision": 0.7435897435897436, |
|
"eval_QUANTITY_recall": 0.8787878787878788, |
|
"eval_TIME_f1": 0.888888888888889, |
|
"eval_TIME_number": 28, |
|
"eval_TIME_precision": 0.9230769230769231, |
|
"eval_TIME_recall": 0.8571428571428571, |
|
"eval_loss": 0.15213675796985626, |
|
"eval_overall_accuracy": 0.9580504364694471, |
|
"eval_overall_f1": 0.8155080213903744, |
|
"eval_overall_precision": 0.7605985037406484, |
|
"eval_overall_recall": 0.8789625360230547, |
|
"eval_runtime": 0.3348, |
|
"eval_samples_per_second": 558.56, |
|
"eval_steps_per_second": 8.961, |
|
"step": 5724 |
|
}, |
|
{ |
|
"epoch": 55.0, |
|
"grad_norm": 0.6406387686729431, |
|
"learning_rate": 2.25e-05, |
|
"loss": 0.0538, |
|
"step": 5830 |
|
}, |
|
{ |
|
"epoch": 55.0, |
|
"eval_LOCATION_f1": 0.7875000000000001, |
|
"eval_LOCATION_number": 71, |
|
"eval_LOCATION_precision": 0.7078651685393258, |
|
"eval_LOCATION_recall": 0.8873239436619719, |
|
"eval_ORGANIZATION_f1": 0.7051282051282052, |
|
"eval_ORGANIZATION_number": 65, |
|
"eval_ORGANIZATION_precision": 0.6043956043956044, |
|
"eval_ORGANIZATION_recall": 0.8461538461538461, |
|
"eval_PERSON_f1": 0.8717948717948718, |
|
"eval_PERSON_number": 150, |
|
"eval_PERSON_precision": 0.8395061728395061, |
|
"eval_PERSON_recall": 0.9066666666666666, |
|
"eval_QUANTITY_f1": 0.6923076923076923, |
|
"eval_QUANTITY_number": 33, |
|
"eval_QUANTITY_precision": 0.6, |
|
"eval_QUANTITY_recall": 0.8181818181818182, |
|
"eval_TIME_f1": 0.8727272727272727, |
|
"eval_TIME_number": 28, |
|
"eval_TIME_precision": 0.8888888888888888, |
|
"eval_TIME_recall": 0.8571428571428571, |
|
"eval_loss": 0.15997092425823212, |
|
"eval_overall_accuracy": 0.9551406401551892, |
|
"eval_overall_f1": 0.8015768725361366, |
|
"eval_overall_precision": 0.7367149758454107, |
|
"eval_overall_recall": 0.8789625360230547, |
|
"eval_runtime": 0.3348, |
|
"eval_samples_per_second": 558.524, |
|
"eval_steps_per_second": 8.96, |
|
"step": 5830 |
|
}, |
|
{ |
|
"epoch": 56.0, |
|
"grad_norm": 2.387361526489258, |
|
"learning_rate": 2.2000000000000003e-05, |
|
"loss": 0.0529, |
|
"step": 5936 |
|
}, |
|
{ |
|
"epoch": 56.0, |
|
"eval_LOCATION_f1": 0.7974683544303797, |
|
"eval_LOCATION_number": 71, |
|
"eval_LOCATION_precision": 0.7241379310344828, |
|
"eval_LOCATION_recall": 0.8873239436619719, |
|
"eval_ORGANIZATION_f1": 0.7096774193548387, |
|
"eval_ORGANIZATION_number": 65, |
|
"eval_ORGANIZATION_precision": 0.6111111111111112, |
|
"eval_ORGANIZATION_recall": 0.8461538461538461, |
|
"eval_PERSON_f1": 0.8726114649681529, |
|
"eval_PERSON_number": 150, |
|
"eval_PERSON_precision": 0.8353658536585366, |
|
"eval_PERSON_recall": 0.9133333333333333, |
|
"eval_QUANTITY_f1": 0.7200000000000001, |
|
"eval_QUANTITY_number": 33, |
|
"eval_QUANTITY_precision": 0.6428571428571429, |
|
"eval_QUANTITY_recall": 0.8181818181818182, |
|
"eval_TIME_f1": 0.888888888888889, |
|
"eval_TIME_number": 28, |
|
"eval_TIME_precision": 0.9230769230769231, |
|
"eval_TIME_recall": 0.8571428571428571, |
|
"eval_loss": 0.1578657031059265, |
|
"eval_overall_accuracy": 0.9570805043646945, |
|
"eval_overall_f1": 0.8095238095238096, |
|
"eval_overall_precision": 0.7481662591687042, |
|
"eval_overall_recall": 0.8818443804034583, |
|
"eval_runtime": 0.336, |
|
"eval_samples_per_second": 556.493, |
|
"eval_steps_per_second": 8.928, |
|
"step": 5936 |
|
}, |
|
{ |
|
"epoch": 57.0, |
|
"grad_norm": 1.3003697395324707, |
|
"learning_rate": 2.15e-05, |
|
"loss": 0.05, |
|
"step": 6042 |
|
}, |
|
{ |
|
"epoch": 57.0, |
|
"eval_LOCATION_f1": 0.8, |
|
"eval_LOCATION_number": 71, |
|
"eval_LOCATION_precision": 0.7380952380952381, |
|
"eval_LOCATION_recall": 0.8732394366197183, |
|
"eval_ORGANIZATION_f1": 0.6950354609929077, |
|
"eval_ORGANIZATION_number": 65, |
|
"eval_ORGANIZATION_precision": 0.6447368421052632, |
|
"eval_ORGANIZATION_recall": 0.7538461538461538, |
|
"eval_PERSON_f1": 0.8745980707395499, |
|
"eval_PERSON_number": 150, |
|
"eval_PERSON_precision": 0.84472049689441, |
|
"eval_PERSON_recall": 0.9066666666666666, |
|
"eval_QUANTITY_f1": 0.8055555555555556, |
|
"eval_QUANTITY_number": 33, |
|
"eval_QUANTITY_precision": 0.7435897435897436, |
|
"eval_QUANTITY_recall": 0.8787878787878788, |
|
"eval_TIME_f1": 0.888888888888889, |
|
"eval_TIME_number": 28, |
|
"eval_TIME_precision": 0.9230769230769231, |
|
"eval_TIME_recall": 0.8571428571428571, |
|
"eval_loss": 0.14940249919891357, |
|
"eval_overall_accuracy": 0.9602327837051406, |
|
"eval_overall_f1": 0.8185538881309686, |
|
"eval_overall_precision": 0.7772020725388601, |
|
"eval_overall_recall": 0.8645533141210374, |
|
"eval_runtime": 0.3282, |
|
"eval_samples_per_second": 569.855, |
|
"eval_steps_per_second": 9.142, |
|
"step": 6042 |
|
}, |
|
{ |
|
"epoch": 58.0, |
|
"grad_norm": 0.7399232387542725, |
|
"learning_rate": 2.1e-05, |
|
"loss": 0.0512, |
|
"step": 6148 |
|
}, |
|
{ |
|
"epoch": 58.0, |
|
"eval_LOCATION_f1": 0.7948717948717949, |
|
"eval_LOCATION_number": 71, |
|
"eval_LOCATION_precision": 0.7294117647058823, |
|
"eval_LOCATION_recall": 0.8732394366197183, |
|
"eval_ORGANIZATION_f1": 0.7042253521126761, |
|
"eval_ORGANIZATION_number": 65, |
|
"eval_ORGANIZATION_precision": 0.6493506493506493, |
|
"eval_ORGANIZATION_recall": 0.7692307692307693, |
|
"eval_PERSON_f1": 0.8717948717948718, |
|
"eval_PERSON_number": 150, |
|
"eval_PERSON_precision": 0.8395061728395061, |
|
"eval_PERSON_recall": 0.9066666666666666, |
|
"eval_QUANTITY_f1": 0.7887323943661972, |
|
"eval_QUANTITY_number": 33, |
|
"eval_QUANTITY_precision": 0.7368421052631579, |
|
"eval_QUANTITY_recall": 0.8484848484848485, |
|
"eval_TIME_f1": 0.888888888888889, |
|
"eval_TIME_number": 28, |
|
"eval_TIME_precision": 0.9230769230769231, |
|
"eval_TIME_recall": 0.8571428571428571, |
|
"eval_loss": 0.14740602672100067, |
|
"eval_overall_accuracy": 0.9597478176527643, |
|
"eval_overall_f1": 0.8163265306122449, |
|
"eval_overall_precision": 0.7731958762886598, |
|
"eval_overall_recall": 0.8645533141210374, |
|
"eval_runtime": 0.335, |
|
"eval_samples_per_second": 558.203, |
|
"eval_steps_per_second": 8.955, |
|
"step": 6148 |
|
}, |
|
{ |
|
"epoch": 59.0, |
|
"grad_norm": 1.4280949831008911, |
|
"learning_rate": 2.05e-05, |
|
"loss": 0.047, |
|
"step": 6254 |
|
}, |
|
{ |
|
"epoch": 59.0, |
|
"eval_LOCATION_f1": 0.7848101265822784, |
|
"eval_LOCATION_number": 71, |
|
"eval_LOCATION_precision": 0.7126436781609196, |
|
"eval_LOCATION_recall": 0.8732394366197183, |
|
"eval_ORGANIZATION_f1": 0.7248322147651007, |
|
"eval_ORGANIZATION_number": 65, |
|
"eval_ORGANIZATION_precision": 0.6428571428571429, |
|
"eval_ORGANIZATION_recall": 0.8307692307692308, |
|
"eval_PERSON_f1": 0.8782051282051282, |
|
"eval_PERSON_number": 150, |
|
"eval_PERSON_precision": 0.845679012345679, |
|
"eval_PERSON_recall": 0.9133333333333333, |
|
"eval_QUANTITY_f1": 0.7777777777777778, |
|
"eval_QUANTITY_number": 33, |
|
"eval_QUANTITY_precision": 0.717948717948718, |
|
"eval_QUANTITY_recall": 0.8484848484848485, |
|
"eval_TIME_f1": 0.888888888888889, |
|
"eval_TIME_number": 28, |
|
"eval_TIME_precision": 0.9230769230769231, |
|
"eval_TIME_recall": 0.8571428571428571, |
|
"eval_loss": 0.15319204330444336, |
|
"eval_overall_accuracy": 0.9595053346265762, |
|
"eval_overall_f1": 0.8187919463087249, |
|
"eval_overall_precision": 0.7663316582914573, |
|
"eval_overall_recall": 0.8789625360230547, |
|
"eval_runtime": 0.3345, |
|
"eval_samples_per_second": 558.972, |
|
"eval_steps_per_second": 8.967, |
|
"step": 6254 |
|
}, |
|
{ |
|
"epoch": 60.0, |
|
"grad_norm": 1.479651689529419, |
|
"learning_rate": 2e-05, |
|
"loss": 0.047, |
|
"step": 6360 |
|
}, |
|
{ |
|
"epoch": 60.0, |
|
"eval_LOCATION_f1": 0.7948717948717949, |
|
"eval_LOCATION_number": 71, |
|
"eval_LOCATION_precision": 0.7294117647058823, |
|
"eval_LOCATION_recall": 0.8732394366197183, |
|
"eval_ORGANIZATION_f1": 0.7096774193548387, |
|
"eval_ORGANIZATION_number": 65, |
|
"eval_ORGANIZATION_precision": 0.6111111111111112, |
|
"eval_ORGANIZATION_recall": 0.8461538461538461, |
|
"eval_PERSON_f1": 0.870967741935484, |
|
"eval_PERSON_number": 150, |
|
"eval_PERSON_precision": 0.84375, |
|
"eval_PERSON_recall": 0.9, |
|
"eval_QUANTITY_f1": 0.8169014084507042, |
|
"eval_QUANTITY_number": 33, |
|
"eval_QUANTITY_precision": 0.7631578947368421, |
|
"eval_QUANTITY_recall": 0.8787878787878788, |
|
"eval_TIME_f1": 0.888888888888889, |
|
"eval_TIME_number": 28, |
|
"eval_TIME_precision": 0.9230769230769231, |
|
"eval_TIME_recall": 0.8571428571428571, |
|
"eval_loss": 0.15390989184379578, |
|
"eval_overall_accuracy": 0.9590203685741998, |
|
"eval_overall_f1": 0.8176943699731903, |
|
"eval_overall_precision": 0.7644110275689223, |
|
"eval_overall_recall": 0.8789625360230547, |
|
"eval_runtime": 0.3361, |
|
"eval_samples_per_second": 556.409, |
|
"eval_steps_per_second": 8.926, |
|
"step": 6360 |
|
}, |
|
{ |
|
"epoch": 61.0, |
|
"grad_norm": 0.868341326713562, |
|
"learning_rate": 1.9500000000000003e-05, |
|
"loss": 0.0465, |
|
"step": 6466 |
|
}, |
|
{ |
|
"epoch": 61.0, |
|
"eval_LOCATION_f1": 0.7924528301886792, |
|
"eval_LOCATION_number": 71, |
|
"eval_LOCATION_precision": 0.7159090909090909, |
|
"eval_LOCATION_recall": 0.8873239436619719, |
|
"eval_ORGANIZATION_f1": 0.7105263157894737, |
|
"eval_ORGANIZATION_number": 65, |
|
"eval_ORGANIZATION_precision": 0.6206896551724138, |
|
"eval_ORGANIZATION_recall": 0.8307692307692308, |
|
"eval_PERSON_f1": 0.8726114649681529, |
|
"eval_PERSON_number": 150, |
|
"eval_PERSON_precision": 0.8353658536585366, |
|
"eval_PERSON_recall": 0.9133333333333333, |
|
"eval_QUANTITY_f1": 0.7887323943661972, |
|
"eval_QUANTITY_number": 33, |
|
"eval_QUANTITY_precision": 0.7368421052631579, |
|
"eval_QUANTITY_recall": 0.8484848484848485, |
|
"eval_TIME_f1": 0.888888888888889, |
|
"eval_TIME_number": 28, |
|
"eval_TIME_precision": 0.9230769230769231, |
|
"eval_TIME_recall": 0.8571428571428571, |
|
"eval_loss": 0.15987202525138855, |
|
"eval_overall_accuracy": 0.9585354025218235, |
|
"eval_overall_f1": 0.816, |
|
"eval_overall_precision": 0.7593052109181141, |
|
"eval_overall_recall": 0.8818443804034583, |
|
"eval_runtime": 0.3357, |
|
"eval_samples_per_second": 557.069, |
|
"eval_steps_per_second": 8.937, |
|
"step": 6466 |
|
}, |
|
{ |
|
"epoch": 62.0, |
|
"grad_norm": 1.9663652181625366, |
|
"learning_rate": 1.9e-05, |
|
"loss": 0.045, |
|
"step": 6572 |
|
}, |
|
{ |
|
"epoch": 62.0, |
|
"eval_LOCATION_f1": 0.8, |
|
"eval_LOCATION_number": 71, |
|
"eval_LOCATION_precision": 0.7380952380952381, |
|
"eval_LOCATION_recall": 0.8732394366197183, |
|
"eval_ORGANIZATION_f1": 0.6973684210526315, |
|
"eval_ORGANIZATION_number": 65, |
|
"eval_ORGANIZATION_precision": 0.6091954022988506, |
|
"eval_ORGANIZATION_recall": 0.8153846153846154, |
|
"eval_PERSON_f1": 0.8753993610223643, |
|
"eval_PERSON_number": 150, |
|
"eval_PERSON_precision": 0.8404907975460123, |
|
"eval_PERSON_recall": 0.9133333333333333, |
|
"eval_QUANTITY_f1": 0.8055555555555556, |
|
"eval_QUANTITY_number": 33, |
|
"eval_QUANTITY_precision": 0.7435897435897436, |
|
"eval_QUANTITY_recall": 0.8787878787878788, |
|
"eval_TIME_f1": 0.888888888888889, |
|
"eval_TIME_number": 28, |
|
"eval_TIME_precision": 0.9230769230769231, |
|
"eval_TIME_recall": 0.8571428571428571, |
|
"eval_loss": 0.1569298505783081, |
|
"eval_overall_accuracy": 0.9595053346265762, |
|
"eval_overall_f1": 0.8176943699731903, |
|
"eval_overall_precision": 0.7644110275689223, |
|
"eval_overall_recall": 0.8789625360230547, |
|
"eval_runtime": 0.334, |
|
"eval_samples_per_second": 559.847, |
|
"eval_steps_per_second": 8.982, |
|
"step": 6572 |
|
}, |
|
{ |
|
"epoch": 63.0, |
|
"grad_norm": 4.453447341918945, |
|
"learning_rate": 1.85e-05, |
|
"loss": 0.0468, |
|
"step": 6678 |
|
}, |
|
{ |
|
"epoch": 63.0, |
|
"eval_LOCATION_f1": 0.8104575163398693, |
|
"eval_LOCATION_number": 71, |
|
"eval_LOCATION_precision": 0.7560975609756098, |
|
"eval_LOCATION_recall": 0.8732394366197183, |
|
"eval_ORGANIZATION_f1": 0.7114093959731543, |
|
"eval_ORGANIZATION_number": 65, |
|
"eval_ORGANIZATION_precision": 0.6309523809523809, |
|
"eval_ORGANIZATION_recall": 0.8153846153846154, |
|
"eval_PERSON_f1": 0.870967741935484, |
|
"eval_PERSON_number": 150, |
|
"eval_PERSON_precision": 0.84375, |
|
"eval_PERSON_recall": 0.9, |
|
"eval_QUANTITY_f1": 0.7887323943661972, |
|
"eval_QUANTITY_number": 33, |
|
"eval_QUANTITY_precision": 0.7368421052631579, |
|
"eval_QUANTITY_recall": 0.8484848484848485, |
|
"eval_TIME_f1": 0.888888888888889, |
|
"eval_TIME_number": 28, |
|
"eval_TIME_precision": 0.9230769230769231, |
|
"eval_TIME_recall": 0.8571428571428571, |
|
"eval_loss": 0.1518780142068863, |
|
"eval_overall_accuracy": 0.9612027158098934, |
|
"eval_overall_f1": 0.8195386702849389, |
|
"eval_overall_precision": 0.7743589743589744, |
|
"eval_overall_recall": 0.8703170028818443, |
|
"eval_runtime": 0.3347, |
|
"eval_samples_per_second": 558.764, |
|
"eval_steps_per_second": 8.964, |
|
"step": 6678 |
|
}, |
|
{ |
|
"epoch": 64.0, |
|
"grad_norm": 0.6715424656867981, |
|
"learning_rate": 1.8e-05, |
|
"loss": 0.0446, |
|
"step": 6784 |
|
}, |
|
{ |
|
"epoch": 64.0, |
|
"eval_LOCATION_f1": 0.7922077922077921, |
|
"eval_LOCATION_number": 71, |
|
"eval_LOCATION_precision": 0.7349397590361446, |
|
"eval_LOCATION_recall": 0.8591549295774648, |
|
"eval_ORGANIZATION_f1": 0.7272727272727272, |
|
"eval_ORGANIZATION_number": 65, |
|
"eval_ORGANIZATION_precision": 0.6666666666666666, |
|
"eval_ORGANIZATION_recall": 0.8, |
|
"eval_PERSON_f1": 0.8782051282051282, |
|
"eval_PERSON_number": 150, |
|
"eval_PERSON_precision": 0.845679012345679, |
|
"eval_PERSON_recall": 0.9133333333333333, |
|
"eval_QUANTITY_f1": 0.7605633802816901, |
|
"eval_QUANTITY_number": 33, |
|
"eval_QUANTITY_precision": 0.7105263157894737, |
|
"eval_QUANTITY_recall": 0.8181818181818182, |
|
"eval_TIME_f1": 0.888888888888889, |
|
"eval_TIME_number": 28, |
|
"eval_TIME_precision": 0.9230769230769231, |
|
"eval_TIME_recall": 0.8571428571428571, |
|
"eval_loss": 0.15471045672893524, |
|
"eval_overall_accuracy": 0.9609602327837051, |
|
"eval_overall_f1": 0.8201634877384196, |
|
"eval_overall_precision": 0.7777777777777778, |
|
"eval_overall_recall": 0.8674351585014409, |
|
"eval_runtime": 0.3347, |
|
"eval_samples_per_second": 558.76, |
|
"eval_steps_per_second": 8.964, |
|
"step": 6784 |
|
}, |
|
{ |
|
"epoch": 65.0, |
|
"grad_norm": 1.4069435596466064, |
|
"learning_rate": 1.75e-05, |
|
"loss": 0.0452, |
|
"step": 6890 |
|
}, |
|
{ |
|
"epoch": 65.0, |
|
"eval_LOCATION_f1": 0.7948717948717949, |
|
"eval_LOCATION_number": 71, |
|
"eval_LOCATION_precision": 0.7294117647058823, |
|
"eval_LOCATION_recall": 0.8732394366197183, |
|
"eval_ORGANIZATION_f1": 0.7051282051282052, |
|
"eval_ORGANIZATION_number": 65, |
|
"eval_ORGANIZATION_precision": 0.6043956043956044, |
|
"eval_ORGANIZATION_recall": 0.8461538461538461, |
|
"eval_PERSON_f1": 0.8810289389067525, |
|
"eval_PERSON_number": 150, |
|
"eval_PERSON_precision": 0.8509316770186336, |
|
"eval_PERSON_recall": 0.9133333333333333, |
|
"eval_QUANTITY_f1": 0.7567567567567567, |
|
"eval_QUANTITY_number": 33, |
|
"eval_QUANTITY_precision": 0.6829268292682927, |
|
"eval_QUANTITY_recall": 0.8484848484848485, |
|
"eval_TIME_f1": 0.888888888888889, |
|
"eval_TIME_number": 28, |
|
"eval_TIME_precision": 0.9230769230769231, |
|
"eval_TIME_recall": 0.8571428571428571, |
|
"eval_loss": 0.16312921047210693, |
|
"eval_overall_accuracy": 0.9575654704170709, |
|
"eval_overall_f1": 0.8149134487350199, |
|
"eval_overall_precision": 0.7574257425742574, |
|
"eval_overall_recall": 0.8818443804034583, |
|
"eval_runtime": 0.3337, |
|
"eval_samples_per_second": 560.419, |
|
"eval_steps_per_second": 8.991, |
|
"step": 6890 |
|
}, |
|
{ |
|
"epoch": 66.0, |
|
"grad_norm": 0.9711624383926392, |
|
"learning_rate": 1.7000000000000003e-05, |
|
"loss": 0.0442, |
|
"step": 6996 |
|
}, |
|
{ |
|
"epoch": 66.0, |
|
"eval_LOCATION_f1": 0.7948717948717949, |
|
"eval_LOCATION_number": 71, |
|
"eval_LOCATION_precision": 0.7294117647058823, |
|
"eval_LOCATION_recall": 0.8732394366197183, |
|
"eval_ORGANIZATION_f1": 0.7051282051282052, |
|
"eval_ORGANIZATION_number": 65, |
|
"eval_ORGANIZATION_precision": 0.6043956043956044, |
|
"eval_ORGANIZATION_recall": 0.8461538461538461, |
|
"eval_PERSON_f1": 0.8838709677419355, |
|
"eval_PERSON_number": 150, |
|
"eval_PERSON_precision": 0.85625, |
|
"eval_PERSON_recall": 0.9133333333333333, |
|
"eval_QUANTITY_f1": 0.7837837837837839, |
|
"eval_QUANTITY_number": 33, |
|
"eval_QUANTITY_precision": 0.7073170731707317, |
|
"eval_QUANTITY_recall": 0.8787878787878788, |
|
"eval_TIME_f1": 0.8727272727272727, |
|
"eval_TIME_number": 28, |
|
"eval_TIME_precision": 0.8888888888888888, |
|
"eval_TIME_recall": 0.8571428571428571, |
|
"eval_loss": 0.1615941822528839, |
|
"eval_overall_accuracy": 0.957807953443259, |
|
"eval_overall_f1": 0.8175765645805593, |
|
"eval_overall_precision": 0.7599009900990099, |
|
"eval_overall_recall": 0.8847262247838616, |
|
"eval_runtime": 0.3285, |
|
"eval_samples_per_second": 569.32, |
|
"eval_steps_per_second": 9.133, |
|
"step": 6996 |
|
}, |
|
{ |
|
"epoch": 67.0, |
|
"grad_norm": 0.3948928415775299, |
|
"learning_rate": 1.65e-05, |
|
"loss": 0.0431, |
|
"step": 7102 |
|
}, |
|
{ |
|
"epoch": 67.0, |
|
"eval_LOCATION_f1": 0.7898089171974522, |
|
"eval_LOCATION_number": 71, |
|
"eval_LOCATION_precision": 0.7209302325581395, |
|
"eval_LOCATION_recall": 0.8732394366197183, |
|
"eval_ORGANIZATION_f1": 0.7019867549668873, |
|
"eval_ORGANIZATION_number": 65, |
|
"eval_ORGANIZATION_precision": 0.6162790697674418, |
|
"eval_ORGANIZATION_recall": 0.8153846153846154, |
|
"eval_PERSON_f1": 0.8690095846645367, |
|
"eval_PERSON_number": 150, |
|
"eval_PERSON_precision": 0.8343558282208589, |
|
"eval_PERSON_recall": 0.9066666666666666, |
|
"eval_QUANTITY_f1": 0.7837837837837839, |
|
"eval_QUANTITY_number": 33, |
|
"eval_QUANTITY_precision": 0.7073170731707317, |
|
"eval_QUANTITY_recall": 0.8787878787878788, |
|
"eval_TIME_f1": 0.888888888888889, |
|
"eval_TIME_number": 28, |
|
"eval_TIME_precision": 0.9230769230769231, |
|
"eval_TIME_recall": 0.8571428571428571, |
|
"eval_loss": 0.16082525253295898, |
|
"eval_overall_accuracy": 0.9582929194956353, |
|
"eval_overall_f1": 0.8117489986648865, |
|
"eval_overall_precision": 0.7562189054726368, |
|
"eval_overall_recall": 0.8760806916426513, |
|
"eval_runtime": 0.3338, |
|
"eval_samples_per_second": 560.26, |
|
"eval_steps_per_second": 8.988, |
|
"step": 7102 |
|
}, |
|
{ |
|
"epoch": 68.0, |
|
"grad_norm": 1.975942611694336, |
|
"learning_rate": 1.6000000000000003e-05, |
|
"loss": 0.0427, |
|
"step": 7208 |
|
}, |
|
{ |
|
"epoch": 68.0, |
|
"eval_LOCATION_f1": 0.7924528301886792, |
|
"eval_LOCATION_number": 71, |
|
"eval_LOCATION_precision": 0.7159090909090909, |
|
"eval_LOCATION_recall": 0.8873239436619719, |
|
"eval_ORGANIZATION_f1": 0.7142857142857143, |
|
"eval_ORGANIZATION_number": 65, |
|
"eval_ORGANIZATION_precision": 0.6179775280898876, |
|
"eval_ORGANIZATION_recall": 0.8461538461538461, |
|
"eval_PERSON_f1": 0.8690095846645367, |
|
"eval_PERSON_number": 150, |
|
"eval_PERSON_precision": 0.8343558282208589, |
|
"eval_PERSON_recall": 0.9066666666666666, |
|
"eval_QUANTITY_f1": 0.7012987012987013, |
|
"eval_QUANTITY_number": 33, |
|
"eval_QUANTITY_precision": 0.6136363636363636, |
|
"eval_QUANTITY_recall": 0.8181818181818182, |
|
"eval_TIME_f1": 0.8727272727272727, |
|
"eval_TIME_number": 28, |
|
"eval_TIME_precision": 0.8888888888888888, |
|
"eval_TIME_recall": 0.8571428571428571, |
|
"eval_loss": 0.16873115301132202, |
|
"eval_overall_accuracy": 0.9556256062075654, |
|
"eval_overall_f1": 0.8047493403693932, |
|
"eval_overall_precision": 0.7420924574209246, |
|
"eval_overall_recall": 0.8789625360230547, |
|
"eval_runtime": 0.3298, |
|
"eval_samples_per_second": 567.09, |
|
"eval_steps_per_second": 9.098, |
|
"step": 7208 |
|
}, |
|
{ |
|
"epoch": 69.0, |
|
"grad_norm": 0.47350606322288513, |
|
"learning_rate": 1.55e-05, |
|
"loss": 0.043, |
|
"step": 7314 |
|
}, |
|
{ |
|
"epoch": 69.0, |
|
"eval_LOCATION_f1": 0.7924528301886792, |
|
"eval_LOCATION_number": 71, |
|
"eval_LOCATION_precision": 0.7159090909090909, |
|
"eval_LOCATION_recall": 0.8873239436619719, |
|
"eval_ORGANIZATION_f1": 0.7012987012987013, |
|
"eval_ORGANIZATION_number": 65, |
|
"eval_ORGANIZATION_precision": 0.6067415730337079, |
|
"eval_ORGANIZATION_recall": 0.8307692307692308, |
|
"eval_PERSON_f1": 0.8717948717948718, |
|
"eval_PERSON_number": 150, |
|
"eval_PERSON_precision": 0.8395061728395061, |
|
"eval_PERSON_recall": 0.9066666666666666, |
|
"eval_QUANTITY_f1": 0.7945205479452054, |
|
"eval_QUANTITY_number": 33, |
|
"eval_QUANTITY_precision": 0.725, |
|
"eval_QUANTITY_recall": 0.8787878787878788, |
|
"eval_TIME_f1": 0.888888888888889, |
|
"eval_TIME_number": 28, |
|
"eval_TIME_precision": 0.9230769230769231, |
|
"eval_TIME_recall": 0.8571428571428571, |
|
"eval_loss": 0.16365033388137817, |
|
"eval_overall_accuracy": 0.9573229873908826, |
|
"eval_overall_f1": 0.8138297872340426, |
|
"eval_overall_precision": 0.7555555555555555, |
|
"eval_overall_recall": 0.8818443804034583, |
|
"eval_runtime": 0.3349, |
|
"eval_samples_per_second": 558.297, |
|
"eval_steps_per_second": 8.957, |
|
"step": 7314 |
|
}, |
|
{ |
|
"epoch": 70.0, |
|
"grad_norm": 0.45649945735931396, |
|
"learning_rate": 1.5e-05, |
|
"loss": 0.0426, |
|
"step": 7420 |
|
}, |
|
{ |
|
"epoch": 70.0, |
|
"eval_LOCATION_f1": 0.7974683544303797, |
|
"eval_LOCATION_number": 71, |
|
"eval_LOCATION_precision": 0.7241379310344828, |
|
"eval_LOCATION_recall": 0.8873239436619719, |
|
"eval_ORGANIZATION_f1": 0.7058823529411765, |
|
"eval_ORGANIZATION_number": 65, |
|
"eval_ORGANIZATION_precision": 0.6136363636363636, |
|
"eval_ORGANIZATION_recall": 0.8307692307692308, |
|
"eval_PERSON_f1": 0.8717948717948718, |
|
"eval_PERSON_number": 150, |
|
"eval_PERSON_precision": 0.8395061728395061, |
|
"eval_PERSON_recall": 0.9066666666666666, |
|
"eval_QUANTITY_f1": 0.7945205479452054, |
|
"eval_QUANTITY_number": 33, |
|
"eval_QUANTITY_precision": 0.725, |
|
"eval_QUANTITY_recall": 0.8787878787878788, |
|
"eval_TIME_f1": 0.888888888888889, |
|
"eval_TIME_number": 28, |
|
"eval_TIME_precision": 0.9230769230769231, |
|
"eval_TIME_recall": 0.8571428571428571, |
|
"eval_loss": 0.16292014718055725, |
|
"eval_overall_accuracy": 0.9580504364694471, |
|
"eval_overall_f1": 0.816, |
|
"eval_overall_precision": 0.7593052109181141, |
|
"eval_overall_recall": 0.8818443804034583, |
|
"eval_runtime": 0.3342, |
|
"eval_samples_per_second": 559.604, |
|
"eval_steps_per_second": 8.978, |
|
"step": 7420 |
|
}, |
|
{ |
|
"epoch": 71.0, |
|
"grad_norm": 2.033871650695801, |
|
"learning_rate": 1.45e-05, |
|
"loss": 0.0439, |
|
"step": 7526 |
|
}, |
|
{ |
|
"epoch": 71.0, |
|
"eval_LOCATION_f1": 0.775, |
|
"eval_LOCATION_number": 71, |
|
"eval_LOCATION_precision": 0.6966292134831461, |
|
"eval_LOCATION_recall": 0.8732394366197183, |
|
"eval_ORGANIZATION_f1": 0.7080745341614907, |
|
"eval_ORGANIZATION_number": 65, |
|
"eval_ORGANIZATION_precision": 0.59375, |
|
"eval_ORGANIZATION_recall": 0.8769230769230769, |
|
"eval_PERSON_f1": 0.8817891373801918, |
|
"eval_PERSON_number": 150, |
|
"eval_PERSON_precision": 0.8466257668711656, |
|
"eval_PERSON_recall": 0.92, |
|
"eval_QUANTITY_f1": 0.7631578947368421, |
|
"eval_QUANTITY_number": 33, |
|
"eval_QUANTITY_precision": 0.6744186046511628, |
|
"eval_QUANTITY_recall": 0.8787878787878788, |
|
"eval_TIME_f1": 0.888888888888889, |
|
"eval_TIME_number": 28, |
|
"eval_TIME_precision": 0.9230769230769231, |
|
"eval_TIME_recall": 0.8571428571428571, |
|
"eval_loss": 0.1787422150373459, |
|
"eval_overall_accuracy": 0.9541707080504365, |
|
"eval_overall_f1": 0.81151832460733, |
|
"eval_overall_precision": 0.7434052757793765, |
|
"eval_overall_recall": 0.8933717579250721, |
|
"eval_runtime": 0.3358, |
|
"eval_samples_per_second": 556.823, |
|
"eval_steps_per_second": 8.933, |
|
"step": 7526 |
|
}, |
|
{ |
|
"epoch": 72.0, |
|
"grad_norm": 1.839992642402649, |
|
"learning_rate": 1.4000000000000001e-05, |
|
"loss": 0.0409, |
|
"step": 7632 |
|
}, |
|
{ |
|
"epoch": 72.0, |
|
"eval_LOCATION_f1": 0.7922077922077921, |
|
"eval_LOCATION_number": 71, |
|
"eval_LOCATION_precision": 0.7349397590361446, |
|
"eval_LOCATION_recall": 0.8591549295774648, |
|
"eval_ORGANIZATION_f1": 0.7105263157894737, |
|
"eval_ORGANIZATION_number": 65, |
|
"eval_ORGANIZATION_precision": 0.6206896551724138, |
|
"eval_ORGANIZATION_recall": 0.8307692307692308, |
|
"eval_PERSON_f1": 0.8745980707395499, |
|
"eval_PERSON_number": 150, |
|
"eval_PERSON_precision": 0.84472049689441, |
|
"eval_PERSON_recall": 0.9066666666666666, |
|
"eval_QUANTITY_f1": 0.7945205479452054, |
|
"eval_QUANTITY_number": 33, |
|
"eval_QUANTITY_precision": 0.725, |
|
"eval_QUANTITY_recall": 0.8787878787878788, |
|
"eval_TIME_f1": 0.888888888888889, |
|
"eval_TIME_number": 28, |
|
"eval_TIME_precision": 0.9230769230769231, |
|
"eval_TIME_recall": 0.8571428571428571, |
|
"eval_loss": 0.16144876182079315, |
|
"eval_overall_accuracy": 0.9590203685741998, |
|
"eval_overall_f1": 0.8172043010752689, |
|
"eval_overall_precision": 0.7657430730478589, |
|
"eval_overall_recall": 0.8760806916426513, |
|
"eval_runtime": 0.3288, |
|
"eval_samples_per_second": 568.779, |
|
"eval_steps_per_second": 9.125, |
|
"step": 7632 |
|
}, |
|
{ |
|
"epoch": 73.0, |
|
"grad_norm": 0.7383960485458374, |
|
"learning_rate": 1.3500000000000001e-05, |
|
"loss": 0.0404, |
|
"step": 7738 |
|
}, |
|
{ |
|
"epoch": 73.0, |
|
"eval_LOCATION_f1": 0.7974683544303797, |
|
"eval_LOCATION_number": 71, |
|
"eval_LOCATION_precision": 0.7241379310344828, |
|
"eval_LOCATION_recall": 0.8873239436619719, |
|
"eval_ORGANIZATION_f1": 0.6928104575163399, |
|
"eval_ORGANIZATION_number": 65, |
|
"eval_ORGANIZATION_precision": 0.6022727272727273, |
|
"eval_ORGANIZATION_recall": 0.8153846153846154, |
|
"eval_PERSON_f1": 0.8717948717948718, |
|
"eval_PERSON_number": 150, |
|
"eval_PERSON_precision": 0.8395061728395061, |
|
"eval_PERSON_recall": 0.9066666666666666, |
|
"eval_QUANTITY_f1": 0.7837837837837839, |
|
"eval_QUANTITY_number": 33, |
|
"eval_QUANTITY_precision": 0.7073170731707317, |
|
"eval_QUANTITY_recall": 0.8787878787878788, |
|
"eval_TIME_f1": 0.888888888888889, |
|
"eval_TIME_number": 28, |
|
"eval_TIME_precision": 0.9230769230769231, |
|
"eval_TIME_recall": 0.8571428571428571, |
|
"eval_loss": 0.16545303165912628, |
|
"eval_overall_accuracy": 0.957807953443259, |
|
"eval_overall_f1": 0.8122503328894807, |
|
"eval_overall_precision": 0.754950495049505, |
|
"eval_overall_recall": 0.8789625360230547, |
|
"eval_runtime": 0.3357, |
|
"eval_samples_per_second": 557.128, |
|
"eval_steps_per_second": 8.938, |
|
"step": 7738 |
|
}, |
|
{ |
|
"epoch": 74.0, |
|
"grad_norm": 1.1772239208221436, |
|
"learning_rate": 1.3000000000000001e-05, |
|
"loss": 0.0399, |
|
"step": 7844 |
|
}, |
|
{ |
|
"epoch": 74.0, |
|
"eval_LOCATION_f1": 0.8076923076923077, |
|
"eval_LOCATION_number": 71, |
|
"eval_LOCATION_precision": 0.7411764705882353, |
|
"eval_LOCATION_recall": 0.8873239436619719, |
|
"eval_ORGANIZATION_f1": 0.6883116883116883, |
|
"eval_ORGANIZATION_number": 65, |
|
"eval_ORGANIZATION_precision": 0.5955056179775281, |
|
"eval_ORGANIZATION_recall": 0.8153846153846154, |
|
"eval_PERSON_f1": 0.8717948717948718, |
|
"eval_PERSON_number": 150, |
|
"eval_PERSON_precision": 0.8395061728395061, |
|
"eval_PERSON_recall": 0.9066666666666666, |
|
"eval_QUANTITY_f1": 0.7837837837837839, |
|
"eval_QUANTITY_number": 33, |
|
"eval_QUANTITY_precision": 0.7073170731707317, |
|
"eval_QUANTITY_recall": 0.8787878787878788, |
|
"eval_TIME_f1": 0.888888888888889, |
|
"eval_TIME_number": 28, |
|
"eval_TIME_precision": 0.9230769230769231, |
|
"eval_TIME_recall": 0.8571428571428571, |
|
"eval_loss": 0.16691727936267853, |
|
"eval_overall_accuracy": 0.9585354025218235, |
|
"eval_overall_f1": 0.8133333333333335, |
|
"eval_overall_precision": 0.7568238213399504, |
|
"eval_overall_recall": 0.8789625360230547, |
|
"eval_runtime": 0.3275, |
|
"eval_samples_per_second": 570.978, |
|
"eval_steps_per_second": 9.16, |
|
"step": 7844 |
|
}, |
|
{ |
|
"epoch": 75.0, |
|
"grad_norm": 0.3011506497859955, |
|
"learning_rate": 1.25e-05, |
|
"loss": 0.04, |
|
"step": 7950 |
|
}, |
|
{ |
|
"epoch": 75.0, |
|
"eval_LOCATION_f1": 0.7974683544303797, |
|
"eval_LOCATION_number": 71, |
|
"eval_LOCATION_precision": 0.7241379310344828, |
|
"eval_LOCATION_recall": 0.8873239436619719, |
|
"eval_ORGANIZATION_f1": 0.7105263157894737, |
|
"eval_ORGANIZATION_number": 65, |
|
"eval_ORGANIZATION_precision": 0.6206896551724138, |
|
"eval_ORGANIZATION_recall": 0.8307692307692308, |
|
"eval_PERSON_f1": 0.8774193548387097, |
|
"eval_PERSON_number": 150, |
|
"eval_PERSON_precision": 0.85, |
|
"eval_PERSON_recall": 0.9066666666666666, |
|
"eval_QUANTITY_f1": 0.7837837837837839, |
|
"eval_QUANTITY_number": 33, |
|
"eval_QUANTITY_precision": 0.7073170731707317, |
|
"eval_QUANTITY_recall": 0.8787878787878788, |
|
"eval_TIME_f1": 0.888888888888889, |
|
"eval_TIME_number": 28, |
|
"eval_TIME_precision": 0.9230769230769231, |
|
"eval_TIME_recall": 0.8571428571428571, |
|
"eval_loss": 0.16395699977874756, |
|
"eval_overall_accuracy": 0.9582929194956353, |
|
"eval_overall_f1": 0.8181818181818181, |
|
"eval_overall_precision": 0.7630922693266833, |
|
"eval_overall_recall": 0.8818443804034583, |
|
"eval_runtime": 0.3338, |
|
"eval_samples_per_second": 560.152, |
|
"eval_steps_per_second": 8.986, |
|
"step": 7950 |
|
}, |
|
{ |
|
"epoch": 76.0, |
|
"grad_norm": 1.2410697937011719, |
|
"learning_rate": 1.2e-05, |
|
"loss": 0.0402, |
|
"step": 8056 |
|
}, |
|
{ |
|
"epoch": 76.0, |
|
"eval_LOCATION_f1": 0.7924528301886792, |
|
"eval_LOCATION_number": 71, |
|
"eval_LOCATION_precision": 0.7159090909090909, |
|
"eval_LOCATION_recall": 0.8873239436619719, |
|
"eval_ORGANIZATION_f1": 0.7012987012987013, |
|
"eval_ORGANIZATION_number": 65, |
|
"eval_ORGANIZATION_precision": 0.6067415730337079, |
|
"eval_ORGANIZATION_recall": 0.8307692307692308, |
|
"eval_PERSON_f1": 0.8717948717948718, |
|
"eval_PERSON_number": 150, |
|
"eval_PERSON_precision": 0.8395061728395061, |
|
"eval_PERSON_recall": 0.9066666666666666, |
|
"eval_QUANTITY_f1": 0.7837837837837839, |
|
"eval_QUANTITY_number": 33, |
|
"eval_QUANTITY_precision": 0.7073170731707317, |
|
"eval_QUANTITY_recall": 0.8787878787878788, |
|
"eval_TIME_f1": 0.888888888888889, |
|
"eval_TIME_number": 28, |
|
"eval_TIME_precision": 0.9230769230769231, |
|
"eval_TIME_recall": 0.8571428571428571, |
|
"eval_loss": 0.16832870244979858, |
|
"eval_overall_accuracy": 0.957807953443259, |
|
"eval_overall_f1": 0.8127490039840637, |
|
"eval_overall_precision": 0.7536945812807881, |
|
"eval_overall_recall": 0.8818443804034583, |
|
"eval_runtime": 0.3293, |
|
"eval_samples_per_second": 567.933, |
|
"eval_steps_per_second": 9.111, |
|
"step": 8056 |
|
}, |
|
{ |
|
"epoch": 77.0, |
|
"grad_norm": 1.8908904790878296, |
|
"learning_rate": 1.1500000000000002e-05, |
|
"loss": 0.0402, |
|
"step": 8162 |
|
}, |
|
{ |
|
"epoch": 77.0, |
|
"eval_LOCATION_f1": 0.7875000000000001, |
|
"eval_LOCATION_number": 71, |
|
"eval_LOCATION_precision": 0.7078651685393258, |
|
"eval_LOCATION_recall": 0.8873239436619719, |
|
"eval_ORGANIZATION_f1": 0.7066666666666667, |
|
"eval_ORGANIZATION_number": 65, |
|
"eval_ORGANIZATION_precision": 0.6235294117647059, |
|
"eval_ORGANIZATION_recall": 0.8153846153846154, |
|
"eval_PERSON_f1": 0.8690095846645367, |
|
"eval_PERSON_number": 150, |
|
"eval_PERSON_precision": 0.8343558282208589, |
|
"eval_PERSON_recall": 0.9066666666666666, |
|
"eval_QUANTITY_f1": 0.7567567567567567, |
|
"eval_QUANTITY_number": 33, |
|
"eval_QUANTITY_precision": 0.6829268292682927, |
|
"eval_QUANTITY_recall": 0.8484848484848485, |
|
"eval_TIME_f1": 0.888888888888889, |
|
"eval_TIME_number": 28, |
|
"eval_TIME_precision": 0.9230769230769231, |
|
"eval_TIME_recall": 0.8571428571428571, |
|
"eval_loss": 0.17024052143096924, |
|
"eval_overall_accuracy": 0.9575654704170709, |
|
"eval_overall_f1": 0.8095872170439414, |
|
"eval_overall_precision": 0.7524752475247525, |
|
"eval_overall_recall": 0.8760806916426513, |
|
"eval_runtime": 0.3354, |
|
"eval_samples_per_second": 557.526, |
|
"eval_steps_per_second": 8.944, |
|
"step": 8162 |
|
}, |
|
{ |
|
"epoch": 78.0, |
|
"grad_norm": 0.9162412881851196, |
|
"learning_rate": 1.1000000000000001e-05, |
|
"loss": 0.0379, |
|
"step": 8268 |
|
}, |
|
{ |
|
"epoch": 78.0, |
|
"eval_LOCATION_f1": 0.7924528301886792, |
|
"eval_LOCATION_number": 71, |
|
"eval_LOCATION_precision": 0.7159090909090909, |
|
"eval_LOCATION_recall": 0.8873239436619719, |
|
"eval_ORGANIZATION_f1": 0.6928104575163399, |
|
"eval_ORGANIZATION_number": 65, |
|
"eval_ORGANIZATION_precision": 0.6022727272727273, |
|
"eval_ORGANIZATION_recall": 0.8153846153846154, |
|
"eval_PERSON_f1": 0.8653846153846153, |
|
"eval_PERSON_number": 150, |
|
"eval_PERSON_precision": 0.8333333333333334, |
|
"eval_PERSON_recall": 0.9, |
|
"eval_QUANTITY_f1": 0.7945205479452054, |
|
"eval_QUANTITY_number": 33, |
|
"eval_QUANTITY_precision": 0.725, |
|
"eval_QUANTITY_recall": 0.8787878787878788, |
|
"eval_TIME_f1": 0.888888888888889, |
|
"eval_TIME_number": 28, |
|
"eval_TIME_precision": 0.9230769230769231, |
|
"eval_TIME_recall": 0.8571428571428571, |
|
"eval_loss": 0.16936184465885162, |
|
"eval_overall_accuracy": 0.9582929194956353, |
|
"eval_overall_f1": 0.8095872170439414, |
|
"eval_overall_precision": 0.7524752475247525, |
|
"eval_overall_recall": 0.8760806916426513, |
|
"eval_runtime": 0.3352, |
|
"eval_samples_per_second": 557.918, |
|
"eval_steps_per_second": 8.951, |
|
"step": 8268 |
|
}, |
|
{ |
|
"epoch": 79.0, |
|
"grad_norm": 0.6435752511024475, |
|
"learning_rate": 1.05e-05, |
|
"loss": 0.0371, |
|
"step": 8374 |
|
}, |
|
{ |
|
"epoch": 79.0, |
|
"eval_LOCATION_f1": 0.7924528301886792, |
|
"eval_LOCATION_number": 71, |
|
"eval_LOCATION_precision": 0.7159090909090909, |
|
"eval_LOCATION_recall": 0.8873239436619719, |
|
"eval_ORGANIZATION_f1": 0.6883116883116883, |
|
"eval_ORGANIZATION_number": 65, |
|
"eval_ORGANIZATION_precision": 0.5955056179775281, |
|
"eval_ORGANIZATION_recall": 0.8153846153846154, |
|
"eval_PERSON_f1": 0.8810289389067525, |
|
"eval_PERSON_number": 150, |
|
"eval_PERSON_precision": 0.8509316770186336, |
|
"eval_PERSON_recall": 0.9133333333333333, |
|
"eval_QUANTITY_f1": 0.7567567567567567, |
|
"eval_QUANTITY_number": 33, |
|
"eval_QUANTITY_precision": 0.6829268292682927, |
|
"eval_QUANTITY_recall": 0.8484848484848485, |
|
"eval_TIME_f1": 0.8727272727272727, |
|
"eval_TIME_number": 28, |
|
"eval_TIME_precision": 0.8888888888888888, |
|
"eval_TIME_recall": 0.8571428571428571, |
|
"eval_loss": 0.1731194704771042, |
|
"eval_overall_accuracy": 0.9575654704170709, |
|
"eval_overall_f1": 0.8100929614873836, |
|
"eval_overall_precision": 0.7512315270935961, |
|
"eval_overall_recall": 0.8789625360230547, |
|
"eval_runtime": 0.3345, |
|
"eval_samples_per_second": 559.06, |
|
"eval_steps_per_second": 8.969, |
|
"step": 8374 |
|
}, |
|
{ |
|
"epoch": 80.0, |
|
"grad_norm": 0.5504117608070374, |
|
"learning_rate": 1e-05, |
|
"loss": 0.0375, |
|
"step": 8480 |
|
}, |
|
{ |
|
"epoch": 80.0, |
|
"eval_LOCATION_f1": 0.8025477707006369, |
|
"eval_LOCATION_number": 71, |
|
"eval_LOCATION_precision": 0.7325581395348837, |
|
"eval_LOCATION_recall": 0.8873239436619719, |
|
"eval_ORGANIZATION_f1": 0.6883116883116883, |
|
"eval_ORGANIZATION_number": 65, |
|
"eval_ORGANIZATION_precision": 0.5955056179775281, |
|
"eval_ORGANIZATION_recall": 0.8153846153846154, |
|
"eval_PERSON_f1": 0.8810289389067525, |
|
"eval_PERSON_number": 150, |
|
"eval_PERSON_precision": 0.8509316770186336, |
|
"eval_PERSON_recall": 0.9133333333333333, |
|
"eval_QUANTITY_f1": 0.7671232876712328, |
|
"eval_QUANTITY_number": 33, |
|
"eval_QUANTITY_precision": 0.7, |
|
"eval_QUANTITY_recall": 0.8484848484848485, |
|
"eval_TIME_f1": 0.888888888888889, |
|
"eval_TIME_number": 28, |
|
"eval_TIME_precision": 0.9230769230769231, |
|
"eval_TIME_recall": 0.8571428571428571, |
|
"eval_loss": 0.17014098167419434, |
|
"eval_overall_accuracy": 0.9575654704170709, |
|
"eval_overall_f1": 0.8144192256341789, |
|
"eval_overall_precision": 0.7587064676616916, |
|
"eval_overall_recall": 0.8789625360230547, |
|
"eval_runtime": 0.3343, |
|
"eval_samples_per_second": 559.339, |
|
"eval_steps_per_second": 8.973, |
|
"step": 8480 |
|
}, |
|
{ |
|
"epoch": 81.0, |
|
"grad_norm": 0.46581876277923584, |
|
"learning_rate": 9.5e-06, |
|
"loss": 0.0367, |
|
"step": 8586 |
|
}, |
|
{ |
|
"epoch": 81.0, |
|
"eval_LOCATION_f1": 0.7898089171974522, |
|
"eval_LOCATION_number": 71, |
|
"eval_LOCATION_precision": 0.7209302325581395, |
|
"eval_LOCATION_recall": 0.8732394366197183, |
|
"eval_ORGANIZATION_f1": 0.6883116883116883, |
|
"eval_ORGANIZATION_number": 65, |
|
"eval_ORGANIZATION_precision": 0.5955056179775281, |
|
"eval_ORGANIZATION_recall": 0.8153846153846154, |
|
"eval_PERSON_f1": 0.8726114649681529, |
|
"eval_PERSON_number": 150, |
|
"eval_PERSON_precision": 0.8353658536585366, |
|
"eval_PERSON_recall": 0.9133333333333333, |
|
"eval_QUANTITY_f1": 0.7837837837837839, |
|
"eval_QUANTITY_number": 33, |
|
"eval_QUANTITY_precision": 0.7073170731707317, |
|
"eval_QUANTITY_recall": 0.8787878787878788, |
|
"eval_TIME_f1": 0.888888888888889, |
|
"eval_TIME_number": 28, |
|
"eval_TIME_precision": 0.9230769230769231, |
|
"eval_TIME_recall": 0.8571428571428571, |
|
"eval_loss": 0.16831910610198975, |
|
"eval_overall_accuracy": 0.9575654704170709, |
|
"eval_overall_f1": 0.8100929614873836, |
|
"eval_overall_precision": 0.7512315270935961, |
|
"eval_overall_recall": 0.8789625360230547, |
|
"eval_runtime": 0.3306, |
|
"eval_samples_per_second": 565.697, |
|
"eval_steps_per_second": 9.075, |
|
"step": 8586 |
|
}, |
|
{ |
|
"epoch": 82.0, |
|
"grad_norm": 1.1437621116638184, |
|
"learning_rate": 9e-06, |
|
"loss": 0.0369, |
|
"step": 8692 |
|
}, |
|
{ |
|
"epoch": 82.0, |
|
"eval_LOCATION_f1": 0.7974683544303797, |
|
"eval_LOCATION_number": 71, |
|
"eval_LOCATION_precision": 0.7241379310344828, |
|
"eval_LOCATION_recall": 0.8873239436619719, |
|
"eval_ORGANIZATION_f1": 0.6794871794871795, |
|
"eval_ORGANIZATION_number": 65, |
|
"eval_ORGANIZATION_precision": 0.5824175824175825, |
|
"eval_ORGANIZATION_recall": 0.8153846153846154, |
|
"eval_PERSON_f1": 0.8846153846153846, |
|
"eval_PERSON_number": 150, |
|
"eval_PERSON_precision": 0.8518518518518519, |
|
"eval_PERSON_recall": 0.92, |
|
"eval_QUANTITY_f1": 0.7837837837837839, |
|
"eval_QUANTITY_number": 33, |
|
"eval_QUANTITY_precision": 0.7073170731707317, |
|
"eval_QUANTITY_recall": 0.8787878787878788, |
|
"eval_TIME_f1": 0.8727272727272727, |
|
"eval_TIME_number": 28, |
|
"eval_TIME_precision": 0.8888888888888888, |
|
"eval_TIME_recall": 0.8571428571428571, |
|
"eval_loss": 0.17457380890846252, |
|
"eval_overall_accuracy": 0.9570805043646945, |
|
"eval_overall_f1": 0.8132450331125827, |
|
"eval_overall_precision": 0.7524509803921569, |
|
"eval_overall_recall": 0.8847262247838616, |
|
"eval_runtime": 0.3281, |
|
"eval_samples_per_second": 569.937, |
|
"eval_steps_per_second": 9.143, |
|
"step": 8692 |
|
}, |
|
{ |
|
"epoch": 83.0, |
|
"grad_norm": 1.673567771911621, |
|
"learning_rate": 8.500000000000002e-06, |
|
"loss": 0.0382, |
|
"step": 8798 |
|
}, |
|
{ |
|
"epoch": 83.0, |
|
"eval_LOCATION_f1": 0.7848101265822784, |
|
"eval_LOCATION_number": 71, |
|
"eval_LOCATION_precision": 0.7126436781609196, |
|
"eval_LOCATION_recall": 0.8732394366197183, |
|
"eval_ORGANIZATION_f1": 0.7019867549668873, |
|
"eval_ORGANIZATION_number": 65, |
|
"eval_ORGANIZATION_precision": 0.6162790697674418, |
|
"eval_ORGANIZATION_recall": 0.8153846153846154, |
|
"eval_PERSON_f1": 0.8690095846645367, |
|
"eval_PERSON_number": 150, |
|
"eval_PERSON_precision": 0.8343558282208589, |
|
"eval_PERSON_recall": 0.9066666666666666, |
|
"eval_QUANTITY_f1": 0.7837837837837839, |
|
"eval_QUANTITY_number": 33, |
|
"eval_QUANTITY_precision": 0.7073170731707317, |
|
"eval_QUANTITY_recall": 0.8787878787878788, |
|
"eval_TIME_f1": 0.888888888888889, |
|
"eval_TIME_number": 28, |
|
"eval_TIME_precision": 0.9230769230769231, |
|
"eval_TIME_recall": 0.8571428571428571, |
|
"eval_loss": 0.16617552936077118, |
|
"eval_overall_accuracy": 0.9580504364694471, |
|
"eval_overall_f1": 0.8106666666666668, |
|
"eval_overall_precision": 0.7543424317617866, |
|
"eval_overall_recall": 0.8760806916426513, |
|
"eval_runtime": 0.3288, |
|
"eval_samples_per_second": 568.811, |
|
"eval_steps_per_second": 9.125, |
|
"step": 8798 |
|
}, |
|
{ |
|
"epoch": 84.0, |
|
"grad_norm": 0.8704581260681152, |
|
"learning_rate": 8.000000000000001e-06, |
|
"loss": 0.0376, |
|
"step": 8904 |
|
}, |
|
{ |
|
"epoch": 84.0, |
|
"eval_LOCATION_f1": 0.7974683544303797, |
|
"eval_LOCATION_number": 71, |
|
"eval_LOCATION_precision": 0.7241379310344828, |
|
"eval_LOCATION_recall": 0.8873239436619719, |
|
"eval_ORGANIZATION_f1": 0.6973684210526315, |
|
"eval_ORGANIZATION_number": 65, |
|
"eval_ORGANIZATION_precision": 0.6091954022988506, |
|
"eval_ORGANIZATION_recall": 0.8153846153846154, |
|
"eval_PERSON_f1": 0.8782051282051282, |
|
"eval_PERSON_number": 150, |
|
"eval_PERSON_precision": 0.845679012345679, |
|
"eval_PERSON_recall": 0.9133333333333333, |
|
"eval_QUANTITY_f1": 0.7567567567567567, |
|
"eval_QUANTITY_number": 33, |
|
"eval_QUANTITY_precision": 0.6829268292682927, |
|
"eval_QUANTITY_recall": 0.8484848484848485, |
|
"eval_TIME_f1": 0.888888888888889, |
|
"eval_TIME_number": 28, |
|
"eval_TIME_precision": 0.9230769230769231, |
|
"eval_TIME_recall": 0.8571428571428571, |
|
"eval_loss": 0.16935382783412933, |
|
"eval_overall_accuracy": 0.9582929194956353, |
|
"eval_overall_f1": 0.8133333333333335, |
|
"eval_overall_precision": 0.7568238213399504, |
|
"eval_overall_recall": 0.8789625360230547, |
|
"eval_runtime": 0.3375, |
|
"eval_samples_per_second": 554.036, |
|
"eval_steps_per_second": 8.888, |
|
"step": 8904 |
|
}, |
|
{ |
|
"epoch": 85.0, |
|
"grad_norm": 2.838458299636841, |
|
"learning_rate": 7.5e-06, |
|
"loss": 0.0372, |
|
"step": 9010 |
|
}, |
|
{ |
|
"epoch": 85.0, |
|
"eval_LOCATION_f1": 0.7974683544303797, |
|
"eval_LOCATION_number": 71, |
|
"eval_LOCATION_precision": 0.7241379310344828, |
|
"eval_LOCATION_recall": 0.8873239436619719, |
|
"eval_ORGANIZATION_f1": 0.7006369426751592, |
|
"eval_ORGANIZATION_number": 65, |
|
"eval_ORGANIZATION_precision": 0.5978260869565217, |
|
"eval_ORGANIZATION_recall": 0.8461538461538461, |
|
"eval_PERSON_f1": 0.8810289389067525, |
|
"eval_PERSON_number": 150, |
|
"eval_PERSON_precision": 0.8509316770186336, |
|
"eval_PERSON_recall": 0.9133333333333333, |
|
"eval_QUANTITY_f1": 0.7671232876712328, |
|
"eval_QUANTITY_number": 33, |
|
"eval_QUANTITY_precision": 0.7, |
|
"eval_QUANTITY_recall": 0.8484848484848485, |
|
"eval_TIME_f1": 0.8727272727272727, |
|
"eval_TIME_number": 28, |
|
"eval_TIME_precision": 0.8888888888888888, |
|
"eval_TIME_recall": 0.8571428571428571, |
|
"eval_loss": 0.17407700419425964, |
|
"eval_overall_accuracy": 0.9570805043646945, |
|
"eval_overall_f1": 0.8143236074270557, |
|
"eval_overall_precision": 0.7542997542997543, |
|
"eval_overall_recall": 0.8847262247838616, |
|
"eval_runtime": 0.3278, |
|
"eval_samples_per_second": 570.491, |
|
"eval_steps_per_second": 9.152, |
|
"step": 9010 |
|
}, |
|
{ |
|
"epoch": 86.0, |
|
"grad_norm": 0.5828319191932678, |
|
"learning_rate": 7.000000000000001e-06, |
|
"loss": 0.0351, |
|
"step": 9116 |
|
}, |
|
{ |
|
"epoch": 86.0, |
|
"eval_LOCATION_f1": 0.7924528301886792, |
|
"eval_LOCATION_number": 71, |
|
"eval_LOCATION_precision": 0.7159090909090909, |
|
"eval_LOCATION_recall": 0.8873239436619719, |
|
"eval_ORGANIZATION_f1": 0.6928104575163399, |
|
"eval_ORGANIZATION_number": 65, |
|
"eval_ORGANIZATION_precision": 0.6022727272727273, |
|
"eval_ORGANIZATION_recall": 0.8153846153846154, |
|
"eval_PERSON_f1": 0.8745980707395499, |
|
"eval_PERSON_number": 150, |
|
"eval_PERSON_precision": 0.84472049689441, |
|
"eval_PERSON_recall": 0.9066666666666666, |
|
"eval_QUANTITY_f1": 0.7837837837837839, |
|
"eval_QUANTITY_number": 33, |
|
"eval_QUANTITY_precision": 0.7073170731707317, |
|
"eval_QUANTITY_recall": 0.8787878787878788, |
|
"eval_TIME_f1": 0.8727272727272727, |
|
"eval_TIME_number": 28, |
|
"eval_TIME_precision": 0.8888888888888888, |
|
"eval_TIME_recall": 0.8571428571428571, |
|
"eval_loss": 0.17182248830795288, |
|
"eval_overall_accuracy": 0.957807953443259, |
|
"eval_overall_f1": 0.8111702127659575, |
|
"eval_overall_precision": 0.7530864197530864, |
|
"eval_overall_recall": 0.8789625360230547, |
|
"eval_runtime": 0.3288, |
|
"eval_samples_per_second": 568.789, |
|
"eval_steps_per_second": 9.125, |
|
"step": 9116 |
|
}, |
|
{ |
|
"epoch": 87.0, |
|
"grad_norm": 0.9350789189338684, |
|
"learning_rate": 6.5000000000000004e-06, |
|
"loss": 0.0348, |
|
"step": 9222 |
|
}, |
|
{ |
|
"epoch": 87.0, |
|
"eval_LOCATION_f1": 0.7974683544303797, |
|
"eval_LOCATION_number": 71, |
|
"eval_LOCATION_precision": 0.7241379310344828, |
|
"eval_LOCATION_recall": 0.8873239436619719, |
|
"eval_ORGANIZATION_f1": 0.6838709677419356, |
|
"eval_ORGANIZATION_number": 65, |
|
"eval_ORGANIZATION_precision": 0.5888888888888889, |
|
"eval_ORGANIZATION_recall": 0.8153846153846154, |
|
"eval_PERSON_f1": 0.8717948717948718, |
|
"eval_PERSON_number": 150, |
|
"eval_PERSON_precision": 0.8395061728395061, |
|
"eval_PERSON_recall": 0.9066666666666666, |
|
"eval_QUANTITY_f1": 0.7837837837837839, |
|
"eval_QUANTITY_number": 33, |
|
"eval_QUANTITY_precision": 0.7073170731707317, |
|
"eval_QUANTITY_recall": 0.8787878787878788, |
|
"eval_TIME_f1": 0.888888888888889, |
|
"eval_TIME_number": 28, |
|
"eval_TIME_precision": 0.9230769230769231, |
|
"eval_TIME_recall": 0.8571428571428571, |
|
"eval_loss": 0.17128072679042816, |
|
"eval_overall_accuracy": 0.9580504364694471, |
|
"eval_overall_f1": 0.8100929614873836, |
|
"eval_overall_precision": 0.7512315270935961, |
|
"eval_overall_recall": 0.8789625360230547, |
|
"eval_runtime": 0.3283, |
|
"eval_samples_per_second": 569.617, |
|
"eval_steps_per_second": 9.138, |
|
"step": 9222 |
|
}, |
|
{ |
|
"epoch": 88.0, |
|
"grad_norm": 1.2203199863433838, |
|
"learning_rate": 6e-06, |
|
"loss": 0.0363, |
|
"step": 9328 |
|
}, |
|
{ |
|
"epoch": 88.0, |
|
"eval_LOCATION_f1": 0.7974683544303797, |
|
"eval_LOCATION_number": 71, |
|
"eval_LOCATION_precision": 0.7241379310344828, |
|
"eval_LOCATION_recall": 0.8873239436619719, |
|
"eval_ORGANIZATION_f1": 0.6973684210526315, |
|
"eval_ORGANIZATION_number": 65, |
|
"eval_ORGANIZATION_precision": 0.6091954022988506, |
|
"eval_ORGANIZATION_recall": 0.8153846153846154, |
|
"eval_PERSON_f1": 0.8745980707395499, |
|
"eval_PERSON_number": 150, |
|
"eval_PERSON_precision": 0.84472049689441, |
|
"eval_PERSON_recall": 0.9066666666666666, |
|
"eval_QUANTITY_f1": 0.7837837837837839, |
|
"eval_QUANTITY_number": 33, |
|
"eval_QUANTITY_precision": 0.7073170731707317, |
|
"eval_QUANTITY_recall": 0.8787878787878788, |
|
"eval_TIME_f1": 0.888888888888889, |
|
"eval_TIME_number": 28, |
|
"eval_TIME_precision": 0.9230769230769231, |
|
"eval_TIME_recall": 0.8571428571428571, |
|
"eval_loss": 0.17074672877788544, |
|
"eval_overall_accuracy": 0.9585354025218235, |
|
"eval_overall_f1": 0.8144192256341789, |
|
"eval_overall_precision": 0.7587064676616916, |
|
"eval_overall_recall": 0.8789625360230547, |
|
"eval_runtime": 0.3349, |
|
"eval_samples_per_second": 558.334, |
|
"eval_steps_per_second": 8.957, |
|
"step": 9328 |
|
}, |
|
{ |
|
"epoch": 89.0, |
|
"grad_norm": 0.67624431848526, |
|
"learning_rate": 5.500000000000001e-06, |
|
"loss": 0.0371, |
|
"step": 9434 |
|
}, |
|
{ |
|
"epoch": 89.0, |
|
"eval_LOCATION_f1": 0.7924528301886792, |
|
"eval_LOCATION_number": 71, |
|
"eval_LOCATION_precision": 0.7159090909090909, |
|
"eval_LOCATION_recall": 0.8873239436619719, |
|
"eval_ORGANIZATION_f1": 0.6883116883116883, |
|
"eval_ORGANIZATION_number": 65, |
|
"eval_ORGANIZATION_precision": 0.5955056179775281, |
|
"eval_ORGANIZATION_recall": 0.8153846153846154, |
|
"eval_PERSON_f1": 0.8753993610223643, |
|
"eval_PERSON_number": 150, |
|
"eval_PERSON_precision": 0.8404907975460123, |
|
"eval_PERSON_recall": 0.9133333333333333, |
|
"eval_QUANTITY_f1": 0.7837837837837839, |
|
"eval_QUANTITY_number": 33, |
|
"eval_QUANTITY_precision": 0.7073170731707317, |
|
"eval_QUANTITY_recall": 0.8787878787878788, |
|
"eval_TIME_f1": 0.888888888888889, |
|
"eval_TIME_number": 28, |
|
"eval_TIME_precision": 0.9230769230769231, |
|
"eval_TIME_recall": 0.8571428571428571, |
|
"eval_loss": 0.17176063358783722, |
|
"eval_overall_accuracy": 0.9575654704170709, |
|
"eval_overall_f1": 0.8116710875331565, |
|
"eval_overall_precision": 0.7518427518427518, |
|
"eval_overall_recall": 0.8818443804034583, |
|
"eval_runtime": 0.3296, |
|
"eval_samples_per_second": 567.418, |
|
"eval_steps_per_second": 9.103, |
|
"step": 9434 |
|
}, |
|
{ |
|
"epoch": 90.0, |
|
"grad_norm": 1.9259661436080933, |
|
"learning_rate": 5e-06, |
|
"loss": 0.0367, |
|
"step": 9540 |
|
}, |
|
{ |
|
"epoch": 90.0, |
|
"eval_LOCATION_f1": 0.8025477707006369, |
|
"eval_LOCATION_number": 71, |
|
"eval_LOCATION_precision": 0.7325581395348837, |
|
"eval_LOCATION_recall": 0.8873239436619719, |
|
"eval_ORGANIZATION_f1": 0.6973684210526315, |
|
"eval_ORGANIZATION_number": 65, |
|
"eval_ORGANIZATION_precision": 0.6091954022988506, |
|
"eval_ORGANIZATION_recall": 0.8153846153846154, |
|
"eval_PERSON_f1": 0.887459807073955, |
|
"eval_PERSON_number": 150, |
|
"eval_PERSON_precision": 0.8571428571428571, |
|
"eval_PERSON_recall": 0.92, |
|
"eval_QUANTITY_f1": 0.7837837837837839, |
|
"eval_QUANTITY_number": 33, |
|
"eval_QUANTITY_precision": 0.7073170731707317, |
|
"eval_QUANTITY_recall": 0.8787878787878788, |
|
"eval_TIME_f1": 0.888888888888889, |
|
"eval_TIME_number": 28, |
|
"eval_TIME_precision": 0.9230769230769231, |
|
"eval_TIME_recall": 0.8571428571428571, |
|
"eval_loss": 0.17073224484920502, |
|
"eval_overall_accuracy": 0.9590203685741998, |
|
"eval_overall_f1": 0.820855614973262, |
|
"eval_overall_precision": 0.7655860349127181, |
|
"eval_overall_recall": 0.8847262247838616, |
|
"eval_runtime": 0.3289, |
|
"eval_samples_per_second": 568.538, |
|
"eval_steps_per_second": 9.121, |
|
"step": 9540 |
|
}, |
|
{ |
|
"epoch": 91.0, |
|
"grad_norm": 0.5366353392601013, |
|
"learning_rate": 4.5e-06, |
|
"loss": 0.0349, |
|
"step": 9646 |
|
}, |
|
{ |
|
"epoch": 91.0, |
|
"eval_LOCATION_f1": 0.7974683544303797, |
|
"eval_LOCATION_number": 71, |
|
"eval_LOCATION_precision": 0.7241379310344828, |
|
"eval_LOCATION_recall": 0.8873239436619719, |
|
"eval_ORGANIZATION_f1": 0.7096774193548387, |
|
"eval_ORGANIZATION_number": 65, |
|
"eval_ORGANIZATION_precision": 0.6111111111111112, |
|
"eval_ORGANIZATION_recall": 0.8461538461538461, |
|
"eval_PERSON_f1": 0.8717948717948718, |
|
"eval_PERSON_number": 150, |
|
"eval_PERSON_precision": 0.8395061728395061, |
|
"eval_PERSON_recall": 0.9066666666666666, |
|
"eval_QUANTITY_f1": 0.7837837837837839, |
|
"eval_QUANTITY_number": 33, |
|
"eval_QUANTITY_precision": 0.7073170731707317, |
|
"eval_QUANTITY_recall": 0.8787878787878788, |
|
"eval_TIME_f1": 0.888888888888889, |
|
"eval_TIME_number": 28, |
|
"eval_TIME_precision": 0.9230769230769231, |
|
"eval_TIME_recall": 0.8571428571428571, |
|
"eval_loss": 0.17369931936264038, |
|
"eval_overall_accuracy": 0.957807953443259, |
|
"eval_overall_f1": 0.8154050464807437, |
|
"eval_overall_precision": 0.7561576354679803, |
|
"eval_overall_recall": 0.8847262247838616, |
|
"eval_runtime": 0.3356, |
|
"eval_samples_per_second": 557.153, |
|
"eval_steps_per_second": 8.938, |
|
"step": 9646 |
|
}, |
|
{ |
|
"epoch": 92.0, |
|
"grad_norm": 0.7619331479072571, |
|
"learning_rate": 4.000000000000001e-06, |
|
"loss": 0.0357, |
|
"step": 9752 |
|
}, |
|
{ |
|
"epoch": 92.0, |
|
"eval_LOCATION_f1": 0.8025477707006369, |
|
"eval_LOCATION_number": 71, |
|
"eval_LOCATION_precision": 0.7325581395348837, |
|
"eval_LOCATION_recall": 0.8873239436619719, |
|
"eval_ORGANIZATION_f1": 0.7066666666666667, |
|
"eval_ORGANIZATION_number": 65, |
|
"eval_ORGANIZATION_precision": 0.6235294117647059, |
|
"eval_ORGANIZATION_recall": 0.8153846153846154, |
|
"eval_PERSON_f1": 0.8782051282051282, |
|
"eval_PERSON_number": 150, |
|
"eval_PERSON_precision": 0.845679012345679, |
|
"eval_PERSON_recall": 0.9133333333333333, |
|
"eval_QUANTITY_f1": 0.7837837837837839, |
|
"eval_QUANTITY_number": 33, |
|
"eval_QUANTITY_precision": 0.7073170731707317, |
|
"eval_QUANTITY_recall": 0.8787878787878788, |
|
"eval_TIME_f1": 0.888888888888889, |
|
"eval_TIME_number": 28, |
|
"eval_TIME_precision": 0.9230769230769231, |
|
"eval_TIME_recall": 0.8571428571428571, |
|
"eval_loss": 0.16904906928539276, |
|
"eval_overall_accuracy": 0.9590203685741998, |
|
"eval_overall_f1": 0.8192771084337349, |
|
"eval_overall_precision": 0.765, |
|
"eval_overall_recall": 0.8818443804034583, |
|
"eval_runtime": 0.3298, |
|
"eval_samples_per_second": 567.039, |
|
"eval_steps_per_second": 9.097, |
|
"step": 9752 |
|
}, |
|
{ |
|
"epoch": 93.0, |
|
"grad_norm": 0.7772564888000488, |
|
"learning_rate": 3.5000000000000004e-06, |
|
"loss": 0.0345, |
|
"step": 9858 |
|
}, |
|
{ |
|
"epoch": 93.0, |
|
"eval_LOCATION_f1": 0.7974683544303797, |
|
"eval_LOCATION_number": 71, |
|
"eval_LOCATION_precision": 0.7241379310344828, |
|
"eval_LOCATION_recall": 0.8873239436619719, |
|
"eval_ORGANIZATION_f1": 0.7019867549668873, |
|
"eval_ORGANIZATION_number": 65, |
|
"eval_ORGANIZATION_precision": 0.6162790697674418, |
|
"eval_ORGANIZATION_recall": 0.8153846153846154, |
|
"eval_PERSON_f1": 0.8782051282051282, |
|
"eval_PERSON_number": 150, |
|
"eval_PERSON_precision": 0.845679012345679, |
|
"eval_PERSON_recall": 0.9133333333333333, |
|
"eval_QUANTITY_f1": 0.7837837837837839, |
|
"eval_QUANTITY_number": 33, |
|
"eval_QUANTITY_precision": 0.7073170731707317, |
|
"eval_QUANTITY_recall": 0.8787878787878788, |
|
"eval_TIME_f1": 0.888888888888889, |
|
"eval_TIME_number": 28, |
|
"eval_TIME_precision": 0.9230769230769231, |
|
"eval_TIME_recall": 0.8571428571428571, |
|
"eval_loss": 0.17138922214508057, |
|
"eval_overall_accuracy": 0.9585354025218235, |
|
"eval_overall_f1": 0.8170894526034712, |
|
"eval_overall_precision": 0.7611940298507462, |
|
"eval_overall_recall": 0.8818443804034583, |
|
"eval_runtime": 0.3291, |
|
"eval_samples_per_second": 568.133, |
|
"eval_steps_per_second": 9.114, |
|
"step": 9858 |
|
}, |
|
{ |
|
"epoch": 94.0, |
|
"grad_norm": 1.5932378768920898, |
|
"learning_rate": 3e-06, |
|
"loss": 0.0349, |
|
"step": 9964 |
|
}, |
|
{ |
|
"epoch": 94.0, |
|
"eval_LOCATION_f1": 0.7974683544303797, |
|
"eval_LOCATION_number": 71, |
|
"eval_LOCATION_precision": 0.7241379310344828, |
|
"eval_LOCATION_recall": 0.8873239436619719, |
|
"eval_ORGANIZATION_f1": 0.6838709677419356, |
|
"eval_ORGANIZATION_number": 65, |
|
"eval_ORGANIZATION_precision": 0.5888888888888889, |
|
"eval_ORGANIZATION_recall": 0.8153846153846154, |
|
"eval_PERSON_f1": 0.8810289389067525, |
|
"eval_PERSON_number": 150, |
|
"eval_PERSON_precision": 0.8509316770186336, |
|
"eval_PERSON_recall": 0.9133333333333333, |
|
"eval_QUANTITY_f1": 0.7837837837837839, |
|
"eval_QUANTITY_number": 33, |
|
"eval_QUANTITY_precision": 0.7073170731707317, |
|
"eval_QUANTITY_recall": 0.8787878787878788, |
|
"eval_TIME_f1": 0.888888888888889, |
|
"eval_TIME_number": 28, |
|
"eval_TIME_precision": 0.9230769230769231, |
|
"eval_TIME_recall": 0.8571428571428571, |
|
"eval_loss": 0.1765890270471573, |
|
"eval_overall_accuracy": 0.9575654704170709, |
|
"eval_overall_f1": 0.8138297872340426, |
|
"eval_overall_precision": 0.7555555555555555, |
|
"eval_overall_recall": 0.8818443804034583, |
|
"eval_runtime": 0.3307, |
|
"eval_samples_per_second": 565.487, |
|
"eval_steps_per_second": 9.072, |
|
"step": 9964 |
|
}, |
|
{ |
|
"epoch": 95.0, |
|
"grad_norm": 0.8269696235656738, |
|
"learning_rate": 2.5e-06, |
|
"loss": 0.0352, |
|
"step": 10070 |
|
}, |
|
{ |
|
"epoch": 95.0, |
|
"eval_LOCATION_f1": 0.7974683544303797, |
|
"eval_LOCATION_number": 71, |
|
"eval_LOCATION_precision": 0.7241379310344828, |
|
"eval_LOCATION_recall": 0.8873239436619719, |
|
"eval_ORGANIZATION_f1": 0.6838709677419356, |
|
"eval_ORGANIZATION_number": 65, |
|
"eval_ORGANIZATION_precision": 0.5888888888888889, |
|
"eval_ORGANIZATION_recall": 0.8153846153846154, |
|
"eval_PERSON_f1": 0.8810289389067525, |
|
"eval_PERSON_number": 150, |
|
"eval_PERSON_precision": 0.8509316770186336, |
|
"eval_PERSON_recall": 0.9133333333333333, |
|
"eval_QUANTITY_f1": 0.7837837837837839, |
|
"eval_QUANTITY_number": 33, |
|
"eval_QUANTITY_precision": 0.7073170731707317, |
|
"eval_QUANTITY_recall": 0.8787878787878788, |
|
"eval_TIME_f1": 0.8727272727272727, |
|
"eval_TIME_number": 28, |
|
"eval_TIME_precision": 0.8888888888888888, |
|
"eval_TIME_recall": 0.8571428571428571, |
|
"eval_loss": 0.17644113302230835, |
|
"eval_overall_accuracy": 0.9575654704170709, |
|
"eval_overall_f1": 0.8127490039840637, |
|
"eval_overall_precision": 0.7536945812807881, |
|
"eval_overall_recall": 0.8818443804034583, |
|
"eval_runtime": 0.3354, |
|
"eval_samples_per_second": 557.581, |
|
"eval_steps_per_second": 8.945, |
|
"step": 10070 |
|
}, |
|
{ |
|
"epoch": 96.0, |
|
"grad_norm": 1.2851319313049316, |
|
"learning_rate": 2.0000000000000003e-06, |
|
"loss": 0.0367, |
|
"step": 10176 |
|
}, |
|
{ |
|
"epoch": 96.0, |
|
"eval_LOCATION_f1": 0.7974683544303797, |
|
"eval_LOCATION_number": 71, |
|
"eval_LOCATION_precision": 0.7241379310344828, |
|
"eval_LOCATION_recall": 0.8873239436619719, |
|
"eval_ORGANIZATION_f1": 0.6973684210526315, |
|
"eval_ORGANIZATION_number": 65, |
|
"eval_ORGANIZATION_precision": 0.6091954022988506, |
|
"eval_ORGANIZATION_recall": 0.8153846153846154, |
|
"eval_PERSON_f1": 0.8782051282051282, |
|
"eval_PERSON_number": 150, |
|
"eval_PERSON_precision": 0.845679012345679, |
|
"eval_PERSON_recall": 0.9133333333333333, |
|
"eval_QUANTITY_f1": 0.7837837837837839, |
|
"eval_QUANTITY_number": 33, |
|
"eval_QUANTITY_precision": 0.7073170731707317, |
|
"eval_QUANTITY_recall": 0.8787878787878788, |
|
"eval_TIME_f1": 0.888888888888889, |
|
"eval_TIME_number": 28, |
|
"eval_TIME_precision": 0.9230769230769231, |
|
"eval_TIME_recall": 0.8571428571428571, |
|
"eval_loss": 0.17299894988536835, |
|
"eval_overall_accuracy": 0.9582929194956353, |
|
"eval_overall_f1": 0.816, |
|
"eval_overall_precision": 0.7593052109181141, |
|
"eval_overall_recall": 0.8818443804034583, |
|
"eval_runtime": 0.3376, |
|
"eval_samples_per_second": 553.982, |
|
"eval_steps_per_second": 8.887, |
|
"step": 10176 |
|
}, |
|
{ |
|
"epoch": 97.0, |
|
"grad_norm": 1.469909906387329, |
|
"learning_rate": 1.5e-06, |
|
"loss": 0.0352, |
|
"step": 10282 |
|
}, |
|
{ |
|
"epoch": 97.0, |
|
"eval_LOCATION_f1": 0.7974683544303797, |
|
"eval_LOCATION_number": 71, |
|
"eval_LOCATION_precision": 0.7241379310344828, |
|
"eval_LOCATION_recall": 0.8873239436619719, |
|
"eval_ORGANIZATION_f1": 0.6928104575163399, |
|
"eval_ORGANIZATION_number": 65, |
|
"eval_ORGANIZATION_precision": 0.6022727272727273, |
|
"eval_ORGANIZATION_recall": 0.8153846153846154, |
|
"eval_PERSON_f1": 0.8838709677419355, |
|
"eval_PERSON_number": 150, |
|
"eval_PERSON_precision": 0.85625, |
|
"eval_PERSON_recall": 0.9133333333333333, |
|
"eval_QUANTITY_f1": 0.7837837837837839, |
|
"eval_QUANTITY_number": 33, |
|
"eval_QUANTITY_precision": 0.7073170731707317, |
|
"eval_QUANTITY_recall": 0.8787878787878788, |
|
"eval_TIME_f1": 0.888888888888889, |
|
"eval_TIME_number": 28, |
|
"eval_TIME_precision": 0.9230769230769231, |
|
"eval_TIME_recall": 0.8571428571428571, |
|
"eval_loss": 0.1724460870027542, |
|
"eval_overall_accuracy": 0.9580504364694471, |
|
"eval_overall_f1": 0.8170894526034712, |
|
"eval_overall_precision": 0.7611940298507462, |
|
"eval_overall_recall": 0.8818443804034583, |
|
"eval_runtime": 0.3347, |
|
"eval_samples_per_second": 558.712, |
|
"eval_steps_per_second": 8.963, |
|
"step": 10282 |
|
}, |
|
{ |
|
"epoch": 98.0, |
|
"grad_norm": 0.9896478652954102, |
|
"learning_rate": 1.0000000000000002e-06, |
|
"loss": 0.0341, |
|
"step": 10388 |
|
}, |
|
{ |
|
"epoch": 98.0, |
|
"eval_LOCATION_f1": 0.7974683544303797, |
|
"eval_LOCATION_number": 71, |
|
"eval_LOCATION_precision": 0.7241379310344828, |
|
"eval_LOCATION_recall": 0.8873239436619719, |
|
"eval_ORGANIZATION_f1": 0.6794871794871795, |
|
"eval_ORGANIZATION_number": 65, |
|
"eval_ORGANIZATION_precision": 0.5824175824175825, |
|
"eval_ORGANIZATION_recall": 0.8153846153846154, |
|
"eval_PERSON_f1": 0.8745980707395499, |
|
"eval_PERSON_number": 150, |
|
"eval_PERSON_precision": 0.84472049689441, |
|
"eval_PERSON_recall": 0.9066666666666666, |
|
"eval_QUANTITY_f1": 0.7837837837837839, |
|
"eval_QUANTITY_number": 33, |
|
"eval_QUANTITY_precision": 0.7073170731707317, |
|
"eval_QUANTITY_recall": 0.8787878787878788, |
|
"eval_TIME_f1": 0.888888888888889, |
|
"eval_TIME_number": 28, |
|
"eval_TIME_precision": 0.9230769230769231, |
|
"eval_TIME_recall": 0.8571428571428571, |
|
"eval_loss": 0.1747630089521408, |
|
"eval_overall_accuracy": 0.9570805043646945, |
|
"eval_overall_f1": 0.8100929614873836, |
|
"eval_overall_precision": 0.7512315270935961, |
|
"eval_overall_recall": 0.8789625360230547, |
|
"eval_runtime": 0.3294, |
|
"eval_samples_per_second": 567.729, |
|
"eval_steps_per_second": 9.108, |
|
"step": 10388 |
|
}, |
|
{ |
|
"epoch": 99.0, |
|
"grad_norm": 1.395708441734314, |
|
"learning_rate": 5.000000000000001e-07, |
|
"loss": 0.0331, |
|
"step": 10494 |
|
}, |
|
{ |
|
"epoch": 99.0, |
|
"eval_LOCATION_f1": 0.7974683544303797, |
|
"eval_LOCATION_number": 71, |
|
"eval_LOCATION_precision": 0.7241379310344828, |
|
"eval_LOCATION_recall": 0.8873239436619719, |
|
"eval_ORGANIZATION_f1": 0.6928104575163399, |
|
"eval_ORGANIZATION_number": 65, |
|
"eval_ORGANIZATION_precision": 0.6022727272727273, |
|
"eval_ORGANIZATION_recall": 0.8153846153846154, |
|
"eval_PERSON_f1": 0.8745980707395499, |
|
"eval_PERSON_number": 150, |
|
"eval_PERSON_precision": 0.84472049689441, |
|
"eval_PERSON_recall": 0.9066666666666666, |
|
"eval_QUANTITY_f1": 0.7837837837837839, |
|
"eval_QUANTITY_number": 33, |
|
"eval_QUANTITY_precision": 0.7073170731707317, |
|
"eval_QUANTITY_recall": 0.8787878787878788, |
|
"eval_TIME_f1": 0.888888888888889, |
|
"eval_TIME_number": 28, |
|
"eval_TIME_precision": 0.9230769230769231, |
|
"eval_TIME_recall": 0.8571428571428571, |
|
"eval_loss": 0.17256887257099152, |
|
"eval_overall_accuracy": 0.9580504364694471, |
|
"eval_overall_f1": 0.8133333333333335, |
|
"eval_overall_precision": 0.7568238213399504, |
|
"eval_overall_recall": 0.8789625360230547, |
|
"eval_runtime": 0.3298, |
|
"eval_samples_per_second": 567.096, |
|
"eval_steps_per_second": 9.098, |
|
"step": 10494 |
|
}, |
|
{ |
|
"epoch": 100.0, |
|
"grad_norm": 0.4935811758041382, |
|
"learning_rate": 0.0, |
|
"loss": 0.0347, |
|
"step": 10600 |
|
}, |
|
{ |
|
"epoch": 100.0, |
|
"eval_LOCATION_f1": 0.7974683544303797, |
|
"eval_LOCATION_number": 71, |
|
"eval_LOCATION_precision": 0.7241379310344828, |
|
"eval_LOCATION_recall": 0.8873239436619719, |
|
"eval_ORGANIZATION_f1": 0.6928104575163399, |
|
"eval_ORGANIZATION_number": 65, |
|
"eval_ORGANIZATION_precision": 0.6022727272727273, |
|
"eval_ORGANIZATION_recall": 0.8153846153846154, |
|
"eval_PERSON_f1": 0.8745980707395499, |
|
"eval_PERSON_number": 150, |
|
"eval_PERSON_precision": 0.84472049689441, |
|
"eval_PERSON_recall": 0.9066666666666666, |
|
"eval_QUANTITY_f1": 0.7837837837837839, |
|
"eval_QUANTITY_number": 33, |
|
"eval_QUANTITY_precision": 0.7073170731707317, |
|
"eval_QUANTITY_recall": 0.8787878787878788, |
|
"eval_TIME_f1": 0.888888888888889, |
|
"eval_TIME_number": 28, |
|
"eval_TIME_precision": 0.9230769230769231, |
|
"eval_TIME_recall": 0.8571428571428571, |
|
"eval_loss": 0.17283295094966888, |
|
"eval_overall_accuracy": 0.9580504364694471, |
|
"eval_overall_f1": 0.8133333333333335, |
|
"eval_overall_precision": 0.7568238213399504, |
|
"eval_overall_recall": 0.8789625360230547, |
|
"eval_runtime": 0.33, |
|
"eval_samples_per_second": 566.66, |
|
"eval_steps_per_second": 9.091, |
|
"step": 10600 |
|
}, |
|
{ |
|
"epoch": 100.0, |
|
"step": 10600, |
|
"total_flos": 4639858441347408.0, |
|
"train_loss": 0.08816910017211482, |
|
"train_runtime": 595.5845, |
|
"train_samples_per_second": 283.419, |
|
"train_steps_per_second": 17.798 |
|
} |
|
], |
|
"logging_steps": 500, |
|
"max_steps": 10600, |
|
"num_input_tokens_seen": 0, |
|
"num_train_epochs": 100, |
|
"save_steps": 500, |
|
"total_flos": 4639858441347408.0, |
|
"train_batch_size": 16, |
|
"trial_name": null, |
|
"trial_params": null |
|
} |
|
|