{ "best_metric": null, "best_model_checkpoint": null, "epoch": 100.0, "eval_steps": 500, "global_step": 10600, "is_hyper_param_search": false, "is_local_process_zero": true, "is_world_process_zero": true, "log_history": [ { "epoch": 1.0, "grad_norm": 2.184743642807007, "learning_rate": 4.9500000000000004e-05, "loss": 0.9441, "step": 106 }, { "epoch": 1.0, "eval_LOCATION_f1": 0.0, "eval_LOCATION_number": 71, "eval_LOCATION_precision": 0.0, "eval_LOCATION_recall": 0.0, "eval_ORGANIZATION_f1": 0.0, "eval_ORGANIZATION_number": 65, "eval_ORGANIZATION_precision": 0.0, "eval_ORGANIZATION_recall": 0.0, "eval_PERSON_f1": 0.013071895424836602, "eval_PERSON_number": 150, "eval_PERSON_precision": 0.3333333333333333, "eval_PERSON_recall": 0.006666666666666667, "eval_QUANTITY_f1": 0.0, "eval_QUANTITY_number": 33, "eval_QUANTITY_precision": 0.0, "eval_QUANTITY_recall": 0.0, "eval_TIME_f1": 0.0, "eval_TIME_number": 28, "eval_TIME_precision": 0.0, "eval_TIME_recall": 0.0, "eval_loss": 0.6184682846069336, "eval_overall_accuracy": 0.8414161008729389, "eval_overall_f1": 0.005714285714285714, "eval_overall_precision": 0.3333333333333333, "eval_overall_recall": 0.002881844380403458, "eval_runtime": 0.3392, "eval_samples_per_second": 551.333, "eval_steps_per_second": 8.845, "step": 106 }, { "epoch": 2.0, "grad_norm": 1.0305746793746948, "learning_rate": 4.9e-05, "loss": 0.5645, "step": 212 }, { "epoch": 2.0, "eval_LOCATION_f1": 0.22916666666666669, "eval_LOCATION_number": 71, "eval_LOCATION_precision": 0.44, "eval_LOCATION_recall": 0.15492957746478872, "eval_ORGANIZATION_f1": 0.04, "eval_ORGANIZATION_number": 65, "eval_ORGANIZATION_precision": 0.05714285714285714, "eval_ORGANIZATION_recall": 0.03076923076923077, "eval_PERSON_f1": 0.5449438202247192, "eval_PERSON_number": 150, "eval_PERSON_precision": 0.470873786407767, "eval_PERSON_recall": 0.6466666666666666, "eval_QUANTITY_f1": 0.0, "eval_QUANTITY_number": 33, "eval_QUANTITY_precision": 0.0, "eval_QUANTITY_recall": 0.0, "eval_TIME_f1": 0.43478260869565216, "eval_TIME_number": 28, "eval_TIME_precision": 0.5555555555555556, "eval_TIME_recall": 0.35714285714285715, "eval_loss": 0.41943466663360596, "eval_overall_accuracy": 0.8877303588748787, "eval_overall_f1": 0.3803486529318542, "eval_overall_precision": 0.4225352112676056, "eval_overall_recall": 0.345821325648415, "eval_runtime": 0.3288, "eval_samples_per_second": 568.708, "eval_steps_per_second": 9.124, "step": 212 }, { "epoch": 3.0, "grad_norm": 1.2039958238601685, "learning_rate": 4.85e-05, "loss": 0.3968, "step": 318 }, { "epoch": 3.0, "eval_LOCATION_f1": 0.5153374233128835, "eval_LOCATION_number": 71, "eval_LOCATION_precision": 0.45652173913043476, "eval_LOCATION_recall": 0.5915492957746479, "eval_ORGANIZATION_f1": 0.3278688524590164, "eval_ORGANIZATION_number": 65, "eval_ORGANIZATION_precision": 0.3508771929824561, "eval_ORGANIZATION_recall": 0.3076923076923077, "eval_PERSON_f1": 0.6829268292682927, "eval_PERSON_number": 150, "eval_PERSON_precision": 0.5753424657534246, "eval_PERSON_recall": 0.84, "eval_QUANTITY_f1": 0.1846153846153846, "eval_QUANTITY_number": 33, "eval_QUANTITY_precision": 0.1875, "eval_QUANTITY_recall": 0.18181818181818182, "eval_TIME_f1": 0.8076923076923077, "eval_TIME_number": 28, "eval_TIME_precision": 0.875, "eval_TIME_recall": 0.75, "eval_loss": 0.30941861867904663, "eval_overall_accuracy": 0.9202230843840931, "eval_overall_f1": 0.5577172503242542, "eval_overall_precision": 0.5070754716981132, "eval_overall_recall": 0.6195965417867435, "eval_runtime": 0.3381, "eval_samples_per_second": 553.069, "eval_steps_per_second": 8.873, "step": 318 }, { "epoch": 4.0, "grad_norm": 4.7056145668029785, "learning_rate": 4.8e-05, "loss": 0.2937, "step": 424 }, { "epoch": 4.0, "eval_LOCATION_f1": 0.5465116279069767, "eval_LOCATION_number": 71, "eval_LOCATION_precision": 0.46534653465346537, "eval_LOCATION_recall": 0.6619718309859155, "eval_ORGANIZATION_f1": 0.4878048780487805, "eval_ORGANIZATION_number": 65, "eval_ORGANIZATION_precision": 0.5172413793103449, "eval_ORGANIZATION_recall": 0.46153846153846156, "eval_PERSON_f1": 0.8036809815950918, "eval_PERSON_number": 150, "eval_PERSON_precision": 0.7443181818181818, "eval_PERSON_recall": 0.8733333333333333, "eval_QUANTITY_f1": 0.47368421052631576, "eval_QUANTITY_number": 33, "eval_QUANTITY_precision": 0.4186046511627907, "eval_QUANTITY_recall": 0.5454545454545454, "eval_TIME_f1": 0.8363636363636364, "eval_TIME_number": 28, "eval_TIME_precision": 0.8518518518518519, "eval_TIME_recall": 0.8214285714285714, "eval_loss": 0.2222605049610138, "eval_overall_accuracy": 0.9369544131910766, "eval_overall_f1": 0.6622340425531915, "eval_overall_precision": 0.6148148148148148, "eval_overall_recall": 0.7175792507204611, "eval_runtime": 0.3282, "eval_samples_per_second": 569.698, "eval_steps_per_second": 9.14, "step": 424 }, { "epoch": 5.0, "grad_norm": 1.303191900253296, "learning_rate": 4.75e-05, "loss": 0.2294, "step": 530 }, { "epoch": 5.0, "eval_LOCATION_f1": 0.6496815286624205, "eval_LOCATION_number": 71, "eval_LOCATION_precision": 0.5930232558139535, "eval_LOCATION_recall": 0.7183098591549296, "eval_ORGANIZATION_f1": 0.562962962962963, "eval_ORGANIZATION_number": 65, "eval_ORGANIZATION_precision": 0.5428571428571428, "eval_ORGANIZATION_recall": 0.5846153846153846, "eval_PERSON_f1": 0.8176100628930819, "eval_PERSON_number": 150, "eval_PERSON_precision": 0.7738095238095238, "eval_PERSON_recall": 0.8666666666666667, "eval_QUANTITY_f1": 0.5316455696202532, "eval_QUANTITY_number": 33, "eval_QUANTITY_precision": 0.45652173913043476, "eval_QUANTITY_recall": 0.6363636363636364, "eval_TIME_f1": 0.888888888888889, "eval_TIME_number": 28, "eval_TIME_precision": 0.9230769230769231, "eval_TIME_recall": 0.8571428571428571, "eval_loss": 0.18041133880615234, "eval_overall_accuracy": 0.9427740058195926, "eval_overall_f1": 0.7106325706594886, "eval_overall_precision": 0.6666666666666666, "eval_overall_recall": 0.760806916426513, "eval_runtime": 0.3291, "eval_samples_per_second": 568.165, "eval_steps_per_second": 9.115, "step": 530 }, { "epoch": 6.0, "grad_norm": 1.6567788124084473, "learning_rate": 4.7e-05, "loss": 0.1955, "step": 636 }, { "epoch": 6.0, "eval_LOCATION_f1": 0.7052023121387284, "eval_LOCATION_number": 71, "eval_LOCATION_precision": 0.5980392156862745, "eval_LOCATION_recall": 0.8591549295774648, "eval_ORGANIZATION_f1": 0.5903614457831325, "eval_ORGANIZATION_number": 65, "eval_ORGANIZATION_precision": 0.48514851485148514, "eval_ORGANIZATION_recall": 0.7538461538461538, "eval_PERSON_f1": 0.8109756097560976, "eval_PERSON_number": 150, "eval_PERSON_precision": 0.7471910112359551, "eval_PERSON_recall": 0.8866666666666667, "eval_QUANTITY_f1": 0.5517241379310345, "eval_QUANTITY_number": 33, "eval_QUANTITY_precision": 0.4444444444444444, "eval_QUANTITY_recall": 0.7272727272727273, "eval_TIME_f1": 0.793103448275862, "eval_TIME_number": 28, "eval_TIME_precision": 0.7666666666666667, "eval_TIME_recall": 0.8214285714285714, "eval_loss": 0.19565138220787048, "eval_overall_accuracy": 0.9396217264791464, "eval_overall_f1": 0.7142857142857143, "eval_overall_precision": 0.6236559139784946, "eval_overall_recall": 0.8357348703170029, "eval_runtime": 0.3291, "eval_samples_per_second": 568.21, "eval_steps_per_second": 9.116, "step": 636 }, { "epoch": 7.0, "grad_norm": 2.8131422996520996, "learning_rate": 4.6500000000000005e-05, "loss": 0.1799, "step": 742 }, { "epoch": 7.0, "eval_LOCATION_f1": 0.7374999999999999, "eval_LOCATION_number": 71, "eval_LOCATION_precision": 0.6629213483146067, "eval_LOCATION_recall": 0.8309859154929577, "eval_ORGANIZATION_f1": 0.6482758620689656, "eval_ORGANIZATION_number": 65, "eval_ORGANIZATION_precision": 0.5875, "eval_ORGANIZATION_recall": 0.7230769230769231, "eval_PERSON_f1": 0.81875, "eval_PERSON_number": 150, "eval_PERSON_precision": 0.7705882352941177, "eval_PERSON_recall": 0.8733333333333333, "eval_QUANTITY_f1": 0.6585365853658536, "eval_QUANTITY_number": 33, "eval_QUANTITY_precision": 0.5510204081632653, "eval_QUANTITY_recall": 0.8181818181818182, "eval_TIME_f1": 0.8275862068965518, "eval_TIME_number": 28, "eval_TIME_precision": 0.8, "eval_TIME_recall": 0.8571428571428571, "eval_loss": 0.16057299077510834, "eval_overall_accuracy": 0.9468962172647915, "eval_overall_f1": 0.7529411764705883, "eval_overall_precision": 0.6889952153110048, "eval_overall_recall": 0.829971181556196, "eval_runtime": 0.3295, "eval_samples_per_second": 567.569, "eval_steps_per_second": 9.105, "step": 742 }, { "epoch": 8.0, "grad_norm": 0.7265537977218628, "learning_rate": 4.600000000000001e-05, "loss": 0.1628, "step": 848 }, { "epoch": 8.0, "eval_LOCATION_f1": 0.7349397590361445, "eval_LOCATION_number": 71, "eval_LOCATION_precision": 0.6421052631578947, "eval_LOCATION_recall": 0.8591549295774648, "eval_ORGANIZATION_f1": 0.6451612903225806, "eval_ORGANIZATION_number": 65, "eval_ORGANIZATION_precision": 0.5555555555555556, "eval_ORGANIZATION_recall": 0.7692307692307693, "eval_PERSON_f1": 0.8275862068965518, "eval_PERSON_number": 150, "eval_PERSON_precision": 0.7810650887573964, "eval_PERSON_recall": 0.88, "eval_QUANTITY_f1": 0.6923076923076923, "eval_QUANTITY_number": 33, "eval_QUANTITY_precision": 0.6, "eval_QUANTITY_recall": 0.8181818181818182, "eval_TIME_f1": 0.8421052631578947, "eval_TIME_number": 28, "eval_TIME_precision": 0.8275862068965517, "eval_TIME_recall": 0.8571428571428571, "eval_loss": 0.15270720422267914, "eval_overall_accuracy": 0.9510184287099903, "eval_overall_f1": 0.7587096774193549, "eval_overall_precision": 0.6869158878504673, "eval_overall_recall": 0.8472622478386167, "eval_runtime": 0.3291, "eval_samples_per_second": 568.147, "eval_steps_per_second": 9.115, "step": 848 }, { "epoch": 9.0, "grad_norm": 1.15663743019104, "learning_rate": 4.55e-05, "loss": 0.1528, "step": 954 }, { "epoch": 9.0, "eval_LOCATION_f1": 0.7564102564102564, "eval_LOCATION_number": 71, "eval_LOCATION_precision": 0.6941176470588235, "eval_LOCATION_recall": 0.8309859154929577, "eval_ORGANIZATION_f1": 0.6351351351351351, "eval_ORGANIZATION_number": 65, "eval_ORGANIZATION_precision": 0.5662650602409639, "eval_ORGANIZATION_recall": 0.7230769230769231, "eval_PERSON_f1": 0.8397435897435898, "eval_PERSON_number": 150, "eval_PERSON_precision": 0.808641975308642, "eval_PERSON_recall": 0.8733333333333333, "eval_QUANTITY_f1": 0.7200000000000001, "eval_QUANTITY_number": 33, "eval_QUANTITY_precision": 0.6428571428571429, "eval_QUANTITY_recall": 0.8181818181818182, "eval_TIME_f1": 0.8771929824561403, "eval_TIME_number": 28, "eval_TIME_precision": 0.8620689655172413, "eval_TIME_recall": 0.8928571428571429, "eval_loss": 0.14164027571678162, "eval_overall_accuracy": 0.9522308438409312, "eval_overall_f1": 0.7727272727272728, "eval_overall_precision": 0.7206982543640897, "eval_overall_recall": 0.8328530259365994, "eval_runtime": 0.3351, "eval_samples_per_second": 558.073, "eval_steps_per_second": 8.953, "step": 954 }, { "epoch": 10.0, "grad_norm": 1.8798385858535767, "learning_rate": 4.5e-05, "loss": 0.1466, "step": 1060 }, { "epoch": 10.0, "eval_LOCATION_f1": 0.7307692307692307, "eval_LOCATION_number": 71, "eval_LOCATION_precision": 0.6705882352941176, "eval_LOCATION_recall": 0.8028169014084507, "eval_ORGANIZATION_f1": 0.625, "eval_ORGANIZATION_number": 65, "eval_ORGANIZATION_precision": 0.569620253164557, "eval_ORGANIZATION_recall": 0.6923076923076923, "eval_PERSON_f1": 0.8387096774193549, "eval_PERSON_number": 150, "eval_PERSON_precision": 0.8125, "eval_PERSON_recall": 0.8666666666666667, "eval_QUANTITY_f1": 0.736842105263158, "eval_QUANTITY_number": 33, "eval_QUANTITY_precision": 0.6511627906976745, "eval_QUANTITY_recall": 0.8484848484848485, "eval_TIME_f1": 0.8620689655172413, "eval_TIME_number": 28, "eval_TIME_precision": 0.8333333333333334, "eval_TIME_recall": 0.8928571428571429, "eval_loss": 0.14073340594768524, "eval_overall_accuracy": 0.9522308438409312, "eval_overall_f1": 0.7661290322580645, "eval_overall_precision": 0.7178841309823678, "eval_overall_recall": 0.8213256484149856, "eval_runtime": 0.3345, "eval_samples_per_second": 559.032, "eval_steps_per_second": 8.968, "step": 1060 }, { "epoch": 11.0, "grad_norm": 0.9395531415939331, "learning_rate": 4.4500000000000004e-05, "loss": 0.138, "step": 1166 }, { "epoch": 11.0, "eval_LOCATION_f1": 0.775, "eval_LOCATION_number": 71, "eval_LOCATION_precision": 0.6966292134831461, "eval_LOCATION_recall": 0.8732394366197183, "eval_ORGANIZATION_f1": 0.6666666666666666, "eval_ORGANIZATION_number": 65, "eval_ORGANIZATION_precision": 0.5975609756097561, "eval_ORGANIZATION_recall": 0.7538461538461538, "eval_PERSON_f1": 0.8360128617363344, "eval_PERSON_number": 150, "eval_PERSON_precision": 0.8074534161490683, "eval_PERSON_recall": 0.8666666666666667, "eval_QUANTITY_f1": 0.736842105263158, "eval_QUANTITY_number": 33, "eval_QUANTITY_precision": 0.6511627906976745, "eval_QUANTITY_recall": 0.8484848484848485, "eval_TIME_f1": 0.8620689655172413, "eval_TIME_number": 28, "eval_TIME_precision": 0.8333333333333334, "eval_TIME_recall": 0.8928571428571429, "eval_loss": 0.14058995246887207, "eval_overall_accuracy": 0.9536857419980601, "eval_overall_f1": 0.7819148936170213, "eval_overall_precision": 0.725925925925926, "eval_overall_recall": 0.8472622478386167, "eval_runtime": 0.3303, "eval_samples_per_second": 566.135, "eval_steps_per_second": 9.082, "step": 1166 }, { "epoch": 12.0, "grad_norm": 1.2153416872024536, "learning_rate": 4.4000000000000006e-05, "loss": 0.1314, "step": 1272 }, { "epoch": 12.0, "eval_LOCATION_f1": 0.775, "eval_LOCATION_number": 71, "eval_LOCATION_precision": 0.6966292134831461, "eval_LOCATION_recall": 0.8732394366197183, "eval_ORGANIZATION_f1": 0.6578947368421053, "eval_ORGANIZATION_number": 65, "eval_ORGANIZATION_precision": 0.5747126436781609, "eval_ORGANIZATION_recall": 0.7692307692307693, "eval_PERSON_f1": 0.8407643312101911, "eval_PERSON_number": 150, "eval_PERSON_precision": 0.8048780487804879, "eval_PERSON_recall": 0.88, "eval_QUANTITY_f1": 0.736842105263158, "eval_QUANTITY_number": 33, "eval_QUANTITY_precision": 0.6511627906976745, "eval_QUANTITY_recall": 0.8484848484848485, "eval_TIME_f1": 0.7999999999999999, "eval_TIME_number": 28, "eval_TIME_precision": 0.75, "eval_TIME_recall": 0.8571428571428571, "eval_loss": 0.14196860790252686, "eval_overall_accuracy": 0.953443258971872, "eval_overall_f1": 0.7769028871391075, "eval_overall_precision": 0.7132530120481928, "eval_overall_recall": 0.8530259365994236, "eval_runtime": 0.3295, "eval_samples_per_second": 567.586, "eval_steps_per_second": 9.106, "step": 1272 }, { "epoch": 13.0, "grad_norm": 0.6423377990722656, "learning_rate": 4.35e-05, "loss": 0.1285, "step": 1378 }, { "epoch": 13.0, "eval_LOCATION_f1": 0.7261146496815286, "eval_LOCATION_number": 71, "eval_LOCATION_precision": 0.6627906976744186, "eval_LOCATION_recall": 0.8028169014084507, "eval_ORGANIZATION_f1": 0.6493506493506495, "eval_ORGANIZATION_number": 65, "eval_ORGANIZATION_precision": 0.5617977528089888, "eval_ORGANIZATION_recall": 0.7692307692307693, "eval_PERSON_f1": 0.8461538461538461, "eval_PERSON_number": 150, "eval_PERSON_precision": 0.8148148148148148, "eval_PERSON_recall": 0.88, "eval_QUANTITY_f1": 0.7466666666666666, "eval_QUANTITY_number": 33, "eval_QUANTITY_precision": 0.6666666666666666, "eval_QUANTITY_recall": 0.8484848484848485, "eval_TIME_f1": 0.9090909090909091, "eval_TIME_number": 28, "eval_TIME_precision": 0.9259259259259259, "eval_TIME_recall": 0.8928571428571429, "eval_loss": 0.13416315615177155, "eval_overall_accuracy": 0.954898157129001, "eval_overall_f1": 0.7755644090305446, "eval_overall_precision": 0.7192118226600985, "eval_overall_recall": 0.8414985590778098, "eval_runtime": 0.3353, "eval_samples_per_second": 557.743, "eval_steps_per_second": 8.948, "step": 1378 }, { "epoch": 14.0, "grad_norm": 3.325246572494507, "learning_rate": 4.3e-05, "loss": 0.1301, "step": 1484 }, { "epoch": 14.0, "eval_LOCATION_f1": 0.7792207792207793, "eval_LOCATION_number": 71, "eval_LOCATION_precision": 0.7228915662650602, "eval_LOCATION_recall": 0.8450704225352113, "eval_ORGANIZATION_f1": 0.5915492957746479, "eval_ORGANIZATION_number": 65, "eval_ORGANIZATION_precision": 0.5454545454545454, "eval_ORGANIZATION_recall": 0.6461538461538462, "eval_PERSON_f1": 0.8488745980707395, "eval_PERSON_number": 150, "eval_PERSON_precision": 0.8198757763975155, "eval_PERSON_recall": 0.88, "eval_QUANTITY_f1": 0.7777777777777778, "eval_QUANTITY_number": 33, "eval_QUANTITY_precision": 0.717948717948718, "eval_QUANTITY_recall": 0.8484848484848485, "eval_TIME_f1": 0.8620689655172413, "eval_TIME_number": 28, "eval_TIME_precision": 0.8333333333333334, "eval_TIME_recall": 0.8928571428571429, "eval_loss": 0.12784981727600098, "eval_overall_accuracy": 0.95635305528613, "eval_overall_f1": 0.778833107191316, "eval_overall_precision": 0.735897435897436, "eval_overall_recall": 0.8270893371757925, "eval_runtime": 0.3291, "eval_samples_per_second": 568.237, "eval_steps_per_second": 9.116, "step": 1484 }, { "epoch": 15.0, "grad_norm": 1.1983723640441895, "learning_rate": 4.25e-05, "loss": 0.1197, "step": 1590 }, { "epoch": 15.0, "eval_LOCATION_f1": 0.779874213836478, "eval_LOCATION_number": 71, "eval_LOCATION_precision": 0.7045454545454546, "eval_LOCATION_recall": 0.8732394366197183, "eval_ORGANIZATION_f1": 0.7012987012987013, "eval_ORGANIZATION_number": 65, "eval_ORGANIZATION_precision": 0.6067415730337079, "eval_ORGANIZATION_recall": 0.8307692307692308, "eval_PERSON_f1": 0.8471337579617835, "eval_PERSON_number": 150, "eval_PERSON_precision": 0.8109756097560976, "eval_PERSON_recall": 0.8866666666666667, "eval_QUANTITY_f1": 0.7012987012987013, "eval_QUANTITY_number": 33, "eval_QUANTITY_precision": 0.6136363636363636, "eval_QUANTITY_recall": 0.8181818181818182, "eval_TIME_f1": 0.8275862068965518, "eval_TIME_number": 28, "eval_TIME_precision": 0.8, "eval_TIME_recall": 0.8571428571428571, "eval_loss": 0.1395217925310135, "eval_overall_accuracy": 0.9539282250242483, "eval_overall_f1": 0.7874015748031495, "eval_overall_precision": 0.7228915662650602, "eval_overall_recall": 0.8645533141210374, "eval_runtime": 0.3284, "eval_samples_per_second": 569.403, "eval_steps_per_second": 9.135, "step": 1590 }, { "epoch": 16.0, "grad_norm": 2.9908885955810547, "learning_rate": 4.2e-05, "loss": 0.1147, "step": 1696 }, { "epoch": 16.0, "eval_LOCATION_f1": 0.8, "eval_LOCATION_number": 71, "eval_LOCATION_precision": 0.7380952380952381, "eval_LOCATION_recall": 0.8732394366197183, "eval_ORGANIZATION_f1": 0.6853146853146853, "eval_ORGANIZATION_number": 65, "eval_ORGANIZATION_precision": 0.6282051282051282, "eval_ORGANIZATION_recall": 0.7538461538461538, "eval_PERSON_f1": 0.8461538461538461, "eval_PERSON_number": 150, "eval_PERSON_precision": 0.8148148148148148, "eval_PERSON_recall": 0.88, "eval_QUANTITY_f1": 0.7088607594936709, "eval_QUANTITY_number": 33, "eval_QUANTITY_precision": 0.6086956521739131, "eval_QUANTITY_recall": 0.8484848484848485, "eval_TIME_f1": 0.7999999999999999, "eval_TIME_number": 28, "eval_TIME_precision": 0.75, "eval_TIME_recall": 0.8571428571428571, "eval_loss": 0.13548891246318817, "eval_overall_accuracy": 0.9556256062075654, "eval_overall_f1": 0.787716955941255, "eval_overall_precision": 0.7338308457711443, "eval_overall_recall": 0.8501440922190202, "eval_runtime": 0.3343, "eval_samples_per_second": 559.383, "eval_steps_per_second": 8.974, "step": 1696 }, { "epoch": 17.0, "grad_norm": 0.7757030129432678, "learning_rate": 4.15e-05, "loss": 0.1134, "step": 1802 }, { "epoch": 17.0, "eval_LOCATION_f1": 0.7922077922077921, "eval_LOCATION_number": 71, "eval_LOCATION_precision": 0.7349397590361446, "eval_LOCATION_recall": 0.8591549295774648, "eval_ORGANIZATION_f1": 0.6618705035971223, "eval_ORGANIZATION_number": 65, "eval_ORGANIZATION_precision": 0.6216216216216216, "eval_ORGANIZATION_recall": 0.7076923076923077, "eval_PERSON_f1": 0.8498402555910542, "eval_PERSON_number": 150, "eval_PERSON_precision": 0.8159509202453987, "eval_PERSON_recall": 0.8866666666666667, "eval_QUANTITY_f1": 0.7105263157894738, "eval_QUANTITY_number": 33, "eval_QUANTITY_precision": 0.627906976744186, "eval_QUANTITY_recall": 0.8181818181818182, "eval_TIME_f1": 0.8421052631578947, "eval_TIME_number": 28, "eval_TIME_precision": 0.8275862068965517, "eval_TIME_recall": 0.8571428571428571, "eval_loss": 0.12935349345207214, "eval_overall_accuracy": 0.95635305528613, "eval_overall_f1": 0.7875507442489851, "eval_overall_precision": 0.7423469387755102, "eval_overall_recall": 0.8386167146974063, "eval_runtime": 0.3301, "eval_samples_per_second": 566.53, "eval_steps_per_second": 9.089, "step": 1802 }, { "epoch": 18.0, "grad_norm": 1.1819586753845215, "learning_rate": 4.1e-05, "loss": 0.1103, "step": 1908 }, { "epoch": 18.0, "eval_LOCATION_f1": 0.8, "eval_LOCATION_number": 71, "eval_LOCATION_precision": 0.7380952380952381, "eval_LOCATION_recall": 0.8732394366197183, "eval_ORGANIZATION_f1": 0.7162162162162162, "eval_ORGANIZATION_number": 65, "eval_ORGANIZATION_precision": 0.6385542168674698, "eval_ORGANIZATION_recall": 0.8153846153846154, "eval_PERSON_f1": 0.8507936507936508, "eval_PERSON_number": 150, "eval_PERSON_precision": 0.8121212121212121, "eval_PERSON_recall": 0.8933333333333333, "eval_QUANTITY_f1": 0.736842105263158, "eval_QUANTITY_number": 33, "eval_QUANTITY_precision": 0.6511627906976745, "eval_QUANTITY_recall": 0.8484848484848485, "eval_TIME_f1": 0.8421052631578947, "eval_TIME_number": 28, "eval_TIME_precision": 0.8275862068965517, "eval_TIME_recall": 0.8571428571428571, "eval_loss": 0.13496747612953186, "eval_overall_accuracy": 0.9568380213385063, "eval_overall_f1": 0.8015978695073236, "eval_overall_precision": 0.745049504950495, "eval_overall_recall": 0.8674351585014409, "eval_runtime": 0.3289, "eval_samples_per_second": 568.537, "eval_steps_per_second": 9.121, "step": 1908 }, { "epoch": 19.0, "grad_norm": 1.253257393836975, "learning_rate": 4.05e-05, "loss": 0.1078, "step": 2014 }, { "epoch": 19.0, "eval_LOCATION_f1": 0.7973856209150327, "eval_LOCATION_number": 71, "eval_LOCATION_precision": 0.7439024390243902, "eval_LOCATION_recall": 0.8591549295774648, "eval_ORGANIZATION_f1": 0.7162162162162162, "eval_ORGANIZATION_number": 65, "eval_ORGANIZATION_precision": 0.6385542168674698, "eval_ORGANIZATION_recall": 0.8153846153846154, "eval_PERSON_f1": 0.8498402555910542, "eval_PERSON_number": 150, "eval_PERSON_precision": 0.8159509202453987, "eval_PERSON_recall": 0.8866666666666667, "eval_QUANTITY_f1": 0.7200000000000001, "eval_QUANTITY_number": 33, "eval_QUANTITY_precision": 0.6428571428571429, "eval_QUANTITY_recall": 0.8181818181818182, "eval_TIME_f1": 0.8571428571428571, "eval_TIME_number": 28, "eval_TIME_precision": 0.8571428571428571, "eval_TIME_recall": 0.8571428571428571, "eval_loss": 0.13079425692558289, "eval_overall_accuracy": 0.957807953443259, "eval_overall_f1": 0.7999999999999999, "eval_overall_precision": 0.7487437185929648, "eval_overall_recall": 0.8587896253602305, "eval_runtime": 0.3341, "eval_samples_per_second": 559.714, "eval_steps_per_second": 8.979, "step": 2014 }, { "epoch": 20.0, "grad_norm": 1.522292137145996, "learning_rate": 4e-05, "loss": 0.1051, "step": 2120 }, { "epoch": 20.0, "eval_LOCATION_f1": 0.7948717948717949, "eval_LOCATION_number": 71, "eval_LOCATION_precision": 0.7294117647058823, "eval_LOCATION_recall": 0.8732394366197183, "eval_ORGANIZATION_f1": 0.6814814814814816, "eval_ORGANIZATION_number": 65, "eval_ORGANIZATION_precision": 0.6571428571428571, "eval_ORGANIZATION_recall": 0.7076923076923077, "eval_PERSON_f1": 0.858974358974359, "eval_PERSON_number": 150, "eval_PERSON_precision": 0.8271604938271605, "eval_PERSON_recall": 0.8933333333333333, "eval_QUANTITY_f1": 0.7777777777777778, "eval_QUANTITY_number": 33, "eval_QUANTITY_precision": 0.717948717948718, "eval_QUANTITY_recall": 0.8484848484848485, "eval_TIME_f1": 0.8727272727272727, "eval_TIME_number": 28, "eval_TIME_precision": 0.8888888888888888, "eval_TIME_recall": 0.8571428571428571, "eval_loss": 0.12830358743667603, "eval_overall_accuracy": 0.9587778855480117, "eval_overall_f1": 0.8054794520547945, "eval_overall_precision": 0.7676240208877284, "eval_overall_recall": 0.8472622478386167, "eval_runtime": 0.3284, "eval_samples_per_second": 569.369, "eval_steps_per_second": 9.134, "step": 2120 }, { "epoch": 21.0, "grad_norm": 1.3046311140060425, "learning_rate": 3.9500000000000005e-05, "loss": 0.1013, "step": 2226 }, { "epoch": 21.0, "eval_LOCATION_f1": 0.8, "eval_LOCATION_number": 71, "eval_LOCATION_precision": 0.7380952380952381, "eval_LOCATION_recall": 0.8732394366197183, "eval_ORGANIZATION_f1": 0.7210884353741497, "eval_ORGANIZATION_number": 65, "eval_ORGANIZATION_precision": 0.6463414634146342, "eval_ORGANIZATION_recall": 0.8153846153846154, "eval_PERSON_f1": 0.8507936507936508, "eval_PERSON_number": 150, "eval_PERSON_precision": 0.8121212121212121, "eval_PERSON_recall": 0.8933333333333333, "eval_QUANTITY_f1": 0.736842105263158, "eval_QUANTITY_number": 33, "eval_QUANTITY_precision": 0.6511627906976745, "eval_QUANTITY_recall": 0.8484848484848485, "eval_TIME_f1": 0.8727272727272727, "eval_TIME_number": 28, "eval_TIME_precision": 0.8888888888888888, "eval_TIME_recall": 0.8571428571428571, "eval_loss": 0.1330733597278595, "eval_overall_accuracy": 0.9585354025218235, "eval_overall_f1": 0.8048128342245989, "eval_overall_precision": 0.7506234413965087, "eval_overall_recall": 0.8674351585014409, "eval_runtime": 0.335, "eval_samples_per_second": 558.137, "eval_steps_per_second": 8.954, "step": 2226 }, { "epoch": 22.0, "grad_norm": 1.648231863975525, "learning_rate": 3.9000000000000006e-05, "loss": 0.1015, "step": 2332 }, { "epoch": 22.0, "eval_LOCATION_f1": 0.7625, "eval_LOCATION_number": 71, "eval_LOCATION_precision": 0.6853932584269663, "eval_LOCATION_recall": 0.8591549295774648, "eval_ORGANIZATION_f1": 0.7044025157232704, "eval_ORGANIZATION_number": 65, "eval_ORGANIZATION_precision": 0.5957446808510638, "eval_ORGANIZATION_recall": 0.8615384615384616, "eval_PERSON_f1": 0.8481012658227848, "eval_PERSON_number": 150, "eval_PERSON_precision": 0.8072289156626506, "eval_PERSON_recall": 0.8933333333333333, "eval_QUANTITY_f1": 0.736842105263158, "eval_QUANTITY_number": 33, "eval_QUANTITY_precision": 0.6511627906976745, "eval_QUANTITY_recall": 0.8484848484848485, "eval_TIME_f1": 0.8571428571428571, "eval_TIME_number": 28, "eval_TIME_precision": 0.8571428571428571, "eval_TIME_recall": 0.8571428571428571, "eval_loss": 0.1461816430091858, "eval_overall_accuracy": 0.9529582929194956, "eval_overall_f1": 0.7900912646675358, "eval_overall_precision": 0.7214285714285714, "eval_overall_recall": 0.8731988472622478, "eval_runtime": 0.3294, "eval_samples_per_second": 567.654, "eval_steps_per_second": 9.107, "step": 2332 }, { "epoch": 23.0, "grad_norm": 1.236881136894226, "learning_rate": 3.85e-05, "loss": 0.0952, "step": 2438 }, { "epoch": 23.0, "eval_LOCATION_f1": 0.8157894736842104, "eval_LOCATION_number": 71, "eval_LOCATION_precision": 0.7654320987654321, "eval_LOCATION_recall": 0.8732394366197183, "eval_ORGANIZATION_f1": 0.7375886524822695, "eval_ORGANIZATION_number": 65, "eval_ORGANIZATION_precision": 0.6842105263157895, "eval_ORGANIZATION_recall": 0.8, "eval_PERSON_f1": 0.8525641025641025, "eval_PERSON_number": 150, "eval_PERSON_precision": 0.8209876543209876, "eval_PERSON_recall": 0.8866666666666667, "eval_QUANTITY_f1": 0.7777777777777778, "eval_QUANTITY_number": 33, "eval_QUANTITY_precision": 0.717948717948718, "eval_QUANTITY_recall": 0.8484848484848485, "eval_TIME_f1": 0.888888888888889, "eval_TIME_number": 28, "eval_TIME_precision": 0.9230769230769231, "eval_TIME_recall": 0.8571428571428571, "eval_loss": 0.12616348266601562, "eval_overall_accuracy": 0.9612027158098934, "eval_overall_f1": 0.8180574555403557, "eval_overall_precision": 0.7786458333333334, "eval_overall_recall": 0.861671469740634, "eval_runtime": 0.3359, "eval_samples_per_second": 556.671, "eval_steps_per_second": 8.931, "step": 2438 }, { "epoch": 24.0, "grad_norm": 1.727121353149414, "learning_rate": 3.8e-05, "loss": 0.0957, "step": 2544 }, { "epoch": 24.0, "eval_LOCATION_f1": 0.7870967741935485, "eval_LOCATION_number": 71, "eval_LOCATION_precision": 0.7261904761904762, "eval_LOCATION_recall": 0.8591549295774648, "eval_ORGANIZATION_f1": 0.7105263157894737, "eval_ORGANIZATION_number": 65, "eval_ORGANIZATION_precision": 0.6206896551724138, "eval_ORGANIZATION_recall": 0.8307692307692308, "eval_PERSON_f1": 0.8454258675078864, "eval_PERSON_number": 150, "eval_PERSON_precision": 0.8023952095808383, "eval_PERSON_recall": 0.8933333333333333, "eval_QUANTITY_f1": 0.736842105263158, "eval_QUANTITY_number": 33, "eval_QUANTITY_precision": 0.6511627906976745, "eval_QUANTITY_recall": 0.8484848484848485, "eval_TIME_f1": 0.8571428571428571, "eval_TIME_number": 28, "eval_TIME_precision": 0.8571428571428571, "eval_TIME_recall": 0.8571428571428571, "eval_loss": 0.14105214178562164, "eval_overall_accuracy": 0.9556256062075654, "eval_overall_f1": 0.7962962962962963, "eval_overall_precision": 0.7359413202933985, "eval_overall_recall": 0.8674351585014409, "eval_runtime": 0.3291, "eval_samples_per_second": 568.152, "eval_steps_per_second": 9.115, "step": 2544 }, { "epoch": 25.0, "grad_norm": 1.6316332817077637, "learning_rate": 3.7500000000000003e-05, "loss": 0.0913, "step": 2650 }, { "epoch": 25.0, "eval_LOCATION_f1": 0.8104575163398693, "eval_LOCATION_number": 71, "eval_LOCATION_precision": 0.7560975609756098, "eval_LOCATION_recall": 0.8732394366197183, "eval_ORGANIZATION_f1": 0.7534246575342466, "eval_ORGANIZATION_number": 65, "eval_ORGANIZATION_precision": 0.6790123456790124, "eval_ORGANIZATION_recall": 0.8461538461538461, "eval_PERSON_f1": 0.8544303797468354, "eval_PERSON_number": 150, "eval_PERSON_precision": 0.8132530120481928, "eval_PERSON_recall": 0.9, "eval_QUANTITY_f1": 0.7272727272727273, "eval_QUANTITY_number": 33, "eval_QUANTITY_precision": 0.6363636363636364, "eval_QUANTITY_recall": 0.8484848484848485, "eval_TIME_f1": 0.8421052631578947, "eval_TIME_number": 28, "eval_TIME_precision": 0.8275862068965517, "eval_TIME_recall": 0.8571428571428571, "eval_loss": 0.13811782002449036, "eval_overall_accuracy": 0.9582929194956353, "eval_overall_f1": 0.8117489986648865, "eval_overall_precision": 0.7562189054726368, "eval_overall_recall": 0.8760806916426513, "eval_runtime": 0.3289, "eval_samples_per_second": 568.489, "eval_steps_per_second": 9.12, "step": 2650 }, { "epoch": 26.0, "grad_norm": 0.5518941879272461, "learning_rate": 3.7e-05, "loss": 0.091, "step": 2756 }, { "epoch": 26.0, "eval_LOCATION_f1": 0.782051282051282, "eval_LOCATION_number": 71, "eval_LOCATION_precision": 0.7176470588235294, "eval_LOCATION_recall": 0.8591549295774648, "eval_ORGANIZATION_f1": 0.7361111111111112, "eval_ORGANIZATION_number": 65, "eval_ORGANIZATION_precision": 0.6708860759493671, "eval_ORGANIZATION_recall": 0.8153846153846154, "eval_PERSON_f1": 0.8643533123028392, "eval_PERSON_number": 150, "eval_PERSON_precision": 0.8203592814371258, "eval_PERSON_recall": 0.9133333333333333, "eval_QUANTITY_f1": 0.7179487179487178, "eval_QUANTITY_number": 33, "eval_QUANTITY_precision": 0.6222222222222222, "eval_QUANTITY_recall": 0.8484848484848485, "eval_TIME_f1": 0.8727272727272727, "eval_TIME_number": 28, "eval_TIME_precision": 0.8888888888888888, "eval_TIME_recall": 0.8571428571428571, "eval_loss": 0.13771426677703857, "eval_overall_accuracy": 0.9575654704170709, "eval_overall_f1": 0.808, "eval_overall_precision": 0.7518610421836228, "eval_overall_recall": 0.8731988472622478, "eval_runtime": 0.3343, "eval_samples_per_second": 559.442, "eval_steps_per_second": 8.975, "step": 2756 }, { "epoch": 27.0, "grad_norm": 1.4636467695236206, "learning_rate": 3.65e-05, "loss": 0.0902, "step": 2862 }, { "epoch": 27.0, "eval_LOCATION_f1": 0.7770700636942676, "eval_LOCATION_number": 71, "eval_LOCATION_precision": 0.7093023255813954, "eval_LOCATION_recall": 0.8591549295774648, "eval_ORGANIZATION_f1": 0.7248322147651007, "eval_ORGANIZATION_number": 65, "eval_ORGANIZATION_precision": 0.6428571428571429, "eval_ORGANIZATION_recall": 0.8307692307692308, "eval_PERSON_f1": 0.8517350157728706, "eval_PERSON_number": 150, "eval_PERSON_precision": 0.8083832335329342, "eval_PERSON_recall": 0.9, "eval_QUANTITY_f1": 0.6582278481012658, "eval_QUANTITY_number": 33, "eval_QUANTITY_precision": 0.5652173913043478, "eval_QUANTITY_recall": 0.7878787878787878, "eval_TIME_f1": 0.8275862068965518, "eval_TIME_number": 28, "eval_TIME_precision": 0.8, "eval_TIME_recall": 0.8571428571428571, "eval_loss": 0.14399109780788422, "eval_overall_accuracy": 0.9546556741028128, "eval_overall_f1": 0.7894736842105263, "eval_overall_precision": 0.7263922518159807, "eval_overall_recall": 0.8645533141210374, "eval_runtime": 0.3358, "eval_samples_per_second": 556.812, "eval_steps_per_second": 8.933, "step": 2862 }, { "epoch": 28.0, "grad_norm": 1.3473738431930542, "learning_rate": 3.6e-05, "loss": 0.087, "step": 2968 }, { "epoch": 28.0, "eval_LOCATION_f1": 0.794701986754967, "eval_LOCATION_number": 71, "eval_LOCATION_precision": 0.75, "eval_LOCATION_recall": 0.8450704225352113, "eval_ORGANIZATION_f1": 0.7142857142857143, "eval_ORGANIZATION_number": 65, "eval_ORGANIZATION_precision": 0.6179775280898876, "eval_ORGANIZATION_recall": 0.8461538461538461, "eval_PERSON_f1": 0.8626198083067093, "eval_PERSON_number": 150, "eval_PERSON_precision": 0.8282208588957055, "eval_PERSON_recall": 0.9, "eval_QUANTITY_f1": 0.7777777777777778, "eval_QUANTITY_number": 33, "eval_QUANTITY_precision": 0.717948717948718, "eval_QUANTITY_recall": 0.8484848484848485, "eval_TIME_f1": 0.888888888888889, "eval_TIME_number": 28, "eval_TIME_precision": 0.9230769230769231, "eval_TIME_recall": 0.8571428571428571, "eval_loss": 0.1355486363172531, "eval_overall_accuracy": 0.9582929194956353, "eval_overall_f1": 0.8118279569892473, "eval_overall_precision": 0.760705289672544, "eval_overall_recall": 0.8703170028818443, "eval_runtime": 0.3366, "eval_samples_per_second": 555.494, "eval_steps_per_second": 8.912, "step": 2968 }, { "epoch": 29.0, "grad_norm": 0.5319921970367432, "learning_rate": 3.55e-05, "loss": 0.0849, "step": 3074 }, { "epoch": 29.0, "eval_LOCATION_f1": 0.7922077922077921, "eval_LOCATION_number": 71, "eval_LOCATION_precision": 0.7349397590361446, "eval_LOCATION_recall": 0.8591549295774648, "eval_ORGANIZATION_f1": 0.6923076923076923, "eval_ORGANIZATION_number": 65, "eval_ORGANIZATION_precision": 0.5934065934065934, "eval_ORGANIZATION_recall": 0.8307692307692308, "eval_PERSON_f1": 0.8507936507936508, "eval_PERSON_number": 150, "eval_PERSON_precision": 0.8121212121212121, "eval_PERSON_recall": 0.8933333333333333, "eval_QUANTITY_f1": 0.7500000000000001, "eval_QUANTITY_number": 33, "eval_QUANTITY_precision": 0.6923076923076923, "eval_QUANTITY_recall": 0.8181818181818182, "eval_TIME_f1": 0.888888888888889, "eval_TIME_number": 28, "eval_TIME_precision": 0.9230769230769231, "eval_TIME_recall": 0.8571428571428571, "eval_loss": 0.13350827991962433, "eval_overall_accuracy": 0.9585354025218235, "eval_overall_f1": 0.7989347536617842, "eval_overall_precision": 0.7425742574257426, "eval_overall_recall": 0.8645533141210374, "eval_runtime": 0.3368, "eval_samples_per_second": 555.248, "eval_steps_per_second": 8.908, "step": 3074 }, { "epoch": 30.0, "grad_norm": 1.0683906078338623, "learning_rate": 3.5e-05, "loss": 0.0815, "step": 3180 }, { "epoch": 30.0, "eval_LOCATION_f1": 0.7973856209150327, "eval_LOCATION_number": 71, "eval_LOCATION_precision": 0.7439024390243902, "eval_LOCATION_recall": 0.8591549295774648, "eval_ORGANIZATION_f1": 0.7310344827586207, "eval_ORGANIZATION_number": 65, "eval_ORGANIZATION_precision": 0.6625, "eval_ORGANIZATION_recall": 0.8153846153846154, "eval_PERSON_f1": 0.8717948717948718, "eval_PERSON_number": 150, "eval_PERSON_precision": 0.8395061728395061, "eval_PERSON_recall": 0.9066666666666666, "eval_QUANTITY_f1": 0.7567567567567567, "eval_QUANTITY_number": 33, "eval_QUANTITY_precision": 0.6829268292682927, "eval_QUANTITY_recall": 0.8484848484848485, "eval_TIME_f1": 0.888888888888889, "eval_TIME_number": 28, "eval_TIME_precision": 0.9230769230769231, "eval_TIME_recall": 0.8571428571428571, "eval_loss": 0.13375303149223328, "eval_overall_accuracy": 0.9612027158098934, "eval_overall_f1": 0.8184281842818427, "eval_overall_precision": 0.7723785166240409, "eval_overall_recall": 0.8703170028818443, "eval_runtime": 0.3368, "eval_samples_per_second": 555.175, "eval_steps_per_second": 8.907, "step": 3180 }, { "epoch": 31.0, "grad_norm": 0.8525239825248718, "learning_rate": 3.45e-05, "loss": 0.0838, "step": 3286 }, { "epoch": 31.0, "eval_LOCATION_f1": 0.782051282051282, "eval_LOCATION_number": 71, "eval_LOCATION_precision": 0.7176470588235294, "eval_LOCATION_recall": 0.8591549295774648, "eval_ORGANIZATION_f1": 0.7333333333333334, "eval_ORGANIZATION_number": 65, "eval_ORGANIZATION_precision": 0.6470588235294118, "eval_ORGANIZATION_recall": 0.8461538461538461, "eval_PERSON_f1": 0.8670886075949367, "eval_PERSON_number": 150, "eval_PERSON_precision": 0.8253012048192772, "eval_PERSON_recall": 0.9133333333333333, "eval_QUANTITY_f1": 0.7567567567567567, "eval_QUANTITY_number": 33, "eval_QUANTITY_precision": 0.6829268292682927, "eval_QUANTITY_recall": 0.8484848484848485, "eval_TIME_f1": 0.888888888888889, "eval_TIME_number": 28, "eval_TIME_precision": 0.9230769230769231, "eval_TIME_recall": 0.8571428571428571, "eval_loss": 0.13723136484622955, "eval_overall_accuracy": 0.9587778855480117, "eval_overall_f1": 0.8133333333333335, "eval_overall_precision": 0.7568238213399504, "eval_overall_recall": 0.8789625360230547, "eval_runtime": 0.334, "eval_samples_per_second": 559.823, "eval_steps_per_second": 8.981, "step": 3286 }, { "epoch": 32.0, "grad_norm": 1.4616408348083496, "learning_rate": 3.4000000000000007e-05, "loss": 0.076, "step": 3392 }, { "epoch": 32.0, "eval_LOCATION_f1": 0.7770700636942676, "eval_LOCATION_number": 71, "eval_LOCATION_precision": 0.7093023255813954, "eval_LOCATION_recall": 0.8591549295774648, "eval_ORGANIZATION_f1": 0.708860759493671, "eval_ORGANIZATION_number": 65, "eval_ORGANIZATION_precision": 0.6021505376344086, "eval_ORGANIZATION_recall": 0.8615384615384616, "eval_PERSON_f1": 0.8643533123028392, "eval_PERSON_number": 150, "eval_PERSON_precision": 0.8203592814371258, "eval_PERSON_recall": 0.9133333333333333, "eval_QUANTITY_f1": 0.7088607594936709, "eval_QUANTITY_number": 33, "eval_QUANTITY_precision": 0.6086956521739131, "eval_QUANTITY_recall": 0.8484848484848485, "eval_TIME_f1": 0.8727272727272727, "eval_TIME_number": 28, "eval_TIME_precision": 0.8888888888888888, "eval_TIME_recall": 0.8571428571428571, "eval_loss": 0.1504770815372467, "eval_overall_accuracy": 0.954898157129001, "eval_overall_f1": 0.7989556135770235, "eval_overall_precision": 0.7303102625298329, "eval_overall_recall": 0.8818443804034583, "eval_runtime": 0.3282, "eval_samples_per_second": 569.822, "eval_steps_per_second": 9.142, "step": 3392 }, { "epoch": 33.0, "grad_norm": 2.1258466243743896, "learning_rate": 3.35e-05, "loss": 0.0775, "step": 3498 }, { "epoch": 33.0, "eval_LOCATION_f1": 0.8104575163398693, "eval_LOCATION_number": 71, "eval_LOCATION_precision": 0.7560975609756098, "eval_LOCATION_recall": 0.8732394366197183, "eval_ORGANIZATION_f1": 0.72992700729927, "eval_ORGANIZATION_number": 65, "eval_ORGANIZATION_precision": 0.6944444444444444, "eval_ORGANIZATION_recall": 0.7692307692307693, "eval_PERSON_f1": 0.8717948717948718, "eval_PERSON_number": 150, "eval_PERSON_precision": 0.8395061728395061, "eval_PERSON_recall": 0.9066666666666666, "eval_QUANTITY_f1": 0.8000000000000002, "eval_QUANTITY_number": 33, "eval_QUANTITY_precision": 0.7567567567567568, "eval_QUANTITY_recall": 0.8484848484848485, "eval_TIME_f1": 0.888888888888889, "eval_TIME_number": 28, "eval_TIME_precision": 0.9230769230769231, "eval_TIME_recall": 0.8571428571428571, "eval_loss": 0.13078542053699493, "eval_overall_accuracy": 0.9633850630455868, "eval_overall_f1": 0.8264462809917356, "eval_overall_precision": 0.7915567282321899, "eval_overall_recall": 0.8645533141210374, "eval_runtime": 0.3348, "eval_samples_per_second": 558.49, "eval_steps_per_second": 8.96, "step": 3498 }, { "epoch": 34.0, "grad_norm": 1.6660958528518677, "learning_rate": 3.3e-05, "loss": 0.0768, "step": 3604 }, { "epoch": 34.0, "eval_LOCATION_f1": 0.8104575163398693, "eval_LOCATION_number": 71, "eval_LOCATION_precision": 0.7560975609756098, "eval_LOCATION_recall": 0.8732394366197183, "eval_ORGANIZATION_f1": 0.7516778523489933, "eval_ORGANIZATION_number": 65, "eval_ORGANIZATION_precision": 0.6666666666666666, "eval_ORGANIZATION_recall": 0.8615384615384616, "eval_PERSON_f1": 0.8681672025723473, "eval_PERSON_number": 150, "eval_PERSON_precision": 0.8385093167701864, "eval_PERSON_recall": 0.9, "eval_QUANTITY_f1": 0.7777777777777778, "eval_QUANTITY_number": 33, "eval_QUANTITY_precision": 0.717948717948718, "eval_QUANTITY_recall": 0.8484848484848485, "eval_TIME_f1": 0.888888888888889, "eval_TIME_number": 28, "eval_TIME_precision": 0.9230769230769231, "eval_TIME_recall": 0.8571428571428571, "eval_loss": 0.13354364037513733, "eval_overall_accuracy": 0.9612027158098934, "eval_overall_f1": 0.8254397834912043, "eval_overall_precision": 0.7780612244897959, "eval_overall_recall": 0.8789625360230547, "eval_runtime": 0.3339, "eval_samples_per_second": 560.029, "eval_steps_per_second": 8.984, "step": 3604 }, { "epoch": 35.0, "grad_norm": 0.7892407774925232, "learning_rate": 3.2500000000000004e-05, "loss": 0.0746, "step": 3710 }, { "epoch": 35.0, "eval_LOCATION_f1": 0.7870967741935485, "eval_LOCATION_number": 71, "eval_LOCATION_precision": 0.7261904761904762, "eval_LOCATION_recall": 0.8591549295774648, "eval_ORGANIZATION_f1": 0.7549668874172185, "eval_ORGANIZATION_number": 65, "eval_ORGANIZATION_precision": 0.6627906976744186, "eval_ORGANIZATION_recall": 0.8769230769230769, "eval_PERSON_f1": 0.8745980707395499, "eval_PERSON_number": 150, "eval_PERSON_precision": 0.84472049689441, "eval_PERSON_recall": 0.9066666666666666, "eval_QUANTITY_f1": 0.7671232876712328, "eval_QUANTITY_number": 33, "eval_QUANTITY_precision": 0.7, "eval_QUANTITY_recall": 0.8484848484848485, "eval_TIME_f1": 0.888888888888889, "eval_TIME_number": 28, "eval_TIME_precision": 0.9230769230769231, "eval_TIME_recall": 0.8571428571428571, "eval_loss": 0.1393873244524002, "eval_overall_accuracy": 0.9587778855480117, "eval_overall_f1": 0.8225806451612904, "eval_overall_precision": 0.7707808564231738, "eval_overall_recall": 0.8818443804034583, "eval_runtime": 0.3337, "eval_samples_per_second": 560.376, "eval_steps_per_second": 8.99, "step": 3710 }, { "epoch": 36.0, "grad_norm": 1.38412344455719, "learning_rate": 3.2000000000000005e-05, "loss": 0.0724, "step": 3816 }, { "epoch": 36.0, "eval_LOCATION_f1": 0.7948717948717949, "eval_LOCATION_number": 71, "eval_LOCATION_precision": 0.7294117647058823, "eval_LOCATION_recall": 0.8732394366197183, "eval_ORGANIZATION_f1": 0.7051282051282052, "eval_ORGANIZATION_number": 65, "eval_ORGANIZATION_precision": 0.6043956043956044, "eval_ORGANIZATION_recall": 0.8461538461538461, "eval_PERSON_f1": 0.8589341692789968, "eval_PERSON_number": 150, "eval_PERSON_precision": 0.8106508875739645, "eval_PERSON_recall": 0.9133333333333333, "eval_QUANTITY_f1": 0.8169014084507042, "eval_QUANTITY_number": 33, "eval_QUANTITY_precision": 0.7631578947368421, "eval_QUANTITY_recall": 0.8787878787878788, "eval_TIME_f1": 0.8727272727272727, "eval_TIME_number": 28, "eval_TIME_precision": 0.8888888888888888, "eval_TIME_recall": 0.8571428571428571, "eval_loss": 0.14194774627685547, "eval_overall_accuracy": 0.957807953443259, "eval_overall_f1": 0.8110964332892999, "eval_overall_precision": 0.748780487804878, "eval_overall_recall": 0.8847262247838616, "eval_runtime": 0.3344, "eval_samples_per_second": 559.292, "eval_steps_per_second": 8.973, "step": 3816 }, { "epoch": 37.0, "grad_norm": 1.6571606397628784, "learning_rate": 3.15e-05, "loss": 0.0703, "step": 3922 }, { "epoch": 37.0, "eval_LOCATION_f1": 0.7672955974842768, "eval_LOCATION_number": 71, "eval_LOCATION_precision": 0.6931818181818182, "eval_LOCATION_recall": 0.8591549295774648, "eval_ORGANIZATION_f1": 0.708860759493671, "eval_ORGANIZATION_number": 65, "eval_ORGANIZATION_precision": 0.6021505376344086, "eval_ORGANIZATION_recall": 0.8615384615384616, "eval_PERSON_f1": 0.8698412698412699, "eval_PERSON_number": 150, "eval_PERSON_precision": 0.8303030303030303, "eval_PERSON_recall": 0.9133333333333333, "eval_QUANTITY_f1": 0.6923076923076923, "eval_QUANTITY_number": 33, "eval_QUANTITY_precision": 0.6, "eval_QUANTITY_recall": 0.8181818181818182, "eval_TIME_f1": 0.8727272727272727, "eval_TIME_number": 28, "eval_TIME_precision": 0.8888888888888888, "eval_TIME_recall": 0.8571428571428571, "eval_loss": 0.15663577616214752, "eval_overall_accuracy": 0.9517458777885548, "eval_overall_f1": 0.7973856209150326, "eval_overall_precision": 0.7296650717703349, "eval_overall_recall": 0.8789625360230547, "eval_runtime": 0.3366, "eval_samples_per_second": 555.525, "eval_steps_per_second": 8.912, "step": 3922 }, { "epoch": 38.0, "grad_norm": 0.8099401593208313, "learning_rate": 3.1e-05, "loss": 0.07, "step": 4028 }, { "epoch": 38.0, "eval_LOCATION_f1": 0.7770700636942676, "eval_LOCATION_number": 71, "eval_LOCATION_precision": 0.7093023255813954, "eval_LOCATION_recall": 0.8591549295774648, "eval_ORGANIZATION_f1": 0.7432432432432433, "eval_ORGANIZATION_number": 65, "eval_ORGANIZATION_precision": 0.6626506024096386, "eval_ORGANIZATION_recall": 0.8461538461538461, "eval_PERSON_f1": 0.8789808917197452, "eval_PERSON_number": 150, "eval_PERSON_precision": 0.8414634146341463, "eval_PERSON_recall": 0.92, "eval_QUANTITY_f1": 0.6835443037974683, "eval_QUANTITY_number": 33, "eval_QUANTITY_precision": 0.5869565217391305, "eval_QUANTITY_recall": 0.8181818181818182, "eval_TIME_f1": 0.8571428571428571, "eval_TIME_number": 28, "eval_TIME_precision": 0.8571428571428571, "eval_TIME_recall": 0.8571428571428571, "eval_loss": 0.14580821990966797, "eval_overall_accuracy": 0.9570805043646945, "eval_overall_f1": 0.8090185676392573, "eval_overall_precision": 0.7493857493857494, "eval_overall_recall": 0.8789625360230547, "eval_runtime": 0.3346, "eval_samples_per_second": 558.844, "eval_steps_per_second": 8.965, "step": 4028 }, { "epoch": 39.0, "grad_norm": 1.7465280294418335, "learning_rate": 3.05e-05, "loss": 0.0688, "step": 4134 }, { "epoch": 39.0, "eval_LOCATION_f1": 0.7721518987341772, "eval_LOCATION_number": 71, "eval_LOCATION_precision": 0.7011494252873564, "eval_LOCATION_recall": 0.8591549295774648, "eval_ORGANIZATION_f1": 0.713375796178344, "eval_ORGANIZATION_number": 65, "eval_ORGANIZATION_precision": 0.6086956521739131, "eval_ORGANIZATION_recall": 0.8615384615384616, "eval_PERSON_f1": 0.8789808917197452, "eval_PERSON_number": 150, "eval_PERSON_precision": 0.8414634146341463, "eval_PERSON_recall": 0.92, "eval_QUANTITY_f1": 0.8055555555555556, "eval_QUANTITY_number": 33, "eval_QUANTITY_precision": 0.7435897435897436, "eval_QUANTITY_recall": 0.8787878787878788, "eval_TIME_f1": 0.888888888888889, "eval_TIME_number": 28, "eval_TIME_precision": 0.9230769230769231, "eval_TIME_recall": 0.8571428571428571, "eval_loss": 0.14488695561885834, "eval_overall_accuracy": 0.9582929194956353, "eval_overall_f1": 0.8158940397350992, "eval_overall_precision": 0.7549019607843137, "eval_overall_recall": 0.8876080691642652, "eval_runtime": 0.3336, "eval_samples_per_second": 560.471, "eval_steps_per_second": 8.992, "step": 4134 }, { "epoch": 40.0, "grad_norm": 0.8754693269729614, "learning_rate": 3e-05, "loss": 0.0691, "step": 4240 }, { "epoch": 40.0, "eval_LOCATION_f1": 0.8, "eval_LOCATION_number": 71, "eval_LOCATION_precision": 0.7380952380952381, "eval_LOCATION_recall": 0.8732394366197183, "eval_ORGANIZATION_f1": 0.7448275862068966, "eval_ORGANIZATION_number": 65, "eval_ORGANIZATION_precision": 0.675, "eval_ORGANIZATION_recall": 0.8307692307692308, "eval_PERSON_f1": 0.8789808917197452, "eval_PERSON_number": 150, "eval_PERSON_precision": 0.8414634146341463, "eval_PERSON_recall": 0.92, "eval_QUANTITY_f1": 0.7887323943661972, "eval_QUANTITY_number": 33, "eval_QUANTITY_precision": 0.7368421052631579, "eval_QUANTITY_recall": 0.8484848484848485, "eval_TIME_f1": 0.888888888888889, "eval_TIME_number": 28, "eval_TIME_precision": 0.9230769230769231, "eval_TIME_recall": 0.8571428571428571, "eval_loss": 0.13563859462738037, "eval_overall_accuracy": 0.9614451988360815, "eval_overall_f1": 0.8281461434370772, "eval_overall_precision": 0.7806122448979592, "eval_overall_recall": 0.8818443804034583, "eval_runtime": 0.3295, "eval_samples_per_second": 567.559, "eval_steps_per_second": 9.105, "step": 4240 }, { "epoch": 41.0, "grad_norm": 0.3340809941291809, "learning_rate": 2.95e-05, "loss": 0.0673, "step": 4346 }, { "epoch": 41.0, "eval_LOCATION_f1": 0.7721518987341772, "eval_LOCATION_number": 71, "eval_LOCATION_precision": 0.7011494252873564, "eval_LOCATION_recall": 0.8591549295774648, "eval_ORGANIZATION_f1": 0.6962025316455697, "eval_ORGANIZATION_number": 65, "eval_ORGANIZATION_precision": 0.5913978494623656, "eval_ORGANIZATION_recall": 0.8461538461538461, "eval_PERSON_f1": 0.8698412698412699, "eval_PERSON_number": 150, "eval_PERSON_precision": 0.8303030303030303, "eval_PERSON_recall": 0.9133333333333333, "eval_QUANTITY_f1": 0.7012987012987013, "eval_QUANTITY_number": 33, "eval_QUANTITY_precision": 0.6136363636363636, "eval_QUANTITY_recall": 0.8181818181818182, "eval_TIME_f1": 0.8571428571428571, "eval_TIME_number": 28, "eval_TIME_precision": 0.8571428571428571, "eval_TIME_recall": 0.8571428571428571, "eval_loss": 0.15314164757728577, "eval_overall_accuracy": 0.9539282250242483, "eval_overall_f1": 0.7958115183246073, "eval_overall_precision": 0.7290167865707434, "eval_overall_recall": 0.8760806916426513, "eval_runtime": 0.3349, "eval_samples_per_second": 558.392, "eval_steps_per_second": 8.958, "step": 4346 }, { "epoch": 42.0, "grad_norm": 0.9933107495307922, "learning_rate": 2.9e-05, "loss": 0.0663, "step": 4452 }, { "epoch": 42.0, "eval_LOCATION_f1": 0.8, "eval_LOCATION_number": 71, "eval_LOCATION_precision": 0.7380952380952381, "eval_LOCATION_recall": 0.8732394366197183, "eval_ORGANIZATION_f1": 0.7320261437908497, "eval_ORGANIZATION_number": 65, "eval_ORGANIZATION_precision": 0.6363636363636364, "eval_ORGANIZATION_recall": 0.8615384615384616, "eval_PERSON_f1": 0.8653846153846153, "eval_PERSON_number": 150, "eval_PERSON_precision": 0.8333333333333334, "eval_PERSON_recall": 0.9, "eval_QUANTITY_f1": 0.7466666666666666, "eval_QUANTITY_number": 33, "eval_QUANTITY_precision": 0.6666666666666666, "eval_QUANTITY_recall": 0.8484848484848485, "eval_TIME_f1": 0.888888888888889, "eval_TIME_number": 28, "eval_TIME_precision": 0.9230769230769231, "eval_TIME_recall": 0.8571428571428571, "eval_loss": 0.1424974650144577, "eval_overall_accuracy": 0.9580504364694471, "eval_overall_f1": 0.8144192256341789, "eval_overall_precision": 0.7587064676616916, "eval_overall_recall": 0.8789625360230547, "eval_runtime": 0.3341, "eval_samples_per_second": 559.709, "eval_steps_per_second": 8.979, "step": 4452 }, { "epoch": 43.0, "grad_norm": 0.6678488254547119, "learning_rate": 2.8499999999999998e-05, "loss": 0.0639, "step": 4558 }, { "epoch": 43.0, "eval_LOCATION_f1": 0.7948717948717949, "eval_LOCATION_number": 71, "eval_LOCATION_precision": 0.7294117647058823, "eval_LOCATION_recall": 0.8732394366197183, "eval_ORGANIZATION_f1": 0.7285714285714285, "eval_ORGANIZATION_number": 65, "eval_ORGANIZATION_precision": 0.68, "eval_ORGANIZATION_recall": 0.7846153846153846, "eval_PERSON_f1": 0.8562300319488818, "eval_PERSON_number": 150, "eval_PERSON_precision": 0.8220858895705522, "eval_PERSON_recall": 0.8933333333333333, "eval_QUANTITY_f1": 0.7671232876712328, "eval_QUANTITY_number": 33, "eval_QUANTITY_precision": 0.7, "eval_QUANTITY_recall": 0.8484848484848485, "eval_TIME_f1": 0.8727272727272727, "eval_TIME_number": 28, "eval_TIME_precision": 0.8888888888888888, "eval_TIME_recall": 0.8571428571428571, "eval_loss": 0.1413319855928421, "eval_overall_accuracy": 0.9592628516003879, "eval_overall_f1": 0.8113975576662144, "eval_overall_precision": 0.7666666666666667, "eval_overall_recall": 0.861671469740634, "eval_runtime": 0.3285, "eval_samples_per_second": 569.242, "eval_steps_per_second": 9.132, "step": 4558 }, { "epoch": 44.0, "grad_norm": 0.8438284993171692, "learning_rate": 2.8000000000000003e-05, "loss": 0.064, "step": 4664 }, { "epoch": 44.0, "eval_LOCATION_f1": 0.8104575163398693, "eval_LOCATION_number": 71, "eval_LOCATION_precision": 0.7560975609756098, "eval_LOCATION_recall": 0.8732394366197183, "eval_ORGANIZATION_f1": 0.7152317880794703, "eval_ORGANIZATION_number": 65, "eval_ORGANIZATION_precision": 0.627906976744186, "eval_ORGANIZATION_recall": 0.8307692307692308, "eval_PERSON_f1": 0.8698412698412699, "eval_PERSON_number": 150, "eval_PERSON_precision": 0.8303030303030303, "eval_PERSON_recall": 0.9133333333333333, "eval_QUANTITY_f1": 0.7777777777777778, "eval_QUANTITY_number": 33, "eval_QUANTITY_precision": 0.717948717948718, "eval_QUANTITY_recall": 0.8484848484848485, "eval_TIME_f1": 0.888888888888889, "eval_TIME_number": 28, "eval_TIME_precision": 0.9230769230769231, "eval_TIME_recall": 0.8571428571428571, "eval_loss": 0.14022959768772125, "eval_overall_accuracy": 0.9604752667313288, "eval_overall_f1": 0.8187919463087249, "eval_overall_precision": 0.7663316582914573, "eval_overall_recall": 0.8789625360230547, "eval_runtime": 0.3337, "eval_samples_per_second": 560.437, "eval_steps_per_second": 8.991, "step": 4664 }, { "epoch": 45.0, "grad_norm": 3.699862241744995, "learning_rate": 2.7500000000000004e-05, "loss": 0.0615, "step": 4770 }, { "epoch": 45.0, "eval_LOCATION_f1": 0.7721518987341772, "eval_LOCATION_number": 71, "eval_LOCATION_precision": 0.7011494252873564, "eval_LOCATION_recall": 0.8591549295774648, "eval_ORGANIZATION_f1": 0.7189542483660131, "eval_ORGANIZATION_number": 65, "eval_ORGANIZATION_precision": 0.625, "eval_ORGANIZATION_recall": 0.8461538461538461, "eval_PERSON_f1": 0.8782051282051282, "eval_PERSON_number": 150, "eval_PERSON_precision": 0.845679012345679, "eval_PERSON_recall": 0.9133333333333333, "eval_QUANTITY_f1": 0.6923076923076923, "eval_QUANTITY_number": 33, "eval_QUANTITY_precision": 0.6, "eval_QUANTITY_recall": 0.8181818181818182, "eval_TIME_f1": 0.8727272727272727, "eval_TIME_number": 28, "eval_TIME_precision": 0.8888888888888888, "eval_TIME_recall": 0.8571428571428571, "eval_loss": 0.15338602662086487, "eval_overall_accuracy": 0.9553831231813773, "eval_overall_f1": 0.8042328042328041, "eval_overall_precision": 0.7432762836185819, "eval_overall_recall": 0.8760806916426513, "eval_runtime": 0.329, "eval_samples_per_second": 568.326, "eval_steps_per_second": 9.118, "step": 4770 }, { "epoch": 46.0, "grad_norm": 0.7766585946083069, "learning_rate": 2.7000000000000002e-05, "loss": 0.0614, "step": 4876 }, { "epoch": 46.0, "eval_LOCATION_f1": 0.8104575163398693, "eval_LOCATION_number": 71, "eval_LOCATION_precision": 0.7560975609756098, "eval_LOCATION_recall": 0.8732394366197183, "eval_ORGANIZATION_f1": 0.7236842105263158, "eval_ORGANIZATION_number": 65, "eval_ORGANIZATION_precision": 0.632183908045977, "eval_ORGANIZATION_recall": 0.8461538461538461, "eval_PERSON_f1": 0.8717948717948718, "eval_PERSON_number": 150, "eval_PERSON_precision": 0.8395061728395061, "eval_PERSON_recall": 0.9066666666666666, "eval_QUANTITY_f1": 0.7887323943661972, "eval_QUANTITY_number": 33, "eval_QUANTITY_precision": 0.7368421052631579, "eval_QUANTITY_recall": 0.8484848484848485, "eval_TIME_f1": 0.888888888888889, "eval_TIME_number": 28, "eval_TIME_precision": 0.9230769230769231, "eval_TIME_recall": 0.8571428571428571, "eval_loss": 0.14268124103546143, "eval_overall_accuracy": 0.9612027158098934, "eval_overall_f1": 0.8221024258760108, "eval_overall_precision": 0.7721518987341772, "eval_overall_recall": 0.8789625360230547, "eval_runtime": 0.3343, "eval_samples_per_second": 559.326, "eval_steps_per_second": 8.973, "step": 4876 }, { "epoch": 47.0, "grad_norm": 1.664536476135254, "learning_rate": 2.6500000000000004e-05, "loss": 0.0595, "step": 4982 }, { "epoch": 47.0, "eval_LOCATION_f1": 0.7924528301886792, "eval_LOCATION_number": 71, "eval_LOCATION_precision": 0.7159090909090909, "eval_LOCATION_recall": 0.8873239436619719, "eval_ORGANIZATION_f1": 0.7320261437908497, "eval_ORGANIZATION_number": 65, "eval_ORGANIZATION_precision": 0.6363636363636364, "eval_ORGANIZATION_recall": 0.8615384615384616, "eval_PERSON_f1": 0.8761904761904761, "eval_PERSON_number": 150, "eval_PERSON_precision": 0.8363636363636363, "eval_PERSON_recall": 0.92, "eval_QUANTITY_f1": 0.7671232876712328, "eval_QUANTITY_number": 33, "eval_QUANTITY_precision": 0.7, "eval_QUANTITY_recall": 0.8484848484848485, "eval_TIME_f1": 0.8571428571428571, "eval_TIME_number": 28, "eval_TIME_precision": 0.8571428571428571, "eval_TIME_recall": 0.8571428571428571, "eval_loss": 0.154044508934021, "eval_overall_accuracy": 0.9573229873908826, "eval_overall_f1": 0.8174603174603176, "eval_overall_precision": 0.7555012224938875, "eval_overall_recall": 0.8904899135446686, "eval_runtime": 0.3363, "eval_samples_per_second": 555.98, "eval_steps_per_second": 8.919, "step": 4982 }, { "epoch": 48.0, "grad_norm": 1.3004956245422363, "learning_rate": 2.6000000000000002e-05, "loss": 0.0594, "step": 5088 }, { "epoch": 48.0, "eval_LOCATION_f1": 0.7974683544303797, "eval_LOCATION_number": 71, "eval_LOCATION_precision": 0.7241379310344828, "eval_LOCATION_recall": 0.8873239436619719, "eval_ORGANIZATION_f1": 0.7189542483660131, "eval_ORGANIZATION_number": 65, "eval_ORGANIZATION_precision": 0.625, "eval_ORGANIZATION_recall": 0.8461538461538461, "eval_PERSON_f1": 0.8690095846645367, "eval_PERSON_number": 150, "eval_PERSON_precision": 0.8343558282208589, "eval_PERSON_recall": 0.9066666666666666, "eval_QUANTITY_f1": 0.7837837837837839, "eval_QUANTITY_number": 33, "eval_QUANTITY_precision": 0.7073170731707317, "eval_QUANTITY_recall": 0.8787878787878788, "eval_TIME_f1": 0.8727272727272727, "eval_TIME_number": 28, "eval_TIME_precision": 0.8888888888888888, "eval_TIME_recall": 0.8571428571428571, "eval_loss": 0.1491357684135437, "eval_overall_accuracy": 0.9587778855480117, "eval_overall_f1": 0.8154050464807437, "eval_overall_precision": 0.7561576354679803, "eval_overall_recall": 0.8847262247838616, "eval_runtime": 0.3302, "eval_samples_per_second": 566.352, "eval_steps_per_second": 9.086, "step": 5088 }, { "epoch": 49.0, "grad_norm": 1.524907112121582, "learning_rate": 2.5500000000000003e-05, "loss": 0.0579, "step": 5194 }, { "epoch": 49.0, "eval_LOCATION_f1": 0.7974683544303797, "eval_LOCATION_number": 71, "eval_LOCATION_precision": 0.7241379310344828, "eval_LOCATION_recall": 0.8873239436619719, "eval_ORGANIZATION_f1": 0.697986577181208, "eval_ORGANIZATION_number": 65, "eval_ORGANIZATION_precision": 0.6190476190476191, "eval_ORGANIZATION_recall": 0.8, "eval_PERSON_f1": 0.8726114649681529, "eval_PERSON_number": 150, "eval_PERSON_precision": 0.8353658536585366, "eval_PERSON_recall": 0.9133333333333333, "eval_QUANTITY_f1": 0.7466666666666666, "eval_QUANTITY_number": 33, "eval_QUANTITY_precision": 0.6666666666666666, "eval_QUANTITY_recall": 0.8484848484848485, "eval_TIME_f1": 0.8727272727272727, "eval_TIME_number": 28, "eval_TIME_precision": 0.8888888888888888, "eval_TIME_recall": 0.8571428571428571, "eval_loss": 0.14881013333797455, "eval_overall_accuracy": 0.957807953443259, "eval_overall_f1": 0.8095872170439414, "eval_overall_precision": 0.7524752475247525, "eval_overall_recall": 0.8760806916426513, "eval_runtime": 0.3347, "eval_samples_per_second": 558.754, "eval_steps_per_second": 8.964, "step": 5194 }, { "epoch": 50.0, "grad_norm": 1.4106496572494507, "learning_rate": 2.5e-05, "loss": 0.0561, "step": 5300 }, { "epoch": 50.0, "eval_LOCATION_f1": 0.8051948051948051, "eval_LOCATION_number": 71, "eval_LOCATION_precision": 0.7469879518072289, "eval_LOCATION_recall": 0.8732394366197183, "eval_ORGANIZATION_f1": 0.6933333333333334, "eval_ORGANIZATION_number": 65, "eval_ORGANIZATION_precision": 0.611764705882353, "eval_ORGANIZATION_recall": 0.8, "eval_PERSON_f1": 0.8717948717948718, "eval_PERSON_number": 150, "eval_PERSON_precision": 0.8395061728395061, "eval_PERSON_recall": 0.9066666666666666, "eval_QUANTITY_f1": 0.7887323943661972, "eval_QUANTITY_number": 33, "eval_QUANTITY_precision": 0.7368421052631579, "eval_QUANTITY_recall": 0.8484848484848485, "eval_TIME_f1": 0.888888888888889, "eval_TIME_number": 28, "eval_TIME_precision": 0.9230769230769231, "eval_TIME_recall": 0.8571428571428571, "eval_loss": 0.1435040831565857, "eval_overall_accuracy": 0.9604752667313288, "eval_overall_f1": 0.8151147098515519, "eval_overall_precision": 0.766497461928934, "eval_overall_recall": 0.8703170028818443, "eval_runtime": 0.3346, "eval_samples_per_second": 558.815, "eval_steps_per_second": 8.965, "step": 5300 }, { "epoch": 51.0, "grad_norm": 0.9782974123954773, "learning_rate": 2.45e-05, "loss": 0.056, "step": 5406 }, { "epoch": 51.0, "eval_LOCATION_f1": 0.7924528301886792, "eval_LOCATION_number": 71, "eval_LOCATION_precision": 0.7159090909090909, "eval_LOCATION_recall": 0.8873239436619719, "eval_ORGANIZATION_f1": 0.6891891891891891, "eval_ORGANIZATION_number": 65, "eval_ORGANIZATION_precision": 0.6144578313253012, "eval_ORGANIZATION_recall": 0.7846153846153846, "eval_PERSON_f1": 0.8670886075949367, "eval_PERSON_number": 150, "eval_PERSON_precision": 0.8253012048192772, "eval_PERSON_recall": 0.9133333333333333, "eval_QUANTITY_f1": 0.7777777777777778, "eval_QUANTITY_number": 33, "eval_QUANTITY_precision": 0.717948717948718, "eval_QUANTITY_recall": 0.8484848484848485, "eval_TIME_f1": 0.8727272727272727, "eval_TIME_number": 28, "eval_TIME_precision": 0.8888888888888888, "eval_TIME_recall": 0.8571428571428571, "eval_loss": 0.15163768827915192, "eval_overall_accuracy": 0.9573229873908826, "eval_overall_f1": 0.808, "eval_overall_precision": 0.7518610421836228, "eval_overall_recall": 0.8731988472622478, "eval_runtime": 0.3285, "eval_samples_per_second": 569.298, "eval_steps_per_second": 9.133, "step": 5406 }, { "epoch": 52.0, "grad_norm": 0.8598395586013794, "learning_rate": 2.4e-05, "loss": 0.0547, "step": 5512 }, { "epoch": 52.0, "eval_LOCATION_f1": 0.8051948051948051, "eval_LOCATION_number": 71, "eval_LOCATION_precision": 0.7469879518072289, "eval_LOCATION_recall": 0.8732394366197183, "eval_ORGANIZATION_f1": 0.7019867549668873, "eval_ORGANIZATION_number": 65, "eval_ORGANIZATION_precision": 0.6162790697674418, "eval_ORGANIZATION_recall": 0.8153846153846154, "eval_PERSON_f1": 0.870967741935484, "eval_PERSON_number": 150, "eval_PERSON_precision": 0.84375, "eval_PERSON_recall": 0.9, "eval_QUANTITY_f1": 0.7297297297297297, "eval_QUANTITY_number": 33, "eval_QUANTITY_precision": 0.6585365853658537, "eval_QUANTITY_recall": 0.8181818181818182, "eval_TIME_f1": 0.8727272727272727, "eval_TIME_number": 28, "eval_TIME_precision": 0.8888888888888888, "eval_TIME_recall": 0.8571428571428571, "eval_loss": 0.15105435252189636, "eval_overall_accuracy": 0.9587778855480117, "eval_overall_f1": 0.8091397849462366, "eval_overall_precision": 0.7581863979848866, "eval_overall_recall": 0.8674351585014409, "eval_runtime": 0.3341, "eval_samples_per_second": 559.773, "eval_steps_per_second": 8.98, "step": 5512 }, { "epoch": 53.0, "grad_norm": 1.4993176460266113, "learning_rate": 2.35e-05, "loss": 0.0534, "step": 5618 }, { "epoch": 53.0, "eval_LOCATION_f1": 0.7974683544303797, "eval_LOCATION_number": 71, "eval_LOCATION_precision": 0.7241379310344828, "eval_LOCATION_recall": 0.8873239436619719, "eval_ORGANIZATION_f1": 0.713375796178344, "eval_ORGANIZATION_number": 65, "eval_ORGANIZATION_precision": 0.6086956521739131, "eval_ORGANIZATION_recall": 0.8615384615384616, "eval_PERSON_f1": 0.8670886075949367, "eval_PERSON_number": 150, "eval_PERSON_precision": 0.8253012048192772, "eval_PERSON_recall": 0.9133333333333333, "eval_QUANTITY_f1": 0.7200000000000001, "eval_QUANTITY_number": 33, "eval_QUANTITY_precision": 0.6428571428571429, "eval_QUANTITY_recall": 0.8181818181818182, "eval_TIME_f1": 0.8727272727272727, "eval_TIME_number": 28, "eval_TIME_precision": 0.8888888888888888, "eval_TIME_recall": 0.8571428571428571, "eval_loss": 0.16154761612415314, "eval_overall_accuracy": 0.9553831231813773, "eval_overall_f1": 0.8068331143232589, "eval_overall_precision": 0.7415458937198067, "eval_overall_recall": 0.8847262247838616, "eval_runtime": 0.3295, "eval_samples_per_second": 567.521, "eval_steps_per_second": 9.105, "step": 5618 }, { "epoch": 54.0, "grad_norm": 1.0407500267028809, "learning_rate": 2.3000000000000003e-05, "loss": 0.0526, "step": 5724 }, { "epoch": 54.0, "eval_LOCATION_f1": 0.8, "eval_LOCATION_number": 71, "eval_LOCATION_precision": 0.7380952380952381, "eval_LOCATION_recall": 0.8732394366197183, "eval_ORGANIZATION_f1": 0.6967741935483871, "eval_ORGANIZATION_number": 65, "eval_ORGANIZATION_precision": 0.6, "eval_ORGANIZATION_recall": 0.8307692307692308, "eval_PERSON_f1": 0.8717948717948718, "eval_PERSON_number": 150, "eval_PERSON_precision": 0.8395061728395061, "eval_PERSON_recall": 0.9066666666666666, "eval_QUANTITY_f1": 0.8055555555555556, "eval_QUANTITY_number": 33, "eval_QUANTITY_precision": 0.7435897435897436, "eval_QUANTITY_recall": 0.8787878787878788, "eval_TIME_f1": 0.888888888888889, "eval_TIME_number": 28, "eval_TIME_precision": 0.9230769230769231, "eval_TIME_recall": 0.8571428571428571, "eval_loss": 0.15213675796985626, "eval_overall_accuracy": 0.9580504364694471, "eval_overall_f1": 0.8155080213903744, "eval_overall_precision": 0.7605985037406484, "eval_overall_recall": 0.8789625360230547, "eval_runtime": 0.3348, "eval_samples_per_second": 558.56, "eval_steps_per_second": 8.961, "step": 5724 }, { "epoch": 55.0, "grad_norm": 0.6406387686729431, "learning_rate": 2.25e-05, "loss": 0.0538, "step": 5830 }, { "epoch": 55.0, "eval_LOCATION_f1": 0.7875000000000001, "eval_LOCATION_number": 71, "eval_LOCATION_precision": 0.7078651685393258, "eval_LOCATION_recall": 0.8873239436619719, "eval_ORGANIZATION_f1": 0.7051282051282052, "eval_ORGANIZATION_number": 65, "eval_ORGANIZATION_precision": 0.6043956043956044, "eval_ORGANIZATION_recall": 0.8461538461538461, "eval_PERSON_f1": 0.8717948717948718, "eval_PERSON_number": 150, "eval_PERSON_precision": 0.8395061728395061, "eval_PERSON_recall": 0.9066666666666666, "eval_QUANTITY_f1": 0.6923076923076923, "eval_QUANTITY_number": 33, "eval_QUANTITY_precision": 0.6, "eval_QUANTITY_recall": 0.8181818181818182, "eval_TIME_f1": 0.8727272727272727, "eval_TIME_number": 28, "eval_TIME_precision": 0.8888888888888888, "eval_TIME_recall": 0.8571428571428571, "eval_loss": 0.15997092425823212, "eval_overall_accuracy": 0.9551406401551892, "eval_overall_f1": 0.8015768725361366, "eval_overall_precision": 0.7367149758454107, "eval_overall_recall": 0.8789625360230547, "eval_runtime": 0.3348, "eval_samples_per_second": 558.524, "eval_steps_per_second": 8.96, "step": 5830 }, { "epoch": 56.0, "grad_norm": 2.387361526489258, "learning_rate": 2.2000000000000003e-05, "loss": 0.0529, "step": 5936 }, { "epoch": 56.0, "eval_LOCATION_f1": 0.7974683544303797, "eval_LOCATION_number": 71, "eval_LOCATION_precision": 0.7241379310344828, "eval_LOCATION_recall": 0.8873239436619719, "eval_ORGANIZATION_f1": 0.7096774193548387, "eval_ORGANIZATION_number": 65, "eval_ORGANIZATION_precision": 0.6111111111111112, "eval_ORGANIZATION_recall": 0.8461538461538461, "eval_PERSON_f1": 0.8726114649681529, "eval_PERSON_number": 150, "eval_PERSON_precision": 0.8353658536585366, "eval_PERSON_recall": 0.9133333333333333, "eval_QUANTITY_f1": 0.7200000000000001, "eval_QUANTITY_number": 33, "eval_QUANTITY_precision": 0.6428571428571429, "eval_QUANTITY_recall": 0.8181818181818182, "eval_TIME_f1": 0.888888888888889, "eval_TIME_number": 28, "eval_TIME_precision": 0.9230769230769231, "eval_TIME_recall": 0.8571428571428571, "eval_loss": 0.1578657031059265, "eval_overall_accuracy": 0.9570805043646945, "eval_overall_f1": 0.8095238095238096, "eval_overall_precision": 0.7481662591687042, "eval_overall_recall": 0.8818443804034583, "eval_runtime": 0.336, "eval_samples_per_second": 556.493, "eval_steps_per_second": 8.928, "step": 5936 }, { "epoch": 57.0, "grad_norm": 1.3003697395324707, "learning_rate": 2.15e-05, "loss": 0.05, "step": 6042 }, { "epoch": 57.0, "eval_LOCATION_f1": 0.8, "eval_LOCATION_number": 71, "eval_LOCATION_precision": 0.7380952380952381, "eval_LOCATION_recall": 0.8732394366197183, "eval_ORGANIZATION_f1": 0.6950354609929077, "eval_ORGANIZATION_number": 65, "eval_ORGANIZATION_precision": 0.6447368421052632, "eval_ORGANIZATION_recall": 0.7538461538461538, "eval_PERSON_f1": 0.8745980707395499, "eval_PERSON_number": 150, "eval_PERSON_precision": 0.84472049689441, "eval_PERSON_recall": 0.9066666666666666, "eval_QUANTITY_f1": 0.8055555555555556, "eval_QUANTITY_number": 33, "eval_QUANTITY_precision": 0.7435897435897436, "eval_QUANTITY_recall": 0.8787878787878788, "eval_TIME_f1": 0.888888888888889, "eval_TIME_number": 28, "eval_TIME_precision": 0.9230769230769231, "eval_TIME_recall": 0.8571428571428571, "eval_loss": 0.14940249919891357, "eval_overall_accuracy": 0.9602327837051406, "eval_overall_f1": 0.8185538881309686, "eval_overall_precision": 0.7772020725388601, "eval_overall_recall": 0.8645533141210374, "eval_runtime": 0.3282, "eval_samples_per_second": 569.855, "eval_steps_per_second": 9.142, "step": 6042 }, { "epoch": 58.0, "grad_norm": 0.7399232387542725, "learning_rate": 2.1e-05, "loss": 0.0512, "step": 6148 }, { "epoch": 58.0, "eval_LOCATION_f1": 0.7948717948717949, "eval_LOCATION_number": 71, "eval_LOCATION_precision": 0.7294117647058823, "eval_LOCATION_recall": 0.8732394366197183, "eval_ORGANIZATION_f1": 0.7042253521126761, "eval_ORGANIZATION_number": 65, "eval_ORGANIZATION_precision": 0.6493506493506493, "eval_ORGANIZATION_recall": 0.7692307692307693, "eval_PERSON_f1": 0.8717948717948718, "eval_PERSON_number": 150, "eval_PERSON_precision": 0.8395061728395061, "eval_PERSON_recall": 0.9066666666666666, "eval_QUANTITY_f1": 0.7887323943661972, "eval_QUANTITY_number": 33, "eval_QUANTITY_precision": 0.7368421052631579, "eval_QUANTITY_recall": 0.8484848484848485, "eval_TIME_f1": 0.888888888888889, "eval_TIME_number": 28, "eval_TIME_precision": 0.9230769230769231, "eval_TIME_recall": 0.8571428571428571, "eval_loss": 0.14740602672100067, "eval_overall_accuracy": 0.9597478176527643, "eval_overall_f1": 0.8163265306122449, "eval_overall_precision": 0.7731958762886598, "eval_overall_recall": 0.8645533141210374, "eval_runtime": 0.335, "eval_samples_per_second": 558.203, "eval_steps_per_second": 8.955, "step": 6148 }, { "epoch": 59.0, "grad_norm": 1.4280949831008911, "learning_rate": 2.05e-05, "loss": 0.047, "step": 6254 }, { "epoch": 59.0, "eval_LOCATION_f1": 0.7848101265822784, "eval_LOCATION_number": 71, "eval_LOCATION_precision": 0.7126436781609196, "eval_LOCATION_recall": 0.8732394366197183, "eval_ORGANIZATION_f1": 0.7248322147651007, "eval_ORGANIZATION_number": 65, "eval_ORGANIZATION_precision": 0.6428571428571429, "eval_ORGANIZATION_recall": 0.8307692307692308, "eval_PERSON_f1": 0.8782051282051282, "eval_PERSON_number": 150, "eval_PERSON_precision": 0.845679012345679, "eval_PERSON_recall": 0.9133333333333333, "eval_QUANTITY_f1": 0.7777777777777778, "eval_QUANTITY_number": 33, "eval_QUANTITY_precision": 0.717948717948718, "eval_QUANTITY_recall": 0.8484848484848485, "eval_TIME_f1": 0.888888888888889, "eval_TIME_number": 28, "eval_TIME_precision": 0.9230769230769231, "eval_TIME_recall": 0.8571428571428571, "eval_loss": 0.15319204330444336, "eval_overall_accuracy": 0.9595053346265762, "eval_overall_f1": 0.8187919463087249, "eval_overall_precision": 0.7663316582914573, "eval_overall_recall": 0.8789625360230547, "eval_runtime": 0.3345, "eval_samples_per_second": 558.972, "eval_steps_per_second": 8.967, "step": 6254 }, { "epoch": 60.0, "grad_norm": 1.479651689529419, "learning_rate": 2e-05, "loss": 0.047, "step": 6360 }, { "epoch": 60.0, "eval_LOCATION_f1": 0.7948717948717949, "eval_LOCATION_number": 71, "eval_LOCATION_precision": 0.7294117647058823, "eval_LOCATION_recall": 0.8732394366197183, "eval_ORGANIZATION_f1": 0.7096774193548387, "eval_ORGANIZATION_number": 65, "eval_ORGANIZATION_precision": 0.6111111111111112, "eval_ORGANIZATION_recall": 0.8461538461538461, "eval_PERSON_f1": 0.870967741935484, "eval_PERSON_number": 150, "eval_PERSON_precision": 0.84375, "eval_PERSON_recall": 0.9, "eval_QUANTITY_f1": 0.8169014084507042, "eval_QUANTITY_number": 33, "eval_QUANTITY_precision": 0.7631578947368421, "eval_QUANTITY_recall": 0.8787878787878788, "eval_TIME_f1": 0.888888888888889, "eval_TIME_number": 28, "eval_TIME_precision": 0.9230769230769231, "eval_TIME_recall": 0.8571428571428571, "eval_loss": 0.15390989184379578, "eval_overall_accuracy": 0.9590203685741998, "eval_overall_f1": 0.8176943699731903, "eval_overall_precision": 0.7644110275689223, "eval_overall_recall": 0.8789625360230547, "eval_runtime": 0.3361, "eval_samples_per_second": 556.409, "eval_steps_per_second": 8.926, "step": 6360 }, { "epoch": 61.0, "grad_norm": 0.868341326713562, "learning_rate": 1.9500000000000003e-05, "loss": 0.0465, "step": 6466 }, { "epoch": 61.0, "eval_LOCATION_f1": 0.7924528301886792, "eval_LOCATION_number": 71, "eval_LOCATION_precision": 0.7159090909090909, "eval_LOCATION_recall": 0.8873239436619719, "eval_ORGANIZATION_f1": 0.7105263157894737, "eval_ORGANIZATION_number": 65, "eval_ORGANIZATION_precision": 0.6206896551724138, "eval_ORGANIZATION_recall": 0.8307692307692308, "eval_PERSON_f1": 0.8726114649681529, "eval_PERSON_number": 150, "eval_PERSON_precision": 0.8353658536585366, "eval_PERSON_recall": 0.9133333333333333, "eval_QUANTITY_f1": 0.7887323943661972, "eval_QUANTITY_number": 33, "eval_QUANTITY_precision": 0.7368421052631579, "eval_QUANTITY_recall": 0.8484848484848485, "eval_TIME_f1": 0.888888888888889, "eval_TIME_number": 28, "eval_TIME_precision": 0.9230769230769231, "eval_TIME_recall": 0.8571428571428571, "eval_loss": 0.15987202525138855, "eval_overall_accuracy": 0.9585354025218235, "eval_overall_f1": 0.816, "eval_overall_precision": 0.7593052109181141, "eval_overall_recall": 0.8818443804034583, "eval_runtime": 0.3357, "eval_samples_per_second": 557.069, "eval_steps_per_second": 8.937, "step": 6466 }, { "epoch": 62.0, "grad_norm": 1.9663652181625366, "learning_rate": 1.9e-05, "loss": 0.045, "step": 6572 }, { "epoch": 62.0, "eval_LOCATION_f1": 0.8, "eval_LOCATION_number": 71, "eval_LOCATION_precision": 0.7380952380952381, "eval_LOCATION_recall": 0.8732394366197183, "eval_ORGANIZATION_f1": 0.6973684210526315, "eval_ORGANIZATION_number": 65, "eval_ORGANIZATION_precision": 0.6091954022988506, "eval_ORGANIZATION_recall": 0.8153846153846154, "eval_PERSON_f1": 0.8753993610223643, "eval_PERSON_number": 150, "eval_PERSON_precision": 0.8404907975460123, "eval_PERSON_recall": 0.9133333333333333, "eval_QUANTITY_f1": 0.8055555555555556, "eval_QUANTITY_number": 33, "eval_QUANTITY_precision": 0.7435897435897436, "eval_QUANTITY_recall": 0.8787878787878788, "eval_TIME_f1": 0.888888888888889, "eval_TIME_number": 28, "eval_TIME_precision": 0.9230769230769231, "eval_TIME_recall": 0.8571428571428571, "eval_loss": 0.1569298505783081, "eval_overall_accuracy": 0.9595053346265762, "eval_overall_f1": 0.8176943699731903, "eval_overall_precision": 0.7644110275689223, "eval_overall_recall": 0.8789625360230547, "eval_runtime": 0.334, "eval_samples_per_second": 559.847, "eval_steps_per_second": 8.982, "step": 6572 }, { "epoch": 63.0, "grad_norm": 4.453447341918945, "learning_rate": 1.85e-05, "loss": 0.0468, "step": 6678 }, { "epoch": 63.0, "eval_LOCATION_f1": 0.8104575163398693, "eval_LOCATION_number": 71, "eval_LOCATION_precision": 0.7560975609756098, "eval_LOCATION_recall": 0.8732394366197183, "eval_ORGANIZATION_f1": 0.7114093959731543, "eval_ORGANIZATION_number": 65, "eval_ORGANIZATION_precision": 0.6309523809523809, "eval_ORGANIZATION_recall": 0.8153846153846154, "eval_PERSON_f1": 0.870967741935484, "eval_PERSON_number": 150, "eval_PERSON_precision": 0.84375, "eval_PERSON_recall": 0.9, "eval_QUANTITY_f1": 0.7887323943661972, "eval_QUANTITY_number": 33, "eval_QUANTITY_precision": 0.7368421052631579, "eval_QUANTITY_recall": 0.8484848484848485, "eval_TIME_f1": 0.888888888888889, "eval_TIME_number": 28, "eval_TIME_precision": 0.9230769230769231, "eval_TIME_recall": 0.8571428571428571, "eval_loss": 0.1518780142068863, "eval_overall_accuracy": 0.9612027158098934, "eval_overall_f1": 0.8195386702849389, "eval_overall_precision": 0.7743589743589744, "eval_overall_recall": 0.8703170028818443, "eval_runtime": 0.3347, "eval_samples_per_second": 558.764, "eval_steps_per_second": 8.964, "step": 6678 }, { "epoch": 64.0, "grad_norm": 0.6715424656867981, "learning_rate": 1.8e-05, "loss": 0.0446, "step": 6784 }, { "epoch": 64.0, "eval_LOCATION_f1": 0.7922077922077921, "eval_LOCATION_number": 71, "eval_LOCATION_precision": 0.7349397590361446, "eval_LOCATION_recall": 0.8591549295774648, "eval_ORGANIZATION_f1": 0.7272727272727272, "eval_ORGANIZATION_number": 65, "eval_ORGANIZATION_precision": 0.6666666666666666, "eval_ORGANIZATION_recall": 0.8, "eval_PERSON_f1": 0.8782051282051282, "eval_PERSON_number": 150, "eval_PERSON_precision": 0.845679012345679, "eval_PERSON_recall": 0.9133333333333333, "eval_QUANTITY_f1": 0.7605633802816901, "eval_QUANTITY_number": 33, "eval_QUANTITY_precision": 0.7105263157894737, "eval_QUANTITY_recall": 0.8181818181818182, "eval_TIME_f1": 0.888888888888889, "eval_TIME_number": 28, "eval_TIME_precision": 0.9230769230769231, "eval_TIME_recall": 0.8571428571428571, "eval_loss": 0.15471045672893524, "eval_overall_accuracy": 0.9609602327837051, "eval_overall_f1": 0.8201634877384196, "eval_overall_precision": 0.7777777777777778, "eval_overall_recall": 0.8674351585014409, "eval_runtime": 0.3347, "eval_samples_per_second": 558.76, "eval_steps_per_second": 8.964, "step": 6784 }, { "epoch": 65.0, "grad_norm": 1.4069435596466064, "learning_rate": 1.75e-05, "loss": 0.0452, "step": 6890 }, { "epoch": 65.0, "eval_LOCATION_f1": 0.7948717948717949, "eval_LOCATION_number": 71, "eval_LOCATION_precision": 0.7294117647058823, "eval_LOCATION_recall": 0.8732394366197183, "eval_ORGANIZATION_f1": 0.7051282051282052, "eval_ORGANIZATION_number": 65, "eval_ORGANIZATION_precision": 0.6043956043956044, "eval_ORGANIZATION_recall": 0.8461538461538461, "eval_PERSON_f1": 0.8810289389067525, "eval_PERSON_number": 150, "eval_PERSON_precision": 0.8509316770186336, "eval_PERSON_recall": 0.9133333333333333, "eval_QUANTITY_f1": 0.7567567567567567, "eval_QUANTITY_number": 33, "eval_QUANTITY_precision": 0.6829268292682927, "eval_QUANTITY_recall": 0.8484848484848485, "eval_TIME_f1": 0.888888888888889, "eval_TIME_number": 28, "eval_TIME_precision": 0.9230769230769231, "eval_TIME_recall": 0.8571428571428571, "eval_loss": 0.16312921047210693, "eval_overall_accuracy": 0.9575654704170709, "eval_overall_f1": 0.8149134487350199, "eval_overall_precision": 0.7574257425742574, "eval_overall_recall": 0.8818443804034583, "eval_runtime": 0.3337, "eval_samples_per_second": 560.419, "eval_steps_per_second": 8.991, "step": 6890 }, { "epoch": 66.0, "grad_norm": 0.9711624383926392, "learning_rate": 1.7000000000000003e-05, "loss": 0.0442, "step": 6996 }, { "epoch": 66.0, "eval_LOCATION_f1": 0.7948717948717949, "eval_LOCATION_number": 71, "eval_LOCATION_precision": 0.7294117647058823, "eval_LOCATION_recall": 0.8732394366197183, "eval_ORGANIZATION_f1": 0.7051282051282052, "eval_ORGANIZATION_number": 65, "eval_ORGANIZATION_precision": 0.6043956043956044, "eval_ORGANIZATION_recall": 0.8461538461538461, "eval_PERSON_f1": 0.8838709677419355, "eval_PERSON_number": 150, "eval_PERSON_precision": 0.85625, "eval_PERSON_recall": 0.9133333333333333, "eval_QUANTITY_f1": 0.7837837837837839, "eval_QUANTITY_number": 33, "eval_QUANTITY_precision": 0.7073170731707317, "eval_QUANTITY_recall": 0.8787878787878788, "eval_TIME_f1": 0.8727272727272727, "eval_TIME_number": 28, "eval_TIME_precision": 0.8888888888888888, "eval_TIME_recall": 0.8571428571428571, "eval_loss": 0.1615941822528839, "eval_overall_accuracy": 0.957807953443259, "eval_overall_f1": 0.8175765645805593, "eval_overall_precision": 0.7599009900990099, "eval_overall_recall": 0.8847262247838616, "eval_runtime": 0.3285, "eval_samples_per_second": 569.32, "eval_steps_per_second": 9.133, "step": 6996 }, { "epoch": 67.0, "grad_norm": 0.3948928415775299, "learning_rate": 1.65e-05, "loss": 0.0431, "step": 7102 }, { "epoch": 67.0, "eval_LOCATION_f1": 0.7898089171974522, "eval_LOCATION_number": 71, "eval_LOCATION_precision": 0.7209302325581395, "eval_LOCATION_recall": 0.8732394366197183, "eval_ORGANIZATION_f1": 0.7019867549668873, "eval_ORGANIZATION_number": 65, "eval_ORGANIZATION_precision": 0.6162790697674418, "eval_ORGANIZATION_recall": 0.8153846153846154, "eval_PERSON_f1": 0.8690095846645367, "eval_PERSON_number": 150, "eval_PERSON_precision": 0.8343558282208589, "eval_PERSON_recall": 0.9066666666666666, "eval_QUANTITY_f1": 0.7837837837837839, "eval_QUANTITY_number": 33, "eval_QUANTITY_precision": 0.7073170731707317, "eval_QUANTITY_recall": 0.8787878787878788, "eval_TIME_f1": 0.888888888888889, "eval_TIME_number": 28, "eval_TIME_precision": 0.9230769230769231, "eval_TIME_recall": 0.8571428571428571, "eval_loss": 0.16082525253295898, "eval_overall_accuracy": 0.9582929194956353, "eval_overall_f1": 0.8117489986648865, "eval_overall_precision": 0.7562189054726368, "eval_overall_recall": 0.8760806916426513, "eval_runtime": 0.3338, "eval_samples_per_second": 560.26, "eval_steps_per_second": 8.988, "step": 7102 }, { "epoch": 68.0, "grad_norm": 1.975942611694336, "learning_rate": 1.6000000000000003e-05, "loss": 0.0427, "step": 7208 }, { "epoch": 68.0, "eval_LOCATION_f1": 0.7924528301886792, "eval_LOCATION_number": 71, "eval_LOCATION_precision": 0.7159090909090909, "eval_LOCATION_recall": 0.8873239436619719, "eval_ORGANIZATION_f1": 0.7142857142857143, "eval_ORGANIZATION_number": 65, "eval_ORGANIZATION_precision": 0.6179775280898876, "eval_ORGANIZATION_recall": 0.8461538461538461, "eval_PERSON_f1": 0.8690095846645367, "eval_PERSON_number": 150, "eval_PERSON_precision": 0.8343558282208589, "eval_PERSON_recall": 0.9066666666666666, "eval_QUANTITY_f1": 0.7012987012987013, "eval_QUANTITY_number": 33, "eval_QUANTITY_precision": 0.6136363636363636, "eval_QUANTITY_recall": 0.8181818181818182, "eval_TIME_f1": 0.8727272727272727, "eval_TIME_number": 28, "eval_TIME_precision": 0.8888888888888888, "eval_TIME_recall": 0.8571428571428571, "eval_loss": 0.16873115301132202, "eval_overall_accuracy": 0.9556256062075654, "eval_overall_f1": 0.8047493403693932, "eval_overall_precision": 0.7420924574209246, "eval_overall_recall": 0.8789625360230547, "eval_runtime": 0.3298, "eval_samples_per_second": 567.09, "eval_steps_per_second": 9.098, "step": 7208 }, { "epoch": 69.0, "grad_norm": 0.47350606322288513, "learning_rate": 1.55e-05, "loss": 0.043, "step": 7314 }, { "epoch": 69.0, "eval_LOCATION_f1": 0.7924528301886792, "eval_LOCATION_number": 71, "eval_LOCATION_precision": 0.7159090909090909, "eval_LOCATION_recall": 0.8873239436619719, "eval_ORGANIZATION_f1": 0.7012987012987013, "eval_ORGANIZATION_number": 65, "eval_ORGANIZATION_precision": 0.6067415730337079, "eval_ORGANIZATION_recall": 0.8307692307692308, "eval_PERSON_f1": 0.8717948717948718, "eval_PERSON_number": 150, "eval_PERSON_precision": 0.8395061728395061, "eval_PERSON_recall": 0.9066666666666666, "eval_QUANTITY_f1": 0.7945205479452054, "eval_QUANTITY_number": 33, "eval_QUANTITY_precision": 0.725, "eval_QUANTITY_recall": 0.8787878787878788, "eval_TIME_f1": 0.888888888888889, "eval_TIME_number": 28, "eval_TIME_precision": 0.9230769230769231, "eval_TIME_recall": 0.8571428571428571, "eval_loss": 0.16365033388137817, "eval_overall_accuracy": 0.9573229873908826, "eval_overall_f1": 0.8138297872340426, "eval_overall_precision": 0.7555555555555555, "eval_overall_recall": 0.8818443804034583, "eval_runtime": 0.3349, "eval_samples_per_second": 558.297, "eval_steps_per_second": 8.957, "step": 7314 }, { "epoch": 70.0, "grad_norm": 0.45649945735931396, "learning_rate": 1.5e-05, "loss": 0.0426, "step": 7420 }, { "epoch": 70.0, "eval_LOCATION_f1": 0.7974683544303797, "eval_LOCATION_number": 71, "eval_LOCATION_precision": 0.7241379310344828, "eval_LOCATION_recall": 0.8873239436619719, "eval_ORGANIZATION_f1": 0.7058823529411765, "eval_ORGANIZATION_number": 65, "eval_ORGANIZATION_precision": 0.6136363636363636, "eval_ORGANIZATION_recall": 0.8307692307692308, "eval_PERSON_f1": 0.8717948717948718, "eval_PERSON_number": 150, "eval_PERSON_precision": 0.8395061728395061, "eval_PERSON_recall": 0.9066666666666666, "eval_QUANTITY_f1": 0.7945205479452054, "eval_QUANTITY_number": 33, "eval_QUANTITY_precision": 0.725, "eval_QUANTITY_recall": 0.8787878787878788, "eval_TIME_f1": 0.888888888888889, "eval_TIME_number": 28, "eval_TIME_precision": 0.9230769230769231, "eval_TIME_recall": 0.8571428571428571, "eval_loss": 0.16292014718055725, "eval_overall_accuracy": 0.9580504364694471, "eval_overall_f1": 0.816, "eval_overall_precision": 0.7593052109181141, "eval_overall_recall": 0.8818443804034583, "eval_runtime": 0.3342, "eval_samples_per_second": 559.604, "eval_steps_per_second": 8.978, "step": 7420 }, { "epoch": 71.0, "grad_norm": 2.033871650695801, "learning_rate": 1.45e-05, "loss": 0.0439, "step": 7526 }, { "epoch": 71.0, "eval_LOCATION_f1": 0.775, "eval_LOCATION_number": 71, "eval_LOCATION_precision": 0.6966292134831461, "eval_LOCATION_recall": 0.8732394366197183, "eval_ORGANIZATION_f1": 0.7080745341614907, "eval_ORGANIZATION_number": 65, "eval_ORGANIZATION_precision": 0.59375, "eval_ORGANIZATION_recall": 0.8769230769230769, "eval_PERSON_f1": 0.8817891373801918, "eval_PERSON_number": 150, "eval_PERSON_precision": 0.8466257668711656, "eval_PERSON_recall": 0.92, "eval_QUANTITY_f1": 0.7631578947368421, "eval_QUANTITY_number": 33, "eval_QUANTITY_precision": 0.6744186046511628, "eval_QUANTITY_recall": 0.8787878787878788, "eval_TIME_f1": 0.888888888888889, "eval_TIME_number": 28, "eval_TIME_precision": 0.9230769230769231, "eval_TIME_recall": 0.8571428571428571, "eval_loss": 0.1787422150373459, "eval_overall_accuracy": 0.9541707080504365, "eval_overall_f1": 0.81151832460733, "eval_overall_precision": 0.7434052757793765, "eval_overall_recall": 0.8933717579250721, "eval_runtime": 0.3358, "eval_samples_per_second": 556.823, "eval_steps_per_second": 8.933, "step": 7526 }, { "epoch": 72.0, "grad_norm": 1.839992642402649, "learning_rate": 1.4000000000000001e-05, "loss": 0.0409, "step": 7632 }, { "epoch": 72.0, "eval_LOCATION_f1": 0.7922077922077921, "eval_LOCATION_number": 71, "eval_LOCATION_precision": 0.7349397590361446, "eval_LOCATION_recall": 0.8591549295774648, "eval_ORGANIZATION_f1": 0.7105263157894737, "eval_ORGANIZATION_number": 65, "eval_ORGANIZATION_precision": 0.6206896551724138, "eval_ORGANIZATION_recall": 0.8307692307692308, "eval_PERSON_f1": 0.8745980707395499, "eval_PERSON_number": 150, "eval_PERSON_precision": 0.84472049689441, "eval_PERSON_recall": 0.9066666666666666, "eval_QUANTITY_f1": 0.7945205479452054, "eval_QUANTITY_number": 33, "eval_QUANTITY_precision": 0.725, "eval_QUANTITY_recall": 0.8787878787878788, "eval_TIME_f1": 0.888888888888889, "eval_TIME_number": 28, "eval_TIME_precision": 0.9230769230769231, "eval_TIME_recall": 0.8571428571428571, "eval_loss": 0.16144876182079315, "eval_overall_accuracy": 0.9590203685741998, "eval_overall_f1": 0.8172043010752689, "eval_overall_precision": 0.7657430730478589, "eval_overall_recall": 0.8760806916426513, "eval_runtime": 0.3288, "eval_samples_per_second": 568.779, "eval_steps_per_second": 9.125, "step": 7632 }, { "epoch": 73.0, "grad_norm": 0.7383960485458374, "learning_rate": 1.3500000000000001e-05, "loss": 0.0404, "step": 7738 }, { "epoch": 73.0, "eval_LOCATION_f1": 0.7974683544303797, "eval_LOCATION_number": 71, "eval_LOCATION_precision": 0.7241379310344828, "eval_LOCATION_recall": 0.8873239436619719, "eval_ORGANIZATION_f1": 0.6928104575163399, "eval_ORGANIZATION_number": 65, "eval_ORGANIZATION_precision": 0.6022727272727273, "eval_ORGANIZATION_recall": 0.8153846153846154, "eval_PERSON_f1": 0.8717948717948718, "eval_PERSON_number": 150, "eval_PERSON_precision": 0.8395061728395061, "eval_PERSON_recall": 0.9066666666666666, "eval_QUANTITY_f1": 0.7837837837837839, "eval_QUANTITY_number": 33, "eval_QUANTITY_precision": 0.7073170731707317, "eval_QUANTITY_recall": 0.8787878787878788, "eval_TIME_f1": 0.888888888888889, "eval_TIME_number": 28, "eval_TIME_precision": 0.9230769230769231, "eval_TIME_recall": 0.8571428571428571, "eval_loss": 0.16545303165912628, "eval_overall_accuracy": 0.957807953443259, "eval_overall_f1": 0.8122503328894807, "eval_overall_precision": 0.754950495049505, "eval_overall_recall": 0.8789625360230547, "eval_runtime": 0.3357, "eval_samples_per_second": 557.128, "eval_steps_per_second": 8.938, "step": 7738 }, { "epoch": 74.0, "grad_norm": 1.1772239208221436, "learning_rate": 1.3000000000000001e-05, "loss": 0.0399, "step": 7844 }, { "epoch": 74.0, "eval_LOCATION_f1": 0.8076923076923077, "eval_LOCATION_number": 71, "eval_LOCATION_precision": 0.7411764705882353, "eval_LOCATION_recall": 0.8873239436619719, "eval_ORGANIZATION_f1": 0.6883116883116883, "eval_ORGANIZATION_number": 65, "eval_ORGANIZATION_precision": 0.5955056179775281, "eval_ORGANIZATION_recall": 0.8153846153846154, "eval_PERSON_f1": 0.8717948717948718, "eval_PERSON_number": 150, "eval_PERSON_precision": 0.8395061728395061, "eval_PERSON_recall": 0.9066666666666666, "eval_QUANTITY_f1": 0.7837837837837839, "eval_QUANTITY_number": 33, "eval_QUANTITY_precision": 0.7073170731707317, "eval_QUANTITY_recall": 0.8787878787878788, "eval_TIME_f1": 0.888888888888889, "eval_TIME_number": 28, "eval_TIME_precision": 0.9230769230769231, "eval_TIME_recall": 0.8571428571428571, "eval_loss": 0.16691727936267853, "eval_overall_accuracy": 0.9585354025218235, "eval_overall_f1": 0.8133333333333335, "eval_overall_precision": 0.7568238213399504, "eval_overall_recall": 0.8789625360230547, "eval_runtime": 0.3275, "eval_samples_per_second": 570.978, "eval_steps_per_second": 9.16, "step": 7844 }, { "epoch": 75.0, "grad_norm": 0.3011506497859955, "learning_rate": 1.25e-05, "loss": 0.04, "step": 7950 }, { "epoch": 75.0, "eval_LOCATION_f1": 0.7974683544303797, "eval_LOCATION_number": 71, "eval_LOCATION_precision": 0.7241379310344828, "eval_LOCATION_recall": 0.8873239436619719, "eval_ORGANIZATION_f1": 0.7105263157894737, "eval_ORGANIZATION_number": 65, "eval_ORGANIZATION_precision": 0.6206896551724138, "eval_ORGANIZATION_recall": 0.8307692307692308, "eval_PERSON_f1": 0.8774193548387097, "eval_PERSON_number": 150, "eval_PERSON_precision": 0.85, "eval_PERSON_recall": 0.9066666666666666, "eval_QUANTITY_f1": 0.7837837837837839, "eval_QUANTITY_number": 33, "eval_QUANTITY_precision": 0.7073170731707317, "eval_QUANTITY_recall": 0.8787878787878788, "eval_TIME_f1": 0.888888888888889, "eval_TIME_number": 28, "eval_TIME_precision": 0.9230769230769231, "eval_TIME_recall": 0.8571428571428571, "eval_loss": 0.16395699977874756, "eval_overall_accuracy": 0.9582929194956353, "eval_overall_f1": 0.8181818181818181, "eval_overall_precision": 0.7630922693266833, "eval_overall_recall": 0.8818443804034583, "eval_runtime": 0.3338, "eval_samples_per_second": 560.152, "eval_steps_per_second": 8.986, "step": 7950 }, { "epoch": 76.0, "grad_norm": 1.2410697937011719, "learning_rate": 1.2e-05, "loss": 0.0402, "step": 8056 }, { "epoch": 76.0, "eval_LOCATION_f1": 0.7924528301886792, "eval_LOCATION_number": 71, "eval_LOCATION_precision": 0.7159090909090909, "eval_LOCATION_recall": 0.8873239436619719, "eval_ORGANIZATION_f1": 0.7012987012987013, "eval_ORGANIZATION_number": 65, "eval_ORGANIZATION_precision": 0.6067415730337079, "eval_ORGANIZATION_recall": 0.8307692307692308, "eval_PERSON_f1": 0.8717948717948718, "eval_PERSON_number": 150, "eval_PERSON_precision": 0.8395061728395061, "eval_PERSON_recall": 0.9066666666666666, "eval_QUANTITY_f1": 0.7837837837837839, "eval_QUANTITY_number": 33, "eval_QUANTITY_precision": 0.7073170731707317, "eval_QUANTITY_recall": 0.8787878787878788, "eval_TIME_f1": 0.888888888888889, "eval_TIME_number": 28, "eval_TIME_precision": 0.9230769230769231, "eval_TIME_recall": 0.8571428571428571, "eval_loss": 0.16832870244979858, "eval_overall_accuracy": 0.957807953443259, "eval_overall_f1": 0.8127490039840637, "eval_overall_precision": 0.7536945812807881, "eval_overall_recall": 0.8818443804034583, "eval_runtime": 0.3293, "eval_samples_per_second": 567.933, "eval_steps_per_second": 9.111, "step": 8056 }, { "epoch": 77.0, "grad_norm": 1.8908904790878296, "learning_rate": 1.1500000000000002e-05, "loss": 0.0402, "step": 8162 }, { "epoch": 77.0, "eval_LOCATION_f1": 0.7875000000000001, "eval_LOCATION_number": 71, "eval_LOCATION_precision": 0.7078651685393258, "eval_LOCATION_recall": 0.8873239436619719, "eval_ORGANIZATION_f1": 0.7066666666666667, "eval_ORGANIZATION_number": 65, "eval_ORGANIZATION_precision": 0.6235294117647059, "eval_ORGANIZATION_recall": 0.8153846153846154, "eval_PERSON_f1": 0.8690095846645367, "eval_PERSON_number": 150, "eval_PERSON_precision": 0.8343558282208589, "eval_PERSON_recall": 0.9066666666666666, "eval_QUANTITY_f1": 0.7567567567567567, "eval_QUANTITY_number": 33, "eval_QUANTITY_precision": 0.6829268292682927, "eval_QUANTITY_recall": 0.8484848484848485, "eval_TIME_f1": 0.888888888888889, "eval_TIME_number": 28, "eval_TIME_precision": 0.9230769230769231, "eval_TIME_recall": 0.8571428571428571, "eval_loss": 0.17024052143096924, "eval_overall_accuracy": 0.9575654704170709, "eval_overall_f1": 0.8095872170439414, "eval_overall_precision": 0.7524752475247525, "eval_overall_recall": 0.8760806916426513, "eval_runtime": 0.3354, "eval_samples_per_second": 557.526, "eval_steps_per_second": 8.944, "step": 8162 }, { "epoch": 78.0, "grad_norm": 0.9162412881851196, "learning_rate": 1.1000000000000001e-05, "loss": 0.0379, "step": 8268 }, { "epoch": 78.0, "eval_LOCATION_f1": 0.7924528301886792, "eval_LOCATION_number": 71, "eval_LOCATION_precision": 0.7159090909090909, "eval_LOCATION_recall": 0.8873239436619719, "eval_ORGANIZATION_f1": 0.6928104575163399, "eval_ORGANIZATION_number": 65, "eval_ORGANIZATION_precision": 0.6022727272727273, "eval_ORGANIZATION_recall": 0.8153846153846154, "eval_PERSON_f1": 0.8653846153846153, "eval_PERSON_number": 150, "eval_PERSON_precision": 0.8333333333333334, "eval_PERSON_recall": 0.9, "eval_QUANTITY_f1": 0.7945205479452054, "eval_QUANTITY_number": 33, "eval_QUANTITY_precision": 0.725, "eval_QUANTITY_recall": 0.8787878787878788, "eval_TIME_f1": 0.888888888888889, "eval_TIME_number": 28, "eval_TIME_precision": 0.9230769230769231, "eval_TIME_recall": 0.8571428571428571, "eval_loss": 0.16936184465885162, "eval_overall_accuracy": 0.9582929194956353, "eval_overall_f1": 0.8095872170439414, "eval_overall_precision": 0.7524752475247525, "eval_overall_recall": 0.8760806916426513, "eval_runtime": 0.3352, "eval_samples_per_second": 557.918, "eval_steps_per_second": 8.951, "step": 8268 }, { "epoch": 79.0, "grad_norm": 0.6435752511024475, "learning_rate": 1.05e-05, "loss": 0.0371, "step": 8374 }, { "epoch": 79.0, "eval_LOCATION_f1": 0.7924528301886792, "eval_LOCATION_number": 71, "eval_LOCATION_precision": 0.7159090909090909, "eval_LOCATION_recall": 0.8873239436619719, "eval_ORGANIZATION_f1": 0.6883116883116883, "eval_ORGANIZATION_number": 65, "eval_ORGANIZATION_precision": 0.5955056179775281, "eval_ORGANIZATION_recall": 0.8153846153846154, "eval_PERSON_f1": 0.8810289389067525, "eval_PERSON_number": 150, "eval_PERSON_precision": 0.8509316770186336, "eval_PERSON_recall": 0.9133333333333333, "eval_QUANTITY_f1": 0.7567567567567567, "eval_QUANTITY_number": 33, "eval_QUANTITY_precision": 0.6829268292682927, "eval_QUANTITY_recall": 0.8484848484848485, "eval_TIME_f1": 0.8727272727272727, "eval_TIME_number": 28, "eval_TIME_precision": 0.8888888888888888, "eval_TIME_recall": 0.8571428571428571, "eval_loss": 0.1731194704771042, "eval_overall_accuracy": 0.9575654704170709, "eval_overall_f1": 0.8100929614873836, "eval_overall_precision": 0.7512315270935961, "eval_overall_recall": 0.8789625360230547, "eval_runtime": 0.3345, "eval_samples_per_second": 559.06, "eval_steps_per_second": 8.969, "step": 8374 }, { "epoch": 80.0, "grad_norm": 0.5504117608070374, "learning_rate": 1e-05, "loss": 0.0375, "step": 8480 }, { "epoch": 80.0, "eval_LOCATION_f1": 0.8025477707006369, "eval_LOCATION_number": 71, "eval_LOCATION_precision": 0.7325581395348837, "eval_LOCATION_recall": 0.8873239436619719, "eval_ORGANIZATION_f1": 0.6883116883116883, "eval_ORGANIZATION_number": 65, "eval_ORGANIZATION_precision": 0.5955056179775281, "eval_ORGANIZATION_recall": 0.8153846153846154, "eval_PERSON_f1": 0.8810289389067525, "eval_PERSON_number": 150, "eval_PERSON_precision": 0.8509316770186336, "eval_PERSON_recall": 0.9133333333333333, "eval_QUANTITY_f1": 0.7671232876712328, "eval_QUANTITY_number": 33, "eval_QUANTITY_precision": 0.7, "eval_QUANTITY_recall": 0.8484848484848485, "eval_TIME_f1": 0.888888888888889, "eval_TIME_number": 28, "eval_TIME_precision": 0.9230769230769231, "eval_TIME_recall": 0.8571428571428571, "eval_loss": 0.17014098167419434, "eval_overall_accuracy": 0.9575654704170709, "eval_overall_f1": 0.8144192256341789, "eval_overall_precision": 0.7587064676616916, "eval_overall_recall": 0.8789625360230547, "eval_runtime": 0.3343, "eval_samples_per_second": 559.339, "eval_steps_per_second": 8.973, "step": 8480 }, { "epoch": 81.0, "grad_norm": 0.46581876277923584, "learning_rate": 9.5e-06, "loss": 0.0367, "step": 8586 }, { "epoch": 81.0, "eval_LOCATION_f1": 0.7898089171974522, "eval_LOCATION_number": 71, "eval_LOCATION_precision": 0.7209302325581395, "eval_LOCATION_recall": 0.8732394366197183, "eval_ORGANIZATION_f1": 0.6883116883116883, "eval_ORGANIZATION_number": 65, "eval_ORGANIZATION_precision": 0.5955056179775281, "eval_ORGANIZATION_recall": 0.8153846153846154, "eval_PERSON_f1": 0.8726114649681529, "eval_PERSON_number": 150, "eval_PERSON_precision": 0.8353658536585366, "eval_PERSON_recall": 0.9133333333333333, "eval_QUANTITY_f1": 0.7837837837837839, "eval_QUANTITY_number": 33, "eval_QUANTITY_precision": 0.7073170731707317, "eval_QUANTITY_recall": 0.8787878787878788, "eval_TIME_f1": 0.888888888888889, "eval_TIME_number": 28, "eval_TIME_precision": 0.9230769230769231, "eval_TIME_recall": 0.8571428571428571, "eval_loss": 0.16831910610198975, "eval_overall_accuracy": 0.9575654704170709, "eval_overall_f1": 0.8100929614873836, "eval_overall_precision": 0.7512315270935961, "eval_overall_recall": 0.8789625360230547, "eval_runtime": 0.3306, "eval_samples_per_second": 565.697, "eval_steps_per_second": 9.075, "step": 8586 }, { "epoch": 82.0, "grad_norm": 1.1437621116638184, "learning_rate": 9e-06, "loss": 0.0369, "step": 8692 }, { "epoch": 82.0, "eval_LOCATION_f1": 0.7974683544303797, "eval_LOCATION_number": 71, "eval_LOCATION_precision": 0.7241379310344828, "eval_LOCATION_recall": 0.8873239436619719, "eval_ORGANIZATION_f1": 0.6794871794871795, "eval_ORGANIZATION_number": 65, "eval_ORGANIZATION_precision": 0.5824175824175825, "eval_ORGANIZATION_recall": 0.8153846153846154, "eval_PERSON_f1": 0.8846153846153846, "eval_PERSON_number": 150, "eval_PERSON_precision": 0.8518518518518519, "eval_PERSON_recall": 0.92, "eval_QUANTITY_f1": 0.7837837837837839, "eval_QUANTITY_number": 33, "eval_QUANTITY_precision": 0.7073170731707317, "eval_QUANTITY_recall": 0.8787878787878788, "eval_TIME_f1": 0.8727272727272727, "eval_TIME_number": 28, "eval_TIME_precision": 0.8888888888888888, "eval_TIME_recall": 0.8571428571428571, "eval_loss": 0.17457380890846252, "eval_overall_accuracy": 0.9570805043646945, "eval_overall_f1": 0.8132450331125827, "eval_overall_precision": 0.7524509803921569, "eval_overall_recall": 0.8847262247838616, "eval_runtime": 0.3281, "eval_samples_per_second": 569.937, "eval_steps_per_second": 9.143, "step": 8692 }, { "epoch": 83.0, "grad_norm": 1.673567771911621, "learning_rate": 8.500000000000002e-06, "loss": 0.0382, "step": 8798 }, { "epoch": 83.0, "eval_LOCATION_f1": 0.7848101265822784, "eval_LOCATION_number": 71, "eval_LOCATION_precision": 0.7126436781609196, "eval_LOCATION_recall": 0.8732394366197183, "eval_ORGANIZATION_f1": 0.7019867549668873, "eval_ORGANIZATION_number": 65, "eval_ORGANIZATION_precision": 0.6162790697674418, "eval_ORGANIZATION_recall": 0.8153846153846154, "eval_PERSON_f1": 0.8690095846645367, "eval_PERSON_number": 150, "eval_PERSON_precision": 0.8343558282208589, "eval_PERSON_recall": 0.9066666666666666, "eval_QUANTITY_f1": 0.7837837837837839, "eval_QUANTITY_number": 33, "eval_QUANTITY_precision": 0.7073170731707317, "eval_QUANTITY_recall": 0.8787878787878788, "eval_TIME_f1": 0.888888888888889, "eval_TIME_number": 28, "eval_TIME_precision": 0.9230769230769231, "eval_TIME_recall": 0.8571428571428571, "eval_loss": 0.16617552936077118, "eval_overall_accuracy": 0.9580504364694471, "eval_overall_f1": 0.8106666666666668, "eval_overall_precision": 0.7543424317617866, "eval_overall_recall": 0.8760806916426513, "eval_runtime": 0.3288, "eval_samples_per_second": 568.811, "eval_steps_per_second": 9.125, "step": 8798 }, { "epoch": 84.0, "grad_norm": 0.8704581260681152, "learning_rate": 8.000000000000001e-06, "loss": 0.0376, "step": 8904 }, { "epoch": 84.0, "eval_LOCATION_f1": 0.7974683544303797, "eval_LOCATION_number": 71, "eval_LOCATION_precision": 0.7241379310344828, "eval_LOCATION_recall": 0.8873239436619719, "eval_ORGANIZATION_f1": 0.6973684210526315, "eval_ORGANIZATION_number": 65, "eval_ORGANIZATION_precision": 0.6091954022988506, "eval_ORGANIZATION_recall": 0.8153846153846154, "eval_PERSON_f1": 0.8782051282051282, "eval_PERSON_number": 150, "eval_PERSON_precision": 0.845679012345679, "eval_PERSON_recall": 0.9133333333333333, "eval_QUANTITY_f1": 0.7567567567567567, "eval_QUANTITY_number": 33, "eval_QUANTITY_precision": 0.6829268292682927, "eval_QUANTITY_recall": 0.8484848484848485, "eval_TIME_f1": 0.888888888888889, "eval_TIME_number": 28, "eval_TIME_precision": 0.9230769230769231, "eval_TIME_recall": 0.8571428571428571, "eval_loss": 0.16935382783412933, "eval_overall_accuracy": 0.9582929194956353, "eval_overall_f1": 0.8133333333333335, "eval_overall_precision": 0.7568238213399504, "eval_overall_recall": 0.8789625360230547, "eval_runtime": 0.3375, "eval_samples_per_second": 554.036, "eval_steps_per_second": 8.888, "step": 8904 }, { "epoch": 85.0, "grad_norm": 2.838458299636841, "learning_rate": 7.5e-06, "loss": 0.0372, "step": 9010 }, { "epoch": 85.0, "eval_LOCATION_f1": 0.7974683544303797, "eval_LOCATION_number": 71, "eval_LOCATION_precision": 0.7241379310344828, "eval_LOCATION_recall": 0.8873239436619719, "eval_ORGANIZATION_f1": 0.7006369426751592, "eval_ORGANIZATION_number": 65, "eval_ORGANIZATION_precision": 0.5978260869565217, "eval_ORGANIZATION_recall": 0.8461538461538461, "eval_PERSON_f1": 0.8810289389067525, "eval_PERSON_number": 150, "eval_PERSON_precision": 0.8509316770186336, "eval_PERSON_recall": 0.9133333333333333, "eval_QUANTITY_f1": 0.7671232876712328, "eval_QUANTITY_number": 33, "eval_QUANTITY_precision": 0.7, "eval_QUANTITY_recall": 0.8484848484848485, "eval_TIME_f1": 0.8727272727272727, "eval_TIME_number": 28, "eval_TIME_precision": 0.8888888888888888, "eval_TIME_recall": 0.8571428571428571, "eval_loss": 0.17407700419425964, "eval_overall_accuracy": 0.9570805043646945, "eval_overall_f1": 0.8143236074270557, "eval_overall_precision": 0.7542997542997543, "eval_overall_recall": 0.8847262247838616, "eval_runtime": 0.3278, "eval_samples_per_second": 570.491, "eval_steps_per_second": 9.152, "step": 9010 }, { "epoch": 86.0, "grad_norm": 0.5828319191932678, "learning_rate": 7.000000000000001e-06, "loss": 0.0351, "step": 9116 }, { "epoch": 86.0, "eval_LOCATION_f1": 0.7924528301886792, "eval_LOCATION_number": 71, "eval_LOCATION_precision": 0.7159090909090909, "eval_LOCATION_recall": 0.8873239436619719, "eval_ORGANIZATION_f1": 0.6928104575163399, "eval_ORGANIZATION_number": 65, "eval_ORGANIZATION_precision": 0.6022727272727273, "eval_ORGANIZATION_recall": 0.8153846153846154, "eval_PERSON_f1": 0.8745980707395499, "eval_PERSON_number": 150, "eval_PERSON_precision": 0.84472049689441, "eval_PERSON_recall": 0.9066666666666666, "eval_QUANTITY_f1": 0.7837837837837839, "eval_QUANTITY_number": 33, "eval_QUANTITY_precision": 0.7073170731707317, "eval_QUANTITY_recall": 0.8787878787878788, "eval_TIME_f1": 0.8727272727272727, "eval_TIME_number": 28, "eval_TIME_precision": 0.8888888888888888, "eval_TIME_recall": 0.8571428571428571, "eval_loss": 0.17182248830795288, "eval_overall_accuracy": 0.957807953443259, "eval_overall_f1": 0.8111702127659575, "eval_overall_precision": 0.7530864197530864, "eval_overall_recall": 0.8789625360230547, "eval_runtime": 0.3288, "eval_samples_per_second": 568.789, "eval_steps_per_second": 9.125, "step": 9116 }, { "epoch": 87.0, "grad_norm": 0.9350789189338684, "learning_rate": 6.5000000000000004e-06, "loss": 0.0348, "step": 9222 }, { "epoch": 87.0, "eval_LOCATION_f1": 0.7974683544303797, "eval_LOCATION_number": 71, "eval_LOCATION_precision": 0.7241379310344828, "eval_LOCATION_recall": 0.8873239436619719, "eval_ORGANIZATION_f1": 0.6838709677419356, "eval_ORGANIZATION_number": 65, "eval_ORGANIZATION_precision": 0.5888888888888889, "eval_ORGANIZATION_recall": 0.8153846153846154, "eval_PERSON_f1": 0.8717948717948718, "eval_PERSON_number": 150, "eval_PERSON_precision": 0.8395061728395061, "eval_PERSON_recall": 0.9066666666666666, "eval_QUANTITY_f1": 0.7837837837837839, "eval_QUANTITY_number": 33, "eval_QUANTITY_precision": 0.7073170731707317, "eval_QUANTITY_recall": 0.8787878787878788, "eval_TIME_f1": 0.888888888888889, "eval_TIME_number": 28, "eval_TIME_precision": 0.9230769230769231, "eval_TIME_recall": 0.8571428571428571, "eval_loss": 0.17128072679042816, "eval_overall_accuracy": 0.9580504364694471, "eval_overall_f1": 0.8100929614873836, "eval_overall_precision": 0.7512315270935961, "eval_overall_recall": 0.8789625360230547, "eval_runtime": 0.3283, "eval_samples_per_second": 569.617, "eval_steps_per_second": 9.138, "step": 9222 }, { "epoch": 88.0, "grad_norm": 1.2203199863433838, "learning_rate": 6e-06, "loss": 0.0363, "step": 9328 }, { "epoch": 88.0, "eval_LOCATION_f1": 0.7974683544303797, "eval_LOCATION_number": 71, "eval_LOCATION_precision": 0.7241379310344828, "eval_LOCATION_recall": 0.8873239436619719, "eval_ORGANIZATION_f1": 0.6973684210526315, "eval_ORGANIZATION_number": 65, "eval_ORGANIZATION_precision": 0.6091954022988506, "eval_ORGANIZATION_recall": 0.8153846153846154, "eval_PERSON_f1": 0.8745980707395499, "eval_PERSON_number": 150, "eval_PERSON_precision": 0.84472049689441, "eval_PERSON_recall": 0.9066666666666666, "eval_QUANTITY_f1": 0.7837837837837839, "eval_QUANTITY_number": 33, "eval_QUANTITY_precision": 0.7073170731707317, "eval_QUANTITY_recall": 0.8787878787878788, "eval_TIME_f1": 0.888888888888889, "eval_TIME_number": 28, "eval_TIME_precision": 0.9230769230769231, "eval_TIME_recall": 0.8571428571428571, "eval_loss": 0.17074672877788544, "eval_overall_accuracy": 0.9585354025218235, "eval_overall_f1": 0.8144192256341789, "eval_overall_precision": 0.7587064676616916, "eval_overall_recall": 0.8789625360230547, "eval_runtime": 0.3349, "eval_samples_per_second": 558.334, "eval_steps_per_second": 8.957, "step": 9328 }, { "epoch": 89.0, "grad_norm": 0.67624431848526, "learning_rate": 5.500000000000001e-06, "loss": 0.0371, "step": 9434 }, { "epoch": 89.0, "eval_LOCATION_f1": 0.7924528301886792, "eval_LOCATION_number": 71, "eval_LOCATION_precision": 0.7159090909090909, "eval_LOCATION_recall": 0.8873239436619719, "eval_ORGANIZATION_f1": 0.6883116883116883, "eval_ORGANIZATION_number": 65, "eval_ORGANIZATION_precision": 0.5955056179775281, "eval_ORGANIZATION_recall": 0.8153846153846154, "eval_PERSON_f1": 0.8753993610223643, "eval_PERSON_number": 150, "eval_PERSON_precision": 0.8404907975460123, "eval_PERSON_recall": 0.9133333333333333, "eval_QUANTITY_f1": 0.7837837837837839, "eval_QUANTITY_number": 33, "eval_QUANTITY_precision": 0.7073170731707317, "eval_QUANTITY_recall": 0.8787878787878788, "eval_TIME_f1": 0.888888888888889, "eval_TIME_number": 28, "eval_TIME_precision": 0.9230769230769231, "eval_TIME_recall": 0.8571428571428571, "eval_loss": 0.17176063358783722, "eval_overall_accuracy": 0.9575654704170709, "eval_overall_f1": 0.8116710875331565, "eval_overall_precision": 0.7518427518427518, "eval_overall_recall": 0.8818443804034583, "eval_runtime": 0.3296, "eval_samples_per_second": 567.418, "eval_steps_per_second": 9.103, "step": 9434 }, { "epoch": 90.0, "grad_norm": 1.9259661436080933, "learning_rate": 5e-06, "loss": 0.0367, "step": 9540 }, { "epoch": 90.0, "eval_LOCATION_f1": 0.8025477707006369, "eval_LOCATION_number": 71, "eval_LOCATION_precision": 0.7325581395348837, "eval_LOCATION_recall": 0.8873239436619719, "eval_ORGANIZATION_f1": 0.6973684210526315, "eval_ORGANIZATION_number": 65, "eval_ORGANIZATION_precision": 0.6091954022988506, "eval_ORGANIZATION_recall": 0.8153846153846154, "eval_PERSON_f1": 0.887459807073955, "eval_PERSON_number": 150, "eval_PERSON_precision": 0.8571428571428571, "eval_PERSON_recall": 0.92, "eval_QUANTITY_f1": 0.7837837837837839, "eval_QUANTITY_number": 33, "eval_QUANTITY_precision": 0.7073170731707317, "eval_QUANTITY_recall": 0.8787878787878788, "eval_TIME_f1": 0.888888888888889, "eval_TIME_number": 28, "eval_TIME_precision": 0.9230769230769231, "eval_TIME_recall": 0.8571428571428571, "eval_loss": 0.17073224484920502, "eval_overall_accuracy": 0.9590203685741998, "eval_overall_f1": 0.820855614973262, "eval_overall_precision": 0.7655860349127181, "eval_overall_recall": 0.8847262247838616, "eval_runtime": 0.3289, "eval_samples_per_second": 568.538, "eval_steps_per_second": 9.121, "step": 9540 }, { "epoch": 91.0, "grad_norm": 0.5366353392601013, "learning_rate": 4.5e-06, "loss": 0.0349, "step": 9646 }, { "epoch": 91.0, "eval_LOCATION_f1": 0.7974683544303797, "eval_LOCATION_number": 71, "eval_LOCATION_precision": 0.7241379310344828, "eval_LOCATION_recall": 0.8873239436619719, "eval_ORGANIZATION_f1": 0.7096774193548387, "eval_ORGANIZATION_number": 65, "eval_ORGANIZATION_precision": 0.6111111111111112, "eval_ORGANIZATION_recall": 0.8461538461538461, "eval_PERSON_f1": 0.8717948717948718, "eval_PERSON_number": 150, "eval_PERSON_precision": 0.8395061728395061, "eval_PERSON_recall": 0.9066666666666666, "eval_QUANTITY_f1": 0.7837837837837839, "eval_QUANTITY_number": 33, "eval_QUANTITY_precision": 0.7073170731707317, "eval_QUANTITY_recall": 0.8787878787878788, "eval_TIME_f1": 0.888888888888889, "eval_TIME_number": 28, "eval_TIME_precision": 0.9230769230769231, "eval_TIME_recall": 0.8571428571428571, "eval_loss": 0.17369931936264038, "eval_overall_accuracy": 0.957807953443259, "eval_overall_f1": 0.8154050464807437, "eval_overall_precision": 0.7561576354679803, "eval_overall_recall": 0.8847262247838616, "eval_runtime": 0.3356, "eval_samples_per_second": 557.153, "eval_steps_per_second": 8.938, "step": 9646 }, { "epoch": 92.0, "grad_norm": 0.7619331479072571, "learning_rate": 4.000000000000001e-06, "loss": 0.0357, "step": 9752 }, { "epoch": 92.0, "eval_LOCATION_f1": 0.8025477707006369, "eval_LOCATION_number": 71, "eval_LOCATION_precision": 0.7325581395348837, "eval_LOCATION_recall": 0.8873239436619719, "eval_ORGANIZATION_f1": 0.7066666666666667, "eval_ORGANIZATION_number": 65, "eval_ORGANIZATION_precision": 0.6235294117647059, "eval_ORGANIZATION_recall": 0.8153846153846154, "eval_PERSON_f1": 0.8782051282051282, "eval_PERSON_number": 150, "eval_PERSON_precision": 0.845679012345679, "eval_PERSON_recall": 0.9133333333333333, "eval_QUANTITY_f1": 0.7837837837837839, "eval_QUANTITY_number": 33, "eval_QUANTITY_precision": 0.7073170731707317, "eval_QUANTITY_recall": 0.8787878787878788, "eval_TIME_f1": 0.888888888888889, "eval_TIME_number": 28, "eval_TIME_precision": 0.9230769230769231, "eval_TIME_recall": 0.8571428571428571, "eval_loss": 0.16904906928539276, "eval_overall_accuracy": 0.9590203685741998, "eval_overall_f1": 0.8192771084337349, "eval_overall_precision": 0.765, "eval_overall_recall": 0.8818443804034583, "eval_runtime": 0.3298, "eval_samples_per_second": 567.039, "eval_steps_per_second": 9.097, "step": 9752 }, { "epoch": 93.0, "grad_norm": 0.7772564888000488, "learning_rate": 3.5000000000000004e-06, "loss": 0.0345, "step": 9858 }, { "epoch": 93.0, "eval_LOCATION_f1": 0.7974683544303797, "eval_LOCATION_number": 71, "eval_LOCATION_precision": 0.7241379310344828, "eval_LOCATION_recall": 0.8873239436619719, "eval_ORGANIZATION_f1": 0.7019867549668873, "eval_ORGANIZATION_number": 65, "eval_ORGANIZATION_precision": 0.6162790697674418, "eval_ORGANIZATION_recall": 0.8153846153846154, "eval_PERSON_f1": 0.8782051282051282, "eval_PERSON_number": 150, "eval_PERSON_precision": 0.845679012345679, "eval_PERSON_recall": 0.9133333333333333, "eval_QUANTITY_f1": 0.7837837837837839, "eval_QUANTITY_number": 33, "eval_QUANTITY_precision": 0.7073170731707317, "eval_QUANTITY_recall": 0.8787878787878788, "eval_TIME_f1": 0.888888888888889, "eval_TIME_number": 28, "eval_TIME_precision": 0.9230769230769231, "eval_TIME_recall": 0.8571428571428571, "eval_loss": 0.17138922214508057, "eval_overall_accuracy": 0.9585354025218235, "eval_overall_f1": 0.8170894526034712, "eval_overall_precision": 0.7611940298507462, "eval_overall_recall": 0.8818443804034583, "eval_runtime": 0.3291, "eval_samples_per_second": 568.133, "eval_steps_per_second": 9.114, "step": 9858 }, { "epoch": 94.0, "grad_norm": 1.5932378768920898, "learning_rate": 3e-06, "loss": 0.0349, "step": 9964 }, { "epoch": 94.0, "eval_LOCATION_f1": 0.7974683544303797, "eval_LOCATION_number": 71, "eval_LOCATION_precision": 0.7241379310344828, "eval_LOCATION_recall": 0.8873239436619719, "eval_ORGANIZATION_f1": 0.6838709677419356, "eval_ORGANIZATION_number": 65, "eval_ORGANIZATION_precision": 0.5888888888888889, "eval_ORGANIZATION_recall": 0.8153846153846154, "eval_PERSON_f1": 0.8810289389067525, "eval_PERSON_number": 150, "eval_PERSON_precision": 0.8509316770186336, "eval_PERSON_recall": 0.9133333333333333, "eval_QUANTITY_f1": 0.7837837837837839, "eval_QUANTITY_number": 33, "eval_QUANTITY_precision": 0.7073170731707317, "eval_QUANTITY_recall": 0.8787878787878788, "eval_TIME_f1": 0.888888888888889, "eval_TIME_number": 28, "eval_TIME_precision": 0.9230769230769231, "eval_TIME_recall": 0.8571428571428571, "eval_loss": 0.1765890270471573, "eval_overall_accuracy": 0.9575654704170709, "eval_overall_f1": 0.8138297872340426, "eval_overall_precision": 0.7555555555555555, "eval_overall_recall": 0.8818443804034583, "eval_runtime": 0.3307, "eval_samples_per_second": 565.487, "eval_steps_per_second": 9.072, "step": 9964 }, { "epoch": 95.0, "grad_norm": 0.8269696235656738, "learning_rate": 2.5e-06, "loss": 0.0352, "step": 10070 }, { "epoch": 95.0, "eval_LOCATION_f1": 0.7974683544303797, "eval_LOCATION_number": 71, "eval_LOCATION_precision": 0.7241379310344828, "eval_LOCATION_recall": 0.8873239436619719, "eval_ORGANIZATION_f1": 0.6838709677419356, "eval_ORGANIZATION_number": 65, "eval_ORGANIZATION_precision": 0.5888888888888889, "eval_ORGANIZATION_recall": 0.8153846153846154, "eval_PERSON_f1": 0.8810289389067525, "eval_PERSON_number": 150, "eval_PERSON_precision": 0.8509316770186336, "eval_PERSON_recall": 0.9133333333333333, "eval_QUANTITY_f1": 0.7837837837837839, "eval_QUANTITY_number": 33, "eval_QUANTITY_precision": 0.7073170731707317, "eval_QUANTITY_recall": 0.8787878787878788, "eval_TIME_f1": 0.8727272727272727, "eval_TIME_number": 28, "eval_TIME_precision": 0.8888888888888888, "eval_TIME_recall": 0.8571428571428571, "eval_loss": 0.17644113302230835, "eval_overall_accuracy": 0.9575654704170709, "eval_overall_f1": 0.8127490039840637, "eval_overall_precision": 0.7536945812807881, "eval_overall_recall": 0.8818443804034583, "eval_runtime": 0.3354, "eval_samples_per_second": 557.581, "eval_steps_per_second": 8.945, "step": 10070 }, { "epoch": 96.0, "grad_norm": 1.2851319313049316, "learning_rate": 2.0000000000000003e-06, "loss": 0.0367, "step": 10176 }, { "epoch": 96.0, "eval_LOCATION_f1": 0.7974683544303797, "eval_LOCATION_number": 71, "eval_LOCATION_precision": 0.7241379310344828, "eval_LOCATION_recall": 0.8873239436619719, "eval_ORGANIZATION_f1": 0.6973684210526315, "eval_ORGANIZATION_number": 65, "eval_ORGANIZATION_precision": 0.6091954022988506, "eval_ORGANIZATION_recall": 0.8153846153846154, "eval_PERSON_f1": 0.8782051282051282, "eval_PERSON_number": 150, "eval_PERSON_precision": 0.845679012345679, "eval_PERSON_recall": 0.9133333333333333, "eval_QUANTITY_f1": 0.7837837837837839, "eval_QUANTITY_number": 33, "eval_QUANTITY_precision": 0.7073170731707317, "eval_QUANTITY_recall": 0.8787878787878788, "eval_TIME_f1": 0.888888888888889, "eval_TIME_number": 28, "eval_TIME_precision": 0.9230769230769231, "eval_TIME_recall": 0.8571428571428571, "eval_loss": 0.17299894988536835, "eval_overall_accuracy": 0.9582929194956353, "eval_overall_f1": 0.816, "eval_overall_precision": 0.7593052109181141, "eval_overall_recall": 0.8818443804034583, "eval_runtime": 0.3376, "eval_samples_per_second": 553.982, "eval_steps_per_second": 8.887, "step": 10176 }, { "epoch": 97.0, "grad_norm": 1.469909906387329, "learning_rate": 1.5e-06, "loss": 0.0352, "step": 10282 }, { "epoch": 97.0, "eval_LOCATION_f1": 0.7974683544303797, "eval_LOCATION_number": 71, "eval_LOCATION_precision": 0.7241379310344828, "eval_LOCATION_recall": 0.8873239436619719, "eval_ORGANIZATION_f1": 0.6928104575163399, "eval_ORGANIZATION_number": 65, "eval_ORGANIZATION_precision": 0.6022727272727273, "eval_ORGANIZATION_recall": 0.8153846153846154, "eval_PERSON_f1": 0.8838709677419355, "eval_PERSON_number": 150, "eval_PERSON_precision": 0.85625, "eval_PERSON_recall": 0.9133333333333333, "eval_QUANTITY_f1": 0.7837837837837839, "eval_QUANTITY_number": 33, "eval_QUANTITY_precision": 0.7073170731707317, "eval_QUANTITY_recall": 0.8787878787878788, "eval_TIME_f1": 0.888888888888889, "eval_TIME_number": 28, "eval_TIME_precision": 0.9230769230769231, "eval_TIME_recall": 0.8571428571428571, "eval_loss": 0.1724460870027542, "eval_overall_accuracy": 0.9580504364694471, "eval_overall_f1": 0.8170894526034712, "eval_overall_precision": 0.7611940298507462, "eval_overall_recall": 0.8818443804034583, "eval_runtime": 0.3347, "eval_samples_per_second": 558.712, "eval_steps_per_second": 8.963, "step": 10282 }, { "epoch": 98.0, "grad_norm": 0.9896478652954102, "learning_rate": 1.0000000000000002e-06, "loss": 0.0341, "step": 10388 }, { "epoch": 98.0, "eval_LOCATION_f1": 0.7974683544303797, "eval_LOCATION_number": 71, "eval_LOCATION_precision": 0.7241379310344828, "eval_LOCATION_recall": 0.8873239436619719, "eval_ORGANIZATION_f1": 0.6794871794871795, "eval_ORGANIZATION_number": 65, "eval_ORGANIZATION_precision": 0.5824175824175825, "eval_ORGANIZATION_recall": 0.8153846153846154, "eval_PERSON_f1": 0.8745980707395499, "eval_PERSON_number": 150, "eval_PERSON_precision": 0.84472049689441, "eval_PERSON_recall": 0.9066666666666666, "eval_QUANTITY_f1": 0.7837837837837839, "eval_QUANTITY_number": 33, "eval_QUANTITY_precision": 0.7073170731707317, "eval_QUANTITY_recall": 0.8787878787878788, "eval_TIME_f1": 0.888888888888889, "eval_TIME_number": 28, "eval_TIME_precision": 0.9230769230769231, "eval_TIME_recall": 0.8571428571428571, "eval_loss": 0.1747630089521408, "eval_overall_accuracy": 0.9570805043646945, "eval_overall_f1": 0.8100929614873836, "eval_overall_precision": 0.7512315270935961, "eval_overall_recall": 0.8789625360230547, "eval_runtime": 0.3294, "eval_samples_per_second": 567.729, "eval_steps_per_second": 9.108, "step": 10388 }, { "epoch": 99.0, "grad_norm": 1.395708441734314, "learning_rate": 5.000000000000001e-07, "loss": 0.0331, "step": 10494 }, { "epoch": 99.0, "eval_LOCATION_f1": 0.7974683544303797, "eval_LOCATION_number": 71, "eval_LOCATION_precision": 0.7241379310344828, "eval_LOCATION_recall": 0.8873239436619719, "eval_ORGANIZATION_f1": 0.6928104575163399, "eval_ORGANIZATION_number": 65, "eval_ORGANIZATION_precision": 0.6022727272727273, "eval_ORGANIZATION_recall": 0.8153846153846154, "eval_PERSON_f1": 0.8745980707395499, "eval_PERSON_number": 150, "eval_PERSON_precision": 0.84472049689441, "eval_PERSON_recall": 0.9066666666666666, "eval_QUANTITY_f1": 0.7837837837837839, "eval_QUANTITY_number": 33, "eval_QUANTITY_precision": 0.7073170731707317, "eval_QUANTITY_recall": 0.8787878787878788, "eval_TIME_f1": 0.888888888888889, "eval_TIME_number": 28, "eval_TIME_precision": 0.9230769230769231, "eval_TIME_recall": 0.8571428571428571, "eval_loss": 0.17256887257099152, "eval_overall_accuracy": 0.9580504364694471, "eval_overall_f1": 0.8133333333333335, "eval_overall_precision": 0.7568238213399504, "eval_overall_recall": 0.8789625360230547, "eval_runtime": 0.3298, "eval_samples_per_second": 567.096, "eval_steps_per_second": 9.098, "step": 10494 }, { "epoch": 100.0, "grad_norm": 0.4935811758041382, "learning_rate": 0.0, "loss": 0.0347, "step": 10600 }, { "epoch": 100.0, "eval_LOCATION_f1": 0.7974683544303797, "eval_LOCATION_number": 71, "eval_LOCATION_precision": 0.7241379310344828, "eval_LOCATION_recall": 0.8873239436619719, "eval_ORGANIZATION_f1": 0.6928104575163399, "eval_ORGANIZATION_number": 65, "eval_ORGANIZATION_precision": 0.6022727272727273, "eval_ORGANIZATION_recall": 0.8153846153846154, "eval_PERSON_f1": 0.8745980707395499, "eval_PERSON_number": 150, "eval_PERSON_precision": 0.84472049689441, "eval_PERSON_recall": 0.9066666666666666, "eval_QUANTITY_f1": 0.7837837837837839, "eval_QUANTITY_number": 33, "eval_QUANTITY_precision": 0.7073170731707317, "eval_QUANTITY_recall": 0.8787878787878788, "eval_TIME_f1": 0.888888888888889, "eval_TIME_number": 28, "eval_TIME_precision": 0.9230769230769231, "eval_TIME_recall": 0.8571428571428571, "eval_loss": 0.17283295094966888, "eval_overall_accuracy": 0.9580504364694471, "eval_overall_f1": 0.8133333333333335, "eval_overall_precision": 0.7568238213399504, "eval_overall_recall": 0.8789625360230547, "eval_runtime": 0.33, "eval_samples_per_second": 566.66, "eval_steps_per_second": 9.091, "step": 10600 }, { "epoch": 100.0, "step": 10600, "total_flos": 4639858441347408.0, "train_loss": 0.08816910017211482, "train_runtime": 595.5845, "train_samples_per_second": 283.419, "train_steps_per_second": 17.798 } ], "logging_steps": 500, "max_steps": 10600, "num_input_tokens_seen": 0, "num_train_epochs": 100, "save_steps": 500, "total_flos": 4639858441347408.0, "train_batch_size": 16, "trial_name": null, "trial_params": null }