{ "best_metric": null, "best_model_checkpoint": null, "epoch": 100.0, "eval_steps": 500, "global_step": 10600, "is_hyper_param_search": false, "is_local_process_zero": true, "is_world_process_zero": true, "log_history": [ { "epoch": 1.0, "grad_norm": 2.2026894092559814, "learning_rate": 4.9500000000000004e-05, "loss": 0.959, "step": 106 }, { "epoch": 1.0, "eval_LOCATION_f1": 0.0, "eval_LOCATION_number": 71, "eval_LOCATION_precision": 0.0, "eval_LOCATION_recall": 0.0, "eval_ORGANIZATION_f1": 0.0, "eval_ORGANIZATION_number": 65, "eval_ORGANIZATION_precision": 0.0, "eval_ORGANIZATION_recall": 0.0, "eval_PERSON_f1": 0.013071895424836602, "eval_PERSON_number": 150, "eval_PERSON_precision": 0.3333333333333333, "eval_PERSON_recall": 0.006666666666666667, "eval_QUANTITY_f1": 0.0, "eval_QUANTITY_number": 33, "eval_QUANTITY_precision": 0.0, "eval_QUANTITY_recall": 0.0, "eval_TIME_f1": 0.0, "eval_TIME_number": 28, "eval_TIME_precision": 0.0, "eval_TIME_recall": 0.0, "eval_loss": 0.6148647665977478, "eval_overall_accuracy": 0.8414161008729389, "eval_overall_f1": 0.005714285714285714, "eval_overall_precision": 0.3333333333333333, "eval_overall_recall": 0.002881844380403458, "eval_runtime": 1.0478, "eval_samples_per_second": 178.467, "eval_steps_per_second": 2.863, "step": 106 }, { "epoch": 2.0, "grad_norm": 1.3476005792617798, "learning_rate": 4.9e-05, "loss": 0.5147, "step": 212 }, { "epoch": 2.0, "eval_LOCATION_f1": 0.4705882352941176, "eval_LOCATION_number": 71, "eval_LOCATION_precision": 0.5833333333333334, "eval_LOCATION_recall": 0.39436619718309857, "eval_ORGANIZATION_f1": 0.21739130434782608, "eval_ORGANIZATION_number": 65, "eval_ORGANIZATION_precision": 0.2054794520547945, "eval_ORGANIZATION_recall": 0.23076923076923078, "eval_PERSON_f1": 0.6720867208672087, "eval_PERSON_number": 150, "eval_PERSON_precision": 0.5662100456621004, "eval_PERSON_recall": 0.8266666666666667, "eval_QUANTITY_f1": 0.21875, "eval_QUANTITY_number": 33, "eval_QUANTITY_precision": 0.22580645161290322, "eval_QUANTITY_recall": 0.21212121212121213, "eval_TIME_f1": 0.5555555555555555, "eval_TIME_number": 28, "eval_TIME_precision": 0.5769230769230769, "eval_TIME_recall": 0.5357142857142857, "eval_loss": 0.35546213388442993, "eval_overall_accuracy": 0.9059165858389913, "eval_overall_f1": 0.5080645161290323, "eval_overall_precision": 0.4760705289672544, "eval_overall_recall": 0.5446685878962536, "eval_runtime": 1.0899, "eval_samples_per_second": 171.576, "eval_steps_per_second": 2.753, "step": 212 }, { "epoch": 3.0, "grad_norm": 0.8558968901634216, "learning_rate": 4.85e-05, "loss": 0.3082, "step": 318 }, { "epoch": 3.0, "eval_LOCATION_f1": 0.5911949685534591, "eval_LOCATION_number": 71, "eval_LOCATION_precision": 0.5340909090909091, "eval_LOCATION_recall": 0.6619718309859155, "eval_ORGANIZATION_f1": 0.5846153846153846, "eval_ORGANIZATION_number": 65, "eval_ORGANIZATION_precision": 0.5846153846153846, "eval_ORGANIZATION_recall": 0.5846153846153846, "eval_PERSON_f1": 0.8307692307692307, "eval_PERSON_number": 150, "eval_PERSON_precision": 0.7714285714285715, "eval_PERSON_recall": 0.9, "eval_QUANTITY_f1": 0.44999999999999996, "eval_QUANTITY_number": 33, "eval_QUANTITY_precision": 0.3829787234042553, "eval_QUANTITY_recall": 0.5454545454545454, "eval_TIME_f1": 0.830188679245283, "eval_TIME_number": 28, "eval_TIME_precision": 0.88, "eval_TIME_recall": 0.7857142857142857, "eval_loss": 0.19337795674800873, "eval_overall_accuracy": 0.9357419980601358, "eval_overall_f1": 0.6961178045515395, "eval_overall_precision": 0.65, "eval_overall_recall": 0.7492795389048992, "eval_runtime": 1.0801, "eval_samples_per_second": 173.132, "eval_steps_per_second": 2.778, "step": 318 }, { "epoch": 4.0, "grad_norm": 0.8656661510467529, "learning_rate": 4.8e-05, "loss": 0.2009, "step": 424 }, { "epoch": 4.0, "eval_LOCATION_f1": 0.675, "eval_LOCATION_number": 71, "eval_LOCATION_precision": 0.6067415730337079, "eval_LOCATION_recall": 0.7605633802816901, "eval_ORGANIZATION_f1": 0.6114649681528661, "eval_ORGANIZATION_number": 65, "eval_ORGANIZATION_precision": 0.5217391304347826, "eval_ORGANIZATION_recall": 0.7384615384615385, "eval_PERSON_f1": 0.8517350157728706, "eval_PERSON_number": 150, "eval_PERSON_precision": 0.8083832335329342, "eval_PERSON_recall": 0.9, "eval_QUANTITY_f1": 0.48101265822784817, "eval_QUANTITY_number": 33, "eval_QUANTITY_precision": 0.41304347826086957, "eval_QUANTITY_recall": 0.5757575757575758, "eval_TIME_f1": 0.8571428571428571, "eval_TIME_number": 28, "eval_TIME_precision": 0.8571428571428571, "eval_TIME_recall": 0.8571428571428571, "eval_loss": 0.16201776266098022, "eval_overall_accuracy": 0.9415615906886518, "eval_overall_f1": 0.7282184655396619, "eval_overall_precision": 0.6635071090047393, "eval_overall_recall": 0.8069164265129684, "eval_runtime": 1.0458, "eval_samples_per_second": 178.803, "eval_steps_per_second": 2.869, "step": 424 }, { "epoch": 5.0, "grad_norm": 0.9101278185844421, "learning_rate": 4.75e-05, "loss": 0.1747, "step": 530 }, { "epoch": 5.0, "eval_LOCATION_f1": 0.7317073170731706, "eval_LOCATION_number": 71, "eval_LOCATION_precision": 0.6451612903225806, "eval_LOCATION_recall": 0.8450704225352113, "eval_ORGANIZATION_f1": 0.6621621621621622, "eval_ORGANIZATION_number": 65, "eval_ORGANIZATION_precision": 0.5903614457831325, "eval_ORGANIZATION_recall": 0.7538461538461538, "eval_PERSON_f1": 0.8698412698412699, "eval_PERSON_number": 150, "eval_PERSON_precision": 0.8303030303030303, "eval_PERSON_recall": 0.9133333333333333, "eval_QUANTITY_f1": 0.7105263157894738, "eval_QUANTITY_number": 33, "eval_QUANTITY_precision": 0.627906976744186, "eval_QUANTITY_recall": 0.8181818181818182, "eval_TIME_f1": 0.7796610169491526, "eval_TIME_number": 28, "eval_TIME_precision": 0.7419354838709677, "eval_TIME_recall": 0.8214285714285714, "eval_loss": 0.14107052981853485, "eval_overall_accuracy": 0.9510184287099903, "eval_overall_f1": 0.7769028871391075, "eval_overall_precision": 0.7132530120481928, "eval_overall_recall": 0.8530259365994236, "eval_runtime": 1.0459, "eval_samples_per_second": 178.8, "eval_steps_per_second": 2.868, "step": 530 }, { "epoch": 6.0, "grad_norm": 1.2041453123092651, "learning_rate": 4.7e-05, "loss": 0.1564, "step": 636 }, { "epoch": 6.0, "eval_LOCATION_f1": 0.7093023255813954, "eval_LOCATION_number": 71, "eval_LOCATION_precision": 0.6039603960396039, "eval_LOCATION_recall": 0.8591549295774648, "eval_ORGANIZATION_f1": 0.7037037037037037, "eval_ORGANIZATION_number": 65, "eval_ORGANIZATION_precision": 0.5876288659793815, "eval_ORGANIZATION_recall": 0.8769230769230769, "eval_PERSON_f1": 0.8359133126934984, "eval_PERSON_number": 150, "eval_PERSON_precision": 0.7803468208092486, "eval_PERSON_recall": 0.9, "eval_QUANTITY_f1": 0.6829268292682927, "eval_QUANTITY_number": 33, "eval_QUANTITY_precision": 0.5714285714285714, "eval_QUANTITY_recall": 0.8484848484848485, "eval_TIME_f1": 0.7164179104477612, "eval_TIME_number": 28, "eval_TIME_precision": 0.6153846153846154, "eval_TIME_recall": 0.8571428571428571, "eval_loss": 0.1720166802406311, "eval_overall_accuracy": 0.9401066925315228, "eval_overall_f1": 0.7568238213399504, "eval_overall_precision": 0.664488017429194, "eval_overall_recall": 0.8789625360230547, "eval_runtime": 1.0496, "eval_samples_per_second": 178.156, "eval_steps_per_second": 2.858, "step": 636 }, { "epoch": 7.0, "grad_norm": 2.570847272872925, "learning_rate": 4.6500000000000005e-05, "loss": 0.1441, "step": 742 }, { "epoch": 7.0, "eval_LOCATION_f1": 0.7100591715976331, "eval_LOCATION_number": 71, "eval_LOCATION_precision": 0.6122448979591837, "eval_LOCATION_recall": 0.8450704225352113, "eval_ORGANIZATION_f1": 0.7080745341614907, "eval_ORGANIZATION_number": 65, "eval_ORGANIZATION_precision": 0.59375, "eval_ORGANIZATION_recall": 0.8769230769230769, "eval_PERSON_f1": 0.8466257668711655, "eval_PERSON_number": 150, "eval_PERSON_precision": 0.7840909090909091, "eval_PERSON_recall": 0.92, "eval_QUANTITY_f1": 0.736842105263158, "eval_QUANTITY_number": 33, "eval_QUANTITY_precision": 0.6511627906976745, "eval_QUANTITY_recall": 0.8484848484848485, "eval_TIME_f1": 0.7796610169491526, "eval_TIME_number": 28, "eval_TIME_precision": 0.7419354838709677, "eval_TIME_recall": 0.8214285714285714, "eval_loss": 0.14682450890541077, "eval_overall_accuracy": 0.9476236663433559, "eval_overall_f1": 0.7737041719342604, "eval_overall_precision": 0.6891891891891891, "eval_overall_recall": 0.8818443804034583, "eval_runtime": 1.0693, "eval_samples_per_second": 174.879, "eval_steps_per_second": 2.806, "step": 742 }, { "epoch": 8.0, "grad_norm": 0.648723304271698, "learning_rate": 4.600000000000001e-05, "loss": 0.1299, "step": 848 }, { "epoch": 8.0, "eval_LOCATION_f1": 0.7484662576687117, "eval_LOCATION_number": 71, "eval_LOCATION_precision": 0.6630434782608695, "eval_LOCATION_recall": 0.8591549295774648, "eval_ORGANIZATION_f1": 0.7236842105263158, "eval_ORGANIZATION_number": 65, "eval_ORGANIZATION_precision": 0.632183908045977, "eval_ORGANIZATION_recall": 0.8461538461538461, "eval_PERSON_f1": 0.8761904761904761, "eval_PERSON_number": 150, "eval_PERSON_precision": 0.8363636363636363, "eval_PERSON_recall": 0.92, "eval_QUANTITY_f1": 0.7777777777777778, "eval_QUANTITY_number": 33, "eval_QUANTITY_precision": 0.717948717948718, "eval_QUANTITY_recall": 0.8484848484848485, "eval_TIME_f1": 0.8620689655172413, "eval_TIME_number": 28, "eval_TIME_precision": 0.8333333333333334, "eval_TIME_recall": 0.8928571428571429, "eval_loss": 0.12678906321525574, "eval_overall_accuracy": 0.9568380213385063, "eval_overall_f1": 0.8078947368421052, "eval_overall_precision": 0.7433414043583535, "eval_overall_recall": 0.8847262247838616, "eval_runtime": 1.0505, "eval_samples_per_second": 178.011, "eval_steps_per_second": 2.856, "step": 848 }, { "epoch": 9.0, "grad_norm": 1.1211426258087158, "learning_rate": 4.55e-05, "loss": 0.1221, "step": 954 }, { "epoch": 9.0, "eval_LOCATION_f1": 0.7547169811320754, "eval_LOCATION_number": 71, "eval_LOCATION_precision": 0.6818181818181818, "eval_LOCATION_recall": 0.8450704225352113, "eval_ORGANIZATION_f1": 0.7248322147651007, "eval_ORGANIZATION_number": 65, "eval_ORGANIZATION_precision": 0.6428571428571429, "eval_ORGANIZATION_recall": 0.8307692307692308, "eval_PERSON_f1": 0.8717948717948718, "eval_PERSON_number": 150, "eval_PERSON_precision": 0.8395061728395061, "eval_PERSON_recall": 0.9066666666666666, "eval_QUANTITY_f1": 0.7567567567567567, "eval_QUANTITY_number": 33, "eval_QUANTITY_precision": 0.6829268292682927, "eval_QUANTITY_recall": 0.8484848484848485, "eval_TIME_f1": 0.8135593220338982, "eval_TIME_number": 28, "eval_TIME_precision": 0.7741935483870968, "eval_TIME_recall": 0.8571428571428571, "eval_loss": 0.11980857700109482, "eval_overall_accuracy": 0.9565955383123181, "eval_overall_f1": 0.8021248339973439, "eval_overall_precision": 0.7438423645320197, "eval_overall_recall": 0.8703170028818443, "eval_runtime": 1.0508, "eval_samples_per_second": 177.952, "eval_steps_per_second": 2.855, "step": 954 }, { "epoch": 10.0, "grad_norm": 1.1789932250976562, "learning_rate": 4.5e-05, "loss": 0.1176, "step": 1060 }, { "epoch": 10.0, "eval_LOCATION_f1": 0.7169811320754716, "eval_LOCATION_number": 71, "eval_LOCATION_precision": 0.6477272727272727, "eval_LOCATION_recall": 0.8028169014084507, "eval_ORGANIZATION_f1": 0.7552447552447553, "eval_ORGANIZATION_number": 65, "eval_ORGANIZATION_precision": 0.6923076923076923, "eval_ORGANIZATION_recall": 0.8307692307692308, "eval_PERSON_f1": 0.8616352201257862, "eval_PERSON_number": 150, "eval_PERSON_precision": 0.8154761904761905, "eval_PERSON_recall": 0.9133333333333333, "eval_QUANTITY_f1": 0.7272727272727273, "eval_QUANTITY_number": 33, "eval_QUANTITY_precision": 0.6363636363636364, "eval_QUANTITY_recall": 0.8484848484848485, "eval_TIME_f1": 0.8421052631578947, "eval_TIME_number": 28, "eval_TIME_precision": 0.8275862068965517, "eval_TIME_recall": 0.8571428571428571, "eval_loss": 0.12928320467472076, "eval_overall_accuracy": 0.954898157129001, "eval_overall_f1": 0.7957559681697612, "eval_overall_precision": 0.7371007371007371, "eval_overall_recall": 0.8645533141210374, "eval_runtime": 1.0405, "eval_samples_per_second": 179.724, "eval_steps_per_second": 2.883, "step": 1060 }, { "epoch": 11.0, "grad_norm": 1.4546157121658325, "learning_rate": 4.4500000000000004e-05, "loss": 0.1111, "step": 1166 }, { "epoch": 11.0, "eval_LOCATION_f1": 0.7341772151898733, "eval_LOCATION_number": 71, "eval_LOCATION_precision": 0.6666666666666666, "eval_LOCATION_recall": 0.8169014084507042, "eval_ORGANIZATION_f1": 0.7323943661971831, "eval_ORGANIZATION_number": 65, "eval_ORGANIZATION_precision": 0.6753246753246753, "eval_ORGANIZATION_recall": 0.8, "eval_PERSON_f1": 0.8846153846153846, "eval_PERSON_number": 150, "eval_PERSON_precision": 0.8518518518518519, "eval_PERSON_recall": 0.92, "eval_QUANTITY_f1": 0.7777777777777778, "eval_QUANTITY_number": 33, "eval_QUANTITY_precision": 0.717948717948718, "eval_QUANTITY_recall": 0.8484848484848485, "eval_TIME_f1": 0.7796610169491526, "eval_TIME_number": 28, "eval_TIME_precision": 0.7419354838709677, "eval_TIME_recall": 0.8214285714285714, "eval_loss": 0.12095968425273895, "eval_overall_accuracy": 0.9587778855480117, "eval_overall_f1": 0.8048452220726784, "eval_overall_precision": 0.7550505050505051, "eval_overall_recall": 0.861671469740634, "eval_runtime": 1.1365, "eval_samples_per_second": 164.542, "eval_steps_per_second": 2.64, "step": 1166 }, { "epoch": 12.0, "grad_norm": 1.1820521354675293, "learning_rate": 4.4000000000000006e-05, "loss": 0.1026, "step": 1272 }, { "epoch": 12.0, "eval_LOCATION_f1": 0.7239263803680982, "eval_LOCATION_number": 71, "eval_LOCATION_precision": 0.6413043478260869, "eval_LOCATION_recall": 0.8309859154929577, "eval_ORGANIZATION_f1": 0.7261146496815286, "eval_ORGANIZATION_number": 65, "eval_ORGANIZATION_precision": 0.6195652173913043, "eval_ORGANIZATION_recall": 0.8769230769230769, "eval_PERSON_f1": 0.8810289389067525, "eval_PERSON_number": 150, "eval_PERSON_precision": 0.8509316770186336, "eval_PERSON_recall": 0.9133333333333333, "eval_QUANTITY_f1": 0.7466666666666666, "eval_QUANTITY_number": 33, "eval_QUANTITY_precision": 0.6666666666666666, "eval_QUANTITY_recall": 0.8484848484848485, "eval_TIME_f1": 0.7796610169491526, "eval_TIME_number": 28, "eval_TIME_precision": 0.7419354838709677, "eval_TIME_recall": 0.8214285714285714, "eval_loss": 0.14555691182613373, "eval_overall_accuracy": 0.9539282250242483, "eval_overall_f1": 0.7947712418300654, "eval_overall_precision": 0.7272727272727273, "eval_overall_recall": 0.8760806916426513, "eval_runtime": 1.0483, "eval_samples_per_second": 178.389, "eval_steps_per_second": 2.862, "step": 1272 }, { "epoch": 13.0, "grad_norm": 0.8939817547798157, "learning_rate": 4.35e-05, "loss": 0.0958, "step": 1378 }, { "epoch": 13.0, "eval_LOCATION_f1": 0.7417218543046357, "eval_LOCATION_number": 71, "eval_LOCATION_precision": 0.7, "eval_LOCATION_recall": 0.7887323943661971, "eval_ORGANIZATION_f1": 0.7199999999999999, "eval_ORGANIZATION_number": 65, "eval_ORGANIZATION_precision": 0.6352941176470588, "eval_ORGANIZATION_recall": 0.8307692307692308, "eval_PERSON_f1": 0.8817891373801918, "eval_PERSON_number": 150, "eval_PERSON_precision": 0.8466257668711656, "eval_PERSON_recall": 0.92, "eval_QUANTITY_f1": 0.7397260273972603, "eval_QUANTITY_number": 33, "eval_QUANTITY_precision": 0.675, "eval_QUANTITY_recall": 0.8181818181818182, "eval_TIME_f1": 0.888888888888889, "eval_TIME_number": 28, "eval_TIME_precision": 0.9230769230769231, "eval_TIME_recall": 0.8571428571428571, "eval_loss": 0.12335564196109772, "eval_overall_accuracy": 0.957807953443259, "eval_overall_f1": 0.8070175438596491, "eval_overall_precision": 0.7588832487309645, "eval_overall_recall": 0.861671469740634, "eval_runtime": 1.0637, "eval_samples_per_second": 175.806, "eval_steps_per_second": 2.82, "step": 1378 }, { "epoch": 14.0, "grad_norm": 1.7542805671691895, "learning_rate": 4.3e-05, "loss": 0.0963, "step": 1484 }, { "epoch": 14.0, "eval_LOCATION_f1": 0.7662337662337662, "eval_LOCATION_number": 71, "eval_LOCATION_precision": 0.7108433734939759, "eval_LOCATION_recall": 0.8309859154929577, "eval_ORGANIZATION_f1": 0.7397260273972603, "eval_ORGANIZATION_number": 65, "eval_ORGANIZATION_precision": 0.6666666666666666, "eval_ORGANIZATION_recall": 0.8307692307692308, "eval_PERSON_f1": 0.8846153846153846, "eval_PERSON_number": 150, "eval_PERSON_precision": 0.8518518518518519, "eval_PERSON_recall": 0.92, "eval_QUANTITY_f1": 0.8285714285714285, "eval_QUANTITY_number": 33, "eval_QUANTITY_precision": 0.7837837837837838, "eval_QUANTITY_recall": 0.8787878787878788, "eval_TIME_f1": 0.8571428571428571, "eval_TIME_number": 28, "eval_TIME_precision": 0.8571428571428571, "eval_TIME_recall": 0.8571428571428571, "eval_loss": 0.11888094246387482, "eval_overall_accuracy": 0.9619301648884578, "eval_overall_f1": 0.8238482384823849, "eval_overall_precision": 0.7774936061381074, "eval_overall_recall": 0.8760806916426513, "eval_runtime": 1.0551, "eval_samples_per_second": 177.237, "eval_steps_per_second": 2.843, "step": 1484 }, { "epoch": 15.0, "grad_norm": 1.1723530292510986, "learning_rate": 4.25e-05, "loss": 0.0877, "step": 1590 }, { "epoch": 15.0, "eval_LOCATION_f1": 0.7307692307692307, "eval_LOCATION_number": 71, "eval_LOCATION_precision": 0.6705882352941176, "eval_LOCATION_recall": 0.8028169014084507, "eval_ORGANIZATION_f1": 0.728476821192053, "eval_ORGANIZATION_number": 65, "eval_ORGANIZATION_precision": 0.6395348837209303, "eval_ORGANIZATION_recall": 0.8461538461538461, "eval_PERSON_f1": 0.896103896103896, "eval_PERSON_number": 150, "eval_PERSON_precision": 0.8734177215189873, "eval_PERSON_recall": 0.92, "eval_QUANTITY_f1": 0.7297297297297297, "eval_QUANTITY_number": 33, "eval_QUANTITY_precision": 0.6585365853658537, "eval_QUANTITY_recall": 0.8181818181818182, "eval_TIME_f1": 0.8571428571428571, "eval_TIME_number": 28, "eval_TIME_precision": 0.8571428571428571, "eval_TIME_recall": 0.8571428571428571, "eval_loss": 0.13062922656536102, "eval_overall_accuracy": 0.9565955383123181, "eval_overall_f1": 0.8080536912751677, "eval_overall_precision": 0.7562814070351759, "eval_overall_recall": 0.8674351585014409, "eval_runtime": 1.0529, "eval_samples_per_second": 177.608, "eval_steps_per_second": 2.849, "step": 1590 }, { "epoch": 16.0, "grad_norm": 1.6313313245773315, "learning_rate": 4.2e-05, "loss": 0.0856, "step": 1696 }, { "epoch": 16.0, "eval_LOCATION_f1": 0.759493670886076, "eval_LOCATION_number": 71, "eval_LOCATION_precision": 0.6896551724137931, "eval_LOCATION_recall": 0.8450704225352113, "eval_ORGANIZATION_f1": 0.7432432432432433, "eval_ORGANIZATION_number": 65, "eval_ORGANIZATION_precision": 0.6626506024096386, "eval_ORGANIZATION_recall": 0.8461538461538461, "eval_PERSON_f1": 0.8789808917197452, "eval_PERSON_number": 150, "eval_PERSON_precision": 0.8414634146341463, "eval_PERSON_recall": 0.92, "eval_QUANTITY_f1": 0.6923076923076923, "eval_QUANTITY_number": 33, "eval_QUANTITY_precision": 0.6, "eval_QUANTITY_recall": 0.8181818181818182, "eval_TIME_f1": 0.7796610169491526, "eval_TIME_number": 28, "eval_TIME_precision": 0.7419354838709677, "eval_TIME_recall": 0.8214285714285714, "eval_loss": 0.1443340927362442, "eval_overall_accuracy": 0.9546556741028128, "eval_overall_f1": 0.8005284015852047, "eval_overall_precision": 0.7390243902439024, "eval_overall_recall": 0.8731988472622478, "eval_runtime": 1.0604, "eval_samples_per_second": 176.347, "eval_steps_per_second": 2.829, "step": 1696 }, { "epoch": 17.0, "grad_norm": 0.8303266167640686, "learning_rate": 4.15e-05, "loss": 0.0811, "step": 1802 }, { "epoch": 17.0, "eval_LOCATION_f1": 0.7499999999999999, "eval_LOCATION_number": 71, "eval_LOCATION_precision": 0.6741573033707865, "eval_LOCATION_recall": 0.8450704225352113, "eval_ORGANIZATION_f1": 0.7417218543046358, "eval_ORGANIZATION_number": 65, "eval_ORGANIZATION_precision": 0.6511627906976745, "eval_ORGANIZATION_recall": 0.8615384615384616, "eval_PERSON_f1": 0.8810289389067525, "eval_PERSON_number": 150, "eval_PERSON_precision": 0.8509316770186336, "eval_PERSON_recall": 0.9133333333333333, "eval_QUANTITY_f1": 0.7605633802816901, "eval_QUANTITY_number": 33, "eval_QUANTITY_precision": 0.7105263157894737, "eval_QUANTITY_recall": 0.8181818181818182, "eval_TIME_f1": 0.8275862068965518, "eval_TIME_number": 28, "eval_TIME_precision": 0.8, "eval_TIME_recall": 0.8571428571428571, "eval_loss": 0.13409367203712463, "eval_overall_accuracy": 0.9568380213385063, "eval_overall_f1": 0.8095872170439414, "eval_overall_precision": 0.7524752475247525, "eval_overall_recall": 0.8760806916426513, "eval_runtime": 1.0536, "eval_samples_per_second": 177.488, "eval_steps_per_second": 2.847, "step": 1802 }, { "epoch": 18.0, "grad_norm": 0.8499922752380371, "learning_rate": 4.1e-05, "loss": 0.0779, "step": 1908 }, { "epoch": 18.0, "eval_LOCATION_f1": 0.7421383647798742, "eval_LOCATION_number": 71, "eval_LOCATION_precision": 0.6704545454545454, "eval_LOCATION_recall": 0.8309859154929577, "eval_ORGANIZATION_f1": 0.7402597402597403, "eval_ORGANIZATION_number": 65, "eval_ORGANIZATION_precision": 0.6404494382022472, "eval_ORGANIZATION_recall": 0.8769230769230769, "eval_PERSON_f1": 0.8945686900958466, "eval_PERSON_number": 150, "eval_PERSON_precision": 0.8588957055214724, "eval_PERSON_recall": 0.9333333333333333, "eval_QUANTITY_f1": 0.6842105263157895, "eval_QUANTITY_number": 33, "eval_QUANTITY_precision": 0.6046511627906976, "eval_QUANTITY_recall": 0.7878787878787878, "eval_TIME_f1": 0.7540983606557378, "eval_TIME_number": 28, "eval_TIME_precision": 0.696969696969697, "eval_TIME_recall": 0.8214285714285714, "eval_loss": 0.14901402592658997, "eval_overall_accuracy": 0.9529582929194956, "eval_overall_f1": 0.799475753604194, "eval_overall_precision": 0.7331730769230769, "eval_overall_recall": 0.8789625360230547, "eval_runtime": 1.0609, "eval_samples_per_second": 176.262, "eval_steps_per_second": 2.828, "step": 1908 }, { "epoch": 19.0, "grad_norm": 1.0185816287994385, "learning_rate": 4.05e-05, "loss": 0.0748, "step": 2014 }, { "epoch": 19.0, "eval_LOCATION_f1": 0.7516778523489933, "eval_LOCATION_number": 71, "eval_LOCATION_precision": 0.717948717948718, "eval_LOCATION_recall": 0.7887323943661971, "eval_ORGANIZATION_f1": 0.7534246575342466, "eval_ORGANIZATION_number": 65, "eval_ORGANIZATION_precision": 0.6790123456790124, "eval_ORGANIZATION_recall": 0.8461538461538461, "eval_PERSON_f1": 0.8990228013029316, "eval_PERSON_number": 150, "eval_PERSON_precision": 0.8789808917197452, "eval_PERSON_recall": 0.92, "eval_QUANTITY_f1": 0.8285714285714285, "eval_QUANTITY_number": 33, "eval_QUANTITY_precision": 0.7837837837837838, "eval_QUANTITY_recall": 0.8787878787878788, "eval_TIME_f1": 0.8571428571428571, "eval_TIME_number": 28, "eval_TIME_precision": 0.8571428571428571, "eval_TIME_recall": 0.8571428571428571, "eval_loss": 0.12444239854812622, "eval_overall_accuracy": 0.9624151309408342, "eval_overall_f1": 0.8296703296703296, "eval_overall_precision": 0.7926509186351706, "eval_overall_recall": 0.8703170028818443, "eval_runtime": 1.0625, "eval_samples_per_second": 176.0, "eval_steps_per_second": 2.824, "step": 2014 }, { "epoch": 20.0, "grad_norm": 1.3024747371673584, "learning_rate": 4e-05, "loss": 0.073, "step": 2120 }, { "epoch": 20.0, "eval_LOCATION_f1": 0.7712418300653594, "eval_LOCATION_number": 71, "eval_LOCATION_precision": 0.7195121951219512, "eval_LOCATION_recall": 0.8309859154929577, "eval_ORGANIZATION_f1": 0.7832167832167831, "eval_ORGANIZATION_number": 65, "eval_ORGANIZATION_precision": 0.717948717948718, "eval_ORGANIZATION_recall": 0.8615384615384616, "eval_PERSON_f1": 0.896103896103896, "eval_PERSON_number": 150, "eval_PERSON_precision": 0.8734177215189873, "eval_PERSON_recall": 0.92, "eval_QUANTITY_f1": 0.8450704225352113, "eval_QUANTITY_number": 33, "eval_QUANTITY_precision": 0.7894736842105263, "eval_QUANTITY_recall": 0.9090909090909091, "eval_TIME_f1": 0.888888888888889, "eval_TIME_number": 28, "eval_TIME_precision": 0.9230769230769231, "eval_TIME_recall": 0.8571428571428571, "eval_loss": 0.12432579696178436, "eval_overall_accuracy": 0.9645974781765276, "eval_overall_f1": 0.8422496570644719, "eval_overall_precision": 0.8036649214659686, "eval_overall_recall": 0.8847262247838616, "eval_runtime": 1.0561, "eval_samples_per_second": 177.074, "eval_steps_per_second": 2.841, "step": 2120 }, { "epoch": 21.0, "grad_norm": 0.8448452949523926, "learning_rate": 3.9500000000000005e-05, "loss": 0.0694, "step": 2226 }, { "epoch": 21.0, "eval_LOCATION_f1": 0.7421383647798742, "eval_LOCATION_number": 71, "eval_LOCATION_precision": 0.6704545454545454, "eval_LOCATION_recall": 0.8309859154929577, "eval_ORGANIZATION_f1": 0.7073170731707317, "eval_ORGANIZATION_number": 65, "eval_ORGANIZATION_precision": 0.5858585858585859, "eval_ORGANIZATION_recall": 0.8923076923076924, "eval_PERSON_f1": 0.9096774193548387, "eval_PERSON_number": 150, "eval_PERSON_precision": 0.88125, "eval_PERSON_recall": 0.94, "eval_QUANTITY_f1": 0.675, "eval_QUANTITY_number": 33, "eval_QUANTITY_precision": 0.574468085106383, "eval_QUANTITY_recall": 0.8181818181818182, "eval_TIME_f1": 0.8070175438596492, "eval_TIME_number": 28, "eval_TIME_precision": 0.7931034482758621, "eval_TIME_recall": 0.8214285714285714, "eval_loss": 0.1571197509765625, "eval_overall_accuracy": 0.9522308438409312, "eval_overall_f1": 0.8, "eval_overall_precision": 0.7281323877068558, "eval_overall_recall": 0.8876080691642652, "eval_runtime": 1.0507, "eval_samples_per_second": 177.981, "eval_steps_per_second": 2.855, "step": 2226 }, { "epoch": 22.0, "grad_norm": 0.6756930947303772, "learning_rate": 3.9000000000000006e-05, "loss": 0.0655, "step": 2332 }, { "epoch": 22.0, "eval_LOCATION_f1": 0.7643312101910827, "eval_LOCATION_number": 71, "eval_LOCATION_precision": 0.6976744186046512, "eval_LOCATION_recall": 0.8450704225352113, "eval_ORGANIZATION_f1": 0.738255033557047, "eval_ORGANIZATION_number": 65, "eval_ORGANIZATION_precision": 0.6547619047619048, "eval_ORGANIZATION_recall": 0.8461538461538461, "eval_PERSON_f1": 0.8802588996763754, "eval_PERSON_number": 150, "eval_PERSON_precision": 0.8553459119496856, "eval_PERSON_recall": 0.9066666666666666, "eval_QUANTITY_f1": 0.7397260273972603, "eval_QUANTITY_number": 33, "eval_QUANTITY_precision": 0.675, "eval_QUANTITY_recall": 0.8181818181818182, "eval_TIME_f1": 0.8727272727272727, "eval_TIME_number": 28, "eval_TIME_precision": 0.8888888888888888, "eval_TIME_recall": 0.8571428571428571, "eval_loss": 0.1396949291229248, "eval_overall_accuracy": 0.9585354025218235, "eval_overall_f1": 0.8129205921938089, "eval_overall_precision": 0.7626262626262627, "eval_overall_recall": 0.8703170028818443, "eval_runtime": 1.046, "eval_samples_per_second": 178.78, "eval_steps_per_second": 2.868, "step": 2332 }, { "epoch": 23.0, "grad_norm": 1.0572928190231323, "learning_rate": 3.85e-05, "loss": 0.0623, "step": 2438 }, { "epoch": 23.0, "eval_LOCATION_f1": 0.7741935483870968, "eval_LOCATION_number": 71, "eval_LOCATION_precision": 0.7142857142857143, "eval_LOCATION_recall": 0.8450704225352113, "eval_ORGANIZATION_f1": 0.7619047619047619, "eval_ORGANIZATION_number": 65, "eval_ORGANIZATION_precision": 0.6829268292682927, "eval_ORGANIZATION_recall": 0.8615384615384616, "eval_PERSON_f1": 0.896103896103896, "eval_PERSON_number": 150, "eval_PERSON_precision": 0.8734177215189873, "eval_PERSON_recall": 0.92, "eval_QUANTITY_f1": 0.7466666666666666, "eval_QUANTITY_number": 33, "eval_QUANTITY_precision": 0.6666666666666666, "eval_QUANTITY_recall": 0.8484848484848485, "eval_TIME_f1": 0.8070175438596492, "eval_TIME_number": 28, "eval_TIME_precision": 0.7931034482758621, "eval_TIME_recall": 0.8214285714285714, "eval_loss": 0.13910295069217682, "eval_overall_accuracy": 0.9590203685741998, "eval_overall_f1": 0.8221024258760108, "eval_overall_precision": 0.7721518987341772, "eval_overall_recall": 0.8789625360230547, "eval_runtime": 1.0543, "eval_samples_per_second": 177.367, "eval_steps_per_second": 2.845, "step": 2438 }, { "epoch": 24.0, "grad_norm": 0.8183007836341858, "learning_rate": 3.8e-05, "loss": 0.0588, "step": 2544 }, { "epoch": 24.0, "eval_LOCATION_f1": 0.7374999999999999, "eval_LOCATION_number": 71, "eval_LOCATION_precision": 0.6629213483146067, "eval_LOCATION_recall": 0.8309859154929577, "eval_ORGANIZATION_f1": 0.7320261437908497, "eval_ORGANIZATION_number": 65, "eval_ORGANIZATION_precision": 0.6363636363636364, "eval_ORGANIZATION_recall": 0.8615384615384616, "eval_PERSON_f1": 0.896103896103896, "eval_PERSON_number": 150, "eval_PERSON_precision": 0.8734177215189873, "eval_PERSON_recall": 0.92, "eval_QUANTITY_f1": 0.7297297297297297, "eval_QUANTITY_number": 33, "eval_QUANTITY_precision": 0.6585365853658537, "eval_QUANTITY_recall": 0.8181818181818182, "eval_TIME_f1": 0.8727272727272727, "eval_TIME_number": 28, "eval_TIME_precision": 0.8888888888888888, "eval_TIME_recall": 0.8571428571428571, "eval_loss": 0.14739328622817993, "eval_overall_accuracy": 0.9575654704170709, "eval_overall_f1": 0.8106666666666668, "eval_overall_precision": 0.7543424317617866, "eval_overall_recall": 0.8760806916426513, "eval_runtime": 1.0524, "eval_samples_per_second": 177.697, "eval_steps_per_second": 2.851, "step": 2544 }, { "epoch": 25.0, "grad_norm": 1.561627984046936, "learning_rate": 3.7500000000000003e-05, "loss": 0.0602, "step": 2650 }, { "epoch": 25.0, "eval_LOCATION_f1": 0.751592356687898, "eval_LOCATION_number": 71, "eval_LOCATION_precision": 0.686046511627907, "eval_LOCATION_recall": 0.8309859154929577, "eval_ORGANIZATION_f1": 0.7402597402597403, "eval_ORGANIZATION_number": 65, "eval_ORGANIZATION_precision": 0.6404494382022472, "eval_ORGANIZATION_recall": 0.8769230769230769, "eval_PERSON_f1": 0.9032258064516129, "eval_PERSON_number": 150, "eval_PERSON_precision": 0.875, "eval_PERSON_recall": 0.9333333333333333, "eval_QUANTITY_f1": 0.7200000000000001, "eval_QUANTITY_number": 33, "eval_QUANTITY_precision": 0.6428571428571429, "eval_QUANTITY_recall": 0.8181818181818182, "eval_TIME_f1": 0.8363636363636364, "eval_TIME_number": 28, "eval_TIME_precision": 0.8518518518518519, "eval_TIME_recall": 0.8214285714285714, "eval_loss": 0.14714130759239197, "eval_overall_accuracy": 0.95635305528613, "eval_overall_f1": 0.8149134487350199, "eval_overall_precision": 0.7574257425742574, "eval_overall_recall": 0.8818443804034583, "eval_runtime": 1.0522, "eval_samples_per_second": 177.728, "eval_steps_per_second": 2.851, "step": 2650 }, { "epoch": 26.0, "grad_norm": 0.37913623452186584, "learning_rate": 3.7e-05, "loss": 0.0543, "step": 2756 }, { "epoch": 26.0, "eval_LOCATION_f1": 0.7547169811320754, "eval_LOCATION_number": 71, "eval_LOCATION_precision": 0.6818181818181818, "eval_LOCATION_recall": 0.8450704225352113, "eval_ORGANIZATION_f1": 0.757142857142857, "eval_ORGANIZATION_number": 65, "eval_ORGANIZATION_precision": 0.7066666666666667, "eval_ORGANIZATION_recall": 0.8153846153846154, "eval_PERSON_f1": 0.8846153846153846, "eval_PERSON_number": 150, "eval_PERSON_precision": 0.8518518518518519, "eval_PERSON_recall": 0.92, "eval_QUANTITY_f1": 0.7179487179487178, "eval_QUANTITY_number": 33, "eval_QUANTITY_precision": 0.6222222222222222, "eval_QUANTITY_recall": 0.8484848484848485, "eval_TIME_f1": 0.793103448275862, "eval_TIME_number": 28, "eval_TIME_precision": 0.7666666666666667, "eval_TIME_recall": 0.8214285714285714, "eval_loss": 0.1607346087694168, "eval_overall_accuracy": 0.9561105722599418, "eval_overall_f1": 0.8085676037483265, "eval_overall_precision": 0.755, "eval_overall_recall": 0.8703170028818443, "eval_runtime": 1.0494, "eval_samples_per_second": 178.198, "eval_steps_per_second": 2.859, "step": 2756 }, { "epoch": 27.0, "grad_norm": 1.6127158403396606, "learning_rate": 3.65e-05, "loss": 0.0555, "step": 2862 }, { "epoch": 27.0, "eval_LOCATION_f1": 0.7712418300653594, "eval_LOCATION_number": 71, "eval_LOCATION_precision": 0.7195121951219512, "eval_LOCATION_recall": 0.8309859154929577, "eval_ORGANIZATION_f1": 0.7368421052631579, "eval_ORGANIZATION_number": 65, "eval_ORGANIZATION_precision": 0.6436781609195402, "eval_ORGANIZATION_recall": 0.8615384615384616, "eval_PERSON_f1": 0.9055374592833875, "eval_PERSON_number": 150, "eval_PERSON_precision": 0.8853503184713376, "eval_PERSON_recall": 0.9266666666666666, "eval_QUANTITY_f1": 0.7200000000000001, "eval_QUANTITY_number": 33, "eval_QUANTITY_precision": 0.6428571428571429, "eval_QUANTITY_recall": 0.8181818181818182, "eval_TIME_f1": 0.8214285714285714, "eval_TIME_number": 28, "eval_TIME_precision": 0.8214285714285714, "eval_TIME_recall": 0.8214285714285714, "eval_loss": 0.14687323570251465, "eval_overall_accuracy": 0.9580504364694471, "eval_overall_f1": 0.8183041722745625, "eval_overall_precision": 0.7676767676767676, "eval_overall_recall": 0.8760806916426513, "eval_runtime": 1.0568, "eval_samples_per_second": 176.954, "eval_steps_per_second": 2.839, "step": 2862 }, { "epoch": 28.0, "grad_norm": 1.0716761350631714, "learning_rate": 3.6e-05, "loss": 0.0507, "step": 2968 }, { "epoch": 28.0, "eval_LOCATION_f1": 0.7682119205298014, "eval_LOCATION_number": 71, "eval_LOCATION_precision": 0.725, "eval_LOCATION_recall": 0.8169014084507042, "eval_ORGANIZATION_f1": 0.7295597484276729, "eval_ORGANIZATION_number": 65, "eval_ORGANIZATION_precision": 0.6170212765957447, "eval_ORGANIZATION_recall": 0.8923076923076924, "eval_PERSON_f1": 0.9032258064516129, "eval_PERSON_number": 150, "eval_PERSON_precision": 0.875, "eval_PERSON_recall": 0.9333333333333333, "eval_QUANTITY_f1": 0.7027027027027027, "eval_QUANTITY_number": 33, "eval_QUANTITY_precision": 0.6341463414634146, "eval_QUANTITY_recall": 0.7878787878787878, "eval_TIME_f1": 0.8727272727272727, "eval_TIME_number": 28, "eval_TIME_precision": 0.8888888888888888, "eval_TIME_recall": 0.8571428571428571, "eval_loss": 0.15819337964057922, "eval_overall_accuracy": 0.9546556741028128, "eval_overall_f1": 0.8170894526034712, "eval_overall_precision": 0.7611940298507462, "eval_overall_recall": 0.8818443804034583, "eval_runtime": 1.0494, "eval_samples_per_second": 178.203, "eval_steps_per_second": 2.859, "step": 2968 }, { "epoch": 29.0, "grad_norm": 0.6914520263671875, "learning_rate": 3.55e-05, "loss": 0.0512, "step": 3074 }, { "epoch": 29.0, "eval_LOCATION_f1": 0.7682119205298014, "eval_LOCATION_number": 71, "eval_LOCATION_precision": 0.725, "eval_LOCATION_recall": 0.8169014084507042, "eval_ORGANIZATION_f1": 0.686046511627907, "eval_ORGANIZATION_number": 65, "eval_ORGANIZATION_precision": 0.5514018691588785, "eval_ORGANIZATION_recall": 0.9076923076923077, "eval_PERSON_f1": 0.8932038834951457, "eval_PERSON_number": 150, "eval_PERSON_precision": 0.8679245283018868, "eval_PERSON_recall": 0.92, "eval_QUANTITY_f1": 0.7397260273972603, "eval_QUANTITY_number": 33, "eval_QUANTITY_precision": 0.675, "eval_QUANTITY_recall": 0.8181818181818182, "eval_TIME_f1": 0.8421052631578947, "eval_TIME_number": 28, "eval_TIME_precision": 0.8275862068965517, "eval_TIME_recall": 0.8571428571428571, "eval_loss": 0.16121703386306763, "eval_overall_accuracy": 0.954898157129001, "eval_overall_f1": 0.8031496062992126, "eval_overall_precision": 0.7373493975903614, "eval_overall_recall": 0.8818443804034583, "eval_runtime": 1.0541, "eval_samples_per_second": 177.397, "eval_steps_per_second": 2.846, "step": 3074 }, { "epoch": 30.0, "grad_norm": 0.9099843502044678, "learning_rate": 3.5e-05, "loss": 0.047, "step": 3180 }, { "epoch": 30.0, "eval_LOCATION_f1": 0.7894736842105262, "eval_LOCATION_number": 71, "eval_LOCATION_precision": 0.7407407407407407, "eval_LOCATION_recall": 0.8450704225352113, "eval_ORGANIZATION_f1": 0.7261146496815286, "eval_ORGANIZATION_number": 65, "eval_ORGANIZATION_precision": 0.6195652173913043, "eval_ORGANIZATION_recall": 0.8769230769230769, "eval_PERSON_f1": 0.9078947368421053, "eval_PERSON_number": 150, "eval_PERSON_precision": 0.8961038961038961, "eval_PERSON_recall": 0.92, "eval_QUANTITY_f1": 0.7567567567567567, "eval_QUANTITY_number": 33, "eval_QUANTITY_precision": 0.6829268292682927, "eval_QUANTITY_recall": 0.8484848484848485, "eval_TIME_f1": 0.8363636363636364, "eval_TIME_number": 28, "eval_TIME_precision": 0.8518518518518519, "eval_TIME_recall": 0.8214285714285714, "eval_loss": 0.1513780951499939, "eval_overall_accuracy": 0.9599903006789525, "eval_overall_f1": 0.8247978436657682, "eval_overall_precision": 0.7746835443037975, "eval_overall_recall": 0.8818443804034583, "eval_runtime": 1.1364, "eval_samples_per_second": 164.552, "eval_steps_per_second": 2.64, "step": 3180 }, { "epoch": 31.0, "grad_norm": 0.5555219054222107, "learning_rate": 3.45e-05, "loss": 0.0466, "step": 3286 }, { "epoch": 31.0, "eval_LOCATION_f1": 0.7483870967741935, "eval_LOCATION_number": 71, "eval_LOCATION_precision": 0.6904761904761905, "eval_LOCATION_recall": 0.8169014084507042, "eval_ORGANIZATION_f1": 0.7516778523489933, "eval_ORGANIZATION_number": 65, "eval_ORGANIZATION_precision": 0.6666666666666666, "eval_ORGANIZATION_recall": 0.8615384615384616, "eval_PERSON_f1": 0.9025974025974027, "eval_PERSON_number": 150, "eval_PERSON_precision": 0.879746835443038, "eval_PERSON_recall": 0.9266666666666666, "eval_QUANTITY_f1": 0.7671232876712328, "eval_QUANTITY_number": 33, "eval_QUANTITY_precision": 0.7, "eval_QUANTITY_recall": 0.8484848484848485, "eval_TIME_f1": 0.9090909090909091, "eval_TIME_number": 28, "eval_TIME_precision": 0.9259259259259259, "eval_TIME_recall": 0.8928571428571429, "eval_loss": 0.15754006803035736, "eval_overall_accuracy": 0.9582929194956353, "eval_overall_f1": 0.827027027027027, "eval_overall_precision": 0.7786259541984732, "eval_overall_recall": 0.8818443804034583, "eval_runtime": 1.0609, "eval_samples_per_second": 176.262, "eval_steps_per_second": 2.828, "step": 3286 }, { "epoch": 32.0, "grad_norm": 0.21328239142894745, "learning_rate": 3.4000000000000007e-05, "loss": 0.0449, "step": 3392 }, { "epoch": 32.0, "eval_LOCATION_f1": 0.7792207792207793, "eval_LOCATION_number": 71, "eval_LOCATION_precision": 0.7228915662650602, "eval_LOCATION_recall": 0.8450704225352113, "eval_ORGANIZATION_f1": 0.7295597484276729, "eval_ORGANIZATION_number": 65, "eval_ORGANIZATION_precision": 0.6170212765957447, "eval_ORGANIZATION_recall": 0.8923076923076924, "eval_PERSON_f1": 0.8867313915857605, "eval_PERSON_number": 150, "eval_PERSON_precision": 0.8616352201257862, "eval_PERSON_recall": 0.9133333333333333, "eval_QUANTITY_f1": 0.7397260273972603, "eval_QUANTITY_number": 33, "eval_QUANTITY_precision": 0.675, "eval_QUANTITY_recall": 0.8181818181818182, "eval_TIME_f1": 0.888888888888889, "eval_TIME_number": 28, "eval_TIME_precision": 0.9230769230769231, "eval_TIME_recall": 0.8571428571428571, "eval_loss": 0.17104628682136536, "eval_overall_accuracy": 0.9568380213385063, "eval_overall_f1": 0.8170894526034712, "eval_overall_precision": 0.7611940298507462, "eval_overall_recall": 0.8818443804034583, "eval_runtime": 1.2405, "eval_samples_per_second": 150.742, "eval_steps_per_second": 2.418, "step": 3392 }, { "epoch": 33.0, "grad_norm": 0.6623594760894775, "learning_rate": 3.35e-05, "loss": 0.0414, "step": 3498 }, { "epoch": 33.0, "eval_LOCATION_f1": 0.7532467532467533, "eval_LOCATION_number": 71, "eval_LOCATION_precision": 0.6987951807228916, "eval_LOCATION_recall": 0.8169014084507042, "eval_ORGANIZATION_f1": 0.726027397260274, "eval_ORGANIZATION_number": 65, "eval_ORGANIZATION_precision": 0.654320987654321, "eval_ORGANIZATION_recall": 0.8153846153846154, "eval_PERSON_f1": 0.8831168831168831, "eval_PERSON_number": 150, "eval_PERSON_precision": 0.8607594936708861, "eval_PERSON_recall": 0.9066666666666666, "eval_QUANTITY_f1": 0.7945205479452054, "eval_QUANTITY_number": 33, "eval_QUANTITY_precision": 0.725, "eval_QUANTITY_recall": 0.8787878787878788, "eval_TIME_f1": 0.888888888888889, "eval_TIME_number": 28, "eval_TIME_precision": 0.9230769230769231, "eval_TIME_recall": 0.8571428571428571, "eval_loss": 0.1599014401435852, "eval_overall_accuracy": 0.9580504364694471, "eval_overall_f1": 0.8163265306122449, "eval_overall_precision": 0.7731958762886598, "eval_overall_recall": 0.8645533141210374, "eval_runtime": 1.051, "eval_samples_per_second": 177.926, "eval_steps_per_second": 2.854, "step": 3498 }, { "epoch": 34.0, "grad_norm": 0.7860094308853149, "learning_rate": 3.3e-05, "loss": 0.0425, "step": 3604 }, { "epoch": 34.0, "eval_LOCATION_f1": 0.7662337662337662, "eval_LOCATION_number": 71, "eval_LOCATION_precision": 0.7108433734939759, "eval_LOCATION_recall": 0.8309859154929577, "eval_ORGANIZATION_f1": 0.7516778523489933, "eval_ORGANIZATION_number": 65, "eval_ORGANIZATION_precision": 0.6666666666666666, "eval_ORGANIZATION_recall": 0.8615384615384616, "eval_PERSON_f1": 0.8692810457516339, "eval_PERSON_number": 150, "eval_PERSON_precision": 0.8525641025641025, "eval_PERSON_recall": 0.8866666666666667, "eval_QUANTITY_f1": 0.7671232876712328, "eval_QUANTITY_number": 33, "eval_QUANTITY_precision": 0.7, "eval_QUANTITY_recall": 0.8484848484848485, "eval_TIME_f1": 0.8275862068965518, "eval_TIME_number": 28, "eval_TIME_precision": 0.8, "eval_TIME_recall": 0.8571428571428571, "eval_loss": 0.1540924459695816, "eval_overall_accuracy": 0.9590203685741998, "eval_overall_f1": 0.8108108108108107, "eval_overall_precision": 0.7633587786259542, "eval_overall_recall": 0.8645533141210374, "eval_runtime": 1.0533, "eval_samples_per_second": 177.543, "eval_steps_per_second": 2.848, "step": 3604 }, { "epoch": 35.0, "grad_norm": 0.8806631565093994, "learning_rate": 3.2500000000000004e-05, "loss": 0.0389, "step": 3710 }, { "epoch": 35.0, "eval_LOCATION_f1": 0.729559748427673, "eval_LOCATION_number": 71, "eval_LOCATION_precision": 0.6590909090909091, "eval_LOCATION_recall": 0.8169014084507042, "eval_ORGANIZATION_f1": 0.7388535031847134, "eval_ORGANIZATION_number": 65, "eval_ORGANIZATION_precision": 0.6304347826086957, "eval_ORGANIZATION_recall": 0.8923076923076924, "eval_PERSON_f1": 0.8932038834951457, "eval_PERSON_number": 150, "eval_PERSON_precision": 0.8679245283018868, "eval_PERSON_recall": 0.92, "eval_QUANTITY_f1": 0.736842105263158, "eval_QUANTITY_number": 33, "eval_QUANTITY_precision": 0.6511627906976745, "eval_QUANTITY_recall": 0.8484848484848485, "eval_TIME_f1": 0.7419354838709677, "eval_TIME_number": 28, "eval_TIME_precision": 0.6764705882352942, "eval_TIME_recall": 0.8214285714285714, "eval_loss": 0.19029554724693298, "eval_overall_accuracy": 0.9522308438409312, "eval_overall_f1": 0.799475753604194, "eval_overall_precision": 0.7331730769230769, "eval_overall_recall": 0.8789625360230547, "eval_runtime": 1.0532, "eval_samples_per_second": 177.547, "eval_steps_per_second": 2.848, "step": 3710 }, { "epoch": 36.0, "grad_norm": 1.029179334640503, "learning_rate": 3.2000000000000005e-05, "loss": 0.0389, "step": 3816 }, { "epoch": 36.0, "eval_LOCATION_f1": 0.7662337662337662, "eval_LOCATION_number": 71, "eval_LOCATION_precision": 0.7108433734939759, "eval_LOCATION_recall": 0.8309859154929577, "eval_ORGANIZATION_f1": 0.7169811320754718, "eval_ORGANIZATION_number": 65, "eval_ORGANIZATION_precision": 0.6063829787234043, "eval_ORGANIZATION_recall": 0.8769230769230769, "eval_PERSON_f1": 0.90032154340836, "eval_PERSON_number": 150, "eval_PERSON_precision": 0.8695652173913043, "eval_PERSON_recall": 0.9333333333333333, "eval_QUANTITY_f1": 0.7297297297297297, "eval_QUANTITY_number": 33, "eval_QUANTITY_precision": 0.6585365853658537, "eval_QUANTITY_recall": 0.8181818181818182, "eval_TIME_f1": 0.888888888888889, "eval_TIME_number": 28, "eval_TIME_precision": 0.9230769230769231, "eval_TIME_recall": 0.8571428571428571, "eval_loss": 0.17856962978839874, "eval_overall_accuracy": 0.9568380213385063, "eval_overall_f1": 0.8164893617021276, "eval_overall_precision": 0.7580246913580246, "eval_overall_recall": 0.8847262247838616, "eval_runtime": 1.0617, "eval_samples_per_second": 176.128, "eval_steps_per_second": 2.826, "step": 3816 }, { "epoch": 37.0, "grad_norm": 1.0397053956985474, "learning_rate": 3.15e-05, "loss": 0.0369, "step": 3922 }, { "epoch": 37.0, "eval_LOCATION_f1": 0.725, "eval_LOCATION_number": 71, "eval_LOCATION_precision": 0.651685393258427, "eval_LOCATION_recall": 0.8169014084507042, "eval_ORGANIZATION_f1": 0.7341772151898733, "eval_ORGANIZATION_number": 65, "eval_ORGANIZATION_precision": 0.6236559139784946, "eval_ORGANIZATION_recall": 0.8923076923076924, "eval_PERSON_f1": 0.8974358974358974, "eval_PERSON_number": 150, "eval_PERSON_precision": 0.8641975308641975, "eval_PERSON_recall": 0.9333333333333333, "eval_QUANTITY_f1": 0.7088607594936709, "eval_QUANTITY_number": 33, "eval_QUANTITY_precision": 0.6086956521739131, "eval_QUANTITY_recall": 0.8484848484848485, "eval_TIME_f1": 0.8771929824561403, "eval_TIME_number": 28, "eval_TIME_precision": 0.8620689655172413, "eval_TIME_recall": 0.8928571428571429, "eval_loss": 0.20172427594661713, "eval_overall_accuracy": 0.9529582929194956, "eval_overall_f1": 0.8067885117493473, "eval_overall_precision": 0.7374701670644391, "eval_overall_recall": 0.8904899135446686, "eval_runtime": 1.0533, "eval_samples_per_second": 177.542, "eval_steps_per_second": 2.848, "step": 3922 }, { "epoch": 38.0, "grad_norm": 1.4343793392181396, "learning_rate": 3.1e-05, "loss": 0.0362, "step": 4028 }, { "epoch": 38.0, "eval_LOCATION_f1": 0.7612903225806451, "eval_LOCATION_number": 71, "eval_LOCATION_precision": 0.7023809523809523, "eval_LOCATION_recall": 0.8309859154929577, "eval_ORGANIZATION_f1": 0.7464788732394366, "eval_ORGANIZATION_number": 65, "eval_ORGANIZATION_precision": 0.6883116883116883, "eval_ORGANIZATION_recall": 0.8153846153846154, "eval_PERSON_f1": 0.8838709677419355, "eval_PERSON_number": 150, "eval_PERSON_precision": 0.85625, "eval_PERSON_recall": 0.9133333333333333, "eval_QUANTITY_f1": 0.7397260273972603, "eval_QUANTITY_number": 33, "eval_QUANTITY_precision": 0.675, "eval_QUANTITY_recall": 0.8181818181818182, "eval_TIME_f1": 0.8421052631578947, "eval_TIME_number": 28, "eval_TIME_precision": 0.8275862068965517, "eval_TIME_recall": 0.8571428571428571, "eval_loss": 0.1783708781003952, "eval_overall_accuracy": 0.9580504364694471, "eval_overall_f1": 0.8141112618724559, "eval_overall_precision": 0.7692307692307693, "eval_overall_recall": 0.8645533141210374, "eval_runtime": 1.0559, "eval_samples_per_second": 177.107, "eval_steps_per_second": 2.841, "step": 4028 }, { "epoch": 39.0, "grad_norm": 0.2365792840719223, "learning_rate": 3.05e-05, "loss": 0.034, "step": 4134 }, { "epoch": 39.0, "eval_LOCATION_f1": 0.7894736842105262, "eval_LOCATION_number": 71, "eval_LOCATION_precision": 0.7407407407407407, "eval_LOCATION_recall": 0.8450704225352113, "eval_ORGANIZATION_f1": 0.76, "eval_ORGANIZATION_number": 65, "eval_ORGANIZATION_precision": 0.6705882352941176, "eval_ORGANIZATION_recall": 0.8769230769230769, "eval_PERSON_f1": 0.8867313915857605, "eval_PERSON_number": 150, "eval_PERSON_precision": 0.8616352201257862, "eval_PERSON_recall": 0.9133333333333333, "eval_QUANTITY_f1": 0.7397260273972603, "eval_QUANTITY_number": 33, "eval_QUANTITY_precision": 0.675, "eval_QUANTITY_recall": 0.8181818181818182, "eval_TIME_f1": 0.888888888888889, "eval_TIME_number": 28, "eval_TIME_precision": 0.9230769230769231, "eval_TIME_recall": 0.8571428571428571, "eval_loss": 0.17429344356060028, "eval_overall_accuracy": 0.9604752667313288, "eval_overall_f1": 0.8265582655826558, "eval_overall_precision": 0.7800511508951407, "eval_overall_recall": 0.8789625360230547, "eval_runtime": 1.0434, "eval_samples_per_second": 179.224, "eval_steps_per_second": 2.875, "step": 4134 }, { "epoch": 40.0, "grad_norm": 1.8789796829223633, "learning_rate": 3e-05, "loss": 0.0342, "step": 4240 }, { "epoch": 40.0, "eval_LOCATION_f1": 0.7894736842105262, "eval_LOCATION_number": 71, "eval_LOCATION_precision": 0.7407407407407407, "eval_LOCATION_recall": 0.8450704225352113, "eval_ORGANIZATION_f1": 0.7702702702702702, "eval_ORGANIZATION_number": 65, "eval_ORGANIZATION_precision": 0.6867469879518072, "eval_ORGANIZATION_recall": 0.8769230769230769, "eval_PERSON_f1": 0.8938906752411575, "eval_PERSON_number": 150, "eval_PERSON_precision": 0.8633540372670807, "eval_PERSON_recall": 0.9266666666666666, "eval_QUANTITY_f1": 0.7777777777777778, "eval_QUANTITY_number": 33, "eval_QUANTITY_precision": 0.717948717948718, "eval_QUANTITY_recall": 0.8484848484848485, "eval_TIME_f1": 0.8571428571428571, "eval_TIME_number": 28, "eval_TIME_precision": 0.8571428571428571, "eval_TIME_recall": 0.8571428571428571, "eval_loss": 0.1677405685186386, "eval_overall_accuracy": 0.9624151309408342, "eval_overall_f1": 0.8335588633288228, "eval_overall_precision": 0.7857142857142857, "eval_overall_recall": 0.8876080691642652, "eval_runtime": 1.0476, "eval_samples_per_second": 178.511, "eval_steps_per_second": 2.864, "step": 4240 }, { "epoch": 41.0, "grad_norm": 0.3054400086402893, "learning_rate": 2.95e-05, "loss": 0.0325, "step": 4346 }, { "epoch": 41.0, "eval_LOCATION_f1": 0.759493670886076, "eval_LOCATION_number": 71, "eval_LOCATION_precision": 0.6896551724137931, "eval_LOCATION_recall": 0.8450704225352113, "eval_ORGANIZATION_f1": 0.7581699346405228, "eval_ORGANIZATION_number": 65, "eval_ORGANIZATION_precision": 0.6590909090909091, "eval_ORGANIZATION_recall": 0.8923076923076924, "eval_PERSON_f1": 0.887459807073955, "eval_PERSON_number": 150, "eval_PERSON_precision": 0.8571428571428571, "eval_PERSON_recall": 0.92, "eval_QUANTITY_f1": 0.7466666666666666, "eval_QUANTITY_number": 33, "eval_QUANTITY_precision": 0.6666666666666666, "eval_QUANTITY_recall": 0.8484848484848485, "eval_TIME_f1": 0.8421052631578947, "eval_TIME_number": 28, "eval_TIME_precision": 0.8275862068965517, "eval_TIME_recall": 0.8571428571428571, "eval_loss": 0.19720277190208435, "eval_overall_accuracy": 0.9570805043646945, "eval_overall_f1": 0.816976127320955, "eval_overall_precision": 0.7567567567567568, "eval_overall_recall": 0.8876080691642652, "eval_runtime": 1.0527, "eval_samples_per_second": 177.643, "eval_steps_per_second": 2.85, "step": 4346 }, { "epoch": 42.0, "grad_norm": 0.7684195637702942, "learning_rate": 2.9e-05, "loss": 0.0304, "step": 4452 }, { "epoch": 42.0, "eval_LOCATION_f1": 0.7894736842105262, "eval_LOCATION_number": 71, "eval_LOCATION_precision": 0.7407407407407407, "eval_LOCATION_recall": 0.8450704225352113, "eval_ORGANIZATION_f1": 0.7448275862068966, "eval_ORGANIZATION_number": 65, "eval_ORGANIZATION_precision": 0.675, "eval_ORGANIZATION_recall": 0.8307692307692308, "eval_PERSON_f1": 0.8838709677419355, "eval_PERSON_number": 150, "eval_PERSON_precision": 0.85625, "eval_PERSON_recall": 0.9133333333333333, "eval_QUANTITY_f1": 0.7297297297297297, "eval_QUANTITY_number": 33, "eval_QUANTITY_precision": 0.6585365853658537, "eval_QUANTITY_recall": 0.8181818181818182, "eval_TIME_f1": 0.8421052631578947, "eval_TIME_number": 28, "eval_TIME_precision": 0.8275862068965517, "eval_TIME_recall": 0.8571428571428571, "eval_loss": 0.18190883100032806, "eval_overall_accuracy": 0.9585354025218235, "eval_overall_f1": 0.8184281842818427, "eval_overall_precision": 0.7723785166240409, "eval_overall_recall": 0.8703170028818443, "eval_runtime": 1.0594, "eval_samples_per_second": 176.508, "eval_steps_per_second": 2.832, "step": 4452 }, { "epoch": 43.0, "grad_norm": 0.31616175174713135, "learning_rate": 2.8499999999999998e-05, "loss": 0.0295, "step": 4558 }, { "epoch": 43.0, "eval_LOCATION_f1": 0.7792207792207793, "eval_LOCATION_number": 71, "eval_LOCATION_precision": 0.7228915662650602, "eval_LOCATION_recall": 0.8450704225352113, "eval_ORGANIZATION_f1": 0.7516778523489933, "eval_ORGANIZATION_number": 65, "eval_ORGANIZATION_precision": 0.6666666666666666, "eval_ORGANIZATION_recall": 0.8615384615384616, "eval_PERSON_f1": 0.8867313915857605, "eval_PERSON_number": 150, "eval_PERSON_precision": 0.8616352201257862, "eval_PERSON_recall": 0.9133333333333333, "eval_QUANTITY_f1": 0.7105263157894738, "eval_QUANTITY_number": 33, "eval_QUANTITY_precision": 0.627906976744186, "eval_QUANTITY_recall": 0.8181818181818182, "eval_TIME_f1": 0.8727272727272727, "eval_TIME_number": 28, "eval_TIME_precision": 0.8888888888888888, "eval_TIME_recall": 0.8571428571428571, "eval_loss": 0.19346393644809723, "eval_overall_accuracy": 0.9575654704170709, "eval_overall_f1": 0.8183041722745625, "eval_overall_precision": 0.7676767676767676, "eval_overall_recall": 0.8760806916426513, "eval_runtime": 1.0521, "eval_samples_per_second": 177.732, "eval_steps_per_second": 2.851, "step": 4558 }, { "epoch": 44.0, "grad_norm": 2.207120418548584, "learning_rate": 2.8000000000000003e-05, "loss": 0.0301, "step": 4664 }, { "epoch": 44.0, "eval_LOCATION_f1": 0.8026315789473684, "eval_LOCATION_number": 71, "eval_LOCATION_precision": 0.7530864197530864, "eval_LOCATION_recall": 0.8591549295774648, "eval_ORGANIZATION_f1": 0.7307692307692307, "eval_ORGANIZATION_number": 65, "eval_ORGANIZATION_precision": 0.6263736263736264, "eval_ORGANIZATION_recall": 0.8769230769230769, "eval_PERSON_f1": 0.9061488673139159, "eval_PERSON_number": 150, "eval_PERSON_precision": 0.8805031446540881, "eval_PERSON_recall": 0.9333333333333333, "eval_QUANTITY_f1": 0.7397260273972603, "eval_QUANTITY_number": 33, "eval_QUANTITY_precision": 0.675, "eval_QUANTITY_recall": 0.8181818181818182, "eval_TIME_f1": 0.888888888888889, "eval_TIME_number": 28, "eval_TIME_precision": 0.9230769230769231, "eval_TIME_recall": 0.8571428571428571, "eval_loss": 0.19700577855110168, "eval_overall_accuracy": 0.957807953443259, "eval_overall_f1": 0.8306451612903226, "eval_overall_precision": 0.7783375314861462, "eval_overall_recall": 0.8904899135446686, "eval_runtime": 1.0474, "eval_samples_per_second": 178.541, "eval_steps_per_second": 2.864, "step": 4664 }, { "epoch": 45.0, "grad_norm": 0.8179439902305603, "learning_rate": 2.7500000000000004e-05, "loss": 0.0291, "step": 4770 }, { "epoch": 45.0, "eval_LOCATION_f1": 0.782051282051282, "eval_LOCATION_number": 71, "eval_LOCATION_precision": 0.7176470588235294, "eval_LOCATION_recall": 0.8591549295774648, "eval_ORGANIZATION_f1": 0.7862068965517242, "eval_ORGANIZATION_number": 65, "eval_ORGANIZATION_precision": 0.7125, "eval_ORGANIZATION_recall": 0.8769230769230769, "eval_PERSON_f1": 0.8903225806451613, "eval_PERSON_number": 150, "eval_PERSON_precision": 0.8625, "eval_PERSON_recall": 0.92, "eval_QUANTITY_f1": 0.7945205479452054, "eval_QUANTITY_number": 33, "eval_QUANTITY_precision": 0.725, "eval_QUANTITY_recall": 0.8787878787878788, "eval_TIME_f1": 0.7999999999999999, "eval_TIME_number": 28, "eval_TIME_precision": 0.75, "eval_TIME_recall": 0.8571428571428571, "eval_loss": 0.19478309154510498, "eval_overall_accuracy": 0.9595053346265762, "eval_overall_f1": 0.8306451612903226, "eval_overall_precision": 0.7783375314861462, "eval_overall_recall": 0.8904899135446686, "eval_runtime": 1.1283, "eval_samples_per_second": 165.73, "eval_steps_per_second": 2.659, "step": 4770 }, { "epoch": 46.0, "grad_norm": 0.5856307148933411, "learning_rate": 2.7000000000000002e-05, "loss": 0.0274, "step": 4876 }, { "epoch": 46.0, "eval_LOCATION_f1": 0.8026315789473684, "eval_LOCATION_number": 71, "eval_LOCATION_precision": 0.7530864197530864, "eval_LOCATION_recall": 0.8591549295774648, "eval_ORGANIZATION_f1": 0.7785234899328859, "eval_ORGANIZATION_number": 65, "eval_ORGANIZATION_precision": 0.6904761904761905, "eval_ORGANIZATION_recall": 0.8923076923076924, "eval_PERSON_f1": 0.8910891089108911, "eval_PERSON_number": 150, "eval_PERSON_precision": 0.8823529411764706, "eval_PERSON_recall": 0.9, "eval_QUANTITY_f1": 0.7397260273972603, "eval_QUANTITY_number": 33, "eval_QUANTITY_precision": 0.675, "eval_QUANTITY_recall": 0.8181818181818182, "eval_TIME_f1": 0.8275862068965518, "eval_TIME_number": 28, "eval_TIME_precision": 0.8, "eval_TIME_recall": 0.8571428571428571, "eval_loss": 0.18428590893745422, "eval_overall_accuracy": 0.960717749757517, "eval_overall_f1": 0.8299319727891157, "eval_overall_precision": 0.7860824742268041, "eval_overall_recall": 0.8789625360230547, "eval_runtime": 1.0545, "eval_samples_per_second": 177.342, "eval_steps_per_second": 2.845, "step": 4876 }, { "epoch": 47.0, "grad_norm": 0.8249619007110596, "learning_rate": 2.6500000000000004e-05, "loss": 0.0249, "step": 4982 }, { "epoch": 47.0, "eval_LOCATION_f1": 0.7792207792207793, "eval_LOCATION_number": 71, "eval_LOCATION_precision": 0.7228915662650602, "eval_LOCATION_recall": 0.8450704225352113, "eval_ORGANIZATION_f1": 0.7619047619047619, "eval_ORGANIZATION_number": 65, "eval_ORGANIZATION_precision": 0.6829268292682927, "eval_ORGANIZATION_recall": 0.8615384615384616, "eval_PERSON_f1": 0.8846153846153846, "eval_PERSON_number": 150, "eval_PERSON_precision": 0.8518518518518519, "eval_PERSON_recall": 0.92, "eval_QUANTITY_f1": 0.7105263157894738, "eval_QUANTITY_number": 33, "eval_QUANTITY_precision": 0.627906976744186, "eval_QUANTITY_recall": 0.8181818181818182, "eval_TIME_f1": 0.8571428571428571, "eval_TIME_number": 28, "eval_TIME_precision": 0.8571428571428571, "eval_TIME_recall": 0.8571428571428571, "eval_loss": 0.2020081728696823, "eval_overall_accuracy": 0.9587778855480117, "eval_overall_f1": 0.8187919463087249, "eval_overall_precision": 0.7663316582914573, "eval_overall_recall": 0.8789625360230547, "eval_runtime": 1.0517, "eval_samples_per_second": 177.806, "eval_steps_per_second": 2.853, "step": 4982 }, { "epoch": 48.0, "grad_norm": 1.4953243732452393, "learning_rate": 2.6000000000000002e-05, "loss": 0.0259, "step": 5088 }, { "epoch": 48.0, "eval_LOCATION_f1": 0.7973856209150327, "eval_LOCATION_number": 71, "eval_LOCATION_precision": 0.7439024390243902, "eval_LOCATION_recall": 0.8591549295774648, "eval_ORGANIZATION_f1": 0.7857142857142856, "eval_ORGANIZATION_number": 65, "eval_ORGANIZATION_precision": 0.7333333333333333, "eval_ORGANIZATION_recall": 0.8461538461538461, "eval_PERSON_f1": 0.8867313915857605, "eval_PERSON_number": 150, "eval_PERSON_precision": 0.8616352201257862, "eval_PERSON_recall": 0.9133333333333333, "eval_QUANTITY_f1": 0.7671232876712328, "eval_QUANTITY_number": 33, "eval_QUANTITY_precision": 0.7, "eval_QUANTITY_recall": 0.8484848484848485, "eval_TIME_f1": 0.8421052631578947, "eval_TIME_number": 28, "eval_TIME_precision": 0.8275862068965517, "eval_TIME_recall": 0.8571428571428571, "eval_loss": 0.18837600946426392, "eval_overall_accuracy": 0.9629000969932104, "eval_overall_f1": 0.8333333333333333, "eval_overall_precision": 0.7922077922077922, "eval_overall_recall": 0.8789625360230547, "eval_runtime": 1.0473, "eval_samples_per_second": 178.558, "eval_steps_per_second": 2.865, "step": 5088 }, { "epoch": 49.0, "grad_norm": 0.07555894553661346, "learning_rate": 2.5500000000000003e-05, "loss": 0.0252, "step": 5194 }, { "epoch": 49.0, "eval_LOCATION_f1": 0.7922077922077921, "eval_LOCATION_number": 71, "eval_LOCATION_precision": 0.7349397590361446, "eval_LOCATION_recall": 0.8591549295774648, "eval_ORGANIZATION_f1": 0.7746478873239436, "eval_ORGANIZATION_number": 65, "eval_ORGANIZATION_precision": 0.7142857142857143, "eval_ORGANIZATION_recall": 0.8461538461538461, "eval_PERSON_f1": 0.8925081433224756, "eval_PERSON_number": 150, "eval_PERSON_precision": 0.8726114649681529, "eval_PERSON_recall": 0.9133333333333333, "eval_QUANTITY_f1": 0.821917808219178, "eval_QUANTITY_number": 33, "eval_QUANTITY_precision": 0.75, "eval_QUANTITY_recall": 0.9090909090909091, "eval_TIME_f1": 0.888888888888889, "eval_TIME_number": 28, "eval_TIME_precision": 0.9230769230769231, "eval_TIME_recall": 0.8571428571428571, "eval_loss": 0.18851637840270996, "eval_overall_accuracy": 0.9626576139670223, "eval_overall_f1": 0.8410958904109589, "eval_overall_precision": 0.8015665796344648, "eval_overall_recall": 0.8847262247838616, "eval_runtime": 1.0481, "eval_samples_per_second": 178.415, "eval_steps_per_second": 2.862, "step": 5194 }, { "epoch": 50.0, "grad_norm": 2.4923367500305176, "learning_rate": 2.5e-05, "loss": 0.0243, "step": 5300 }, { "epoch": 50.0, "eval_LOCATION_f1": 0.7922077922077921, "eval_LOCATION_number": 71, "eval_LOCATION_precision": 0.7349397590361446, "eval_LOCATION_recall": 0.8591549295774648, "eval_ORGANIZATION_f1": 0.7659574468085107, "eval_ORGANIZATION_number": 65, "eval_ORGANIZATION_precision": 0.7105263157894737, "eval_ORGANIZATION_recall": 0.8307692307692308, "eval_PERSON_f1": 0.8925081433224756, "eval_PERSON_number": 150, "eval_PERSON_precision": 0.8726114649681529, "eval_PERSON_recall": 0.9133333333333333, "eval_QUANTITY_f1": 0.7671232876712328, "eval_QUANTITY_number": 33, "eval_QUANTITY_precision": 0.7, "eval_QUANTITY_recall": 0.8484848484848485, "eval_TIME_f1": 0.8727272727272727, "eval_TIME_number": 28, "eval_TIME_precision": 0.8888888888888888, "eval_TIME_recall": 0.8571428571428571, "eval_loss": 0.19272957742214203, "eval_overall_accuracy": 0.9604752667313288, "eval_overall_f1": 0.8328767123287671, "eval_overall_precision": 0.793733681462141, "eval_overall_recall": 0.8760806916426513, "eval_runtime": 1.0636, "eval_samples_per_second": 175.82, "eval_steps_per_second": 2.821, "step": 5300 }, { "epoch": 51.0, "grad_norm": 0.5428743362426758, "learning_rate": 2.45e-05, "loss": 0.0239, "step": 5406 }, { "epoch": 51.0, "eval_LOCATION_f1": 0.7483870967741935, "eval_LOCATION_number": 71, "eval_LOCATION_precision": 0.6904761904761905, "eval_LOCATION_recall": 0.8169014084507042, "eval_ORGANIZATION_f1": 0.7482993197278912, "eval_ORGANIZATION_number": 65, "eval_ORGANIZATION_precision": 0.6707317073170732, "eval_ORGANIZATION_recall": 0.8461538461538461, "eval_PERSON_f1": 0.8838709677419355, "eval_PERSON_number": 150, "eval_PERSON_precision": 0.85625, "eval_PERSON_recall": 0.9133333333333333, "eval_QUANTITY_f1": 0.7567567567567567, "eval_QUANTITY_number": 33, "eval_QUANTITY_precision": 0.6829268292682927, "eval_QUANTITY_recall": 0.8484848484848485, "eval_TIME_f1": 0.8474576271186439, "eval_TIME_number": 28, "eval_TIME_precision": 0.8064516129032258, "eval_TIME_recall": 0.8928571428571429, "eval_loss": 0.20626060664653778, "eval_overall_accuracy": 0.9570805043646945, "eval_overall_f1": 0.8134228187919462, "eval_overall_precision": 0.7613065326633166, "eval_overall_recall": 0.8731988472622478, "eval_runtime": 1.0562, "eval_samples_per_second": 177.052, "eval_steps_per_second": 2.84, "step": 5406 }, { "epoch": 52.0, "grad_norm": 0.7587451934814453, "learning_rate": 2.4e-05, "loss": 0.0238, "step": 5512 }, { "epoch": 52.0, "eval_LOCATION_f1": 0.7843137254901961, "eval_LOCATION_number": 71, "eval_LOCATION_precision": 0.7317073170731707, "eval_LOCATION_recall": 0.8450704225352113, "eval_ORGANIZATION_f1": 0.7567567567567568, "eval_ORGANIZATION_number": 65, "eval_ORGANIZATION_precision": 0.6746987951807228, "eval_ORGANIZATION_recall": 0.8615384615384616, "eval_PERSON_f1": 0.8954248366013071, "eval_PERSON_number": 150, "eval_PERSON_precision": 0.8782051282051282, "eval_PERSON_recall": 0.9133333333333333, "eval_QUANTITY_f1": 0.7466666666666666, "eval_QUANTITY_number": 33, "eval_QUANTITY_precision": 0.6666666666666666, "eval_QUANTITY_recall": 0.8484848484848485, "eval_TIME_f1": 0.8727272727272727, "eval_TIME_number": 28, "eval_TIME_precision": 0.8888888888888888, "eval_TIME_recall": 0.8571428571428571, "eval_loss": 0.2040700912475586, "eval_overall_accuracy": 0.9590203685741998, "eval_overall_f1": 0.8276797829036635, "eval_overall_precision": 0.782051282051282, "eval_overall_recall": 0.8789625360230547, "eval_runtime": 1.0567, "eval_samples_per_second": 176.964, "eval_steps_per_second": 2.839, "step": 5512 }, { "epoch": 53.0, "grad_norm": 0.7874153852462769, "learning_rate": 2.35e-05, "loss": 0.0219, "step": 5618 }, { "epoch": 53.0, "eval_LOCATION_f1": 0.7973856209150327, "eval_LOCATION_number": 71, "eval_LOCATION_precision": 0.7439024390243902, "eval_LOCATION_recall": 0.8591549295774648, "eval_ORGANIZATION_f1": 0.7534246575342466, "eval_ORGANIZATION_number": 65, "eval_ORGANIZATION_precision": 0.6790123456790124, "eval_ORGANIZATION_recall": 0.8461538461538461, "eval_PERSON_f1": 0.8954248366013071, "eval_PERSON_number": 150, "eval_PERSON_precision": 0.8782051282051282, "eval_PERSON_recall": 0.9133333333333333, "eval_QUANTITY_f1": 0.7671232876712328, "eval_QUANTITY_number": 33, "eval_QUANTITY_precision": 0.7, "eval_QUANTITY_recall": 0.8484848484848485, "eval_TIME_f1": 0.8928571428571429, "eval_TIME_number": 28, "eval_TIME_precision": 0.8928571428571429, "eval_TIME_recall": 0.8928571428571429, "eval_loss": 0.19597817957401276, "eval_overall_accuracy": 0.9619301648884578, "eval_overall_f1": 0.8337874659400545, "eval_overall_precision": 0.7906976744186046, "eval_overall_recall": 0.8818443804034583, "eval_runtime": 1.0499, "eval_samples_per_second": 178.109, "eval_steps_per_second": 2.857, "step": 5618 }, { "epoch": 54.0, "grad_norm": 1.4033691883087158, "learning_rate": 2.3000000000000003e-05, "loss": 0.0237, "step": 5724 }, { "epoch": 54.0, "eval_LOCATION_f1": 0.8, "eval_LOCATION_number": 71, "eval_LOCATION_precision": 0.759493670886076, "eval_LOCATION_recall": 0.8450704225352113, "eval_ORGANIZATION_f1": 0.7651006711409396, "eval_ORGANIZATION_number": 65, "eval_ORGANIZATION_precision": 0.6785714285714286, "eval_ORGANIZATION_recall": 0.8769230769230769, "eval_PERSON_f1": 0.8932038834951457, "eval_PERSON_number": 150, "eval_PERSON_precision": 0.8679245283018868, "eval_PERSON_recall": 0.92, "eval_QUANTITY_f1": 0.7671232876712328, "eval_QUANTITY_number": 33, "eval_QUANTITY_precision": 0.7, "eval_QUANTITY_recall": 0.8484848484848485, "eval_TIME_f1": 0.8727272727272727, "eval_TIME_number": 28, "eval_TIME_precision": 0.8888888888888888, "eval_TIME_recall": 0.8571428571428571, "eval_loss": 0.19870668649673462, "eval_overall_accuracy": 0.9602327837051406, "eval_overall_f1": 0.8342391304347825, "eval_overall_precision": 0.7892030848329049, "eval_overall_recall": 0.8847262247838616, "eval_runtime": 1.0458, "eval_samples_per_second": 178.803, "eval_steps_per_second": 2.869, "step": 5724 }, { "epoch": 55.0, "grad_norm": 0.2151368260383606, "learning_rate": 2.25e-05, "loss": 0.021, "step": 5830 }, { "epoch": 55.0, "eval_LOCATION_f1": 0.7692307692307694, "eval_LOCATION_number": 71, "eval_LOCATION_precision": 0.7058823529411765, "eval_LOCATION_recall": 0.8450704225352113, "eval_ORGANIZATION_f1": 0.7468354430379748, "eval_ORGANIZATION_number": 65, "eval_ORGANIZATION_precision": 0.6344086021505376, "eval_ORGANIZATION_recall": 0.9076923076923077, "eval_PERSON_f1": 0.8867313915857605, "eval_PERSON_number": 150, "eval_PERSON_precision": 0.8616352201257862, "eval_PERSON_recall": 0.9133333333333333, "eval_QUANTITY_f1": 0.7012987012987013, "eval_QUANTITY_number": 33, "eval_QUANTITY_precision": 0.6136363636363636, "eval_QUANTITY_recall": 0.8181818181818182, "eval_TIME_f1": 0.8620689655172413, "eval_TIME_number": 28, "eval_TIME_precision": 0.8333333333333334, "eval_TIME_recall": 0.8928571428571429, "eval_loss": 0.22194057703018188, "eval_overall_accuracy": 0.9561105722599418, "eval_overall_f1": 0.8126649076517151, "eval_overall_precision": 0.7493917274939172, "eval_overall_recall": 0.8876080691642652, "eval_runtime": 1.0535, "eval_samples_per_second": 177.497, "eval_steps_per_second": 2.848, "step": 5830 }, { "epoch": 56.0, "grad_norm": 1.3246495723724365, "learning_rate": 2.2000000000000003e-05, "loss": 0.021, "step": 5936 }, { "epoch": 56.0, "eval_LOCATION_f1": 0.7792207792207793, "eval_LOCATION_number": 71, "eval_LOCATION_precision": 0.7228915662650602, "eval_LOCATION_recall": 0.8450704225352113, "eval_ORGANIZATION_f1": 0.7199999999999999, "eval_ORGANIZATION_number": 65, "eval_ORGANIZATION_precision": 0.6352941176470588, "eval_ORGANIZATION_recall": 0.8307692307692308, "eval_PERSON_f1": 0.8766233766233766, "eval_PERSON_number": 150, "eval_PERSON_precision": 0.8544303797468354, "eval_PERSON_recall": 0.9, "eval_QUANTITY_f1": 0.7297297297297297, "eval_QUANTITY_number": 33, "eval_QUANTITY_precision": 0.6585365853658537, "eval_QUANTITY_recall": 0.8181818181818182, "eval_TIME_f1": 0.8620689655172413, "eval_TIME_number": 28, "eval_TIME_precision": 0.8333333333333334, "eval_TIME_recall": 0.8928571428571429, "eval_loss": 0.20850205421447754, "eval_overall_accuracy": 0.9573229873908826, "eval_overall_f1": 0.8091397849462366, "eval_overall_precision": 0.7581863979848866, "eval_overall_recall": 0.8674351585014409, "eval_runtime": 1.0545, "eval_samples_per_second": 177.338, "eval_steps_per_second": 2.845, "step": 5936 }, { "epoch": 57.0, "grad_norm": 1.0762540102005005, "learning_rate": 2.15e-05, "loss": 0.0203, "step": 6042 }, { "epoch": 57.0, "eval_LOCATION_f1": 0.7792207792207793, "eval_LOCATION_number": 71, "eval_LOCATION_precision": 0.7228915662650602, "eval_LOCATION_recall": 0.8450704225352113, "eval_ORGANIZATION_f1": 0.76056338028169, "eval_ORGANIZATION_number": 65, "eval_ORGANIZATION_precision": 0.7012987012987013, "eval_ORGANIZATION_recall": 0.8307692307692308, "eval_PERSON_f1": 0.8938906752411575, "eval_PERSON_number": 150, "eval_PERSON_precision": 0.8633540372670807, "eval_PERSON_recall": 0.9266666666666666, "eval_QUANTITY_f1": 0.7671232876712328, "eval_QUANTITY_number": 33, "eval_QUANTITY_precision": 0.7, "eval_QUANTITY_recall": 0.8484848484848485, "eval_TIME_f1": 0.8421052631578947, "eval_TIME_number": 28, "eval_TIME_precision": 0.8275862068965517, "eval_TIME_recall": 0.8571428571428571, "eval_loss": 0.2009107619524002, "eval_overall_accuracy": 0.9616876818622696, "eval_overall_f1": 0.8276797829036635, "eval_overall_precision": 0.782051282051282, "eval_overall_recall": 0.8789625360230547, "eval_runtime": 1.0514, "eval_samples_per_second": 177.857, "eval_steps_per_second": 2.853, "step": 6042 }, { "epoch": 58.0, "grad_norm": 1.3385218381881714, "learning_rate": 2.1e-05, "loss": 0.0196, "step": 6148 }, { "epoch": 58.0, "eval_LOCATION_f1": 0.7712418300653594, "eval_LOCATION_number": 71, "eval_LOCATION_precision": 0.7195121951219512, "eval_LOCATION_recall": 0.8309859154929577, "eval_ORGANIZATION_f1": 0.7464788732394366, "eval_ORGANIZATION_number": 65, "eval_ORGANIZATION_precision": 0.6883116883116883, "eval_ORGANIZATION_recall": 0.8153846153846154, "eval_PERSON_f1": 0.8810289389067525, "eval_PERSON_number": 150, "eval_PERSON_precision": 0.8509316770186336, "eval_PERSON_recall": 0.9133333333333333, "eval_QUANTITY_f1": 0.7777777777777778, "eval_QUANTITY_number": 33, "eval_QUANTITY_precision": 0.717948717948718, "eval_QUANTITY_recall": 0.8484848484848485, "eval_TIME_f1": 0.8421052631578947, "eval_TIME_number": 28, "eval_TIME_precision": 0.8275862068965517, "eval_TIME_recall": 0.8571428571428571, "eval_loss": 0.1974872499704361, "eval_overall_accuracy": 0.960717749757517, "eval_overall_f1": 0.8190476190476191, "eval_overall_precision": 0.7757731958762887, "eval_overall_recall": 0.8674351585014409, "eval_runtime": 1.06, "eval_samples_per_second": 176.42, "eval_steps_per_second": 2.83, "step": 6148 }, { "epoch": 59.0, "grad_norm": 0.45897576212882996, "learning_rate": 2.05e-05, "loss": 0.0195, "step": 6254 }, { "epoch": 59.0, "eval_LOCATION_f1": 0.7741935483870968, "eval_LOCATION_number": 71, "eval_LOCATION_precision": 0.7142857142857143, "eval_LOCATION_recall": 0.8450704225352113, "eval_ORGANIZATION_f1": 0.7777777777777778, "eval_ORGANIZATION_number": 65, "eval_ORGANIZATION_precision": 0.7088607594936709, "eval_ORGANIZATION_recall": 0.8615384615384616, "eval_PERSON_f1": 0.896103896103896, "eval_PERSON_number": 150, "eval_PERSON_precision": 0.8734177215189873, "eval_PERSON_recall": 0.92, "eval_QUANTITY_f1": 0.7671232876712328, "eval_QUANTITY_number": 33, "eval_QUANTITY_precision": 0.7, "eval_QUANTITY_recall": 0.8484848484848485, "eval_TIME_f1": 0.8421052631578947, "eval_TIME_number": 28, "eval_TIME_precision": 0.8275862068965517, "eval_TIME_recall": 0.8571428571428571, "eval_loss": 0.20014727115631104, "eval_overall_accuracy": 0.9602327837051406, "eval_overall_f1": 0.830393487109905, "eval_overall_precision": 0.7846153846153846, "eval_overall_recall": 0.8818443804034583, "eval_runtime": 1.0622, "eval_samples_per_second": 176.051, "eval_steps_per_second": 2.824, "step": 6254 }, { "epoch": 60.0, "grad_norm": 0.07298379391431808, "learning_rate": 2e-05, "loss": 0.0188, "step": 6360 }, { "epoch": 60.0, "eval_LOCATION_f1": 0.8, "eval_LOCATION_number": 71, "eval_LOCATION_precision": 0.759493670886076, "eval_LOCATION_recall": 0.8450704225352113, "eval_ORGANIZATION_f1": 0.7801418439716312, "eval_ORGANIZATION_number": 65, "eval_ORGANIZATION_precision": 0.7236842105263158, "eval_ORGANIZATION_recall": 0.8461538461538461, "eval_PERSON_f1": 0.8954248366013071, "eval_PERSON_number": 150, "eval_PERSON_precision": 0.8782051282051282, "eval_PERSON_recall": 0.9133333333333333, "eval_QUANTITY_f1": 0.7671232876712328, "eval_QUANTITY_number": 33, "eval_QUANTITY_precision": 0.7, "eval_QUANTITY_recall": 0.8484848484848485, "eval_TIME_f1": 0.8421052631578947, "eval_TIME_number": 28, "eval_TIME_precision": 0.8275862068965517, "eval_TIME_recall": 0.8571428571428571, "eval_loss": 0.19487623870372772, "eval_overall_accuracy": 0.9619301648884578, "eval_overall_f1": 0.8363136176066025, "eval_overall_precision": 0.8, "eval_overall_recall": 0.8760806916426513, "eval_runtime": 1.0468, "eval_samples_per_second": 178.634, "eval_steps_per_second": 2.866, "step": 6360 }, { "epoch": 61.0, "grad_norm": 3.493285655975342, "learning_rate": 1.9500000000000003e-05, "loss": 0.0197, "step": 6466 }, { "epoch": 61.0, "eval_LOCATION_f1": 0.7894736842105262, "eval_LOCATION_number": 71, "eval_LOCATION_precision": 0.7407407407407407, "eval_LOCATION_recall": 0.8450704225352113, "eval_ORGANIZATION_f1": 0.7619047619047619, "eval_ORGANIZATION_number": 65, "eval_ORGANIZATION_precision": 0.6829268292682927, "eval_ORGANIZATION_recall": 0.8615384615384616, "eval_PERSON_f1": 0.887459807073955, "eval_PERSON_number": 150, "eval_PERSON_precision": 0.8571428571428571, "eval_PERSON_recall": 0.92, "eval_QUANTITY_f1": 0.7671232876712328, "eval_QUANTITY_number": 33, "eval_QUANTITY_precision": 0.7, "eval_QUANTITY_recall": 0.8484848484848485, "eval_TIME_f1": 0.8421052631578947, "eval_TIME_number": 28, "eval_TIME_precision": 0.8275862068965517, "eval_TIME_recall": 0.8571428571428571, "eval_loss": 0.20809414982795715, "eval_overall_accuracy": 0.9595053346265762, "eval_overall_f1": 0.827027027027027, "eval_overall_precision": 0.7786259541984732, "eval_overall_recall": 0.8818443804034583, "eval_runtime": 1.04, "eval_samples_per_second": 179.808, "eval_steps_per_second": 2.885, "step": 6466 }, { "epoch": 62.0, "grad_norm": 0.8092681169509888, "learning_rate": 1.9e-05, "loss": 0.0173, "step": 6572 }, { "epoch": 62.0, "eval_LOCATION_f1": 0.7843137254901961, "eval_LOCATION_number": 71, "eval_LOCATION_precision": 0.7317073170731707, "eval_LOCATION_recall": 0.8450704225352113, "eval_ORGANIZATION_f1": 0.7567567567567568, "eval_ORGANIZATION_number": 65, "eval_ORGANIZATION_precision": 0.6746987951807228, "eval_ORGANIZATION_recall": 0.8615384615384616, "eval_PERSON_f1": 0.8990228013029316, "eval_PERSON_number": 150, "eval_PERSON_precision": 0.8789808917197452, "eval_PERSON_recall": 0.92, "eval_QUANTITY_f1": 0.7671232876712328, "eval_QUANTITY_number": 33, "eval_QUANTITY_precision": 0.7, "eval_QUANTITY_recall": 0.8484848484848485, "eval_TIME_f1": 0.8620689655172413, "eval_TIME_number": 28, "eval_TIME_precision": 0.8333333333333334, "eval_TIME_recall": 0.8928571428571429, "eval_loss": 0.20864509046077728, "eval_overall_accuracy": 0.9604752667313288, "eval_overall_f1": 0.8308525033829499, "eval_overall_precision": 0.7831632653061225, "eval_overall_recall": 0.8847262247838616, "eval_runtime": 1.0523, "eval_samples_per_second": 177.712, "eval_steps_per_second": 2.851, "step": 6572 }, { "epoch": 63.0, "grad_norm": 2.9163479804992676, "learning_rate": 1.85e-05, "loss": 0.0169, "step": 6678 }, { "epoch": 63.0, "eval_LOCATION_f1": 0.794701986754967, "eval_LOCATION_number": 71, "eval_LOCATION_precision": 0.75, "eval_LOCATION_recall": 0.8450704225352113, "eval_ORGANIZATION_f1": 0.7466666666666668, "eval_ORGANIZATION_number": 65, "eval_ORGANIZATION_precision": 0.6588235294117647, "eval_ORGANIZATION_recall": 0.8615384615384616, "eval_PERSON_f1": 0.8918032786885245, "eval_PERSON_number": 150, "eval_PERSON_precision": 0.8774193548387097, "eval_PERSON_recall": 0.9066666666666666, "eval_QUANTITY_f1": 0.8055555555555556, "eval_QUANTITY_number": 33, "eval_QUANTITY_precision": 0.7435897435897436, "eval_QUANTITY_recall": 0.8787878787878788, "eval_TIME_f1": 0.8421052631578947, "eval_TIME_number": 28, "eval_TIME_precision": 0.8275862068965517, "eval_TIME_recall": 0.8571428571428571, "eval_loss": 0.20584411919116974, "eval_overall_accuracy": 0.9602327837051406, "eval_overall_f1": 0.8299319727891157, "eval_overall_precision": 0.7860824742268041, "eval_overall_recall": 0.8789625360230547, "eval_runtime": 1.0618, "eval_samples_per_second": 176.115, "eval_steps_per_second": 2.825, "step": 6678 }, { "epoch": 64.0, "grad_norm": 1.6419179439544678, "learning_rate": 1.8e-05, "loss": 0.0173, "step": 6784 }, { "epoch": 64.0, "eval_LOCATION_f1": 0.794701986754967, "eval_LOCATION_number": 71, "eval_LOCATION_precision": 0.75, "eval_LOCATION_recall": 0.8450704225352113, "eval_ORGANIZATION_f1": 0.8, "eval_ORGANIZATION_number": 65, "eval_ORGANIZATION_precision": 0.7714285714285715, "eval_ORGANIZATION_recall": 0.8307692307692308, "eval_PERSON_f1": 0.8852459016393444, "eval_PERSON_number": 150, "eval_PERSON_precision": 0.8709677419354839, "eval_PERSON_recall": 0.9, "eval_QUANTITY_f1": 0.7777777777777778, "eval_QUANTITY_number": 33, "eval_QUANTITY_precision": 0.717948717948718, "eval_QUANTITY_recall": 0.8484848484848485, "eval_TIME_f1": 0.8571428571428571, "eval_TIME_number": 28, "eval_TIME_precision": 0.8571428571428571, "eval_TIME_recall": 0.8571428571428571, "eval_loss": 0.20184890925884247, "eval_overall_accuracy": 0.9631425800193987, "eval_overall_f1": 0.8372739916550765, "eval_overall_precision": 0.8091397849462365, "eval_overall_recall": 0.8674351585014409, "eval_runtime": 1.1318, "eval_samples_per_second": 165.226, "eval_steps_per_second": 2.651, "step": 6784 }, { "epoch": 65.0, "grad_norm": 0.9246335029602051, "learning_rate": 1.75e-05, "loss": 0.0149, "step": 6890 }, { "epoch": 65.0, "eval_LOCATION_f1": 0.7843137254901961, "eval_LOCATION_number": 71, "eval_LOCATION_precision": 0.7317073170731707, "eval_LOCATION_recall": 0.8450704225352113, "eval_ORGANIZATION_f1": 0.757142857142857, "eval_ORGANIZATION_number": 65, "eval_ORGANIZATION_precision": 0.7066666666666667, "eval_ORGANIZATION_recall": 0.8153846153846154, "eval_PERSON_f1": 0.8867313915857605, "eval_PERSON_number": 150, "eval_PERSON_precision": 0.8616352201257862, "eval_PERSON_recall": 0.9133333333333333, "eval_QUANTITY_f1": 0.7671232876712328, "eval_QUANTITY_number": 33, "eval_QUANTITY_precision": 0.7, "eval_QUANTITY_recall": 0.8484848484848485, "eval_TIME_f1": 0.8771929824561403, "eval_TIME_number": 28, "eval_TIME_precision": 0.8620689655172413, "eval_TIME_recall": 0.8928571428571429, "eval_loss": 0.20779463648796082, "eval_overall_accuracy": 0.962172647914646, "eval_overall_f1": 0.8278688524590164, "eval_overall_precision": 0.787012987012987, "eval_overall_recall": 0.8731988472622478, "eval_runtime": 1.0499, "eval_samples_per_second": 178.113, "eval_steps_per_second": 2.857, "step": 6890 }, { "epoch": 66.0, "grad_norm": 0.29005441069602966, "learning_rate": 1.7000000000000003e-05, "loss": 0.0155, "step": 6996 }, { "epoch": 66.0, "eval_LOCATION_f1": 0.7692307692307694, "eval_LOCATION_number": 71, "eval_LOCATION_precision": 0.7058823529411765, "eval_LOCATION_recall": 0.8450704225352113, "eval_ORGANIZATION_f1": 0.7567567567567568, "eval_ORGANIZATION_number": 65, "eval_ORGANIZATION_precision": 0.6746987951807228, "eval_ORGANIZATION_recall": 0.8615384615384616, "eval_PERSON_f1": 0.8990228013029316, "eval_PERSON_number": 150, "eval_PERSON_precision": 0.8789808917197452, "eval_PERSON_recall": 0.92, "eval_QUANTITY_f1": 0.7671232876712328, "eval_QUANTITY_number": 33, "eval_QUANTITY_precision": 0.7, "eval_QUANTITY_recall": 0.8484848484848485, "eval_TIME_f1": 0.8421052631578947, "eval_TIME_number": 28, "eval_TIME_precision": 0.8275862068965517, "eval_TIME_recall": 0.8571428571428571, "eval_loss": 0.22765351831912994, "eval_overall_accuracy": 0.9592628516003879, "eval_overall_f1": 0.8259109311740891, "eval_overall_precision": 0.7766497461928934, "eval_overall_recall": 0.8818443804034583, "eval_runtime": 1.0539, "eval_samples_per_second": 177.432, "eval_steps_per_second": 2.847, "step": 6996 }, { "epoch": 67.0, "grad_norm": 0.15708033740520477, "learning_rate": 1.65e-05, "loss": 0.0166, "step": 7102 }, { "epoch": 67.0, "eval_LOCATION_f1": 0.7843137254901961, "eval_LOCATION_number": 71, "eval_LOCATION_precision": 0.7317073170731707, "eval_LOCATION_recall": 0.8450704225352113, "eval_ORGANIZATION_f1": 0.7412587412587412, "eval_ORGANIZATION_number": 65, "eval_ORGANIZATION_precision": 0.6794871794871795, "eval_ORGANIZATION_recall": 0.8153846153846154, "eval_PERSON_f1": 0.8996763754045306, "eval_PERSON_number": 150, "eval_PERSON_precision": 0.8742138364779874, "eval_PERSON_recall": 0.9266666666666666, "eval_QUANTITY_f1": 0.7567567567567567, "eval_QUANTITY_number": 33, "eval_QUANTITY_precision": 0.6829268292682927, "eval_QUANTITY_recall": 0.8484848484848485, "eval_TIME_f1": 0.8421052631578947, "eval_TIME_number": 28, "eval_TIME_precision": 0.8275862068965517, "eval_TIME_recall": 0.8571428571428571, "eval_loss": 0.21828927099704742, "eval_overall_accuracy": 0.9604752667313288, "eval_overall_f1": 0.8260869565217391, "eval_overall_precision": 0.781491002570694, "eval_overall_recall": 0.8760806916426513, "eval_runtime": 1.0465, "eval_samples_per_second": 178.691, "eval_steps_per_second": 2.867, "step": 7102 }, { "epoch": 68.0, "grad_norm": 0.745664656162262, "learning_rate": 1.6000000000000003e-05, "loss": 0.0158, "step": 7208 }, { "epoch": 68.0, "eval_LOCATION_f1": 0.7564102564102564, "eval_LOCATION_number": 71, "eval_LOCATION_precision": 0.6941176470588235, "eval_LOCATION_recall": 0.8309859154929577, "eval_ORGANIZATION_f1": 0.7534246575342466, "eval_ORGANIZATION_number": 65, "eval_ORGANIZATION_precision": 0.6790123456790124, "eval_ORGANIZATION_recall": 0.8461538461538461, "eval_PERSON_f1": 0.896774193548387, "eval_PERSON_number": 150, "eval_PERSON_precision": 0.86875, "eval_PERSON_recall": 0.9266666666666666, "eval_QUANTITY_f1": 0.7466666666666666, "eval_QUANTITY_number": 33, "eval_QUANTITY_precision": 0.6666666666666666, "eval_QUANTITY_recall": 0.8484848484848485, "eval_TIME_f1": 0.8771929824561403, "eval_TIME_number": 28, "eval_TIME_precision": 0.8620689655172413, "eval_TIME_recall": 0.8928571428571429, "eval_loss": 0.2362554669380188, "eval_overall_accuracy": 0.9570805043646945, "eval_overall_f1": 0.8225806451612904, "eval_overall_precision": 0.7707808564231738, "eval_overall_recall": 0.8818443804034583, "eval_runtime": 1.0542, "eval_samples_per_second": 177.388, "eval_steps_per_second": 2.846, "step": 7208 }, { "epoch": 69.0, "grad_norm": 0.1767091453075409, "learning_rate": 1.55e-05, "loss": 0.0155, "step": 7314 }, { "epoch": 69.0, "eval_LOCATION_f1": 0.7922077922077921, "eval_LOCATION_number": 71, "eval_LOCATION_precision": 0.7349397590361446, "eval_LOCATION_recall": 0.8591549295774648, "eval_ORGANIZATION_f1": 0.7534246575342466, "eval_ORGANIZATION_number": 65, "eval_ORGANIZATION_precision": 0.6790123456790124, "eval_ORGANIZATION_recall": 0.8461538461538461, "eval_PERSON_f1": 0.8802588996763754, "eval_PERSON_number": 150, "eval_PERSON_precision": 0.8553459119496856, "eval_PERSON_recall": 0.9066666666666666, "eval_QUANTITY_f1": 0.821917808219178, "eval_QUANTITY_number": 33, "eval_QUANTITY_precision": 0.75, "eval_QUANTITY_recall": 0.9090909090909091, "eval_TIME_f1": 0.8421052631578947, "eval_TIME_number": 28, "eval_TIME_precision": 0.8275862068965517, "eval_TIME_recall": 0.8571428571428571, "eval_loss": 0.21981391310691833, "eval_overall_accuracy": 0.9616876818622696, "eval_overall_f1": 0.8281461434370772, "eval_overall_precision": 0.7806122448979592, "eval_overall_recall": 0.8818443804034583, "eval_runtime": 1.0623, "eval_samples_per_second": 176.036, "eval_steps_per_second": 2.824, "step": 7314 }, { "epoch": 70.0, "grad_norm": 0.2924017906188965, "learning_rate": 1.5e-05, "loss": 0.0155, "step": 7420 }, { "epoch": 70.0, "eval_LOCATION_f1": 0.7792207792207793, "eval_LOCATION_number": 71, "eval_LOCATION_precision": 0.7228915662650602, "eval_LOCATION_recall": 0.8450704225352113, "eval_ORGANIZATION_f1": 0.7368421052631579, "eval_ORGANIZATION_number": 65, "eval_ORGANIZATION_precision": 0.6436781609195402, "eval_ORGANIZATION_recall": 0.8615384615384616, "eval_PERSON_f1": 0.9055374592833875, "eval_PERSON_number": 150, "eval_PERSON_precision": 0.8853503184713376, "eval_PERSON_recall": 0.9266666666666666, "eval_QUANTITY_f1": 0.7567567567567567, "eval_QUANTITY_number": 33, "eval_QUANTITY_precision": 0.6829268292682927, "eval_QUANTITY_recall": 0.8484848484848485, "eval_TIME_f1": 0.8727272727272727, "eval_TIME_number": 28, "eval_TIME_precision": 0.8888888888888888, "eval_TIME_recall": 0.8571428571428571, "eval_loss": 0.2236405611038208, "eval_overall_accuracy": 0.9587778855480117, "eval_overall_f1": 0.8274932614555257, "eval_overall_precision": 0.7772151898734178, "eval_overall_recall": 0.8847262247838616, "eval_runtime": 1.0549, "eval_samples_per_second": 177.26, "eval_steps_per_second": 2.844, "step": 7420 }, { "epoch": 71.0, "grad_norm": 0.8644899129867554, "learning_rate": 1.45e-05, "loss": 0.0158, "step": 7526 }, { "epoch": 71.0, "eval_LOCATION_f1": 0.7564102564102564, "eval_LOCATION_number": 71, "eval_LOCATION_precision": 0.6941176470588235, "eval_LOCATION_recall": 0.8309859154929577, "eval_ORGANIZATION_f1": 0.7096774193548387, "eval_ORGANIZATION_number": 65, "eval_ORGANIZATION_precision": 0.6111111111111112, "eval_ORGANIZATION_recall": 0.8461538461538461, "eval_PERSON_f1": 0.9025974025974027, "eval_PERSON_number": 150, "eval_PERSON_precision": 0.879746835443038, "eval_PERSON_recall": 0.9266666666666666, "eval_QUANTITY_f1": 0.7945205479452054, "eval_QUANTITY_number": 33, "eval_QUANTITY_precision": 0.725, "eval_QUANTITY_recall": 0.8787878787878788, "eval_TIME_f1": 0.8571428571428571, "eval_TIME_number": 28, "eval_TIME_precision": 0.8571428571428571, "eval_TIME_recall": 0.8571428571428571, "eval_loss": 0.23344790935516357, "eval_overall_accuracy": 0.9570805043646945, "eval_overall_f1": 0.8181818181818181, "eval_overall_precision": 0.7630922693266833, "eval_overall_recall": 0.8818443804034583, "eval_runtime": 1.1196, "eval_samples_per_second": 167.021, "eval_steps_per_second": 2.679, "step": 7526 }, { "epoch": 72.0, "grad_norm": 0.4155713617801666, "learning_rate": 1.4000000000000001e-05, "loss": 0.0155, "step": 7632 }, { "epoch": 72.0, "eval_LOCATION_f1": 0.7843137254901961, "eval_LOCATION_number": 71, "eval_LOCATION_precision": 0.7317073170731707, "eval_LOCATION_recall": 0.8450704225352113, "eval_ORGANIZATION_f1": 0.7746478873239436, "eval_ORGANIZATION_number": 65, "eval_ORGANIZATION_precision": 0.7142857142857143, "eval_ORGANIZATION_recall": 0.8461538461538461, "eval_PERSON_f1": 0.8859934853420196, "eval_PERSON_number": 150, "eval_PERSON_precision": 0.8662420382165605, "eval_PERSON_recall": 0.9066666666666666, "eval_QUANTITY_f1": 0.7671232876712328, "eval_QUANTITY_number": 33, "eval_QUANTITY_precision": 0.7, "eval_QUANTITY_recall": 0.8484848484848485, "eval_TIME_f1": 0.8421052631578947, "eval_TIME_number": 28, "eval_TIME_precision": 0.8275862068965517, "eval_TIME_recall": 0.8571428571428571, "eval_loss": 0.21206453442573547, "eval_overall_accuracy": 0.9609602327837051, "eval_overall_f1": 0.8278688524590164, "eval_overall_precision": 0.787012987012987, "eval_overall_recall": 0.8731988472622478, "eval_runtime": 1.0476, "eval_samples_per_second": 178.503, "eval_steps_per_second": 2.864, "step": 7632 }, { "epoch": 73.0, "grad_norm": 0.16996408998966217, "learning_rate": 1.3500000000000001e-05, "loss": 0.0136, "step": 7738 }, { "epoch": 73.0, "eval_LOCATION_f1": 0.7973856209150327, "eval_LOCATION_number": 71, "eval_LOCATION_precision": 0.7439024390243902, "eval_LOCATION_recall": 0.8591549295774648, "eval_ORGANIZATION_f1": 0.7361111111111112, "eval_ORGANIZATION_number": 65, "eval_ORGANIZATION_precision": 0.6708860759493671, "eval_ORGANIZATION_recall": 0.8153846153846154, "eval_PERSON_f1": 0.8938906752411575, "eval_PERSON_number": 150, "eval_PERSON_precision": 0.8633540372670807, "eval_PERSON_recall": 0.9266666666666666, "eval_QUANTITY_f1": 0.7297297297297297, "eval_QUANTITY_number": 33, "eval_QUANTITY_precision": 0.6585365853658537, "eval_QUANTITY_recall": 0.8181818181818182, "eval_TIME_f1": 0.8571428571428571, "eval_TIME_number": 28, "eval_TIME_precision": 0.8571428571428571, "eval_TIME_recall": 0.8571428571428571, "eval_loss": 0.23162654042243958, "eval_overall_accuracy": 0.9580504364694471, "eval_overall_f1": 0.8238482384823849, "eval_overall_precision": 0.7774936061381074, "eval_overall_recall": 0.8760806916426513, "eval_runtime": 1.0665, "eval_samples_per_second": 175.338, "eval_steps_per_second": 2.813, "step": 7738 }, { "epoch": 74.0, "grad_norm": 1.7051116228103638, "learning_rate": 1.3000000000000001e-05, "loss": 0.0134, "step": 7844 }, { "epoch": 74.0, "eval_LOCATION_f1": 0.8026315789473684, "eval_LOCATION_number": 71, "eval_LOCATION_precision": 0.7530864197530864, "eval_LOCATION_recall": 0.8591549295774648, "eval_ORGANIZATION_f1": 0.7857142857142856, "eval_ORGANIZATION_number": 65, "eval_ORGANIZATION_precision": 0.7333333333333333, "eval_ORGANIZATION_recall": 0.8461538461538461, "eval_PERSON_f1": 0.9019607843137256, "eval_PERSON_number": 150, "eval_PERSON_precision": 0.8846153846153846, "eval_PERSON_recall": 0.92, "eval_QUANTITY_f1": 0.7397260273972603, "eval_QUANTITY_number": 33, "eval_QUANTITY_precision": 0.675, "eval_QUANTITY_recall": 0.8181818181818182, "eval_TIME_f1": 0.8421052631578947, "eval_TIME_number": 28, "eval_TIME_precision": 0.8275862068965517, "eval_TIME_recall": 0.8571428571428571, "eval_loss": 0.22262556850910187, "eval_overall_accuracy": 0.9609602327837051, "eval_overall_f1": 0.8379120879120878, "eval_overall_precision": 0.800524934383202, "eval_overall_recall": 0.8789625360230547, "eval_runtime": 1.0491, "eval_samples_per_second": 178.241, "eval_steps_per_second": 2.859, "step": 7844 }, { "epoch": 75.0, "grad_norm": 0.22455532848834991, "learning_rate": 1.25e-05, "loss": 0.0139, "step": 7950 }, { "epoch": 75.0, "eval_LOCATION_f1": 0.7712418300653594, "eval_LOCATION_number": 71, "eval_LOCATION_precision": 0.7195121951219512, "eval_LOCATION_recall": 0.8309859154929577, "eval_ORGANIZATION_f1": 0.7887323943661972, "eval_ORGANIZATION_number": 65, "eval_ORGANIZATION_precision": 0.7272727272727273, "eval_ORGANIZATION_recall": 0.8615384615384616, "eval_PERSON_f1": 0.9019607843137256, "eval_PERSON_number": 150, "eval_PERSON_precision": 0.8846153846153846, "eval_PERSON_recall": 0.92, "eval_QUANTITY_f1": 0.7671232876712328, "eval_QUANTITY_number": 33, "eval_QUANTITY_precision": 0.7, "eval_QUANTITY_recall": 0.8484848484848485, "eval_TIME_f1": 0.8571428571428571, "eval_TIME_number": 28, "eval_TIME_precision": 0.8571428571428571, "eval_TIME_recall": 0.8571428571428571, "eval_loss": 0.21403230726718903, "eval_overall_accuracy": 0.9609602327837051, "eval_overall_f1": 0.8356164383561643, "eval_overall_precision": 0.7963446475195822, "eval_overall_recall": 0.8789625360230547, "eval_runtime": 1.0631, "eval_samples_per_second": 175.908, "eval_steps_per_second": 2.822, "step": 7950 }, { "epoch": 76.0, "grad_norm": 0.007820017635822296, "learning_rate": 1.2e-05, "loss": 0.0142, "step": 8056 }, { "epoch": 76.0, "eval_LOCATION_f1": 0.7692307692307694, "eval_LOCATION_number": 71, "eval_LOCATION_precision": 0.7058823529411765, "eval_LOCATION_recall": 0.8450704225352113, "eval_ORGANIZATION_f1": 0.7746478873239436, "eval_ORGANIZATION_number": 65, "eval_ORGANIZATION_precision": 0.7142857142857143, "eval_ORGANIZATION_recall": 0.8461538461538461, "eval_PERSON_f1": 0.896103896103896, "eval_PERSON_number": 150, "eval_PERSON_precision": 0.8734177215189873, "eval_PERSON_recall": 0.92, "eval_QUANTITY_f1": 0.7945205479452054, "eval_QUANTITY_number": 33, "eval_QUANTITY_precision": 0.725, "eval_QUANTITY_recall": 0.8787878787878788, "eval_TIME_f1": 0.8421052631578947, "eval_TIME_number": 28, "eval_TIME_precision": 0.8275862068965517, "eval_TIME_recall": 0.8571428571428571, "eval_loss": 0.22380225360393524, "eval_overall_accuracy": 0.9612027158098934, "eval_overall_f1": 0.8315217391304348, "eval_overall_precision": 0.7866323907455013, "eval_overall_recall": 0.8818443804034583, "eval_runtime": 1.0493, "eval_samples_per_second": 178.206, "eval_steps_per_second": 2.859, "step": 8056 }, { "epoch": 77.0, "grad_norm": 0.41897082328796387, "learning_rate": 1.1500000000000002e-05, "loss": 0.014, "step": 8162 }, { "epoch": 77.0, "eval_LOCATION_f1": 0.782051282051282, "eval_LOCATION_number": 71, "eval_LOCATION_precision": 0.7176470588235294, "eval_LOCATION_recall": 0.8591549295774648, "eval_ORGANIZATION_f1": 0.757142857142857, "eval_ORGANIZATION_number": 65, "eval_ORGANIZATION_precision": 0.7066666666666667, "eval_ORGANIZATION_recall": 0.8153846153846154, "eval_PERSON_f1": 0.896774193548387, "eval_PERSON_number": 150, "eval_PERSON_precision": 0.86875, "eval_PERSON_recall": 0.9266666666666666, "eval_QUANTITY_f1": 0.8169014084507042, "eval_QUANTITY_number": 33, "eval_QUANTITY_precision": 0.7631578947368421, "eval_QUANTITY_recall": 0.8787878787878788, "eval_TIME_f1": 0.8571428571428571, "eval_TIME_number": 28, "eval_TIME_precision": 0.8571428571428571, "eval_TIME_recall": 0.8571428571428571, "eval_loss": 0.21939164400100708, "eval_overall_accuracy": 0.9636275460717749, "eval_overall_f1": 0.834924965893588, "eval_overall_precision": 0.7927461139896373, "eval_overall_recall": 0.8818443804034583, "eval_runtime": 1.0552, "eval_samples_per_second": 177.225, "eval_steps_per_second": 2.843, "step": 8162 }, { "epoch": 78.0, "grad_norm": 0.47026127576828003, "learning_rate": 1.1000000000000001e-05, "loss": 0.0126, "step": 8268 }, { "epoch": 78.0, "eval_LOCATION_f1": 0.7922077922077921, "eval_LOCATION_number": 71, "eval_LOCATION_precision": 0.7349397590361446, "eval_LOCATION_recall": 0.8591549295774648, "eval_ORGANIZATION_f1": 0.75, "eval_ORGANIZATION_number": 65, "eval_ORGANIZATION_precision": 0.6835443037974683, "eval_ORGANIZATION_recall": 0.8307692307692308, "eval_PERSON_f1": 0.896103896103896, "eval_PERSON_number": 150, "eval_PERSON_precision": 0.8734177215189873, "eval_PERSON_recall": 0.92, "eval_QUANTITY_f1": 0.7777777777777778, "eval_QUANTITY_number": 33, "eval_QUANTITY_precision": 0.717948717948718, "eval_QUANTITY_recall": 0.8484848484848485, "eval_TIME_f1": 0.8571428571428571, "eval_TIME_number": 28, "eval_TIME_precision": 0.8571428571428571, "eval_TIME_recall": 0.8571428571428571, "eval_loss": 0.22609065473079681, "eval_overall_accuracy": 0.9619301648884578, "eval_overall_f1": 0.8310626702997276, "eval_overall_precision": 0.7881136950904393, "eval_overall_recall": 0.8789625360230547, "eval_runtime": 1.052, "eval_samples_per_second": 177.752, "eval_steps_per_second": 2.852, "step": 8268 }, { "epoch": 79.0, "grad_norm": 0.9084616899490356, "learning_rate": 1.05e-05, "loss": 0.0125, "step": 8374 }, { "epoch": 79.0, "eval_LOCATION_f1": 0.7741935483870968, "eval_LOCATION_number": 71, "eval_LOCATION_precision": 0.7142857142857143, "eval_LOCATION_recall": 0.8450704225352113, "eval_ORGANIZATION_f1": 0.7586206896551724, "eval_ORGANIZATION_number": 65, "eval_ORGANIZATION_precision": 0.6875, "eval_ORGANIZATION_recall": 0.8461538461538461, "eval_PERSON_f1": 0.9061488673139159, "eval_PERSON_number": 150, "eval_PERSON_precision": 0.8805031446540881, "eval_PERSON_recall": 0.9333333333333333, "eval_QUANTITY_f1": 0.7397260273972603, "eval_QUANTITY_number": 33, "eval_QUANTITY_precision": 0.675, "eval_QUANTITY_recall": 0.8181818181818182, "eval_TIME_f1": 0.8421052631578947, "eval_TIME_number": 28, "eval_TIME_precision": 0.8275862068965517, "eval_TIME_recall": 0.8571428571428571, "eval_loss": 0.232786163687706, "eval_overall_accuracy": 0.9604752667313288, "eval_overall_f1": 0.8281461434370772, "eval_overall_precision": 0.7806122448979592, "eval_overall_recall": 0.8818443804034583, "eval_runtime": 1.0606, "eval_samples_per_second": 176.309, "eval_steps_per_second": 2.828, "step": 8374 }, { "epoch": 80.0, "grad_norm": 0.3104639947414398, "learning_rate": 1e-05, "loss": 0.0123, "step": 8480 }, { "epoch": 80.0, "eval_LOCATION_f1": 0.7741935483870968, "eval_LOCATION_number": 71, "eval_LOCATION_precision": 0.7142857142857143, "eval_LOCATION_recall": 0.8450704225352113, "eval_ORGANIZATION_f1": 0.7297297297297298, "eval_ORGANIZATION_number": 65, "eval_ORGANIZATION_precision": 0.6506024096385542, "eval_ORGANIZATION_recall": 0.8307692307692308, "eval_PERSON_f1": 0.9061488673139159, "eval_PERSON_number": 150, "eval_PERSON_precision": 0.8805031446540881, "eval_PERSON_recall": 0.9333333333333333, "eval_QUANTITY_f1": 0.7671232876712328, "eval_QUANTITY_number": 33, "eval_QUANTITY_precision": 0.7, "eval_QUANTITY_recall": 0.8484848484848485, "eval_TIME_f1": 0.8421052631578947, "eval_TIME_number": 28, "eval_TIME_precision": 0.8275862068965517, "eval_TIME_recall": 0.8571428571428571, "eval_loss": 0.23563723266124725, "eval_overall_accuracy": 0.9597478176527643, "eval_overall_f1": 0.8247978436657682, "eval_overall_precision": 0.7746835443037975, "eval_overall_recall": 0.8818443804034583, "eval_runtime": 1.0481, "eval_samples_per_second": 178.419, "eval_steps_per_second": 2.862, "step": 8480 }, { "epoch": 81.0, "grad_norm": 0.09613505750894547, "learning_rate": 9.5e-06, "loss": 0.0121, "step": 8586 }, { "epoch": 81.0, "eval_LOCATION_f1": 0.7973856209150327, "eval_LOCATION_number": 71, "eval_LOCATION_precision": 0.7439024390243902, "eval_LOCATION_recall": 0.8591549295774648, "eval_ORGANIZATION_f1": 0.7857142857142856, "eval_ORGANIZATION_number": 65, "eval_ORGANIZATION_precision": 0.7333333333333333, "eval_ORGANIZATION_recall": 0.8461538461538461, "eval_PERSON_f1": 0.8852459016393444, "eval_PERSON_number": 150, "eval_PERSON_precision": 0.8709677419354839, "eval_PERSON_recall": 0.9, "eval_QUANTITY_f1": 0.7777777777777778, "eval_QUANTITY_number": 33, "eval_QUANTITY_precision": 0.717948717948718, "eval_QUANTITY_recall": 0.8484848484848485, "eval_TIME_f1": 0.8421052631578947, "eval_TIME_number": 28, "eval_TIME_precision": 0.8275862068965517, "eval_TIME_recall": 0.8571428571428571, "eval_loss": 0.21699251234531403, "eval_overall_accuracy": 0.9633850630455868, "eval_overall_f1": 0.8335625859697388, "eval_overall_precision": 0.7973684210526316, "eval_overall_recall": 0.8731988472622478, "eval_runtime": 1.0455, "eval_samples_per_second": 178.863, "eval_steps_per_second": 2.869, "step": 8586 }, { "epoch": 82.0, "grad_norm": 1.2361814975738525, "learning_rate": 9e-06, "loss": 0.0124, "step": 8692 }, { "epoch": 82.0, "eval_LOCATION_f1": 0.7741935483870968, "eval_LOCATION_number": 71, "eval_LOCATION_precision": 0.7142857142857143, "eval_LOCATION_recall": 0.8450704225352113, "eval_ORGANIZATION_f1": 0.7397260273972603, "eval_ORGANIZATION_number": 65, "eval_ORGANIZATION_precision": 0.6666666666666666, "eval_ORGANIZATION_recall": 0.8307692307692308, "eval_PERSON_f1": 0.9032258064516129, "eval_PERSON_number": 150, "eval_PERSON_precision": 0.875, "eval_PERSON_recall": 0.9333333333333333, "eval_QUANTITY_f1": 0.7671232876712328, "eval_QUANTITY_number": 33, "eval_QUANTITY_precision": 0.7, "eval_QUANTITY_recall": 0.8484848484848485, "eval_TIME_f1": 0.8421052631578947, "eval_TIME_number": 28, "eval_TIME_precision": 0.8275862068965517, "eval_TIME_recall": 0.8571428571428571, "eval_loss": 0.23771944642066956, "eval_overall_accuracy": 0.9602327837051406, "eval_overall_f1": 0.8259109311740891, "eval_overall_precision": 0.7766497461928934, "eval_overall_recall": 0.8818443804034583, "eval_runtime": 1.0536, "eval_samples_per_second": 177.487, "eval_steps_per_second": 2.847, "step": 8692 }, { "epoch": 83.0, "grad_norm": 0.15847894549369812, "learning_rate": 8.500000000000002e-06, "loss": 0.0123, "step": 8798 }, { "epoch": 83.0, "eval_LOCATION_f1": 0.7792207792207793, "eval_LOCATION_number": 71, "eval_LOCATION_precision": 0.7228915662650602, "eval_LOCATION_recall": 0.8450704225352113, "eval_ORGANIZATION_f1": 0.7397260273972603, "eval_ORGANIZATION_number": 65, "eval_ORGANIZATION_precision": 0.6666666666666666, "eval_ORGANIZATION_recall": 0.8307692307692308, "eval_PERSON_f1": 0.9032258064516129, "eval_PERSON_number": 150, "eval_PERSON_precision": 0.875, "eval_PERSON_recall": 0.9333333333333333, "eval_QUANTITY_f1": 0.7671232876712328, "eval_QUANTITY_number": 33, "eval_QUANTITY_precision": 0.7, "eval_QUANTITY_recall": 0.8484848484848485, "eval_TIME_f1": 0.8421052631578947, "eval_TIME_number": 28, "eval_TIME_precision": 0.8275862068965517, "eval_TIME_recall": 0.8571428571428571, "eval_loss": 0.2313675880432129, "eval_overall_accuracy": 0.9609602327837051, "eval_overall_f1": 0.827027027027027, "eval_overall_precision": 0.7786259541984732, "eval_overall_recall": 0.8818443804034583, "eval_runtime": 1.0661, "eval_samples_per_second": 175.406, "eval_steps_per_second": 2.814, "step": 8798 }, { "epoch": 84.0, "grad_norm": 0.36980700492858887, "learning_rate": 8.000000000000001e-06, "loss": 0.0121, "step": 8904 }, { "epoch": 84.0, "eval_LOCATION_f1": 0.7922077922077921, "eval_LOCATION_number": 71, "eval_LOCATION_precision": 0.7349397590361446, "eval_LOCATION_recall": 0.8591549295774648, "eval_ORGANIZATION_f1": 0.7746478873239436, "eval_ORGANIZATION_number": 65, "eval_ORGANIZATION_precision": 0.7142857142857143, "eval_ORGANIZATION_recall": 0.8461538461538461, "eval_PERSON_f1": 0.9019607843137256, "eval_PERSON_number": 150, "eval_PERSON_precision": 0.8846153846153846, "eval_PERSON_recall": 0.92, "eval_QUANTITY_f1": 0.7945205479452054, "eval_QUANTITY_number": 33, "eval_QUANTITY_precision": 0.725, "eval_QUANTITY_recall": 0.8787878787878788, "eval_TIME_f1": 0.8421052631578947, "eval_TIME_number": 28, "eval_TIME_precision": 0.8275862068965517, "eval_TIME_recall": 0.8571428571428571, "eval_loss": 0.21659883856773376, "eval_overall_accuracy": 0.9636275460717749, "eval_overall_f1": 0.8387978142076504, "eval_overall_precision": 0.7974025974025974, "eval_overall_recall": 0.8847262247838616, "eval_runtime": 1.055, "eval_samples_per_second": 177.255, "eval_steps_per_second": 2.844, "step": 8904 }, { "epoch": 85.0, "grad_norm": 0.6816823482513428, "learning_rate": 7.5e-06, "loss": 0.0122, "step": 9010 }, { "epoch": 85.0, "eval_LOCATION_f1": 0.7741935483870968, "eval_LOCATION_number": 71, "eval_LOCATION_precision": 0.7142857142857143, "eval_LOCATION_recall": 0.8450704225352113, "eval_ORGANIZATION_f1": 0.7516778523489933, "eval_ORGANIZATION_number": 65, "eval_ORGANIZATION_precision": 0.6666666666666666, "eval_ORGANIZATION_recall": 0.8615384615384616, "eval_PERSON_f1": 0.9090909090909091, "eval_PERSON_number": 150, "eval_PERSON_precision": 0.8860759493670886, "eval_PERSON_recall": 0.9333333333333333, "eval_QUANTITY_f1": 0.7671232876712328, "eval_QUANTITY_number": 33, "eval_QUANTITY_precision": 0.7, "eval_QUANTITY_recall": 0.8484848484848485, "eval_TIME_f1": 0.8275862068965518, "eval_TIME_number": 28, "eval_TIME_precision": 0.8, "eval_TIME_recall": 0.8571428571428571, "eval_loss": 0.24010856449604034, "eval_overall_accuracy": 0.9599903006789525, "eval_overall_f1": 0.82907133243607, "eval_overall_precision": 0.7777777777777778, "eval_overall_recall": 0.8876080691642652, "eval_runtime": 1.0528, "eval_samples_per_second": 177.616, "eval_steps_per_second": 2.849, "step": 9010 }, { "epoch": 86.0, "grad_norm": 1.010087490081787, "learning_rate": 7.000000000000001e-06, "loss": 0.012, "step": 9116 }, { "epoch": 86.0, "eval_LOCATION_f1": 0.7922077922077921, "eval_LOCATION_number": 71, "eval_LOCATION_precision": 0.7349397590361446, "eval_LOCATION_recall": 0.8591549295774648, "eval_ORGANIZATION_f1": 0.7746478873239436, "eval_ORGANIZATION_number": 65, "eval_ORGANIZATION_precision": 0.7142857142857143, "eval_ORGANIZATION_recall": 0.8461538461538461, "eval_PERSON_f1": 0.894736842105263, "eval_PERSON_number": 150, "eval_PERSON_precision": 0.8831168831168831, "eval_PERSON_recall": 0.9066666666666666, "eval_QUANTITY_f1": 0.7777777777777778, "eval_QUANTITY_number": 33, "eval_QUANTITY_precision": 0.717948717948718, "eval_QUANTITY_recall": 0.8484848484848485, "eval_TIME_f1": 0.8421052631578947, "eval_TIME_number": 28, "eval_TIME_precision": 0.8275862068965517, "eval_TIME_recall": 0.8571428571428571, "eval_loss": 0.2242480218410492, "eval_overall_accuracy": 0.9616876818622696, "eval_overall_f1": 0.8340192043895748, "eval_overall_precision": 0.7958115183246073, "eval_overall_recall": 0.8760806916426513, "eval_runtime": 1.0597, "eval_samples_per_second": 176.469, "eval_steps_per_second": 2.831, "step": 9116 }, { "epoch": 87.0, "grad_norm": 0.7689788937568665, "learning_rate": 6.5000000000000004e-06, "loss": 0.0112, "step": 9222 }, { "epoch": 87.0, "eval_LOCATION_f1": 0.7792207792207793, "eval_LOCATION_number": 71, "eval_LOCATION_precision": 0.7228915662650602, "eval_LOCATION_recall": 0.8450704225352113, "eval_ORGANIZATION_f1": 0.7432432432432433, "eval_ORGANIZATION_number": 65, "eval_ORGANIZATION_precision": 0.6626506024096386, "eval_ORGANIZATION_recall": 0.8461538461538461, "eval_PERSON_f1": 0.8996763754045306, "eval_PERSON_number": 150, "eval_PERSON_precision": 0.8742138364779874, "eval_PERSON_recall": 0.9266666666666666, "eval_QUANTITY_f1": 0.7777777777777778, "eval_QUANTITY_number": 33, "eval_QUANTITY_precision": 0.717948717948718, "eval_QUANTITY_recall": 0.8484848484848485, "eval_TIME_f1": 0.8421052631578947, "eval_TIME_number": 28, "eval_TIME_precision": 0.8275862068965517, "eval_TIME_recall": 0.8571428571428571, "eval_loss": 0.2339707463979721, "eval_overall_accuracy": 0.9602327837051406, "eval_overall_f1": 0.827027027027027, "eval_overall_precision": 0.7786259541984732, "eval_overall_recall": 0.8818443804034583, "eval_runtime": 1.0569, "eval_samples_per_second": 176.936, "eval_steps_per_second": 2.839, "step": 9222 }, { "epoch": 88.0, "grad_norm": 0.36982235312461853, "learning_rate": 6e-06, "loss": 0.0109, "step": 9328 }, { "epoch": 88.0, "eval_LOCATION_f1": 0.7741935483870968, "eval_LOCATION_number": 71, "eval_LOCATION_precision": 0.7142857142857143, "eval_LOCATION_recall": 0.8450704225352113, "eval_ORGANIZATION_f1": 0.7412587412587412, "eval_ORGANIZATION_number": 65, "eval_ORGANIZATION_precision": 0.6794871794871795, "eval_ORGANIZATION_recall": 0.8153846153846154, "eval_PERSON_f1": 0.8925081433224756, "eval_PERSON_number": 150, "eval_PERSON_precision": 0.8726114649681529, "eval_PERSON_recall": 0.9133333333333333, "eval_QUANTITY_f1": 0.7671232876712328, "eval_QUANTITY_number": 33, "eval_QUANTITY_precision": 0.7, "eval_QUANTITY_recall": 0.8484848484848485, "eval_TIME_f1": 0.8421052631578947, "eval_TIME_number": 28, "eval_TIME_precision": 0.8275862068965517, "eval_TIME_recall": 0.8571428571428571, "eval_loss": 0.22819143533706665, "eval_overall_accuracy": 0.9602327837051406, "eval_overall_f1": 0.8217687074829931, "eval_overall_precision": 0.7783505154639175, "eval_overall_recall": 0.8703170028818443, "eval_runtime": 1.0643, "eval_samples_per_second": 175.699, "eval_steps_per_second": 2.819, "step": 9328 }, { "epoch": 89.0, "grad_norm": 0.2916944622993469, "learning_rate": 5.500000000000001e-06, "loss": 0.0105, "step": 9434 }, { "epoch": 89.0, "eval_LOCATION_f1": 0.7741935483870968, "eval_LOCATION_number": 71, "eval_LOCATION_precision": 0.7142857142857143, "eval_LOCATION_recall": 0.8450704225352113, "eval_ORGANIZATION_f1": 0.7464788732394366, "eval_ORGANIZATION_number": 65, "eval_ORGANIZATION_precision": 0.6883116883116883, "eval_ORGANIZATION_recall": 0.8153846153846154, "eval_PERSON_f1": 0.9090909090909091, "eval_PERSON_number": 150, "eval_PERSON_precision": 0.8860759493670886, "eval_PERSON_recall": 0.9333333333333333, "eval_QUANTITY_f1": 0.7671232876712328, "eval_QUANTITY_number": 33, "eval_QUANTITY_precision": 0.7, "eval_QUANTITY_recall": 0.8484848484848485, "eval_TIME_f1": 0.8275862068965518, "eval_TIME_number": 28, "eval_TIME_precision": 0.8, "eval_TIME_recall": 0.8571428571428571, "eval_loss": 0.2318750023841858, "eval_overall_accuracy": 0.9604752667313288, "eval_overall_f1": 0.8288043478260869, "eval_overall_precision": 0.7840616966580977, "eval_overall_recall": 0.8789625360230547, "eval_runtime": 1.0577, "eval_samples_per_second": 176.795, "eval_steps_per_second": 2.836, "step": 9434 }, { "epoch": 90.0, "grad_norm": 0.37730202078819275, "learning_rate": 5e-06, "loss": 0.0098, "step": 9540 }, { "epoch": 90.0, "eval_LOCATION_f1": 0.7741935483870968, "eval_LOCATION_number": 71, "eval_LOCATION_precision": 0.7142857142857143, "eval_LOCATION_recall": 0.8450704225352113, "eval_ORGANIZATION_f1": 0.7346938775510204, "eval_ORGANIZATION_number": 65, "eval_ORGANIZATION_precision": 0.6585365853658537, "eval_ORGANIZATION_recall": 0.8307692307692308, "eval_PERSON_f1": 0.8990228013029316, "eval_PERSON_number": 150, "eval_PERSON_precision": 0.8789808917197452, "eval_PERSON_recall": 0.92, "eval_QUANTITY_f1": 0.8055555555555556, "eval_QUANTITY_number": 33, "eval_QUANTITY_precision": 0.7435897435897436, "eval_QUANTITY_recall": 0.8787878787878788, "eval_TIME_f1": 0.8571428571428571, "eval_TIME_number": 28, "eval_TIME_precision": 0.8571428571428571, "eval_TIME_recall": 0.8571428571428571, "eval_loss": 0.23395000398159027, "eval_overall_accuracy": 0.960717749757517, "eval_overall_f1": 0.8276797829036635, "eval_overall_precision": 0.782051282051282, "eval_overall_recall": 0.8789625360230547, "eval_runtime": 1.0495, "eval_samples_per_second": 178.178, "eval_steps_per_second": 2.858, "step": 9540 }, { "epoch": 91.0, "grad_norm": 0.6458882689476013, "learning_rate": 4.5e-06, "loss": 0.0109, "step": 9646 }, { "epoch": 91.0, "eval_LOCATION_f1": 0.7843137254901961, "eval_LOCATION_number": 71, "eval_LOCATION_precision": 0.7317073170731707, "eval_LOCATION_recall": 0.8450704225352113, "eval_ORGANIZATION_f1": 0.7586206896551724, "eval_ORGANIZATION_number": 65, "eval_ORGANIZATION_precision": 0.6875, "eval_ORGANIZATION_recall": 0.8461538461538461, "eval_PERSON_f1": 0.9019607843137256, "eval_PERSON_number": 150, "eval_PERSON_precision": 0.8846153846153846, "eval_PERSON_recall": 0.92, "eval_QUANTITY_f1": 0.7671232876712328, "eval_QUANTITY_number": 33, "eval_QUANTITY_precision": 0.7, "eval_QUANTITY_recall": 0.8484848484848485, "eval_TIME_f1": 0.8421052631578947, "eval_TIME_number": 28, "eval_TIME_precision": 0.8275862068965517, "eval_TIME_recall": 0.8571428571428571, "eval_loss": 0.22991229593753815, "eval_overall_accuracy": 0.9612027158098934, "eval_overall_f1": 0.8310626702997276, "eval_overall_precision": 0.7881136950904393, "eval_overall_recall": 0.8789625360230547, "eval_runtime": 1.0583, "eval_samples_per_second": 176.704, "eval_steps_per_second": 2.835, "step": 9646 }, { "epoch": 92.0, "grad_norm": 0.31122303009033203, "learning_rate": 4.000000000000001e-06, "loss": 0.0114, "step": 9752 }, { "epoch": 92.0, "eval_LOCATION_f1": 0.7792207792207793, "eval_LOCATION_number": 71, "eval_LOCATION_precision": 0.7228915662650602, "eval_LOCATION_recall": 0.8450704225352113, "eval_ORGANIZATION_f1": 0.7412587412587412, "eval_ORGANIZATION_number": 65, "eval_ORGANIZATION_precision": 0.6794871794871795, "eval_ORGANIZATION_recall": 0.8153846153846154, "eval_PERSON_f1": 0.8925081433224756, "eval_PERSON_number": 150, "eval_PERSON_precision": 0.8726114649681529, "eval_PERSON_recall": 0.9133333333333333, "eval_QUANTITY_f1": 0.7397260273972603, "eval_QUANTITY_number": 33, "eval_QUANTITY_precision": 0.675, "eval_QUANTITY_recall": 0.8181818181818182, "eval_TIME_f1": 0.8275862068965518, "eval_TIME_number": 28, "eval_TIME_precision": 0.8, "eval_TIME_recall": 0.8571428571428571, "eval_loss": 0.23025508224964142, "eval_overall_accuracy": 0.9597478176527643, "eval_overall_f1": 0.8190476190476191, "eval_overall_precision": 0.7757731958762887, "eval_overall_recall": 0.8674351585014409, "eval_runtime": 1.046, "eval_samples_per_second": 178.77, "eval_steps_per_second": 2.868, "step": 9752 }, { "epoch": 93.0, "grad_norm": 1.2301055192947388, "learning_rate": 3.5000000000000004e-06, "loss": 0.0104, "step": 9858 }, { "epoch": 93.0, "eval_LOCATION_f1": 0.7792207792207793, "eval_LOCATION_number": 71, "eval_LOCATION_precision": 0.7228915662650602, "eval_LOCATION_recall": 0.8450704225352113, "eval_ORGANIZATION_f1": 0.7346938775510204, "eval_ORGANIZATION_number": 65, "eval_ORGANIZATION_precision": 0.6585365853658537, "eval_ORGANIZATION_recall": 0.8307692307692308, "eval_PERSON_f1": 0.896103896103896, "eval_PERSON_number": 150, "eval_PERSON_precision": 0.8734177215189873, "eval_PERSON_recall": 0.92, "eval_QUANTITY_f1": 0.7397260273972603, "eval_QUANTITY_number": 33, "eval_QUANTITY_precision": 0.675, "eval_QUANTITY_recall": 0.8181818181818182, "eval_TIME_f1": 0.8275862068965518, "eval_TIME_number": 28, "eval_TIME_precision": 0.8, "eval_TIME_recall": 0.8571428571428571, "eval_loss": 0.23245875537395477, "eval_overall_accuracy": 0.9599903006789525, "eval_overall_f1": 0.8189189189189189, "eval_overall_precision": 0.7709923664122137, "eval_overall_recall": 0.8731988472622478, "eval_runtime": 1.0547, "eval_samples_per_second": 177.306, "eval_steps_per_second": 2.844, "step": 9858 }, { "epoch": 94.0, "grad_norm": 1.0476171970367432, "learning_rate": 3e-06, "loss": 0.0099, "step": 9964 }, { "epoch": 94.0, "eval_LOCATION_f1": 0.7741935483870968, "eval_LOCATION_number": 71, "eval_LOCATION_precision": 0.7142857142857143, "eval_LOCATION_recall": 0.8450704225352113, "eval_ORGANIZATION_f1": 0.7412587412587412, "eval_ORGANIZATION_number": 65, "eval_ORGANIZATION_precision": 0.6794871794871795, "eval_ORGANIZATION_recall": 0.8153846153846154, "eval_PERSON_f1": 0.8925081433224756, "eval_PERSON_number": 150, "eval_PERSON_precision": 0.8726114649681529, "eval_PERSON_recall": 0.9133333333333333, "eval_QUANTITY_f1": 0.7397260273972603, "eval_QUANTITY_number": 33, "eval_QUANTITY_precision": 0.675, "eval_QUANTITY_recall": 0.8181818181818182, "eval_TIME_f1": 0.8275862068965518, "eval_TIME_number": 28, "eval_TIME_precision": 0.8, "eval_TIME_recall": 0.8571428571428571, "eval_loss": 0.23353543877601624, "eval_overall_accuracy": 0.9595053346265762, "eval_overall_f1": 0.8179347826086958, "eval_overall_precision": 0.7737789203084833, "eval_overall_recall": 0.8674351585014409, "eval_runtime": 1.0587, "eval_samples_per_second": 176.634, "eval_steps_per_second": 2.834, "step": 9964 }, { "epoch": 95.0, "grad_norm": 0.6297835111618042, "learning_rate": 2.5e-06, "loss": 0.0115, "step": 10070 }, { "epoch": 95.0, "eval_LOCATION_f1": 0.7741935483870968, "eval_LOCATION_number": 71, "eval_LOCATION_precision": 0.7142857142857143, "eval_LOCATION_recall": 0.8450704225352113, "eval_ORGANIZATION_f1": 0.7310344827586207, "eval_ORGANIZATION_number": 65, "eval_ORGANIZATION_precision": 0.6625, "eval_ORGANIZATION_recall": 0.8153846153846154, "eval_PERSON_f1": 0.896103896103896, "eval_PERSON_number": 150, "eval_PERSON_precision": 0.8734177215189873, "eval_PERSON_recall": 0.92, "eval_QUANTITY_f1": 0.7397260273972603, "eval_QUANTITY_number": 33, "eval_QUANTITY_precision": 0.675, "eval_QUANTITY_recall": 0.8181818181818182, "eval_TIME_f1": 0.8275862068965518, "eval_TIME_number": 28, "eval_TIME_precision": 0.8, "eval_TIME_recall": 0.8571428571428571, "eval_loss": 0.24176815152168274, "eval_overall_accuracy": 0.9592628516003879, "eval_overall_f1": 0.8173207036535859, "eval_overall_precision": 0.7704081632653061, "eval_overall_recall": 0.8703170028818443, "eval_runtime": 1.0575, "eval_samples_per_second": 176.827, "eval_steps_per_second": 2.837, "step": 10070 }, { "epoch": 96.0, "grad_norm": 0.7284921407699585, "learning_rate": 2.0000000000000003e-06, "loss": 0.009, "step": 10176 }, { "epoch": 96.0, "eval_LOCATION_f1": 0.7792207792207793, "eval_LOCATION_number": 71, "eval_LOCATION_precision": 0.7228915662650602, "eval_LOCATION_recall": 0.8450704225352113, "eval_ORGANIZATION_f1": 0.7361111111111112, "eval_ORGANIZATION_number": 65, "eval_ORGANIZATION_precision": 0.6708860759493671, "eval_ORGANIZATION_recall": 0.8153846153846154, "eval_PERSON_f1": 0.8925081433224756, "eval_PERSON_number": 150, "eval_PERSON_precision": 0.8726114649681529, "eval_PERSON_recall": 0.9133333333333333, "eval_QUANTITY_f1": 0.7397260273972603, "eval_QUANTITY_number": 33, "eval_QUANTITY_precision": 0.675, "eval_QUANTITY_recall": 0.8181818181818182, "eval_TIME_f1": 0.8275862068965518, "eval_TIME_number": 28, "eval_TIME_precision": 0.8, "eval_TIME_recall": 0.8571428571428571, "eval_loss": 0.23633427917957306, "eval_overall_accuracy": 0.9592628516003879, "eval_overall_f1": 0.8179347826086958, "eval_overall_precision": 0.7737789203084833, "eval_overall_recall": 0.8674351585014409, "eval_runtime": 1.0622, "eval_samples_per_second": 176.042, "eval_steps_per_second": 2.824, "step": 10176 }, { "epoch": 97.0, "grad_norm": 0.8745085000991821, "learning_rate": 1.5e-06, "loss": 0.0104, "step": 10282 }, { "epoch": 97.0, "eval_LOCATION_f1": 0.7741935483870968, "eval_LOCATION_number": 71, "eval_LOCATION_precision": 0.7142857142857143, "eval_LOCATION_recall": 0.8450704225352113, "eval_ORGANIZATION_f1": 0.7346938775510204, "eval_ORGANIZATION_number": 65, "eval_ORGANIZATION_precision": 0.6585365853658537, "eval_ORGANIZATION_recall": 0.8307692307692308, "eval_PERSON_f1": 0.8996763754045306, "eval_PERSON_number": 150, "eval_PERSON_precision": 0.8742138364779874, "eval_PERSON_recall": 0.9266666666666666, "eval_QUANTITY_f1": 0.7397260273972603, "eval_QUANTITY_number": 33, "eval_QUANTITY_precision": 0.675, "eval_QUANTITY_recall": 0.8181818181818182, "eval_TIME_f1": 0.8275862068965518, "eval_TIME_number": 28, "eval_TIME_precision": 0.8, "eval_TIME_recall": 0.8571428571428571, "eval_loss": 0.2431822121143341, "eval_overall_accuracy": 0.9597478176527643, "eval_overall_f1": 0.8194070080862534, "eval_overall_precision": 0.769620253164557, "eval_overall_recall": 0.8760806916426513, "eval_runtime": 1.0389, "eval_samples_per_second": 180.0, "eval_steps_per_second": 2.888, "step": 10282 }, { "epoch": 98.0, "grad_norm": 0.7874897122383118, "learning_rate": 1.0000000000000002e-06, "loss": 0.0104, "step": 10388 }, { "epoch": 98.0, "eval_LOCATION_f1": 0.7792207792207793, "eval_LOCATION_number": 71, "eval_LOCATION_precision": 0.7228915662650602, "eval_LOCATION_recall": 0.8450704225352113, "eval_ORGANIZATION_f1": 0.7361111111111112, "eval_ORGANIZATION_number": 65, "eval_ORGANIZATION_precision": 0.6708860759493671, "eval_ORGANIZATION_recall": 0.8153846153846154, "eval_PERSON_f1": 0.8925081433224756, "eval_PERSON_number": 150, "eval_PERSON_precision": 0.8726114649681529, "eval_PERSON_recall": 0.9133333333333333, "eval_QUANTITY_f1": 0.7397260273972603, "eval_QUANTITY_number": 33, "eval_QUANTITY_precision": 0.675, "eval_QUANTITY_recall": 0.8181818181818182, "eval_TIME_f1": 0.8275862068965518, "eval_TIME_number": 28, "eval_TIME_precision": 0.8, "eval_TIME_recall": 0.8571428571428571, "eval_loss": 0.2386394888162613, "eval_overall_accuracy": 0.9590203685741998, "eval_overall_f1": 0.8179347826086958, "eval_overall_precision": 0.7737789203084833, "eval_overall_recall": 0.8674351585014409, "eval_runtime": 1.0472, "eval_samples_per_second": 178.565, "eval_steps_per_second": 2.865, "step": 10388 }, { "epoch": 99.0, "grad_norm": 0.21786460280418396, "learning_rate": 5.000000000000001e-07, "loss": 0.0106, "step": 10494 }, { "epoch": 99.0, "eval_LOCATION_f1": 0.7792207792207793, "eval_LOCATION_number": 71, "eval_LOCATION_precision": 0.7228915662650602, "eval_LOCATION_recall": 0.8450704225352113, "eval_ORGANIZATION_f1": 0.7397260273972603, "eval_ORGANIZATION_number": 65, "eval_ORGANIZATION_precision": 0.6666666666666666, "eval_ORGANIZATION_recall": 0.8307692307692308, "eval_PERSON_f1": 0.896103896103896, "eval_PERSON_number": 150, "eval_PERSON_precision": 0.8734177215189873, "eval_PERSON_recall": 0.92, "eval_QUANTITY_f1": 0.7397260273972603, "eval_QUANTITY_number": 33, "eval_QUANTITY_precision": 0.675, "eval_QUANTITY_recall": 0.8181818181818182, "eval_TIME_f1": 0.8275862068965518, "eval_TIME_number": 28, "eval_TIME_precision": 0.8, "eval_TIME_recall": 0.8571428571428571, "eval_loss": 0.24056798219680786, "eval_overall_accuracy": 0.9597478176527643, "eval_overall_f1": 0.8200270635994588, "eval_overall_precision": 0.7729591836734694, "eval_overall_recall": 0.8731988472622478, "eval_runtime": 1.0478, "eval_samples_per_second": 178.469, "eval_steps_per_second": 2.863, "step": 10494 }, { "epoch": 100.0, "grad_norm": 0.5074381828308105, "learning_rate": 0.0, "loss": 0.0093, "step": 10600 }, { "epoch": 100.0, "eval_LOCATION_f1": 0.7741935483870968, "eval_LOCATION_number": 71, "eval_LOCATION_precision": 0.7142857142857143, "eval_LOCATION_recall": 0.8450704225352113, "eval_ORGANIZATION_f1": 0.7397260273972603, "eval_ORGANIZATION_number": 65, "eval_ORGANIZATION_precision": 0.6666666666666666, "eval_ORGANIZATION_recall": 0.8307692307692308, "eval_PERSON_f1": 0.8925081433224756, "eval_PERSON_number": 150, "eval_PERSON_precision": 0.8726114649681529, "eval_PERSON_recall": 0.9133333333333333, "eval_QUANTITY_f1": 0.7397260273972603, "eval_QUANTITY_number": 33, "eval_QUANTITY_precision": 0.675, "eval_QUANTITY_recall": 0.8181818181818182, "eval_TIME_f1": 0.8275862068965518, "eval_TIME_number": 28, "eval_TIME_precision": 0.8, "eval_TIME_recall": 0.8571428571428571, "eval_loss": 0.24040785431861877, "eval_overall_accuracy": 0.9592628516003879, "eval_overall_f1": 0.8173207036535859, "eval_overall_precision": 0.7704081632653061, "eval_overall_recall": 0.8703170028818443, "eval_runtime": 1.05, "eval_samples_per_second": 178.101, "eval_steps_per_second": 2.857, "step": 10600 }, { "epoch": 100.0, "step": 10600, "total_flos": 5189413292285520.0, "train_loss": 0.05698325344414081, "train_runtime": 1582.8095, "train_samples_per_second": 106.646, "train_steps_per_second": 6.697 } ], "logging_steps": 500, "max_steps": 10600, "num_input_tokens_seen": 0, "num_train_epochs": 100, "save_steps": 500, "total_flos": 5189413292285520.0, "train_batch_size": 16, "trial_name": null, "trial_params": null }