{ "best_metric": null, "best_model_checkpoint": null, "epoch": 100.0, "eval_steps": 500, "global_step": 10600, "is_hyper_param_search": false, "is_local_process_zero": true, "is_world_process_zero": true, "log_history": [ { "epoch": 1.0, "grad_norm": 0.9845661520957947, "learning_rate": 4.9500000000000004e-05, "loss": 0.9292, "step": 106 }, { "epoch": 1.0, "eval_LOCATION_f1": 0.0, "eval_LOCATION_number": 69, "eval_LOCATION_precision": 0.0, "eval_LOCATION_recall": 0.0, "eval_ORGANIZATION_f1": 0.0, "eval_ORGANIZATION_number": 58, "eval_ORGANIZATION_precision": 0.0, "eval_ORGANIZATION_recall": 0.0, "eval_PERSON_f1": 0.012903225806451613, "eval_PERSON_number": 152, "eval_PERSON_precision": 0.3333333333333333, "eval_PERSON_recall": 0.006578947368421052, "eval_QUANTITY_f1": 0.0, "eval_QUANTITY_number": 30, "eval_QUANTITY_precision": 0.0, "eval_QUANTITY_recall": 0.0, "eval_TIME_f1": 0.0, "eval_TIME_number": 29, "eval_TIME_precision": 0.0, "eval_TIME_recall": 0.0, "eval_loss": 0.6127339601516724, "eval_overall_accuracy": 0.8399487836107554, "eval_overall_f1": 0.005865102639296187, "eval_overall_precision": 0.3333333333333333, "eval_overall_recall": 0.0029585798816568047, "eval_runtime": 0.7389, "eval_samples_per_second": 253.078, "eval_steps_per_second": 4.06, "step": 106 }, { "epoch": 2.0, "grad_norm": 1.0367096662521362, "learning_rate": 4.9e-05, "loss": 0.5076, "step": 212 }, { "epoch": 2.0, "eval_LOCATION_f1": 0.3577235772357724, "eval_LOCATION_number": 69, "eval_LOCATION_precision": 0.4074074074074074, "eval_LOCATION_recall": 0.3188405797101449, "eval_ORGANIZATION_f1": 0.11235955056179776, "eval_ORGANIZATION_number": 58, "eval_ORGANIZATION_precision": 0.16129032258064516, "eval_ORGANIZATION_recall": 0.08620689655172414, "eval_PERSON_f1": 0.6703601108033241, "eval_PERSON_number": 152, "eval_PERSON_precision": 0.5789473684210527, "eval_PERSON_recall": 0.7960526315789473, "eval_QUANTITY_f1": 0.0, "eval_QUANTITY_number": 30, "eval_QUANTITY_precision": 0.0, "eval_QUANTITY_recall": 0.0, "eval_TIME_f1": 0.4918032786885246, "eval_TIME_number": 29, "eval_TIME_precision": 0.46875, "eval_TIME_recall": 0.5172413793103449, "eval_loss": 0.33459725975990295, "eval_overall_accuracy": 0.9044814340588988, "eval_overall_f1": 0.48082595870206496, "eval_overall_precision": 0.47941176470588237, "eval_overall_recall": 0.4822485207100592, "eval_runtime": 0.7528, "eval_samples_per_second": 248.397, "eval_steps_per_second": 3.985, "step": 212 }, { "epoch": 3.0, "grad_norm": 1.3818385601043701, "learning_rate": 4.85e-05, "loss": 0.2907, "step": 318 }, { "epoch": 3.0, "eval_LOCATION_f1": 0.6705882352941176, "eval_LOCATION_number": 69, "eval_LOCATION_precision": 0.5643564356435643, "eval_LOCATION_recall": 0.8260869565217391, "eval_ORGANIZATION_f1": 0.39682539682539686, "eval_ORGANIZATION_number": 58, "eval_ORGANIZATION_precision": 0.36764705882352944, "eval_ORGANIZATION_recall": 0.43103448275862066, "eval_PERSON_f1": 0.8085106382978723, "eval_PERSON_number": 152, "eval_PERSON_precision": 0.751412429378531, "eval_PERSON_recall": 0.875, "eval_QUANTITY_f1": 0.605263157894737, "eval_QUANTITY_number": 30, "eval_QUANTITY_precision": 0.5, "eval_QUANTITY_recall": 0.7666666666666667, "eval_TIME_f1": 0.7999999999999999, "eval_TIME_number": 29, "eval_TIME_precision": 0.7741935483870968, "eval_TIME_recall": 0.8275862068965517, "eval_loss": 0.1991610825061798, "eval_overall_accuracy": 0.9323943661971831, "eval_overall_f1": 0.6885676741130091, "eval_overall_precision": 0.6193853427895981, "eval_overall_recall": 0.7751479289940828, "eval_runtime": 0.7451, "eval_samples_per_second": 250.989, "eval_steps_per_second": 4.027, "step": 318 }, { "epoch": 4.0, "grad_norm": 2.382436513900757, "learning_rate": 4.8e-05, "loss": 0.1931, "step": 424 }, { "epoch": 4.0, "eval_LOCATION_f1": 0.7875, "eval_LOCATION_number": 69, "eval_LOCATION_precision": 0.6923076923076923, "eval_LOCATION_recall": 0.9130434782608695, "eval_ORGANIZATION_f1": 0.6323529411764706, "eval_ORGANIZATION_number": 58, "eval_ORGANIZATION_precision": 0.5512820512820513, "eval_ORGANIZATION_recall": 0.7413793103448276, "eval_PERSON_f1": 0.7896253602305474, "eval_PERSON_number": 152, "eval_PERSON_precision": 0.7025641025641025, "eval_PERSON_recall": 0.9013157894736842, "eval_QUANTITY_f1": 0.6410256410256411, "eval_QUANTITY_number": 30, "eval_QUANTITY_precision": 0.5208333333333334, "eval_QUANTITY_recall": 0.8333333333333334, "eval_TIME_f1": 0.6133333333333334, "eval_TIME_number": 29, "eval_TIME_precision": 0.5, "eval_TIME_recall": 0.7931034482758621, "eval_loss": 0.190628781914711, "eval_overall_accuracy": 0.9352112676056338, "eval_overall_f1": 0.7311557788944725, "eval_overall_precision": 0.6353711790393013, "eval_overall_recall": 0.8609467455621301, "eval_runtime": 0.7563, "eval_samples_per_second": 247.259, "eval_steps_per_second": 3.967, "step": 424 }, { "epoch": 5.0, "grad_norm": 1.9061810970306396, "learning_rate": 4.75e-05, "loss": 0.1671, "step": 530 }, { "epoch": 5.0, "eval_LOCATION_f1": 0.7832167832167832, "eval_LOCATION_number": 69, "eval_LOCATION_precision": 0.7567567567567568, "eval_LOCATION_recall": 0.8115942028985508, "eval_ORGANIZATION_f1": 0.6714285714285714, "eval_ORGANIZATION_number": 58, "eval_ORGANIZATION_precision": 0.573170731707317, "eval_ORGANIZATION_recall": 0.8103448275862069, "eval_PERSON_f1": 0.8535825545171339, "eval_PERSON_number": 152, "eval_PERSON_precision": 0.8106508875739645, "eval_PERSON_recall": 0.9013157894736842, "eval_QUANTITY_f1": 0.7826086956521738, "eval_QUANTITY_number": 30, "eval_QUANTITY_precision": 0.6923076923076923, "eval_QUANTITY_recall": 0.9, "eval_TIME_f1": 0.847457627118644, "eval_TIME_number": 29, "eval_TIME_precision": 0.8333333333333334, "eval_TIME_recall": 0.8620689655172413, "eval_loss": 0.13657993078231812, "eval_overall_accuracy": 0.953393085787452, "eval_overall_f1": 0.7978142076502731, "eval_overall_precision": 0.7411167512690355, "eval_overall_recall": 0.863905325443787, "eval_runtime": 0.768, "eval_samples_per_second": 243.498, "eval_steps_per_second": 3.906, "step": 530 }, { "epoch": 6.0, "grad_norm": 1.6724838018417358, "learning_rate": 4.7e-05, "loss": 0.1438, "step": 636 }, { "epoch": 6.0, "eval_LOCATION_f1": 0.7564102564102564, "eval_LOCATION_number": 69, "eval_LOCATION_precision": 0.6781609195402298, "eval_LOCATION_recall": 0.855072463768116, "eval_ORGANIZATION_f1": 0.6231884057971016, "eval_ORGANIZATION_number": 58, "eval_ORGANIZATION_precision": 0.5375, "eval_ORGANIZATION_recall": 0.7413793103448276, "eval_PERSON_f1": 0.8430769230769231, "eval_PERSON_number": 152, "eval_PERSON_precision": 0.791907514450867, "eval_PERSON_recall": 0.9013157894736842, "eval_QUANTITY_f1": 0.7246376811594204, "eval_QUANTITY_number": 30, "eval_QUANTITY_precision": 0.6410256410256411, "eval_QUANTITY_recall": 0.8333333333333334, "eval_TIME_f1": 0.71875, "eval_TIME_number": 29, "eval_TIME_precision": 0.6571428571428571, "eval_TIME_recall": 0.7931034482758621, "eval_loss": 0.13694226741790771, "eval_overall_accuracy": 0.9528809218950064, "eval_overall_f1": 0.7632978723404256, "eval_overall_precision": 0.6932367149758454, "eval_overall_recall": 0.849112426035503, "eval_runtime": 0.846, "eval_samples_per_second": 221.028, "eval_steps_per_second": 3.546, "step": 636 }, { "epoch": 7.0, "grad_norm": 0.49843528866767883, "learning_rate": 4.6500000000000005e-05, "loss": 0.1337, "step": 742 }, { "epoch": 7.0, "eval_LOCATION_f1": 0.7712418300653594, "eval_LOCATION_number": 69, "eval_LOCATION_precision": 0.7023809523809523, "eval_LOCATION_recall": 0.855072463768116, "eval_ORGANIZATION_f1": 0.6557377049180328, "eval_ORGANIZATION_number": 58, "eval_ORGANIZATION_precision": 0.625, "eval_ORGANIZATION_recall": 0.6896551724137931, "eval_PERSON_f1": 0.8679245283018868, "eval_PERSON_number": 152, "eval_PERSON_precision": 0.8313253012048193, "eval_PERSON_recall": 0.9078947368421053, "eval_QUANTITY_f1": 0.7352941176470588, "eval_QUANTITY_number": 30, "eval_QUANTITY_precision": 0.6578947368421053, "eval_QUANTITY_recall": 0.8333333333333334, "eval_TIME_f1": 0.8333333333333334, "eval_TIME_number": 29, "eval_TIME_precision": 0.8064516129032258, "eval_TIME_recall": 0.8620689655172413, "eval_loss": 0.12538817524909973, "eval_overall_accuracy": 0.9585147247119078, "eval_overall_f1": 0.796116504854369, "eval_overall_precision": 0.7493472584856397, "eval_overall_recall": 0.849112426035503, "eval_runtime": 0.8252, "eval_samples_per_second": 226.607, "eval_steps_per_second": 3.635, "step": 742 }, { "epoch": 8.0, "grad_norm": 0.4025654196739197, "learning_rate": 4.600000000000001e-05, "loss": 0.1244, "step": 848 }, { "epoch": 8.0, "eval_LOCATION_f1": 0.8275862068965517, "eval_LOCATION_number": 69, "eval_LOCATION_precision": 0.7894736842105263, "eval_LOCATION_recall": 0.8695652173913043, "eval_ORGANIZATION_f1": 0.6825396825396826, "eval_ORGANIZATION_number": 58, "eval_ORGANIZATION_precision": 0.6323529411764706, "eval_ORGANIZATION_recall": 0.7413793103448276, "eval_PERSON_f1": 0.8769716088328074, "eval_PERSON_number": 152, "eval_PERSON_precision": 0.8424242424242424, "eval_PERSON_recall": 0.9144736842105263, "eval_QUANTITY_f1": 0.6875, "eval_QUANTITY_number": 30, "eval_QUANTITY_precision": 0.6470588235294118, "eval_QUANTITY_recall": 0.7333333333333333, "eval_TIME_f1": 0.7540983606557378, "eval_TIME_number": 29, "eval_TIME_precision": 0.71875, "eval_TIME_recall": 0.7931034482758621, "eval_loss": 0.12903648614883423, "eval_overall_accuracy": 0.9572343149807938, "eval_overall_f1": 0.8050490883590464, "eval_overall_precision": 0.7653333333333333, "eval_overall_recall": 0.849112426035503, "eval_runtime": 0.8305, "eval_samples_per_second": 225.153, "eval_steps_per_second": 3.612, "step": 848 }, { "epoch": 9.0, "grad_norm": 1.2503007650375366, "learning_rate": 4.55e-05, "loss": 0.1195, "step": 954 }, { "epoch": 9.0, "eval_LOCATION_f1": 0.8243243243243245, "eval_LOCATION_number": 69, "eval_LOCATION_precision": 0.7721518987341772, "eval_LOCATION_recall": 0.8840579710144928, "eval_ORGANIZATION_f1": 0.6875, "eval_ORGANIZATION_number": 58, "eval_ORGANIZATION_precision": 0.6285714285714286, "eval_ORGANIZATION_recall": 0.7586206896551724, "eval_PERSON_f1": 0.8598130841121495, "eval_PERSON_number": 152, "eval_PERSON_precision": 0.8165680473372781, "eval_PERSON_recall": 0.9078947368421053, "eval_QUANTITY_f1": 0.7692307692307692, "eval_QUANTITY_number": 30, "eval_QUANTITY_precision": 0.7142857142857143, "eval_QUANTITY_recall": 0.8333333333333334, "eval_TIME_f1": 0.8064516129032258, "eval_TIME_number": 29, "eval_TIME_precision": 0.7575757575757576, "eval_TIME_recall": 0.8620689655172413, "eval_loss": 0.12411422282457352, "eval_overall_accuracy": 0.9592829705505762, "eval_overall_f1": 0.8093922651933702, "eval_overall_precision": 0.7590673575129534, "eval_overall_recall": 0.8668639053254438, "eval_runtime": 0.8548, "eval_samples_per_second": 218.761, "eval_steps_per_second": 3.51, "step": 954 }, { "epoch": 10.0, "grad_norm": 1.5948196649551392, "learning_rate": 4.5e-05, "loss": 0.1083, "step": 1060 }, { "epoch": 10.0, "eval_LOCATION_f1": 0.7973856209150327, "eval_LOCATION_number": 69, "eval_LOCATION_precision": 0.7261904761904762, "eval_LOCATION_recall": 0.8840579710144928, "eval_ORGANIZATION_f1": 0.6875, "eval_ORGANIZATION_number": 58, "eval_ORGANIZATION_precision": 0.6285714285714286, "eval_ORGANIZATION_recall": 0.7586206896551724, "eval_PERSON_f1": 0.8761904761904762, "eval_PERSON_number": 152, "eval_PERSON_precision": 0.8466257668711656, "eval_PERSON_recall": 0.9078947368421053, "eval_QUANTITY_f1": 0.7575757575757577, "eval_QUANTITY_number": 30, "eval_QUANTITY_precision": 0.6944444444444444, "eval_QUANTITY_recall": 0.8333333333333334, "eval_TIME_f1": 0.8135593220338982, "eval_TIME_number": 29, "eval_TIME_precision": 0.8, "eval_TIME_recall": 0.8275862068965517, "eval_loss": 0.12625408172607422, "eval_overall_accuracy": 0.9592829705505762, "eval_overall_f1": 0.8099861303744799, "eval_overall_precision": 0.762402088772846, "eval_overall_recall": 0.863905325443787, "eval_runtime": 0.9354, "eval_samples_per_second": 199.908, "eval_steps_per_second": 3.207, "step": 1060 }, { "epoch": 11.0, "grad_norm": 0.7792600393295288, "learning_rate": 4.4500000000000004e-05, "loss": 0.1025, "step": 1166 }, { "epoch": 11.0, "eval_LOCATION_f1": 0.8258064516129032, "eval_LOCATION_number": 69, "eval_LOCATION_precision": 0.7441860465116279, "eval_LOCATION_recall": 0.927536231884058, "eval_ORGANIZATION_f1": 0.7040000000000001, "eval_ORGANIZATION_number": 58, "eval_ORGANIZATION_precision": 0.6567164179104478, "eval_ORGANIZATION_recall": 0.7586206896551724, "eval_PERSON_f1": 0.8853503184713376, "eval_PERSON_number": 152, "eval_PERSON_precision": 0.8580246913580247, "eval_PERSON_recall": 0.9144736842105263, "eval_QUANTITY_f1": 0.64, "eval_QUANTITY_number": 30, "eval_QUANTITY_precision": 0.5333333333333333, "eval_QUANTITY_recall": 0.8, "eval_TIME_f1": 0.7741935483870968, "eval_TIME_number": 29, "eval_TIME_precision": 0.7272727272727273, "eval_TIME_recall": 0.8275862068965517, "eval_loss": 0.14459605515003204, "eval_overall_accuracy": 0.9551856594110115, "eval_overall_f1": 0.8071135430916553, "eval_overall_precision": 0.7506361323155216, "eval_overall_recall": 0.8727810650887574, "eval_runtime": 0.9057, "eval_samples_per_second": 206.46, "eval_steps_per_second": 3.312, "step": 1166 }, { "epoch": 12.0, "grad_norm": 1.0304011106491089, "learning_rate": 4.4000000000000006e-05, "loss": 0.0969, "step": 1272 }, { "epoch": 12.0, "eval_LOCATION_f1": 0.7973856209150327, "eval_LOCATION_number": 69, "eval_LOCATION_precision": 0.7261904761904762, "eval_LOCATION_recall": 0.8840579710144928, "eval_ORGANIZATION_f1": 0.6991869918699186, "eval_ORGANIZATION_number": 58, "eval_ORGANIZATION_precision": 0.6615384615384615, "eval_ORGANIZATION_recall": 0.7413793103448276, "eval_PERSON_f1": 0.8789808917197451, "eval_PERSON_number": 152, "eval_PERSON_precision": 0.8518518518518519, "eval_PERSON_recall": 0.9078947368421053, "eval_QUANTITY_f1": 0.7384615384615385, "eval_QUANTITY_number": 30, "eval_QUANTITY_precision": 0.6857142857142857, "eval_QUANTITY_recall": 0.8, "eval_TIME_f1": 0.7999999999999999, "eval_TIME_number": 29, "eval_TIME_precision": 0.7741935483870968, "eval_TIME_recall": 0.8275862068965517, "eval_loss": 0.1326281726360321, "eval_overall_accuracy": 0.9595390524967989, "eval_overall_f1": 0.8111888111888113, "eval_overall_precision": 0.7692307692307693, "eval_overall_recall": 0.8579881656804734, "eval_runtime": 0.875, "eval_samples_per_second": 213.704, "eval_steps_per_second": 3.428, "step": 1272 }, { "epoch": 13.0, "grad_norm": 0.34425103664398193, "learning_rate": 4.35e-05, "loss": 0.0885, "step": 1378 }, { "epoch": 13.0, "eval_LOCATION_f1": 0.821917808219178, "eval_LOCATION_number": 69, "eval_LOCATION_precision": 0.7792207792207793, "eval_LOCATION_recall": 0.8695652173913043, "eval_ORGANIZATION_f1": 0.7040000000000001, "eval_ORGANIZATION_number": 58, "eval_ORGANIZATION_precision": 0.6567164179104478, "eval_ORGANIZATION_recall": 0.7586206896551724, "eval_PERSON_f1": 0.888888888888889, "eval_PERSON_number": 152, "eval_PERSON_precision": 0.8588957055214724, "eval_PERSON_recall": 0.9210526315789473, "eval_QUANTITY_f1": 0.7936507936507938, "eval_QUANTITY_number": 30, "eval_QUANTITY_precision": 0.7575757575757576, "eval_QUANTITY_recall": 0.8333333333333334, "eval_TIME_f1": 0.8620689655172413, "eval_TIME_number": 29, "eval_TIME_precision": 0.8620689655172413, "eval_TIME_recall": 0.8620689655172413, "eval_loss": 0.11661401391029358, "eval_overall_accuracy": 0.9626120358514725, "eval_overall_f1": 0.8316831683168318, "eval_overall_precision": 0.7967479674796748, "eval_overall_recall": 0.8698224852071006, "eval_runtime": 0.8754, "eval_samples_per_second": 213.615, "eval_steps_per_second": 3.427, "step": 1378 }, { "epoch": 14.0, "grad_norm": 1.0210072994232178, "learning_rate": 4.3e-05, "loss": 0.0897, "step": 1484 }, { "epoch": 14.0, "eval_LOCATION_f1": 0.8322147651006713, "eval_LOCATION_number": 69, "eval_LOCATION_precision": 0.775, "eval_LOCATION_recall": 0.8985507246376812, "eval_ORGANIZATION_f1": 0.6825396825396826, "eval_ORGANIZATION_number": 58, "eval_ORGANIZATION_precision": 0.6323529411764706, "eval_ORGANIZATION_recall": 0.7413793103448276, "eval_PERSON_f1": 0.8734177215189874, "eval_PERSON_number": 152, "eval_PERSON_precision": 0.8414634146341463, "eval_PERSON_recall": 0.9078947368421053, "eval_QUANTITY_f1": 0.78125, "eval_QUANTITY_number": 30, "eval_QUANTITY_precision": 0.7352941176470589, "eval_QUANTITY_recall": 0.8333333333333334, "eval_TIME_f1": 0.7272727272727273, "eval_TIME_number": 29, "eval_TIME_precision": 0.6486486486486487, "eval_TIME_recall": 0.8275862068965517, "eval_loss": 0.1263030618429184, "eval_overall_accuracy": 0.9603072983354674, "eval_overall_f1": 0.8099861303744799, "eval_overall_precision": 0.762402088772846, "eval_overall_recall": 0.863905325443787, "eval_runtime": 0.9149, "eval_samples_per_second": 204.387, "eval_steps_per_second": 3.279, "step": 1484 }, { "epoch": 15.0, "grad_norm": 0.7929083704948425, "learning_rate": 4.25e-05, "loss": 0.0847, "step": 1590 }, { "epoch": 15.0, "eval_LOCATION_f1": 0.863013698630137, "eval_LOCATION_number": 69, "eval_LOCATION_precision": 0.8181818181818182, "eval_LOCATION_recall": 0.9130434782608695, "eval_ORGANIZATION_f1": 0.6721311475409836, "eval_ORGANIZATION_number": 58, "eval_ORGANIZATION_precision": 0.640625, "eval_ORGANIZATION_recall": 0.7068965517241379, "eval_PERSON_f1": 0.8789808917197451, "eval_PERSON_number": 152, "eval_PERSON_precision": 0.8518518518518519, "eval_PERSON_recall": 0.9078947368421053, "eval_QUANTITY_f1": 0.7058823529411765, "eval_QUANTITY_number": 30, "eval_QUANTITY_precision": 0.631578947368421, "eval_QUANTITY_recall": 0.8, "eval_TIME_f1": 0.75, "eval_TIME_number": 29, "eval_TIME_precision": 0.6857142857142857, "eval_TIME_recall": 0.8275862068965517, "eval_loss": 0.12834492325782776, "eval_overall_accuracy": 0.9592829705505762, "eval_overall_f1": 0.8123249299719889, "eval_overall_precision": 0.7712765957446809, "eval_overall_recall": 0.8579881656804734, "eval_runtime": 0.8739, "eval_samples_per_second": 213.989, "eval_steps_per_second": 3.433, "step": 1590 }, { "epoch": 16.0, "grad_norm": 0.8108320236206055, "learning_rate": 4.2e-05, "loss": 0.0808, "step": 1696 }, { "epoch": 16.0, "eval_LOCATION_f1": 0.8299319727891156, "eval_LOCATION_number": 69, "eval_LOCATION_precision": 0.782051282051282, "eval_LOCATION_recall": 0.8840579710144928, "eval_ORGANIZATION_f1": 0.7040000000000001, "eval_ORGANIZATION_number": 58, "eval_ORGANIZATION_precision": 0.6567164179104478, "eval_ORGANIZATION_recall": 0.7586206896551724, "eval_PERSON_f1": 0.8874598070739551, "eval_PERSON_number": 152, "eval_PERSON_precision": 0.8679245283018868, "eval_PERSON_recall": 0.9078947368421053, "eval_QUANTITY_f1": 0.761904761904762, "eval_QUANTITY_number": 30, "eval_QUANTITY_precision": 0.7272727272727273, "eval_QUANTITY_recall": 0.8, "eval_TIME_f1": 0.8196721311475409, "eval_TIME_number": 29, "eval_TIME_precision": 0.78125, "eval_TIME_recall": 0.8620689655172413, "eval_loss": 0.12765684723854065, "eval_overall_accuracy": 0.9623559539052496, "eval_overall_f1": 0.826025459688826, "eval_overall_precision": 0.7913279132791328, "eval_overall_recall": 0.863905325443787, "eval_runtime": 0.8873, "eval_samples_per_second": 210.758, "eval_steps_per_second": 3.381, "step": 1696 }, { "epoch": 17.0, "grad_norm": 0.31881314516067505, "learning_rate": 4.15e-05, "loss": 0.0746, "step": 1802 }, { "epoch": 17.0, "eval_LOCATION_f1": 0.8266666666666668, "eval_LOCATION_number": 69, "eval_LOCATION_precision": 0.7654320987654321, "eval_LOCATION_recall": 0.8985507246376812, "eval_ORGANIZATION_f1": 0.7086614173228347, "eval_ORGANIZATION_number": 58, "eval_ORGANIZATION_precision": 0.6521739130434783, "eval_ORGANIZATION_recall": 0.7758620689655172, "eval_PERSON_f1": 0.8874598070739551, "eval_PERSON_number": 152, "eval_PERSON_precision": 0.8679245283018868, "eval_PERSON_recall": 0.9078947368421053, "eval_QUANTITY_f1": 0.7384615384615385, "eval_QUANTITY_number": 30, "eval_QUANTITY_precision": 0.6857142857142857, "eval_QUANTITY_recall": 0.8, "eval_TIME_f1": 0.7999999999999999, "eval_TIME_number": 29, "eval_TIME_precision": 0.7741935483870968, "eval_TIME_recall": 0.8275862068965517, "eval_loss": 0.13274899125099182, "eval_overall_accuracy": 0.9592829705505762, "eval_overall_f1": 0.8218793828892006, "eval_overall_precision": 0.7813333333333333, "eval_overall_recall": 0.8668639053254438, "eval_runtime": 0.8878, "eval_samples_per_second": 210.626, "eval_steps_per_second": 3.379, "step": 1802 }, { "epoch": 18.0, "grad_norm": 1.1737678050994873, "learning_rate": 4.1e-05, "loss": 0.0715, "step": 1908 }, { "epoch": 18.0, "eval_LOCATION_f1": 0.8671328671328672, "eval_LOCATION_number": 69, "eval_LOCATION_precision": 0.8378378378378378, "eval_LOCATION_recall": 0.8985507246376812, "eval_ORGANIZATION_f1": 0.688, "eval_ORGANIZATION_number": 58, "eval_ORGANIZATION_precision": 0.6417910447761194, "eval_ORGANIZATION_recall": 0.7413793103448276, "eval_PERSON_f1": 0.8726114649681528, "eval_PERSON_number": 152, "eval_PERSON_precision": 0.845679012345679, "eval_PERSON_recall": 0.9013157894736842, "eval_QUANTITY_f1": 0.7500000000000001, "eval_QUANTITY_number": 30, "eval_QUANTITY_precision": 0.7058823529411765, "eval_QUANTITY_recall": 0.8, "eval_TIME_f1": 0.7999999999999999, "eval_TIME_number": 29, "eval_TIME_precision": 0.7741935483870968, "eval_TIME_recall": 0.8275862068965517, "eval_loss": 0.1314823478460312, "eval_overall_accuracy": 0.9595390524967989, "eval_overall_f1": 0.8215297450424929, "eval_overall_precision": 0.7880434782608695, "eval_overall_recall": 0.8579881656804734, "eval_runtime": 0.8811, "eval_samples_per_second": 212.231, "eval_steps_per_second": 3.405, "step": 1908 }, { "epoch": 19.0, "grad_norm": 0.9921818971633911, "learning_rate": 4.05e-05, "loss": 0.0695, "step": 2014 }, { "epoch": 19.0, "eval_LOCATION_f1": 0.8378378378378378, "eval_LOCATION_number": 69, "eval_LOCATION_precision": 0.7848101265822784, "eval_LOCATION_recall": 0.8985507246376812, "eval_ORGANIZATION_f1": 0.7213114754098361, "eval_ORGANIZATION_number": 58, "eval_ORGANIZATION_precision": 0.6875, "eval_ORGANIZATION_recall": 0.7586206896551724, "eval_PERSON_f1": 0.8753993610223643, "eval_PERSON_number": 152, "eval_PERSON_precision": 0.8509316770186336, "eval_PERSON_recall": 0.9013157894736842, "eval_QUANTITY_f1": 0.7164179104477612, "eval_QUANTITY_number": 30, "eval_QUANTITY_precision": 0.6486486486486487, "eval_QUANTITY_recall": 0.8, "eval_TIME_f1": 0.7936507936507937, "eval_TIME_number": 29, "eval_TIME_precision": 0.7352941176470589, "eval_TIME_recall": 0.8620689655172413, "eval_loss": 0.1310775727033615, "eval_overall_accuracy": 0.9582586427656851, "eval_overall_f1": 0.8190743338008415, "eval_overall_precision": 0.7786666666666666, "eval_overall_recall": 0.863905325443787, "eval_runtime": 0.8843, "eval_samples_per_second": 211.462, "eval_steps_per_second": 3.392, "step": 2014 }, { "epoch": 20.0, "grad_norm": 0.8729901909828186, "learning_rate": 4e-05, "loss": 0.0705, "step": 2120 }, { "epoch": 20.0, "eval_LOCATION_f1": 0.851063829787234, "eval_LOCATION_number": 69, "eval_LOCATION_precision": 0.8333333333333334, "eval_LOCATION_recall": 0.8695652173913043, "eval_ORGANIZATION_f1": 0.688, "eval_ORGANIZATION_number": 58, "eval_ORGANIZATION_precision": 0.6417910447761194, "eval_ORGANIZATION_recall": 0.7413793103448276, "eval_PERSON_f1": 0.8761904761904762, "eval_PERSON_number": 152, "eval_PERSON_precision": 0.8466257668711656, "eval_PERSON_recall": 0.9078947368421053, "eval_QUANTITY_f1": 0.7500000000000001, "eval_QUANTITY_number": 30, "eval_QUANTITY_precision": 0.7058823529411765, "eval_QUANTITY_recall": 0.8, "eval_TIME_f1": 0.847457627118644, "eval_TIME_number": 29, "eval_TIME_precision": 0.8333333333333334, "eval_TIME_recall": 0.8620689655172413, "eval_loss": 0.13000606000423431, "eval_overall_accuracy": 0.9597951344430218, "eval_overall_f1": 0.8238636363636365, "eval_overall_precision": 0.7923497267759563, "eval_overall_recall": 0.8579881656804734, "eval_runtime": 0.87, "eval_samples_per_second": 214.936, "eval_steps_per_second": 3.448, "step": 2120 }, { "epoch": 21.0, "grad_norm": 0.5570505857467651, "learning_rate": 3.9500000000000005e-05, "loss": 0.0623, "step": 2226 }, { "epoch": 21.0, "eval_LOCATION_f1": 0.8590604026845639, "eval_LOCATION_number": 69, "eval_LOCATION_precision": 0.8, "eval_LOCATION_recall": 0.927536231884058, "eval_ORGANIZATION_f1": 0.7076923076923076, "eval_ORGANIZATION_number": 58, "eval_ORGANIZATION_precision": 0.6388888888888888, "eval_ORGANIZATION_recall": 0.7931034482758621, "eval_PERSON_f1": 0.9061488673139159, "eval_PERSON_number": 152, "eval_PERSON_precision": 0.89171974522293, "eval_PERSON_recall": 0.9210526315789473, "eval_QUANTITY_f1": 0.7500000000000001, "eval_QUANTITY_number": 30, "eval_QUANTITY_precision": 0.7058823529411765, "eval_QUANTITY_recall": 0.8, "eval_TIME_f1": 0.7741935483870968, "eval_TIME_number": 29, "eval_TIME_precision": 0.7272727272727273, "eval_TIME_recall": 0.8275862068965517, "eval_loss": 0.14154018461704254, "eval_overall_accuracy": 0.9608194622279129, "eval_overall_f1": 0.8347338935574229, "eval_overall_precision": 0.7925531914893617, "eval_overall_recall": 0.8816568047337278, "eval_runtime": 0.892, "eval_samples_per_second": 209.65, "eval_steps_per_second": 3.363, "step": 2226 }, { "epoch": 22.0, "grad_norm": 0.4297601878643036, "learning_rate": 3.9000000000000006e-05, "loss": 0.0636, "step": 2332 }, { "epoch": 22.0, "eval_LOCATION_f1": 0.8366013071895425, "eval_LOCATION_number": 69, "eval_LOCATION_precision": 0.7619047619047619, "eval_LOCATION_recall": 0.927536231884058, "eval_ORGANIZATION_f1": 0.706766917293233, "eval_ORGANIZATION_number": 58, "eval_ORGANIZATION_precision": 0.6266666666666667, "eval_ORGANIZATION_recall": 0.8103448275862069, "eval_PERSON_f1": 0.8761904761904762, "eval_PERSON_number": 152, "eval_PERSON_precision": 0.8466257668711656, "eval_PERSON_recall": 0.9078947368421053, "eval_QUANTITY_f1": 0.7500000000000001, "eval_QUANTITY_number": 30, "eval_QUANTITY_precision": 0.7058823529411765, "eval_QUANTITY_recall": 0.8, "eval_TIME_f1": 0.7812500000000001, "eval_TIME_number": 29, "eval_TIME_precision": 0.7142857142857143, "eval_TIME_recall": 0.8620689655172413, "eval_loss": 0.14867202937602997, "eval_overall_accuracy": 0.9590268886043534, "eval_overall_f1": 0.8175582990397806, "eval_overall_precision": 0.7621483375959079, "eval_overall_recall": 0.8816568047337278, "eval_runtime": 0.8724, "eval_samples_per_second": 214.362, "eval_steps_per_second": 3.439, "step": 2332 }, { "epoch": 23.0, "grad_norm": 0.4904947876930237, "learning_rate": 3.85e-05, "loss": 0.0571, "step": 2438 }, { "epoch": 23.0, "eval_LOCATION_f1": 0.8591549295774648, "eval_LOCATION_number": 69, "eval_LOCATION_precision": 0.8356164383561644, "eval_LOCATION_recall": 0.8840579710144928, "eval_ORGANIZATION_f1": 0.7131782945736435, "eval_ORGANIZATION_number": 58, "eval_ORGANIZATION_precision": 0.647887323943662, "eval_ORGANIZATION_recall": 0.7931034482758621, "eval_PERSON_f1": 0.8774193548387097, "eval_PERSON_number": 152, "eval_PERSON_precision": 0.8607594936708861, "eval_PERSON_recall": 0.8947368421052632, "eval_QUANTITY_f1": 0.7500000000000001, "eval_QUANTITY_number": 30, "eval_QUANTITY_precision": 0.7058823529411765, "eval_QUANTITY_recall": 0.8, "eval_TIME_f1": 0.8333333333333334, "eval_TIME_number": 29, "eval_TIME_precision": 0.8064516129032258, "eval_TIME_recall": 0.8620689655172413, "eval_loss": 0.1371629238128662, "eval_overall_accuracy": 0.9603072983354674, "eval_overall_f1": 0.8283687943262411, "eval_overall_precision": 0.7956403269754768, "eval_overall_recall": 0.863905325443787, "eval_runtime": 0.8758, "eval_samples_per_second": 213.508, "eval_steps_per_second": 3.425, "step": 2438 }, { "epoch": 24.0, "grad_norm": 0.8735907673835754, "learning_rate": 3.8e-05, "loss": 0.0574, "step": 2544 }, { "epoch": 24.0, "eval_LOCATION_f1": 0.8551724137931034, "eval_LOCATION_number": 69, "eval_LOCATION_precision": 0.8157894736842105, "eval_LOCATION_recall": 0.8985507246376812, "eval_ORGANIZATION_f1": 0.696969696969697, "eval_ORGANIZATION_number": 58, "eval_ORGANIZATION_precision": 0.6216216216216216, "eval_ORGANIZATION_recall": 0.7931034482758621, "eval_PERSON_f1": 0.8881789137380192, "eval_PERSON_number": 152, "eval_PERSON_precision": 0.8633540372670807, "eval_PERSON_recall": 0.9144736842105263, "eval_QUANTITY_f1": 0.7500000000000001, "eval_QUANTITY_number": 30, "eval_QUANTITY_precision": 0.7058823529411765, "eval_QUANTITY_recall": 0.8, "eval_TIME_f1": 0.8275862068965517, "eval_TIME_number": 29, "eval_TIME_precision": 0.8275862068965517, "eval_TIME_recall": 0.8275862068965517, "eval_loss": 0.14183317124843597, "eval_overall_accuracy": 0.9626120358514725, "eval_overall_f1": 0.8286516853932584, "eval_overall_precision": 0.7887700534759359, "eval_overall_recall": 0.8727810650887574, "eval_runtime": 0.876, "eval_samples_per_second": 213.47, "eval_steps_per_second": 3.425, "step": 2544 }, { "epoch": 25.0, "grad_norm": 0.4508860409259796, "learning_rate": 3.7500000000000003e-05, "loss": 0.0542, "step": 2650 }, { "epoch": 25.0, "eval_LOCATION_f1": 0.8671328671328672, "eval_LOCATION_number": 69, "eval_LOCATION_precision": 0.8378378378378378, "eval_LOCATION_recall": 0.8985507246376812, "eval_ORGANIZATION_f1": 0.7272727272727273, "eval_ORGANIZATION_number": 58, "eval_ORGANIZATION_precision": 0.6984126984126984, "eval_ORGANIZATION_recall": 0.7586206896551724, "eval_PERSON_f1": 0.8817891373801917, "eval_PERSON_number": 152, "eval_PERSON_precision": 0.8571428571428571, "eval_PERSON_recall": 0.9078947368421053, "eval_QUANTITY_f1": 0.7500000000000001, "eval_QUANTITY_number": 30, "eval_QUANTITY_precision": 0.7058823529411765, "eval_QUANTITY_recall": 0.8, "eval_TIME_f1": 0.8813559322033899, "eval_TIME_number": 29, "eval_TIME_precision": 0.8666666666666667, "eval_TIME_recall": 0.896551724137931, "eval_loss": 0.13426989316940308, "eval_overall_accuracy": 0.9633802816901409, "eval_overall_f1": 0.84, "eval_overall_precision": 0.8121546961325967, "eval_overall_recall": 0.8698224852071006, "eval_runtime": 0.8752, "eval_samples_per_second": 213.654, "eval_steps_per_second": 3.428, "step": 2650 }, { "epoch": 26.0, "grad_norm": 0.8999614715576172, "learning_rate": 3.7e-05, "loss": 0.0526, "step": 2756 }, { "epoch": 26.0, "eval_LOCATION_f1": 0.8652482269503546, "eval_LOCATION_number": 69, "eval_LOCATION_precision": 0.8472222222222222, "eval_LOCATION_recall": 0.8840579710144928, "eval_ORGANIZATION_f1": 0.7540983606557378, "eval_ORGANIZATION_number": 58, "eval_ORGANIZATION_precision": 0.71875, "eval_ORGANIZATION_recall": 0.7931034482758621, "eval_PERSON_f1": 0.8789808917197451, "eval_PERSON_number": 152, "eval_PERSON_precision": 0.8518518518518519, "eval_PERSON_recall": 0.9078947368421053, "eval_QUANTITY_f1": 0.761904761904762, "eval_QUANTITY_number": 30, "eval_QUANTITY_precision": 0.7272727272727273, "eval_QUANTITY_recall": 0.8, "eval_TIME_f1": 0.847457627118644, "eval_TIME_number": 29, "eval_TIME_precision": 0.8333333333333334, "eval_TIME_recall": 0.8620689655172413, "eval_loss": 0.1440158635377884, "eval_overall_accuracy": 0.963124199743918, "eval_overall_f1": 0.8412017167381973, "eval_overall_precision": 0.814404432132964, "eval_overall_recall": 0.8698224852071006, "eval_runtime": 0.8876, "eval_samples_per_second": 210.689, "eval_steps_per_second": 3.38, "step": 2756 }, { "epoch": 27.0, "grad_norm": 0.6169599890708923, "learning_rate": 3.65e-05, "loss": 0.0477, "step": 2862 }, { "epoch": 27.0, "eval_LOCATION_f1": 0.863013698630137, "eval_LOCATION_number": 69, "eval_LOCATION_precision": 0.8181818181818182, "eval_LOCATION_recall": 0.9130434782608695, "eval_ORGANIZATION_f1": 0.7142857142857142, "eval_ORGANIZATION_number": 58, "eval_ORGANIZATION_precision": 0.6617647058823529, "eval_ORGANIZATION_recall": 0.7758620689655172, "eval_PERSON_f1": 0.8662420382165605, "eval_PERSON_number": 152, "eval_PERSON_precision": 0.8395061728395061, "eval_PERSON_recall": 0.8947368421052632, "eval_QUANTITY_f1": 0.7500000000000001, "eval_QUANTITY_number": 30, "eval_QUANTITY_precision": 0.7058823529411765, "eval_QUANTITY_recall": 0.8, "eval_TIME_f1": 0.8196721311475409, "eval_TIME_number": 29, "eval_TIME_precision": 0.78125, "eval_TIME_recall": 0.8620689655172413, "eval_loss": 0.16048064827919006, "eval_overall_accuracy": 0.9592829705505762, "eval_overall_f1": 0.8241912798874824, "eval_overall_precision": 0.7855227882037533, "eval_overall_recall": 0.8668639053254438, "eval_runtime": 0.8784, "eval_samples_per_second": 212.876, "eval_steps_per_second": 3.415, "step": 2862 }, { "epoch": 28.0, "grad_norm": 0.5325952768325806, "learning_rate": 3.6e-05, "loss": 0.048, "step": 2968 }, { "epoch": 28.0, "eval_LOCATION_f1": 0.8671328671328672, "eval_LOCATION_number": 69, "eval_LOCATION_precision": 0.8378378378378378, "eval_LOCATION_recall": 0.8985507246376812, "eval_ORGANIZATION_f1": 0.7086614173228347, "eval_ORGANIZATION_number": 58, "eval_ORGANIZATION_precision": 0.6521739130434783, "eval_ORGANIZATION_recall": 0.7758620689655172, "eval_PERSON_f1": 0.8846153846153847, "eval_PERSON_number": 152, "eval_PERSON_precision": 0.8625, "eval_PERSON_recall": 0.9078947368421053, "eval_QUANTITY_f1": 0.7500000000000001, "eval_QUANTITY_number": 30, "eval_QUANTITY_precision": 0.7058823529411765, "eval_QUANTITY_recall": 0.8, "eval_TIME_f1": 0.7999999999999999, "eval_TIME_number": 29, "eval_TIME_precision": 0.7741935483870968, "eval_TIME_recall": 0.8275862068965517, "eval_loss": 0.1558757722377777, "eval_overall_accuracy": 0.9580025608194622, "eval_overall_f1": 0.830028328611898, "eval_overall_precision": 0.7961956521739131, "eval_overall_recall": 0.8668639053254438, "eval_runtime": 0.8788, "eval_samples_per_second": 212.794, "eval_steps_per_second": 3.414, "step": 2968 }, { "epoch": 29.0, "grad_norm": 0.5985626578330994, "learning_rate": 3.55e-05, "loss": 0.0481, "step": 3074 }, { "epoch": 29.0, "eval_LOCATION_f1": 0.8648648648648648, "eval_LOCATION_number": 69, "eval_LOCATION_precision": 0.810126582278481, "eval_LOCATION_recall": 0.927536231884058, "eval_ORGANIZATION_f1": 0.7007299270072993, "eval_ORGANIZATION_number": 58, "eval_ORGANIZATION_precision": 0.6075949367088608, "eval_ORGANIZATION_recall": 0.8275862068965517, "eval_PERSON_f1": 0.8846153846153847, "eval_PERSON_number": 152, "eval_PERSON_precision": 0.8625, "eval_PERSON_recall": 0.9078947368421053, "eval_QUANTITY_f1": 0.7500000000000001, "eval_QUANTITY_number": 30, "eval_QUANTITY_precision": 0.7058823529411765, "eval_QUANTITY_recall": 0.8, "eval_TIME_f1": 0.8196721311475409, "eval_TIME_number": 29, "eval_TIME_precision": 0.78125, "eval_TIME_recall": 0.8620689655172413, "eval_loss": 0.15555179119110107, "eval_overall_accuracy": 0.9595390524967989, "eval_overall_f1": 0.8282548476454293, "eval_overall_precision": 0.7786458333333334, "eval_overall_recall": 0.8846153846153846, "eval_runtime": 0.8856, "eval_samples_per_second": 211.154, "eval_steps_per_second": 3.387, "step": 3074 }, { "epoch": 30.0, "grad_norm": 0.8177056908607483, "learning_rate": 3.5e-05, "loss": 0.045, "step": 3180 }, { "epoch": 30.0, "eval_LOCATION_f1": 0.8648648648648648, "eval_LOCATION_number": 69, "eval_LOCATION_precision": 0.810126582278481, "eval_LOCATION_recall": 0.927536231884058, "eval_ORGANIZATION_f1": 0.7068965517241379, "eval_ORGANIZATION_number": 58, "eval_ORGANIZATION_precision": 0.7068965517241379, "eval_ORGANIZATION_recall": 0.7068965517241379, "eval_PERSON_f1": 0.8789808917197451, "eval_PERSON_number": 152, "eval_PERSON_precision": 0.8518518518518519, "eval_PERSON_recall": 0.9078947368421053, "eval_QUANTITY_f1": 0.761904761904762, "eval_QUANTITY_number": 30, "eval_QUANTITY_precision": 0.7272727272727273, "eval_QUANTITY_recall": 0.8, "eval_TIME_f1": 0.847457627118644, "eval_TIME_number": 29, "eval_TIME_precision": 0.8333333333333334, "eval_TIME_recall": 0.8620689655172413, "eval_loss": 0.1506585329771042, "eval_overall_accuracy": 0.9620998719590269, "eval_overall_f1": 0.8342857142857144, "eval_overall_precision": 0.8066298342541437, "eval_overall_recall": 0.863905325443787, "eval_runtime": 0.8833, "eval_samples_per_second": 211.711, "eval_steps_per_second": 3.396, "step": 3180 }, { "epoch": 31.0, "grad_norm": 0.42287537455558777, "learning_rate": 3.45e-05, "loss": 0.0445, "step": 3286 }, { "epoch": 31.0, "eval_LOCATION_f1": 0.8590604026845639, "eval_LOCATION_number": 69, "eval_LOCATION_precision": 0.8, "eval_LOCATION_recall": 0.927536231884058, "eval_ORGANIZATION_f1": 0.7343749999999999, "eval_ORGANIZATION_number": 58, "eval_ORGANIZATION_precision": 0.6714285714285714, "eval_ORGANIZATION_recall": 0.8103448275862069, "eval_PERSON_f1": 0.8874598070739551, "eval_PERSON_number": 152, "eval_PERSON_precision": 0.8679245283018868, "eval_PERSON_recall": 0.9078947368421053, "eval_QUANTITY_f1": 0.7500000000000001, "eval_QUANTITY_number": 30, "eval_QUANTITY_precision": 0.7058823529411765, "eval_QUANTITY_recall": 0.8, "eval_TIME_f1": 0.7868852459016394, "eval_TIME_number": 29, "eval_TIME_precision": 0.75, "eval_TIME_recall": 0.8275862068965517, "eval_loss": 0.15119028091430664, "eval_overall_accuracy": 0.9618437900128041, "eval_overall_f1": 0.8330995792426368, "eval_overall_precision": 0.792, "eval_overall_recall": 0.878698224852071, "eval_runtime": 0.8769, "eval_samples_per_second": 213.246, "eval_steps_per_second": 3.421, "step": 3286 }, { "epoch": 32.0, "grad_norm": 0.3716237246990204, "learning_rate": 3.4000000000000007e-05, "loss": 0.042, "step": 3392 }, { "epoch": 32.0, "eval_LOCATION_f1": 0.863013698630137, "eval_LOCATION_number": 69, "eval_LOCATION_precision": 0.8181818181818182, "eval_LOCATION_recall": 0.9130434782608695, "eval_ORGANIZATION_f1": 0.716417910447761, "eval_ORGANIZATION_number": 58, "eval_ORGANIZATION_precision": 0.631578947368421, "eval_ORGANIZATION_recall": 0.8275862068965517, "eval_PERSON_f1": 0.877742946708464, "eval_PERSON_number": 152, "eval_PERSON_precision": 0.8383233532934131, "eval_PERSON_recall": 0.9210526315789473, "eval_QUANTITY_f1": 0.78125, "eval_QUANTITY_number": 30, "eval_QUANTITY_precision": 0.7352941176470589, "eval_QUANTITY_recall": 0.8333333333333334, "eval_TIME_f1": 0.8064516129032258, "eval_TIME_number": 29, "eval_TIME_precision": 0.7575757575757576, "eval_TIME_recall": 0.8620689655172413, "eval_loss": 0.1590593457221985, "eval_overall_accuracy": 0.9595390524967989, "eval_overall_f1": 0.8303448275862069, "eval_overall_precision": 0.7777777777777778, "eval_overall_recall": 0.8905325443786982, "eval_runtime": 0.8744, "eval_samples_per_second": 213.872, "eval_steps_per_second": 3.431, "step": 3392 }, { "epoch": 33.0, "grad_norm": 0.18944571912288666, "learning_rate": 3.35e-05, "loss": 0.0394, "step": 3498 }, { "epoch": 33.0, "eval_LOCATION_f1": 0.8611111111111112, "eval_LOCATION_number": 69, "eval_LOCATION_precision": 0.8266666666666667, "eval_LOCATION_recall": 0.8985507246376812, "eval_ORGANIZATION_f1": 0.7040000000000001, "eval_ORGANIZATION_number": 58, "eval_ORGANIZATION_precision": 0.6567164179104478, "eval_ORGANIZATION_recall": 0.7586206896551724, "eval_PERSON_f1": 0.8853503184713376, "eval_PERSON_number": 152, "eval_PERSON_precision": 0.8580246913580247, "eval_PERSON_recall": 0.9144736842105263, "eval_QUANTITY_f1": 0.7500000000000001, "eval_QUANTITY_number": 30, "eval_QUANTITY_precision": 0.7058823529411765, "eval_QUANTITY_recall": 0.8, "eval_TIME_f1": 0.7868852459016394, "eval_TIME_number": 29, "eval_TIME_precision": 0.75, "eval_TIME_recall": 0.8275862068965517, "eval_loss": 0.1586446911096573, "eval_overall_accuracy": 0.9603072983354674, "eval_overall_f1": 0.8276836158192091, "eval_overall_precision": 0.7918918918918919, "eval_overall_recall": 0.8668639053254438, "eval_runtime": 0.8776, "eval_samples_per_second": 213.07, "eval_steps_per_second": 3.418, "step": 3498 }, { "epoch": 34.0, "grad_norm": 1.3505786657333374, "learning_rate": 3.3e-05, "loss": 0.0378, "step": 3604 }, { "epoch": 34.0, "eval_LOCATION_f1": 0.8571428571428572, "eval_LOCATION_number": 69, "eval_LOCATION_precision": 0.8076923076923077, "eval_LOCATION_recall": 0.9130434782608695, "eval_ORGANIZATION_f1": 0.7131782945736435, "eval_ORGANIZATION_number": 58, "eval_ORGANIZATION_precision": 0.647887323943662, "eval_ORGANIZATION_recall": 0.7931034482758621, "eval_PERSON_f1": 0.8789808917197451, "eval_PERSON_number": 152, "eval_PERSON_precision": 0.8518518518518519, "eval_PERSON_recall": 0.9078947368421053, "eval_QUANTITY_f1": 0.7500000000000001, "eval_QUANTITY_number": 30, "eval_QUANTITY_precision": 0.7058823529411765, "eval_QUANTITY_recall": 0.8, "eval_TIME_f1": 0.8333333333333334, "eval_TIME_number": 29, "eval_TIME_precision": 0.8064516129032258, "eval_TIME_recall": 0.8620689655172413, "eval_loss": 0.15407726168632507, "eval_overall_accuracy": 0.9618437900128041, "eval_overall_f1": 0.8291316526610645, "eval_overall_precision": 0.7872340425531915, "eval_overall_recall": 0.8757396449704142, "eval_runtime": 0.8762, "eval_samples_per_second": 213.42, "eval_steps_per_second": 3.424, "step": 3604 }, { "epoch": 35.0, "grad_norm": 0.631050705909729, "learning_rate": 3.2500000000000004e-05, "loss": 0.0375, "step": 3710 }, { "epoch": 35.0, "eval_LOCATION_f1": 0.8571428571428572, "eval_LOCATION_number": 69, "eval_LOCATION_precision": 0.8076923076923077, "eval_LOCATION_recall": 0.9130434782608695, "eval_ORGANIZATION_f1": 0.6725663716814159, "eval_ORGANIZATION_number": 58, "eval_ORGANIZATION_precision": 0.6909090909090909, "eval_ORGANIZATION_recall": 0.6551724137931034, "eval_PERSON_f1": 0.8945686900958467, "eval_PERSON_number": 152, "eval_PERSON_precision": 0.8695652173913043, "eval_PERSON_recall": 0.9210526315789473, "eval_QUANTITY_f1": 0.7692307692307692, "eval_QUANTITY_number": 30, "eval_QUANTITY_precision": 0.7142857142857143, "eval_QUANTITY_recall": 0.8333333333333334, "eval_TIME_f1": 0.7999999999999999, "eval_TIME_number": 29, "eval_TIME_precision": 0.7741935483870968, "eval_TIME_recall": 0.8275862068965517, "eval_loss": 0.15462984144687653, "eval_overall_accuracy": 0.9626120358514725, "eval_overall_f1": 0.8309455587392551, "eval_overall_precision": 0.8055555555555556, "eval_overall_recall": 0.8579881656804734, "eval_runtime": 0.8693, "eval_samples_per_second": 215.126, "eval_steps_per_second": 3.451, "step": 3710 }, { "epoch": 36.0, "grad_norm": 0.13165172934532166, "learning_rate": 3.2000000000000005e-05, "loss": 0.0384, "step": 3816 }, { "epoch": 36.0, "eval_LOCATION_f1": 0.8749999999999999, "eval_LOCATION_number": 69, "eval_LOCATION_precision": 0.84, "eval_LOCATION_recall": 0.9130434782608695, "eval_ORGANIZATION_f1": 0.71875, "eval_ORGANIZATION_number": 58, "eval_ORGANIZATION_precision": 0.6571428571428571, "eval_ORGANIZATION_recall": 0.7931034482758621, "eval_PERSON_f1": 0.896774193548387, "eval_PERSON_number": 152, "eval_PERSON_precision": 0.879746835443038, "eval_PERSON_recall": 0.9144736842105263, "eval_QUANTITY_f1": 0.761904761904762, "eval_QUANTITY_number": 30, "eval_QUANTITY_precision": 0.7272727272727273, "eval_QUANTITY_recall": 0.8, "eval_TIME_f1": 0.847457627118644, "eval_TIME_number": 29, "eval_TIME_precision": 0.8333333333333334, "eval_TIME_recall": 0.8620689655172413, "eval_loss": 0.16041359305381775, "eval_overall_accuracy": 0.9623559539052496, "eval_overall_f1": 0.84375, "eval_overall_precision": 0.8114754098360656, "eval_overall_recall": 0.878698224852071, "eval_runtime": 0.8806, "eval_samples_per_second": 212.356, "eval_steps_per_second": 3.407, "step": 3816 }, { "epoch": 37.0, "grad_norm": 0.39163538813591003, "learning_rate": 3.15e-05, "loss": 0.0337, "step": 3922 }, { "epoch": 37.0, "eval_LOCATION_f1": 0.870748299319728, "eval_LOCATION_number": 69, "eval_LOCATION_precision": 0.8205128205128205, "eval_LOCATION_recall": 0.927536231884058, "eval_ORGANIZATION_f1": 0.7166666666666668, "eval_ORGANIZATION_number": 58, "eval_ORGANIZATION_precision": 0.6935483870967742, "eval_ORGANIZATION_recall": 0.7413793103448276, "eval_PERSON_f1": 0.8789808917197451, "eval_PERSON_number": 152, "eval_PERSON_precision": 0.8518518518518519, "eval_PERSON_recall": 0.9078947368421053, "eval_QUANTITY_f1": 0.78125, "eval_QUANTITY_number": 30, "eval_QUANTITY_precision": 0.7352941176470589, "eval_QUANTITY_recall": 0.8333333333333334, "eval_TIME_f1": 0.896551724137931, "eval_TIME_number": 29, "eval_TIME_precision": 0.896551724137931, "eval_TIME_recall": 0.896551724137931, "eval_loss": 0.16409936547279358, "eval_overall_accuracy": 0.9623559539052496, "eval_overall_f1": 0.8421052631578948, "eval_overall_precision": 0.810958904109589, "eval_overall_recall": 0.8757396449704142, "eval_runtime": 0.8782, "eval_samples_per_second": 212.924, "eval_steps_per_second": 3.416, "step": 3922 }, { "epoch": 38.0, "grad_norm": 1.8893556594848633, "learning_rate": 3.1e-05, "loss": 0.0327, "step": 4028 }, { "epoch": 38.0, "eval_LOCATION_f1": 0.8571428571428572, "eval_LOCATION_number": 69, "eval_LOCATION_precision": 0.8076923076923077, "eval_LOCATION_recall": 0.9130434782608695, "eval_ORGANIZATION_f1": 0.7258064516129032, "eval_ORGANIZATION_number": 58, "eval_ORGANIZATION_precision": 0.6818181818181818, "eval_ORGANIZATION_recall": 0.7758620689655172, "eval_PERSON_f1": 0.8810289389067525, "eval_PERSON_number": 152, "eval_PERSON_precision": 0.8616352201257862, "eval_PERSON_recall": 0.9013157894736842, "eval_QUANTITY_f1": 0.78125, "eval_QUANTITY_number": 30, "eval_QUANTITY_precision": 0.7352941176470589, "eval_QUANTITY_recall": 0.8333333333333334, "eval_TIME_f1": 0.7868852459016394, "eval_TIME_number": 29, "eval_TIME_precision": 0.75, "eval_TIME_recall": 0.8275862068965517, "eval_loss": 0.1764567792415619, "eval_overall_accuracy": 0.9600512163892445, "eval_overall_f1": 0.8316831683168318, "eval_overall_precision": 0.7967479674796748, "eval_overall_recall": 0.8698224852071006, "eval_runtime": 0.8812, "eval_samples_per_second": 212.213, "eval_steps_per_second": 3.404, "step": 4028 }, { "epoch": 39.0, "grad_norm": 1.0850064754486084, "learning_rate": 3.05e-05, "loss": 0.033, "step": 4134 }, { "epoch": 39.0, "eval_LOCATION_f1": 0.8611111111111112, "eval_LOCATION_number": 69, "eval_LOCATION_precision": 0.8266666666666667, "eval_LOCATION_recall": 0.8985507246376812, "eval_ORGANIZATION_f1": 0.7258064516129032, "eval_ORGANIZATION_number": 58, "eval_ORGANIZATION_precision": 0.6818181818181818, "eval_ORGANIZATION_recall": 0.7758620689655172, "eval_PERSON_f1": 0.8810289389067525, "eval_PERSON_number": 152, "eval_PERSON_precision": 0.8616352201257862, "eval_PERSON_recall": 0.9013157894736842, "eval_QUANTITY_f1": 0.78125, "eval_QUANTITY_number": 30, "eval_QUANTITY_precision": 0.7352941176470589, "eval_QUANTITY_recall": 0.8333333333333334, "eval_TIME_f1": 0.7868852459016394, "eval_TIME_number": 29, "eval_TIME_precision": 0.75, "eval_TIME_recall": 0.8275862068965517, "eval_loss": 0.16998325288295746, "eval_overall_accuracy": 0.9600512163892445, "eval_overall_f1": 0.8323863636363636, "eval_overall_precision": 0.8005464480874317, "eval_overall_recall": 0.8668639053254438, "eval_runtime": 0.8888, "eval_samples_per_second": 210.391, "eval_steps_per_second": 3.375, "step": 4134 }, { "epoch": 40.0, "grad_norm": 0.8192635774612427, "learning_rate": 3e-05, "loss": 0.0333, "step": 4240 }, { "epoch": 40.0, "eval_LOCATION_f1": 0.8493150684931507, "eval_LOCATION_number": 69, "eval_LOCATION_precision": 0.8051948051948052, "eval_LOCATION_recall": 0.8985507246376812, "eval_ORGANIZATION_f1": 0.7200000000000001, "eval_ORGANIZATION_number": 58, "eval_ORGANIZATION_precision": 0.6716417910447762, "eval_ORGANIZATION_recall": 0.7758620689655172, "eval_PERSON_f1": 0.8810289389067525, "eval_PERSON_number": 152, "eval_PERSON_precision": 0.8616352201257862, "eval_PERSON_recall": 0.9013157894736842, "eval_QUANTITY_f1": 0.7936507936507938, "eval_QUANTITY_number": 30, "eval_QUANTITY_precision": 0.7575757575757576, "eval_QUANTITY_recall": 0.8333333333333334, "eval_TIME_f1": 0.7999999999999999, "eval_TIME_number": 29, "eval_TIME_precision": 0.7741935483870968, "eval_TIME_recall": 0.8275862068965517, "eval_loss": 0.17454804480075836, "eval_overall_accuracy": 0.9600512163892445, "eval_overall_f1": 0.8312056737588652, "eval_overall_precision": 0.7983651226158038, "eval_overall_recall": 0.8668639053254438, "eval_runtime": 0.8709, "eval_samples_per_second": 214.732, "eval_steps_per_second": 3.445, "step": 4240 }, { "epoch": 41.0, "grad_norm": 1.14230477809906, "learning_rate": 2.95e-05, "loss": 0.0296, "step": 4346 }, { "epoch": 41.0, "eval_LOCATION_f1": 0.851063829787234, "eval_LOCATION_number": 69, "eval_LOCATION_precision": 0.8333333333333334, "eval_LOCATION_recall": 0.8695652173913043, "eval_ORGANIZATION_f1": 0.7086614173228347, "eval_ORGANIZATION_number": 58, "eval_ORGANIZATION_precision": 0.6521739130434783, "eval_ORGANIZATION_recall": 0.7758620689655172, "eval_PERSON_f1": 0.8662420382165605, "eval_PERSON_number": 152, "eval_PERSON_precision": 0.8395061728395061, "eval_PERSON_recall": 0.8947368421052632, "eval_QUANTITY_f1": 0.7936507936507938, "eval_QUANTITY_number": 30, "eval_QUANTITY_precision": 0.7575757575757576, "eval_QUANTITY_recall": 0.8333333333333334, "eval_TIME_f1": 0.8666666666666666, "eval_TIME_number": 29, "eval_TIME_precision": 0.8387096774193549, "eval_TIME_recall": 0.896551724137931, "eval_loss": 0.17790456116199493, "eval_overall_accuracy": 0.9613316261203585, "eval_overall_f1": 0.8283687943262411, "eval_overall_precision": 0.7956403269754768, "eval_overall_recall": 0.863905325443787, "eval_runtime": 0.8959, "eval_samples_per_second": 208.739, "eval_steps_per_second": 3.349, "step": 4346 }, { "epoch": 42.0, "grad_norm": 1.1531621217727661, "learning_rate": 2.9e-05, "loss": 0.0305, "step": 4452 }, { "epoch": 42.0, "eval_LOCATION_f1": 0.851063829787234, "eval_LOCATION_number": 69, "eval_LOCATION_precision": 0.8333333333333334, "eval_LOCATION_recall": 0.8695652173913043, "eval_ORGANIZATION_f1": 0.6666666666666667, "eval_ORGANIZATION_number": 58, "eval_ORGANIZATION_precision": 0.6176470588235294, "eval_ORGANIZATION_recall": 0.7241379310344828, "eval_PERSON_f1": 0.8874598070739551, "eval_PERSON_number": 152, "eval_PERSON_precision": 0.8679245283018868, "eval_PERSON_recall": 0.9078947368421053, "eval_QUANTITY_f1": 0.7936507936507938, "eval_QUANTITY_number": 30, "eval_QUANTITY_precision": 0.7575757575757576, "eval_QUANTITY_recall": 0.8333333333333334, "eval_TIME_f1": 0.8620689655172413, "eval_TIME_number": 29, "eval_TIME_precision": 0.8620689655172413, "eval_TIME_recall": 0.8620689655172413, "eval_loss": 0.1733568161725998, "eval_overall_accuracy": 0.9618437900128041, "eval_overall_f1": 0.8297567954220315, "eval_overall_precision": 0.8033240997229917, "eval_overall_recall": 0.8579881656804734, "eval_runtime": 0.8898, "eval_samples_per_second": 210.16, "eval_steps_per_second": 3.372, "step": 4452 }, { "epoch": 43.0, "grad_norm": 0.12765854597091675, "learning_rate": 2.8499999999999998e-05, "loss": 0.029, "step": 4558 }, { "epoch": 43.0, "eval_LOCATION_f1": 0.8591549295774648, "eval_LOCATION_number": 69, "eval_LOCATION_precision": 0.8356164383561644, "eval_LOCATION_recall": 0.8840579710144928, "eval_ORGANIZATION_f1": 0.7401574803149606, "eval_ORGANIZATION_number": 58, "eval_ORGANIZATION_precision": 0.6811594202898551, "eval_ORGANIZATION_recall": 0.8103448275862069, "eval_PERSON_f1": 0.8782051282051281, "eval_PERSON_number": 152, "eval_PERSON_precision": 0.85625, "eval_PERSON_recall": 0.9013157894736842, "eval_QUANTITY_f1": 0.7936507936507938, "eval_QUANTITY_number": 30, "eval_QUANTITY_precision": 0.7575757575757576, "eval_QUANTITY_recall": 0.8333333333333334, "eval_TIME_f1": 0.8196721311475409, "eval_TIME_number": 29, "eval_TIME_precision": 0.78125, "eval_TIME_recall": 0.8620689655172413, "eval_loss": 0.18485189974308014, "eval_overall_accuracy": 0.9610755441741358, "eval_overall_f1": 0.8368794326241134, "eval_overall_precision": 0.8038147138964578, "eval_overall_recall": 0.8727810650887574, "eval_runtime": 0.8698, "eval_samples_per_second": 214.991, "eval_steps_per_second": 3.449, "step": 4558 }, { "epoch": 44.0, "grad_norm": 0.6099337935447693, "learning_rate": 2.8000000000000003e-05, "loss": 0.0289, "step": 4664 }, { "epoch": 44.0, "eval_LOCATION_f1": 0.8689655172413793, "eval_LOCATION_number": 69, "eval_LOCATION_precision": 0.8289473684210527, "eval_LOCATION_recall": 0.9130434782608695, "eval_ORGANIZATION_f1": 0.6942148760330579, "eval_ORGANIZATION_number": 58, "eval_ORGANIZATION_precision": 0.6666666666666666, "eval_ORGANIZATION_recall": 0.7241379310344828, "eval_PERSON_f1": 0.8745980707395499, "eval_PERSON_number": 152, "eval_PERSON_precision": 0.8553459119496856, "eval_PERSON_recall": 0.8947368421052632, "eval_QUANTITY_f1": 0.7936507936507938, "eval_QUANTITY_number": 30, "eval_QUANTITY_precision": 0.7575757575757576, "eval_QUANTITY_recall": 0.8333333333333334, "eval_TIME_f1": 0.8620689655172413, "eval_TIME_number": 29, "eval_TIME_precision": 0.8620689655172413, "eval_TIME_recall": 0.8620689655172413, "eval_loss": 0.170259490609169, "eval_overall_accuracy": 0.9610755441741358, "eval_overall_f1": 0.833810888252149, "eval_overall_precision": 0.8083333333333333, "eval_overall_recall": 0.8609467455621301, "eval_runtime": 0.8888, "eval_samples_per_second": 210.406, "eval_steps_per_second": 3.375, "step": 4664 }, { "epoch": 45.0, "grad_norm": 1.0691465139389038, "learning_rate": 2.7500000000000004e-05, "loss": 0.0294, "step": 4770 }, { "epoch": 45.0, "eval_LOCATION_f1": 0.8413793103448277, "eval_LOCATION_number": 69, "eval_LOCATION_precision": 0.8026315789473685, "eval_LOCATION_recall": 0.8840579710144928, "eval_ORGANIZATION_f1": 0.7540983606557378, "eval_ORGANIZATION_number": 58, "eval_ORGANIZATION_precision": 0.71875, "eval_ORGANIZATION_recall": 0.7931034482758621, "eval_PERSON_f1": 0.8782051282051281, "eval_PERSON_number": 152, "eval_PERSON_precision": 0.85625, "eval_PERSON_recall": 0.9013157894736842, "eval_QUANTITY_f1": 0.78125, "eval_QUANTITY_number": 30, "eval_QUANTITY_precision": 0.7352941176470589, "eval_QUANTITY_recall": 0.8333333333333334, "eval_TIME_f1": 0.8196721311475409, "eval_TIME_number": 29, "eval_TIME_precision": 0.78125, "eval_TIME_recall": 0.8620689655172413, "eval_loss": 0.1816970556974411, "eval_overall_accuracy": 0.9610755441741358, "eval_overall_f1": 0.8352272727272727, "eval_overall_precision": 0.8032786885245902, "eval_overall_recall": 0.8698224852071006, "eval_runtime": 0.8854, "eval_samples_per_second": 211.192, "eval_steps_per_second": 3.388, "step": 4770 }, { "epoch": 46.0, "grad_norm": 0.2375423014163971, "learning_rate": 2.7000000000000002e-05, "loss": 0.0262, "step": 4876 }, { "epoch": 46.0, "eval_LOCATION_f1": 0.863013698630137, "eval_LOCATION_number": 69, "eval_LOCATION_precision": 0.8181818181818182, "eval_LOCATION_recall": 0.9130434782608695, "eval_ORGANIZATION_f1": 0.7213114754098361, "eval_ORGANIZATION_number": 58, "eval_ORGANIZATION_precision": 0.6875, "eval_ORGANIZATION_recall": 0.7586206896551724, "eval_PERSON_f1": 0.8874598070739551, "eval_PERSON_number": 152, "eval_PERSON_precision": 0.8679245283018868, "eval_PERSON_recall": 0.9078947368421053, "eval_QUANTITY_f1": 0.7936507936507938, "eval_QUANTITY_number": 30, "eval_QUANTITY_precision": 0.7575757575757576, "eval_QUANTITY_recall": 0.8333333333333334, "eval_TIME_f1": 0.8196721311475409, "eval_TIME_number": 29, "eval_TIME_precision": 0.78125, "eval_TIME_recall": 0.8620689655172413, "eval_loss": 0.1889667958021164, "eval_overall_accuracy": 0.9626120358514725, "eval_overall_f1": 0.8392603129445234, "eval_overall_precision": 0.8082191780821918, "eval_overall_recall": 0.8727810650887574, "eval_runtime": 0.8885, "eval_samples_per_second": 210.463, "eval_steps_per_second": 3.376, "step": 4876 }, { "epoch": 47.0, "grad_norm": 0.48538097739219666, "learning_rate": 2.6500000000000004e-05, "loss": 0.0261, "step": 4982 }, { "epoch": 47.0, "eval_LOCATION_f1": 0.8611111111111112, "eval_LOCATION_number": 69, "eval_LOCATION_precision": 0.8266666666666667, "eval_LOCATION_recall": 0.8985507246376812, "eval_ORGANIZATION_f1": 0.7438016528925621, "eval_ORGANIZATION_number": 58, "eval_ORGANIZATION_precision": 0.7142857142857143, "eval_ORGANIZATION_recall": 0.7758620689655172, "eval_PERSON_f1": 0.8838709677419354, "eval_PERSON_number": 152, "eval_PERSON_precision": 0.8670886075949367, "eval_PERSON_recall": 0.9013157894736842, "eval_QUANTITY_f1": 0.7936507936507938, "eval_QUANTITY_number": 30, "eval_QUANTITY_precision": 0.7575757575757576, "eval_QUANTITY_recall": 0.8333333333333334, "eval_TIME_f1": 0.8813559322033899, "eval_TIME_number": 29, "eval_TIME_precision": 0.8666666666666667, "eval_TIME_recall": 0.896551724137931, "eval_loss": 0.18387795984745026, "eval_overall_accuracy": 0.9626120358514725, "eval_overall_f1": 0.8464849354375897, "eval_overall_precision": 0.8217270194986073, "eval_overall_recall": 0.8727810650887574, "eval_runtime": 0.8841, "eval_samples_per_second": 211.519, "eval_steps_per_second": 3.393, "step": 4982 }, { "epoch": 48.0, "grad_norm": 1.2411327362060547, "learning_rate": 2.6000000000000002e-05, "loss": 0.027, "step": 5088 }, { "epoch": 48.0, "eval_LOCATION_f1": 0.8648648648648648, "eval_LOCATION_number": 69, "eval_LOCATION_precision": 0.810126582278481, "eval_LOCATION_recall": 0.927536231884058, "eval_ORGANIZATION_f1": 0.7343749999999999, "eval_ORGANIZATION_number": 58, "eval_ORGANIZATION_precision": 0.6714285714285714, "eval_ORGANIZATION_recall": 0.8103448275862069, "eval_PERSON_f1": 0.8838709677419354, "eval_PERSON_number": 152, "eval_PERSON_precision": 0.8670886075949367, "eval_PERSON_recall": 0.9013157894736842, "eval_QUANTITY_f1": 0.7936507936507938, "eval_QUANTITY_number": 30, "eval_QUANTITY_precision": 0.7575757575757576, "eval_QUANTITY_recall": 0.8333333333333334, "eval_TIME_f1": 0.8135593220338982, "eval_TIME_number": 29, "eval_TIME_precision": 0.8, "eval_TIME_recall": 0.8275862068965517, "eval_loss": 0.18413321673870087, "eval_overall_accuracy": 0.9615877080665813, "eval_overall_f1": 0.8389830508474576, "eval_overall_precision": 0.8027027027027027, "eval_overall_recall": 0.878698224852071, "eval_runtime": 0.8687, "eval_samples_per_second": 215.275, "eval_steps_per_second": 3.454, "step": 5088 }, { "epoch": 49.0, "grad_norm": 1.1320481300354004, "learning_rate": 2.5500000000000003e-05, "loss": 0.0243, "step": 5194 }, { "epoch": 49.0, "eval_LOCATION_f1": 0.8652482269503546, "eval_LOCATION_number": 69, "eval_LOCATION_precision": 0.8472222222222222, "eval_LOCATION_recall": 0.8840579710144928, "eval_ORGANIZATION_f1": 0.717948717948718, "eval_ORGANIZATION_number": 58, "eval_ORGANIZATION_precision": 0.711864406779661, "eval_ORGANIZATION_recall": 0.7241379310344828, "eval_PERSON_f1": 0.8810289389067525, "eval_PERSON_number": 152, "eval_PERSON_precision": 0.8616352201257862, "eval_PERSON_recall": 0.9013157894736842, "eval_QUANTITY_f1": 0.7936507936507938, "eval_QUANTITY_number": 30, "eval_QUANTITY_precision": 0.7575757575757576, "eval_QUANTITY_recall": 0.8333333333333334, "eval_TIME_f1": 0.8620689655172413, "eval_TIME_number": 29, "eval_TIME_precision": 0.8620689655172413, "eval_TIME_recall": 0.8620689655172413, "eval_loss": 0.18021155893802643, "eval_overall_accuracy": 0.9628681177976952, "eval_overall_f1": 0.8405797101449276, "eval_overall_precision": 0.8238636363636364, "eval_overall_recall": 0.8579881656804734, "eval_runtime": 0.8873, "eval_samples_per_second": 210.759, "eval_steps_per_second": 3.381, "step": 5194 }, { "epoch": 50.0, "grad_norm": 0.6338851451873779, "learning_rate": 2.5e-05, "loss": 0.0243, "step": 5300 }, { "epoch": 50.0, "eval_LOCATION_f1": 0.8648648648648648, "eval_LOCATION_number": 69, "eval_LOCATION_precision": 0.810126582278481, "eval_LOCATION_recall": 0.927536231884058, "eval_ORGANIZATION_f1": 0.7040000000000001, "eval_ORGANIZATION_number": 58, "eval_ORGANIZATION_precision": 0.6567164179104478, "eval_ORGANIZATION_recall": 0.7586206896551724, "eval_PERSON_f1": 0.8846153846153847, "eval_PERSON_number": 152, "eval_PERSON_precision": 0.8625, "eval_PERSON_recall": 0.9078947368421053, "eval_QUANTITY_f1": 0.7936507936507938, "eval_QUANTITY_number": 30, "eval_QUANTITY_precision": 0.7575757575757576, "eval_QUANTITY_recall": 0.8333333333333334, "eval_TIME_f1": 0.8135593220338982, "eval_TIME_number": 29, "eval_TIME_precision": 0.8, "eval_TIME_recall": 0.8275862068965517, "eval_loss": 0.1869899332523346, "eval_overall_accuracy": 0.9613316261203585, "eval_overall_f1": 0.8345120226308346, "eval_overall_precision": 0.7994579945799458, "eval_overall_recall": 0.8727810650887574, "eval_runtime": 0.8731, "eval_samples_per_second": 214.182, "eval_steps_per_second": 3.436, "step": 5300 }, { "epoch": 51.0, "grad_norm": 2.7834653854370117, "learning_rate": 2.45e-05, "loss": 0.0256, "step": 5406 }, { "epoch": 51.0, "eval_LOCATION_f1": 0.8611111111111112, "eval_LOCATION_number": 69, "eval_LOCATION_precision": 0.8266666666666667, "eval_LOCATION_recall": 0.8985507246376812, "eval_ORGANIZATION_f1": 0.7022900763358779, "eval_ORGANIZATION_number": 58, "eval_ORGANIZATION_precision": 0.6301369863013698, "eval_ORGANIZATION_recall": 0.7931034482758621, "eval_PERSON_f1": 0.8838709677419354, "eval_PERSON_number": 152, "eval_PERSON_precision": 0.8670886075949367, "eval_PERSON_recall": 0.9013157894736842, "eval_QUANTITY_f1": 0.7936507936507938, "eval_QUANTITY_number": 30, "eval_QUANTITY_precision": 0.7575757575757576, "eval_QUANTITY_recall": 0.8333333333333334, "eval_TIME_f1": 0.8620689655172413, "eval_TIME_number": 29, "eval_TIME_precision": 0.8620689655172413, "eval_TIME_recall": 0.8620689655172413, "eval_loss": 0.19200466573238373, "eval_overall_accuracy": 0.9613316261203585, "eval_overall_f1": 0.8356940509915014, "eval_overall_precision": 0.8016304347826086, "eval_overall_recall": 0.8727810650887574, "eval_runtime": 0.8812, "eval_samples_per_second": 212.219, "eval_steps_per_second": 3.405, "step": 5406 }, { "epoch": 52.0, "grad_norm": 0.22858576476573944, "learning_rate": 2.4e-05, "loss": 0.0233, "step": 5512 }, { "epoch": 52.0, "eval_LOCATION_f1": 0.8611111111111112, "eval_LOCATION_number": 69, "eval_LOCATION_precision": 0.8266666666666667, "eval_LOCATION_recall": 0.8985507246376812, "eval_ORGANIZATION_f1": 0.716417910447761, "eval_ORGANIZATION_number": 58, "eval_ORGANIZATION_precision": 0.631578947368421, "eval_ORGANIZATION_recall": 0.8275862068965517, "eval_PERSON_f1": 0.8789808917197451, "eval_PERSON_number": 152, "eval_PERSON_precision": 0.8518518518518519, "eval_PERSON_recall": 0.9078947368421053, "eval_QUANTITY_f1": 0.7936507936507938, "eval_QUANTITY_number": 30, "eval_QUANTITY_precision": 0.7575757575757576, "eval_QUANTITY_recall": 0.8333333333333334, "eval_TIME_f1": 0.7931034482758621, "eval_TIME_number": 29, "eval_TIME_precision": 0.7931034482758621, "eval_TIME_recall": 0.7931034482758621, "eval_loss": 0.19999483227729797, "eval_overall_accuracy": 0.9590268886043534, "eval_overall_f1": 0.8302945301542777, "eval_overall_precision": 0.7893333333333333, "eval_overall_recall": 0.8757396449704142, "eval_runtime": 0.8802, "eval_samples_per_second": 212.441, "eval_steps_per_second": 3.408, "step": 5512 }, { "epoch": 53.0, "grad_norm": 1.8902926445007324, "learning_rate": 2.35e-05, "loss": 0.0233, "step": 5618 }, { "epoch": 53.0, "eval_LOCATION_f1": 0.853146853146853, "eval_LOCATION_number": 69, "eval_LOCATION_precision": 0.8243243243243243, "eval_LOCATION_recall": 0.8840579710144928, "eval_ORGANIZATION_f1": 0.6923076923076923, "eval_ORGANIZATION_number": 58, "eval_ORGANIZATION_precision": 0.625, "eval_ORGANIZATION_recall": 0.7758620689655172, "eval_PERSON_f1": 0.8846153846153847, "eval_PERSON_number": 152, "eval_PERSON_precision": 0.8625, "eval_PERSON_recall": 0.9078947368421053, "eval_QUANTITY_f1": 0.7500000000000001, "eval_QUANTITY_number": 30, "eval_QUANTITY_precision": 0.7058823529411765, "eval_QUANTITY_recall": 0.8, "eval_TIME_f1": 0.8333333333333334, "eval_TIME_number": 29, "eval_TIME_precision": 0.8064516129032258, "eval_TIME_recall": 0.8620689655172413, "eval_loss": 0.19701984524726868, "eval_overall_accuracy": 0.9608194622279129, "eval_overall_f1": 0.8265162200282087, "eval_overall_precision": 0.7897574123989218, "eval_overall_recall": 0.8668639053254438, "eval_runtime": 0.8753, "eval_samples_per_second": 213.637, "eval_steps_per_second": 3.427, "step": 5618 }, { "epoch": 54.0, "grad_norm": 0.5953955054283142, "learning_rate": 2.3000000000000003e-05, "loss": 0.0211, "step": 5724 }, { "epoch": 54.0, "eval_LOCATION_f1": 0.8571428571428572, "eval_LOCATION_number": 69, "eval_LOCATION_precision": 0.8076923076923077, "eval_LOCATION_recall": 0.9130434782608695, "eval_ORGANIZATION_f1": 0.7200000000000001, "eval_ORGANIZATION_number": 58, "eval_ORGANIZATION_precision": 0.6716417910447762, "eval_ORGANIZATION_recall": 0.7758620689655172, "eval_PERSON_f1": 0.860759493670886, "eval_PERSON_number": 152, "eval_PERSON_precision": 0.8292682926829268, "eval_PERSON_recall": 0.8947368421052632, "eval_QUANTITY_f1": 0.8064516129032259, "eval_QUANTITY_number": 30, "eval_QUANTITY_precision": 0.78125, "eval_QUANTITY_recall": 0.8333333333333334, "eval_TIME_f1": 0.847457627118644, "eval_TIME_number": 29, "eval_TIME_precision": 0.8333333333333334, "eval_TIME_recall": 0.8620689655172413, "eval_loss": 0.21723441779613495, "eval_overall_accuracy": 0.9595390524967989, "eval_overall_f1": 0.8293370944992947, "eval_overall_precision": 0.7924528301886793, "eval_overall_recall": 0.8698224852071006, "eval_runtime": 0.8826, "eval_samples_per_second": 211.865, "eval_steps_per_second": 3.399, "step": 5724 }, { "epoch": 55.0, "grad_norm": 2.6492440700531006, "learning_rate": 2.25e-05, "loss": 0.0217, "step": 5830 }, { "epoch": 55.0, "eval_LOCATION_f1": 0.8551724137931034, "eval_LOCATION_number": 69, "eval_LOCATION_precision": 0.8157894736842105, "eval_LOCATION_recall": 0.8985507246376812, "eval_ORGANIZATION_f1": 0.6507936507936507, "eval_ORGANIZATION_number": 58, "eval_ORGANIZATION_precision": 0.6029411764705882, "eval_ORGANIZATION_recall": 0.7068965517241379, "eval_PERSON_f1": 0.8838709677419354, "eval_PERSON_number": 152, "eval_PERSON_precision": 0.8670886075949367, "eval_PERSON_recall": 0.9013157894736842, "eval_QUANTITY_f1": 0.8064516129032259, "eval_QUANTITY_number": 30, "eval_QUANTITY_precision": 0.78125, "eval_QUANTITY_recall": 0.8333333333333334, "eval_TIME_f1": 0.8813559322033899, "eval_TIME_number": 29, "eval_TIME_precision": 0.8666666666666667, "eval_TIME_recall": 0.896551724137931, "eval_loss": 0.19644935429096222, "eval_overall_accuracy": 0.9608194622279129, "eval_overall_f1": 0.829059829059829, "eval_overall_precision": 0.7994505494505495, "eval_overall_recall": 0.8609467455621301, "eval_runtime": 0.8838, "eval_samples_per_second": 211.588, "eval_steps_per_second": 3.394, "step": 5830 }, { "epoch": 56.0, "grad_norm": 0.8844048380851746, "learning_rate": 2.2000000000000003e-05, "loss": 0.0214, "step": 5936 }, { "epoch": 56.0, "eval_LOCATION_f1": 0.8749999999999999, "eval_LOCATION_number": 69, "eval_LOCATION_precision": 0.84, "eval_LOCATION_recall": 0.9130434782608695, "eval_ORGANIZATION_f1": 0.7096774193548386, "eval_ORGANIZATION_number": 58, "eval_ORGANIZATION_precision": 0.6666666666666666, "eval_ORGANIZATION_recall": 0.7586206896551724, "eval_PERSON_f1": 0.8817891373801917, "eval_PERSON_number": 152, "eval_PERSON_precision": 0.8571428571428571, "eval_PERSON_recall": 0.9078947368421053, "eval_QUANTITY_f1": 0.8064516129032259, "eval_QUANTITY_number": 30, "eval_QUANTITY_precision": 0.78125, "eval_QUANTITY_recall": 0.8333333333333334, "eval_TIME_f1": 0.847457627118644, "eval_TIME_number": 29, "eval_TIME_precision": 0.8333333333333334, "eval_TIME_recall": 0.8620689655172413, "eval_loss": 0.20219193398952484, "eval_overall_accuracy": 0.9620998719590269, "eval_overall_f1": 0.8404558404558404, "eval_overall_precision": 0.8104395604395604, "eval_overall_recall": 0.8727810650887574, "eval_runtime": 0.8832, "eval_samples_per_second": 211.741, "eval_steps_per_second": 3.397, "step": 5936 }, { "epoch": 57.0, "grad_norm": 0.3619399666786194, "learning_rate": 2.15e-05, "loss": 0.0197, "step": 6042 }, { "epoch": 57.0, "eval_LOCATION_f1": 0.8493150684931507, "eval_LOCATION_number": 69, "eval_LOCATION_precision": 0.8051948051948052, "eval_LOCATION_recall": 0.8985507246376812, "eval_ORGANIZATION_f1": 0.7049180327868853, "eval_ORGANIZATION_number": 58, "eval_ORGANIZATION_precision": 0.671875, "eval_ORGANIZATION_recall": 0.7413793103448276, "eval_PERSON_f1": 0.8903225806451613, "eval_PERSON_number": 152, "eval_PERSON_precision": 0.8734177215189873, "eval_PERSON_recall": 0.9078947368421053, "eval_QUANTITY_f1": 0.78125, "eval_QUANTITY_number": 30, "eval_QUANTITY_precision": 0.7352941176470589, "eval_QUANTITY_recall": 0.8333333333333334, "eval_TIME_f1": 0.8135593220338982, "eval_TIME_number": 29, "eval_TIME_precision": 0.8, "eval_TIME_recall": 0.8275862068965517, "eval_loss": 0.20077820122241974, "eval_overall_accuracy": 0.9608194622279129, "eval_overall_f1": 0.8330955777460769, "eval_overall_precision": 0.8044077134986226, "eval_overall_recall": 0.863905325443787, "eval_runtime": 0.9531, "eval_samples_per_second": 196.195, "eval_steps_per_second": 3.148, "step": 6042 }, { "epoch": 58.0, "grad_norm": 0.1735541820526123, "learning_rate": 2.1e-05, "loss": 0.0216, "step": 6148 }, { "epoch": 58.0, "eval_LOCATION_f1": 0.8551724137931034, "eval_LOCATION_number": 69, "eval_LOCATION_precision": 0.8157894736842105, "eval_LOCATION_recall": 0.8985507246376812, "eval_ORGANIZATION_f1": 0.7131782945736435, "eval_ORGANIZATION_number": 58, "eval_ORGANIZATION_precision": 0.647887323943662, "eval_ORGANIZATION_recall": 0.7931034482758621, "eval_PERSON_f1": 0.8782051282051281, "eval_PERSON_number": 152, "eval_PERSON_precision": 0.85625, "eval_PERSON_recall": 0.9013157894736842, "eval_QUANTITY_f1": 0.7936507936507938, "eval_QUANTITY_number": 30, "eval_QUANTITY_precision": 0.7575757575757576, "eval_QUANTITY_recall": 0.8333333333333334, "eval_TIME_f1": 0.847457627118644, "eval_TIME_number": 29, "eval_TIME_precision": 0.8333333333333334, "eval_TIME_recall": 0.8620689655172413, "eval_loss": 0.21140815317630768, "eval_overall_accuracy": 0.9597951344430218, "eval_overall_f1": 0.8333333333333334, "eval_overall_precision": 0.7972972972972973, "eval_overall_recall": 0.8727810650887574, "eval_runtime": 0.8863, "eval_samples_per_second": 210.995, "eval_steps_per_second": 3.385, "step": 6148 }, { "epoch": 59.0, "grad_norm": 0.837820291519165, "learning_rate": 2.05e-05, "loss": 0.0197, "step": 6254 }, { "epoch": 59.0, "eval_LOCATION_f1": 0.863013698630137, "eval_LOCATION_number": 69, "eval_LOCATION_precision": 0.8181818181818182, "eval_LOCATION_recall": 0.9130434782608695, "eval_ORGANIZATION_f1": 0.7244094488188977, "eval_ORGANIZATION_number": 58, "eval_ORGANIZATION_precision": 0.6666666666666666, "eval_ORGANIZATION_recall": 0.7931034482758621, "eval_PERSON_f1": 0.8846153846153847, "eval_PERSON_number": 152, "eval_PERSON_precision": 0.8625, "eval_PERSON_recall": 0.9078947368421053, "eval_QUANTITY_f1": 0.7936507936507938, "eval_QUANTITY_number": 30, "eval_QUANTITY_precision": 0.7575757575757576, "eval_QUANTITY_recall": 0.8333333333333334, "eval_TIME_f1": 0.8333333333333334, "eval_TIME_number": 29, "eval_TIME_precision": 0.8064516129032258, "eval_TIME_recall": 0.8620689655172413, "eval_loss": 0.20840610563755035, "eval_overall_accuracy": 0.9600512163892445, "eval_overall_f1": 0.8389830508474576, "eval_overall_precision": 0.8027027027027027, "eval_overall_recall": 0.878698224852071, "eval_runtime": 0.8868, "eval_samples_per_second": 210.865, "eval_steps_per_second": 3.383, "step": 6254 }, { "epoch": 60.0, "grad_norm": 0.5633171796798706, "learning_rate": 2e-05, "loss": 0.0182, "step": 6360 }, { "epoch": 60.0, "eval_LOCATION_f1": 0.863013698630137, "eval_LOCATION_number": 69, "eval_LOCATION_precision": 0.8181818181818182, "eval_LOCATION_recall": 0.9130434782608695, "eval_ORGANIZATION_f1": 0.7286821705426356, "eval_ORGANIZATION_number": 58, "eval_ORGANIZATION_precision": 0.6619718309859155, "eval_ORGANIZATION_recall": 0.8103448275862069, "eval_PERSON_f1": 0.8726114649681528, "eval_PERSON_number": 152, "eval_PERSON_precision": 0.845679012345679, "eval_PERSON_recall": 0.9013157894736842, "eval_QUANTITY_f1": 0.7936507936507938, "eval_QUANTITY_number": 30, "eval_QUANTITY_precision": 0.7575757575757576, "eval_QUANTITY_recall": 0.8333333333333334, "eval_TIME_f1": 0.8666666666666666, "eval_TIME_number": 29, "eval_TIME_precision": 0.8387096774193549, "eval_TIME_recall": 0.896551724137931, "eval_loss": 0.21587228775024414, "eval_overall_accuracy": 0.9603072983354674, "eval_overall_f1": 0.8370786516853933, "eval_overall_precision": 0.7967914438502673, "eval_overall_recall": 0.8816568047337278, "eval_runtime": 0.8748, "eval_samples_per_second": 213.775, "eval_steps_per_second": 3.43, "step": 6360 }, { "epoch": 61.0, "grad_norm": 0.4832909405231476, "learning_rate": 1.9500000000000003e-05, "loss": 0.0196, "step": 6466 }, { "epoch": 61.0, "eval_LOCATION_f1": 0.863013698630137, "eval_LOCATION_number": 69, "eval_LOCATION_precision": 0.8181818181818182, "eval_LOCATION_recall": 0.9130434782608695, "eval_ORGANIZATION_f1": 0.7200000000000001, "eval_ORGANIZATION_number": 58, "eval_ORGANIZATION_precision": 0.6716417910447762, "eval_ORGANIZATION_recall": 0.7758620689655172, "eval_PERSON_f1": 0.8846153846153847, "eval_PERSON_number": 152, "eval_PERSON_precision": 0.8625, "eval_PERSON_recall": 0.9078947368421053, "eval_QUANTITY_f1": 0.7936507936507938, "eval_QUANTITY_number": 30, "eval_QUANTITY_precision": 0.7575757575757576, "eval_QUANTITY_recall": 0.8333333333333334, "eval_TIME_f1": 0.8813559322033899, "eval_TIME_number": 29, "eval_TIME_precision": 0.8666666666666667, "eval_TIME_recall": 0.896551724137931, "eval_loss": 0.20733201503753662, "eval_overall_accuracy": 0.9615877080665813, "eval_overall_f1": 0.8425531914893617, "eval_overall_precision": 0.8092643051771117, "eval_overall_recall": 0.878698224852071, "eval_runtime": 0.9535, "eval_samples_per_second": 196.123, "eval_steps_per_second": 3.146, "step": 6466 }, { "epoch": 62.0, "grad_norm": 0.6487990617752075, "learning_rate": 1.9e-05, "loss": 0.0176, "step": 6572 }, { "epoch": 62.0, "eval_LOCATION_f1": 0.8671328671328672, "eval_LOCATION_number": 69, "eval_LOCATION_precision": 0.8378378378378378, "eval_LOCATION_recall": 0.8985507246376812, "eval_ORGANIZATION_f1": 0.7213114754098361, "eval_ORGANIZATION_number": 58, "eval_ORGANIZATION_precision": 0.6875, "eval_ORGANIZATION_recall": 0.7586206896551724, "eval_PERSON_f1": 0.8769716088328074, "eval_PERSON_number": 152, "eval_PERSON_precision": 0.8424242424242424, "eval_PERSON_recall": 0.9144736842105263, "eval_QUANTITY_f1": 0.7936507936507938, "eval_QUANTITY_number": 30, "eval_QUANTITY_precision": 0.7575757575757576, "eval_QUANTITY_recall": 0.8333333333333334, "eval_TIME_f1": 0.7931034482758621, "eval_TIME_number": 29, "eval_TIME_precision": 0.7931034482758621, "eval_TIME_recall": 0.7931034482758621, "eval_loss": 0.20125307142734528, "eval_overall_accuracy": 0.9605633802816902, "eval_overall_f1": 0.8335704125177809, "eval_overall_precision": 0.8027397260273973, "eval_overall_recall": 0.8668639053254438, "eval_runtime": 0.8874, "eval_samples_per_second": 210.718, "eval_steps_per_second": 3.38, "step": 6572 }, { "epoch": 63.0, "grad_norm": 0.8727775812149048, "learning_rate": 1.85e-05, "loss": 0.0157, "step": 6678 }, { "epoch": 63.0, "eval_LOCATION_f1": 0.8356164383561644, "eval_LOCATION_number": 69, "eval_LOCATION_precision": 0.7922077922077922, "eval_LOCATION_recall": 0.8840579710144928, "eval_ORGANIZATION_f1": 0.6833333333333333, "eval_ORGANIZATION_number": 58, "eval_ORGANIZATION_precision": 0.6612903225806451, "eval_ORGANIZATION_recall": 0.7068965517241379, "eval_PERSON_f1": 0.8838709677419354, "eval_PERSON_number": 152, "eval_PERSON_precision": 0.8670886075949367, "eval_PERSON_recall": 0.9013157894736842, "eval_QUANTITY_f1": 0.8064516129032259, "eval_QUANTITY_number": 30, "eval_QUANTITY_precision": 0.78125, "eval_QUANTITY_recall": 0.8333333333333334, "eval_TIME_f1": 0.8333333333333334, "eval_TIME_number": 29, "eval_TIME_precision": 0.8064516129032258, "eval_TIME_recall": 0.8620689655172413, "eval_loss": 0.20443986356258392, "eval_overall_accuracy": 0.9600512163892445, "eval_overall_f1": 0.828080229226361, "eval_overall_precision": 0.8027777777777778, "eval_overall_recall": 0.8550295857988166, "eval_runtime": 0.8782, "eval_samples_per_second": 212.933, "eval_steps_per_second": 3.416, "step": 6678 }, { "epoch": 64.0, "grad_norm": 1.5122424364089966, "learning_rate": 1.8e-05, "loss": 0.0177, "step": 6784 }, { "epoch": 64.0, "eval_LOCATION_f1": 0.8476821192052981, "eval_LOCATION_number": 69, "eval_LOCATION_precision": 0.7804878048780488, "eval_LOCATION_recall": 0.927536231884058, "eval_ORGANIZATION_f1": 0.7175572519083969, "eval_ORGANIZATION_number": 58, "eval_ORGANIZATION_precision": 0.6438356164383562, "eval_ORGANIZATION_recall": 0.8103448275862069, "eval_PERSON_f1": 0.8652037617554859, "eval_PERSON_number": 152, "eval_PERSON_precision": 0.8263473053892215, "eval_PERSON_recall": 0.9078947368421053, "eval_QUANTITY_f1": 0.7936507936507938, "eval_QUANTITY_number": 30, "eval_QUANTITY_precision": 0.7575757575757576, "eval_QUANTITY_recall": 0.8333333333333334, "eval_TIME_f1": 0.8813559322033899, "eval_TIME_number": 29, "eval_TIME_precision": 0.8666666666666667, "eval_TIME_recall": 0.896551724137931, "eval_loss": 0.22791583836078644, "eval_overall_accuracy": 0.9590268886043534, "eval_overall_f1": 0.8298755186721992, "eval_overall_precision": 0.7792207792207793, "eval_overall_recall": 0.8875739644970414, "eval_runtime": 0.8723, "eval_samples_per_second": 214.372, "eval_steps_per_second": 3.439, "step": 6784 }, { "epoch": 65.0, "grad_norm": 1.5700312852859497, "learning_rate": 1.75e-05, "loss": 0.0165, "step": 6890 }, { "epoch": 65.0, "eval_LOCATION_f1": 0.8493150684931507, "eval_LOCATION_number": 69, "eval_LOCATION_precision": 0.8051948051948052, "eval_LOCATION_recall": 0.8985507246376812, "eval_ORGANIZATION_f1": 0.7301587301587301, "eval_ORGANIZATION_number": 58, "eval_ORGANIZATION_precision": 0.6764705882352942, "eval_ORGANIZATION_recall": 0.7931034482758621, "eval_PERSON_f1": 0.8698412698412699, "eval_PERSON_number": 152, "eval_PERSON_precision": 0.8404907975460123, "eval_PERSON_recall": 0.9013157894736842, "eval_QUANTITY_f1": 0.761904761904762, "eval_QUANTITY_number": 30, "eval_QUANTITY_precision": 0.7272727272727273, "eval_QUANTITY_recall": 0.8, "eval_TIME_f1": 0.8135593220338982, "eval_TIME_number": 29, "eval_TIME_precision": 0.8, "eval_TIME_recall": 0.8275862068965517, "eval_loss": 0.21637500822544098, "eval_overall_accuracy": 0.9585147247119078, "eval_overall_f1": 0.8265162200282087, "eval_overall_precision": 0.7897574123989218, "eval_overall_recall": 0.8668639053254438, "eval_runtime": 0.8725, "eval_samples_per_second": 214.338, "eval_steps_per_second": 3.439, "step": 6890 }, { "epoch": 66.0, "grad_norm": 0.9781705737113953, "learning_rate": 1.7000000000000003e-05, "loss": 0.0171, "step": 6996 }, { "epoch": 66.0, "eval_LOCATION_f1": 0.8648648648648648, "eval_LOCATION_number": 69, "eval_LOCATION_precision": 0.810126582278481, "eval_LOCATION_recall": 0.927536231884058, "eval_ORGANIZATION_f1": 0.746031746031746, "eval_ORGANIZATION_number": 58, "eval_ORGANIZATION_precision": 0.6911764705882353, "eval_ORGANIZATION_recall": 0.8103448275862069, "eval_PERSON_f1": 0.8734177215189874, "eval_PERSON_number": 152, "eval_PERSON_precision": 0.8414634146341463, "eval_PERSON_recall": 0.9078947368421053, "eval_QUANTITY_f1": 0.7936507936507938, "eval_QUANTITY_number": 30, "eval_QUANTITY_precision": 0.7575757575757576, "eval_QUANTITY_recall": 0.8333333333333334, "eval_TIME_f1": 0.8813559322033899, "eval_TIME_number": 29, "eval_TIME_precision": 0.8666666666666667, "eval_TIME_recall": 0.896551724137931, "eval_loss": 0.21887072920799255, "eval_overall_accuracy": 0.9620998719590269, "eval_overall_f1": 0.8426966292134831, "eval_overall_precision": 0.8021390374331551, "eval_overall_recall": 0.8875739644970414, "eval_runtime": 0.8649, "eval_samples_per_second": 216.219, "eval_steps_per_second": 3.469, "step": 6996 }, { "epoch": 67.0, "grad_norm": 0.7777842879295349, "learning_rate": 1.65e-05, "loss": 0.0167, "step": 7102 }, { "epoch": 67.0, "eval_LOCATION_f1": 0.8590604026845639, "eval_LOCATION_number": 69, "eval_LOCATION_precision": 0.8, "eval_LOCATION_recall": 0.927536231884058, "eval_ORGANIZATION_f1": 0.7286821705426356, "eval_ORGANIZATION_number": 58, "eval_ORGANIZATION_precision": 0.6619718309859155, "eval_ORGANIZATION_recall": 0.8103448275862069, "eval_PERSON_f1": 0.8832807570977917, "eval_PERSON_number": 152, "eval_PERSON_precision": 0.8484848484848485, "eval_PERSON_recall": 0.9210526315789473, "eval_QUANTITY_f1": 0.7936507936507938, "eval_QUANTITY_number": 30, "eval_QUANTITY_precision": 0.7575757575757576, "eval_QUANTITY_recall": 0.8333333333333334, "eval_TIME_f1": 0.7812500000000001, "eval_TIME_number": 29, "eval_TIME_precision": 0.7142857142857143, "eval_TIME_recall": 0.8620689655172413, "eval_loss": 0.23059594631195068, "eval_overall_accuracy": 0.9597951344430218, "eval_overall_f1": 0.8337950138504154, "eval_overall_precision": 0.7838541666666666, "eval_overall_recall": 0.8905325443786982, "eval_runtime": 0.8828, "eval_samples_per_second": 211.834, "eval_steps_per_second": 3.398, "step": 7102 }, { "epoch": 68.0, "grad_norm": 0.42934471368789673, "learning_rate": 1.6000000000000003e-05, "loss": 0.0156, "step": 7208 }, { "epoch": 68.0, "eval_LOCATION_f1": 0.863013698630137, "eval_LOCATION_number": 69, "eval_LOCATION_precision": 0.8181818181818182, "eval_LOCATION_recall": 0.9130434782608695, "eval_ORGANIZATION_f1": 0.7580645161290323, "eval_ORGANIZATION_number": 58, "eval_ORGANIZATION_precision": 0.7121212121212122, "eval_ORGANIZATION_recall": 0.8103448275862069, "eval_PERSON_f1": 0.8853503184713376, "eval_PERSON_number": 152, "eval_PERSON_precision": 0.8580246913580247, "eval_PERSON_recall": 0.9144736842105263, "eval_QUANTITY_f1": 0.8064516129032259, "eval_QUANTITY_number": 30, "eval_QUANTITY_precision": 0.78125, "eval_QUANTITY_recall": 0.8333333333333334, "eval_TIME_f1": 0.8666666666666666, "eval_TIME_number": 29, "eval_TIME_precision": 0.8387096774193549, "eval_TIME_recall": 0.896551724137931, "eval_loss": 0.21977542340755463, "eval_overall_accuracy": 0.9623559539052496, "eval_overall_f1": 0.8498583569405098, "eval_overall_precision": 0.8152173913043478, "eval_overall_recall": 0.8875739644970414, "eval_runtime": 0.8618, "eval_samples_per_second": 216.978, "eval_steps_per_second": 3.481, "step": 7208 }, { "epoch": 69.0, "grad_norm": 1.0344369411468506, "learning_rate": 1.55e-05, "loss": 0.0156, "step": 7314 }, { "epoch": 69.0, "eval_LOCATION_f1": 0.8590604026845639, "eval_LOCATION_number": 69, "eval_LOCATION_precision": 0.8, "eval_LOCATION_recall": 0.927536231884058, "eval_ORGANIZATION_f1": 0.7175572519083969, "eval_ORGANIZATION_number": 58, "eval_ORGANIZATION_precision": 0.6438356164383562, "eval_ORGANIZATION_recall": 0.8103448275862069, "eval_PERSON_f1": 0.8903225806451613, "eval_PERSON_number": 152, "eval_PERSON_precision": 0.8734177215189873, "eval_PERSON_recall": 0.9078947368421053, "eval_QUANTITY_f1": 0.7936507936507938, "eval_QUANTITY_number": 30, "eval_QUANTITY_precision": 0.7575757575757576, "eval_QUANTITY_recall": 0.8333333333333334, "eval_TIME_f1": 0.847457627118644, "eval_TIME_number": 29, "eval_TIME_precision": 0.8333333333333334, "eval_TIME_recall": 0.8620689655172413, "eval_loss": 0.21617823839187622, "eval_overall_accuracy": 0.9615877080665813, "eval_overall_f1": 0.8398876404494382, "eval_overall_precision": 0.7994652406417112, "eval_overall_recall": 0.8846153846153846, "eval_runtime": 0.8721, "eval_samples_per_second": 214.436, "eval_steps_per_second": 3.44, "step": 7314 }, { "epoch": 70.0, "grad_norm": 1.9640426635742188, "learning_rate": 1.5e-05, "loss": 0.0155, "step": 7420 }, { "epoch": 70.0, "eval_LOCATION_f1": 0.8421052631578948, "eval_LOCATION_number": 69, "eval_LOCATION_precision": 0.7710843373493976, "eval_LOCATION_recall": 0.927536231884058, "eval_ORGANIZATION_f1": 0.7086614173228347, "eval_ORGANIZATION_number": 58, "eval_ORGANIZATION_precision": 0.6521739130434783, "eval_ORGANIZATION_recall": 0.7758620689655172, "eval_PERSON_f1": 0.8797468354430381, "eval_PERSON_number": 152, "eval_PERSON_precision": 0.8475609756097561, "eval_PERSON_recall": 0.9144736842105263, "eval_QUANTITY_f1": 0.78125, "eval_QUANTITY_number": 30, "eval_QUANTITY_precision": 0.7352941176470589, "eval_QUANTITY_recall": 0.8333333333333334, "eval_TIME_f1": 0.847457627118644, "eval_TIME_number": 29, "eval_TIME_precision": 0.8333333333333334, "eval_TIME_recall": 0.8620689655172413, "eval_loss": 0.22830812633037567, "eval_overall_accuracy": 0.9592829705505762, "eval_overall_f1": 0.83008356545961, "eval_overall_precision": 0.7842105263157895, "eval_overall_recall": 0.8816568047337278, "eval_runtime": 0.8737, "eval_samples_per_second": 214.022, "eval_steps_per_second": 3.434, "step": 7420 }, { "epoch": 71.0, "grad_norm": 0.16448061168193817, "learning_rate": 1.45e-05, "loss": 0.0142, "step": 7526 }, { "epoch": 71.0, "eval_LOCATION_f1": 0.8513513513513514, "eval_LOCATION_number": 69, "eval_LOCATION_precision": 0.7974683544303798, "eval_LOCATION_recall": 0.9130434782608695, "eval_ORGANIZATION_f1": 0.6911764705882352, "eval_ORGANIZATION_number": 58, "eval_ORGANIZATION_precision": 0.6025641025641025, "eval_ORGANIZATION_recall": 0.8103448275862069, "eval_PERSON_f1": 0.8782051282051281, "eval_PERSON_number": 152, "eval_PERSON_precision": 0.85625, "eval_PERSON_recall": 0.9013157894736842, "eval_QUANTITY_f1": 0.7936507936507938, "eval_QUANTITY_number": 30, "eval_QUANTITY_precision": 0.7575757575757576, "eval_QUANTITY_recall": 0.8333333333333334, "eval_TIME_f1": 0.8813559322033899, "eval_TIME_number": 29, "eval_TIME_precision": 0.8666666666666667, "eval_TIME_recall": 0.896551724137931, "eval_loss": 0.2332638055086136, "eval_overall_accuracy": 0.9590268886043534, "eval_overall_f1": 0.83008356545961, "eval_overall_precision": 0.7842105263157895, "eval_overall_recall": 0.8816568047337278, "eval_runtime": 0.8749, "eval_samples_per_second": 213.733, "eval_steps_per_second": 3.429, "step": 7526 }, { "epoch": 72.0, "grad_norm": 0.25591084361076355, "learning_rate": 1.4000000000000001e-05, "loss": 0.0165, "step": 7632 }, { "epoch": 72.0, "eval_LOCATION_f1": 0.863013698630137, "eval_LOCATION_number": 69, "eval_LOCATION_precision": 0.8181818181818182, "eval_LOCATION_recall": 0.9130434782608695, "eval_ORGANIZATION_f1": 0.7401574803149606, "eval_ORGANIZATION_number": 58, "eval_ORGANIZATION_precision": 0.6811594202898551, "eval_ORGANIZATION_recall": 0.8103448275862069, "eval_PERSON_f1": 0.8745980707395499, "eval_PERSON_number": 152, "eval_PERSON_precision": 0.8553459119496856, "eval_PERSON_recall": 0.8947368421052632, "eval_QUANTITY_f1": 0.8253968253968254, "eval_QUANTITY_number": 30, "eval_QUANTITY_precision": 0.7878787878787878, "eval_QUANTITY_recall": 0.8666666666666667, "eval_TIME_f1": 0.8666666666666666, "eval_TIME_number": 29, "eval_TIME_precision": 0.8387096774193549, "eval_TIME_recall": 0.896551724137931, "eval_loss": 0.2185453474521637, "eval_overall_accuracy": 0.9620998719590269, "eval_overall_f1": 0.8429985855728428, "eval_overall_precision": 0.8075880758807588, "eval_overall_recall": 0.8816568047337278, "eval_runtime": 0.8809, "eval_samples_per_second": 212.292, "eval_steps_per_second": 3.406, "step": 7632 }, { "epoch": 73.0, "grad_norm": 0.047924935817718506, "learning_rate": 1.3500000000000001e-05, "loss": 0.0145, "step": 7738 }, { "epoch": 73.0, "eval_LOCATION_f1": 0.8378378378378378, "eval_LOCATION_number": 69, "eval_LOCATION_precision": 0.7848101265822784, "eval_LOCATION_recall": 0.8985507246376812, "eval_ORGANIZATION_f1": 0.7258064516129032, "eval_ORGANIZATION_number": 58, "eval_ORGANIZATION_precision": 0.6818181818181818, "eval_ORGANIZATION_recall": 0.7758620689655172, "eval_PERSON_f1": 0.8774193548387097, "eval_PERSON_number": 152, "eval_PERSON_precision": 0.8607594936708861, "eval_PERSON_recall": 0.8947368421052632, "eval_QUANTITY_f1": 0.8253968253968254, "eval_QUANTITY_number": 30, "eval_QUANTITY_precision": 0.7878787878787878, "eval_QUANTITY_recall": 0.8666666666666667, "eval_TIME_f1": 0.847457627118644, "eval_TIME_number": 29, "eval_TIME_precision": 0.8333333333333334, "eval_TIME_recall": 0.8620689655172413, "eval_loss": 0.22260642051696777, "eval_overall_accuracy": 0.9605633802816902, "eval_overall_f1": 0.8352272727272727, "eval_overall_precision": 0.8032786885245902, "eval_overall_recall": 0.8698224852071006, "eval_runtime": 0.8798, "eval_samples_per_second": 212.544, "eval_steps_per_second": 3.41, "step": 7738 }, { "epoch": 74.0, "grad_norm": 0.29497218132019043, "learning_rate": 1.3000000000000001e-05, "loss": 0.0135, "step": 7844 }, { "epoch": 74.0, "eval_LOCATION_f1": 0.8571428571428572, "eval_LOCATION_number": 69, "eval_LOCATION_precision": 0.8076923076923077, "eval_LOCATION_recall": 0.9130434782608695, "eval_ORGANIZATION_f1": 0.688, "eval_ORGANIZATION_number": 58, "eval_ORGANIZATION_precision": 0.6417910447761194, "eval_ORGANIZATION_recall": 0.7413793103448276, "eval_PERSON_f1": 0.8810289389067525, "eval_PERSON_number": 152, "eval_PERSON_precision": 0.8616352201257862, "eval_PERSON_recall": 0.9013157894736842, "eval_QUANTITY_f1": 0.7936507936507938, "eval_QUANTITY_number": 30, "eval_QUANTITY_precision": 0.7575757575757576, "eval_QUANTITY_recall": 0.8333333333333334, "eval_TIME_f1": 0.8524590163934426, "eval_TIME_number": 29, "eval_TIME_precision": 0.8125, "eval_TIME_recall": 0.896551724137931, "eval_loss": 0.2320089489221573, "eval_overall_accuracy": 0.9595390524967989, "eval_overall_f1": 0.8316831683168318, "eval_overall_precision": 0.7967479674796748, "eval_overall_recall": 0.8698224852071006, "eval_runtime": 0.8782, "eval_samples_per_second": 212.931, "eval_steps_per_second": 3.416, "step": 7844 }, { "epoch": 75.0, "grad_norm": 0.01762392371892929, "learning_rate": 1.25e-05, "loss": 0.0138, "step": 7950 }, { "epoch": 75.0, "eval_LOCATION_f1": 0.8456375838926175, "eval_LOCATION_number": 69, "eval_LOCATION_precision": 0.7875, "eval_LOCATION_recall": 0.9130434782608695, "eval_ORGANIZATION_f1": 0.7286821705426356, "eval_ORGANIZATION_number": 58, "eval_ORGANIZATION_precision": 0.6619718309859155, "eval_ORGANIZATION_recall": 0.8103448275862069, "eval_PERSON_f1": 0.8789808917197451, "eval_PERSON_number": 152, "eval_PERSON_precision": 0.8518518518518519, "eval_PERSON_recall": 0.9078947368421053, "eval_QUANTITY_f1": 0.7936507936507938, "eval_QUANTITY_number": 30, "eval_QUANTITY_precision": 0.7575757575757576, "eval_QUANTITY_recall": 0.8333333333333334, "eval_TIME_f1": 0.8196721311475409, "eval_TIME_number": 29, "eval_TIME_precision": 0.78125, "eval_TIME_recall": 0.8620689655172413, "eval_loss": 0.2413773536682129, "eval_overall_accuracy": 0.9585147247119078, "eval_overall_f1": 0.8324022346368716, "eval_overall_precision": 0.7883597883597884, "eval_overall_recall": 0.8816568047337278, "eval_runtime": 0.883, "eval_samples_per_second": 211.783, "eval_steps_per_second": 3.398, "step": 7950 }, { "epoch": 76.0, "grad_norm": 0.21732616424560547, "learning_rate": 1.2e-05, "loss": 0.0129, "step": 8056 }, { "epoch": 76.0, "eval_LOCATION_f1": 0.863013698630137, "eval_LOCATION_number": 69, "eval_LOCATION_precision": 0.8181818181818182, "eval_LOCATION_recall": 0.9130434782608695, "eval_ORGANIZATION_f1": 0.7213114754098361, "eval_ORGANIZATION_number": 58, "eval_ORGANIZATION_precision": 0.6875, "eval_ORGANIZATION_recall": 0.7586206896551724, "eval_PERSON_f1": 0.8846153846153847, "eval_PERSON_number": 152, "eval_PERSON_precision": 0.8625, "eval_PERSON_recall": 0.9078947368421053, "eval_QUANTITY_f1": 0.8387096774193549, "eval_QUANTITY_number": 30, "eval_QUANTITY_precision": 0.8125, "eval_QUANTITY_recall": 0.8666666666666667, "eval_TIME_f1": 0.8813559322033899, "eval_TIME_number": 29, "eval_TIME_precision": 0.8666666666666667, "eval_TIME_recall": 0.896551724137931, "eval_loss": 0.22952446341514587, "eval_overall_accuracy": 0.9615877080665813, "eval_overall_f1": 0.8473609129814551, "eval_overall_precision": 0.8181818181818182, "eval_overall_recall": 0.878698224852071, "eval_runtime": 0.8794, "eval_samples_per_second": 212.653, "eval_steps_per_second": 3.412, "step": 8056 }, { "epoch": 77.0, "grad_norm": 0.42748743295669556, "learning_rate": 1.1500000000000002e-05, "loss": 0.0118, "step": 8162 }, { "epoch": 77.0, "eval_LOCATION_f1": 0.8322147651006713, "eval_LOCATION_number": 69, "eval_LOCATION_precision": 0.775, "eval_LOCATION_recall": 0.8985507246376812, "eval_ORGANIZATION_f1": 0.7301587301587301, "eval_ORGANIZATION_number": 58, "eval_ORGANIZATION_precision": 0.6764705882352942, "eval_ORGANIZATION_recall": 0.7931034482758621, "eval_PERSON_f1": 0.8734177215189874, "eval_PERSON_number": 152, "eval_PERSON_precision": 0.8414634146341463, "eval_PERSON_recall": 0.9078947368421053, "eval_QUANTITY_f1": 0.7936507936507938, "eval_QUANTITY_number": 30, "eval_QUANTITY_precision": 0.7575757575757576, "eval_QUANTITY_recall": 0.8333333333333334, "eval_TIME_f1": 0.8666666666666666, "eval_TIME_number": 29, "eval_TIME_precision": 0.8387096774193549, "eval_TIME_recall": 0.896551724137931, "eval_loss": 0.23922854661941528, "eval_overall_accuracy": 0.9595390524967989, "eval_overall_f1": 0.8319327731092437, "eval_overall_precision": 0.7898936170212766, "eval_overall_recall": 0.878698224852071, "eval_runtime": 0.8708, "eval_samples_per_second": 214.745, "eval_steps_per_second": 3.445, "step": 8162 }, { "epoch": 78.0, "grad_norm": 0.6394297480583191, "learning_rate": 1.1000000000000001e-05, "loss": 0.0127, "step": 8268 }, { "epoch": 78.0, "eval_LOCATION_f1": 0.8689655172413793, "eval_LOCATION_number": 69, "eval_LOCATION_precision": 0.8289473684210527, "eval_LOCATION_recall": 0.9130434782608695, "eval_ORGANIZATION_f1": 0.736, "eval_ORGANIZATION_number": 58, "eval_ORGANIZATION_precision": 0.6865671641791045, "eval_ORGANIZATION_recall": 0.7931034482758621, "eval_PERSON_f1": 0.8810289389067525, "eval_PERSON_number": 152, "eval_PERSON_precision": 0.8616352201257862, "eval_PERSON_recall": 0.9013157894736842, "eval_QUANTITY_f1": 0.7936507936507938, "eval_QUANTITY_number": 30, "eval_QUANTITY_precision": 0.7575757575757576, "eval_QUANTITY_recall": 0.8333333333333334, "eval_TIME_f1": 0.8620689655172413, "eval_TIME_number": 29, "eval_TIME_precision": 0.8620689655172413, "eval_TIME_recall": 0.8620689655172413, "eval_loss": 0.2345399558544159, "eval_overall_accuracy": 0.9615877080665813, "eval_overall_f1": 0.8433048433048432, "eval_overall_precision": 0.8131868131868132, "eval_overall_recall": 0.8757396449704142, "eval_runtime": 0.8826, "eval_samples_per_second": 211.871, "eval_steps_per_second": 3.399, "step": 8268 }, { "epoch": 79.0, "grad_norm": 0.5575834512710571, "learning_rate": 1.05e-05, "loss": 0.0122, "step": 8374 }, { "epoch": 79.0, "eval_LOCATION_f1": 0.8456375838926175, "eval_LOCATION_number": 69, "eval_LOCATION_precision": 0.7875, "eval_LOCATION_recall": 0.9130434782608695, "eval_ORGANIZATION_f1": 0.746031746031746, "eval_ORGANIZATION_number": 58, "eval_ORGANIZATION_precision": 0.6911764705882353, "eval_ORGANIZATION_recall": 0.8103448275862069, "eval_PERSON_f1": 0.8825396825396825, "eval_PERSON_number": 152, "eval_PERSON_precision": 0.852760736196319, "eval_PERSON_recall": 0.9144736842105263, "eval_QUANTITY_f1": 0.7936507936507938, "eval_QUANTITY_number": 30, "eval_QUANTITY_precision": 0.7575757575757576, "eval_QUANTITY_recall": 0.8333333333333334, "eval_TIME_f1": 0.8620689655172413, "eval_TIME_number": 29, "eval_TIME_precision": 0.8620689655172413, "eval_TIME_recall": 0.8620689655172413, "eval_loss": 0.24232904613018036, "eval_overall_accuracy": 0.9608194622279129, "eval_overall_f1": 0.8410689170182841, "eval_overall_precision": 0.8016085790884718, "eval_overall_recall": 0.8846153846153846, "eval_runtime": 0.8823, "eval_samples_per_second": 211.957, "eval_steps_per_second": 3.4, "step": 8374 }, { "epoch": 80.0, "grad_norm": 0.14352549612522125, "learning_rate": 1e-05, "loss": 0.0117, "step": 8480 }, { "epoch": 80.0, "eval_LOCATION_f1": 0.881118881118881, "eval_LOCATION_number": 69, "eval_LOCATION_precision": 0.8513513513513513, "eval_LOCATION_recall": 0.9130434782608695, "eval_ORGANIZATION_f1": 0.7317073170731708, "eval_ORGANIZATION_number": 58, "eval_ORGANIZATION_precision": 0.6923076923076923, "eval_ORGANIZATION_recall": 0.7758620689655172, "eval_PERSON_f1": 0.8782051282051281, "eval_PERSON_number": 152, "eval_PERSON_precision": 0.85625, "eval_PERSON_recall": 0.9013157894736842, "eval_QUANTITY_f1": 0.7936507936507938, "eval_QUANTITY_number": 30, "eval_QUANTITY_precision": 0.7575757575757576, "eval_QUANTITY_recall": 0.8333333333333334, "eval_TIME_f1": 0.8275862068965517, "eval_TIME_number": 29, "eval_TIME_precision": 0.8275862068965517, "eval_TIME_recall": 0.8275862068965517, "eval_loss": 0.22932307422161102, "eval_overall_accuracy": 0.9623559539052496, "eval_overall_f1": 0.8412017167381973, "eval_overall_precision": 0.814404432132964, "eval_overall_recall": 0.8698224852071006, "eval_runtime": 0.882, "eval_samples_per_second": 212.026, "eval_steps_per_second": 3.401, "step": 8480 }, { "epoch": 81.0, "grad_norm": 0.47307726740837097, "learning_rate": 9.5e-06, "loss": 0.012, "step": 8586 }, { "epoch": 81.0, "eval_LOCATION_f1": 0.8456375838926175, "eval_LOCATION_number": 69, "eval_LOCATION_precision": 0.7875, "eval_LOCATION_recall": 0.9130434782608695, "eval_ORGANIZATION_f1": 0.71875, "eval_ORGANIZATION_number": 58, "eval_ORGANIZATION_precision": 0.6571428571428571, "eval_ORGANIZATION_recall": 0.7931034482758621, "eval_PERSON_f1": 0.8881789137380192, "eval_PERSON_number": 152, "eval_PERSON_precision": 0.8633540372670807, "eval_PERSON_recall": 0.9144736842105263, "eval_QUANTITY_f1": 0.761904761904762, "eval_QUANTITY_number": 30, "eval_QUANTITY_precision": 0.7272727272727273, "eval_QUANTITY_recall": 0.8, "eval_TIME_f1": 0.8813559322033899, "eval_TIME_number": 29, "eval_TIME_precision": 0.8666666666666667, "eval_TIME_recall": 0.896551724137931, "eval_loss": 0.23925283551216125, "eval_overall_accuracy": 0.9600512163892445, "eval_overall_f1": 0.8370786516853933, "eval_overall_precision": 0.7967914438502673, "eval_overall_recall": 0.8816568047337278, "eval_runtime": 0.8824, "eval_samples_per_second": 211.922, "eval_steps_per_second": 3.4, "step": 8586 }, { "epoch": 82.0, "grad_norm": 1.2593061923980713, "learning_rate": 9e-06, "loss": 0.013, "step": 8692 }, { "epoch": 82.0, "eval_LOCATION_f1": 0.8456375838926175, "eval_LOCATION_number": 69, "eval_LOCATION_precision": 0.7875, "eval_LOCATION_recall": 0.9130434782608695, "eval_ORGANIZATION_f1": 0.7333333333333333, "eval_ORGANIZATION_number": 58, "eval_ORGANIZATION_precision": 0.7096774193548387, "eval_ORGANIZATION_recall": 0.7586206896551724, "eval_PERSON_f1": 0.8846153846153847, "eval_PERSON_number": 152, "eval_PERSON_precision": 0.8625, "eval_PERSON_recall": 0.9078947368421053, "eval_QUANTITY_f1": 0.7936507936507938, "eval_QUANTITY_number": 30, "eval_QUANTITY_precision": 0.7575757575757576, "eval_QUANTITY_recall": 0.8333333333333334, "eval_TIME_f1": 0.8620689655172413, "eval_TIME_number": 29, "eval_TIME_precision": 0.8620689655172413, "eval_TIME_recall": 0.8620689655172413, "eval_loss": 0.23163729906082153, "eval_overall_accuracy": 0.9608194622279129, "eval_overall_f1": 0.8404558404558404, "eval_overall_precision": 0.8104395604395604, "eval_overall_recall": 0.8727810650887574, "eval_runtime": 0.8706, "eval_samples_per_second": 214.791, "eval_steps_per_second": 3.446, "step": 8692 }, { "epoch": 83.0, "grad_norm": 0.8594510555267334, "learning_rate": 8.500000000000002e-06, "loss": 0.0115, "step": 8798 }, { "epoch": 83.0, "eval_LOCATION_f1": 0.8435374149659864, "eval_LOCATION_number": 69, "eval_LOCATION_precision": 0.7948717948717948, "eval_LOCATION_recall": 0.8985507246376812, "eval_ORGANIZATION_f1": 0.7096774193548386, "eval_ORGANIZATION_number": 58, "eval_ORGANIZATION_precision": 0.6666666666666666, "eval_ORGANIZATION_recall": 0.7586206896551724, "eval_PERSON_f1": 0.8874598070739551, "eval_PERSON_number": 152, "eval_PERSON_precision": 0.8679245283018868, "eval_PERSON_recall": 0.9078947368421053, "eval_QUANTITY_f1": 0.7936507936507938, "eval_QUANTITY_number": 30, "eval_QUANTITY_precision": 0.7575757575757576, "eval_QUANTITY_recall": 0.8333333333333334, "eval_TIME_f1": 0.8813559322033899, "eval_TIME_number": 29, "eval_TIME_precision": 0.8666666666666667, "eval_TIME_recall": 0.896551724137931, "eval_loss": 0.23205186426639557, "eval_overall_accuracy": 0.9605633802816902, "eval_overall_f1": 0.8380681818181818, "eval_overall_precision": 0.8060109289617486, "eval_overall_recall": 0.8727810650887574, "eval_runtime": 0.8704, "eval_samples_per_second": 214.832, "eval_steps_per_second": 3.447, "step": 8798 }, { "epoch": 84.0, "grad_norm": 0.06097917631268501, "learning_rate": 8.000000000000001e-06, "loss": 0.0124, "step": 8904 }, { "epoch": 84.0, "eval_LOCATION_f1": 0.8571428571428572, "eval_LOCATION_number": 69, "eval_LOCATION_precision": 0.8076923076923077, "eval_LOCATION_recall": 0.9130434782608695, "eval_ORGANIZATION_f1": 0.7107438016528926, "eval_ORGANIZATION_number": 58, "eval_ORGANIZATION_precision": 0.6825396825396826, "eval_ORGANIZATION_recall": 0.7413793103448276, "eval_PERSON_f1": 0.891025641025641, "eval_PERSON_number": 152, "eval_PERSON_precision": 0.86875, "eval_PERSON_recall": 0.9144736842105263, "eval_QUANTITY_f1": 0.7936507936507938, "eval_QUANTITY_number": 30, "eval_QUANTITY_precision": 0.7575757575757576, "eval_QUANTITY_recall": 0.8333333333333334, "eval_TIME_f1": 0.8813559322033899, "eval_TIME_number": 29, "eval_TIME_precision": 0.8666666666666667, "eval_TIME_recall": 0.896551724137931, "eval_loss": 0.23106266558170319, "eval_overall_accuracy": 0.9615877080665813, "eval_overall_f1": 0.8433048433048432, "eval_overall_precision": 0.8131868131868132, "eval_overall_recall": 0.8757396449704142, "eval_runtime": 0.8817, "eval_samples_per_second": 212.094, "eval_steps_per_second": 3.403, "step": 8904 }, { "epoch": 85.0, "grad_norm": 0.0979015976190567, "learning_rate": 7.5e-06, "loss": 0.0118, "step": 9010 }, { "epoch": 85.0, "eval_LOCATION_f1": 0.8456375838926175, "eval_LOCATION_number": 69, "eval_LOCATION_precision": 0.7875, "eval_LOCATION_recall": 0.9130434782608695, "eval_ORGANIZATION_f1": 0.7096774193548386, "eval_ORGANIZATION_number": 58, "eval_ORGANIZATION_precision": 0.6666666666666666, "eval_ORGANIZATION_recall": 0.7586206896551724, "eval_PERSON_f1": 0.8810289389067525, "eval_PERSON_number": 152, "eval_PERSON_precision": 0.8616352201257862, "eval_PERSON_recall": 0.9013157894736842, "eval_QUANTITY_f1": 0.7936507936507938, "eval_QUANTITY_number": 30, "eval_QUANTITY_precision": 0.7575757575757576, "eval_QUANTITY_recall": 0.8333333333333334, "eval_TIME_f1": 0.847457627118644, "eval_TIME_number": 29, "eval_TIME_precision": 0.8333333333333334, "eval_TIME_recall": 0.8620689655172413, "eval_loss": 0.24057278037071228, "eval_overall_accuracy": 0.9603072983354674, "eval_overall_f1": 0.8328611898016997, "eval_overall_precision": 0.7989130434782609, "eval_overall_recall": 0.8698224852071006, "eval_runtime": 0.9001, "eval_samples_per_second": 207.748, "eval_steps_per_second": 3.333, "step": 9010 }, { "epoch": 86.0, "grad_norm": 2.0524749755859375, "learning_rate": 7.000000000000001e-06, "loss": 0.0115, "step": 9116 }, { "epoch": 86.0, "eval_LOCATION_f1": 0.8456375838926175, "eval_LOCATION_number": 69, "eval_LOCATION_precision": 0.7875, "eval_LOCATION_recall": 0.9130434782608695, "eval_ORGANIZATION_f1": 0.7317073170731708, "eval_ORGANIZATION_number": 58, "eval_ORGANIZATION_precision": 0.6923076923076923, "eval_ORGANIZATION_recall": 0.7758620689655172, "eval_PERSON_f1": 0.8817891373801917, "eval_PERSON_number": 152, "eval_PERSON_precision": 0.8571428571428571, "eval_PERSON_recall": 0.9078947368421053, "eval_QUANTITY_f1": 0.7936507936507938, "eval_QUANTITY_number": 30, "eval_QUANTITY_precision": 0.7575757575757576, "eval_QUANTITY_recall": 0.8333333333333334, "eval_TIME_f1": 0.847457627118644, "eval_TIME_number": 29, "eval_TIME_precision": 0.8333333333333334, "eval_TIME_recall": 0.8620689655172413, "eval_loss": 0.23790757358074188, "eval_overall_accuracy": 0.9610755441741358, "eval_overall_f1": 0.8373408769448374, "eval_overall_precision": 0.8021680216802168, "eval_overall_recall": 0.8757396449704142, "eval_runtime": 0.8768, "eval_samples_per_second": 213.284, "eval_steps_per_second": 3.422, "step": 9116 }, { "epoch": 87.0, "grad_norm": 0.27762410044670105, "learning_rate": 6.5000000000000004e-06, "loss": 0.0116, "step": 9222 }, { "epoch": 87.0, "eval_LOCATION_f1": 0.8513513513513514, "eval_LOCATION_number": 69, "eval_LOCATION_precision": 0.7974683544303798, "eval_LOCATION_recall": 0.9130434782608695, "eval_ORGANIZATION_f1": 0.7419354838709677, "eval_ORGANIZATION_number": 58, "eval_ORGANIZATION_precision": 0.696969696969697, "eval_ORGANIZATION_recall": 0.7931034482758621, "eval_PERSON_f1": 0.8846153846153847, "eval_PERSON_number": 152, "eval_PERSON_precision": 0.8625, "eval_PERSON_recall": 0.9078947368421053, "eval_QUANTITY_f1": 0.8064516129032259, "eval_QUANTITY_number": 30, "eval_QUANTITY_precision": 0.78125, "eval_QUANTITY_recall": 0.8333333333333334, "eval_TIME_f1": 0.8813559322033899, "eval_TIME_number": 29, "eval_TIME_precision": 0.8666666666666667, "eval_TIME_recall": 0.896551724137931, "eval_loss": 0.23644272983074188, "eval_overall_accuracy": 0.9623559539052496, "eval_overall_f1": 0.8453900709219858, "eval_overall_precision": 0.8119891008174387, "eval_overall_recall": 0.8816568047337278, "eval_runtime": 0.8829, "eval_samples_per_second": 211.807, "eval_steps_per_second": 3.398, "step": 9222 }, { "epoch": 88.0, "grad_norm": 0.8406667709350586, "learning_rate": 6e-06, "loss": 0.0107, "step": 9328 }, { "epoch": 88.0, "eval_LOCATION_f1": 0.8551724137931034, "eval_LOCATION_number": 69, "eval_LOCATION_precision": 0.8157894736842105, "eval_LOCATION_recall": 0.8985507246376812, "eval_ORGANIZATION_f1": 0.7272727272727273, "eval_ORGANIZATION_number": 58, "eval_ORGANIZATION_precision": 0.6984126984126984, "eval_ORGANIZATION_recall": 0.7586206896551724, "eval_PERSON_f1": 0.8810289389067525, "eval_PERSON_number": 152, "eval_PERSON_precision": 0.8616352201257862, "eval_PERSON_recall": 0.9013157894736842, "eval_QUANTITY_f1": 0.7936507936507938, "eval_QUANTITY_number": 30, "eval_QUANTITY_precision": 0.7575757575757576, "eval_QUANTITY_recall": 0.8333333333333334, "eval_TIME_f1": 0.8813559322033899, "eval_TIME_number": 29, "eval_TIME_precision": 0.8666666666666667, "eval_TIME_recall": 0.896551724137931, "eval_loss": 0.2356145679950714, "eval_overall_accuracy": 0.9618437900128041, "eval_overall_f1": 0.8412017167381973, "eval_overall_precision": 0.814404432132964, "eval_overall_recall": 0.8698224852071006, "eval_runtime": 0.8796, "eval_samples_per_second": 212.593, "eval_steps_per_second": 3.411, "step": 9328 }, { "epoch": 89.0, "grad_norm": 0.5086352825164795, "learning_rate": 5.500000000000001e-06, "loss": 0.0099, "step": 9434 }, { "epoch": 89.0, "eval_LOCATION_f1": 0.8456375838926175, "eval_LOCATION_number": 69, "eval_LOCATION_precision": 0.7875, "eval_LOCATION_recall": 0.9130434782608695, "eval_ORGANIZATION_f1": 0.7258064516129032, "eval_ORGANIZATION_number": 58, "eval_ORGANIZATION_precision": 0.6818181818181818, "eval_ORGANIZATION_recall": 0.7758620689655172, "eval_PERSON_f1": 0.8874598070739551, "eval_PERSON_number": 152, "eval_PERSON_precision": 0.8679245283018868, "eval_PERSON_recall": 0.9078947368421053, "eval_QUANTITY_f1": 0.7936507936507938, "eval_QUANTITY_number": 30, "eval_QUANTITY_precision": 0.7575757575757576, "eval_QUANTITY_recall": 0.8333333333333334, "eval_TIME_f1": 0.8813559322033899, "eval_TIME_number": 29, "eval_TIME_precision": 0.8666666666666667, "eval_TIME_recall": 0.896551724137931, "eval_loss": 0.2441495656967163, "eval_overall_accuracy": 0.9610755441741358, "eval_overall_f1": 0.8413597733711048, "eval_overall_precision": 0.8070652173913043, "eval_overall_recall": 0.878698224852071, "eval_runtime": 0.8816, "eval_samples_per_second": 212.126, "eval_steps_per_second": 3.403, "step": 9434 }, { "epoch": 90.0, "grad_norm": 0.11222498118877411, "learning_rate": 5e-06, "loss": 0.0116, "step": 9540 }, { "epoch": 90.0, "eval_LOCATION_f1": 0.8648648648648648, "eval_LOCATION_number": 69, "eval_LOCATION_precision": 0.810126582278481, "eval_LOCATION_recall": 0.927536231884058, "eval_ORGANIZATION_f1": 0.7301587301587301, "eval_ORGANIZATION_number": 58, "eval_ORGANIZATION_precision": 0.6764705882352942, "eval_ORGANIZATION_recall": 0.7931034482758621, "eval_PERSON_f1": 0.8846153846153847, "eval_PERSON_number": 152, "eval_PERSON_precision": 0.8625, "eval_PERSON_recall": 0.9078947368421053, "eval_QUANTITY_f1": 0.8064516129032259, "eval_QUANTITY_number": 30, "eval_QUANTITY_precision": 0.78125, "eval_QUANTITY_recall": 0.8333333333333334, "eval_TIME_f1": 0.896551724137931, "eval_TIME_number": 29, "eval_TIME_precision": 0.896551724137931, "eval_TIME_recall": 0.896551724137931, "eval_loss": 0.24032947421073914, "eval_overall_accuracy": 0.9618437900128041, "eval_overall_f1": 0.8470254957507082, "eval_overall_precision": 0.8125, "eval_overall_recall": 0.8846153846153846, "eval_runtime": 0.8666, "eval_samples_per_second": 215.798, "eval_steps_per_second": 3.462, "step": 9540 }, { "epoch": 91.0, "grad_norm": 1.0016977787017822, "learning_rate": 4.5e-06, "loss": 0.0101, "step": 9646 }, { "epoch": 91.0, "eval_LOCATION_f1": 0.863013698630137, "eval_LOCATION_number": 69, "eval_LOCATION_precision": 0.8181818181818182, "eval_LOCATION_recall": 0.9130434782608695, "eval_ORGANIZATION_f1": 0.736, "eval_ORGANIZATION_number": 58, "eval_ORGANIZATION_precision": 0.6865671641791045, "eval_ORGANIZATION_recall": 0.7931034482758621, "eval_PERSON_f1": 0.891025641025641, "eval_PERSON_number": 152, "eval_PERSON_precision": 0.86875, "eval_PERSON_recall": 0.9144736842105263, "eval_QUANTITY_f1": 0.7936507936507938, "eval_QUANTITY_number": 30, "eval_QUANTITY_precision": 0.7575757575757576, "eval_QUANTITY_recall": 0.8333333333333334, "eval_TIME_f1": 0.8813559322033899, "eval_TIME_number": 29, "eval_TIME_precision": 0.8666666666666667, "eval_TIME_recall": 0.896551724137931, "eval_loss": 0.24104949831962585, "eval_overall_accuracy": 0.9623559539052496, "eval_overall_f1": 0.84822695035461, "eval_overall_precision": 0.8147138964577657, "eval_overall_recall": 0.8846153846153846, "eval_runtime": 0.8925, "eval_samples_per_second": 209.524, "eval_steps_per_second": 3.361, "step": 9646 }, { "epoch": 92.0, "grad_norm": 0.5980203151702881, "learning_rate": 4.000000000000001e-06, "loss": 0.0104, "step": 9752 }, { "epoch": 92.0, "eval_LOCATION_f1": 0.8378378378378378, "eval_LOCATION_number": 69, "eval_LOCATION_precision": 0.7848101265822784, "eval_LOCATION_recall": 0.8985507246376812, "eval_ORGANIZATION_f1": 0.7377049180327868, "eval_ORGANIZATION_number": 58, "eval_ORGANIZATION_precision": 0.703125, "eval_ORGANIZATION_recall": 0.7758620689655172, "eval_PERSON_f1": 0.891025641025641, "eval_PERSON_number": 152, "eval_PERSON_precision": 0.86875, "eval_PERSON_recall": 0.9144736842105263, "eval_QUANTITY_f1": 0.7936507936507938, "eval_QUANTITY_number": 30, "eval_QUANTITY_precision": 0.7575757575757576, "eval_QUANTITY_recall": 0.8333333333333334, "eval_TIME_f1": 0.8620689655172413, "eval_TIME_number": 29, "eval_TIME_precision": 0.8620689655172413, "eval_TIME_recall": 0.8620689655172413, "eval_loss": 0.2380075305700302, "eval_overall_accuracy": 0.9615877080665813, "eval_overall_f1": 0.8421052631578948, "eval_overall_precision": 0.810958904109589, "eval_overall_recall": 0.8757396449704142, "eval_runtime": 0.9541, "eval_samples_per_second": 195.995, "eval_steps_per_second": 3.144, "step": 9752 }, { "epoch": 93.0, "grad_norm": 0.1031588539481163, "learning_rate": 3.5000000000000004e-06, "loss": 0.0113, "step": 9858 }, { "epoch": 93.0, "eval_LOCATION_f1": 0.8551724137931034, "eval_LOCATION_number": 69, "eval_LOCATION_precision": 0.8157894736842105, "eval_LOCATION_recall": 0.8985507246376812, "eval_ORGANIZATION_f1": 0.7301587301587301, "eval_ORGANIZATION_number": 58, "eval_ORGANIZATION_precision": 0.6764705882352942, "eval_ORGANIZATION_recall": 0.7931034482758621, "eval_PERSON_f1": 0.8846153846153847, "eval_PERSON_number": 152, "eval_PERSON_precision": 0.8625, "eval_PERSON_recall": 0.9078947368421053, "eval_QUANTITY_f1": 0.7936507936507938, "eval_QUANTITY_number": 30, "eval_QUANTITY_precision": 0.7575757575757576, "eval_QUANTITY_recall": 0.8333333333333334, "eval_TIME_f1": 0.8620689655172413, "eval_TIME_number": 29, "eval_TIME_precision": 0.8620689655172413, "eval_TIME_recall": 0.8620689655172413, "eval_loss": 0.23934581875801086, "eval_overall_accuracy": 0.9613316261203585, "eval_overall_f1": 0.8409090909090909, "eval_overall_precision": 0.8087431693989071, "eval_overall_recall": 0.8757396449704142, "eval_runtime": 0.9053, "eval_samples_per_second": 206.559, "eval_steps_per_second": 3.314, "step": 9858 }, { "epoch": 94.0, "grad_norm": 1.1558283567428589, "learning_rate": 3e-06, "loss": 0.0104, "step": 9964 }, { "epoch": 94.0, "eval_LOCATION_f1": 0.863013698630137, "eval_LOCATION_number": 69, "eval_LOCATION_precision": 0.8181818181818182, "eval_LOCATION_recall": 0.9130434782608695, "eval_ORGANIZATION_f1": 0.7258064516129032, "eval_ORGANIZATION_number": 58, "eval_ORGANIZATION_precision": 0.6818181818181818, "eval_ORGANIZATION_recall": 0.7758620689655172, "eval_PERSON_f1": 0.8846153846153847, "eval_PERSON_number": 152, "eval_PERSON_precision": 0.8625, "eval_PERSON_recall": 0.9078947368421053, "eval_QUANTITY_f1": 0.7936507936507938, "eval_QUANTITY_number": 30, "eval_QUANTITY_precision": 0.7575757575757576, "eval_QUANTITY_recall": 0.8333333333333334, "eval_TIME_f1": 0.8620689655172413, "eval_TIME_number": 29, "eval_TIME_precision": 0.8620689655172413, "eval_TIME_recall": 0.8620689655172413, "eval_loss": 0.2401016503572464, "eval_overall_accuracy": 0.9620998719590269, "eval_overall_f1": 0.8421052631578948, "eval_overall_precision": 0.810958904109589, "eval_overall_recall": 0.8757396449704142, "eval_runtime": 0.8815, "eval_samples_per_second": 212.144, "eval_steps_per_second": 3.403, "step": 9964 }, { "epoch": 95.0, "grad_norm": 1.1983808279037476, "learning_rate": 2.5e-06, "loss": 0.0108, "step": 10070 }, { "epoch": 95.0, "eval_LOCATION_f1": 0.8493150684931507, "eval_LOCATION_number": 69, "eval_LOCATION_precision": 0.8051948051948052, "eval_LOCATION_recall": 0.8985507246376812, "eval_ORGANIZATION_f1": 0.746031746031746, "eval_ORGANIZATION_number": 58, "eval_ORGANIZATION_precision": 0.6911764705882353, "eval_ORGANIZATION_recall": 0.8103448275862069, "eval_PERSON_f1": 0.8846153846153847, "eval_PERSON_number": 152, "eval_PERSON_precision": 0.8625, "eval_PERSON_recall": 0.9078947368421053, "eval_QUANTITY_f1": 0.7936507936507938, "eval_QUANTITY_number": 30, "eval_QUANTITY_precision": 0.7575757575757576, "eval_QUANTITY_recall": 0.8333333333333334, "eval_TIME_f1": 0.8620689655172413, "eval_TIME_number": 29, "eval_TIME_precision": 0.8620689655172413, "eval_TIME_recall": 0.8620689655172413, "eval_loss": 0.2409784197807312, "eval_overall_accuracy": 0.9618437900128041, "eval_overall_f1": 0.8425531914893617, "eval_overall_precision": 0.8092643051771117, "eval_overall_recall": 0.878698224852071, "eval_runtime": 0.8891, "eval_samples_per_second": 210.332, "eval_steps_per_second": 3.374, "step": 10070 }, { "epoch": 96.0, "grad_norm": 1.2160520553588867, "learning_rate": 2.0000000000000003e-06, "loss": 0.0102, "step": 10176 }, { "epoch": 96.0, "eval_LOCATION_f1": 0.8513513513513514, "eval_LOCATION_number": 69, "eval_LOCATION_precision": 0.7974683544303798, "eval_LOCATION_recall": 0.9130434782608695, "eval_ORGANIZATION_f1": 0.7200000000000001, "eval_ORGANIZATION_number": 58, "eval_ORGANIZATION_precision": 0.6716417910447762, "eval_ORGANIZATION_recall": 0.7758620689655172, "eval_PERSON_f1": 0.8853503184713376, "eval_PERSON_number": 152, "eval_PERSON_precision": 0.8580246913580247, "eval_PERSON_recall": 0.9144736842105263, "eval_QUANTITY_f1": 0.7936507936507938, "eval_QUANTITY_number": 30, "eval_QUANTITY_precision": 0.7575757575757576, "eval_QUANTITY_recall": 0.8333333333333334, "eval_TIME_f1": 0.8813559322033899, "eval_TIME_number": 29, "eval_TIME_precision": 0.8666666666666667, "eval_TIME_recall": 0.896551724137931, "eval_loss": 0.2440604716539383, "eval_overall_accuracy": 0.9613316261203585, "eval_overall_f1": 0.840620592383639, "eval_overall_precision": 0.8032345013477089, "eval_overall_recall": 0.8816568047337278, "eval_runtime": 0.9399, "eval_samples_per_second": 198.966, "eval_steps_per_second": 3.192, "step": 10176 }, { "epoch": 97.0, "grad_norm": 1.8695564270019531, "learning_rate": 1.5e-06, "loss": 0.0099, "step": 10282 }, { "epoch": 97.0, "eval_LOCATION_f1": 0.8571428571428572, "eval_LOCATION_number": 69, "eval_LOCATION_precision": 0.8076923076923077, "eval_LOCATION_recall": 0.9130434782608695, "eval_ORGANIZATION_f1": 0.7258064516129032, "eval_ORGANIZATION_number": 58, "eval_ORGANIZATION_precision": 0.6818181818181818, "eval_ORGANIZATION_recall": 0.7758620689655172, "eval_PERSON_f1": 0.891025641025641, "eval_PERSON_number": 152, "eval_PERSON_precision": 0.86875, "eval_PERSON_recall": 0.9144736842105263, "eval_QUANTITY_f1": 0.7936507936507938, "eval_QUANTITY_number": 30, "eval_QUANTITY_precision": 0.7575757575757576, "eval_QUANTITY_recall": 0.8333333333333334, "eval_TIME_f1": 0.8813559322033899, "eval_TIME_number": 29, "eval_TIME_precision": 0.8666666666666667, "eval_TIME_recall": 0.896551724137931, "eval_loss": 0.24207578599452972, "eval_overall_accuracy": 0.9615877080665813, "eval_overall_f1": 0.8453900709219858, "eval_overall_precision": 0.8119891008174387, "eval_overall_recall": 0.8816568047337278, "eval_runtime": 0.8801, "eval_samples_per_second": 212.469, "eval_steps_per_second": 3.409, "step": 10282 }, { "epoch": 98.0, "grad_norm": 0.15321999788284302, "learning_rate": 1.0000000000000002e-06, "loss": 0.009, "step": 10388 }, { "epoch": 98.0, "eval_LOCATION_f1": 0.863013698630137, "eval_LOCATION_number": 69, "eval_LOCATION_precision": 0.8181818181818182, "eval_LOCATION_recall": 0.9130434782608695, "eval_ORGANIZATION_f1": 0.7301587301587301, "eval_ORGANIZATION_number": 58, "eval_ORGANIZATION_precision": 0.6764705882352942, "eval_ORGANIZATION_recall": 0.7931034482758621, "eval_PERSON_f1": 0.891025641025641, "eval_PERSON_number": 152, "eval_PERSON_precision": 0.86875, "eval_PERSON_recall": 0.9144736842105263, "eval_QUANTITY_f1": 0.7936507936507938, "eval_QUANTITY_number": 30, "eval_QUANTITY_precision": 0.7575757575757576, "eval_QUANTITY_recall": 0.8333333333333334, "eval_TIME_f1": 0.8620689655172413, "eval_TIME_number": 29, "eval_TIME_precision": 0.8620689655172413, "eval_TIME_recall": 0.8620689655172413, "eval_loss": 0.24271713197231293, "eval_overall_accuracy": 0.9620998719590269, "eval_overall_f1": 0.8453900709219858, "eval_overall_precision": 0.8119891008174387, "eval_overall_recall": 0.8816568047337278, "eval_runtime": 0.8771, "eval_samples_per_second": 213.205, "eval_steps_per_second": 3.42, "step": 10388 }, { "epoch": 99.0, "grad_norm": 0.49585482478141785, "learning_rate": 5.000000000000001e-07, "loss": 0.0096, "step": 10494 }, { "epoch": 99.0, "eval_LOCATION_f1": 0.8513513513513514, "eval_LOCATION_number": 69, "eval_LOCATION_precision": 0.7974683544303798, "eval_LOCATION_recall": 0.9130434782608695, "eval_ORGANIZATION_f1": 0.7096774193548386, "eval_ORGANIZATION_number": 58, "eval_ORGANIZATION_precision": 0.6666666666666666, "eval_ORGANIZATION_recall": 0.7586206896551724, "eval_PERSON_f1": 0.891025641025641, "eval_PERSON_number": 152, "eval_PERSON_precision": 0.86875, "eval_PERSON_recall": 0.9144736842105263, "eval_QUANTITY_f1": 0.7936507936507938, "eval_QUANTITY_number": 30, "eval_QUANTITY_precision": 0.7575757575757576, "eval_QUANTITY_recall": 0.8333333333333334, "eval_TIME_f1": 0.8813559322033899, "eval_TIME_number": 29, "eval_TIME_precision": 0.8666666666666667, "eval_TIME_recall": 0.896551724137931, "eval_loss": 0.24335408210754395, "eval_overall_accuracy": 0.9613316261203585, "eval_overall_f1": 0.8413597733711048, "eval_overall_precision": 0.8070652173913043, "eval_overall_recall": 0.878698224852071, "eval_runtime": 0.8907, "eval_samples_per_second": 209.939, "eval_steps_per_second": 3.368, "step": 10494 }, { "epoch": 100.0, "grad_norm": 0.202548086643219, "learning_rate": 0.0, "loss": 0.0099, "step": 10600 }, { "epoch": 100.0, "eval_LOCATION_f1": 0.8513513513513514, "eval_LOCATION_number": 69, "eval_LOCATION_precision": 0.7974683544303798, "eval_LOCATION_recall": 0.9130434782608695, "eval_ORGANIZATION_f1": 0.7096774193548386, "eval_ORGANIZATION_number": 58, "eval_ORGANIZATION_precision": 0.6666666666666666, "eval_ORGANIZATION_recall": 0.7586206896551724, "eval_PERSON_f1": 0.8846153846153847, "eval_PERSON_number": 152, "eval_PERSON_precision": 0.8625, "eval_PERSON_recall": 0.9078947368421053, "eval_QUANTITY_f1": 0.7936507936507938, "eval_QUANTITY_number": 30, "eval_QUANTITY_precision": 0.7575757575757576, "eval_QUANTITY_recall": 0.8333333333333334, "eval_TIME_f1": 0.8813559322033899, "eval_TIME_number": 29, "eval_TIME_precision": 0.8666666666666667, "eval_TIME_recall": 0.896551724137931, "eval_loss": 0.24319376051425934, "eval_overall_accuracy": 0.9610755441741358, "eval_overall_f1": 0.8385269121813032, "eval_overall_precision": 0.8043478260869565, "eval_overall_recall": 0.8757396449704142, "eval_runtime": 0.8912, "eval_samples_per_second": 209.818, "eval_steps_per_second": 3.366, "step": 10600 }, { "epoch": 100.0, "step": 10600, "total_flos": 5072850468719490.0, "train_loss": 0.05464491794694145, "train_runtime": 1550.8875, "train_samples_per_second": 108.776, "train_steps_per_second": 6.835 } ], "logging_steps": 500, "max_steps": 10600, "num_input_tokens_seen": 0, "num_train_epochs": 100, "save_steps": 500, "total_flos": 5072850468719490.0, "train_batch_size": 16, "trial_name": null, "trial_params": null }