{ "best_metric": null, "best_model_checkpoint": null, "epoch": 100.0, "eval_steps": 500, "global_step": 10600, "is_hyper_param_search": false, "is_local_process_zero": true, "is_world_process_zero": true, "log_history": [ { "epoch": 1.0, "grad_norm": 2.1874585151672363, "learning_rate": 4.9500000000000004e-05, "loss": 1.0045, "step": 106 }, { "epoch": 1.0, "eval_LOCATION_f1": 0.0, "eval_LOCATION_number": 71, "eval_LOCATION_precision": 0.0, "eval_LOCATION_recall": 0.0, "eval_ORGANIZATION_f1": 0.0, "eval_ORGANIZATION_number": 65, "eval_ORGANIZATION_precision": 0.0, "eval_ORGANIZATION_recall": 0.0, "eval_PERSON_f1": 0.012121212121212121, "eval_PERSON_number": 150, "eval_PERSON_precision": 0.06666666666666667, "eval_PERSON_recall": 0.006666666666666667, "eval_QUANTITY_f1": 0.0, "eval_QUANTITY_number": 33, "eval_QUANTITY_precision": 0.0, "eval_QUANTITY_recall": 0.0, "eval_TIME_f1": 0.0, "eval_TIME_number": 28, "eval_TIME_precision": 0.0, "eval_TIME_recall": 0.0, "eval_loss": 0.5767342448234558, "eval_overall_accuracy": 0.8433559650824443, "eval_overall_f1": 0.005434782608695652, "eval_overall_precision": 0.047619047619047616, "eval_overall_recall": 0.002881844380403458, "eval_runtime": 0.3512, "eval_samples_per_second": 532.399, "eval_steps_per_second": 8.541, "step": 106 }, { "epoch": 2.0, "grad_norm": 1.000261664390564, "learning_rate": 4.9e-05, "loss": 0.4985, "step": 212 }, { "epoch": 2.0, "eval_LOCATION_f1": 0.3859649122807017, "eval_LOCATION_number": 71, "eval_LOCATION_precision": 0.5116279069767442, "eval_LOCATION_recall": 0.30985915492957744, "eval_ORGANIZATION_f1": 0.14184397163120568, "eval_ORGANIZATION_number": 65, "eval_ORGANIZATION_precision": 0.13157894736842105, "eval_ORGANIZATION_recall": 0.15384615384615385, "eval_PERSON_f1": 0.7315634218289085, "eval_PERSON_number": 150, "eval_PERSON_precision": 0.656084656084656, "eval_PERSON_recall": 0.8266666666666667, "eval_QUANTITY_f1": 0.15625, "eval_QUANTITY_number": 33, "eval_QUANTITY_precision": 0.16129032258064516, "eval_QUANTITY_recall": 0.15151515151515152, "eval_TIME_f1": 0.7, "eval_TIME_number": 28, "eval_TIME_precision": 0.65625, "eval_TIME_recall": 0.75, "eval_loss": 0.34785470366477966, "eval_overall_accuracy": 0.9083414161008729, "eval_overall_f1": 0.5069637883008357, "eval_overall_precision": 0.49056603773584906, "eval_overall_recall": 0.5244956772334294, "eval_runtime": 0.3485, "eval_samples_per_second": 536.657, "eval_steps_per_second": 8.609, "step": 212 }, { "epoch": 3.0, "grad_norm": 0.8842161297798157, "learning_rate": 4.85e-05, "loss": 0.2936, "step": 318 }, { "epoch": 3.0, "eval_LOCATION_f1": 0.6119402985074627, "eval_LOCATION_number": 71, "eval_LOCATION_precision": 0.6507936507936508, "eval_LOCATION_recall": 0.5774647887323944, "eval_ORGANIZATION_f1": 0.4255319148936171, "eval_ORGANIZATION_number": 65, "eval_ORGANIZATION_precision": 0.39473684210526316, "eval_ORGANIZATION_recall": 0.46153846153846156, "eval_PERSON_f1": 0.8238993710691823, "eval_PERSON_number": 150, "eval_PERSON_precision": 0.7797619047619048, "eval_PERSON_recall": 0.8733333333333333, "eval_QUANTITY_f1": 0.5866666666666667, "eval_QUANTITY_number": 33, "eval_QUANTITY_precision": 0.5238095238095238, "eval_QUANTITY_recall": 0.6666666666666666, "eval_TIME_f1": 0.8571428571428571, "eval_TIME_number": 28, "eval_TIME_precision": 0.8571428571428571, "eval_TIME_recall": 0.8571428571428571, "eval_loss": 0.2019408941268921, "eval_overall_accuracy": 0.9340446168768186, "eval_overall_f1": 0.6850828729281768, "eval_overall_precision": 0.6578249336870027, "eval_overall_recall": 0.7146974063400576, "eval_runtime": 0.3515, "eval_samples_per_second": 531.999, "eval_steps_per_second": 8.535, "step": 318 }, { "epoch": 4.0, "grad_norm": 1.0422954559326172, "learning_rate": 4.8e-05, "loss": 0.2113, "step": 424 }, { "epoch": 4.0, "eval_LOCATION_f1": 0.6666666666666667, "eval_LOCATION_number": 71, "eval_LOCATION_precision": 0.611764705882353, "eval_LOCATION_recall": 0.7323943661971831, "eval_ORGANIZATION_f1": 0.6583850931677019, "eval_ORGANIZATION_number": 65, "eval_ORGANIZATION_precision": 0.5520833333333334, "eval_ORGANIZATION_recall": 0.8153846153846154, "eval_PERSON_f1": 0.8473520249221183, "eval_PERSON_number": 150, "eval_PERSON_precision": 0.7953216374269005, "eval_PERSON_recall": 0.9066666666666666, "eval_QUANTITY_f1": 0.7012987012987013, "eval_QUANTITY_number": 33, "eval_QUANTITY_precision": 0.6136363636363636, "eval_QUANTITY_recall": 0.8181818181818182, "eval_TIME_f1": 0.8571428571428571, "eval_TIME_number": 28, "eval_TIME_precision": 0.8571428571428571, "eval_TIME_recall": 0.8571428571428571, "eval_loss": 0.1662513017654419, "eval_overall_accuracy": 0.9459262851600388, "eval_overall_f1": 0.7574578469520102, "eval_overall_precision": 0.6886792452830188, "eval_overall_recall": 0.8414985590778098, "eval_runtime": 0.3504, "eval_samples_per_second": 533.64, "eval_steps_per_second": 8.561, "step": 424 }, { "epoch": 5.0, "grad_norm": 1.0871312618255615, "learning_rate": 4.75e-05, "loss": 0.1824, "step": 530 }, { "epoch": 5.0, "eval_LOCATION_f1": 0.6951219512195121, "eval_LOCATION_number": 71, "eval_LOCATION_precision": 0.6129032258064516, "eval_LOCATION_recall": 0.8028169014084507, "eval_ORGANIZATION_f1": 0.6580645161290322, "eval_ORGANIZATION_number": 65, "eval_ORGANIZATION_precision": 0.5666666666666667, "eval_ORGANIZATION_recall": 0.7846153846153846, "eval_PERSON_f1": 0.8607594936708859, "eval_PERSON_number": 150, "eval_PERSON_precision": 0.8192771084337349, "eval_PERSON_recall": 0.9066666666666666, "eval_QUANTITY_f1": 0.7088607594936709, "eval_QUANTITY_number": 33, "eval_QUANTITY_precision": 0.6086956521739131, "eval_QUANTITY_recall": 0.8484848484848485, "eval_TIME_f1": 0.75, "eval_TIME_number": 28, "eval_TIME_precision": 0.6666666666666666, "eval_TIME_recall": 0.8571428571428571, "eval_loss": 0.15956708788871765, "eval_overall_accuracy": 0.944713870029098, "eval_overall_f1": 0.7609254498714653, "eval_overall_precision": 0.6867749419953596, "eval_overall_recall": 0.8530259365994236, "eval_runtime": 0.3507, "eval_samples_per_second": 533.247, "eval_steps_per_second": 8.555, "step": 530 }, { "epoch": 6.0, "grad_norm": 1.1978598833084106, "learning_rate": 4.7e-05, "loss": 0.1647, "step": 636 }, { "epoch": 6.0, "eval_LOCATION_f1": 0.6946107784431137, "eval_LOCATION_number": 71, "eval_LOCATION_precision": 0.6041666666666666, "eval_LOCATION_recall": 0.8169014084507042, "eval_ORGANIZATION_f1": 0.651685393258427, "eval_ORGANIZATION_number": 65, "eval_ORGANIZATION_precision": 0.5132743362831859, "eval_ORGANIZATION_recall": 0.8923076923076924, "eval_PERSON_f1": 0.8404907975460122, "eval_PERSON_number": 150, "eval_PERSON_precision": 0.7784090909090909, "eval_PERSON_recall": 0.9133333333333333, "eval_QUANTITY_f1": 0.6588235294117647, "eval_QUANTITY_number": 33, "eval_QUANTITY_precision": 0.5384615384615384, "eval_QUANTITY_recall": 0.8484848484848485, "eval_TIME_f1": 0.7164179104477612, "eval_TIME_number": 28, "eval_TIME_precision": 0.6153846153846154, "eval_TIME_recall": 0.8571428571428571, "eval_loss": 0.1713540256023407, "eval_overall_accuracy": 0.9369544131910766, "eval_overall_f1": 0.741190765492102, "eval_overall_precision": 0.6407563025210085, "eval_overall_recall": 0.8789625360230547, "eval_runtime": 0.3521, "eval_samples_per_second": 531.071, "eval_steps_per_second": 8.52, "step": 636 }, { "epoch": 7.0, "grad_norm": 1.5508997440338135, "learning_rate": 4.6500000000000005e-05, "loss": 0.1533, "step": 742 }, { "epoch": 7.0, "eval_LOCATION_f1": 0.6993865030674846, "eval_LOCATION_number": 71, "eval_LOCATION_precision": 0.6195652173913043, "eval_LOCATION_recall": 0.8028169014084507, "eval_ORGANIZATION_f1": 0.6790123456790124, "eval_ORGANIZATION_number": 65, "eval_ORGANIZATION_precision": 0.5670103092783505, "eval_ORGANIZATION_recall": 0.8461538461538461, "eval_PERSON_f1": 0.8598130841121495, "eval_PERSON_number": 150, "eval_PERSON_precision": 0.8070175438596491, "eval_PERSON_recall": 0.92, "eval_QUANTITY_f1": 0.7105263157894738, "eval_QUANTITY_number": 33, "eval_QUANTITY_precision": 0.627906976744186, "eval_QUANTITY_recall": 0.8181818181818182, "eval_TIME_f1": 0.806451612903226, "eval_TIME_number": 28, "eval_TIME_precision": 0.7352941176470589, "eval_TIME_recall": 0.8928571428571429, "eval_loss": 0.14624279737472534, "eval_overall_accuracy": 0.9510184287099903, "eval_overall_f1": 0.770408163265306, "eval_overall_precision": 0.6910755148741419, "eval_overall_recall": 0.8703170028818443, "eval_runtime": 0.3512, "eval_samples_per_second": 532.397, "eval_steps_per_second": 8.541, "step": 742 }, { "epoch": 8.0, "grad_norm": 0.8642424941062927, "learning_rate": 4.600000000000001e-05, "loss": 0.1405, "step": 848 }, { "epoch": 8.0, "eval_LOCATION_f1": 0.7407407407407407, "eval_LOCATION_number": 71, "eval_LOCATION_precision": 0.6593406593406593, "eval_LOCATION_recall": 0.8450704225352113, "eval_ORGANIZATION_f1": 0.6783625730994152, "eval_ORGANIZATION_number": 65, "eval_ORGANIZATION_precision": 0.5471698113207547, "eval_ORGANIZATION_recall": 0.8923076923076924, "eval_PERSON_f1": 0.8717948717948718, "eval_PERSON_number": 150, "eval_PERSON_precision": 0.8395061728395061, "eval_PERSON_recall": 0.9066666666666666, "eval_QUANTITY_f1": 0.736842105263158, "eval_QUANTITY_number": 33, "eval_QUANTITY_precision": 0.6511627906976745, "eval_QUANTITY_recall": 0.8484848484848485, "eval_TIME_f1": 0.8333333333333334, "eval_TIME_number": 28, "eval_TIME_precision": 0.78125, "eval_TIME_recall": 0.8928571428571429, "eval_loss": 0.13807082176208496, "eval_overall_accuracy": 0.950533462657614, "eval_overall_f1": 0.7861715749039692, "eval_overall_precision": 0.7073732718894009, "eval_overall_recall": 0.8847262247838616, "eval_runtime": 0.3504, "eval_samples_per_second": 533.624, "eval_steps_per_second": 8.561, "step": 848 }, { "epoch": 9.0, "grad_norm": 1.233667254447937, "learning_rate": 4.55e-05, "loss": 0.1341, "step": 954 }, { "epoch": 9.0, "eval_LOCATION_f1": 0.7741935483870968, "eval_LOCATION_number": 71, "eval_LOCATION_precision": 0.7142857142857143, "eval_LOCATION_recall": 0.8450704225352113, "eval_ORGANIZATION_f1": 0.6785714285714285, "eval_ORGANIZATION_number": 65, "eval_ORGANIZATION_precision": 0.5533980582524272, "eval_ORGANIZATION_recall": 0.8769230769230769, "eval_PERSON_f1": 0.8562091503267975, "eval_PERSON_number": 150, "eval_PERSON_precision": 0.8397435897435898, "eval_PERSON_recall": 0.8733333333333333, "eval_QUANTITY_f1": 0.7466666666666666, "eval_QUANTITY_number": 33, "eval_QUANTITY_precision": 0.6666666666666666, "eval_QUANTITY_recall": 0.8484848484848485, "eval_TIME_f1": 0.819672131147541, "eval_TIME_number": 28, "eval_TIME_precision": 0.7575757575757576, "eval_TIME_recall": 0.8928571428571429, "eval_loss": 0.13261349499225616, "eval_overall_accuracy": 0.9495635305528612, "eval_overall_f1": 0.7869281045751635, "eval_overall_precision": 0.7200956937799043, "eval_overall_recall": 0.8674351585014409, "eval_runtime": 0.3537, "eval_samples_per_second": 528.626, "eval_steps_per_second": 8.481, "step": 954 }, { "epoch": 10.0, "grad_norm": 1.0353517532348633, "learning_rate": 4.5e-05, "loss": 0.1274, "step": 1060 }, { "epoch": 10.0, "eval_LOCATION_f1": 0.8104575163398693, "eval_LOCATION_number": 71, "eval_LOCATION_precision": 0.7560975609756098, "eval_LOCATION_recall": 0.8732394366197183, "eval_ORGANIZATION_f1": 0.7096774193548387, "eval_ORGANIZATION_number": 65, "eval_ORGANIZATION_precision": 0.6111111111111112, "eval_ORGANIZATION_recall": 0.8461538461538461, "eval_PERSON_f1": 0.8910256410256411, "eval_PERSON_number": 150, "eval_PERSON_precision": 0.8580246913580247, "eval_PERSON_recall": 0.9266666666666666, "eval_QUANTITY_f1": 0.7297297297297297, "eval_QUANTITY_number": 33, "eval_QUANTITY_precision": 0.6585365853658537, "eval_QUANTITY_recall": 0.8181818181818182, "eval_TIME_f1": 0.8620689655172413, "eval_TIME_number": 28, "eval_TIME_precision": 0.8333333333333334, "eval_TIME_recall": 0.8928571428571429, "eval_loss": 0.1223028227686882, "eval_overall_accuracy": 0.9590203685741998, "eval_overall_f1": 0.8191489361702129, "eval_overall_precision": 0.7604938271604939, "eval_overall_recall": 0.8876080691642652, "eval_runtime": 0.3511, "eval_samples_per_second": 532.631, "eval_steps_per_second": 8.545, "step": 1060 }, { "epoch": 11.0, "grad_norm": 0.7219051122665405, "learning_rate": 4.4500000000000004e-05, "loss": 0.1232, "step": 1166 }, { "epoch": 11.0, "eval_LOCATION_f1": 0.7922077922077921, "eval_LOCATION_number": 71, "eval_LOCATION_precision": 0.7349397590361446, "eval_LOCATION_recall": 0.8591549295774648, "eval_ORGANIZATION_f1": 0.7204968944099378, "eval_ORGANIZATION_number": 65, "eval_ORGANIZATION_precision": 0.6041666666666666, "eval_ORGANIZATION_recall": 0.8923076923076924, "eval_PERSON_f1": 0.8810289389067525, "eval_PERSON_number": 150, "eval_PERSON_precision": 0.8509316770186336, "eval_PERSON_recall": 0.9133333333333333, "eval_QUANTITY_f1": 0.7012987012987013, "eval_QUANTITY_number": 33, "eval_QUANTITY_precision": 0.6136363636363636, "eval_QUANTITY_recall": 0.8181818181818182, "eval_TIME_f1": 0.8474576271186439, "eval_TIME_number": 28, "eval_TIME_precision": 0.8064516129032258, "eval_TIME_recall": 0.8928571428571429, "eval_loss": 0.1300116926431656, "eval_overall_accuracy": 0.9529582929194956, "eval_overall_f1": 0.8083989501312335, "eval_overall_precision": 0.7421686746987952, "eval_overall_recall": 0.8876080691642652, "eval_runtime": 0.3501, "eval_samples_per_second": 534.192, "eval_steps_per_second": 8.57, "step": 1166 }, { "epoch": 12.0, "grad_norm": 1.0894474983215332, "learning_rate": 4.4000000000000006e-05, "loss": 0.1195, "step": 1272 }, { "epoch": 12.0, "eval_LOCATION_f1": 0.728395061728395, "eval_LOCATION_number": 71, "eval_LOCATION_precision": 0.6483516483516484, "eval_LOCATION_recall": 0.8309859154929577, "eval_ORGANIZATION_f1": 0.6909090909090909, "eval_ORGANIZATION_number": 65, "eval_ORGANIZATION_precision": 0.57, "eval_ORGANIZATION_recall": 0.8769230769230769, "eval_PERSON_f1": 0.8910256410256411, "eval_PERSON_number": 150, "eval_PERSON_precision": 0.8580246913580247, "eval_PERSON_recall": 0.9266666666666666, "eval_QUANTITY_f1": 0.7297297297297297, "eval_QUANTITY_number": 33, "eval_QUANTITY_precision": 0.6585365853658537, "eval_QUANTITY_recall": 0.8181818181818182, "eval_TIME_f1": 0.7999999999999999, "eval_TIME_number": 28, "eval_TIME_precision": 0.75, "eval_TIME_recall": 0.8571428571428571, "eval_loss": 0.14111082255840302, "eval_overall_accuracy": 0.9522308438409312, "eval_overall_f1": 0.7917205692108668, "eval_overall_precision": 0.7183098591549296, "eval_overall_recall": 0.8818443804034583, "eval_runtime": 0.3502, "eval_samples_per_second": 534.002, "eval_steps_per_second": 8.567, "step": 1272 }, { "epoch": 13.0, "grad_norm": 0.5753965377807617, "learning_rate": 4.35e-05, "loss": 0.1138, "step": 1378 }, { "epoch": 13.0, "eval_LOCATION_f1": 0.8157894736842104, "eval_LOCATION_number": 71, "eval_LOCATION_precision": 0.7654320987654321, "eval_LOCATION_recall": 0.8732394366197183, "eval_ORGANIZATION_f1": 0.7239263803680982, "eval_ORGANIZATION_number": 65, "eval_ORGANIZATION_precision": 0.6020408163265306, "eval_ORGANIZATION_recall": 0.9076923076923077, "eval_PERSON_f1": 0.8838709677419355, "eval_PERSON_number": 150, "eval_PERSON_precision": 0.85625, "eval_PERSON_recall": 0.9133333333333333, "eval_QUANTITY_f1": 0.7567567567567567, "eval_QUANTITY_number": 33, "eval_QUANTITY_precision": 0.6829268292682927, "eval_QUANTITY_recall": 0.8484848484848485, "eval_TIME_f1": 0.9259259259259259, "eval_TIME_number": 28, "eval_TIME_precision": 0.9615384615384616, "eval_TIME_recall": 0.8928571428571429, "eval_loss": 0.12571823596954346, "eval_overall_accuracy": 0.9570805043646945, "eval_overall_f1": 0.8260292164674636, "eval_overall_precision": 0.7660098522167488, "eval_overall_recall": 0.8962536023054755, "eval_runtime": 0.3506, "eval_samples_per_second": 533.355, "eval_steps_per_second": 8.556, "step": 1378 }, { "epoch": 14.0, "grad_norm": 1.7395552396774292, "learning_rate": 4.3e-05, "loss": 0.1106, "step": 1484 }, { "epoch": 14.0, "eval_LOCATION_f1": 0.7973856209150327, "eval_LOCATION_number": 71, "eval_LOCATION_precision": 0.7439024390243902, "eval_LOCATION_recall": 0.8591549295774648, "eval_ORGANIZATION_f1": 0.7160493827160493, "eval_ORGANIZATION_number": 65, "eval_ORGANIZATION_precision": 0.5979381443298969, "eval_ORGANIZATION_recall": 0.8923076923076924, "eval_PERSON_f1": 0.8903225806451613, "eval_PERSON_number": 150, "eval_PERSON_precision": 0.8625, "eval_PERSON_recall": 0.92, "eval_QUANTITY_f1": 0.7088607594936709, "eval_QUANTITY_number": 33, "eval_QUANTITY_precision": 0.6086956521739131, "eval_QUANTITY_recall": 0.8484848484848485, "eval_TIME_f1": 0.819672131147541, "eval_TIME_number": 28, "eval_TIME_precision": 0.7575757575757576, "eval_TIME_recall": 0.8928571428571429, "eval_loss": 0.1278010457754135, "eval_overall_accuracy": 0.9541707080504365, "eval_overall_f1": 0.8104575163398693, "eval_overall_precision": 0.7416267942583732, "eval_overall_recall": 0.8933717579250721, "eval_runtime": 0.3503, "eval_samples_per_second": 533.795, "eval_steps_per_second": 8.564, "step": 1484 }, { "epoch": 15.0, "grad_norm": 1.1085916757583618, "learning_rate": 4.25e-05, "loss": 0.1037, "step": 1590 }, { "epoch": 15.0, "eval_LOCATION_f1": 0.8, "eval_LOCATION_number": 71, "eval_LOCATION_precision": 0.7380952380952381, "eval_LOCATION_recall": 0.8732394366197183, "eval_ORGANIZATION_f1": 0.7375, "eval_ORGANIZATION_number": 65, "eval_ORGANIZATION_precision": 0.6210526315789474, "eval_ORGANIZATION_recall": 0.9076923076923077, "eval_PERSON_f1": 0.8974358974358974, "eval_PERSON_number": 150, "eval_PERSON_precision": 0.8641975308641975, "eval_PERSON_recall": 0.9333333333333333, "eval_QUANTITY_f1": 0.691358024691358, "eval_QUANTITY_number": 33, "eval_QUANTITY_precision": 0.5833333333333334, "eval_QUANTITY_recall": 0.8484848484848485, "eval_TIME_f1": 0.8474576271186439, "eval_TIME_number": 28, "eval_TIME_precision": 0.8064516129032258, "eval_TIME_recall": 0.8928571428571429, "eval_loss": 0.1332232654094696, "eval_overall_accuracy": 0.953443258971872, "eval_overall_f1": 0.81877444589309, "eval_overall_precision": 0.7476190476190476, "eval_overall_recall": 0.9048991354466859, "eval_runtime": 0.3501, "eval_samples_per_second": 534.13, "eval_steps_per_second": 8.569, "step": 1590 }, { "epoch": 16.0, "grad_norm": 1.2298065423965454, "learning_rate": 4.2e-05, "loss": 0.1015, "step": 1696 }, { "epoch": 16.0, "eval_LOCATION_f1": 0.7870967741935485, "eval_LOCATION_number": 71, "eval_LOCATION_precision": 0.7261904761904762, "eval_LOCATION_recall": 0.8591549295774648, "eval_ORGANIZATION_f1": 0.7453416149068324, "eval_ORGANIZATION_number": 65, "eval_ORGANIZATION_precision": 0.625, "eval_ORGANIZATION_recall": 0.9230769230769231, "eval_PERSON_f1": 0.8910256410256411, "eval_PERSON_number": 150, "eval_PERSON_precision": 0.8580246913580247, "eval_PERSON_recall": 0.9266666666666666, "eval_QUANTITY_f1": 0.6506024096385542, "eval_QUANTITY_number": 33, "eval_QUANTITY_precision": 0.54, "eval_QUANTITY_recall": 0.8181818181818182, "eval_TIME_f1": 0.8620689655172413, "eval_TIME_number": 28, "eval_TIME_precision": 0.8333333333333334, "eval_TIME_recall": 0.8928571428571429, "eval_loss": 0.13960066437721252, "eval_overall_accuracy": 0.9539282250242483, "eval_overall_f1": 0.811443433029909, "eval_overall_precision": 0.7393364928909952, "eval_overall_recall": 0.899135446685879, "eval_runtime": 0.3495, "eval_samples_per_second": 535.049, "eval_steps_per_second": 8.584, "step": 1696 }, { "epoch": 17.0, "grad_norm": 0.7031758427619934, "learning_rate": 4.15e-05, "loss": 0.0958, "step": 1802 }, { "epoch": 17.0, "eval_LOCATION_f1": 0.8104575163398693, "eval_LOCATION_number": 71, "eval_LOCATION_precision": 0.7560975609756098, "eval_LOCATION_recall": 0.8732394366197183, "eval_ORGANIZATION_f1": 0.728395061728395, "eval_ORGANIZATION_number": 65, "eval_ORGANIZATION_precision": 0.6082474226804123, "eval_ORGANIZATION_recall": 0.9076923076923077, "eval_PERSON_f1": 0.90032154340836, "eval_PERSON_number": 150, "eval_PERSON_precision": 0.8695652173913043, "eval_PERSON_recall": 0.9333333333333333, "eval_QUANTITY_f1": 0.7671232876712328, "eval_QUANTITY_number": 33, "eval_QUANTITY_precision": 0.7, "eval_QUANTITY_recall": 0.8484848484848485, "eval_TIME_f1": 0.8333333333333334, "eval_TIME_number": 28, "eval_TIME_precision": 0.78125, "eval_TIME_recall": 0.8928571428571429, "eval_loss": 0.12715467810630798, "eval_overall_accuracy": 0.9580504364694471, "eval_overall_f1": 0.8274044795783926, "eval_overall_precision": 0.7621359223300971, "eval_overall_recall": 0.9048991354466859, "eval_runtime": 0.3498, "eval_samples_per_second": 534.552, "eval_steps_per_second": 8.576, "step": 1802 }, { "epoch": 18.0, "grad_norm": 0.8438174724578857, "learning_rate": 4.1e-05, "loss": 0.0957, "step": 1908 }, { "epoch": 18.0, "eval_LOCATION_f1": 0.782051282051282, "eval_LOCATION_number": 71, "eval_LOCATION_precision": 0.7176470588235294, "eval_LOCATION_recall": 0.8591549295774648, "eval_ORGANIZATION_f1": 0.7017543859649122, "eval_ORGANIZATION_number": 65, "eval_ORGANIZATION_precision": 0.5660377358490566, "eval_ORGANIZATION_recall": 0.9230769230769231, "eval_PERSON_f1": 0.8945686900958466, "eval_PERSON_number": 150, "eval_PERSON_precision": 0.8588957055214724, "eval_PERSON_recall": 0.9333333333333333, "eval_QUANTITY_f1": 0.7105263157894738, "eval_QUANTITY_number": 33, "eval_QUANTITY_precision": 0.627906976744186, "eval_QUANTITY_recall": 0.8181818181818182, "eval_TIME_f1": 0.8333333333333334, "eval_TIME_number": 28, "eval_TIME_precision": 0.78125, "eval_TIME_recall": 0.8928571428571429, "eval_loss": 0.14869378507137299, "eval_overall_accuracy": 0.9527158098933075, "eval_overall_f1": 0.8067010309278351, "eval_overall_precision": 0.7296037296037297, "eval_overall_recall": 0.9020172910662824, "eval_runtime": 0.3502, "eval_samples_per_second": 534.029, "eval_steps_per_second": 8.567, "step": 1908 }, { "epoch": 19.0, "grad_norm": 0.7291853427886963, "learning_rate": 4.05e-05, "loss": 0.0943, "step": 2014 }, { "epoch": 19.0, "eval_LOCATION_f1": 0.8026315789473684, "eval_LOCATION_number": 71, "eval_LOCATION_precision": 0.7530864197530864, "eval_LOCATION_recall": 0.8591549295774648, "eval_ORGANIZATION_f1": 0.7195121951219511, "eval_ORGANIZATION_number": 65, "eval_ORGANIZATION_precision": 0.5959595959595959, "eval_ORGANIZATION_recall": 0.9076923076923077, "eval_PERSON_f1": 0.90032154340836, "eval_PERSON_number": 150, "eval_PERSON_precision": 0.8695652173913043, "eval_PERSON_recall": 0.9333333333333333, "eval_QUANTITY_f1": 0.7567567567567567, "eval_QUANTITY_number": 33, "eval_QUANTITY_precision": 0.6829268292682927, "eval_QUANTITY_recall": 0.8484848484848485, "eval_TIME_f1": 0.8771929824561403, "eval_TIME_number": 28, "eval_TIME_precision": 0.8620689655172413, "eval_TIME_recall": 0.8928571428571429, "eval_loss": 0.12535077333450317, "eval_overall_accuracy": 0.957807953443259, "eval_overall_f1": 0.8258575197889182, "eval_overall_precision": 0.7615571776155717, "eval_overall_recall": 0.9020172910662824, "eval_runtime": 0.3513, "eval_samples_per_second": 532.375, "eval_steps_per_second": 8.541, "step": 2014 }, { "epoch": 20.0, "grad_norm": 1.0950889587402344, "learning_rate": 4e-05, "loss": 0.0915, "step": 2120 }, { "epoch": 20.0, "eval_LOCATION_f1": 0.8026315789473684, "eval_LOCATION_number": 71, "eval_LOCATION_precision": 0.7530864197530864, "eval_LOCATION_recall": 0.8591549295774648, "eval_ORGANIZATION_f1": 0.7421383647798743, "eval_ORGANIZATION_number": 65, "eval_ORGANIZATION_precision": 0.6276595744680851, "eval_ORGANIZATION_recall": 0.9076923076923077, "eval_PERSON_f1": 0.90032154340836, "eval_PERSON_number": 150, "eval_PERSON_precision": 0.8695652173913043, "eval_PERSON_recall": 0.9333333333333333, "eval_QUANTITY_f1": 0.7466666666666666, "eval_QUANTITY_number": 33, "eval_QUANTITY_precision": 0.6666666666666666, "eval_QUANTITY_recall": 0.8484848484848485, "eval_TIME_f1": 0.9259259259259259, "eval_TIME_number": 28, "eval_TIME_precision": 0.9615384615384616, "eval_TIME_recall": 0.8928571428571429, "eval_loss": 0.12668967247009277, "eval_overall_accuracy": 0.9590203685741998, "eval_overall_f1": 0.8335552596537948, "eval_overall_precision": 0.7747524752475248, "eval_overall_recall": 0.9020172910662824, "eval_runtime": 0.3504, "eval_samples_per_second": 533.636, "eval_steps_per_second": 8.561, "step": 2120 }, { "epoch": 21.0, "grad_norm": 1.227335810661316, "learning_rate": 3.9500000000000005e-05, "loss": 0.0834, "step": 2226 }, { "epoch": 21.0, "eval_LOCATION_f1": 0.7672955974842768, "eval_LOCATION_number": 71, "eval_LOCATION_precision": 0.6931818181818182, "eval_LOCATION_recall": 0.8591549295774648, "eval_ORGANIZATION_f1": 0.7239263803680982, "eval_ORGANIZATION_number": 65, "eval_ORGANIZATION_precision": 0.6020408163265306, "eval_ORGANIZATION_recall": 0.9076923076923077, "eval_PERSON_f1": 0.8938906752411575, "eval_PERSON_number": 150, "eval_PERSON_precision": 0.8633540372670807, "eval_PERSON_recall": 0.9266666666666666, "eval_QUANTITY_f1": 0.6410256410256411, "eval_QUANTITY_number": 33, "eval_QUANTITY_precision": 0.5555555555555556, "eval_QUANTITY_recall": 0.7575757575757576, "eval_TIME_f1": 0.8928571428571429, "eval_TIME_number": 28, "eval_TIME_precision": 0.8928571428571429, "eval_TIME_recall": 0.8928571428571429, "eval_loss": 0.1432582437992096, "eval_overall_accuracy": 0.953443258971872, "eval_overall_f1": 0.8057366362451109, "eval_overall_precision": 0.7357142857142858, "eval_overall_recall": 0.8904899135446686, "eval_runtime": 0.3505, "eval_samples_per_second": 533.585, "eval_steps_per_second": 8.56, "step": 2226 }, { "epoch": 22.0, "grad_norm": 0.8867971301078796, "learning_rate": 3.9000000000000006e-05, "loss": 0.0839, "step": 2332 }, { "epoch": 22.0, "eval_LOCATION_f1": 0.7922077922077921, "eval_LOCATION_number": 71, "eval_LOCATION_precision": 0.7349397590361446, "eval_LOCATION_recall": 0.8591549295774648, "eval_ORGANIZATION_f1": 0.7329192546583851, "eval_ORGANIZATION_number": 65, "eval_ORGANIZATION_precision": 0.6145833333333334, "eval_ORGANIZATION_recall": 0.9076923076923077, "eval_PERSON_f1": 0.9032258064516129, "eval_PERSON_number": 150, "eval_PERSON_precision": 0.875, "eval_PERSON_recall": 0.9333333333333333, "eval_QUANTITY_f1": 0.6582278481012658, "eval_QUANTITY_number": 33, "eval_QUANTITY_precision": 0.5652173913043478, "eval_QUANTITY_recall": 0.7878787878787878, "eval_TIME_f1": 0.8928571428571429, "eval_TIME_number": 28, "eval_TIME_precision": 0.8928571428571429, "eval_TIME_recall": 0.8928571428571429, "eval_loss": 0.14338690042495728, "eval_overall_accuracy": 0.9546556741028128, "eval_overall_f1": 0.8184210526315788, "eval_overall_precision": 0.7530266343825666, "eval_overall_recall": 0.8962536023054755, "eval_runtime": 0.3497, "eval_samples_per_second": 534.745, "eval_steps_per_second": 8.579, "step": 2332 }, { "epoch": 23.0, "grad_norm": 1.0698140859603882, "learning_rate": 3.85e-05, "loss": 0.0807, "step": 2438 }, { "epoch": 23.0, "eval_LOCATION_f1": 0.782051282051282, "eval_LOCATION_number": 71, "eval_LOCATION_precision": 0.7176470588235294, "eval_LOCATION_recall": 0.8591549295774648, "eval_ORGANIZATION_f1": 0.7195121951219511, "eval_ORGANIZATION_number": 65, "eval_ORGANIZATION_precision": 0.5959595959595959, "eval_ORGANIZATION_recall": 0.9076923076923077, "eval_PERSON_f1": 0.912621359223301, "eval_PERSON_number": 150, "eval_PERSON_precision": 0.8867924528301887, "eval_PERSON_recall": 0.94, "eval_QUANTITY_f1": 0.7671232876712328, "eval_QUANTITY_number": 33, "eval_QUANTITY_precision": 0.7, "eval_QUANTITY_recall": 0.8484848484848485, "eval_TIME_f1": 0.8474576271186439, "eval_TIME_number": 28, "eval_TIME_precision": 0.8064516129032258, "eval_TIME_recall": 0.8928571428571429, "eval_loss": 0.13598859310150146, "eval_overall_accuracy": 0.9585354025218235, "eval_overall_f1": 0.8252299605781866, "eval_overall_precision": 0.7584541062801933, "eval_overall_recall": 0.9048991354466859, "eval_runtime": 0.3499, "eval_samples_per_second": 534.445, "eval_steps_per_second": 8.574, "step": 2438 }, { "epoch": 24.0, "grad_norm": 0.7420476675033569, "learning_rate": 3.8e-05, "loss": 0.0771, "step": 2544 }, { "epoch": 24.0, "eval_LOCATION_f1": 0.7870967741935485, "eval_LOCATION_number": 71, "eval_LOCATION_precision": 0.7261904761904762, "eval_LOCATION_recall": 0.8591549295774648, "eval_ORGANIZATION_f1": 0.7215189873417722, "eval_ORGANIZATION_number": 65, "eval_ORGANIZATION_precision": 0.6129032258064516, "eval_ORGANIZATION_recall": 0.8769230769230769, "eval_PERSON_f1": 0.9137380191693292, "eval_PERSON_number": 150, "eval_PERSON_precision": 0.8773006134969326, "eval_PERSON_recall": 0.9533333333333334, "eval_QUANTITY_f1": 0.6419753086419753, "eval_QUANTITY_number": 33, "eval_QUANTITY_precision": 0.5416666666666666, "eval_QUANTITY_recall": 0.7878787878787878, "eval_TIME_f1": 0.8571428571428571, "eval_TIME_number": 28, "eval_TIME_precision": 0.8571428571428571, "eval_TIME_recall": 0.8571428571428571, "eval_loss": 0.14340347051620483, "eval_overall_accuracy": 0.9539282250242483, "eval_overall_f1": 0.8152031454783748, "eval_overall_precision": 0.7475961538461539, "eval_overall_recall": 0.8962536023054755, "eval_runtime": 0.3509, "eval_samples_per_second": 532.923, "eval_steps_per_second": 8.55, "step": 2544 }, { "epoch": 25.0, "grad_norm": 1.0963969230651855, "learning_rate": 3.7500000000000003e-05, "loss": 0.0772, "step": 2650 }, { "epoch": 25.0, "eval_LOCATION_f1": 0.7770700636942676, "eval_LOCATION_number": 71, "eval_LOCATION_precision": 0.7093023255813954, "eval_LOCATION_recall": 0.8591549295774648, "eval_ORGANIZATION_f1": 0.7065868263473054, "eval_ORGANIZATION_number": 65, "eval_ORGANIZATION_precision": 0.5784313725490197, "eval_ORGANIZATION_recall": 0.9076923076923077, "eval_PERSON_f1": 0.90032154340836, "eval_PERSON_number": 150, "eval_PERSON_precision": 0.8695652173913043, "eval_PERSON_recall": 0.9333333333333333, "eval_QUANTITY_f1": 0.6428571428571428, "eval_QUANTITY_number": 33, "eval_QUANTITY_precision": 0.5294117647058824, "eval_QUANTITY_recall": 0.8181818181818182, "eval_TIME_f1": 0.8333333333333334, "eval_TIME_number": 28, "eval_TIME_precision": 0.78125, "eval_TIME_recall": 0.8928571428571429, "eval_loss": 0.1520393043756485, "eval_overall_accuracy": 0.9502909796314258, "eval_overall_f1": 0.8010269576379975, "eval_overall_precision": 0.7222222222222222, "eval_overall_recall": 0.899135446685879, "eval_runtime": 0.3508, "eval_samples_per_second": 533.007, "eval_steps_per_second": 8.551, "step": 2650 }, { "epoch": 26.0, "grad_norm": 0.38709110021591187, "learning_rate": 3.7e-05, "loss": 0.0732, "step": 2756 }, { "epoch": 26.0, "eval_LOCATION_f1": 0.7741935483870968, "eval_LOCATION_number": 71, "eval_LOCATION_precision": 0.7142857142857143, "eval_LOCATION_recall": 0.8450704225352113, "eval_ORGANIZATION_f1": 0.7499999999999999, "eval_ORGANIZATION_number": 65, "eval_ORGANIZATION_precision": 0.631578947368421, "eval_ORGANIZATION_recall": 0.9230769230769231, "eval_PERSON_f1": 0.9032258064516129, "eval_PERSON_number": 150, "eval_PERSON_precision": 0.875, "eval_PERSON_recall": 0.9333333333333333, "eval_QUANTITY_f1": 0.6923076923076923, "eval_QUANTITY_number": 33, "eval_QUANTITY_precision": 0.6, "eval_QUANTITY_recall": 0.8181818181818182, "eval_TIME_f1": 0.9259259259259259, "eval_TIME_number": 28, "eval_TIME_precision": 0.9615384615384616, "eval_TIME_recall": 0.8928571428571429, "eval_loss": 0.14221937954425812, "eval_overall_accuracy": 0.9570805043646945, "eval_overall_f1": 0.8243064729194188, "eval_overall_precision": 0.7609756097560976, "eval_overall_recall": 0.899135446685879, "eval_runtime": 0.3493, "eval_samples_per_second": 535.398, "eval_steps_per_second": 8.589, "step": 2756 }, { "epoch": 27.0, "grad_norm": 0.5424766540527344, "learning_rate": 3.65e-05, "loss": 0.0731, "step": 2862 }, { "epoch": 27.0, "eval_LOCATION_f1": 0.8026315789473684, "eval_LOCATION_number": 71, "eval_LOCATION_precision": 0.7530864197530864, "eval_LOCATION_recall": 0.8591549295774648, "eval_ORGANIZATION_f1": 0.7564102564102564, "eval_ORGANIZATION_number": 65, "eval_ORGANIZATION_precision": 0.6483516483516484, "eval_ORGANIZATION_recall": 0.9076923076923077, "eval_PERSON_f1": 0.8938906752411575, "eval_PERSON_number": 150, "eval_PERSON_precision": 0.8633540372670807, "eval_PERSON_recall": 0.9266666666666666, "eval_QUANTITY_f1": 0.65, "eval_QUANTITY_number": 33, "eval_QUANTITY_precision": 0.5531914893617021, "eval_QUANTITY_recall": 0.7878787878787878, "eval_TIME_f1": 0.8524590163934426, "eval_TIME_number": 28, "eval_TIME_precision": 0.7878787878787878, "eval_TIME_recall": 0.9285714285714286, "eval_loss": 0.13665592670440674, "eval_overall_accuracy": 0.9556256062075654, "eval_overall_f1": 0.8184210526315788, "eval_overall_precision": 0.7530266343825666, "eval_overall_recall": 0.8962536023054755, "eval_runtime": 0.3499, "eval_samples_per_second": 534.475, "eval_steps_per_second": 8.574, "step": 2862 }, { "epoch": 28.0, "grad_norm": 2.6486599445343018, "learning_rate": 3.6e-05, "loss": 0.0697, "step": 2968 }, { "epoch": 28.0, "eval_LOCATION_f1": 0.8026315789473684, "eval_LOCATION_number": 71, "eval_LOCATION_precision": 0.7530864197530864, "eval_LOCATION_recall": 0.8591549295774648, "eval_ORGANIZATION_f1": 0.7160493827160493, "eval_ORGANIZATION_number": 65, "eval_ORGANIZATION_precision": 0.5979381443298969, "eval_ORGANIZATION_recall": 0.8923076923076924, "eval_PERSON_f1": 0.9142857142857144, "eval_PERSON_number": 150, "eval_PERSON_precision": 0.8727272727272727, "eval_PERSON_recall": 0.96, "eval_QUANTITY_f1": 0.6329113924050633, "eval_QUANTITY_number": 33, "eval_QUANTITY_precision": 0.5434782608695652, "eval_QUANTITY_recall": 0.7575757575757576, "eval_TIME_f1": 0.8333333333333334, "eval_TIME_number": 28, "eval_TIME_precision": 0.78125, "eval_TIME_recall": 0.8928571428571429, "eval_loss": 0.14497701823711395, "eval_overall_accuracy": 0.954898157129001, "eval_overall_f1": 0.8151041666666666, "eval_overall_precision": 0.7434679334916865, "eval_overall_recall": 0.9020172910662824, "eval_runtime": 0.3505, "eval_samples_per_second": 533.595, "eval_steps_per_second": 8.56, "step": 2968 }, { "epoch": 29.0, "grad_norm": 0.7765714526176453, "learning_rate": 3.55e-05, "loss": 0.0689, "step": 3074 }, { "epoch": 29.0, "eval_LOCATION_f1": 0.8076923076923077, "eval_LOCATION_number": 71, "eval_LOCATION_precision": 0.7411764705882353, "eval_LOCATION_recall": 0.8873239436619719, "eval_ORGANIZATION_f1": 0.7085714285714286, "eval_ORGANIZATION_number": 65, "eval_ORGANIZATION_precision": 0.5636363636363636, "eval_ORGANIZATION_recall": 0.9538461538461539, "eval_PERSON_f1": 0.887459807073955, "eval_PERSON_number": 150, "eval_PERSON_precision": 0.8571428571428571, "eval_PERSON_recall": 0.92, "eval_QUANTITY_f1": 0.7397260273972603, "eval_QUANTITY_number": 33, "eval_QUANTITY_precision": 0.675, "eval_QUANTITY_recall": 0.8181818181818182, "eval_TIME_f1": 0.7936507936507937, "eval_TIME_number": 28, "eval_TIME_precision": 0.7142857142857143, "eval_TIME_recall": 0.8928571428571429, "eval_loss": 0.15288624167442322, "eval_overall_accuracy": 0.9553831231813773, "eval_overall_f1": 0.8097686375321336, "eval_overall_precision": 0.7308584686774942, "eval_overall_recall": 0.9077809798270894, "eval_runtime": 0.3501, "eval_samples_per_second": 534.16, "eval_steps_per_second": 8.569, "step": 3074 }, { "epoch": 30.0, "grad_norm": 0.8394734263420105, "learning_rate": 3.5e-05, "loss": 0.0669, "step": 3180 }, { "epoch": 30.0, "eval_LOCATION_f1": 0.7870967741935485, "eval_LOCATION_number": 71, "eval_LOCATION_precision": 0.7261904761904762, "eval_LOCATION_recall": 0.8591549295774648, "eval_ORGANIZATION_f1": 0.7421383647798743, "eval_ORGANIZATION_number": 65, "eval_ORGANIZATION_precision": 0.6276595744680851, "eval_ORGANIZATION_recall": 0.9076923076923077, "eval_PERSON_f1": 0.887459807073955, "eval_PERSON_number": 150, "eval_PERSON_precision": 0.8571428571428571, "eval_PERSON_recall": 0.92, "eval_QUANTITY_f1": 0.736842105263158, "eval_QUANTITY_number": 33, "eval_QUANTITY_precision": 0.6511627906976745, "eval_QUANTITY_recall": 0.8484848484848485, "eval_TIME_f1": 0.8135593220338982, "eval_TIME_number": 28, "eval_TIME_precision": 0.7741935483870968, "eval_TIME_recall": 0.8571428571428571, "eval_loss": 0.14122405648231506, "eval_overall_accuracy": 0.9570805043646945, "eval_overall_f1": 0.8157894736842105, "eval_overall_precision": 0.7506053268765133, "eval_overall_recall": 0.8933717579250721, "eval_runtime": 0.3503, "eval_samples_per_second": 533.82, "eval_steps_per_second": 8.564, "step": 3180 }, { "epoch": 31.0, "grad_norm": 0.43885117769241333, "learning_rate": 3.45e-05, "loss": 0.0654, "step": 3286 }, { "epoch": 31.0, "eval_LOCATION_f1": 0.779874213836478, "eval_LOCATION_number": 71, "eval_LOCATION_precision": 0.7045454545454546, "eval_LOCATION_recall": 0.8732394366197183, "eval_ORGANIZATION_f1": 0.7741935483870968, "eval_ORGANIZATION_number": 65, "eval_ORGANIZATION_precision": 0.6666666666666666, "eval_ORGANIZATION_recall": 0.9230769230769231, "eval_PERSON_f1": 0.8810289389067525, "eval_PERSON_number": 150, "eval_PERSON_precision": 0.8509316770186336, "eval_PERSON_recall": 0.9133333333333333, "eval_QUANTITY_f1": 0.7397260273972603, "eval_QUANTITY_number": 33, "eval_QUANTITY_precision": 0.675, "eval_QUANTITY_recall": 0.8181818181818182, "eval_TIME_f1": 0.8620689655172413, "eval_TIME_number": 28, "eval_TIME_precision": 0.8333333333333334, "eval_TIME_recall": 0.8928571428571429, "eval_loss": 0.13700760900974274, "eval_overall_accuracy": 0.9614451988360815, "eval_overall_f1": 0.8227513227513227, "eval_overall_precision": 0.7603911980440098, "eval_overall_recall": 0.8962536023054755, "eval_runtime": 0.3506, "eval_samples_per_second": 533.416, "eval_steps_per_second": 8.557, "step": 3286 }, { "epoch": 32.0, "grad_norm": 0.3841339647769928, "learning_rate": 3.4000000000000007e-05, "loss": 0.0639, "step": 3392 }, { "epoch": 32.0, "eval_LOCATION_f1": 0.7922077922077921, "eval_LOCATION_number": 71, "eval_LOCATION_precision": 0.7349397590361446, "eval_LOCATION_recall": 0.8591549295774648, "eval_ORGANIZATION_f1": 0.7108433734939759, "eval_ORGANIZATION_number": 65, "eval_ORGANIZATION_precision": 0.5841584158415841, "eval_ORGANIZATION_recall": 0.9076923076923077, "eval_PERSON_f1": 0.8903225806451613, "eval_PERSON_number": 150, "eval_PERSON_precision": 0.8625, "eval_PERSON_recall": 0.92, "eval_QUANTITY_f1": 0.7012987012987013, "eval_QUANTITY_number": 33, "eval_QUANTITY_precision": 0.6136363636363636, "eval_QUANTITY_recall": 0.8181818181818182, "eval_TIME_f1": 0.8771929824561403, "eval_TIME_number": 28, "eval_TIME_precision": 0.8620689655172413, "eval_TIME_recall": 0.8928571428571429, "eval_loss": 0.14966341853141785, "eval_overall_accuracy": 0.9561105722599418, "eval_overall_f1": 0.81151832460733, "eval_overall_precision": 0.7434052757793765, "eval_overall_recall": 0.8933717579250721, "eval_runtime": 0.3501, "eval_samples_per_second": 534.13, "eval_steps_per_second": 8.569, "step": 3392 }, { "epoch": 33.0, "grad_norm": 0.86671382188797, "learning_rate": 3.35e-05, "loss": 0.0637, "step": 3498 }, { "epoch": 33.0, "eval_LOCATION_f1": 0.8051948051948051, "eval_LOCATION_number": 71, "eval_LOCATION_precision": 0.7469879518072289, "eval_LOCATION_recall": 0.8732394366197183, "eval_ORGANIZATION_f1": 0.7297297297297298, "eval_ORGANIZATION_number": 65, "eval_ORGANIZATION_precision": 0.6506024096385542, "eval_ORGANIZATION_recall": 0.8307692307692308, "eval_PERSON_f1": 0.9009584664536742, "eval_PERSON_number": 150, "eval_PERSON_precision": 0.8650306748466258, "eval_PERSON_recall": 0.94, "eval_QUANTITY_f1": 0.7297297297297297, "eval_QUANTITY_number": 33, "eval_QUANTITY_precision": 0.6585365853658537, "eval_QUANTITY_recall": 0.8181818181818182, "eval_TIME_f1": 0.7868852459016394, "eval_TIME_number": 28, "eval_TIME_precision": 0.7272727272727273, "eval_TIME_recall": 0.8571428571428571, "eval_loss": 0.13783931732177734, "eval_overall_accuracy": 0.9597478176527643, "eval_overall_f1": 0.8213333333333332, "eval_overall_precision": 0.7642679900744417, "eval_overall_recall": 0.8876080691642652, "eval_runtime": 0.3499, "eval_samples_per_second": 534.488, "eval_steps_per_second": 8.575, "step": 3498 }, { "epoch": 34.0, "grad_norm": 0.8965917229652405, "learning_rate": 3.3e-05, "loss": 0.0625, "step": 3604 }, { "epoch": 34.0, "eval_LOCATION_f1": 0.8181818181818181, "eval_LOCATION_number": 71, "eval_LOCATION_precision": 0.7590361445783133, "eval_LOCATION_recall": 0.8873239436619719, "eval_ORGANIZATION_f1": 0.759493670886076, "eval_ORGANIZATION_number": 65, "eval_ORGANIZATION_precision": 0.6451612903225806, "eval_ORGANIZATION_recall": 0.9230769230769231, "eval_PERSON_f1": 0.896774193548387, "eval_PERSON_number": 150, "eval_PERSON_precision": 0.86875, "eval_PERSON_recall": 0.9266666666666666, "eval_QUANTITY_f1": 0.7297297297297297, "eval_QUANTITY_number": 33, "eval_QUANTITY_precision": 0.6585365853658537, "eval_QUANTITY_recall": 0.8181818181818182, "eval_TIME_f1": 0.8666666666666666, "eval_TIME_number": 28, "eval_TIME_precision": 0.8125, "eval_TIME_recall": 0.9285714285714286, "eval_loss": 0.14487268030643463, "eval_overall_accuracy": 0.9587778855480117, "eval_overall_f1": 0.8333333333333334, "eval_overall_precision": 0.7701711491442543, "eval_overall_recall": 0.9077809798270894, "eval_runtime": 0.3507, "eval_samples_per_second": 533.265, "eval_steps_per_second": 8.555, "step": 3604 }, { "epoch": 35.0, "grad_norm": 0.7054619193077087, "learning_rate": 3.2500000000000004e-05, "loss": 0.0634, "step": 3710 }, { "epoch": 35.0, "eval_LOCATION_f1": 0.7898089171974522, "eval_LOCATION_number": 71, "eval_LOCATION_precision": 0.7209302325581395, "eval_LOCATION_recall": 0.8732394366197183, "eval_ORGANIZATION_f1": 0.7483870967741936, "eval_ORGANIZATION_number": 65, "eval_ORGANIZATION_precision": 0.6444444444444445, "eval_ORGANIZATION_recall": 0.8923076923076924, "eval_PERSON_f1": 0.8903225806451613, "eval_PERSON_number": 150, "eval_PERSON_precision": 0.8625, "eval_PERSON_recall": 0.92, "eval_QUANTITY_f1": 0.7012987012987013, "eval_QUANTITY_number": 33, "eval_QUANTITY_precision": 0.6136363636363636, "eval_QUANTITY_recall": 0.8181818181818182, "eval_TIME_f1": 0.896551724137931, "eval_TIME_number": 28, "eval_TIME_precision": 0.8666666666666667, "eval_TIME_recall": 0.9285714285714286, "eval_loss": 0.14537405967712402, "eval_overall_accuracy": 0.9573229873908826, "eval_overall_f1": 0.821664464993395, "eval_overall_precision": 0.7585365853658537, "eval_overall_recall": 0.8962536023054755, "eval_runtime": 0.35, "eval_samples_per_second": 534.224, "eval_steps_per_second": 8.57, "step": 3710 }, { "epoch": 36.0, "grad_norm": 0.9769655466079712, "learning_rate": 3.2000000000000005e-05, "loss": 0.0592, "step": 3816 }, { "epoch": 36.0, "eval_LOCATION_f1": 0.8051948051948051, "eval_LOCATION_number": 71, "eval_LOCATION_precision": 0.7469879518072289, "eval_LOCATION_recall": 0.8732394366197183, "eval_ORGANIZATION_f1": 0.7672955974842768, "eval_ORGANIZATION_number": 65, "eval_ORGANIZATION_precision": 0.648936170212766, "eval_ORGANIZATION_recall": 0.9384615384615385, "eval_PERSON_f1": 0.9067524115755627, "eval_PERSON_number": 150, "eval_PERSON_precision": 0.8757763975155279, "eval_PERSON_recall": 0.94, "eval_QUANTITY_f1": 0.6923076923076923, "eval_QUANTITY_number": 33, "eval_QUANTITY_precision": 0.6, "eval_QUANTITY_recall": 0.8181818181818182, "eval_TIME_f1": 0.8387096774193549, "eval_TIME_number": 28, "eval_TIME_precision": 0.7647058823529411, "eval_TIME_recall": 0.9285714285714286, "eval_loss": 0.1611613929271698, "eval_overall_accuracy": 0.9561105722599418, "eval_overall_f1": 0.8298429319371728, "eval_overall_precision": 0.7601918465227818, "eval_overall_recall": 0.9135446685878963, "eval_runtime": 0.3514, "eval_samples_per_second": 532.12, "eval_steps_per_second": 8.537, "step": 3816 }, { "epoch": 37.0, "grad_norm": 0.828741192817688, "learning_rate": 3.15e-05, "loss": 0.0597, "step": 3922 }, { "epoch": 37.0, "eval_LOCATION_f1": 0.7643312101910827, "eval_LOCATION_number": 71, "eval_LOCATION_precision": 0.6976744186046512, "eval_LOCATION_recall": 0.8450704225352113, "eval_ORGANIZATION_f1": 0.7439024390243902, "eval_ORGANIZATION_number": 65, "eval_ORGANIZATION_precision": 0.6161616161616161, "eval_ORGANIZATION_recall": 0.9384615384615385, "eval_PERSON_f1": 0.8974358974358974, "eval_PERSON_number": 150, "eval_PERSON_precision": 0.8641975308641975, "eval_PERSON_recall": 0.9333333333333333, "eval_QUANTITY_f1": 0.6666666666666666, "eval_QUANTITY_number": 33, "eval_QUANTITY_precision": 0.5777777777777777, "eval_QUANTITY_recall": 0.7878787878787878, "eval_TIME_f1": 0.8333333333333334, "eval_TIME_number": 28, "eval_TIME_precision": 0.78125, "eval_TIME_recall": 0.8928571428571429, "eval_loss": 0.1625693291425705, "eval_overall_accuracy": 0.953443258971872, "eval_overall_f1": 0.8093385214007783, "eval_overall_precision": 0.7358490566037735, "eval_overall_recall": 0.899135446685879, "eval_runtime": 0.3504, "eval_samples_per_second": 533.713, "eval_steps_per_second": 8.562, "step": 3922 }, { "epoch": 38.0, "grad_norm": 1.4891364574432373, "learning_rate": 3.1e-05, "loss": 0.0573, "step": 4028 }, { "epoch": 38.0, "eval_LOCATION_f1": 0.8051948051948051, "eval_LOCATION_number": 71, "eval_LOCATION_precision": 0.7469879518072289, "eval_LOCATION_recall": 0.8732394366197183, "eval_ORGANIZATION_f1": 0.7297297297297298, "eval_ORGANIZATION_number": 65, "eval_ORGANIZATION_precision": 0.6506024096385542, "eval_ORGANIZATION_recall": 0.8307692307692308, "eval_PERSON_f1": 0.8859934853420196, "eval_PERSON_number": 150, "eval_PERSON_precision": 0.8662420382165605, "eval_PERSON_recall": 0.9066666666666666, "eval_QUANTITY_f1": 0.7027027027027027, "eval_QUANTITY_number": 33, "eval_QUANTITY_precision": 0.6341463414634146, "eval_QUANTITY_recall": 0.7878787878787878, "eval_TIME_f1": 0.8524590163934426, "eval_TIME_number": 28, "eval_TIME_precision": 0.7878787878787878, "eval_TIME_recall": 0.9285714285714286, "eval_loss": 0.1448131501674652, "eval_overall_accuracy": 0.9570805043646945, "eval_overall_f1": 0.8172043010752689, "eval_overall_precision": 0.7657430730478589, "eval_overall_recall": 0.8760806916426513, "eval_runtime": 0.3501, "eval_samples_per_second": 534.187, "eval_steps_per_second": 8.57, "step": 4028 }, { "epoch": 39.0, "grad_norm": 0.5322253704071045, "learning_rate": 3.05e-05, "loss": 0.0561, "step": 4134 }, { "epoch": 39.0, "eval_LOCATION_f1": 0.7870967741935485, "eval_LOCATION_number": 71, "eval_LOCATION_precision": 0.7261904761904762, "eval_LOCATION_recall": 0.8591549295774648, "eval_ORGANIZATION_f1": 0.7643312101910829, "eval_ORGANIZATION_number": 65, "eval_ORGANIZATION_precision": 0.6521739130434783, "eval_ORGANIZATION_recall": 0.9230769230769231, "eval_PERSON_f1": 0.8938906752411575, "eval_PERSON_number": 150, "eval_PERSON_precision": 0.8633540372670807, "eval_PERSON_recall": 0.9266666666666666, "eval_QUANTITY_f1": 0.7297297297297297, "eval_QUANTITY_number": 33, "eval_QUANTITY_precision": 0.6585365853658537, "eval_QUANTITY_recall": 0.8181818181818182, "eval_TIME_f1": 0.8333333333333334, "eval_TIME_number": 28, "eval_TIME_precision": 0.78125, "eval_TIME_recall": 0.8928571428571429, "eval_loss": 0.14745843410491943, "eval_overall_accuracy": 0.9582929194956353, "eval_overall_f1": 0.8243064729194188, "eval_overall_precision": 0.7609756097560976, "eval_overall_recall": 0.899135446685879, "eval_runtime": 0.3508, "eval_samples_per_second": 533.023, "eval_steps_per_second": 8.551, "step": 4134 }, { "epoch": 40.0, "grad_norm": 1.2674453258514404, "learning_rate": 3e-05, "loss": 0.0521, "step": 4240 }, { "epoch": 40.0, "eval_LOCATION_f1": 0.8104575163398693, "eval_LOCATION_number": 71, "eval_LOCATION_precision": 0.7560975609756098, "eval_LOCATION_recall": 0.8732394366197183, "eval_ORGANIZATION_f1": 0.7169811320754718, "eval_ORGANIZATION_number": 65, "eval_ORGANIZATION_precision": 0.6063829787234043, "eval_ORGANIZATION_recall": 0.8769230769230769, "eval_PERSON_f1": 0.8932038834951457, "eval_PERSON_number": 150, "eval_PERSON_precision": 0.8679245283018868, "eval_PERSON_recall": 0.92, "eval_QUANTITY_f1": 0.7222222222222221, "eval_QUANTITY_number": 33, "eval_QUANTITY_precision": 0.6666666666666666, "eval_QUANTITY_recall": 0.7878787878787878, "eval_TIME_f1": 0.806451612903226, "eval_TIME_number": 28, "eval_TIME_precision": 0.7352941176470589, "eval_TIME_recall": 0.8928571428571429, "eval_loss": 0.14856770634651184, "eval_overall_accuracy": 0.9587778855480117, "eval_overall_f1": 0.8158940397350992, "eval_overall_precision": 0.7549019607843137, "eval_overall_recall": 0.8876080691642652, "eval_runtime": 0.3497, "eval_samples_per_second": 534.717, "eval_steps_per_second": 8.578, "step": 4240 }, { "epoch": 41.0, "grad_norm": 0.23710742592811584, "learning_rate": 2.95e-05, "loss": 0.0526, "step": 4346 }, { "epoch": 41.0, "eval_LOCATION_f1": 0.7792207792207793, "eval_LOCATION_number": 71, "eval_LOCATION_precision": 0.7228915662650602, "eval_LOCATION_recall": 0.8450704225352113, "eval_ORGANIZATION_f1": 0.7272727272727274, "eval_ORGANIZATION_number": 65, "eval_ORGANIZATION_precision": 0.6, "eval_ORGANIZATION_recall": 0.9230769230769231, "eval_PERSON_f1": 0.8846153846153846, "eval_PERSON_number": 150, "eval_PERSON_precision": 0.8518518518518519, "eval_PERSON_recall": 0.92, "eval_QUANTITY_f1": 0.7272727272727273, "eval_QUANTITY_number": 33, "eval_QUANTITY_precision": 0.6363636363636364, "eval_QUANTITY_recall": 0.8484848484848485, "eval_TIME_f1": 0.8813559322033899, "eval_TIME_number": 28, "eval_TIME_precision": 0.8387096774193549, "eval_TIME_recall": 0.9285714285714286, "eval_loss": 0.15941469371318817, "eval_overall_accuracy": 0.9561105722599418, "eval_overall_f1": 0.8135593220338984, "eval_overall_precision": 0.7428571428571429, "eval_overall_recall": 0.899135446685879, "eval_runtime": 0.3497, "eval_samples_per_second": 534.713, "eval_steps_per_second": 8.578, "step": 4346 }, { "epoch": 42.0, "grad_norm": 0.5749427080154419, "learning_rate": 2.9e-05, "loss": 0.0505, "step": 4452 }, { "epoch": 42.0, "eval_LOCATION_f1": 0.8533333333333334, "eval_LOCATION_number": 71, "eval_LOCATION_precision": 0.810126582278481, "eval_LOCATION_recall": 0.9014084507042254, "eval_ORGANIZATION_f1": 0.7297297297297298, "eval_ORGANIZATION_number": 65, "eval_ORGANIZATION_precision": 0.6506024096385542, "eval_ORGANIZATION_recall": 0.8307692307692308, "eval_PERSON_f1": 0.8903225806451613, "eval_PERSON_number": 150, "eval_PERSON_precision": 0.8625, "eval_PERSON_recall": 0.92, "eval_QUANTITY_f1": 0.7397260273972603, "eval_QUANTITY_number": 33, "eval_QUANTITY_precision": 0.675, "eval_QUANTITY_recall": 0.8181818181818182, "eval_TIME_f1": 0.8387096774193549, "eval_TIME_number": 28, "eval_TIME_precision": 0.7647058823529411, "eval_TIME_recall": 0.9285714285714286, "eval_loss": 0.1528312712907791, "eval_overall_accuracy": 0.957807953443259, "eval_overall_f1": 0.8317631224764469, "eval_overall_precision": 0.7803030303030303, "eval_overall_recall": 0.8904899135446686, "eval_runtime": 0.3505, "eval_samples_per_second": 533.466, "eval_steps_per_second": 8.558, "step": 4452 }, { "epoch": 43.0, "grad_norm": 0.5371730923652649, "learning_rate": 2.8499999999999998e-05, "loss": 0.0497, "step": 4558 }, { "epoch": 43.0, "eval_LOCATION_f1": 0.7721518987341772, "eval_LOCATION_number": 71, "eval_LOCATION_precision": 0.7011494252873564, "eval_LOCATION_recall": 0.8591549295774648, "eval_ORGANIZATION_f1": 0.7006369426751592, "eval_ORGANIZATION_number": 65, "eval_ORGANIZATION_precision": 0.5978260869565217, "eval_ORGANIZATION_recall": 0.8461538461538461, "eval_PERSON_f1": 0.8903225806451613, "eval_PERSON_number": 150, "eval_PERSON_precision": 0.8625, "eval_PERSON_recall": 0.92, "eval_QUANTITY_f1": 0.7297297297297297, "eval_QUANTITY_number": 33, "eval_QUANTITY_precision": 0.6585365853658537, "eval_QUANTITY_recall": 0.8181818181818182, "eval_TIME_f1": 0.8387096774193549, "eval_TIME_number": 28, "eval_TIME_precision": 0.7647058823529411, "eval_TIME_recall": 0.9285714285714286, "eval_loss": 0.14798860251903534, "eval_overall_accuracy": 0.9573229873908826, "eval_overall_f1": 0.8068331143232589, "eval_overall_precision": 0.7415458937198067, "eval_overall_recall": 0.8847262247838616, "eval_runtime": 0.3497, "eval_samples_per_second": 534.734, "eval_steps_per_second": 8.579, "step": 4558 }, { "epoch": 44.0, "grad_norm": 0.9185490608215332, "learning_rate": 2.8000000000000003e-05, "loss": 0.0525, "step": 4664 }, { "epoch": 44.0, "eval_LOCATION_f1": 0.8205128205128205, "eval_LOCATION_number": 71, "eval_LOCATION_precision": 0.7529411764705882, "eval_LOCATION_recall": 0.9014084507042254, "eval_ORGANIZATION_f1": 0.7320261437908497, "eval_ORGANIZATION_number": 65, "eval_ORGANIZATION_precision": 0.6363636363636364, "eval_ORGANIZATION_recall": 0.8615384615384616, "eval_PERSON_f1": 0.90032154340836, "eval_PERSON_number": 150, "eval_PERSON_precision": 0.8695652173913043, "eval_PERSON_recall": 0.9333333333333333, "eval_QUANTITY_f1": 0.6933333333333334, "eval_QUANTITY_number": 33, "eval_QUANTITY_precision": 0.6190476190476191, "eval_QUANTITY_recall": 0.7878787878787878, "eval_TIME_f1": 0.8387096774193549, "eval_TIME_number": 28, "eval_TIME_precision": 0.7647058823529411, "eval_TIME_recall": 0.9285714285714286, "eval_loss": 0.15042471885681152, "eval_overall_accuracy": 0.9602327837051406, "eval_overall_f1": 0.8243064729194188, "eval_overall_precision": 0.7609756097560976, "eval_overall_recall": 0.899135446685879, "eval_runtime": 0.3507, "eval_samples_per_second": 533.267, "eval_steps_per_second": 8.555, "step": 4664 }, { "epoch": 45.0, "grad_norm": 1.4481260776519775, "learning_rate": 2.7500000000000004e-05, "loss": 0.0486, "step": 4770 }, { "epoch": 45.0, "eval_LOCATION_f1": 0.8289473684210527, "eval_LOCATION_number": 71, "eval_LOCATION_precision": 0.7777777777777778, "eval_LOCATION_recall": 0.8873239436619719, "eval_ORGANIZATION_f1": 0.7236842105263158, "eval_ORGANIZATION_number": 65, "eval_ORGANIZATION_precision": 0.632183908045977, "eval_ORGANIZATION_recall": 0.8461538461538461, "eval_PERSON_f1": 0.8996763754045306, "eval_PERSON_number": 150, "eval_PERSON_precision": 0.8742138364779874, "eval_PERSON_recall": 0.9266666666666666, "eval_QUANTITY_f1": 0.7671232876712328, "eval_QUANTITY_number": 33, "eval_QUANTITY_precision": 0.7, "eval_QUANTITY_recall": 0.8484848484848485, "eval_TIME_f1": 0.896551724137931, "eval_TIME_number": 28, "eval_TIME_precision": 0.8666666666666667, "eval_TIME_recall": 0.9285714285714286, "eval_loss": 0.14780230820178986, "eval_overall_accuracy": 0.9614451988360815, "eval_overall_f1": 0.8360215053763441, "eval_overall_precision": 0.783375314861461, "eval_overall_recall": 0.8962536023054755, "eval_runtime": 0.3493, "eval_samples_per_second": 535.387, "eval_steps_per_second": 8.589, "step": 4770 }, { "epoch": 46.0, "grad_norm": 0.6384713053703308, "learning_rate": 2.7000000000000002e-05, "loss": 0.0454, "step": 4876 }, { "epoch": 46.0, "eval_LOCATION_f1": 0.8311688311688312, "eval_LOCATION_number": 71, "eval_LOCATION_precision": 0.7710843373493976, "eval_LOCATION_recall": 0.9014084507042254, "eval_ORGANIZATION_f1": 0.7272727272727273, "eval_ORGANIZATION_number": 65, "eval_ORGANIZATION_precision": 0.6292134831460674, "eval_ORGANIZATION_recall": 0.8615384615384616, "eval_PERSON_f1": 0.9155844155844156, "eval_PERSON_number": 150, "eval_PERSON_precision": 0.8924050632911392, "eval_PERSON_recall": 0.94, "eval_QUANTITY_f1": 0.732394366197183, "eval_QUANTITY_number": 33, "eval_QUANTITY_precision": 0.6842105263157895, "eval_QUANTITY_recall": 0.7878787878787878, "eval_TIME_f1": 0.819672131147541, "eval_TIME_number": 28, "eval_TIME_precision": 0.7575757575757576, "eval_TIME_recall": 0.8928571428571429, "eval_loss": 0.14535315334796906, "eval_overall_accuracy": 0.9626576139670223, "eval_overall_f1": 0.8342245989304813, "eval_overall_precision": 0.7780548628428927, "eval_overall_recall": 0.899135446685879, "eval_runtime": 0.3518, "eval_samples_per_second": 531.582, "eval_steps_per_second": 8.528, "step": 4876 }, { "epoch": 47.0, "grad_norm": 3.3819124698638916, "learning_rate": 2.6500000000000004e-05, "loss": 0.049, "step": 4982 }, { "epoch": 47.0, "eval_LOCATION_f1": 0.7922077922077921, "eval_LOCATION_number": 71, "eval_LOCATION_precision": 0.7349397590361446, "eval_LOCATION_recall": 0.8591549295774648, "eval_ORGANIZATION_f1": 0.7108433734939759, "eval_ORGANIZATION_number": 65, "eval_ORGANIZATION_precision": 0.5841584158415841, "eval_ORGANIZATION_recall": 0.9076923076923077, "eval_PERSON_f1": 0.896774193548387, "eval_PERSON_number": 150, "eval_PERSON_precision": 0.86875, "eval_PERSON_recall": 0.9266666666666666, "eval_QUANTITY_f1": 0.7500000000000001, "eval_QUANTITY_number": 33, "eval_QUANTITY_precision": 0.6923076923076923, "eval_QUANTITY_recall": 0.8181818181818182, "eval_TIME_f1": 0.8666666666666666, "eval_TIME_number": 28, "eval_TIME_precision": 0.8125, "eval_TIME_recall": 0.9285714285714286, "eval_loss": 0.15948139131069183, "eval_overall_accuracy": 0.9551406401551892, "eval_overall_f1": 0.8188976377952757, "eval_overall_precision": 0.7518072289156627, "eval_overall_recall": 0.899135446685879, "eval_runtime": 0.3491, "eval_samples_per_second": 535.655, "eval_steps_per_second": 8.593, "step": 4982 }, { "epoch": 48.0, "grad_norm": 0.692154049873352, "learning_rate": 2.6000000000000002e-05, "loss": 0.0467, "step": 5088 }, { "epoch": 48.0, "eval_LOCATION_f1": 0.8076923076923077, "eval_LOCATION_number": 71, "eval_LOCATION_precision": 0.7411764705882353, "eval_LOCATION_recall": 0.8873239436619719, "eval_ORGANIZATION_f1": 0.7272727272727273, "eval_ORGANIZATION_number": 65, "eval_ORGANIZATION_precision": 0.6292134831460674, "eval_ORGANIZATION_recall": 0.8615384615384616, "eval_PERSON_f1": 0.9090909090909091, "eval_PERSON_number": 150, "eval_PERSON_precision": 0.8860759493670886, "eval_PERSON_recall": 0.9333333333333333, "eval_QUANTITY_f1": 0.7200000000000001, "eval_QUANTITY_number": 33, "eval_QUANTITY_precision": 0.6428571428571429, "eval_QUANTITY_recall": 0.8181818181818182, "eval_TIME_f1": 0.8275862068965518, "eval_TIME_number": 28, "eval_TIME_precision": 0.8, "eval_TIME_recall": 0.8571428571428571, "eval_loss": 0.14814431965351105, "eval_overall_accuracy": 0.9587778855480117, "eval_overall_f1": 0.8255659121171772, "eval_overall_precision": 0.7673267326732673, "eval_overall_recall": 0.8933717579250721, "eval_runtime": 0.35, "eval_samples_per_second": 534.257, "eval_steps_per_second": 8.571, "step": 5088 }, { "epoch": 49.0, "grad_norm": 0.21525277197360992, "learning_rate": 2.5500000000000003e-05, "loss": 0.0458, "step": 5194 }, { "epoch": 49.0, "eval_LOCATION_f1": 0.8104575163398693, "eval_LOCATION_number": 71, "eval_LOCATION_precision": 0.7560975609756098, "eval_LOCATION_recall": 0.8732394366197183, "eval_ORGANIZATION_f1": 0.7450980392156863, "eval_ORGANIZATION_number": 65, "eval_ORGANIZATION_precision": 0.6477272727272727, "eval_ORGANIZATION_recall": 0.8769230769230769, "eval_PERSON_f1": 0.9032258064516129, "eval_PERSON_number": 150, "eval_PERSON_precision": 0.875, "eval_PERSON_recall": 0.9333333333333333, "eval_QUANTITY_f1": 0.7027027027027027, "eval_QUANTITY_number": 33, "eval_QUANTITY_precision": 0.6341463414634146, "eval_QUANTITY_recall": 0.7878787878787878, "eval_TIME_f1": 0.8666666666666666, "eval_TIME_number": 28, "eval_TIME_precision": 0.8125, "eval_TIME_recall": 0.9285714285714286, "eval_loss": 0.15645316243171692, "eval_overall_accuracy": 0.9592628516003879, "eval_overall_f1": 0.8293333333333333, "eval_overall_precision": 0.771712158808933, "eval_overall_recall": 0.8962536023054755, "eval_runtime": 0.3516, "eval_samples_per_second": 531.919, "eval_steps_per_second": 8.533, "step": 5194 }, { "epoch": 50.0, "grad_norm": 0.6371389031410217, "learning_rate": 2.5e-05, "loss": 0.0435, "step": 5300 }, { "epoch": 50.0, "eval_LOCATION_f1": 0.8258064516129031, "eval_LOCATION_number": 71, "eval_LOCATION_precision": 0.7619047619047619, "eval_LOCATION_recall": 0.9014084507042254, "eval_ORGANIZATION_f1": 0.7105263157894737, "eval_ORGANIZATION_number": 65, "eval_ORGANIZATION_precision": 0.6206896551724138, "eval_ORGANIZATION_recall": 0.8307692307692308, "eval_PERSON_f1": 0.896774193548387, "eval_PERSON_number": 150, "eval_PERSON_precision": 0.86875, "eval_PERSON_recall": 0.9266666666666666, "eval_QUANTITY_f1": 0.7297297297297297, "eval_QUANTITY_number": 33, "eval_QUANTITY_precision": 0.6585365853658537, "eval_QUANTITY_recall": 0.8181818181818182, "eval_TIME_f1": 0.8813559322033899, "eval_TIME_number": 28, "eval_TIME_precision": 0.8387096774193549, "eval_TIME_recall": 0.9285714285714286, "eval_loss": 0.1588226705789566, "eval_overall_accuracy": 0.9582929194956353, "eval_overall_f1": 0.8266666666666667, "eval_overall_precision": 0.7692307692307693, "eval_overall_recall": 0.8933717579250721, "eval_runtime": 0.3498, "eval_samples_per_second": 534.657, "eval_steps_per_second": 8.577, "step": 5300 }, { "epoch": 51.0, "grad_norm": 0.3768903613090515, "learning_rate": 2.45e-05, "loss": 0.0461, "step": 5406 }, { "epoch": 51.0, "eval_LOCATION_f1": 0.7974683544303797, "eval_LOCATION_number": 71, "eval_LOCATION_precision": 0.7241379310344828, "eval_LOCATION_recall": 0.8873239436619719, "eval_ORGANIZATION_f1": 0.7044025157232704, "eval_ORGANIZATION_number": 65, "eval_ORGANIZATION_precision": 0.5957446808510638, "eval_ORGANIZATION_recall": 0.8615384615384616, "eval_PERSON_f1": 0.8903225806451613, "eval_PERSON_number": 150, "eval_PERSON_precision": 0.8625, "eval_PERSON_recall": 0.92, "eval_QUANTITY_f1": 0.7200000000000001, "eval_QUANTITY_number": 33, "eval_QUANTITY_precision": 0.6428571428571429, "eval_QUANTITY_recall": 0.8181818181818182, "eval_TIME_f1": 0.8524590163934426, "eval_TIME_number": 28, "eval_TIME_precision": 0.7878787878787878, "eval_TIME_recall": 0.9285714285714286, "eval_loss": 0.16307169198989868, "eval_overall_accuracy": 0.9558680892337537, "eval_overall_f1": 0.8125819134993448, "eval_overall_precision": 0.7451923076923077, "eval_overall_recall": 0.8933717579250721, "eval_runtime": 0.3494, "eval_samples_per_second": 535.279, "eval_steps_per_second": 8.587, "step": 5406 }, { "epoch": 52.0, "grad_norm": 0.7790448665618896, "learning_rate": 2.4e-05, "loss": 0.0424, "step": 5512 }, { "epoch": 52.0, "eval_LOCATION_f1": 0.8051948051948051, "eval_LOCATION_number": 71, "eval_LOCATION_precision": 0.7469879518072289, "eval_LOCATION_recall": 0.8732394366197183, "eval_ORGANIZATION_f1": 0.7215189873417722, "eval_ORGANIZATION_number": 65, "eval_ORGANIZATION_precision": 0.6129032258064516, "eval_ORGANIZATION_recall": 0.8769230769230769, "eval_PERSON_f1": 0.9155844155844156, "eval_PERSON_number": 150, "eval_PERSON_precision": 0.8924050632911392, "eval_PERSON_recall": 0.94, "eval_QUANTITY_f1": 0.7200000000000001, "eval_QUANTITY_number": 33, "eval_QUANTITY_precision": 0.6428571428571429, "eval_QUANTITY_recall": 0.8181818181818182, "eval_TIME_f1": 0.8813559322033899, "eval_TIME_number": 28, "eval_TIME_precision": 0.8387096774193549, "eval_TIME_recall": 0.9285714285714286, "eval_loss": 0.17204023897647858, "eval_overall_accuracy": 0.9565955383123181, "eval_overall_f1": 0.8302387267904509, "eval_overall_precision": 0.769041769041769, "eval_overall_recall": 0.9020172910662824, "eval_runtime": 0.3508, "eval_samples_per_second": 533.066, "eval_steps_per_second": 8.552, "step": 5512 }, { "epoch": 53.0, "grad_norm": 0.5764625072479248, "learning_rate": 2.35e-05, "loss": 0.0436, "step": 5618 }, { "epoch": 53.0, "eval_LOCATION_f1": 0.8025477707006369, "eval_LOCATION_number": 71, "eval_LOCATION_precision": 0.7325581395348837, "eval_LOCATION_recall": 0.8873239436619719, "eval_ORGANIZATION_f1": 0.7142857142857142, "eval_ORGANIZATION_number": 65, "eval_ORGANIZATION_precision": 0.5825242718446602, "eval_ORGANIZATION_recall": 0.9230769230769231, "eval_PERSON_f1": 0.9102564102564102, "eval_PERSON_number": 150, "eval_PERSON_precision": 0.8765432098765432, "eval_PERSON_recall": 0.9466666666666667, "eval_QUANTITY_f1": 0.7012987012987013, "eval_QUANTITY_number": 33, "eval_QUANTITY_precision": 0.6136363636363636, "eval_QUANTITY_recall": 0.8181818181818182, "eval_TIME_f1": 0.8387096774193549, "eval_TIME_number": 28, "eval_TIME_precision": 0.7647058823529411, "eval_TIME_recall": 0.9285714285714286, "eval_loss": 0.1814979910850525, "eval_overall_accuracy": 0.9529582929194956, "eval_overall_f1": 0.8195876288659794, "eval_overall_precision": 0.7412587412587412, "eval_overall_recall": 0.9164265129682997, "eval_runtime": 0.3501, "eval_samples_per_second": 534.111, "eval_steps_per_second": 8.569, "step": 5618 }, { "epoch": 54.0, "grad_norm": 0.7614324688911438, "learning_rate": 2.3000000000000003e-05, "loss": 0.0414, "step": 5724 }, { "epoch": 54.0, "eval_LOCATION_f1": 0.823529411764706, "eval_LOCATION_number": 71, "eval_LOCATION_precision": 0.7682926829268293, "eval_LOCATION_recall": 0.8873239436619719, "eval_ORGANIZATION_f1": 0.7354838709677419, "eval_ORGANIZATION_number": 65, "eval_ORGANIZATION_precision": 0.6333333333333333, "eval_ORGANIZATION_recall": 0.8769230769230769, "eval_PERSON_f1": 0.8903225806451613, "eval_PERSON_number": 150, "eval_PERSON_precision": 0.8625, "eval_PERSON_recall": 0.92, "eval_QUANTITY_f1": 0.7500000000000001, "eval_QUANTITY_number": 33, "eval_QUANTITY_precision": 0.6923076923076923, "eval_QUANTITY_recall": 0.8181818181818182, "eval_TIME_f1": 0.896551724137931, "eval_TIME_number": 28, "eval_TIME_precision": 0.8666666666666667, "eval_TIME_recall": 0.9285714285714286, "eval_loss": 0.1521797627210617, "eval_overall_accuracy": 0.9602327837051406, "eval_overall_f1": 0.8315508021390374, "eval_overall_precision": 0.7755610972568578, "eval_overall_recall": 0.8962536023054755, "eval_runtime": 0.3503, "eval_samples_per_second": 533.843, "eval_steps_per_second": 8.564, "step": 5724 }, { "epoch": 55.0, "grad_norm": 0.6456512212753296, "learning_rate": 2.25e-05, "loss": 0.0413, "step": 5830 }, { "epoch": 55.0, "eval_LOCATION_f1": 0.8211920529801324, "eval_LOCATION_number": 71, "eval_LOCATION_precision": 0.775, "eval_LOCATION_recall": 0.8732394366197183, "eval_ORGANIZATION_f1": 0.7450980392156863, "eval_ORGANIZATION_number": 65, "eval_ORGANIZATION_precision": 0.6477272727272727, "eval_ORGANIZATION_recall": 0.8769230769230769, "eval_PERSON_f1": 0.9019607843137256, "eval_PERSON_number": 150, "eval_PERSON_precision": 0.8846153846153846, "eval_PERSON_recall": 0.92, "eval_QUANTITY_f1": 0.7297297297297297, "eval_QUANTITY_number": 33, "eval_QUANTITY_precision": 0.6585365853658537, "eval_QUANTITY_recall": 0.8181818181818182, "eval_TIME_f1": 0.8771929824561403, "eval_TIME_number": 28, "eval_TIME_precision": 0.8620689655172413, "eval_TIME_recall": 0.8928571428571429, "eval_loss": 0.15478459000587463, "eval_overall_accuracy": 0.9585354025218235, "eval_overall_f1": 0.834008097165992, "eval_overall_precision": 0.7842639593908629, "eval_overall_recall": 0.8904899135446686, "eval_runtime": 0.3506, "eval_samples_per_second": 533.435, "eval_steps_per_second": 8.558, "step": 5830 }, { "epoch": 56.0, "grad_norm": 1.6711740493774414, "learning_rate": 2.2000000000000003e-05, "loss": 0.04, "step": 5936 }, { "epoch": 56.0, "eval_LOCATION_f1": 0.8496732026143791, "eval_LOCATION_number": 71, "eval_LOCATION_precision": 0.7926829268292683, "eval_LOCATION_recall": 0.9154929577464789, "eval_ORGANIZATION_f1": 0.728476821192053, "eval_ORGANIZATION_number": 65, "eval_ORGANIZATION_precision": 0.6395348837209303, "eval_ORGANIZATION_recall": 0.8461538461538461, "eval_PERSON_f1": 0.896774193548387, "eval_PERSON_number": 150, "eval_PERSON_precision": 0.86875, "eval_PERSON_recall": 0.9266666666666666, "eval_QUANTITY_f1": 0.7397260273972603, "eval_QUANTITY_number": 33, "eval_QUANTITY_precision": 0.675, "eval_QUANTITY_recall": 0.8181818181818182, "eval_TIME_f1": 0.8474576271186439, "eval_TIME_number": 28, "eval_TIME_precision": 0.8064516129032258, "eval_TIME_recall": 0.8928571428571429, "eval_loss": 0.1626283824443817, "eval_overall_accuracy": 0.9592628516003879, "eval_overall_f1": 0.8337801608579088, "eval_overall_precision": 0.7794486215538847, "eval_overall_recall": 0.8962536023054755, "eval_runtime": 0.35, "eval_samples_per_second": 534.232, "eval_steps_per_second": 8.571, "step": 5936 }, { "epoch": 57.0, "grad_norm": 0.47535088658332825, "learning_rate": 2.15e-05, "loss": 0.0416, "step": 6042 }, { "epoch": 57.0, "eval_LOCATION_f1": 0.823529411764706, "eval_LOCATION_number": 71, "eval_LOCATION_precision": 0.7682926829268293, "eval_LOCATION_recall": 0.8873239436619719, "eval_ORGANIZATION_f1": 0.7432432432432433, "eval_ORGANIZATION_number": 65, "eval_ORGANIZATION_precision": 0.6626506024096386, "eval_ORGANIZATION_recall": 0.8461538461538461, "eval_PERSON_f1": 0.8938906752411575, "eval_PERSON_number": 150, "eval_PERSON_precision": 0.8633540372670807, "eval_PERSON_recall": 0.9266666666666666, "eval_QUANTITY_f1": 0.6923076923076923, "eval_QUANTITY_number": 33, "eval_QUANTITY_precision": 0.6, "eval_QUANTITY_recall": 0.8181818181818182, "eval_TIME_f1": 0.912280701754386, "eval_TIME_number": 28, "eval_TIME_precision": 0.896551724137931, "eval_TIME_recall": 0.9285714285714286, "eval_loss": 0.16426201164722443, "eval_overall_accuracy": 0.9580504364694471, "eval_overall_f1": 0.8299866131191432, "eval_overall_precision": 0.775, "eval_overall_recall": 0.8933717579250721, "eval_runtime": 0.3497, "eval_samples_per_second": 534.703, "eval_steps_per_second": 8.578, "step": 6042 }, { "epoch": 58.0, "grad_norm": 0.42809298634529114, "learning_rate": 2.1e-05, "loss": 0.0409, "step": 6148 }, { "epoch": 58.0, "eval_LOCATION_f1": 0.8421052631578947, "eval_LOCATION_number": 71, "eval_LOCATION_precision": 0.7901234567901234, "eval_LOCATION_recall": 0.9014084507042254, "eval_ORGANIZATION_f1": 0.7272727272727273, "eval_ORGANIZATION_number": 65, "eval_ORGANIZATION_precision": 0.6292134831460674, "eval_ORGANIZATION_recall": 0.8615384615384616, "eval_PERSON_f1": 0.8917197452229298, "eval_PERSON_number": 150, "eval_PERSON_precision": 0.8536585365853658, "eval_PERSON_recall": 0.9333333333333333, "eval_QUANTITY_f1": 0.6835443037974683, "eval_QUANTITY_number": 33, "eval_QUANTITY_precision": 0.5869565217391305, "eval_QUANTITY_recall": 0.8181818181818182, "eval_TIME_f1": 0.896551724137931, "eval_TIME_number": 28, "eval_TIME_precision": 0.8666666666666667, "eval_TIME_recall": 0.9285714285714286, "eval_loss": 0.15997961163520813, "eval_overall_accuracy": 0.9580504364694471, "eval_overall_f1": 0.8269484808454426, "eval_overall_precision": 0.7634146341463415, "eval_overall_recall": 0.9020172910662824, "eval_runtime": 0.3495, "eval_samples_per_second": 535.11, "eval_steps_per_second": 8.585, "step": 6148 }, { "epoch": 59.0, "grad_norm": 1.3752318620681763, "learning_rate": 2.05e-05, "loss": 0.0392, "step": 6254 }, { "epoch": 59.0, "eval_LOCATION_f1": 0.8, "eval_LOCATION_number": 71, "eval_LOCATION_precision": 0.7380952380952381, "eval_LOCATION_recall": 0.8732394366197183, "eval_ORGANIZATION_f1": 0.7297297297297298, "eval_ORGANIZATION_number": 65, "eval_ORGANIZATION_precision": 0.6506024096385542, "eval_ORGANIZATION_recall": 0.8307692307692308, "eval_PERSON_f1": 0.8831168831168831, "eval_PERSON_number": 150, "eval_PERSON_precision": 0.8607594936708861, "eval_PERSON_recall": 0.9066666666666666, "eval_QUANTITY_f1": 0.7397260273972603, "eval_QUANTITY_number": 33, "eval_QUANTITY_precision": 0.675, "eval_QUANTITY_recall": 0.8181818181818182, "eval_TIME_f1": 0.912280701754386, "eval_TIME_number": 28, "eval_TIME_precision": 0.896551724137931, "eval_TIME_recall": 0.9285714285714286, "eval_loss": 0.1547561138868332, "eval_overall_accuracy": 0.9599903006789525, "eval_overall_f1": 0.8232118758434548, "eval_overall_precision": 0.7741116751269036, "eval_overall_recall": 0.8789625360230547, "eval_runtime": 0.3499, "eval_samples_per_second": 534.45, "eval_steps_per_second": 8.574, "step": 6254 }, { "epoch": 60.0, "grad_norm": 0.807634711265564, "learning_rate": 2e-05, "loss": 0.0374, "step": 6360 }, { "epoch": 60.0, "eval_LOCATION_f1": 0.8476821192052981, "eval_LOCATION_number": 71, "eval_LOCATION_precision": 0.8, "eval_LOCATION_recall": 0.9014084507042254, "eval_ORGANIZATION_f1": 0.7417218543046358, "eval_ORGANIZATION_number": 65, "eval_ORGANIZATION_precision": 0.6511627906976745, "eval_ORGANIZATION_recall": 0.8615384615384616, "eval_PERSON_f1": 0.8932038834951457, "eval_PERSON_number": 150, "eval_PERSON_precision": 0.8679245283018868, "eval_PERSON_recall": 0.92, "eval_QUANTITY_f1": 0.7567567567567567, "eval_QUANTITY_number": 33, "eval_QUANTITY_precision": 0.6829268292682927, "eval_QUANTITY_recall": 0.8484848484848485, "eval_TIME_f1": 0.8928571428571429, "eval_TIME_number": 28, "eval_TIME_precision": 0.8928571428571429, "eval_TIME_recall": 0.8928571428571429, "eval_loss": 0.15809109807014465, "eval_overall_accuracy": 0.9609602327837051, "eval_overall_f1": 0.8394062078272604, "eval_overall_precision": 0.7893401015228426, "eval_overall_recall": 0.8962536023054755, "eval_runtime": 0.3505, "eval_samples_per_second": 533.596, "eval_steps_per_second": 8.56, "step": 6360 }, { "epoch": 61.0, "grad_norm": 0.2931790351867676, "learning_rate": 1.9500000000000003e-05, "loss": 0.0365, "step": 6466 }, { "epoch": 61.0, "eval_LOCATION_f1": 0.8421052631578947, "eval_LOCATION_number": 71, "eval_LOCATION_precision": 0.7901234567901234, "eval_LOCATION_recall": 0.9014084507042254, "eval_ORGANIZATION_f1": 0.7515923566878981, "eval_ORGANIZATION_number": 65, "eval_ORGANIZATION_precision": 0.6413043478260869, "eval_ORGANIZATION_recall": 0.9076923076923077, "eval_PERSON_f1": 0.896774193548387, "eval_PERSON_number": 150, "eval_PERSON_precision": 0.86875, "eval_PERSON_recall": 0.9266666666666666, "eval_QUANTITY_f1": 0.7397260273972603, "eval_QUANTITY_number": 33, "eval_QUANTITY_precision": 0.675, "eval_QUANTITY_recall": 0.8181818181818182, "eval_TIME_f1": 0.912280701754386, "eval_TIME_number": 28, "eval_TIME_precision": 0.896551724137931, "eval_TIME_recall": 0.9285714285714286, "eval_loss": 0.16991622745990753, "eval_overall_accuracy": 0.9612027158098934, "eval_overall_f1": 0.8411214953271029, "eval_overall_precision": 0.7835820895522388, "eval_overall_recall": 0.9077809798270894, "eval_runtime": 0.3512, "eval_samples_per_second": 532.476, "eval_steps_per_second": 8.542, "step": 6466 }, { "epoch": 62.0, "grad_norm": 0.6080542802810669, "learning_rate": 1.9e-05, "loss": 0.0367, "step": 6572 }, { "epoch": 62.0, "eval_LOCATION_f1": 0.8441558441558441, "eval_LOCATION_number": 71, "eval_LOCATION_precision": 0.7831325301204819, "eval_LOCATION_recall": 0.9154929577464789, "eval_ORGANIZATION_f1": 0.738255033557047, "eval_ORGANIZATION_number": 65, "eval_ORGANIZATION_precision": 0.6547619047619048, "eval_ORGANIZATION_recall": 0.8461538461538461, "eval_PERSON_f1": 0.8859934853420196, "eval_PERSON_number": 150, "eval_PERSON_precision": 0.8662420382165605, "eval_PERSON_recall": 0.9066666666666666, "eval_QUANTITY_f1": 0.7297297297297297, "eval_QUANTITY_number": 33, "eval_QUANTITY_precision": 0.6585365853658537, "eval_QUANTITY_recall": 0.8181818181818182, "eval_TIME_f1": 0.8813559322033899, "eval_TIME_number": 28, "eval_TIME_precision": 0.8387096774193549, "eval_TIME_recall": 0.9285714285714286, "eval_loss": 0.1723637729883194, "eval_overall_accuracy": 0.9580504364694471, "eval_overall_f1": 0.8317631224764469, "eval_overall_precision": 0.7803030303030303, "eval_overall_recall": 0.8904899135446686, "eval_runtime": 0.3492, "eval_samples_per_second": 535.569, "eval_steps_per_second": 8.592, "step": 6572 }, { "epoch": 63.0, "grad_norm": 0.6744797825813293, "learning_rate": 1.85e-05, "loss": 0.0365, "step": 6678 }, { "epoch": 63.0, "eval_LOCATION_f1": 0.8289473684210527, "eval_LOCATION_number": 71, "eval_LOCATION_precision": 0.7777777777777778, "eval_LOCATION_recall": 0.8873239436619719, "eval_ORGANIZATION_f1": 0.7169811320754718, "eval_ORGANIZATION_number": 65, "eval_ORGANIZATION_precision": 0.6063829787234043, "eval_ORGANIZATION_recall": 0.8769230769230769, "eval_PERSON_f1": 0.8802588996763754, "eval_PERSON_number": 150, "eval_PERSON_precision": 0.8553459119496856, "eval_PERSON_recall": 0.9066666666666666, "eval_QUANTITY_f1": 0.7671232876712328, "eval_QUANTITY_number": 33, "eval_QUANTITY_precision": 0.7, "eval_QUANTITY_recall": 0.8484848484848485, "eval_TIME_f1": 0.8813559322033899, "eval_TIME_number": 28, "eval_TIME_precision": 0.8387096774193549, "eval_TIME_recall": 0.9285714285714286, "eval_loss": 0.16163378953933716, "eval_overall_accuracy": 0.9585354025218235, "eval_overall_f1": 0.8244680851063829, "eval_overall_precision": 0.7654320987654321, "eval_overall_recall": 0.8933717579250721, "eval_runtime": 0.3516, "eval_samples_per_second": 531.858, "eval_steps_per_second": 8.532, "step": 6678 }, { "epoch": 64.0, "grad_norm": 0.468826025724411, "learning_rate": 1.8e-05, "loss": 0.0355, "step": 6784 }, { "epoch": 64.0, "eval_LOCATION_f1": 0.8129032258064516, "eval_LOCATION_number": 71, "eval_LOCATION_precision": 0.75, "eval_LOCATION_recall": 0.8873239436619719, "eval_ORGANIZATION_f1": 0.7534246575342466, "eval_ORGANIZATION_number": 65, "eval_ORGANIZATION_precision": 0.6790123456790124, "eval_ORGANIZATION_recall": 0.8461538461538461, "eval_PERSON_f1": 0.8817891373801918, "eval_PERSON_number": 150, "eval_PERSON_precision": 0.8466257668711656, "eval_PERSON_recall": 0.92, "eval_QUANTITY_f1": 0.7012987012987013, "eval_QUANTITY_number": 33, "eval_QUANTITY_precision": 0.6136363636363636, "eval_QUANTITY_recall": 0.8181818181818182, "eval_TIME_f1": 0.8813559322033899, "eval_TIME_number": 28, "eval_TIME_precision": 0.8387096774193549, "eval_TIME_recall": 0.9285714285714286, "eval_loss": 0.17165683209896088, "eval_overall_accuracy": 0.9582929194956353, "eval_overall_f1": 0.824, "eval_overall_precision": 0.7667493796526055, "eval_overall_recall": 0.8904899135446686, "eval_runtime": 0.3518, "eval_samples_per_second": 531.527, "eval_steps_per_second": 8.527, "step": 6784 }, { "epoch": 65.0, "grad_norm": 1.1759960651397705, "learning_rate": 1.75e-05, "loss": 0.0372, "step": 6890 }, { "epoch": 65.0, "eval_LOCATION_f1": 0.8258064516129031, "eval_LOCATION_number": 71, "eval_LOCATION_precision": 0.7619047619047619, "eval_LOCATION_recall": 0.9014084507042254, "eval_ORGANIZATION_f1": 0.7320261437908497, "eval_ORGANIZATION_number": 65, "eval_ORGANIZATION_precision": 0.6363636363636364, "eval_ORGANIZATION_recall": 0.8615384615384616, "eval_PERSON_f1": 0.8938906752411575, "eval_PERSON_number": 150, "eval_PERSON_precision": 0.8633540372670807, "eval_PERSON_recall": 0.9266666666666666, "eval_QUANTITY_f1": 0.7500000000000001, "eval_QUANTITY_number": 33, "eval_QUANTITY_precision": 0.6923076923076923, "eval_QUANTITY_recall": 0.8181818181818182, "eval_TIME_f1": 0.8666666666666666, "eval_TIME_number": 28, "eval_TIME_precision": 0.8125, "eval_TIME_recall": 0.9285714285714286, "eval_loss": 0.16856727004051208, "eval_overall_accuracy": 0.9590203685741998, "eval_overall_f1": 0.8308921438082557, "eval_overall_precision": 0.7722772277227723, "eval_overall_recall": 0.899135446685879, "eval_runtime": 0.3518, "eval_samples_per_second": 531.563, "eval_steps_per_second": 8.528, "step": 6890 }, { "epoch": 66.0, "grad_norm": 0.6541854739189148, "learning_rate": 1.7000000000000003e-05, "loss": 0.0362, "step": 6996 }, { "epoch": 66.0, "eval_LOCATION_f1": 0.8104575163398693, "eval_LOCATION_number": 71, "eval_LOCATION_precision": 0.7560975609756098, "eval_LOCATION_recall": 0.8732394366197183, "eval_ORGANIZATION_f1": 0.728395061728395, "eval_ORGANIZATION_number": 65, "eval_ORGANIZATION_precision": 0.6082474226804123, "eval_ORGANIZATION_recall": 0.9076923076923077, "eval_PERSON_f1": 0.8945686900958466, "eval_PERSON_number": 150, "eval_PERSON_precision": 0.8588957055214724, "eval_PERSON_recall": 0.9333333333333333, "eval_QUANTITY_f1": 0.7200000000000001, "eval_QUANTITY_number": 33, "eval_QUANTITY_precision": 0.6428571428571429, "eval_QUANTITY_recall": 0.8181818181818182, "eval_TIME_f1": 0.8813559322033899, "eval_TIME_number": 28, "eval_TIME_precision": 0.8387096774193549, "eval_TIME_recall": 0.9285714285714286, "eval_loss": 0.18290750682353973, "eval_overall_accuracy": 0.9561105722599418, "eval_overall_f1": 0.8241469816272966, "eval_overall_precision": 0.7566265060240964, "eval_overall_recall": 0.9048991354466859, "eval_runtime": 0.3503, "eval_samples_per_second": 533.882, "eval_steps_per_second": 8.565, "step": 6996 }, { "epoch": 67.0, "grad_norm": 0.5697064995765686, "learning_rate": 1.65e-05, "loss": 0.0333, "step": 7102 }, { "epoch": 67.0, "eval_LOCATION_f1": 0.823529411764706, "eval_LOCATION_number": 71, "eval_LOCATION_precision": 0.7682926829268293, "eval_LOCATION_recall": 0.8873239436619719, "eval_ORGANIZATION_f1": 0.7388535031847134, "eval_ORGANIZATION_number": 65, "eval_ORGANIZATION_precision": 0.6304347826086957, "eval_ORGANIZATION_recall": 0.8923076923076924, "eval_PERSON_f1": 0.8996763754045306, "eval_PERSON_number": 150, "eval_PERSON_precision": 0.8742138364779874, "eval_PERSON_recall": 0.9266666666666666, "eval_QUANTITY_f1": 0.7500000000000001, "eval_QUANTITY_number": 33, "eval_QUANTITY_precision": 0.6923076923076923, "eval_QUANTITY_recall": 0.8181818181818182, "eval_TIME_f1": 0.8474576271186439, "eval_TIME_number": 28, "eval_TIME_precision": 0.8064516129032258, "eval_TIME_recall": 0.8928571428571429, "eval_loss": 0.17202883958816528, "eval_overall_accuracy": 0.9592628516003879, "eval_overall_f1": 0.8320000000000001, "eval_overall_precision": 0.7741935483870968, "eval_overall_recall": 0.899135446685879, "eval_runtime": 0.3506, "eval_samples_per_second": 533.421, "eval_steps_per_second": 8.558, "step": 7102 }, { "epoch": 68.0, "grad_norm": 0.7047253251075745, "learning_rate": 1.6000000000000003e-05, "loss": 0.033, "step": 7208 }, { "epoch": 68.0, "eval_LOCATION_f1": 0.8258064516129031, "eval_LOCATION_number": 71, "eval_LOCATION_precision": 0.7619047619047619, "eval_LOCATION_recall": 0.9014084507042254, "eval_ORGANIZATION_f1": 0.7307692307692307, "eval_ORGANIZATION_number": 65, "eval_ORGANIZATION_precision": 0.6263736263736264, "eval_ORGANIZATION_recall": 0.8769230769230769, "eval_PERSON_f1": 0.8910256410256411, "eval_PERSON_number": 150, "eval_PERSON_precision": 0.8580246913580247, "eval_PERSON_recall": 0.9266666666666666, "eval_QUANTITY_f1": 0.7397260273972603, "eval_QUANTITY_number": 33, "eval_QUANTITY_precision": 0.675, "eval_QUANTITY_recall": 0.8181818181818182, "eval_TIME_f1": 0.912280701754386, "eval_TIME_number": 28, "eval_TIME_precision": 0.896551724137931, "eval_TIME_recall": 0.9285714285714286, "eval_loss": 0.16683901846408844, "eval_overall_accuracy": 0.9585354025218235, "eval_overall_f1": 0.8313413014608233, "eval_overall_precision": 0.770935960591133, "eval_overall_recall": 0.9020172910662824, "eval_runtime": 0.3497, "eval_samples_per_second": 534.689, "eval_steps_per_second": 8.578, "step": 7208 }, { "epoch": 69.0, "grad_norm": 0.8004153370857239, "learning_rate": 1.55e-05, "loss": 0.0333, "step": 7314 }, { "epoch": 69.0, "eval_LOCATION_f1": 0.8441558441558441, "eval_LOCATION_number": 71, "eval_LOCATION_precision": 0.7831325301204819, "eval_LOCATION_recall": 0.9154929577464789, "eval_ORGANIZATION_f1": 0.7261146496815286, "eval_ORGANIZATION_number": 65, "eval_ORGANIZATION_precision": 0.6195652173913043, "eval_ORGANIZATION_recall": 0.8769230769230769, "eval_PERSON_f1": 0.896774193548387, "eval_PERSON_number": 150, "eval_PERSON_precision": 0.86875, "eval_PERSON_recall": 0.9266666666666666, "eval_QUANTITY_f1": 0.7500000000000001, "eval_QUANTITY_number": 33, "eval_QUANTITY_precision": 0.6923076923076923, "eval_QUANTITY_recall": 0.8181818181818182, "eval_TIME_f1": 0.8813559322033899, "eval_TIME_number": 28, "eval_TIME_precision": 0.8387096774193549, "eval_TIME_recall": 0.9285714285714286, "eval_loss": 0.1638197898864746, "eval_overall_accuracy": 0.9604752667313288, "eval_overall_f1": 0.8351063829787235, "eval_overall_precision": 0.7753086419753087, "eval_overall_recall": 0.9048991354466859, "eval_runtime": 0.3527, "eval_samples_per_second": 530.148, "eval_steps_per_second": 8.505, "step": 7314 }, { "epoch": 70.0, "grad_norm": 0.29508113861083984, "learning_rate": 1.5e-05, "loss": 0.0335, "step": 7420 }, { "epoch": 70.0, "eval_LOCATION_f1": 0.8496732026143791, "eval_LOCATION_number": 71, "eval_LOCATION_precision": 0.7926829268292683, "eval_LOCATION_recall": 0.9154929577464789, "eval_ORGANIZATION_f1": 0.75, "eval_ORGANIZATION_number": 65, "eval_ORGANIZATION_precision": 0.6551724137931034, "eval_ORGANIZATION_recall": 0.8769230769230769, "eval_PERSON_f1": 0.896774193548387, "eval_PERSON_number": 150, "eval_PERSON_precision": 0.86875, "eval_PERSON_recall": 0.9266666666666666, "eval_QUANTITY_f1": 0.7397260273972603, "eval_QUANTITY_number": 33, "eval_QUANTITY_precision": 0.675, "eval_QUANTITY_recall": 0.8181818181818182, "eval_TIME_f1": 0.8474576271186439, "eval_TIME_number": 28, "eval_TIME_precision": 0.8064516129032258, "eval_TIME_recall": 0.8928571428571429, "eval_loss": 0.17051611840724945, "eval_overall_accuracy": 0.9592628516003879, "eval_overall_f1": 0.8380187416331996, "eval_overall_precision": 0.7825, "eval_overall_recall": 0.9020172910662824, "eval_runtime": 0.3495, "eval_samples_per_second": 535.056, "eval_steps_per_second": 8.584, "step": 7420 }, { "epoch": 71.0, "grad_norm": 1.538805365562439, "learning_rate": 1.45e-05, "loss": 0.0353, "step": 7526 }, { "epoch": 71.0, "eval_LOCATION_f1": 0.8129032258064516, "eval_LOCATION_number": 71, "eval_LOCATION_precision": 0.75, "eval_LOCATION_recall": 0.8873239436619719, "eval_ORGANIZATION_f1": 0.7080745341614907, "eval_ORGANIZATION_number": 65, "eval_ORGANIZATION_precision": 0.59375, "eval_ORGANIZATION_recall": 0.8769230769230769, "eval_PERSON_f1": 0.8917197452229298, "eval_PERSON_number": 150, "eval_PERSON_precision": 0.8536585365853658, "eval_PERSON_recall": 0.9333333333333333, "eval_QUANTITY_f1": 0.7105263157894738, "eval_QUANTITY_number": 33, "eval_QUANTITY_precision": 0.627906976744186, "eval_QUANTITY_recall": 0.8181818181818182, "eval_TIME_f1": 0.8333333333333334, "eval_TIME_number": 28, "eval_TIME_precision": 0.78125, "eval_TIME_recall": 0.8928571428571429, "eval_loss": 0.19078566133975983, "eval_overall_accuracy": 0.9544131910766246, "eval_overall_f1": 0.814621409921671, "eval_overall_precision": 0.7446300715990454, "eval_overall_recall": 0.899135446685879, "eval_runtime": 0.3503, "eval_samples_per_second": 533.879, "eval_steps_per_second": 8.565, "step": 7526 }, { "epoch": 72.0, "grad_norm": 0.9210314750671387, "learning_rate": 1.4000000000000001e-05, "loss": 0.0324, "step": 7632 }, { "epoch": 72.0, "eval_LOCATION_f1": 0.8129032258064516, "eval_LOCATION_number": 71, "eval_LOCATION_precision": 0.75, "eval_LOCATION_recall": 0.8873239436619719, "eval_ORGANIZATION_f1": 0.7236842105263158, "eval_ORGANIZATION_number": 65, "eval_ORGANIZATION_precision": 0.632183908045977, "eval_ORGANIZATION_recall": 0.8461538461538461, "eval_PERSON_f1": 0.8903225806451613, "eval_PERSON_number": 150, "eval_PERSON_precision": 0.8625, "eval_PERSON_recall": 0.92, "eval_QUANTITY_f1": 0.7945205479452054, "eval_QUANTITY_number": 33, "eval_QUANTITY_precision": 0.725, "eval_QUANTITY_recall": 0.8787878787878788, "eval_TIME_f1": 0.8474576271186439, "eval_TIME_number": 28, "eval_TIME_precision": 0.8064516129032258, "eval_TIME_recall": 0.8928571428571429, "eval_loss": 0.1728380173444748, "eval_overall_accuracy": 0.9602327837051406, "eval_overall_f1": 0.8277703604806409, "eval_overall_precision": 0.7711442786069652, "eval_overall_recall": 0.8933717579250721, "eval_runtime": 0.3513, "eval_samples_per_second": 532.244, "eval_steps_per_second": 8.539, "step": 7632 }, { "epoch": 73.0, "grad_norm": 0.4661843776702881, "learning_rate": 1.3500000000000001e-05, "loss": 0.0323, "step": 7738 }, { "epoch": 73.0, "eval_LOCATION_f1": 0.8157894736842104, "eval_LOCATION_number": 71, "eval_LOCATION_precision": 0.7654320987654321, "eval_LOCATION_recall": 0.8732394366197183, "eval_ORGANIZATION_f1": 0.7388535031847134, "eval_ORGANIZATION_number": 65, "eval_ORGANIZATION_precision": 0.6304347826086957, "eval_ORGANIZATION_recall": 0.8923076923076924, "eval_PERSON_f1": 0.8903225806451613, "eval_PERSON_number": 150, "eval_PERSON_precision": 0.8625, "eval_PERSON_recall": 0.92, "eval_QUANTITY_f1": 0.7105263157894738, "eval_QUANTITY_number": 33, "eval_QUANTITY_precision": 0.627906976744186, "eval_QUANTITY_recall": 0.8181818181818182, "eval_TIME_f1": 0.896551724137931, "eval_TIME_number": 28, "eval_TIME_precision": 0.8666666666666667, "eval_TIME_recall": 0.9285714285714286, "eval_loss": 0.17989809811115265, "eval_overall_accuracy": 0.9573229873908826, "eval_overall_f1": 0.8260292164674636, "eval_overall_precision": 0.7660098522167488, "eval_overall_recall": 0.8962536023054755, "eval_runtime": 0.3497, "eval_samples_per_second": 534.723, "eval_steps_per_second": 8.578, "step": 7738 }, { "epoch": 74.0, "grad_norm": 1.6226832866668701, "learning_rate": 1.3000000000000001e-05, "loss": 0.0321, "step": 7844 }, { "epoch": 74.0, "eval_LOCATION_f1": 0.8344370860927152, "eval_LOCATION_number": 71, "eval_LOCATION_precision": 0.7875, "eval_LOCATION_recall": 0.8873239436619719, "eval_ORGANIZATION_f1": 0.7320261437908497, "eval_ORGANIZATION_number": 65, "eval_ORGANIZATION_precision": 0.6363636363636364, "eval_ORGANIZATION_recall": 0.8615384615384616, "eval_PERSON_f1": 0.896774193548387, "eval_PERSON_number": 150, "eval_PERSON_precision": 0.86875, "eval_PERSON_recall": 0.9266666666666666, "eval_QUANTITY_f1": 0.7012987012987013, "eval_QUANTITY_number": 33, "eval_QUANTITY_precision": 0.6136363636363636, "eval_QUANTITY_recall": 0.8181818181818182, "eval_TIME_f1": 0.8620689655172413, "eval_TIME_number": 28, "eval_TIME_precision": 0.8333333333333334, "eval_TIME_recall": 0.8928571428571429, "eval_loss": 0.1787552833557129, "eval_overall_accuracy": 0.9585354025218235, "eval_overall_f1": 0.8277703604806409, "eval_overall_precision": 0.7711442786069652, "eval_overall_recall": 0.8933717579250721, "eval_runtime": 0.3512, "eval_samples_per_second": 532.488, "eval_steps_per_second": 8.543, "step": 7844 }, { "epoch": 75.0, "grad_norm": 0.3848640024662018, "learning_rate": 1.25e-05, "loss": 0.0296, "step": 7950 }, { "epoch": 75.0, "eval_LOCATION_f1": 0.8076923076923077, "eval_LOCATION_number": 71, "eval_LOCATION_precision": 0.7411764705882353, "eval_LOCATION_recall": 0.8873239436619719, "eval_ORGANIZATION_f1": 0.7320261437908497, "eval_ORGANIZATION_number": 65, "eval_ORGANIZATION_precision": 0.6363636363636364, "eval_ORGANIZATION_recall": 0.8615384615384616, "eval_PERSON_f1": 0.8903225806451613, "eval_PERSON_number": 150, "eval_PERSON_precision": 0.8625, "eval_PERSON_recall": 0.92, "eval_QUANTITY_f1": 0.7837837837837839, "eval_QUANTITY_number": 33, "eval_QUANTITY_precision": 0.7073170731707317, "eval_QUANTITY_recall": 0.8787878787878788, "eval_TIME_f1": 0.8474576271186439, "eval_TIME_number": 28, "eval_TIME_precision": 0.8064516129032258, "eval_TIME_recall": 0.8928571428571429, "eval_loss": 0.18127557635307312, "eval_overall_accuracy": 0.9582929194956353, "eval_overall_f1": 0.827127659574468, "eval_overall_precision": 0.7679012345679013, "eval_overall_recall": 0.8962536023054755, "eval_runtime": 0.3512, "eval_samples_per_second": 532.43, "eval_steps_per_second": 8.542, "step": 7950 }, { "epoch": 76.0, "grad_norm": 0.07505329698324203, "learning_rate": 1.2e-05, "loss": 0.0308, "step": 8056 }, { "epoch": 76.0, "eval_LOCATION_f1": 0.8344370860927152, "eval_LOCATION_number": 71, "eval_LOCATION_precision": 0.7875, "eval_LOCATION_recall": 0.8873239436619719, "eval_ORGANIZATION_f1": 0.7169811320754718, "eval_ORGANIZATION_number": 65, "eval_ORGANIZATION_precision": 0.6063829787234043, "eval_ORGANIZATION_recall": 0.8769230769230769, "eval_PERSON_f1": 0.8888888888888887, "eval_PERSON_number": 150, "eval_PERSON_precision": 0.8717948717948718, "eval_PERSON_recall": 0.9066666666666666, "eval_QUANTITY_f1": 0.7567567567567567, "eval_QUANTITY_number": 33, "eval_QUANTITY_precision": 0.6829268292682927, "eval_QUANTITY_recall": 0.8484848484848485, "eval_TIME_f1": 0.8813559322033899, "eval_TIME_number": 28, "eval_TIME_precision": 0.8387096774193549, "eval_TIME_recall": 0.9285714285714286, "eval_loss": 0.17781808972358704, "eval_overall_accuracy": 0.9582929194956353, "eval_overall_f1": 0.8277703604806409, "eval_overall_precision": 0.7711442786069652, "eval_overall_recall": 0.8933717579250721, "eval_runtime": 0.3505, "eval_samples_per_second": 533.468, "eval_steps_per_second": 8.558, "step": 8056 }, { "epoch": 77.0, "grad_norm": 1.183031439781189, "learning_rate": 1.1500000000000002e-05, "loss": 0.0305, "step": 8162 }, { "epoch": 77.0, "eval_LOCATION_f1": 0.8129032258064516, "eval_LOCATION_number": 71, "eval_LOCATION_precision": 0.75, "eval_LOCATION_recall": 0.8873239436619719, "eval_ORGANIZATION_f1": 0.7199999999999999, "eval_ORGANIZATION_number": 65, "eval_ORGANIZATION_precision": 0.6352941176470588, "eval_ORGANIZATION_recall": 0.8307692307692308, "eval_PERSON_f1": 0.8903225806451613, "eval_PERSON_number": 150, "eval_PERSON_precision": 0.8625, "eval_PERSON_recall": 0.92, "eval_QUANTITY_f1": 0.7567567567567567, "eval_QUANTITY_number": 33, "eval_QUANTITY_precision": 0.6829268292682927, "eval_QUANTITY_recall": 0.8484848484848485, "eval_TIME_f1": 0.8813559322033899, "eval_TIME_number": 28, "eval_TIME_precision": 0.8387096774193549, "eval_TIME_recall": 0.9285714285714286, "eval_loss": 0.18227067589759827, "eval_overall_accuracy": 0.9575654704170709, "eval_overall_f1": 0.8262032085561497, "eval_overall_precision": 0.770573566084788, "eval_overall_recall": 0.8904899135446686, "eval_runtime": 0.3499, "eval_samples_per_second": 534.482, "eval_steps_per_second": 8.575, "step": 8162 }, { "epoch": 78.0, "grad_norm": 0.4748055636882782, "learning_rate": 1.1000000000000001e-05, "loss": 0.0298, "step": 8268 }, { "epoch": 78.0, "eval_LOCATION_f1": 0.8387096774193548, "eval_LOCATION_number": 71, "eval_LOCATION_precision": 0.7738095238095238, "eval_LOCATION_recall": 0.9154929577464789, "eval_ORGANIZATION_f1": 0.7236842105263158, "eval_ORGANIZATION_number": 65, "eval_ORGANIZATION_precision": 0.632183908045977, "eval_ORGANIZATION_recall": 0.8461538461538461, "eval_PERSON_f1": 0.8932038834951457, "eval_PERSON_number": 150, "eval_PERSON_precision": 0.8679245283018868, "eval_PERSON_recall": 0.92, "eval_QUANTITY_f1": 0.7200000000000001, "eval_QUANTITY_number": 33, "eval_QUANTITY_precision": 0.6428571428571429, "eval_QUANTITY_recall": 0.8181818181818182, "eval_TIME_f1": 0.912280701754386, "eval_TIME_number": 28, "eval_TIME_precision": 0.896551724137931, "eval_TIME_recall": 0.9285714285714286, "eval_loss": 0.1802036613225937, "eval_overall_accuracy": 0.9575654704170709, "eval_overall_f1": 0.8315508021390374, "eval_overall_precision": 0.7755610972568578, "eval_overall_recall": 0.8962536023054755, "eval_runtime": 0.3497, "eval_samples_per_second": 534.703, "eval_steps_per_second": 8.578, "step": 8268 }, { "epoch": 79.0, "grad_norm": 1.2819609642028809, "learning_rate": 1.05e-05, "loss": 0.0302, "step": 8374 }, { "epoch": 79.0, "eval_LOCATION_f1": 0.8205128205128205, "eval_LOCATION_number": 71, "eval_LOCATION_precision": 0.7529411764705882, "eval_LOCATION_recall": 0.9014084507042254, "eval_ORGANIZATION_f1": 0.728476821192053, "eval_ORGANIZATION_number": 65, "eval_ORGANIZATION_precision": 0.6395348837209303, "eval_ORGANIZATION_recall": 0.8461538461538461, "eval_PERSON_f1": 0.90032154340836, "eval_PERSON_number": 150, "eval_PERSON_precision": 0.8695652173913043, "eval_PERSON_recall": 0.9333333333333333, "eval_QUANTITY_f1": 0.7105263157894738, "eval_QUANTITY_number": 33, "eval_QUANTITY_precision": 0.627906976744186, "eval_QUANTITY_recall": 0.8181818181818182, "eval_TIME_f1": 0.8813559322033899, "eval_TIME_number": 28, "eval_TIME_precision": 0.8387096774193549, "eval_TIME_recall": 0.9285714285714286, "eval_loss": 0.18992583453655243, "eval_overall_accuracy": 0.9585354025218235, "eval_overall_f1": 0.8286852589641435, "eval_overall_precision": 0.7684729064039408, "eval_overall_recall": 0.899135446685879, "eval_runtime": 0.3507, "eval_samples_per_second": 533.193, "eval_steps_per_second": 8.554, "step": 8374 }, { "epoch": 80.0, "grad_norm": 0.5597596168518066, "learning_rate": 1e-05, "loss": 0.0307, "step": 8480 }, { "epoch": 80.0, "eval_LOCATION_f1": 0.8533333333333334, "eval_LOCATION_number": 71, "eval_LOCATION_precision": 0.810126582278481, "eval_LOCATION_recall": 0.9014084507042254, "eval_ORGANIZATION_f1": 0.7066666666666667, "eval_ORGANIZATION_number": 65, "eval_ORGANIZATION_precision": 0.6235294117647059, "eval_ORGANIZATION_recall": 0.8153846153846154, "eval_PERSON_f1": 0.8932038834951457, "eval_PERSON_number": 150, "eval_PERSON_precision": 0.8679245283018868, "eval_PERSON_recall": 0.92, "eval_QUANTITY_f1": 0.6842105263157895, "eval_QUANTITY_number": 33, "eval_QUANTITY_precision": 0.6046511627906976, "eval_QUANTITY_recall": 0.7878787878787878, "eval_TIME_f1": 0.8524590163934426, "eval_TIME_number": 28, "eval_TIME_precision": 0.7878787878787878, "eval_TIME_recall": 0.9285714285714286, "eval_loss": 0.18140378594398499, "eval_overall_accuracy": 0.957807953443259, "eval_overall_f1": 0.8230563002680964, "eval_overall_precision": 0.7694235588972431, "eval_overall_recall": 0.8847262247838616, "eval_runtime": 0.3504, "eval_samples_per_second": 533.729, "eval_steps_per_second": 8.562, "step": 8480 }, { "epoch": 81.0, "grad_norm": 0.40338334441185, "learning_rate": 9.5e-06, "loss": 0.0275, "step": 8586 }, { "epoch": 81.0, "eval_LOCATION_f1": 0.8366013071895425, "eval_LOCATION_number": 71, "eval_LOCATION_precision": 0.7804878048780488, "eval_LOCATION_recall": 0.9014084507042254, "eval_ORGANIZATION_f1": 0.7058823529411765, "eval_ORGANIZATION_number": 65, "eval_ORGANIZATION_precision": 0.6136363636363636, "eval_ORGANIZATION_recall": 0.8307692307692308, "eval_PERSON_f1": 0.896103896103896, "eval_PERSON_number": 150, "eval_PERSON_precision": 0.8734177215189873, "eval_PERSON_recall": 0.92, "eval_QUANTITY_f1": 0.7200000000000001, "eval_QUANTITY_number": 33, "eval_QUANTITY_precision": 0.6428571428571429, "eval_QUANTITY_recall": 0.8181818181818182, "eval_TIME_f1": 0.8813559322033899, "eval_TIME_number": 28, "eval_TIME_precision": 0.8387096774193549, "eval_TIME_recall": 0.9285714285714286, "eval_loss": 0.18396371603012085, "eval_overall_accuracy": 0.9585354025218235, "eval_overall_f1": 0.8262032085561497, "eval_overall_precision": 0.770573566084788, "eval_overall_recall": 0.8904899135446686, "eval_runtime": 0.3499, "eval_samples_per_second": 534.509, "eval_steps_per_second": 8.575, "step": 8586 }, { "epoch": 82.0, "grad_norm": 0.6464970111846924, "learning_rate": 9e-06, "loss": 0.0285, "step": 8692 }, { "epoch": 82.0, "eval_LOCATION_f1": 0.8496732026143791, "eval_LOCATION_number": 71, "eval_LOCATION_precision": 0.7926829268292683, "eval_LOCATION_recall": 0.9154929577464789, "eval_ORGANIZATION_f1": 0.7142857142857143, "eval_ORGANIZATION_number": 65, "eval_ORGANIZATION_precision": 0.6179775280898876, "eval_ORGANIZATION_recall": 0.8461538461538461, "eval_PERSON_f1": 0.8903225806451613, "eval_PERSON_number": 150, "eval_PERSON_precision": 0.8625, "eval_PERSON_recall": 0.92, "eval_QUANTITY_f1": 0.7200000000000001, "eval_QUANTITY_number": 33, "eval_QUANTITY_precision": 0.6428571428571429, "eval_QUANTITY_recall": 0.8181818181818182, "eval_TIME_f1": 0.8474576271186439, "eval_TIME_number": 28, "eval_TIME_precision": 0.8064516129032258, "eval_TIME_recall": 0.8928571428571429, "eval_loss": 0.18916206061840057, "eval_overall_accuracy": 0.9570805043646945, "eval_overall_f1": 0.8255659121171772, "eval_overall_precision": 0.7673267326732673, "eval_overall_recall": 0.8933717579250721, "eval_runtime": 0.3508, "eval_samples_per_second": 533.079, "eval_steps_per_second": 8.552, "step": 8692 }, { "epoch": 83.0, "grad_norm": 0.22236359119415283, "learning_rate": 8.500000000000002e-06, "loss": 0.0303, "step": 8798 }, { "epoch": 83.0, "eval_LOCATION_f1": 0.8366013071895425, "eval_LOCATION_number": 71, "eval_LOCATION_precision": 0.7804878048780488, "eval_LOCATION_recall": 0.9014084507042254, "eval_ORGANIZATION_f1": 0.7051282051282052, "eval_ORGANIZATION_number": 65, "eval_ORGANIZATION_precision": 0.6043956043956044, "eval_ORGANIZATION_recall": 0.8461538461538461, "eval_PERSON_f1": 0.8903225806451613, "eval_PERSON_number": 150, "eval_PERSON_precision": 0.8625, "eval_PERSON_recall": 0.92, "eval_QUANTITY_f1": 0.7200000000000001, "eval_QUANTITY_number": 33, "eval_QUANTITY_precision": 0.6428571428571429, "eval_QUANTITY_recall": 0.8181818181818182, "eval_TIME_f1": 0.8474576271186439, "eval_TIME_number": 28, "eval_TIME_precision": 0.8064516129032258, "eval_TIME_recall": 0.8928571428571429, "eval_loss": 0.18220850825309753, "eval_overall_accuracy": 0.9573229873908826, "eval_overall_f1": 0.8207171314741034, "eval_overall_precision": 0.7610837438423645, "eval_overall_recall": 0.8904899135446686, "eval_runtime": 0.3506, "eval_samples_per_second": 533.426, "eval_steps_per_second": 8.558, "step": 8798 }, { "epoch": 84.0, "grad_norm": 0.35181981325149536, "learning_rate": 8.000000000000001e-06, "loss": 0.0291, "step": 8904 }, { "epoch": 84.0, "eval_LOCATION_f1": 0.8076923076923077, "eval_LOCATION_number": 71, "eval_LOCATION_precision": 0.7411764705882353, "eval_LOCATION_recall": 0.8873239436619719, "eval_ORGANIZATION_f1": 0.6973684210526315, "eval_ORGANIZATION_number": 65, "eval_ORGANIZATION_precision": 0.6091954022988506, "eval_ORGANIZATION_recall": 0.8153846153846154, "eval_PERSON_f1": 0.8903225806451613, "eval_PERSON_number": 150, "eval_PERSON_precision": 0.8625, "eval_PERSON_recall": 0.92, "eval_QUANTITY_f1": 0.7200000000000001, "eval_QUANTITY_number": 33, "eval_QUANTITY_precision": 0.6428571428571429, "eval_QUANTITY_recall": 0.8181818181818182, "eval_TIME_f1": 0.8813559322033899, "eval_TIME_number": 28, "eval_TIME_precision": 0.8387096774193549, "eval_TIME_recall": 0.9285714285714286, "eval_loss": 0.1842212826013565, "eval_overall_accuracy": 0.95635305528613, "eval_overall_f1": 0.8164893617021276, "eval_overall_precision": 0.7580246913580246, "eval_overall_recall": 0.8847262247838616, "eval_runtime": 0.3505, "eval_samples_per_second": 533.572, "eval_steps_per_second": 8.56, "step": 8904 }, { "epoch": 85.0, "grad_norm": 0.7243216037750244, "learning_rate": 7.5e-06, "loss": 0.0275, "step": 9010 }, { "epoch": 85.0, "eval_LOCATION_f1": 0.8311688311688312, "eval_LOCATION_number": 71, "eval_LOCATION_precision": 0.7710843373493976, "eval_LOCATION_recall": 0.9014084507042254, "eval_ORGANIZATION_f1": 0.6883116883116883, "eval_ORGANIZATION_number": 65, "eval_ORGANIZATION_precision": 0.5955056179775281, "eval_ORGANIZATION_recall": 0.8153846153846154, "eval_PERSON_f1": 0.8903225806451613, "eval_PERSON_number": 150, "eval_PERSON_precision": 0.8625, "eval_PERSON_recall": 0.92, "eval_QUANTITY_f1": 0.7200000000000001, "eval_QUANTITY_number": 33, "eval_QUANTITY_precision": 0.6428571428571429, "eval_QUANTITY_recall": 0.8181818181818182, "eval_TIME_f1": 0.8813559322033899, "eval_TIME_number": 28, "eval_TIME_precision": 0.8387096774193549, "eval_TIME_recall": 0.9285714285714286, "eval_loss": 0.18761229515075684, "eval_overall_accuracy": 0.9573229873908826, "eval_overall_f1": 0.8191489361702129, "eval_overall_precision": 0.7604938271604939, "eval_overall_recall": 0.8876080691642652, "eval_runtime": 0.3509, "eval_samples_per_second": 532.932, "eval_steps_per_second": 8.55, "step": 9010 }, { "epoch": 86.0, "grad_norm": 0.5909172296524048, "learning_rate": 7.000000000000001e-06, "loss": 0.0286, "step": 9116 }, { "epoch": 86.0, "eval_LOCATION_f1": 0.8311688311688312, "eval_LOCATION_number": 71, "eval_LOCATION_precision": 0.7710843373493976, "eval_LOCATION_recall": 0.9014084507042254, "eval_ORGANIZATION_f1": 0.7388535031847134, "eval_ORGANIZATION_number": 65, "eval_ORGANIZATION_precision": 0.6304347826086957, "eval_ORGANIZATION_recall": 0.8923076923076924, "eval_PERSON_f1": 0.8954248366013071, "eval_PERSON_number": 150, "eval_PERSON_precision": 0.8782051282051282, "eval_PERSON_recall": 0.9133333333333333, "eval_QUANTITY_f1": 0.7200000000000001, "eval_QUANTITY_number": 33, "eval_QUANTITY_precision": 0.6428571428571429, "eval_QUANTITY_recall": 0.8181818181818182, "eval_TIME_f1": 0.8474576271186439, "eval_TIME_number": 28, "eval_TIME_precision": 0.8064516129032258, "eval_TIME_recall": 0.8928571428571429, "eval_loss": 0.1853346824645996, "eval_overall_accuracy": 0.9582929194956353, "eval_overall_f1": 0.8282290279627165, "eval_overall_precision": 0.7698019801980198, "eval_overall_recall": 0.8962536023054755, "eval_runtime": 0.3502, "eval_samples_per_second": 533.924, "eval_steps_per_second": 8.566, "step": 9116 }, { "epoch": 87.0, "grad_norm": 0.7483916878700256, "learning_rate": 6.5000000000000004e-06, "loss": 0.0283, "step": 9222 }, { "epoch": 87.0, "eval_LOCATION_f1": 0.8289473684210527, "eval_LOCATION_number": 71, "eval_LOCATION_precision": 0.7777777777777778, "eval_LOCATION_recall": 0.8873239436619719, "eval_ORGANIZATION_f1": 0.7295597484276729, "eval_ORGANIZATION_number": 65, "eval_ORGANIZATION_precision": 0.6170212765957447, "eval_ORGANIZATION_recall": 0.8923076923076924, "eval_PERSON_f1": 0.8867313915857605, "eval_PERSON_number": 150, "eval_PERSON_precision": 0.8616352201257862, "eval_PERSON_recall": 0.9133333333333333, "eval_QUANTITY_f1": 0.7397260273972603, "eval_QUANTITY_number": 33, "eval_QUANTITY_precision": 0.675, "eval_QUANTITY_recall": 0.8181818181818182, "eval_TIME_f1": 0.8474576271186439, "eval_TIME_number": 28, "eval_TIME_precision": 0.8064516129032258, "eval_TIME_recall": 0.8928571428571429, "eval_loss": 0.1859874278306961, "eval_overall_accuracy": 0.9580504364694471, "eval_overall_f1": 0.8244680851063829, "eval_overall_precision": 0.7654320987654321, "eval_overall_recall": 0.8933717579250721, "eval_runtime": 0.3491, "eval_samples_per_second": 535.601, "eval_steps_per_second": 8.593, "step": 9222 }, { "epoch": 88.0, "grad_norm": 0.6192948222160339, "learning_rate": 6e-06, "loss": 0.0278, "step": 9328 }, { "epoch": 88.0, "eval_LOCATION_f1": 0.8289473684210527, "eval_LOCATION_number": 71, "eval_LOCATION_precision": 0.7777777777777778, "eval_LOCATION_recall": 0.8873239436619719, "eval_ORGANIZATION_f1": 0.7354838709677419, "eval_ORGANIZATION_number": 65, "eval_ORGANIZATION_precision": 0.6333333333333333, "eval_ORGANIZATION_recall": 0.8769230769230769, "eval_PERSON_f1": 0.8903225806451613, "eval_PERSON_number": 150, "eval_PERSON_precision": 0.8625, "eval_PERSON_recall": 0.92, "eval_QUANTITY_f1": 0.7777777777777778, "eval_QUANTITY_number": 33, "eval_QUANTITY_precision": 0.717948717948718, "eval_QUANTITY_recall": 0.8484848484848485, "eval_TIME_f1": 0.8474576271186439, "eval_TIME_number": 28, "eval_TIME_precision": 0.8064516129032258, "eval_TIME_recall": 0.8928571428571429, "eval_loss": 0.1810171753168106, "eval_overall_accuracy": 0.9592628516003879, "eval_overall_f1": 0.8315508021390374, "eval_overall_precision": 0.7755610972568578, "eval_overall_recall": 0.8962536023054755, "eval_runtime": 0.3504, "eval_samples_per_second": 533.64, "eval_steps_per_second": 8.561, "step": 9328 }, { "epoch": 89.0, "grad_norm": 0.5605934858322144, "learning_rate": 5.500000000000001e-06, "loss": 0.0277, "step": 9434 }, { "epoch": 89.0, "eval_LOCATION_f1": 0.8421052631578947, "eval_LOCATION_number": 71, "eval_LOCATION_precision": 0.7901234567901234, "eval_LOCATION_recall": 0.9014084507042254, "eval_ORGANIZATION_f1": 0.7124999999999999, "eval_ORGANIZATION_number": 65, "eval_ORGANIZATION_precision": 0.6, "eval_ORGANIZATION_recall": 0.8769230769230769, "eval_PERSON_f1": 0.887459807073955, "eval_PERSON_number": 150, "eval_PERSON_precision": 0.8571428571428571, "eval_PERSON_recall": 0.92, "eval_QUANTITY_f1": 0.7105263157894738, "eval_QUANTITY_number": 33, "eval_QUANTITY_precision": 0.627906976744186, "eval_QUANTITY_recall": 0.8181818181818182, "eval_TIME_f1": 0.8474576271186439, "eval_TIME_number": 28, "eval_TIME_precision": 0.8064516129032258, "eval_TIME_recall": 0.8928571428571429, "eval_loss": 0.18933603167533875, "eval_overall_accuracy": 0.95635305528613, "eval_overall_f1": 0.820580474934037, "eval_overall_precision": 0.7566909975669099, "eval_overall_recall": 0.8962536023054755, "eval_runtime": 0.3526, "eval_samples_per_second": 530.391, "eval_steps_per_second": 8.509, "step": 9434 }, { "epoch": 90.0, "grad_norm": 0.2893717586994171, "learning_rate": 5e-06, "loss": 0.0274, "step": 9540 }, { "epoch": 90.0, "eval_LOCATION_f1": 0.8157894736842104, "eval_LOCATION_number": 71, "eval_LOCATION_precision": 0.7654320987654321, "eval_LOCATION_recall": 0.8732394366197183, "eval_ORGANIZATION_f1": 0.7142857142857143, "eval_ORGANIZATION_number": 65, "eval_ORGANIZATION_precision": 0.6179775280898876, "eval_ORGANIZATION_recall": 0.8461538461538461, "eval_PERSON_f1": 0.8925081433224756, "eval_PERSON_number": 150, "eval_PERSON_precision": 0.8726114649681529, "eval_PERSON_recall": 0.9133333333333333, "eval_QUANTITY_f1": 0.7123287671232875, "eval_QUANTITY_number": 33, "eval_QUANTITY_precision": 0.65, "eval_QUANTITY_recall": 0.7878787878787878, "eval_TIME_f1": 0.8333333333333334, "eval_TIME_number": 28, "eval_TIME_precision": 0.78125, "eval_TIME_recall": 0.8928571428571429, "eval_loss": 0.18061868846416473, "eval_overall_accuracy": 0.9582929194956353, "eval_overall_f1": 0.8176943699731903, "eval_overall_precision": 0.7644110275689223, "eval_overall_recall": 0.8789625360230547, "eval_runtime": 0.3513, "eval_samples_per_second": 532.297, "eval_steps_per_second": 8.54, "step": 9540 }, { "epoch": 91.0, "grad_norm": 0.9740373492240906, "learning_rate": 4.5e-06, "loss": 0.0262, "step": 9646 }, { "epoch": 91.0, "eval_LOCATION_f1": 0.8104575163398693, "eval_LOCATION_number": 71, "eval_LOCATION_precision": 0.7560975609756098, "eval_LOCATION_recall": 0.8732394366197183, "eval_ORGANIZATION_f1": 0.708860759493671, "eval_ORGANIZATION_number": 65, "eval_ORGANIZATION_precision": 0.6021505376344086, "eval_ORGANIZATION_recall": 0.8615384615384616, "eval_PERSON_f1": 0.8782051282051282, "eval_PERSON_number": 150, "eval_PERSON_precision": 0.845679012345679, "eval_PERSON_recall": 0.9133333333333333, "eval_QUANTITY_f1": 0.7105263157894738, "eval_QUANTITY_number": 33, "eval_QUANTITY_precision": 0.627906976744186, "eval_QUANTITY_recall": 0.8181818181818182, "eval_TIME_f1": 0.8474576271186439, "eval_TIME_number": 28, "eval_TIME_precision": 0.8064516129032258, "eval_TIME_recall": 0.8928571428571429, "eval_loss": 0.18925167620182037, "eval_overall_accuracy": 0.95635305528613, "eval_overall_f1": 0.8100263852242744, "eval_overall_precision": 0.7469586374695864, "eval_overall_recall": 0.8847262247838616, "eval_runtime": 0.3493, "eval_samples_per_second": 535.417, "eval_steps_per_second": 8.59, "step": 9646 }, { "epoch": 92.0, "grad_norm": 0.1865842491388321, "learning_rate": 4.000000000000001e-06, "loss": 0.0263, "step": 9752 }, { "epoch": 92.0, "eval_LOCATION_f1": 0.8157894736842104, "eval_LOCATION_number": 71, "eval_LOCATION_precision": 0.7654320987654321, "eval_LOCATION_recall": 0.8732394366197183, "eval_ORGANIZATION_f1": 0.7466666666666668, "eval_ORGANIZATION_number": 65, "eval_ORGANIZATION_precision": 0.6588235294117647, "eval_ORGANIZATION_recall": 0.8615384615384616, "eval_PERSON_f1": 0.8810289389067525, "eval_PERSON_number": 150, "eval_PERSON_precision": 0.8509316770186336, "eval_PERSON_recall": 0.9133333333333333, "eval_QUANTITY_f1": 0.7123287671232875, "eval_QUANTITY_number": 33, "eval_QUANTITY_precision": 0.65, "eval_QUANTITY_recall": 0.7878787878787878, "eval_TIME_f1": 0.8333333333333334, "eval_TIME_number": 28, "eval_TIME_precision": 0.78125, "eval_TIME_recall": 0.8928571428571429, "eval_loss": 0.18539157509803772, "eval_overall_accuracy": 0.9587778855480117, "eval_overall_f1": 0.8203753351206434, "eval_overall_precision": 0.7669172932330827, "eval_overall_recall": 0.8818443804034583, "eval_runtime": 0.3492, "eval_samples_per_second": 535.496, "eval_steps_per_second": 8.591, "step": 9752 }, { "epoch": 93.0, "grad_norm": 0.1964859962463379, "learning_rate": 3.5000000000000004e-06, "loss": 0.0253, "step": 9858 }, { "epoch": 93.0, "eval_LOCATION_f1": 0.823529411764706, "eval_LOCATION_number": 71, "eval_LOCATION_precision": 0.7682926829268293, "eval_LOCATION_recall": 0.8873239436619719, "eval_ORGANIZATION_f1": 0.713375796178344, "eval_ORGANIZATION_number": 65, "eval_ORGANIZATION_precision": 0.6086956521739131, "eval_ORGANIZATION_recall": 0.8615384615384616, "eval_PERSON_f1": 0.8782051282051282, "eval_PERSON_number": 150, "eval_PERSON_precision": 0.845679012345679, "eval_PERSON_recall": 0.9133333333333333, "eval_QUANTITY_f1": 0.7297297297297297, "eval_QUANTITY_number": 33, "eval_QUANTITY_precision": 0.6585365853658537, "eval_QUANTITY_recall": 0.8181818181818182, "eval_TIME_f1": 0.8474576271186439, "eval_TIME_number": 28, "eval_TIME_precision": 0.8064516129032258, "eval_TIME_recall": 0.8928571428571429, "eval_loss": 0.189639613032341, "eval_overall_accuracy": 0.957807953443259, "eval_overall_f1": 0.8158940397350992, "eval_overall_precision": 0.7549019607843137, "eval_overall_recall": 0.8876080691642652, "eval_runtime": 0.351, "eval_samples_per_second": 532.764, "eval_steps_per_second": 8.547, "step": 9858 }, { "epoch": 94.0, "grad_norm": 0.6065542101860046, "learning_rate": 3e-06, "loss": 0.0246, "step": 9964 }, { "epoch": 94.0, "eval_LOCATION_f1": 0.8157894736842104, "eval_LOCATION_number": 71, "eval_LOCATION_precision": 0.7654320987654321, "eval_LOCATION_recall": 0.8732394366197183, "eval_ORGANIZATION_f1": 0.713375796178344, "eval_ORGANIZATION_number": 65, "eval_ORGANIZATION_precision": 0.6086956521739131, "eval_ORGANIZATION_recall": 0.8615384615384616, "eval_PERSON_f1": 0.8766233766233766, "eval_PERSON_number": 150, "eval_PERSON_precision": 0.8544303797468354, "eval_PERSON_recall": 0.9, "eval_QUANTITY_f1": 0.7397260273972603, "eval_QUANTITY_number": 33, "eval_QUANTITY_precision": 0.675, "eval_QUANTITY_recall": 0.8181818181818182, "eval_TIME_f1": 0.8474576271186439, "eval_TIME_number": 28, "eval_TIME_precision": 0.8064516129032258, "eval_TIME_recall": 0.8928571428571429, "eval_loss": 0.18659386038780212, "eval_overall_accuracy": 0.957807953443259, "eval_overall_f1": 0.8144192256341789, "eval_overall_precision": 0.7587064676616916, "eval_overall_recall": 0.8789625360230547, "eval_runtime": 0.3514, "eval_samples_per_second": 532.142, "eval_steps_per_second": 8.537, "step": 9964 }, { "epoch": 95.0, "grad_norm": 0.47104644775390625, "learning_rate": 2.5e-06, "loss": 0.0277, "step": 10070 }, { "epoch": 95.0, "eval_LOCATION_f1": 0.8104575163398693, "eval_LOCATION_number": 71, "eval_LOCATION_precision": 0.7560975609756098, "eval_LOCATION_recall": 0.8732394366197183, "eval_ORGANIZATION_f1": 0.7368421052631579, "eval_ORGANIZATION_number": 65, "eval_ORGANIZATION_precision": 0.6436781609195402, "eval_ORGANIZATION_recall": 0.8615384615384616, "eval_PERSON_f1": 0.8737864077669903, "eval_PERSON_number": 150, "eval_PERSON_precision": 0.8490566037735849, "eval_PERSON_recall": 0.9, "eval_QUANTITY_f1": 0.7200000000000001, "eval_QUANTITY_number": 33, "eval_QUANTITY_precision": 0.6428571428571429, "eval_QUANTITY_recall": 0.8181818181818182, "eval_TIME_f1": 0.8474576271186439, "eval_TIME_number": 28, "eval_TIME_precision": 0.8064516129032258, "eval_TIME_recall": 0.8928571428571429, "eval_loss": 0.18918968737125397, "eval_overall_accuracy": 0.9573229873908826, "eval_overall_f1": 0.8155080213903744, "eval_overall_precision": 0.7605985037406484, "eval_overall_recall": 0.8789625360230547, "eval_runtime": 0.3518, "eval_samples_per_second": 531.589, "eval_steps_per_second": 8.528, "step": 10070 }, { "epoch": 96.0, "grad_norm": 0.6074219346046448, "learning_rate": 2.0000000000000003e-06, "loss": 0.0261, "step": 10176 }, { "epoch": 96.0, "eval_LOCATION_f1": 0.8157894736842104, "eval_LOCATION_number": 71, "eval_LOCATION_precision": 0.7654320987654321, "eval_LOCATION_recall": 0.8732394366197183, "eval_ORGANIZATION_f1": 0.717948717948718, "eval_ORGANIZATION_number": 65, "eval_ORGANIZATION_precision": 0.6153846153846154, "eval_ORGANIZATION_recall": 0.8615384615384616, "eval_PERSON_f1": 0.8810289389067525, "eval_PERSON_number": 150, "eval_PERSON_precision": 0.8509316770186336, "eval_PERSON_recall": 0.9133333333333333, "eval_QUANTITY_f1": 0.7397260273972603, "eval_QUANTITY_number": 33, "eval_QUANTITY_precision": 0.675, "eval_QUANTITY_recall": 0.8181818181818182, "eval_TIME_f1": 0.8474576271186439, "eval_TIME_number": 28, "eval_TIME_precision": 0.8064516129032258, "eval_TIME_recall": 0.8928571428571429, "eval_loss": 0.18794935941696167, "eval_overall_accuracy": 0.9575654704170709, "eval_overall_f1": 0.8175765645805593, "eval_overall_precision": 0.7599009900990099, "eval_overall_recall": 0.8847262247838616, "eval_runtime": 0.3495, "eval_samples_per_second": 534.995, "eval_steps_per_second": 8.583, "step": 10176 }, { "epoch": 97.0, "grad_norm": 0.5106649398803711, "learning_rate": 1.5e-06, "loss": 0.025, "step": 10282 }, { "epoch": 97.0, "eval_LOCATION_f1": 0.8157894736842104, "eval_LOCATION_number": 71, "eval_LOCATION_precision": 0.7654320987654321, "eval_LOCATION_recall": 0.8732394366197183, "eval_ORGANIZATION_f1": 0.7189542483660131, "eval_ORGANIZATION_number": 65, "eval_ORGANIZATION_precision": 0.625, "eval_ORGANIZATION_recall": 0.8461538461538461, "eval_PERSON_f1": 0.8810289389067525, "eval_PERSON_number": 150, "eval_PERSON_precision": 0.8509316770186336, "eval_PERSON_recall": 0.9133333333333333, "eval_QUANTITY_f1": 0.7200000000000001, "eval_QUANTITY_number": 33, "eval_QUANTITY_precision": 0.6428571428571429, "eval_QUANTITY_recall": 0.8181818181818182, "eval_TIME_f1": 0.8474576271186439, "eval_TIME_number": 28, "eval_TIME_precision": 0.8064516129032258, "eval_TIME_recall": 0.8928571428571429, "eval_loss": 0.18944178521633148, "eval_overall_accuracy": 0.9575654704170709, "eval_overall_f1": 0.816, "eval_overall_precision": 0.7593052109181141, "eval_overall_recall": 0.8818443804034583, "eval_runtime": 0.3495, "eval_samples_per_second": 535.094, "eval_steps_per_second": 8.584, "step": 10282 }, { "epoch": 98.0, "grad_norm": 0.6887297034263611, "learning_rate": 1.0000000000000002e-06, "loss": 0.0257, "step": 10388 }, { "epoch": 98.0, "eval_LOCATION_f1": 0.823529411764706, "eval_LOCATION_number": 71, "eval_LOCATION_precision": 0.7682926829268293, "eval_LOCATION_recall": 0.8873239436619719, "eval_ORGANIZATION_f1": 0.713375796178344, "eval_ORGANIZATION_number": 65, "eval_ORGANIZATION_precision": 0.6086956521739131, "eval_ORGANIZATION_recall": 0.8615384615384616, "eval_PERSON_f1": 0.8782051282051282, "eval_PERSON_number": 150, "eval_PERSON_precision": 0.845679012345679, "eval_PERSON_recall": 0.9133333333333333, "eval_QUANTITY_f1": 0.7200000000000001, "eval_QUANTITY_number": 33, "eval_QUANTITY_precision": 0.6428571428571429, "eval_QUANTITY_recall": 0.8181818181818182, "eval_TIME_f1": 0.8474576271186439, "eval_TIME_number": 28, "eval_TIME_precision": 0.8064516129032258, "eval_TIME_recall": 0.8928571428571429, "eval_loss": 0.19144974648952484, "eval_overall_accuracy": 0.9570805043646945, "eval_overall_f1": 0.8148148148148148, "eval_overall_precision": 0.7530562347188264, "eval_overall_recall": 0.8876080691642652, "eval_runtime": 0.3502, "eval_samples_per_second": 533.939, "eval_steps_per_second": 8.566, "step": 10388 }, { "epoch": 99.0, "grad_norm": 0.14230668544769287, "learning_rate": 5.000000000000001e-07, "loss": 0.0274, "step": 10494 }, { "epoch": 99.0, "eval_LOCATION_f1": 0.823529411764706, "eval_LOCATION_number": 71, "eval_LOCATION_precision": 0.7682926829268293, "eval_LOCATION_recall": 0.8873239436619719, "eval_ORGANIZATION_f1": 0.713375796178344, "eval_ORGANIZATION_number": 65, "eval_ORGANIZATION_precision": 0.6086956521739131, "eval_ORGANIZATION_recall": 0.8615384615384616, "eval_PERSON_f1": 0.8810289389067525, "eval_PERSON_number": 150, "eval_PERSON_precision": 0.8509316770186336, "eval_PERSON_recall": 0.9133333333333333, "eval_QUANTITY_f1": 0.7200000000000001, "eval_QUANTITY_number": 33, "eval_QUANTITY_precision": 0.6428571428571429, "eval_QUANTITY_recall": 0.8181818181818182, "eval_TIME_f1": 0.8474576271186439, "eval_TIME_number": 28, "eval_TIME_precision": 0.8064516129032258, "eval_TIME_recall": 0.8928571428571429, "eval_loss": 0.19010868668556213, "eval_overall_accuracy": 0.9568380213385063, "eval_overall_f1": 0.8158940397350992, "eval_overall_precision": 0.7549019607843137, "eval_overall_recall": 0.8876080691642652, "eval_runtime": 0.3511, "eval_samples_per_second": 532.588, "eval_steps_per_second": 8.544, "step": 10494 }, { "epoch": 100.0, "grad_norm": 0.5434573292732239, "learning_rate": 0.0, "loss": 0.0256, "step": 10600 }, { "epoch": 100.0, "eval_LOCATION_f1": 0.823529411764706, "eval_LOCATION_number": 71, "eval_LOCATION_precision": 0.7682926829268293, "eval_LOCATION_recall": 0.8873239436619719, "eval_ORGANIZATION_f1": 0.717948717948718, "eval_ORGANIZATION_number": 65, "eval_ORGANIZATION_precision": 0.6153846153846154, "eval_ORGANIZATION_recall": 0.8615384615384616, "eval_PERSON_f1": 0.8782051282051282, "eval_PERSON_number": 150, "eval_PERSON_precision": 0.845679012345679, "eval_PERSON_recall": 0.9133333333333333, "eval_QUANTITY_f1": 0.7297297297297297, "eval_QUANTITY_number": 33, "eval_QUANTITY_precision": 0.6585365853658537, "eval_QUANTITY_recall": 0.8181818181818182, "eval_TIME_f1": 0.8474576271186439, "eval_TIME_number": 28, "eval_TIME_precision": 0.8064516129032258, "eval_TIME_recall": 0.8928571428571429, "eval_loss": 0.18971124291419983, "eval_overall_accuracy": 0.9573229873908826, "eval_overall_f1": 0.816976127320955, "eval_overall_precision": 0.7567567567567568, "eval_overall_recall": 0.8876080691642652, "eval_runtime": 0.3511, "eval_samples_per_second": 532.586, "eval_steps_per_second": 8.544, "step": 10600 }, { "epoch": 100.0, "step": 10600, "total_flos": 5123217774191952.0, "train_loss": 0.07423505819068765, "train_runtime": 606.268, "train_samples_per_second": 278.425, "train_steps_per_second": 17.484 } ], "logging_steps": 500, "max_steps": 10600, "num_input_tokens_seen": 0, "num_train_epochs": 100, "save_steps": 500, "total_flos": 5123217774191952.0, "train_batch_size": 16, "trial_name": null, "trial_params": null }