{ "best_metric": null, "best_model_checkpoint": null, "epoch": 100.0, "eval_steps": 500, "global_step": 10600, "is_hyper_param_search": false, "is_local_process_zero": true, "is_world_process_zero": true, "log_history": [ { "epoch": 1.0, "grad_norm": 2.5185272693634033, "learning_rate": 4.9500000000000004e-05, "loss": 0.9922, "step": 106 }, { "epoch": 1.0, "eval_LOCATION_f1": 0.0, "eval_LOCATION_number": 71, "eval_LOCATION_precision": 0.0, "eval_LOCATION_recall": 0.0, "eval_ORGANIZATION_f1": 0.0, "eval_ORGANIZATION_number": 65, "eval_ORGANIZATION_precision": 0.0, "eval_ORGANIZATION_recall": 0.0, "eval_PERSON_f1": 0.012048192771084338, "eval_PERSON_number": 150, "eval_PERSON_precision": 0.0625, "eval_PERSON_recall": 0.006666666666666667, "eval_QUANTITY_f1": 0.0, "eval_QUANTITY_number": 33, "eval_QUANTITY_precision": 0.0, "eval_QUANTITY_recall": 0.0, "eval_TIME_f1": 0.0, "eval_TIME_number": 28, "eval_TIME_precision": 0.0, "eval_TIME_recall": 0.0, "eval_loss": 0.5609568953514099, "eval_overall_accuracy": 0.8435984481086324, "eval_overall_f1": 0.005347593582887699, "eval_overall_precision": 0.037037037037037035, "eval_overall_recall": 0.002881844380403458, "eval_runtime": 0.385, "eval_samples_per_second": 485.683, "eval_steps_per_second": 7.792, "step": 106 }, { "epoch": 2.0, "grad_norm": 1.2335773706436157, "learning_rate": 4.9e-05, "loss": 0.4811, "step": 212 }, { "epoch": 2.0, "eval_LOCATION_f1": 0.416, "eval_LOCATION_number": 71, "eval_LOCATION_precision": 0.48148148148148145, "eval_LOCATION_recall": 0.36619718309859156, "eval_ORGANIZATION_f1": 0.14285714285714285, "eval_ORGANIZATION_number": 65, "eval_ORGANIZATION_precision": 0.14754098360655737, "eval_ORGANIZATION_recall": 0.13846153846153847, "eval_PERSON_f1": 0.6887052341597797, "eval_PERSON_number": 150, "eval_PERSON_precision": 0.5868544600938967, "eval_PERSON_recall": 0.8333333333333334, "eval_QUANTITY_f1": 0.3692307692307692, "eval_QUANTITY_number": 33, "eval_QUANTITY_precision": 0.375, "eval_QUANTITY_recall": 0.36363636363636365, "eval_TIME_f1": 0.7586206896551724, "eval_TIME_number": 28, "eval_TIME_precision": 0.7333333333333333, "eval_TIME_recall": 0.7857142857142857, "eval_loss": 0.32625189423561096, "eval_overall_accuracy": 0.9093113482056256, "eval_overall_f1": 0.5264586160108549, "eval_overall_precision": 0.49743589743589745, "eval_overall_recall": 0.5590778097982709, "eval_runtime": 0.3863, "eval_samples_per_second": 484.036, "eval_steps_per_second": 7.765, "step": 212 }, { "epoch": 3.0, "grad_norm": 0.693739652633667, "learning_rate": 4.85e-05, "loss": 0.2923, "step": 318 }, { "epoch": 3.0, "eval_LOCATION_f1": 0.6103896103896105, "eval_LOCATION_number": 71, "eval_LOCATION_precision": 0.5662650602409639, "eval_LOCATION_recall": 0.6619718309859155, "eval_ORGANIZATION_f1": 0.47619047619047616, "eval_ORGANIZATION_number": 65, "eval_ORGANIZATION_precision": 0.4268292682926829, "eval_ORGANIZATION_recall": 0.5384615384615384, "eval_PERSON_f1": 0.8348909657320873, "eval_PERSON_number": 150, "eval_PERSON_precision": 0.783625730994152, "eval_PERSON_recall": 0.8933333333333333, "eval_QUANTITY_f1": 0.6133333333333334, "eval_QUANTITY_number": 33, "eval_QUANTITY_precision": 0.5476190476190477, "eval_QUANTITY_recall": 0.696969696969697, "eval_TIME_f1": 0.7999999999999999, "eval_TIME_number": 28, "eval_TIME_precision": 0.75, "eval_TIME_recall": 0.8571428571428571, "eval_loss": 0.19018957018852234, "eval_overall_accuracy": 0.9338021338506305, "eval_overall_f1": 0.6948480845442536, "eval_overall_precision": 0.6414634146341464, "eval_overall_recall": 0.7579250720461095, "eval_runtime": 0.3873, "eval_samples_per_second": 482.829, "eval_steps_per_second": 7.746, "step": 318 }, { "epoch": 4.0, "grad_norm": 1.1100132465362549, "learning_rate": 4.8e-05, "loss": 0.2082, "step": 424 }, { "epoch": 4.0, "eval_LOCATION_f1": 0.7388535031847132, "eval_LOCATION_number": 71, "eval_LOCATION_precision": 0.6744186046511628, "eval_LOCATION_recall": 0.8169014084507042, "eval_ORGANIZATION_f1": 0.638036809815951, "eval_ORGANIZATION_number": 65, "eval_ORGANIZATION_precision": 0.5306122448979592, "eval_ORGANIZATION_recall": 0.8, "eval_PERSON_f1": 0.8589341692789968, "eval_PERSON_number": 150, "eval_PERSON_precision": 0.8106508875739645, "eval_PERSON_recall": 0.9133333333333333, "eval_QUANTITY_f1": 0.7012987012987013, "eval_QUANTITY_number": 33, "eval_QUANTITY_precision": 0.6136363636363636, "eval_QUANTITY_recall": 0.8181818181818182, "eval_TIME_f1": 0.8275862068965518, "eval_TIME_number": 28, "eval_TIME_precision": 0.8, "eval_TIME_recall": 0.8571428571428571, "eval_loss": 0.15403173863887787, "eval_overall_accuracy": 0.9459262851600388, "eval_overall_f1": 0.7700258397932818, "eval_overall_precision": 0.6978922716627635, "eval_overall_recall": 0.8587896253602305, "eval_runtime": 0.3828, "eval_samples_per_second": 488.521, "eval_steps_per_second": 7.837, "step": 424 }, { "epoch": 5.0, "grad_norm": 1.3037128448486328, "learning_rate": 4.75e-05, "loss": 0.1772, "step": 530 }, { "epoch": 5.0, "eval_LOCATION_f1": 0.7612903225806451, "eval_LOCATION_number": 71, "eval_LOCATION_precision": 0.7023809523809523, "eval_LOCATION_recall": 0.8309859154929577, "eval_ORGANIZATION_f1": 0.6756756756756758, "eval_ORGANIZATION_number": 65, "eval_ORGANIZATION_precision": 0.6024096385542169, "eval_ORGANIZATION_recall": 0.7692307692307693, "eval_PERSON_f1": 0.8698412698412699, "eval_PERSON_number": 150, "eval_PERSON_precision": 0.8303030303030303, "eval_PERSON_recall": 0.9133333333333333, "eval_QUANTITY_f1": 0.6835443037974683, "eval_QUANTITY_number": 33, "eval_QUANTITY_precision": 0.5869565217391305, "eval_QUANTITY_recall": 0.8181818181818182, "eval_TIME_f1": 0.8524590163934426, "eval_TIME_number": 28, "eval_TIME_precision": 0.7878787878787878, "eval_TIME_recall": 0.9285714285714286, "eval_loss": 0.14435262978076935, "eval_overall_accuracy": 0.9512609117361784, "eval_overall_f1": 0.7889182058047493, "eval_overall_precision": 0.7274939172749392, "eval_overall_recall": 0.861671469740634, "eval_runtime": 0.3866, "eval_samples_per_second": 483.672, "eval_steps_per_second": 7.759, "step": 530 }, { "epoch": 6.0, "grad_norm": 0.9674538969993591, "learning_rate": 4.7e-05, "loss": 0.1576, "step": 636 }, { "epoch": 6.0, "eval_LOCATION_f1": 0.7151515151515151, "eval_LOCATION_number": 71, "eval_LOCATION_precision": 0.6276595744680851, "eval_LOCATION_recall": 0.8309859154929577, "eval_ORGANIZATION_f1": 0.674698795180723, "eval_ORGANIZATION_number": 65, "eval_ORGANIZATION_precision": 0.5544554455445545, "eval_ORGANIZATION_recall": 0.8615384615384616, "eval_PERSON_f1": 0.866043613707165, "eval_PERSON_number": 150, "eval_PERSON_precision": 0.8128654970760234, "eval_PERSON_recall": 0.9266666666666666, "eval_QUANTITY_f1": 0.6363636363636364, "eval_QUANTITY_number": 33, "eval_QUANTITY_precision": 0.509090909090909, "eval_QUANTITY_recall": 0.8484848484848485, "eval_TIME_f1": 0.78125, "eval_TIME_number": 28, "eval_TIME_precision": 0.6944444444444444, "eval_TIME_recall": 0.8928571428571429, "eval_loss": 0.1679927557706833, "eval_overall_accuracy": 0.9413191076624636, "eval_overall_f1": 0.763681592039801, "eval_overall_precision": 0.6717724288840262, "eval_overall_recall": 0.8847262247838616, "eval_runtime": 0.3871, "eval_samples_per_second": 483.093, "eval_steps_per_second": 7.75, "step": 636 }, { "epoch": 7.0, "grad_norm": 1.824372410774231, "learning_rate": 4.6500000000000005e-05, "loss": 0.147, "step": 742 }, { "epoch": 7.0, "eval_LOCATION_f1": 0.7741935483870968, "eval_LOCATION_number": 71, "eval_LOCATION_precision": 0.7142857142857143, "eval_LOCATION_recall": 0.8450704225352113, "eval_ORGANIZATION_f1": 0.7124999999999999, "eval_ORGANIZATION_number": 65, "eval_ORGANIZATION_precision": 0.6, "eval_ORGANIZATION_recall": 0.8769230769230769, "eval_PERSON_f1": 0.8606811145510835, "eval_PERSON_number": 150, "eval_PERSON_precision": 0.8034682080924855, "eval_PERSON_recall": 0.9266666666666666, "eval_QUANTITY_f1": 0.7012987012987013, "eval_QUANTITY_number": 33, "eval_QUANTITY_precision": 0.6136363636363636, "eval_QUANTITY_recall": 0.8181818181818182, "eval_TIME_f1": 0.806451612903226, "eval_TIME_number": 28, "eval_TIME_precision": 0.7352941176470589, "eval_TIME_recall": 0.8928571428571429, "eval_loss": 0.1446426808834076, "eval_overall_accuracy": 0.9519883608147429, "eval_overall_f1": 0.7927927927927928, "eval_overall_precision": 0.7162790697674418, "eval_overall_recall": 0.8876080691642652, "eval_runtime": 0.3858, "eval_samples_per_second": 484.678, "eval_steps_per_second": 7.776, "step": 742 }, { "epoch": 8.0, "grad_norm": 0.6194243431091309, "learning_rate": 4.600000000000001e-05, "loss": 0.1329, "step": 848 }, { "epoch": 8.0, "eval_LOCATION_f1": 0.7453416149068322, "eval_LOCATION_number": 71, "eval_LOCATION_precision": 0.6666666666666666, "eval_LOCATION_recall": 0.8450704225352113, "eval_ORGANIZATION_f1": 0.6993865030674845, "eval_ORGANIZATION_number": 65, "eval_ORGANIZATION_precision": 0.5816326530612245, "eval_ORGANIZATION_recall": 0.8769230769230769, "eval_PERSON_f1": 0.8643533123028392, "eval_PERSON_number": 150, "eval_PERSON_precision": 0.8203592814371258, "eval_PERSON_recall": 0.9133333333333333, "eval_QUANTITY_f1": 0.7567567567567567, "eval_QUANTITY_number": 33, "eval_QUANTITY_precision": 0.6829268292682927, "eval_QUANTITY_recall": 0.8484848484848485, "eval_TIME_f1": 0.8666666666666666, "eval_TIME_number": 28, "eval_TIME_precision": 0.8125, "eval_TIME_recall": 0.9285714285714286, "eval_loss": 0.14050208032131195, "eval_overall_accuracy": 0.9517458777885548, "eval_overall_f1": 0.7948387096774193, "eval_overall_precision": 0.719626168224299, "eval_overall_recall": 0.8876080691642652, "eval_runtime": 0.3902, "eval_samples_per_second": 479.194, "eval_steps_per_second": 7.688, "step": 848 }, { "epoch": 9.0, "grad_norm": 0.7105451226234436, "learning_rate": 4.55e-05, "loss": 0.1309, "step": 954 }, { "epoch": 9.0, "eval_LOCATION_f1": 0.7814569536423841, "eval_LOCATION_number": 71, "eval_LOCATION_precision": 0.7375, "eval_LOCATION_recall": 0.8309859154929577, "eval_ORGANIZATION_f1": 0.6628571428571428, "eval_ORGANIZATION_number": 65, "eval_ORGANIZATION_precision": 0.5272727272727272, "eval_ORGANIZATION_recall": 0.8923076923076924, "eval_PERSON_f1": 0.8717948717948718, "eval_PERSON_number": 150, "eval_PERSON_precision": 0.8395061728395061, "eval_PERSON_recall": 0.9066666666666666, "eval_QUANTITY_f1": 0.6419753086419753, "eval_QUANTITY_number": 33, "eval_QUANTITY_precision": 0.5416666666666666, "eval_QUANTITY_recall": 0.7878787878787878, "eval_TIME_f1": 0.7936507936507937, "eval_TIME_number": 28, "eval_TIME_precision": 0.7142857142857143, "eval_TIME_recall": 0.8928571428571429, "eval_loss": 0.13999436795711517, "eval_overall_accuracy": 0.9471387002909797, "eval_overall_f1": 0.7774936061381075, "eval_overall_precision": 0.6988505747126437, "eval_overall_recall": 0.8760806916426513, "eval_runtime": 0.3858, "eval_samples_per_second": 484.669, "eval_steps_per_second": 7.775, "step": 954 }, { "epoch": 10.0, "grad_norm": 1.1783398389816284, "learning_rate": 4.5e-05, "loss": 0.1247, "step": 1060 }, { "epoch": 10.0, "eval_LOCATION_f1": 0.778523489932886, "eval_LOCATION_number": 71, "eval_LOCATION_precision": 0.7435897435897436, "eval_LOCATION_recall": 0.8169014084507042, "eval_ORGANIZATION_f1": 0.7346938775510204, "eval_ORGANIZATION_number": 65, "eval_ORGANIZATION_precision": 0.6585365853658537, "eval_ORGANIZATION_recall": 0.8307692307692308, "eval_PERSON_f1": 0.8653846153846153, "eval_PERSON_number": 150, "eval_PERSON_precision": 0.8333333333333334, "eval_PERSON_recall": 0.9, "eval_QUANTITY_f1": 0.6666666666666666, "eval_QUANTITY_number": 33, "eval_QUANTITY_precision": 0.5777777777777777, "eval_QUANTITY_recall": 0.7878787878787878, "eval_TIME_f1": 0.8333333333333334, "eval_TIME_number": 28, "eval_TIME_precision": 0.78125, "eval_TIME_recall": 0.8928571428571429, "eval_loss": 0.1291128396987915, "eval_overall_accuracy": 0.953443258971872, "eval_overall_f1": 0.7989276139410187, "eval_overall_precision": 0.7468671679197995, "eval_overall_recall": 0.8587896253602305, "eval_runtime": 0.3852, "eval_samples_per_second": 485.435, "eval_steps_per_second": 7.788, "step": 1060 }, { "epoch": 11.0, "grad_norm": 0.8099766969680786, "learning_rate": 4.4500000000000004e-05, "loss": 0.1149, "step": 1166 }, { "epoch": 11.0, "eval_LOCATION_f1": 0.7763157894736843, "eval_LOCATION_number": 71, "eval_LOCATION_precision": 0.7283950617283951, "eval_LOCATION_recall": 0.8309859154929577, "eval_ORGANIZATION_f1": 0.708860759493671, "eval_ORGANIZATION_number": 65, "eval_ORGANIZATION_precision": 0.6021505376344086, "eval_ORGANIZATION_recall": 0.8615384615384616, "eval_PERSON_f1": 0.870967741935484, "eval_PERSON_number": 150, "eval_PERSON_precision": 0.84375, "eval_PERSON_recall": 0.9, "eval_QUANTITY_f1": 0.7012987012987013, "eval_QUANTITY_number": 33, "eval_QUANTITY_precision": 0.6136363636363636, "eval_QUANTITY_recall": 0.8181818181818182, "eval_TIME_f1": 0.7384615384615384, "eval_TIME_number": 28, "eval_TIME_precision": 0.6486486486486487, "eval_TIME_recall": 0.8571428571428571, "eval_loss": 0.1423446536064148, "eval_overall_accuracy": 0.9493210475266731, "eval_overall_f1": 0.7900262467191601, "eval_overall_precision": 0.7253012048192771, "eval_overall_recall": 0.8674351585014409, "eval_runtime": 0.3862, "eval_samples_per_second": 484.205, "eval_steps_per_second": 7.768, "step": 1166 }, { "epoch": 12.0, "grad_norm": 0.6322067975997925, "learning_rate": 4.4000000000000006e-05, "loss": 0.1118, "step": 1272 }, { "epoch": 12.0, "eval_LOCATION_f1": 0.7239263803680982, "eval_LOCATION_number": 71, "eval_LOCATION_precision": 0.6413043478260869, "eval_LOCATION_recall": 0.8309859154929577, "eval_ORGANIZATION_f1": 0.7124999999999999, "eval_ORGANIZATION_number": 65, "eval_ORGANIZATION_precision": 0.6, "eval_ORGANIZATION_recall": 0.8769230769230769, "eval_PERSON_f1": 0.8789808917197452, "eval_PERSON_number": 150, "eval_PERSON_precision": 0.8414634146341463, "eval_PERSON_recall": 0.92, "eval_QUANTITY_f1": 0.7105263157894738, "eval_QUANTITY_number": 33, "eval_QUANTITY_precision": 0.627906976744186, "eval_QUANTITY_recall": 0.8181818181818182, "eval_TIME_f1": 0.8125000000000001, "eval_TIME_number": 28, "eval_TIME_precision": 0.7222222222222222, "eval_TIME_recall": 0.9285714285714286, "eval_loss": 0.15240532159805298, "eval_overall_accuracy": 0.9493210475266731, "eval_overall_f1": 0.7902187902187902, "eval_overall_precision": 0.713953488372093, "eval_overall_recall": 0.8847262247838616, "eval_runtime": 0.3875, "eval_samples_per_second": 482.64, "eval_steps_per_second": 7.743, "step": 1272 }, { "epoch": 13.0, "grad_norm": 0.8599780797958374, "learning_rate": 4.35e-05, "loss": 0.1051, "step": 1378 }, { "epoch": 13.0, "eval_LOCATION_f1": 0.8, "eval_LOCATION_number": 71, "eval_LOCATION_precision": 0.759493670886076, "eval_LOCATION_recall": 0.8450704225352113, "eval_ORGANIZATION_f1": 0.7307692307692307, "eval_ORGANIZATION_number": 65, "eval_ORGANIZATION_precision": 0.6263736263736264, "eval_ORGANIZATION_recall": 0.8769230769230769, "eval_PERSON_f1": 0.8717948717948718, "eval_PERSON_number": 150, "eval_PERSON_precision": 0.8395061728395061, "eval_PERSON_recall": 0.9066666666666666, "eval_QUANTITY_f1": 0.7297297297297297, "eval_QUANTITY_number": 33, "eval_QUANTITY_precision": 0.6585365853658537, "eval_QUANTITY_recall": 0.8181818181818182, "eval_TIME_f1": 0.9090909090909091, "eval_TIME_number": 28, "eval_TIME_precision": 0.9259259259259259, "eval_TIME_recall": 0.8928571428571429, "eval_loss": 0.1298385113477707, "eval_overall_accuracy": 0.9573229873908826, "eval_overall_f1": 0.8165997322623828, "eval_overall_precision": 0.7625, "eval_overall_recall": 0.8789625360230547, "eval_runtime": 0.3865, "eval_samples_per_second": 483.863, "eval_steps_per_second": 7.763, "step": 1378 }, { "epoch": 14.0, "grad_norm": 1.4172143936157227, "learning_rate": 4.3e-05, "loss": 0.1071, "step": 1484 }, { "epoch": 14.0, "eval_LOCATION_f1": 0.8051948051948051, "eval_LOCATION_number": 71, "eval_LOCATION_precision": 0.7469879518072289, "eval_LOCATION_recall": 0.8732394366197183, "eval_ORGANIZATION_f1": 0.7346938775510204, "eval_ORGANIZATION_number": 65, "eval_ORGANIZATION_precision": 0.6585365853658537, "eval_ORGANIZATION_recall": 0.8307692307692308, "eval_PERSON_f1": 0.858974358974359, "eval_PERSON_number": 150, "eval_PERSON_precision": 0.8271604938271605, "eval_PERSON_recall": 0.8933333333333333, "eval_QUANTITY_f1": 0.7012987012987013, "eval_QUANTITY_number": 33, "eval_QUANTITY_precision": 0.6136363636363636, "eval_QUANTITY_recall": 0.8181818181818182, "eval_TIME_f1": 0.75, "eval_TIME_number": 28, "eval_TIME_precision": 0.6666666666666666, "eval_TIME_recall": 0.8571428571428571, "eval_loss": 0.13883614540100098, "eval_overall_accuracy": 0.9524733268671193, "eval_overall_f1": 0.7984084880636606, "eval_overall_precision": 0.7395577395577395, "eval_overall_recall": 0.8674351585014409, "eval_runtime": 0.3852, "eval_samples_per_second": 485.493, "eval_steps_per_second": 7.789, "step": 1484 }, { "epoch": 15.0, "grad_norm": 1.1519190073013306, "learning_rate": 4.25e-05, "loss": 0.1001, "step": 1590 }, { "epoch": 15.0, "eval_LOCATION_f1": 0.7948717948717949, "eval_LOCATION_number": 71, "eval_LOCATION_precision": 0.7294117647058823, "eval_LOCATION_recall": 0.8732394366197183, "eval_ORGANIZATION_f1": 0.7261146496815286, "eval_ORGANIZATION_number": 65, "eval_ORGANIZATION_precision": 0.6195652173913043, "eval_ORGANIZATION_recall": 0.8769230769230769, "eval_PERSON_f1": 0.887459807073955, "eval_PERSON_number": 150, "eval_PERSON_precision": 0.8571428571428571, "eval_PERSON_recall": 0.92, "eval_QUANTITY_f1": 0.7397260273972603, "eval_QUANTITY_number": 33, "eval_QUANTITY_precision": 0.675, "eval_QUANTITY_recall": 0.8181818181818182, "eval_TIME_f1": 0.819672131147541, "eval_TIME_number": 28, "eval_TIME_precision": 0.7575757575757576, "eval_TIME_recall": 0.8928571428571429, "eval_loss": 0.14001114666461945, "eval_overall_accuracy": 0.9556256062075654, "eval_overall_f1": 0.8153034300791556, "eval_overall_precision": 0.7518248175182481, "eval_overall_recall": 0.8904899135446686, "eval_runtime": 0.3876, "eval_samples_per_second": 482.483, "eval_steps_per_second": 7.74, "step": 1590 }, { "epoch": 16.0, "grad_norm": 1.1742072105407715, "learning_rate": 4.2e-05, "loss": 0.0955, "step": 1696 }, { "epoch": 16.0, "eval_LOCATION_f1": 0.8025477707006369, "eval_LOCATION_number": 71, "eval_LOCATION_precision": 0.7325581395348837, "eval_LOCATION_recall": 0.8873239436619719, "eval_ORGANIZATION_f1": 0.7080745341614907, "eval_ORGANIZATION_number": 65, "eval_ORGANIZATION_precision": 0.59375, "eval_ORGANIZATION_recall": 0.8769230769230769, "eval_PERSON_f1": 0.8903225806451613, "eval_PERSON_number": 150, "eval_PERSON_precision": 0.8625, "eval_PERSON_recall": 0.92, "eval_QUANTITY_f1": 0.6753246753246752, "eval_QUANTITY_number": 33, "eval_QUANTITY_precision": 0.5909090909090909, "eval_QUANTITY_recall": 0.7878787878787878, "eval_TIME_f1": 0.8135593220338982, "eval_TIME_number": 28, "eval_TIME_precision": 0.7741935483870968, "eval_TIME_recall": 0.8571428571428571, "eval_loss": 0.14204736053943634, "eval_overall_accuracy": 0.9541707080504365, "eval_overall_f1": 0.806282722513089, "eval_overall_precision": 0.7386091127098321, "eval_overall_recall": 0.8876080691642652, "eval_runtime": 0.386, "eval_samples_per_second": 484.409, "eval_steps_per_second": 7.771, "step": 1696 }, { "epoch": 17.0, "grad_norm": 1.7436004877090454, "learning_rate": 4.15e-05, "loss": 0.0905, "step": 1802 }, { "epoch": 17.0, "eval_LOCATION_f1": 0.7919463087248323, "eval_LOCATION_number": 71, "eval_LOCATION_precision": 0.7564102564102564, "eval_LOCATION_recall": 0.8309859154929577, "eval_ORGANIZATION_f1": 0.7417218543046358, "eval_ORGANIZATION_number": 65, "eval_ORGANIZATION_precision": 0.6511627906976745, "eval_ORGANIZATION_recall": 0.8615384615384616, "eval_PERSON_f1": 0.8745980707395499, "eval_PERSON_number": 150, "eval_PERSON_precision": 0.84472049689441, "eval_PERSON_recall": 0.9066666666666666, "eval_QUANTITY_f1": 0.7105263157894738, "eval_QUANTITY_number": 33, "eval_QUANTITY_precision": 0.627906976744186, "eval_QUANTITY_recall": 0.8181818181818182, "eval_TIME_f1": 0.7936507936507937, "eval_TIME_number": 28, "eval_TIME_precision": 0.7142857142857143, "eval_TIME_recall": 0.8928571428571429, "eval_loss": 0.1411171555519104, "eval_overall_accuracy": 0.9565955383123181, "eval_overall_f1": 0.808, "eval_overall_precision": 0.7518610421836228, "eval_overall_recall": 0.8731988472622478, "eval_runtime": 0.3848, "eval_samples_per_second": 485.975, "eval_steps_per_second": 7.796, "step": 1802 }, { "epoch": 18.0, "grad_norm": 0.690143346786499, "learning_rate": 4.1e-05, "loss": 0.0882, "step": 1908 }, { "epoch": 18.0, "eval_LOCATION_f1": 0.8, "eval_LOCATION_number": 71, "eval_LOCATION_precision": 0.759493670886076, "eval_LOCATION_recall": 0.8450704225352113, "eval_ORGANIZATION_f1": 0.7006369426751592, "eval_ORGANIZATION_number": 65, "eval_ORGANIZATION_precision": 0.5978260869565217, "eval_ORGANIZATION_recall": 0.8461538461538461, "eval_PERSON_f1": 0.8903225806451613, "eval_PERSON_number": 150, "eval_PERSON_precision": 0.8625, "eval_PERSON_recall": 0.92, "eval_QUANTITY_f1": 0.6315789473684211, "eval_QUANTITY_number": 33, "eval_QUANTITY_precision": 0.5581395348837209, "eval_QUANTITY_recall": 0.7272727272727273, "eval_TIME_f1": 0.8474576271186439, "eval_TIME_number": 28, "eval_TIME_precision": 0.8064516129032258, "eval_TIME_recall": 0.8928571428571429, "eval_loss": 0.14777430891990662, "eval_overall_accuracy": 0.9536857419980601, "eval_overall_f1": 0.8031914893617021, "eval_overall_precision": 0.745679012345679, "eval_overall_recall": 0.8703170028818443, "eval_runtime": 0.3874, "eval_samples_per_second": 482.737, "eval_steps_per_second": 7.744, "step": 1908 }, { "epoch": 19.0, "grad_norm": 0.7800413370132446, "learning_rate": 4.05e-05, "loss": 0.0867, "step": 2014 }, { "epoch": 19.0, "eval_LOCATION_f1": 0.7755102040816326, "eval_LOCATION_number": 71, "eval_LOCATION_precision": 0.75, "eval_LOCATION_recall": 0.8028169014084507, "eval_ORGANIZATION_f1": 0.7272727272727272, "eval_ORGANIZATION_number": 65, "eval_ORGANIZATION_precision": 0.6666666666666666, "eval_ORGANIZATION_recall": 0.8, "eval_PERSON_f1": 0.8774193548387097, "eval_PERSON_number": 150, "eval_PERSON_precision": 0.85, "eval_PERSON_recall": 0.9066666666666666, "eval_QUANTITY_f1": 0.7027027027027027, "eval_QUANTITY_number": 33, "eval_QUANTITY_precision": 0.6341463414634146, "eval_QUANTITY_recall": 0.7878787878787878, "eval_TIME_f1": 0.8135593220338982, "eval_TIME_number": 28, "eval_TIME_precision": 0.7741935483870968, "eval_TIME_recall": 0.8571428571428571, "eval_loss": 0.1365654617547989, "eval_overall_accuracy": 0.9580504364694471, "eval_overall_f1": 0.8049113233287859, "eval_overall_precision": 0.7642487046632125, "eval_overall_recall": 0.8501440922190202, "eval_runtime": 0.3834, "eval_samples_per_second": 487.731, "eval_steps_per_second": 7.825, "step": 2014 }, { "epoch": 20.0, "grad_norm": 1.5175530910491943, "learning_rate": 4e-05, "loss": 0.083, "step": 2120 }, { "epoch": 20.0, "eval_LOCATION_f1": 0.8053691275167785, "eval_LOCATION_number": 71, "eval_LOCATION_precision": 0.7692307692307693, "eval_LOCATION_recall": 0.8450704225352113, "eval_ORGANIZATION_f1": 0.7096774193548387, "eval_ORGANIZATION_number": 65, "eval_ORGANIZATION_precision": 0.6111111111111112, "eval_ORGANIZATION_recall": 0.8461538461538461, "eval_PERSON_f1": 0.8766233766233766, "eval_PERSON_number": 150, "eval_PERSON_precision": 0.8544303797468354, "eval_PERSON_recall": 0.9, "eval_QUANTITY_f1": 0.732394366197183, "eval_QUANTITY_number": 33, "eval_QUANTITY_precision": 0.6842105263157895, "eval_QUANTITY_recall": 0.7878787878787878, "eval_TIME_f1": 0.8771929824561403, "eval_TIME_number": 28, "eval_TIME_precision": 0.8620689655172413, "eval_TIME_recall": 0.8928571428571429, "eval_loss": 0.14018449187278748, "eval_overall_accuracy": 0.957807953443259, "eval_overall_f1": 0.8135135135135135, "eval_overall_precision": 0.7659033078880407, "eval_overall_recall": 0.8674351585014409, "eval_runtime": 0.3864, "eval_samples_per_second": 483.986, "eval_steps_per_second": 7.764, "step": 2120 }, { "epoch": 21.0, "grad_norm": 0.6179842352867126, "learning_rate": 3.9500000000000005e-05, "loss": 0.0818, "step": 2226 }, { "epoch": 21.0, "eval_LOCATION_f1": 0.8026315789473684, "eval_LOCATION_number": 71, "eval_LOCATION_precision": 0.7530864197530864, "eval_LOCATION_recall": 0.8591549295774648, "eval_ORGANIZATION_f1": 0.6993865030674845, "eval_ORGANIZATION_number": 65, "eval_ORGANIZATION_precision": 0.5816326530612245, "eval_ORGANIZATION_recall": 0.8769230769230769, "eval_PERSON_f1": 0.9049180327868852, "eval_PERSON_number": 150, "eval_PERSON_precision": 0.8903225806451613, "eval_PERSON_recall": 0.92, "eval_QUANTITY_f1": 0.6419753086419753, "eval_QUANTITY_number": 33, "eval_QUANTITY_precision": 0.5416666666666666, "eval_QUANTITY_recall": 0.7878787878787878, "eval_TIME_f1": 0.8474576271186439, "eval_TIME_number": 28, "eval_TIME_precision": 0.8064516129032258, "eval_TIME_recall": 0.8928571428571429, "eval_loss": 0.15062209963798523, "eval_overall_accuracy": 0.9524733268671193, "eval_overall_f1": 0.8078947368421052, "eval_overall_precision": 0.7433414043583535, "eval_overall_recall": 0.8847262247838616, "eval_runtime": 0.3872, "eval_samples_per_second": 482.978, "eval_steps_per_second": 7.748, "step": 2226 }, { "epoch": 22.0, "grad_norm": 0.7422575354576111, "learning_rate": 3.9000000000000006e-05, "loss": 0.0824, "step": 2332 }, { "epoch": 22.0, "eval_LOCATION_f1": 0.8129032258064516, "eval_LOCATION_number": 71, "eval_LOCATION_precision": 0.75, "eval_LOCATION_recall": 0.8873239436619719, "eval_ORGANIZATION_f1": 0.7006369426751592, "eval_ORGANIZATION_number": 65, "eval_ORGANIZATION_precision": 0.5978260869565217, "eval_ORGANIZATION_recall": 0.8461538461538461, "eval_PERSON_f1": 0.8580441640378549, "eval_PERSON_number": 150, "eval_PERSON_precision": 0.8143712574850299, "eval_PERSON_recall": 0.9066666666666666, "eval_QUANTITY_f1": 0.7105263157894738, "eval_QUANTITY_number": 33, "eval_QUANTITY_precision": 0.627906976744186, "eval_QUANTITY_recall": 0.8181818181818182, "eval_TIME_f1": 0.8474576271186439, "eval_TIME_number": 28, "eval_TIME_precision": 0.8064516129032258, "eval_TIME_recall": 0.8928571428571429, "eval_loss": 0.14866971969604492, "eval_overall_accuracy": 0.9546556741028128, "eval_overall_f1": 0.8010471204188482, "eval_overall_precision": 0.7338129496402878, "eval_overall_recall": 0.8818443804034583, "eval_runtime": 0.386, "eval_samples_per_second": 484.457, "eval_steps_per_second": 7.772, "step": 2332 }, { "epoch": 23.0, "grad_norm": 0.7634256482124329, "learning_rate": 3.85e-05, "loss": 0.076, "step": 2438 }, { "epoch": 23.0, "eval_LOCATION_f1": 0.8053691275167785, "eval_LOCATION_number": 71, "eval_LOCATION_precision": 0.7692307692307693, "eval_LOCATION_recall": 0.8450704225352113, "eval_ORGANIZATION_f1": 0.7225806451612903, "eval_ORGANIZATION_number": 65, "eval_ORGANIZATION_precision": 0.6222222222222222, "eval_ORGANIZATION_recall": 0.8615384615384616, "eval_PERSON_f1": 0.8823529411764707, "eval_PERSON_number": 150, "eval_PERSON_precision": 0.8653846153846154, "eval_PERSON_recall": 0.9, "eval_QUANTITY_f1": 0.7500000000000001, "eval_QUANTITY_number": 33, "eval_QUANTITY_precision": 0.6923076923076923, "eval_QUANTITY_recall": 0.8181818181818182, "eval_TIME_f1": 0.888888888888889, "eval_TIME_number": 28, "eval_TIME_precision": 0.9230769230769231, "eval_TIME_recall": 0.8571428571428571, "eval_loss": 0.13874635100364685, "eval_overall_accuracy": 0.9580504364694471, "eval_overall_f1": 0.8206521739130433, "eval_overall_precision": 0.7763496143958869, "eval_overall_recall": 0.8703170028818443, "eval_runtime": 0.3888, "eval_samples_per_second": 481.009, "eval_steps_per_second": 7.717, "step": 2438 }, { "epoch": 24.0, "grad_norm": 0.7481046915054321, "learning_rate": 3.8e-05, "loss": 0.0745, "step": 2544 }, { "epoch": 24.0, "eval_LOCATION_f1": 0.8129032258064516, "eval_LOCATION_number": 71, "eval_LOCATION_precision": 0.75, "eval_LOCATION_recall": 0.8873239436619719, "eval_ORGANIZATION_f1": 0.7215189873417722, "eval_ORGANIZATION_number": 65, "eval_ORGANIZATION_precision": 0.6129032258064516, "eval_ORGANIZATION_recall": 0.8769230769230769, "eval_PERSON_f1": 0.8938906752411575, "eval_PERSON_number": 150, "eval_PERSON_precision": 0.8633540372670807, "eval_PERSON_recall": 0.9266666666666666, "eval_QUANTITY_f1": 0.7027027027027027, "eval_QUANTITY_number": 33, "eval_QUANTITY_precision": 0.6341463414634146, "eval_QUANTITY_recall": 0.7878787878787878, "eval_TIME_f1": 0.8813559322033899, "eval_TIME_number": 28, "eval_TIME_precision": 0.8387096774193549, "eval_TIME_recall": 0.9285714285714286, "eval_loss": 0.14388589560985565, "eval_overall_accuracy": 0.9580504364694471, "eval_overall_f1": 0.821664464993395, "eval_overall_precision": 0.7585365853658537, "eval_overall_recall": 0.8962536023054755, "eval_runtime": 0.3892, "eval_samples_per_second": 480.505, "eval_steps_per_second": 7.709, "step": 2544 }, { "epoch": 25.0, "grad_norm": 0.7572817206382751, "learning_rate": 3.7500000000000003e-05, "loss": 0.0731, "step": 2650 }, { "epoch": 25.0, "eval_LOCATION_f1": 0.8026315789473684, "eval_LOCATION_number": 71, "eval_LOCATION_precision": 0.7530864197530864, "eval_LOCATION_recall": 0.8591549295774648, "eval_ORGANIZATION_f1": 0.7169811320754718, "eval_ORGANIZATION_number": 65, "eval_ORGANIZATION_precision": 0.6063829787234043, "eval_ORGANIZATION_recall": 0.8769230769230769, "eval_PERSON_f1": 0.90032154340836, "eval_PERSON_number": 150, "eval_PERSON_precision": 0.8695652173913043, "eval_PERSON_recall": 0.9333333333333333, "eval_QUANTITY_f1": 0.7200000000000001, "eval_QUANTITY_number": 33, "eval_QUANTITY_precision": 0.6428571428571429, "eval_QUANTITY_recall": 0.8181818181818182, "eval_TIME_f1": 0.8771929824561403, "eval_TIME_number": 28, "eval_TIME_precision": 0.8620689655172413, "eval_TIME_recall": 0.8928571428571429, "eval_loss": 0.1537763774394989, "eval_overall_accuracy": 0.9570805043646945, "eval_overall_f1": 0.8222811671087533, "eval_overall_precision": 0.7616707616707616, "eval_overall_recall": 0.8933717579250721, "eval_runtime": 0.3889, "eval_samples_per_second": 480.849, "eval_steps_per_second": 7.714, "step": 2650 }, { "epoch": 26.0, "grad_norm": 0.5087524652481079, "learning_rate": 3.7e-05, "loss": 0.0713, "step": 2756 }, { "epoch": 26.0, "eval_LOCATION_f1": 0.8076923076923077, "eval_LOCATION_number": 71, "eval_LOCATION_precision": 0.7411764705882353, "eval_LOCATION_recall": 0.8873239436619719, "eval_ORGANIZATION_f1": 0.7482993197278912, "eval_ORGANIZATION_number": 65, "eval_ORGANIZATION_precision": 0.6707317073170732, "eval_ORGANIZATION_recall": 0.8461538461538461, "eval_PERSON_f1": 0.8838709677419355, "eval_PERSON_number": 150, "eval_PERSON_precision": 0.85625, "eval_PERSON_recall": 0.9133333333333333, "eval_QUANTITY_f1": 0.6493506493506495, "eval_QUANTITY_number": 33, "eval_QUANTITY_precision": 0.5681818181818182, "eval_QUANTITY_recall": 0.7575757575757576, "eval_TIME_f1": 0.8474576271186439, "eval_TIME_number": 28, "eval_TIME_precision": 0.8064516129032258, "eval_TIME_recall": 0.8928571428571429, "eval_loss": 0.14748218655586243, "eval_overall_accuracy": 0.9568380213385063, "eval_overall_f1": 0.8144192256341789, "eval_overall_precision": 0.7587064676616916, "eval_overall_recall": 0.8789625360230547, "eval_runtime": 0.388, "eval_samples_per_second": 481.928, "eval_steps_per_second": 7.731, "step": 2756 }, { "epoch": 27.0, "grad_norm": 1.3006908893585205, "learning_rate": 3.65e-05, "loss": 0.0712, "step": 2862 }, { "epoch": 27.0, "eval_LOCATION_f1": 0.7712418300653594, "eval_LOCATION_number": 71, "eval_LOCATION_precision": 0.7195121951219512, "eval_LOCATION_recall": 0.8309859154929577, "eval_ORGANIZATION_f1": 0.7421383647798743, "eval_ORGANIZATION_number": 65, "eval_ORGANIZATION_precision": 0.6276595744680851, "eval_ORGANIZATION_recall": 0.9076923076923077, "eval_PERSON_f1": 0.8789808917197452, "eval_PERSON_number": 150, "eval_PERSON_precision": 0.8414634146341463, "eval_PERSON_recall": 0.92, "eval_QUANTITY_f1": 0.6666666666666666, "eval_QUANTITY_number": 33, "eval_QUANTITY_precision": 0.5777777777777777, "eval_QUANTITY_recall": 0.7878787878787878, "eval_TIME_f1": 0.9090909090909091, "eval_TIME_number": 28, "eval_TIME_precision": 0.9259259259259259, "eval_TIME_recall": 0.8928571428571429, "eval_loss": 0.1678486168384552, "eval_overall_accuracy": 0.9517458777885548, "eval_overall_f1": 0.8089591567852438, "eval_overall_precision": 0.7451456310679612, "eval_overall_recall": 0.8847262247838616, "eval_runtime": 0.3877, "eval_samples_per_second": 482.392, "eval_steps_per_second": 7.739, "step": 2862 }, { "epoch": 28.0, "grad_norm": 0.8932152986526489, "learning_rate": 3.6e-05, "loss": 0.07, "step": 2968 }, { "epoch": 28.0, "eval_LOCATION_f1": 0.8, "eval_LOCATION_number": 71, "eval_LOCATION_precision": 0.759493670886076, "eval_LOCATION_recall": 0.8450704225352113, "eval_ORGANIZATION_f1": 0.7532467532467532, "eval_ORGANIZATION_number": 65, "eval_ORGANIZATION_precision": 0.651685393258427, "eval_ORGANIZATION_recall": 0.8923076923076924, "eval_PERSON_f1": 0.8774193548387097, "eval_PERSON_number": 150, "eval_PERSON_precision": 0.85, "eval_PERSON_recall": 0.9066666666666666, "eval_QUANTITY_f1": 0.6486486486486487, "eval_QUANTITY_number": 33, "eval_QUANTITY_precision": 0.5853658536585366, "eval_QUANTITY_recall": 0.7272727272727273, "eval_TIME_f1": 0.8928571428571429, "eval_TIME_number": 28, "eval_TIME_precision": 0.8928571428571429, "eval_TIME_recall": 0.8928571428571429, "eval_loss": 0.15593300759792328, "eval_overall_accuracy": 0.9544131910766246, "eval_overall_f1": 0.814516129032258, "eval_overall_precision": 0.7632241813602015, "eval_overall_recall": 0.8731988472622478, "eval_runtime": 0.3833, "eval_samples_per_second": 487.841, "eval_steps_per_second": 7.826, "step": 2968 }, { "epoch": 29.0, "grad_norm": 0.7077963948249817, "learning_rate": 3.55e-05, "loss": 0.0687, "step": 3074 }, { "epoch": 29.0, "eval_LOCATION_f1": 0.802721088435374, "eval_LOCATION_number": 71, "eval_LOCATION_precision": 0.7763157894736842, "eval_LOCATION_recall": 0.8309859154929577, "eval_ORGANIZATION_f1": 0.728395061728395, "eval_ORGANIZATION_number": 65, "eval_ORGANIZATION_precision": 0.6082474226804123, "eval_ORGANIZATION_recall": 0.9076923076923077, "eval_PERSON_f1": 0.8737864077669903, "eval_PERSON_number": 150, "eval_PERSON_precision": 0.8490566037735849, "eval_PERSON_recall": 0.9, "eval_QUANTITY_f1": 0.732394366197183, "eval_QUANTITY_number": 33, "eval_QUANTITY_precision": 0.6842105263157895, "eval_QUANTITY_recall": 0.7878787878787878, "eval_TIME_f1": 0.8524590163934426, "eval_TIME_number": 28, "eval_TIME_precision": 0.7878787878787878, "eval_TIME_recall": 0.9285714285714286, "eval_loss": 0.14312958717346191, "eval_overall_accuracy": 0.9582929194956353, "eval_overall_f1": 0.8133333333333335, "eval_overall_precision": 0.7568238213399504, "eval_overall_recall": 0.8789625360230547, "eval_runtime": 0.386, "eval_samples_per_second": 484.405, "eval_steps_per_second": 7.771, "step": 3074 }, { "epoch": 30.0, "grad_norm": 0.8946846723556519, "learning_rate": 3.5e-05, "loss": 0.0665, "step": 3180 }, { "epoch": 30.0, "eval_LOCATION_f1": 0.8053691275167785, "eval_LOCATION_number": 71, "eval_LOCATION_precision": 0.7692307692307693, "eval_LOCATION_recall": 0.8450704225352113, "eval_ORGANIZATION_f1": 0.7662337662337663, "eval_ORGANIZATION_number": 65, "eval_ORGANIZATION_precision": 0.6629213483146067, "eval_ORGANIZATION_recall": 0.9076923076923077, "eval_PERSON_f1": 0.8838709677419355, "eval_PERSON_number": 150, "eval_PERSON_precision": 0.85625, "eval_PERSON_recall": 0.9133333333333333, "eval_QUANTITY_f1": 0.7605633802816901, "eval_QUANTITY_number": 33, "eval_QUANTITY_precision": 0.7105263157894737, "eval_QUANTITY_recall": 0.8181818181818182, "eval_TIME_f1": 0.8620689655172413, "eval_TIME_number": 28, "eval_TIME_precision": 0.8333333333333334, "eval_TIME_recall": 0.8928571428571429, "eval_loss": 0.1464053988456726, "eval_overall_accuracy": 0.9595053346265762, "eval_overall_f1": 0.830188679245283, "eval_overall_precision": 0.779746835443038, "eval_overall_recall": 0.8876080691642652, "eval_runtime": 0.3875, "eval_samples_per_second": 482.538, "eval_steps_per_second": 7.741, "step": 3180 }, { "epoch": 31.0, "grad_norm": 0.43450927734375, "learning_rate": 3.45e-05, "loss": 0.0634, "step": 3286 }, { "epoch": 31.0, "eval_LOCATION_f1": 0.8051948051948051, "eval_LOCATION_number": 71, "eval_LOCATION_precision": 0.7469879518072289, "eval_LOCATION_recall": 0.8732394366197183, "eval_ORGANIZATION_f1": 0.7733333333333334, "eval_ORGANIZATION_number": 65, "eval_ORGANIZATION_precision": 0.6823529411764706, "eval_ORGANIZATION_recall": 0.8923076923076924, "eval_PERSON_f1": 0.888888888888889, "eval_PERSON_number": 150, "eval_PERSON_precision": 0.8484848484848485, "eval_PERSON_recall": 0.9333333333333333, "eval_QUANTITY_f1": 0.7222222222222221, "eval_QUANTITY_number": 33, "eval_QUANTITY_precision": 0.6666666666666666, "eval_QUANTITY_recall": 0.7878787878787878, "eval_TIME_f1": 0.8813559322033899, "eval_TIME_number": 28, "eval_TIME_precision": 0.8387096774193549, "eval_TIME_recall": 0.9285714285714286, "eval_loss": 0.15990784764289856, "eval_overall_accuracy": 0.9568380213385063, "eval_overall_f1": 0.8320000000000001, "eval_overall_precision": 0.7741935483870968, "eval_overall_recall": 0.899135446685879, "eval_runtime": 0.3886, "eval_samples_per_second": 481.212, "eval_steps_per_second": 7.72, "step": 3286 }, { "epoch": 32.0, "grad_norm": 0.4396691620349884, "learning_rate": 3.4000000000000007e-05, "loss": 0.0602, "step": 3392 }, { "epoch": 32.0, "eval_LOCATION_f1": 0.7741935483870968, "eval_LOCATION_number": 71, "eval_LOCATION_precision": 0.7142857142857143, "eval_LOCATION_recall": 0.8450704225352113, "eval_ORGANIZATION_f1": 0.7388535031847134, "eval_ORGANIZATION_number": 65, "eval_ORGANIZATION_precision": 0.6304347826086957, "eval_ORGANIZATION_recall": 0.8923076923076924, "eval_PERSON_f1": 0.8910256410256411, "eval_PERSON_number": 150, "eval_PERSON_precision": 0.8580246913580247, "eval_PERSON_recall": 0.9266666666666666, "eval_QUANTITY_f1": 0.6666666666666667, "eval_QUANTITY_number": 33, "eval_QUANTITY_precision": 0.5952380952380952, "eval_QUANTITY_recall": 0.7575757575757576, "eval_TIME_f1": 0.8666666666666666, "eval_TIME_number": 28, "eval_TIME_precision": 0.8125, "eval_TIME_recall": 0.9285714285714286, "eval_loss": 0.17173334956169128, "eval_overall_accuracy": 0.9529582929194956, "eval_overall_f1": 0.8115942028985507, "eval_overall_precision": 0.7475728155339806, "eval_overall_recall": 0.8876080691642652, "eval_runtime": 0.3884, "eval_samples_per_second": 481.497, "eval_steps_per_second": 7.725, "step": 3392 }, { "epoch": 33.0, "grad_norm": 0.7759618163108826, "learning_rate": 3.35e-05, "loss": 0.0633, "step": 3498 }, { "epoch": 33.0, "eval_LOCATION_f1": 0.7866666666666666, "eval_LOCATION_number": 71, "eval_LOCATION_precision": 0.7468354430379747, "eval_LOCATION_recall": 0.8309859154929577, "eval_ORGANIZATION_f1": 0.7534246575342466, "eval_ORGANIZATION_number": 65, "eval_ORGANIZATION_precision": 0.6790123456790124, "eval_ORGANIZATION_recall": 0.8461538461538461, "eval_PERSON_f1": 0.8903225806451613, "eval_PERSON_number": 150, "eval_PERSON_precision": 0.8625, "eval_PERSON_recall": 0.92, "eval_QUANTITY_f1": 0.7222222222222221, "eval_QUANTITY_number": 33, "eval_QUANTITY_precision": 0.6666666666666666, "eval_QUANTITY_recall": 0.7878787878787878, "eval_TIME_f1": 0.8571428571428571, "eval_TIME_number": 28, "eval_TIME_precision": 0.8571428571428571, "eval_TIME_recall": 0.8571428571428571, "eval_loss": 0.1525535136461258, "eval_overall_accuracy": 0.9556256062075654, "eval_overall_f1": 0.8228882833787465, "eval_overall_precision": 0.7803617571059431, "eval_overall_recall": 0.8703170028818443, "eval_runtime": 0.3944, "eval_samples_per_second": 474.17, "eval_steps_per_second": 7.607, "step": 3498 }, { "epoch": 34.0, "grad_norm": 1.0217112302780151, "learning_rate": 3.3e-05, "loss": 0.0596, "step": 3604 }, { "epoch": 34.0, "eval_LOCATION_f1": 0.8051948051948051, "eval_LOCATION_number": 71, "eval_LOCATION_precision": 0.7469879518072289, "eval_LOCATION_recall": 0.8732394366197183, "eval_ORGANIZATION_f1": 0.7261146496815286, "eval_ORGANIZATION_number": 65, "eval_ORGANIZATION_precision": 0.6195652173913043, "eval_ORGANIZATION_recall": 0.8769230769230769, "eval_PERSON_f1": 0.8910256410256411, "eval_PERSON_number": 150, "eval_PERSON_precision": 0.8580246913580247, "eval_PERSON_recall": 0.9266666666666666, "eval_QUANTITY_f1": 0.7123287671232875, "eval_QUANTITY_number": 33, "eval_QUANTITY_precision": 0.65, "eval_QUANTITY_recall": 0.7878787878787878, "eval_TIME_f1": 0.8070175438596492, "eval_TIME_number": 28, "eval_TIME_precision": 0.7931034482758621, "eval_TIME_recall": 0.8214285714285714, "eval_loss": 0.15602585673332214, "eval_overall_accuracy": 0.95635305528613, "eval_overall_f1": 0.8154050464807437, "eval_overall_precision": 0.7561576354679803, "eval_overall_recall": 0.8847262247838616, "eval_runtime": 0.3873, "eval_samples_per_second": 482.884, "eval_steps_per_second": 7.747, "step": 3604 }, { "epoch": 35.0, "grad_norm": 0.47391146421432495, "learning_rate": 3.2500000000000004e-05, "loss": 0.0591, "step": 3710 }, { "epoch": 35.0, "eval_LOCATION_f1": 0.8051948051948051, "eval_LOCATION_number": 71, "eval_LOCATION_precision": 0.7469879518072289, "eval_LOCATION_recall": 0.8732394366197183, "eval_ORGANIZATION_f1": 0.7261146496815286, "eval_ORGANIZATION_number": 65, "eval_ORGANIZATION_precision": 0.6195652173913043, "eval_ORGANIZATION_recall": 0.8769230769230769, "eval_PERSON_f1": 0.8896103896103896, "eval_PERSON_number": 150, "eval_PERSON_precision": 0.8670886075949367, "eval_PERSON_recall": 0.9133333333333333, "eval_QUANTITY_f1": 0.7222222222222221, "eval_QUANTITY_number": 33, "eval_QUANTITY_precision": 0.6666666666666666, "eval_QUANTITY_recall": 0.7878787878787878, "eval_TIME_f1": 0.8474576271186439, "eval_TIME_number": 28, "eval_TIME_precision": 0.8064516129032258, "eval_TIME_recall": 0.8928571428571429, "eval_loss": 0.1562255322933197, "eval_overall_accuracy": 0.9556256062075654, "eval_overall_f1": 0.8186666666666667, "eval_overall_precision": 0.7617866004962779, "eval_overall_recall": 0.8847262247838616, "eval_runtime": 0.3866, "eval_samples_per_second": 483.752, "eval_steps_per_second": 7.761, "step": 3710 }, { "epoch": 36.0, "grad_norm": 1.473497748374939, "learning_rate": 3.2000000000000005e-05, "loss": 0.0582, "step": 3816 }, { "epoch": 36.0, "eval_LOCATION_f1": 0.7948717948717949, "eval_LOCATION_number": 71, "eval_LOCATION_precision": 0.7294117647058823, "eval_LOCATION_recall": 0.8732394366197183, "eval_ORGANIZATION_f1": 0.7160493827160493, "eval_ORGANIZATION_number": 65, "eval_ORGANIZATION_precision": 0.5979381443298969, "eval_ORGANIZATION_recall": 0.8923076923076924, "eval_PERSON_f1": 0.8932038834951457, "eval_PERSON_number": 150, "eval_PERSON_precision": 0.8679245283018868, "eval_PERSON_recall": 0.92, "eval_QUANTITY_f1": 0.7200000000000001, "eval_QUANTITY_number": 33, "eval_QUANTITY_precision": 0.6428571428571429, "eval_QUANTITY_recall": 0.8181818181818182, "eval_TIME_f1": 0.896551724137931, "eval_TIME_number": 28, "eval_TIME_precision": 0.8666666666666667, "eval_TIME_recall": 0.9285714285714286, "eval_loss": 0.1698862910270691, "eval_overall_accuracy": 0.9524733268671193, "eval_overall_f1": 0.8184210526315788, "eval_overall_precision": 0.7530266343825666, "eval_overall_recall": 0.8962536023054755, "eval_runtime": 0.3877, "eval_samples_per_second": 482.343, "eval_steps_per_second": 7.738, "step": 3816 }, { "epoch": 37.0, "grad_norm": 0.5742448568344116, "learning_rate": 3.15e-05, "loss": 0.0567, "step": 3922 }, { "epoch": 37.0, "eval_LOCATION_f1": 0.775, "eval_LOCATION_number": 71, "eval_LOCATION_precision": 0.6966292134831461, "eval_LOCATION_recall": 0.8732394366197183, "eval_ORGANIZATION_f1": 0.7169811320754718, "eval_ORGANIZATION_number": 65, "eval_ORGANIZATION_precision": 0.6063829787234043, "eval_ORGANIZATION_recall": 0.8769230769230769, "eval_PERSON_f1": 0.8838709677419355, "eval_PERSON_number": 150, "eval_PERSON_precision": 0.85625, "eval_PERSON_recall": 0.9133333333333333, "eval_QUANTITY_f1": 0.7105263157894738, "eval_QUANTITY_number": 33, "eval_QUANTITY_precision": 0.627906976744186, "eval_QUANTITY_recall": 0.8181818181818182, "eval_TIME_f1": 0.8620689655172413, "eval_TIME_number": 28, "eval_TIME_precision": 0.8333333333333334, "eval_TIME_recall": 0.8928571428571429, "eval_loss": 0.17796191573143005, "eval_overall_accuracy": 0.9498060135790495, "eval_overall_f1": 0.8073394495412844, "eval_overall_precision": 0.7403846153846154, "eval_overall_recall": 0.8876080691642652, "eval_runtime": 0.388, "eval_samples_per_second": 481.913, "eval_steps_per_second": 7.731, "step": 3922 }, { "epoch": 38.0, "grad_norm": 0.6908618211746216, "learning_rate": 3.1e-05, "loss": 0.0568, "step": 4028 }, { "epoch": 38.0, "eval_LOCATION_f1": 0.8053691275167785, "eval_LOCATION_number": 71, "eval_LOCATION_precision": 0.7692307692307693, "eval_LOCATION_recall": 0.8450704225352113, "eval_ORGANIZATION_f1": 0.7482993197278912, "eval_ORGANIZATION_number": 65, "eval_ORGANIZATION_precision": 0.6707317073170732, "eval_ORGANIZATION_recall": 0.8461538461538461, "eval_PERSON_f1": 0.887459807073955, "eval_PERSON_number": 150, "eval_PERSON_precision": 0.8571428571428571, "eval_PERSON_recall": 0.92, "eval_QUANTITY_f1": 0.6933333333333334, "eval_QUANTITY_number": 33, "eval_QUANTITY_precision": 0.6190476190476191, "eval_QUANTITY_recall": 0.7878787878787878, "eval_TIME_f1": 0.8620689655172413, "eval_TIME_number": 28, "eval_TIME_precision": 0.8333333333333334, "eval_TIME_recall": 0.8928571428571429, "eval_loss": 0.1589268296957016, "eval_overall_accuracy": 0.9568380213385063, "eval_overall_f1": 0.8216216216216217, "eval_overall_precision": 0.7735368956743003, "eval_overall_recall": 0.8760806916426513, "eval_runtime": 0.388, "eval_samples_per_second": 481.961, "eval_steps_per_second": 7.732, "step": 4028 }, { "epoch": 39.0, "grad_norm": 0.37814459204673767, "learning_rate": 3.05e-05, "loss": 0.0553, "step": 4134 }, { "epoch": 39.0, "eval_LOCATION_f1": 0.759493670886076, "eval_LOCATION_number": 71, "eval_LOCATION_precision": 0.6896551724137931, "eval_LOCATION_recall": 0.8450704225352113, "eval_ORGANIZATION_f1": 0.7195121951219511, "eval_ORGANIZATION_number": 65, "eval_ORGANIZATION_precision": 0.5959595959595959, "eval_ORGANIZATION_recall": 0.9076923076923077, "eval_PERSON_f1": 0.8853503184713376, "eval_PERSON_number": 150, "eval_PERSON_precision": 0.8475609756097561, "eval_PERSON_recall": 0.9266666666666666, "eval_QUANTITY_f1": 0.7500000000000001, "eval_QUANTITY_number": 33, "eval_QUANTITY_precision": 0.6923076923076923, "eval_QUANTITY_recall": 0.8181818181818182, "eval_TIME_f1": 0.896551724137931, "eval_TIME_number": 28, "eval_TIME_precision": 0.8666666666666667, "eval_TIME_recall": 0.9285714285714286, "eval_loss": 0.17944246530532837, "eval_overall_accuracy": 0.9500484966052376, "eval_overall_f1": 0.8120104438642298, "eval_overall_precision": 0.7422434367541766, "eval_overall_recall": 0.8962536023054755, "eval_runtime": 0.3887, "eval_samples_per_second": 481.06, "eval_steps_per_second": 7.718, "step": 4134 }, { "epoch": 40.0, "grad_norm": 0.3985283672809601, "learning_rate": 3e-05, "loss": 0.0522, "step": 4240 }, { "epoch": 40.0, "eval_LOCATION_f1": 0.7924528301886792, "eval_LOCATION_number": 71, "eval_LOCATION_precision": 0.7159090909090909, "eval_LOCATION_recall": 0.8873239436619719, "eval_ORGANIZATION_f1": 0.7516778523489933, "eval_ORGANIZATION_number": 65, "eval_ORGANIZATION_precision": 0.6666666666666666, "eval_ORGANIZATION_recall": 0.8615384615384616, "eval_PERSON_f1": 0.8825396825396825, "eval_PERSON_number": 150, "eval_PERSON_precision": 0.8424242424242424, "eval_PERSON_recall": 0.9266666666666666, "eval_QUANTITY_f1": 0.732394366197183, "eval_QUANTITY_number": 33, "eval_QUANTITY_precision": 0.6842105263157895, "eval_QUANTITY_recall": 0.7878787878787878, "eval_TIME_f1": 0.8333333333333334, "eval_TIME_number": 28, "eval_TIME_precision": 0.78125, "eval_TIME_recall": 0.8928571428571429, "eval_loss": 0.16948159039020538, "eval_overall_accuracy": 0.9551406401551892, "eval_overall_f1": 0.8196286472148541, "eval_overall_precision": 0.7592137592137592, "eval_overall_recall": 0.8904899135446686, "eval_runtime": 0.3914, "eval_samples_per_second": 477.829, "eval_steps_per_second": 7.666, "step": 4240 }, { "epoch": 41.0, "grad_norm": 0.4095101058483124, "learning_rate": 2.95e-05, "loss": 0.0535, "step": 4346 }, { "epoch": 41.0, "eval_LOCATION_f1": 0.7922077922077921, "eval_LOCATION_number": 71, "eval_LOCATION_precision": 0.7349397590361446, "eval_LOCATION_recall": 0.8591549295774648, "eval_ORGANIZATION_f1": 0.7417218543046358, "eval_ORGANIZATION_number": 65, "eval_ORGANIZATION_precision": 0.6511627906976745, "eval_ORGANIZATION_recall": 0.8615384615384616, "eval_PERSON_f1": 0.8753993610223643, "eval_PERSON_number": 150, "eval_PERSON_precision": 0.8404907975460123, "eval_PERSON_recall": 0.9133333333333333, "eval_QUANTITY_f1": 0.6842105263157895, "eval_QUANTITY_number": 33, "eval_QUANTITY_precision": 0.6046511627906976, "eval_QUANTITY_recall": 0.7878787878787878, "eval_TIME_f1": 0.8333333333333334, "eval_TIME_number": 28, "eval_TIME_precision": 0.78125, "eval_TIME_recall": 0.8928571428571429, "eval_loss": 0.16789713501930237, "eval_overall_accuracy": 0.9517458777885548, "eval_overall_f1": 0.8090185676392573, "eval_overall_precision": 0.7493857493857494, "eval_overall_recall": 0.8789625360230547, "eval_runtime": 0.388, "eval_samples_per_second": 481.95, "eval_steps_per_second": 7.732, "step": 4346 }, { "epoch": 42.0, "grad_norm": 0.30107811093330383, "learning_rate": 2.9e-05, "loss": 0.0507, "step": 4452 }, { "epoch": 42.0, "eval_LOCATION_f1": 0.8026315789473684, "eval_LOCATION_number": 71, "eval_LOCATION_precision": 0.7530864197530864, "eval_LOCATION_recall": 0.8591549295774648, "eval_ORGANIZATION_f1": 0.7248322147651007, "eval_ORGANIZATION_number": 65, "eval_ORGANIZATION_precision": 0.6428571428571429, "eval_ORGANIZATION_recall": 0.8307692307692308, "eval_PERSON_f1": 0.8867313915857605, "eval_PERSON_number": 150, "eval_PERSON_precision": 0.8616352201257862, "eval_PERSON_recall": 0.9133333333333333, "eval_QUANTITY_f1": 0.7397260273972603, "eval_QUANTITY_number": 33, "eval_QUANTITY_precision": 0.675, "eval_QUANTITY_recall": 0.8181818181818182, "eval_TIME_f1": 0.8813559322033899, "eval_TIME_number": 28, "eval_TIME_precision": 0.8387096774193549, "eval_TIME_recall": 0.9285714285714286, "eval_loss": 0.15727120637893677, "eval_overall_accuracy": 0.9561105722599418, "eval_overall_f1": 0.8221024258760108, "eval_overall_precision": 0.7721518987341772, "eval_overall_recall": 0.8789625360230547, "eval_runtime": 0.3863, "eval_samples_per_second": 484.112, "eval_steps_per_second": 7.767, "step": 4452 }, { "epoch": 43.0, "grad_norm": 0.3901791274547577, "learning_rate": 2.8499999999999998e-05, "loss": 0.0501, "step": 4558 }, { "epoch": 43.0, "eval_LOCATION_f1": 0.7974683544303797, "eval_LOCATION_number": 71, "eval_LOCATION_precision": 0.7241379310344828, "eval_LOCATION_recall": 0.8873239436619719, "eval_ORGANIZATION_f1": 0.6967741935483871, "eval_ORGANIZATION_number": 65, "eval_ORGANIZATION_precision": 0.6, "eval_ORGANIZATION_recall": 0.8307692307692308, "eval_PERSON_f1": 0.887459807073955, "eval_PERSON_number": 150, "eval_PERSON_precision": 0.8571428571428571, "eval_PERSON_recall": 0.92, "eval_QUANTITY_f1": 0.7105263157894738, "eval_QUANTITY_number": 33, "eval_QUANTITY_precision": 0.627906976744186, "eval_QUANTITY_recall": 0.8181818181818182, "eval_TIME_f1": 0.8620689655172413, "eval_TIME_number": 28, "eval_TIME_precision": 0.8333333333333334, "eval_TIME_recall": 0.8928571428571429, "eval_loss": 0.1803949922323227, "eval_overall_accuracy": 0.9524733268671193, "eval_overall_f1": 0.8100263852242744, "eval_overall_precision": 0.7469586374695864, "eval_overall_recall": 0.8847262247838616, "eval_runtime": 0.3846, "eval_samples_per_second": 486.163, "eval_steps_per_second": 7.799, "step": 4558 }, { "epoch": 44.0, "grad_norm": 0.7794935703277588, "learning_rate": 2.8000000000000003e-05, "loss": 0.0491, "step": 4664 }, { "epoch": 44.0, "eval_LOCATION_f1": 0.7870967741935485, "eval_LOCATION_number": 71, "eval_LOCATION_precision": 0.7261904761904762, "eval_LOCATION_recall": 0.8591549295774648, "eval_ORGANIZATION_f1": 0.6918238993710691, "eval_ORGANIZATION_number": 65, "eval_ORGANIZATION_precision": 0.5851063829787234, "eval_ORGANIZATION_recall": 0.8461538461538461, "eval_PERSON_f1": 0.887459807073955, "eval_PERSON_number": 150, "eval_PERSON_precision": 0.8571428571428571, "eval_PERSON_recall": 0.92, "eval_QUANTITY_f1": 0.7500000000000001, "eval_QUANTITY_number": 33, "eval_QUANTITY_precision": 0.6923076923076923, "eval_QUANTITY_recall": 0.8181818181818182, "eval_TIME_f1": 0.8620689655172413, "eval_TIME_number": 28, "eval_TIME_precision": 0.8333333333333334, "eval_TIME_recall": 0.8928571428571429, "eval_loss": 0.1680927574634552, "eval_overall_accuracy": 0.953443258971872, "eval_overall_f1": 0.8105960264900663, "eval_overall_precision": 0.75, "eval_overall_recall": 0.8818443804034583, "eval_runtime": 0.3905, "eval_samples_per_second": 478.896, "eval_steps_per_second": 7.683, "step": 4664 }, { "epoch": 45.0, "grad_norm": 1.7887659072875977, "learning_rate": 2.7500000000000004e-05, "loss": 0.0478, "step": 4770 }, { "epoch": 45.0, "eval_LOCATION_f1": 0.8, "eval_LOCATION_number": 71, "eval_LOCATION_precision": 0.7380952380952381, "eval_LOCATION_recall": 0.8732394366197183, "eval_ORGANIZATION_f1": 0.7448275862068966, "eval_ORGANIZATION_number": 65, "eval_ORGANIZATION_precision": 0.675, "eval_ORGANIZATION_recall": 0.8307692307692308, "eval_PERSON_f1": 0.8903225806451613, "eval_PERSON_number": 150, "eval_PERSON_precision": 0.8625, "eval_PERSON_recall": 0.92, "eval_QUANTITY_f1": 0.7500000000000001, "eval_QUANTITY_number": 33, "eval_QUANTITY_precision": 0.6923076923076923, "eval_QUANTITY_recall": 0.8181818181818182, "eval_TIME_f1": 0.896551724137931, "eval_TIME_number": 28, "eval_TIME_precision": 0.8666666666666667, "eval_TIME_recall": 0.9285714285714286, "eval_loss": 0.16480599343776703, "eval_overall_accuracy": 0.957807953443259, "eval_overall_f1": 0.8297297297297298, "eval_overall_precision": 0.7811704834605598, "eval_overall_recall": 0.8847262247838616, "eval_runtime": 0.3862, "eval_samples_per_second": 484.229, "eval_steps_per_second": 7.768, "step": 4770 }, { "epoch": 46.0, "grad_norm": 0.7143243551254272, "learning_rate": 2.7000000000000002e-05, "loss": 0.0475, "step": 4876 }, { "epoch": 46.0, "eval_LOCATION_f1": 0.7898089171974522, "eval_LOCATION_number": 71, "eval_LOCATION_precision": 0.7209302325581395, "eval_LOCATION_recall": 0.8732394366197183, "eval_ORGANIZATION_f1": 0.738255033557047, "eval_ORGANIZATION_number": 65, "eval_ORGANIZATION_precision": 0.6547619047619048, "eval_ORGANIZATION_recall": 0.8461538461538461, "eval_PERSON_f1": 0.8903225806451613, "eval_PERSON_number": 150, "eval_PERSON_precision": 0.8625, "eval_PERSON_recall": 0.92, "eval_QUANTITY_f1": 0.7605633802816901, "eval_QUANTITY_number": 33, "eval_QUANTITY_precision": 0.7105263157894737, "eval_QUANTITY_recall": 0.8181818181818182, "eval_TIME_f1": 0.8666666666666666, "eval_TIME_number": 28, "eval_TIME_precision": 0.8125, "eval_TIME_recall": 0.9285714285714286, "eval_loss": 0.15505646169185638, "eval_overall_accuracy": 0.9580504364694471, "eval_overall_f1": 0.824631860776439, "eval_overall_precision": 0.77, "eval_overall_recall": 0.8876080691642652, "eval_runtime": 0.3852, "eval_samples_per_second": 485.438, "eval_steps_per_second": 7.788, "step": 4876 }, { "epoch": 47.0, "grad_norm": 0.987457811832428, "learning_rate": 2.6500000000000004e-05, "loss": 0.0462, "step": 4982 }, { "epoch": 47.0, "eval_LOCATION_f1": 0.8026315789473684, "eval_LOCATION_number": 71, "eval_LOCATION_precision": 0.7530864197530864, "eval_LOCATION_recall": 0.8591549295774648, "eval_ORGANIZATION_f1": 0.7189542483660131, "eval_ORGANIZATION_number": 65, "eval_ORGANIZATION_precision": 0.625, "eval_ORGANIZATION_recall": 0.8461538461538461, "eval_PERSON_f1": 0.8782051282051282, "eval_PERSON_number": 150, "eval_PERSON_precision": 0.845679012345679, "eval_PERSON_recall": 0.9133333333333333, "eval_QUANTITY_f1": 0.7428571428571429, "eval_QUANTITY_number": 33, "eval_QUANTITY_precision": 0.7027027027027027, "eval_QUANTITY_recall": 0.7878787878787878, "eval_TIME_f1": 0.8333333333333334, "eval_TIME_number": 28, "eval_TIME_precision": 0.78125, "eval_TIME_recall": 0.8928571428571429, "eval_loss": 0.16851799190044403, "eval_overall_accuracy": 0.954898157129001, "eval_overall_f1": 0.8139223560910308, "eval_overall_precision": 0.76, "eval_overall_recall": 0.8760806916426513, "eval_runtime": 0.3874, "eval_samples_per_second": 482.688, "eval_steps_per_second": 7.744, "step": 4982 }, { "epoch": 48.0, "grad_norm": 0.8889041543006897, "learning_rate": 2.6000000000000002e-05, "loss": 0.0467, "step": 5088 }, { "epoch": 48.0, "eval_LOCATION_f1": 0.8129032258064516, "eval_LOCATION_number": 71, "eval_LOCATION_precision": 0.75, "eval_LOCATION_recall": 0.8873239436619719, "eval_ORGANIZATION_f1": 0.7333333333333334, "eval_ORGANIZATION_number": 65, "eval_ORGANIZATION_precision": 0.6470588235294118, "eval_ORGANIZATION_recall": 0.8461538461538461, "eval_PERSON_f1": 0.8903225806451613, "eval_PERSON_number": 150, "eval_PERSON_precision": 0.8625, "eval_PERSON_recall": 0.92, "eval_QUANTITY_f1": 0.7605633802816901, "eval_QUANTITY_number": 33, "eval_QUANTITY_precision": 0.7105263157894737, "eval_QUANTITY_recall": 0.8181818181818182, "eval_TIME_f1": 0.896551724137931, "eval_TIME_number": 28, "eval_TIME_precision": 0.8666666666666667, "eval_TIME_recall": 0.9285714285714286, "eval_loss": 0.17139677703380585, "eval_overall_accuracy": 0.9573229873908826, "eval_overall_f1": 0.8306451612903226, "eval_overall_precision": 0.7783375314861462, "eval_overall_recall": 0.8904899135446686, "eval_runtime": 0.3861, "eval_samples_per_second": 484.347, "eval_steps_per_second": 7.77, "step": 5088 }, { "epoch": 49.0, "grad_norm": 0.43323248624801636, "learning_rate": 2.5500000000000003e-05, "loss": 0.0462, "step": 5194 }, { "epoch": 49.0, "eval_LOCATION_f1": 0.7973856209150327, "eval_LOCATION_number": 71, "eval_LOCATION_precision": 0.7439024390243902, "eval_LOCATION_recall": 0.8591549295774648, "eval_ORGANIZATION_f1": 0.7448275862068966, "eval_ORGANIZATION_number": 65, "eval_ORGANIZATION_precision": 0.675, "eval_ORGANIZATION_recall": 0.8307692307692308, "eval_PERSON_f1": 0.887459807073955, "eval_PERSON_number": 150, "eval_PERSON_precision": 0.8571428571428571, "eval_PERSON_recall": 0.92, "eval_QUANTITY_f1": 0.7714285714285715, "eval_QUANTITY_number": 33, "eval_QUANTITY_precision": 0.7297297297297297, "eval_QUANTITY_recall": 0.8181818181818182, "eval_TIME_f1": 0.8771929824561403, "eval_TIME_number": 28, "eval_TIME_precision": 0.8620689655172413, "eval_TIME_recall": 0.8928571428571429, "eval_loss": 0.1640593409538269, "eval_overall_accuracy": 0.9575654704170709, "eval_overall_f1": 0.8288043478260869, "eval_overall_precision": 0.7840616966580977, "eval_overall_recall": 0.8789625360230547, "eval_runtime": 0.387, "eval_samples_per_second": 483.195, "eval_steps_per_second": 7.752, "step": 5194 }, { "epoch": 50.0, "grad_norm": 1.8610317707061768, "learning_rate": 2.5e-05, "loss": 0.0467, "step": 5300 }, { "epoch": 50.0, "eval_LOCATION_f1": 0.8026315789473684, "eval_LOCATION_number": 71, "eval_LOCATION_precision": 0.7530864197530864, "eval_LOCATION_recall": 0.8591549295774648, "eval_ORGANIZATION_f1": 0.7297297297297298, "eval_ORGANIZATION_number": 65, "eval_ORGANIZATION_precision": 0.6506024096385542, "eval_ORGANIZATION_recall": 0.8307692307692308, "eval_PERSON_f1": 0.8782051282051282, "eval_PERSON_number": 150, "eval_PERSON_precision": 0.845679012345679, "eval_PERSON_recall": 0.9133333333333333, "eval_QUANTITY_f1": 0.7397260273972603, "eval_QUANTITY_number": 33, "eval_QUANTITY_precision": 0.675, "eval_QUANTITY_recall": 0.8181818181818182, "eval_TIME_f1": 0.8620689655172413, "eval_TIME_number": 28, "eval_TIME_precision": 0.8333333333333334, "eval_TIME_recall": 0.8928571428571429, "eval_loss": 0.16927781701087952, "eval_overall_accuracy": 0.9556256062075654, "eval_overall_f1": 0.8183041722745625, "eval_overall_precision": 0.7676767676767676, "eval_overall_recall": 0.8760806916426513, "eval_runtime": 0.3858, "eval_samples_per_second": 484.671, "eval_steps_per_second": 7.775, "step": 5300 }, { "epoch": 51.0, "grad_norm": 0.744925320148468, "learning_rate": 2.45e-05, "loss": 0.0437, "step": 5406 }, { "epoch": 51.0, "eval_LOCATION_f1": 0.7898089171974522, "eval_LOCATION_number": 71, "eval_LOCATION_precision": 0.7209302325581395, "eval_LOCATION_recall": 0.8732394366197183, "eval_ORGANIZATION_f1": 0.6896551724137931, "eval_ORGANIZATION_number": 65, "eval_ORGANIZATION_precision": 0.625, "eval_ORGANIZATION_recall": 0.7692307692307693, "eval_PERSON_f1": 0.8745980707395499, "eval_PERSON_number": 150, "eval_PERSON_precision": 0.84472049689441, "eval_PERSON_recall": 0.9066666666666666, "eval_QUANTITY_f1": 0.7500000000000001, "eval_QUANTITY_number": 33, "eval_QUANTITY_precision": 0.6923076923076923, "eval_QUANTITY_recall": 0.8181818181818182, "eval_TIME_f1": 0.8620689655172413, "eval_TIME_number": 28, "eval_TIME_precision": 0.8333333333333334, "eval_TIME_recall": 0.8928571428571429, "eval_loss": 0.17594219744205475, "eval_overall_accuracy": 0.9551406401551892, "eval_overall_f1": 0.8075370121130553, "eval_overall_precision": 0.7575757575757576, "eval_overall_recall": 0.8645533141210374, "eval_runtime": 0.3885, "eval_samples_per_second": 481.339, "eval_steps_per_second": 7.722, "step": 5406 }, { "epoch": 52.0, "grad_norm": 0.9806845784187317, "learning_rate": 2.4e-05, "loss": 0.0435, "step": 5512 }, { "epoch": 52.0, "eval_LOCATION_f1": 0.8025477707006369, "eval_LOCATION_number": 71, "eval_LOCATION_precision": 0.7325581395348837, "eval_LOCATION_recall": 0.8873239436619719, "eval_ORGANIZATION_f1": 0.7567567567567568, "eval_ORGANIZATION_number": 65, "eval_ORGANIZATION_precision": 0.6746987951807228, "eval_ORGANIZATION_recall": 0.8615384615384616, "eval_PERSON_f1": 0.887459807073955, "eval_PERSON_number": 150, "eval_PERSON_precision": 0.8571428571428571, "eval_PERSON_recall": 0.92, "eval_QUANTITY_f1": 0.7500000000000001, "eval_QUANTITY_number": 33, "eval_QUANTITY_precision": 0.6923076923076923, "eval_QUANTITY_recall": 0.8181818181818182, "eval_TIME_f1": 0.8474576271186439, "eval_TIME_number": 28, "eval_TIME_precision": 0.8064516129032258, "eval_TIME_recall": 0.8928571428571429, "eval_loss": 0.18336325883865356, "eval_overall_accuracy": 0.9556256062075654, "eval_overall_f1": 0.8273092369477911, "eval_overall_precision": 0.7725, "eval_overall_recall": 0.8904899135446686, "eval_runtime": 0.3874, "eval_samples_per_second": 482.693, "eval_steps_per_second": 7.744, "step": 5512 }, { "epoch": 53.0, "grad_norm": 0.8235753178596497, "learning_rate": 2.35e-05, "loss": 0.0441, "step": 5618 }, { "epoch": 53.0, "eval_LOCATION_f1": 0.8, "eval_LOCATION_number": 71, "eval_LOCATION_precision": 0.7380952380952381, "eval_LOCATION_recall": 0.8732394366197183, "eval_ORGANIZATION_f1": 0.7307692307692307, "eval_ORGANIZATION_number": 65, "eval_ORGANIZATION_precision": 0.6263736263736264, "eval_ORGANIZATION_recall": 0.8769230769230769, "eval_PERSON_f1": 0.8910256410256411, "eval_PERSON_number": 150, "eval_PERSON_precision": 0.8580246913580247, "eval_PERSON_recall": 0.9266666666666666, "eval_QUANTITY_f1": 0.7500000000000001, "eval_QUANTITY_number": 33, "eval_QUANTITY_precision": 0.6923076923076923, "eval_QUANTITY_recall": 0.8181818181818182, "eval_TIME_f1": 0.8813559322033899, "eval_TIME_number": 28, "eval_TIME_precision": 0.8387096774193549, "eval_TIME_recall": 0.9285714285714286, "eval_loss": 0.1896522045135498, "eval_overall_accuracy": 0.9546556741028128, "eval_overall_f1": 0.8249336870026525, "eval_overall_precision": 0.7641277641277642, "eval_overall_recall": 0.8962536023054755, "eval_runtime": 0.3854, "eval_samples_per_second": 485.247, "eval_steps_per_second": 7.785, "step": 5618 }, { "epoch": 54.0, "grad_norm": 0.6915778517723083, "learning_rate": 2.3000000000000003e-05, "loss": 0.042, "step": 5724 }, { "epoch": 54.0, "eval_LOCATION_f1": 0.782051282051282, "eval_LOCATION_number": 71, "eval_LOCATION_precision": 0.7176470588235294, "eval_LOCATION_recall": 0.8591549295774648, "eval_ORGANIZATION_f1": 0.7402597402597403, "eval_ORGANIZATION_number": 65, "eval_ORGANIZATION_precision": 0.6404494382022472, "eval_ORGANIZATION_recall": 0.8769230769230769, "eval_PERSON_f1": 0.8938906752411575, "eval_PERSON_number": 150, "eval_PERSON_precision": 0.8633540372670807, "eval_PERSON_recall": 0.9266666666666666, "eval_QUANTITY_f1": 0.7397260273972603, "eval_QUANTITY_number": 33, "eval_QUANTITY_precision": 0.675, "eval_QUANTITY_recall": 0.8181818181818182, "eval_TIME_f1": 0.8333333333333334, "eval_TIME_number": 28, "eval_TIME_precision": 0.78125, "eval_TIME_recall": 0.8928571428571429, "eval_loss": 0.18752093613147736, "eval_overall_accuracy": 0.9539282250242483, "eval_overall_f1": 0.8196286472148541, "eval_overall_precision": 0.7592137592137592, "eval_overall_recall": 0.8904899135446686, "eval_runtime": 0.3868, "eval_samples_per_second": 483.48, "eval_steps_per_second": 7.756, "step": 5724 }, { "epoch": 55.0, "grad_norm": 0.8931111097335815, "learning_rate": 2.25e-05, "loss": 0.0414, "step": 5830 }, { "epoch": 55.0, "eval_LOCATION_f1": 0.7974683544303797, "eval_LOCATION_number": 71, "eval_LOCATION_precision": 0.7241379310344828, "eval_LOCATION_recall": 0.8873239436619719, "eval_ORGANIZATION_f1": 0.6923076923076923, "eval_ORGANIZATION_number": 65, "eval_ORGANIZATION_precision": 0.5934065934065934, "eval_ORGANIZATION_recall": 0.8307692307692308, "eval_PERSON_f1": 0.8846153846153846, "eval_PERSON_number": 150, "eval_PERSON_precision": 0.8518518518518519, "eval_PERSON_recall": 0.92, "eval_QUANTITY_f1": 0.6842105263157895, "eval_QUANTITY_number": 33, "eval_QUANTITY_precision": 0.6046511627906976, "eval_QUANTITY_recall": 0.7878787878787878, "eval_TIME_f1": 0.8333333333333334, "eval_TIME_number": 28, "eval_TIME_precision": 0.78125, "eval_TIME_recall": 0.8928571428571429, "eval_loss": 0.18678565323352814, "eval_overall_accuracy": 0.9544131910766246, "eval_overall_f1": 0.8031496062992126, "eval_overall_precision": 0.7373493975903614, "eval_overall_recall": 0.8818443804034583, "eval_runtime": 0.3898, "eval_samples_per_second": 479.751, "eval_steps_per_second": 7.697, "step": 5830 }, { "epoch": 56.0, "grad_norm": 0.4860210418701172, "learning_rate": 2.2000000000000003e-05, "loss": 0.0408, "step": 5936 }, { "epoch": 56.0, "eval_LOCATION_f1": 0.8104575163398693, "eval_LOCATION_number": 71, "eval_LOCATION_precision": 0.7560975609756098, "eval_LOCATION_recall": 0.8732394366197183, "eval_ORGANIZATION_f1": 0.7152317880794703, "eval_ORGANIZATION_number": 65, "eval_ORGANIZATION_precision": 0.627906976744186, "eval_ORGANIZATION_recall": 0.8307692307692308, "eval_PERSON_f1": 0.8838709677419355, "eval_PERSON_number": 150, "eval_PERSON_precision": 0.85625, "eval_PERSON_recall": 0.9133333333333333, "eval_QUANTITY_f1": 0.732394366197183, "eval_QUANTITY_number": 33, "eval_QUANTITY_precision": 0.6842105263157895, "eval_QUANTITY_recall": 0.7878787878787878, "eval_TIME_f1": 0.8333333333333334, "eval_TIME_number": 28, "eval_TIME_precision": 0.78125, "eval_TIME_recall": 0.8928571428571429, "eval_loss": 0.17208231985569, "eval_overall_accuracy": 0.9556256062075654, "eval_overall_f1": 0.8161073825503355, "eval_overall_precision": 0.7638190954773869, "eval_overall_recall": 0.8760806916426513, "eval_runtime": 0.388, "eval_samples_per_second": 481.966, "eval_steps_per_second": 7.732, "step": 5936 }, { "epoch": 57.0, "grad_norm": 0.5651527047157288, "learning_rate": 2.15e-05, "loss": 0.0388, "step": 6042 }, { "epoch": 57.0, "eval_LOCATION_f1": 0.8051948051948051, "eval_LOCATION_number": 71, "eval_LOCATION_precision": 0.7469879518072289, "eval_LOCATION_recall": 0.8732394366197183, "eval_ORGANIZATION_f1": 0.7222222222222222, "eval_ORGANIZATION_number": 65, "eval_ORGANIZATION_precision": 0.6582278481012658, "eval_ORGANIZATION_recall": 0.8, "eval_PERSON_f1": 0.8938906752411575, "eval_PERSON_number": 150, "eval_PERSON_precision": 0.8633540372670807, "eval_PERSON_recall": 0.9266666666666666, "eval_QUANTITY_f1": 0.7123287671232875, "eval_QUANTITY_number": 33, "eval_QUANTITY_precision": 0.65, "eval_QUANTITY_recall": 0.7878787878787878, "eval_TIME_f1": 0.8135593220338982, "eval_TIME_number": 28, "eval_TIME_precision": 0.7741935483870968, "eval_TIME_recall": 0.8571428571428571, "eval_loss": 0.18390165269374847, "eval_overall_accuracy": 0.9565955383123181, "eval_overall_f1": 0.8178137651821863, "eval_overall_precision": 0.7690355329949239, "eval_overall_recall": 0.8731988472622478, "eval_runtime": 0.3854, "eval_samples_per_second": 485.204, "eval_steps_per_second": 7.784, "step": 6042 }, { "epoch": 58.0, "grad_norm": 0.2999099791049957, "learning_rate": 2.1e-05, "loss": 0.039, "step": 6148 }, { "epoch": 58.0, "eval_LOCATION_f1": 0.7894736842105262, "eval_LOCATION_number": 71, "eval_LOCATION_precision": 0.7407407407407407, "eval_LOCATION_recall": 0.8450704225352113, "eval_ORGANIZATION_f1": 0.7006369426751592, "eval_ORGANIZATION_number": 65, "eval_ORGANIZATION_precision": 0.5978260869565217, "eval_ORGANIZATION_recall": 0.8461538461538461, "eval_PERSON_f1": 0.887459807073955, "eval_PERSON_number": 150, "eval_PERSON_precision": 0.8571428571428571, "eval_PERSON_recall": 0.92, "eval_QUANTITY_f1": 0.7123287671232875, "eval_QUANTITY_number": 33, "eval_QUANTITY_precision": 0.65, "eval_QUANTITY_recall": 0.7878787878787878, "eval_TIME_f1": 0.8620689655172413, "eval_TIME_number": 28, "eval_TIME_precision": 0.8333333333333334, "eval_TIME_recall": 0.8928571428571429, "eval_loss": 0.17726965248584747, "eval_overall_accuracy": 0.9527158098933075, "eval_overall_f1": 0.8095872170439414, "eval_overall_precision": 0.7524752475247525, "eval_overall_recall": 0.8760806916426513, "eval_runtime": 0.3868, "eval_samples_per_second": 483.452, "eval_steps_per_second": 7.756, "step": 6148 }, { "epoch": 59.0, "grad_norm": 0.43868881464004517, "learning_rate": 2.05e-05, "loss": 0.0414, "step": 6254 }, { "epoch": 59.0, "eval_LOCATION_f1": 0.8026315789473684, "eval_LOCATION_number": 71, "eval_LOCATION_precision": 0.7530864197530864, "eval_LOCATION_recall": 0.8591549295774648, "eval_ORGANIZATION_f1": 0.7297297297297298, "eval_ORGANIZATION_number": 65, "eval_ORGANIZATION_precision": 0.6506024096385542, "eval_ORGANIZATION_recall": 0.8307692307692308, "eval_PERSON_f1": 0.8774193548387097, "eval_PERSON_number": 150, "eval_PERSON_precision": 0.85, "eval_PERSON_recall": 0.9066666666666666, "eval_QUANTITY_f1": 0.7428571428571429, "eval_QUANTITY_number": 33, "eval_QUANTITY_precision": 0.7027027027027027, "eval_QUANTITY_recall": 0.7878787878787878, "eval_TIME_f1": 0.8620689655172413, "eval_TIME_number": 28, "eval_TIME_precision": 0.8333333333333334, "eval_TIME_recall": 0.8928571428571429, "eval_loss": 0.16531790792942047, "eval_overall_accuracy": 0.957807953443259, "eval_overall_f1": 0.8184281842818427, "eval_overall_precision": 0.7723785166240409, "eval_overall_recall": 0.8703170028818443, "eval_runtime": 0.3862, "eval_samples_per_second": 484.265, "eval_steps_per_second": 7.769, "step": 6254 }, { "epoch": 60.0, "grad_norm": 0.5318551659584045, "learning_rate": 2e-05, "loss": 0.0379, "step": 6360 }, { "epoch": 60.0, "eval_LOCATION_f1": 0.7808219178082192, "eval_LOCATION_number": 71, "eval_LOCATION_precision": 0.76, "eval_LOCATION_recall": 0.8028169014084507, "eval_ORGANIZATION_f1": 0.7172413793103448, "eval_ORGANIZATION_number": 65, "eval_ORGANIZATION_precision": 0.65, "eval_ORGANIZATION_recall": 0.8, "eval_PERSON_f1": 0.8810289389067525, "eval_PERSON_number": 150, "eval_PERSON_precision": 0.8509316770186336, "eval_PERSON_recall": 0.9133333333333333, "eval_QUANTITY_f1": 0.7605633802816901, "eval_QUANTITY_number": 33, "eval_QUANTITY_precision": 0.7105263157894737, "eval_QUANTITY_recall": 0.8181818181818182, "eval_TIME_f1": 0.8474576271186439, "eval_TIME_number": 28, "eval_TIME_precision": 0.8064516129032258, "eval_TIME_recall": 0.8928571428571429, "eval_loss": 0.1694074124097824, "eval_overall_accuracy": 0.9561105722599418, "eval_overall_f1": 0.8142076502732241, "eval_overall_precision": 0.7740259740259741, "eval_overall_recall": 0.8587896253602305, "eval_runtime": 0.387, "eval_samples_per_second": 483.234, "eval_steps_per_second": 7.752, "step": 6360 }, { "epoch": 61.0, "grad_norm": 1.2059674263000488, "learning_rate": 1.9500000000000003e-05, "loss": 0.0391, "step": 6466 }, { "epoch": 61.0, "eval_LOCATION_f1": 0.8, "eval_LOCATION_number": 71, "eval_LOCATION_precision": 0.7380952380952381, "eval_LOCATION_recall": 0.8732394366197183, "eval_ORGANIZATION_f1": 0.7058823529411765, "eval_ORGANIZATION_number": 65, "eval_ORGANIZATION_precision": 0.6136363636363636, "eval_ORGANIZATION_recall": 0.8307692307692308, "eval_PERSON_f1": 0.8910256410256411, "eval_PERSON_number": 150, "eval_PERSON_precision": 0.8580246913580247, "eval_PERSON_recall": 0.9266666666666666, "eval_QUANTITY_f1": 0.7123287671232875, "eval_QUANTITY_number": 33, "eval_QUANTITY_precision": 0.65, "eval_QUANTITY_recall": 0.7878787878787878, "eval_TIME_f1": 0.8474576271186439, "eval_TIME_number": 28, "eval_TIME_precision": 0.8064516129032258, "eval_TIME_recall": 0.8928571428571429, "eval_loss": 0.1873074322938919, "eval_overall_accuracy": 0.9551406401551892, "eval_overall_f1": 0.8138297872340426, "eval_overall_precision": 0.7555555555555555, "eval_overall_recall": 0.8818443804034583, "eval_runtime": 0.3877, "eval_samples_per_second": 482.378, "eval_steps_per_second": 7.739, "step": 6466 }, { "epoch": 62.0, "grad_norm": 0.812824010848999, "learning_rate": 1.9e-05, "loss": 0.0372, "step": 6572 }, { "epoch": 62.0, "eval_LOCATION_f1": 0.7948717948717949, "eval_LOCATION_number": 71, "eval_LOCATION_precision": 0.7294117647058823, "eval_LOCATION_recall": 0.8732394366197183, "eval_ORGANIZATION_f1": 0.7248322147651007, "eval_ORGANIZATION_number": 65, "eval_ORGANIZATION_precision": 0.6428571428571429, "eval_ORGANIZATION_recall": 0.8307692307692308, "eval_PERSON_f1": 0.8774193548387097, "eval_PERSON_number": 150, "eval_PERSON_precision": 0.85, "eval_PERSON_recall": 0.9066666666666666, "eval_QUANTITY_f1": 0.7500000000000001, "eval_QUANTITY_number": 33, "eval_QUANTITY_precision": 0.6923076923076923, "eval_QUANTITY_recall": 0.8181818181818182, "eval_TIME_f1": 0.8813559322033899, "eval_TIME_number": 28, "eval_TIME_precision": 0.8387096774193549, "eval_TIME_recall": 0.9285714285714286, "eval_loss": 0.17852064967155457, "eval_overall_accuracy": 0.9558680892337537, "eval_overall_f1": 0.8176943699731903, "eval_overall_precision": 0.7644110275689223, "eval_overall_recall": 0.8789625360230547, "eval_runtime": 0.3884, "eval_samples_per_second": 481.406, "eval_steps_per_second": 7.723, "step": 6572 }, { "epoch": 63.0, "grad_norm": 0.8590715527534485, "learning_rate": 1.85e-05, "loss": 0.0371, "step": 6678 }, { "epoch": 63.0, "eval_LOCATION_f1": 0.7922077922077921, "eval_LOCATION_number": 71, "eval_LOCATION_precision": 0.7349397590361446, "eval_LOCATION_recall": 0.8591549295774648, "eval_ORGANIZATION_f1": 0.738255033557047, "eval_ORGANIZATION_number": 65, "eval_ORGANIZATION_precision": 0.6547619047619048, "eval_ORGANIZATION_recall": 0.8461538461538461, "eval_PERSON_f1": 0.8838709677419355, "eval_PERSON_number": 150, "eval_PERSON_precision": 0.85625, "eval_PERSON_recall": 0.9133333333333333, "eval_QUANTITY_f1": 0.7605633802816901, "eval_QUANTITY_number": 33, "eval_QUANTITY_precision": 0.7105263157894737, "eval_QUANTITY_recall": 0.8181818181818182, "eval_TIME_f1": 0.8771929824561403, "eval_TIME_number": 28, "eval_TIME_precision": 0.8620689655172413, "eval_TIME_recall": 0.8928571428571429, "eval_loss": 0.17511434853076935, "eval_overall_accuracy": 0.9568380213385063, "eval_overall_f1": 0.8232118758434548, "eval_overall_precision": 0.7741116751269036, "eval_overall_recall": 0.8789625360230547, "eval_runtime": 0.3869, "eval_samples_per_second": 483.268, "eval_steps_per_second": 7.753, "step": 6678 }, { "epoch": 64.0, "grad_norm": 0.4557998478412628, "learning_rate": 1.8e-05, "loss": 0.0348, "step": 6784 }, { "epoch": 64.0, "eval_LOCATION_f1": 0.8, "eval_LOCATION_number": 71, "eval_LOCATION_precision": 0.7380952380952381, "eval_LOCATION_recall": 0.8732394366197183, "eval_ORGANIZATION_f1": 0.7248322147651007, "eval_ORGANIZATION_number": 65, "eval_ORGANIZATION_precision": 0.6428571428571429, "eval_ORGANIZATION_recall": 0.8307692307692308, "eval_PERSON_f1": 0.8938906752411575, "eval_PERSON_number": 150, "eval_PERSON_precision": 0.8633540372670807, "eval_PERSON_recall": 0.9266666666666666, "eval_QUANTITY_f1": 0.7714285714285715, "eval_QUANTITY_number": 33, "eval_QUANTITY_precision": 0.7297297297297297, "eval_QUANTITY_recall": 0.8181818181818182, "eval_TIME_f1": 0.8474576271186439, "eval_TIME_number": 28, "eval_TIME_precision": 0.8064516129032258, "eval_TIME_recall": 0.8928571428571429, "eval_loss": 0.1811322569847107, "eval_overall_accuracy": 0.9561105722599418, "eval_overall_f1": 0.825268817204301, "eval_overall_precision": 0.7732997481108312, "eval_overall_recall": 0.8847262247838616, "eval_runtime": 0.3896, "eval_samples_per_second": 479.954, "eval_steps_per_second": 7.7, "step": 6784 }, { "epoch": 65.0, "grad_norm": 0.6341075897216797, "learning_rate": 1.75e-05, "loss": 0.0338, "step": 6890 }, { "epoch": 65.0, "eval_LOCATION_f1": 0.7922077922077921, "eval_LOCATION_number": 71, "eval_LOCATION_precision": 0.7349397590361446, "eval_LOCATION_recall": 0.8591549295774648, "eval_ORGANIZATION_f1": 0.7417218543046358, "eval_ORGANIZATION_number": 65, "eval_ORGANIZATION_precision": 0.6511627906976745, "eval_ORGANIZATION_recall": 0.8615384615384616, "eval_PERSON_f1": 0.887459807073955, "eval_PERSON_number": 150, "eval_PERSON_precision": 0.8571428571428571, "eval_PERSON_recall": 0.92, "eval_QUANTITY_f1": 0.7428571428571429, "eval_QUANTITY_number": 33, "eval_QUANTITY_precision": 0.7027027027027027, "eval_QUANTITY_recall": 0.7878787878787878, "eval_TIME_f1": 0.8333333333333334, "eval_TIME_number": 28, "eval_TIME_precision": 0.78125, "eval_TIME_recall": 0.8928571428571429, "eval_loss": 0.1845623105764389, "eval_overall_accuracy": 0.9561105722599418, "eval_overall_f1": 0.8203753351206434, "eval_overall_precision": 0.7669172932330827, "eval_overall_recall": 0.8818443804034583, "eval_runtime": 0.389, "eval_samples_per_second": 480.742, "eval_steps_per_second": 7.712, "step": 6890 }, { "epoch": 66.0, "grad_norm": 0.8572676777839661, "learning_rate": 1.7000000000000003e-05, "loss": 0.033, "step": 6996 }, { "epoch": 66.0, "eval_LOCATION_f1": 0.7848101265822784, "eval_LOCATION_number": 71, "eval_LOCATION_precision": 0.7126436781609196, "eval_LOCATION_recall": 0.8732394366197183, "eval_ORGANIZATION_f1": 0.728476821192053, "eval_ORGANIZATION_number": 65, "eval_ORGANIZATION_precision": 0.6395348837209303, "eval_ORGANIZATION_recall": 0.8461538461538461, "eval_PERSON_f1": 0.8910256410256411, "eval_PERSON_number": 150, "eval_PERSON_precision": 0.8580246913580247, "eval_PERSON_recall": 0.9266666666666666, "eval_QUANTITY_f1": 0.7500000000000001, "eval_QUANTITY_number": 33, "eval_QUANTITY_precision": 0.6923076923076923, "eval_QUANTITY_recall": 0.8181818181818182, "eval_TIME_f1": 0.8666666666666666, "eval_TIME_number": 28, "eval_TIME_precision": 0.8125, "eval_TIME_recall": 0.9285714285714286, "eval_loss": 0.1916947364807129, "eval_overall_accuracy": 0.9553831231813773, "eval_overall_f1": 0.8207171314741034, "eval_overall_precision": 0.7610837438423645, "eval_overall_recall": 0.8904899135446686, "eval_runtime": 0.3919, "eval_samples_per_second": 477.125, "eval_steps_per_second": 7.654, "step": 6996 }, { "epoch": 67.0, "grad_norm": 0.2351032942533493, "learning_rate": 1.65e-05, "loss": 0.0347, "step": 7102 }, { "epoch": 67.0, "eval_LOCATION_f1": 0.8079470198675496, "eval_LOCATION_number": 71, "eval_LOCATION_precision": 0.7625, "eval_LOCATION_recall": 0.8591549295774648, "eval_ORGANIZATION_f1": 0.7019867549668873, "eval_ORGANIZATION_number": 65, "eval_ORGANIZATION_precision": 0.6162790697674418, "eval_ORGANIZATION_recall": 0.8153846153846154, "eval_PERSON_f1": 0.8838709677419355, "eval_PERSON_number": 150, "eval_PERSON_precision": 0.85625, "eval_PERSON_recall": 0.9133333333333333, "eval_QUANTITY_f1": 0.7605633802816901, "eval_QUANTITY_number": 33, "eval_QUANTITY_precision": 0.7105263157894737, "eval_QUANTITY_recall": 0.8181818181818182, "eval_TIME_f1": 0.8771929824561403, "eval_TIME_number": 28, "eval_TIME_precision": 0.8620689655172413, "eval_TIME_recall": 0.8928571428571429, "eval_loss": 0.18072670698165894, "eval_overall_accuracy": 0.9570805043646945, "eval_overall_f1": 0.8189189189189189, "eval_overall_precision": 0.7709923664122137, "eval_overall_recall": 0.8731988472622478, "eval_runtime": 0.387, "eval_samples_per_second": 483.214, "eval_steps_per_second": 7.752, "step": 7102 }, { "epoch": 68.0, "grad_norm": 0.4664683938026428, "learning_rate": 1.6000000000000003e-05, "loss": 0.034, "step": 7208 }, { "epoch": 68.0, "eval_LOCATION_f1": 0.782051282051282, "eval_LOCATION_number": 71, "eval_LOCATION_precision": 0.7176470588235294, "eval_LOCATION_recall": 0.8591549295774648, "eval_ORGANIZATION_f1": 0.738255033557047, "eval_ORGANIZATION_number": 65, "eval_ORGANIZATION_precision": 0.6547619047619048, "eval_ORGANIZATION_recall": 0.8461538461538461, "eval_PERSON_f1": 0.8896103896103896, "eval_PERSON_number": 150, "eval_PERSON_precision": 0.8670886075949367, "eval_PERSON_recall": 0.9133333333333333, "eval_QUANTITY_f1": 0.7200000000000001, "eval_QUANTITY_number": 33, "eval_QUANTITY_precision": 0.6428571428571429, "eval_QUANTITY_recall": 0.8181818181818182, "eval_TIME_f1": 0.8474576271186439, "eval_TIME_number": 28, "eval_TIME_precision": 0.8064516129032258, "eval_TIME_recall": 0.8928571428571429, "eval_loss": 0.1870609074831009, "eval_overall_accuracy": 0.9558680892337537, "eval_overall_f1": 0.8165997322623828, "eval_overall_precision": 0.7625, "eval_overall_recall": 0.8789625360230547, "eval_runtime": 0.3901, "eval_samples_per_second": 479.405, "eval_steps_per_second": 7.691, "step": 7208 }, { "epoch": 69.0, "grad_norm": 0.3841381072998047, "learning_rate": 1.55e-05, "loss": 0.0319, "step": 7314 }, { "epoch": 69.0, "eval_LOCATION_f1": 0.775, "eval_LOCATION_number": 71, "eval_LOCATION_precision": 0.6966292134831461, "eval_LOCATION_recall": 0.8732394366197183, "eval_ORGANIZATION_f1": 0.726027397260274, "eval_ORGANIZATION_number": 65, "eval_ORGANIZATION_precision": 0.654320987654321, "eval_ORGANIZATION_recall": 0.8153846153846154, "eval_PERSON_f1": 0.8910256410256411, "eval_PERSON_number": 150, "eval_PERSON_precision": 0.8580246913580247, "eval_PERSON_recall": 0.9266666666666666, "eval_QUANTITY_f1": 0.7605633802816901, "eval_QUANTITY_number": 33, "eval_QUANTITY_precision": 0.7105263157894737, "eval_QUANTITY_recall": 0.8181818181818182, "eval_TIME_f1": 0.8474576271186439, "eval_TIME_number": 28, "eval_TIME_precision": 0.8064516129032258, "eval_TIME_recall": 0.8928571428571429, "eval_loss": 0.18617138266563416, "eval_overall_accuracy": 0.954898157129001, "eval_overall_f1": 0.8181818181818181, "eval_overall_precision": 0.7630922693266833, "eval_overall_recall": 0.8818443804034583, "eval_runtime": 0.3873, "eval_samples_per_second": 482.77, "eval_steps_per_second": 7.745, "step": 7314 }, { "epoch": 70.0, "grad_norm": 0.48607921600341797, "learning_rate": 1.5e-05, "loss": 0.0338, "step": 7420 }, { "epoch": 70.0, "eval_LOCATION_f1": 0.7948717948717949, "eval_LOCATION_number": 71, "eval_LOCATION_precision": 0.7294117647058823, "eval_LOCATION_recall": 0.8732394366197183, "eval_ORGANIZATION_f1": 0.7199999999999999, "eval_ORGANIZATION_number": 65, "eval_ORGANIZATION_precision": 0.6352941176470588, "eval_ORGANIZATION_recall": 0.8307692307692308, "eval_PERSON_f1": 0.896774193548387, "eval_PERSON_number": 150, "eval_PERSON_precision": 0.86875, "eval_PERSON_recall": 0.9266666666666666, "eval_QUANTITY_f1": 0.7397260273972603, "eval_QUANTITY_number": 33, "eval_QUANTITY_precision": 0.675, "eval_QUANTITY_recall": 0.8181818181818182, "eval_TIME_f1": 0.896551724137931, "eval_TIME_number": 28, "eval_TIME_precision": 0.8666666666666667, "eval_TIME_recall": 0.9285714285714286, "eval_loss": 0.1894809454679489, "eval_overall_accuracy": 0.9570805043646945, "eval_overall_f1": 0.824631860776439, "eval_overall_precision": 0.77, "eval_overall_recall": 0.8876080691642652, "eval_runtime": 0.3876, "eval_samples_per_second": 482.49, "eval_steps_per_second": 7.74, "step": 7420 }, { "epoch": 71.0, "grad_norm": 0.6728916168212891, "learning_rate": 1.45e-05, "loss": 0.0306, "step": 7526 }, { "epoch": 71.0, "eval_LOCATION_f1": 0.7948717948717949, "eval_LOCATION_number": 71, "eval_LOCATION_precision": 0.7294117647058823, "eval_LOCATION_recall": 0.8732394366197183, "eval_ORGANIZATION_f1": 0.728476821192053, "eval_ORGANIZATION_number": 65, "eval_ORGANIZATION_precision": 0.6395348837209303, "eval_ORGANIZATION_recall": 0.8461538461538461, "eval_PERSON_f1": 0.896774193548387, "eval_PERSON_number": 150, "eval_PERSON_precision": 0.86875, "eval_PERSON_recall": 0.9266666666666666, "eval_QUANTITY_f1": 0.7397260273972603, "eval_QUANTITY_number": 33, "eval_QUANTITY_precision": 0.675, "eval_QUANTITY_recall": 0.8181818181818182, "eval_TIME_f1": 0.819672131147541, "eval_TIME_number": 28, "eval_TIME_precision": 0.7575757575757576, "eval_TIME_recall": 0.8928571428571429, "eval_loss": 0.20611025393009186, "eval_overall_accuracy": 0.9558680892337537, "eval_overall_f1": 0.8202396804260986, "eval_overall_precision": 0.7623762376237624, "eval_overall_recall": 0.8876080691642652, "eval_runtime": 0.3871, "eval_samples_per_second": 483.102, "eval_steps_per_second": 7.75, "step": 7526 }, { "epoch": 72.0, "grad_norm": 0.954484760761261, "learning_rate": 1.4000000000000001e-05, "loss": 0.0343, "step": 7632 }, { "epoch": 72.0, "eval_LOCATION_f1": 0.7721518987341772, "eval_LOCATION_number": 71, "eval_LOCATION_precision": 0.7011494252873564, "eval_LOCATION_recall": 0.8591549295774648, "eval_ORGANIZATION_f1": 0.7417218543046358, "eval_ORGANIZATION_number": 65, "eval_ORGANIZATION_precision": 0.6511627906976745, "eval_ORGANIZATION_recall": 0.8615384615384616, "eval_PERSON_f1": 0.8938906752411575, "eval_PERSON_number": 150, "eval_PERSON_precision": 0.8633540372670807, "eval_PERSON_recall": 0.9266666666666666, "eval_QUANTITY_f1": 0.7397260273972603, "eval_QUANTITY_number": 33, "eval_QUANTITY_precision": 0.675, "eval_QUANTITY_recall": 0.8181818181818182, "eval_TIME_f1": 0.8620689655172413, "eval_TIME_number": 28, "eval_TIME_precision": 0.8333333333333334, "eval_TIME_recall": 0.8928571428571429, "eval_loss": 0.19823096692562103, "eval_overall_accuracy": 0.9541707080504365, "eval_overall_f1": 0.8202396804260986, "eval_overall_precision": 0.7623762376237624, "eval_overall_recall": 0.8876080691642652, "eval_runtime": 0.388, "eval_samples_per_second": 482.019, "eval_steps_per_second": 7.733, "step": 7632 }, { "epoch": 73.0, "grad_norm": 0.27965471148490906, "learning_rate": 1.3500000000000001e-05, "loss": 0.0308, "step": 7738 }, { "epoch": 73.0, "eval_LOCATION_f1": 0.782051282051282, "eval_LOCATION_number": 71, "eval_LOCATION_precision": 0.7176470588235294, "eval_LOCATION_recall": 0.8591549295774648, "eval_ORGANIZATION_f1": 0.7586206896551724, "eval_ORGANIZATION_number": 65, "eval_ORGANIZATION_precision": 0.6875, "eval_ORGANIZATION_recall": 0.8461538461538461, "eval_PERSON_f1": 0.896774193548387, "eval_PERSON_number": 150, "eval_PERSON_precision": 0.86875, "eval_PERSON_recall": 0.9266666666666666, "eval_QUANTITY_f1": 0.732394366197183, "eval_QUANTITY_number": 33, "eval_QUANTITY_precision": 0.6842105263157895, "eval_QUANTITY_recall": 0.7878787878787878, "eval_TIME_f1": 0.8333333333333334, "eval_TIME_number": 28, "eval_TIME_precision": 0.78125, "eval_TIME_recall": 0.8928571428571429, "eval_loss": 0.19675639271736145, "eval_overall_accuracy": 0.9573229873908826, "eval_overall_f1": 0.8247978436657682, "eval_overall_precision": 0.7746835443037975, "eval_overall_recall": 0.8818443804034583, "eval_runtime": 0.3857, "eval_samples_per_second": 484.852, "eval_steps_per_second": 7.778, "step": 7738 }, { "epoch": 74.0, "grad_norm": 1.283292531967163, "learning_rate": 1.3000000000000001e-05, "loss": 0.0328, "step": 7844 }, { "epoch": 74.0, "eval_LOCATION_f1": 0.7770700636942676, "eval_LOCATION_number": 71, "eval_LOCATION_precision": 0.7093023255813954, "eval_LOCATION_recall": 0.8591549295774648, "eval_ORGANIZATION_f1": 0.726027397260274, "eval_ORGANIZATION_number": 65, "eval_ORGANIZATION_precision": 0.654320987654321, "eval_ORGANIZATION_recall": 0.8153846153846154, "eval_PERSON_f1": 0.8938906752411575, "eval_PERSON_number": 150, "eval_PERSON_precision": 0.8633540372670807, "eval_PERSON_recall": 0.9266666666666666, "eval_QUANTITY_f1": 0.7428571428571429, "eval_QUANTITY_number": 33, "eval_QUANTITY_precision": 0.7027027027027027, "eval_QUANTITY_recall": 0.7878787878787878, "eval_TIME_f1": 0.8333333333333334, "eval_TIME_number": 28, "eval_TIME_precision": 0.78125, "eval_TIME_recall": 0.8928571428571429, "eval_loss": 0.19934506714344025, "eval_overall_accuracy": 0.95635305528613, "eval_overall_f1": 0.8172043010752689, "eval_overall_precision": 0.7657430730478589, "eval_overall_recall": 0.8760806916426513, "eval_runtime": 0.3861, "eval_samples_per_second": 484.375, "eval_steps_per_second": 7.771, "step": 7844 }, { "epoch": 75.0, "grad_norm": 1.0608142614364624, "learning_rate": 1.25e-05, "loss": 0.0328, "step": 7950 }, { "epoch": 75.0, "eval_LOCATION_f1": 0.7741935483870968, "eval_LOCATION_number": 71, "eval_LOCATION_precision": 0.7142857142857143, "eval_LOCATION_recall": 0.8450704225352113, "eval_ORGANIZATION_f1": 0.7333333333333334, "eval_ORGANIZATION_number": 65, "eval_ORGANIZATION_precision": 0.6470588235294118, "eval_ORGANIZATION_recall": 0.8461538461538461, "eval_PERSON_f1": 0.8867313915857605, "eval_PERSON_number": 150, "eval_PERSON_precision": 0.8616352201257862, "eval_PERSON_recall": 0.9133333333333333, "eval_QUANTITY_f1": 0.7428571428571429, "eval_QUANTITY_number": 33, "eval_QUANTITY_precision": 0.7027027027027027, "eval_QUANTITY_recall": 0.7878787878787878, "eval_TIME_f1": 0.8333333333333334, "eval_TIME_number": 28, "eval_TIME_precision": 0.78125, "eval_TIME_recall": 0.8928571428571429, "eval_loss": 0.19247645139694214, "eval_overall_accuracy": 0.9558680892337537, "eval_overall_f1": 0.814516129032258, "eval_overall_precision": 0.7632241813602015, "eval_overall_recall": 0.8731988472622478, "eval_runtime": 0.3881, "eval_samples_per_second": 481.827, "eval_steps_per_second": 7.73, "step": 7950 }, { "epoch": 76.0, "grad_norm": 0.5310276746749878, "learning_rate": 1.2e-05, "loss": 0.0314, "step": 8056 }, { "epoch": 76.0, "eval_LOCATION_f1": 0.7631578947368421, "eval_LOCATION_number": 71, "eval_LOCATION_precision": 0.7160493827160493, "eval_LOCATION_recall": 0.8169014084507042, "eval_ORGANIZATION_f1": 0.738255033557047, "eval_ORGANIZATION_number": 65, "eval_ORGANIZATION_precision": 0.6547619047619048, "eval_ORGANIZATION_recall": 0.8461538461538461, "eval_PERSON_f1": 0.8903225806451613, "eval_PERSON_number": 150, "eval_PERSON_precision": 0.8625, "eval_PERSON_recall": 0.92, "eval_QUANTITY_f1": 0.732394366197183, "eval_QUANTITY_number": 33, "eval_QUANTITY_precision": 0.6842105263157895, "eval_QUANTITY_recall": 0.7878787878787878, "eval_TIME_f1": 0.8474576271186439, "eval_TIME_number": 28, "eval_TIME_precision": 0.8064516129032258, "eval_TIME_recall": 0.8928571428571429, "eval_loss": 0.19101466238498688, "eval_overall_accuracy": 0.9553831231813773, "eval_overall_f1": 0.8151147098515519, "eval_overall_precision": 0.766497461928934, "eval_overall_recall": 0.8703170028818443, "eval_runtime": 0.3899, "eval_samples_per_second": 479.552, "eval_steps_per_second": 7.693, "step": 8056 }, { "epoch": 77.0, "grad_norm": 0.7759119868278503, "learning_rate": 1.1500000000000002e-05, "loss": 0.0304, "step": 8162 }, { "epoch": 77.0, "eval_LOCATION_f1": 0.7721518987341772, "eval_LOCATION_number": 71, "eval_LOCATION_precision": 0.7011494252873564, "eval_LOCATION_recall": 0.8591549295774648, "eval_ORGANIZATION_f1": 0.7027027027027027, "eval_ORGANIZATION_number": 65, "eval_ORGANIZATION_precision": 0.6265060240963856, "eval_ORGANIZATION_recall": 0.8, "eval_PERSON_f1": 0.8753993610223643, "eval_PERSON_number": 150, "eval_PERSON_precision": 0.8404907975460123, "eval_PERSON_recall": 0.9133333333333333, "eval_QUANTITY_f1": 0.7428571428571429, "eval_QUANTITY_number": 33, "eval_QUANTITY_precision": 0.7027027027027027, "eval_QUANTITY_recall": 0.7878787878787878, "eval_TIME_f1": 0.8333333333333334, "eval_TIME_number": 28, "eval_TIME_precision": 0.78125, "eval_TIME_recall": 0.8928571428571429, "eval_loss": 0.19821016490459442, "eval_overall_accuracy": 0.9544131910766246, "eval_overall_f1": 0.8037383177570094, "eval_overall_precision": 0.7487562189054726, "eval_overall_recall": 0.8674351585014409, "eval_runtime": 0.3868, "eval_samples_per_second": 483.476, "eval_steps_per_second": 7.756, "step": 8162 }, { "epoch": 78.0, "grad_norm": 0.5382179021835327, "learning_rate": 1.1000000000000001e-05, "loss": 0.0318, "step": 8268 }, { "epoch": 78.0, "eval_LOCATION_f1": 0.7721518987341772, "eval_LOCATION_number": 71, "eval_LOCATION_precision": 0.7011494252873564, "eval_LOCATION_recall": 0.8591549295774648, "eval_ORGANIZATION_f1": 0.7105263157894737, "eval_ORGANIZATION_number": 65, "eval_ORGANIZATION_precision": 0.6206896551724138, "eval_ORGANIZATION_recall": 0.8307692307692308, "eval_PERSON_f1": 0.8817891373801918, "eval_PERSON_number": 150, "eval_PERSON_precision": 0.8466257668711656, "eval_PERSON_recall": 0.92, "eval_QUANTITY_f1": 0.6578947368421053, "eval_QUANTITY_number": 33, "eval_QUANTITY_precision": 0.5813953488372093, "eval_QUANTITY_recall": 0.7575757575757576, "eval_TIME_f1": 0.8474576271186439, "eval_TIME_number": 28, "eval_TIME_precision": 0.8064516129032258, "eval_TIME_recall": 0.8928571428571429, "eval_loss": 0.2088189721107483, "eval_overall_accuracy": 0.9527158098933075, "eval_overall_f1": 0.7994722955145119, "eval_overall_precision": 0.7372262773722628, "eval_overall_recall": 0.8731988472622478, "eval_runtime": 0.3886, "eval_samples_per_second": 481.155, "eval_steps_per_second": 7.719, "step": 8268 }, { "epoch": 79.0, "grad_norm": 0.7348619103431702, "learning_rate": 1.05e-05, "loss": 0.0303, "step": 8374 }, { "epoch": 79.0, "eval_LOCATION_f1": 0.7721518987341772, "eval_LOCATION_number": 71, "eval_LOCATION_precision": 0.7011494252873564, "eval_LOCATION_recall": 0.8591549295774648, "eval_ORGANIZATION_f1": 0.726027397260274, "eval_ORGANIZATION_number": 65, "eval_ORGANIZATION_precision": 0.654320987654321, "eval_ORGANIZATION_recall": 0.8153846153846154, "eval_PERSON_f1": 0.8817891373801918, "eval_PERSON_number": 150, "eval_PERSON_precision": 0.8466257668711656, "eval_PERSON_recall": 0.92, "eval_QUANTITY_f1": 0.704225352112676, "eval_QUANTITY_number": 33, "eval_QUANTITY_precision": 0.6578947368421053, "eval_QUANTITY_recall": 0.7575757575757576, "eval_TIME_f1": 0.8333333333333334, "eval_TIME_number": 28, "eval_TIME_precision": 0.78125, "eval_TIME_recall": 0.8928571428571429, "eval_loss": 0.20289956033229828, "eval_overall_accuracy": 0.9539282250242483, "eval_overall_f1": 0.8074866310160428, "eval_overall_precision": 0.7531172069825436, "eval_overall_recall": 0.8703170028818443, "eval_runtime": 0.3879, "eval_samples_per_second": 482.085, "eval_steps_per_second": 7.734, "step": 8374 }, { "epoch": 80.0, "grad_norm": 0.42746540904045105, "learning_rate": 1e-05, "loss": 0.0289, "step": 8480 }, { "epoch": 80.0, "eval_LOCATION_f1": 0.7682119205298014, "eval_LOCATION_number": 71, "eval_LOCATION_precision": 0.725, "eval_LOCATION_recall": 0.8169014084507042, "eval_ORGANIZATION_f1": 0.7210884353741497, "eval_ORGANIZATION_number": 65, "eval_ORGANIZATION_precision": 0.6463414634146342, "eval_ORGANIZATION_recall": 0.8153846153846154, "eval_PERSON_f1": 0.8782051282051282, "eval_PERSON_number": 150, "eval_PERSON_precision": 0.845679012345679, "eval_PERSON_recall": 0.9133333333333333, "eval_QUANTITY_f1": 0.6944444444444444, "eval_QUANTITY_number": 33, "eval_QUANTITY_precision": 0.6410256410256411, "eval_QUANTITY_recall": 0.7575757575757576, "eval_TIME_f1": 0.8333333333333334, "eval_TIME_number": 28, "eval_TIME_precision": 0.78125, "eval_TIME_recall": 0.8928571428571429, "eval_loss": 0.2005331665277481, "eval_overall_accuracy": 0.9539282250242483, "eval_overall_f1": 0.8032345013477089, "eval_overall_precision": 0.7544303797468355, "eval_overall_recall": 0.8587896253602305, "eval_runtime": 0.385, "eval_samples_per_second": 485.722, "eval_steps_per_second": 7.792, "step": 8480 }, { "epoch": 81.0, "grad_norm": 0.303906112909317, "learning_rate": 9.5e-06, "loss": 0.0283, "step": 8586 }, { "epoch": 81.0, "eval_LOCATION_f1": 0.7692307692307694, "eval_LOCATION_number": 71, "eval_LOCATION_precision": 0.7058823529411765, "eval_LOCATION_recall": 0.8450704225352113, "eval_ORGANIZATION_f1": 0.7448275862068966, "eval_ORGANIZATION_number": 65, "eval_ORGANIZATION_precision": 0.675, "eval_ORGANIZATION_recall": 0.8307692307692308, "eval_PERSON_f1": 0.8838709677419355, "eval_PERSON_number": 150, "eval_PERSON_precision": 0.85625, "eval_PERSON_recall": 0.9133333333333333, "eval_QUANTITY_f1": 0.704225352112676, "eval_QUANTITY_number": 33, "eval_QUANTITY_precision": 0.6578947368421053, "eval_QUANTITY_recall": 0.7575757575757576, "eval_TIME_f1": 0.8333333333333334, "eval_TIME_number": 28, "eval_TIME_precision": 0.78125, "eval_TIME_recall": 0.8928571428571429, "eval_loss": 0.20049220323562622, "eval_overall_accuracy": 0.9558680892337537, "eval_overall_f1": 0.8113207547169812, "eval_overall_precision": 0.7620253164556962, "eval_overall_recall": 0.8674351585014409, "eval_runtime": 0.3858, "eval_samples_per_second": 484.734, "eval_steps_per_second": 7.776, "step": 8586 }, { "epoch": 82.0, "grad_norm": 1.8275718688964844, "learning_rate": 9e-06, "loss": 0.0303, "step": 8692 }, { "epoch": 82.0, "eval_LOCATION_f1": 0.7922077922077921, "eval_LOCATION_number": 71, "eval_LOCATION_precision": 0.7349397590361446, "eval_LOCATION_recall": 0.8591549295774648, "eval_ORGANIZATION_f1": 0.7333333333333334, "eval_ORGANIZATION_number": 65, "eval_ORGANIZATION_precision": 0.6470588235294118, "eval_ORGANIZATION_recall": 0.8461538461538461, "eval_PERSON_f1": 0.8838709677419355, "eval_PERSON_number": 150, "eval_PERSON_precision": 0.85625, "eval_PERSON_recall": 0.9133333333333333, "eval_QUANTITY_f1": 0.7142857142857142, "eval_QUANTITY_number": 33, "eval_QUANTITY_precision": 0.6756756756756757, "eval_QUANTITY_recall": 0.7575757575757576, "eval_TIME_f1": 0.8620689655172413, "eval_TIME_number": 28, "eval_TIME_precision": 0.8333333333333334, "eval_TIME_recall": 0.8928571428571429, "eval_loss": 0.19804218411445618, "eval_overall_accuracy": 0.9570805043646945, "eval_overall_f1": 0.8167115902964959, "eval_overall_precision": 0.7670886075949367, "eval_overall_recall": 0.8731988472622478, "eval_runtime": 0.3865, "eval_samples_per_second": 483.795, "eval_steps_per_second": 7.761, "step": 8692 }, { "epoch": 83.0, "grad_norm": 3.0445024967193604, "learning_rate": 8.500000000000002e-06, "loss": 0.0281, "step": 8798 }, { "epoch": 83.0, "eval_LOCATION_f1": 0.7843137254901961, "eval_LOCATION_number": 71, "eval_LOCATION_precision": 0.7317073170731707, "eval_LOCATION_recall": 0.8450704225352113, "eval_ORGANIZATION_f1": 0.7346938775510204, "eval_ORGANIZATION_number": 65, "eval_ORGANIZATION_precision": 0.6585365853658537, "eval_ORGANIZATION_recall": 0.8307692307692308, "eval_PERSON_f1": 0.8810289389067525, "eval_PERSON_number": 150, "eval_PERSON_precision": 0.8509316770186336, "eval_PERSON_recall": 0.9133333333333333, "eval_QUANTITY_f1": 0.704225352112676, "eval_QUANTITY_number": 33, "eval_QUANTITY_precision": 0.6578947368421053, "eval_QUANTITY_recall": 0.7575757575757576, "eval_TIME_f1": 0.8333333333333334, "eval_TIME_number": 28, "eval_TIME_precision": 0.78125, "eval_TIME_recall": 0.8928571428571429, "eval_loss": 0.19731304049491882, "eval_overall_accuracy": 0.9551406401551892, "eval_overall_f1": 0.8113207547169812, "eval_overall_precision": 0.7620253164556962, "eval_overall_recall": 0.8674351585014409, "eval_runtime": 0.3858, "eval_samples_per_second": 484.669, "eval_steps_per_second": 7.775, "step": 8798 }, { "epoch": 84.0, "grad_norm": 0.6099753379821777, "learning_rate": 8.000000000000001e-06, "loss": 0.0281, "step": 8904 }, { "epoch": 84.0, "eval_LOCATION_f1": 0.7848101265822784, "eval_LOCATION_number": 71, "eval_LOCATION_precision": 0.7126436781609196, "eval_LOCATION_recall": 0.8732394366197183, "eval_ORGANIZATION_f1": 0.7432432432432433, "eval_ORGANIZATION_number": 65, "eval_ORGANIZATION_precision": 0.6626506024096386, "eval_ORGANIZATION_recall": 0.8461538461538461, "eval_PERSON_f1": 0.8846153846153846, "eval_PERSON_number": 150, "eval_PERSON_precision": 0.8518518518518519, "eval_PERSON_recall": 0.92, "eval_QUANTITY_f1": 0.7142857142857142, "eval_QUANTITY_number": 33, "eval_QUANTITY_precision": 0.6756756756756757, "eval_QUANTITY_recall": 0.7575757575757576, "eval_TIME_f1": 0.8474576271186439, "eval_TIME_number": 28, "eval_TIME_precision": 0.8064516129032258, "eval_TIME_recall": 0.8928571428571429, "eval_loss": 0.20074868202209473, "eval_overall_accuracy": 0.9570805043646945, "eval_overall_f1": 0.8165997322623828, "eval_overall_precision": 0.7625, "eval_overall_recall": 0.8789625360230547, "eval_runtime": 0.3861, "eval_samples_per_second": 484.379, "eval_steps_per_second": 7.771, "step": 8904 }, { "epoch": 85.0, "grad_norm": 0.7372535467147827, "learning_rate": 7.5e-06, "loss": 0.0291, "step": 9010 }, { "epoch": 85.0, "eval_LOCATION_f1": 0.7692307692307694, "eval_LOCATION_number": 71, "eval_LOCATION_precision": 0.7058823529411765, "eval_LOCATION_recall": 0.8450704225352113, "eval_ORGANIZATION_f1": 0.738255033557047, "eval_ORGANIZATION_number": 65, "eval_ORGANIZATION_precision": 0.6547619047619048, "eval_ORGANIZATION_recall": 0.8461538461538461, "eval_PERSON_f1": 0.8846153846153846, "eval_PERSON_number": 150, "eval_PERSON_precision": 0.8518518518518519, "eval_PERSON_recall": 0.92, "eval_QUANTITY_f1": 0.7142857142857142, "eval_QUANTITY_number": 33, "eval_QUANTITY_precision": 0.6756756756756757, "eval_QUANTITY_recall": 0.7575757575757576, "eval_TIME_f1": 0.8474576271186439, "eval_TIME_number": 28, "eval_TIME_precision": 0.8064516129032258, "eval_TIME_recall": 0.8928571428571429, "eval_loss": 0.20446744561195374, "eval_overall_accuracy": 0.9553831231813773, "eval_overall_f1": 0.8123324396782842, "eval_overall_precision": 0.7593984962406015, "eval_overall_recall": 0.8731988472622478, "eval_runtime": 0.3888, "eval_samples_per_second": 481.027, "eval_steps_per_second": 7.717, "step": 9010 }, { "epoch": 86.0, "grad_norm": 0.5419071316719055, "learning_rate": 7.000000000000001e-06, "loss": 0.0286, "step": 9116 }, { "epoch": 86.0, "eval_LOCATION_f1": 0.8051948051948051, "eval_LOCATION_number": 71, "eval_LOCATION_precision": 0.7469879518072289, "eval_LOCATION_recall": 0.8732394366197183, "eval_ORGANIZATION_f1": 0.7466666666666668, "eval_ORGANIZATION_number": 65, "eval_ORGANIZATION_precision": 0.6588235294117647, "eval_ORGANIZATION_recall": 0.8615384615384616, "eval_PERSON_f1": 0.8838709677419355, "eval_PERSON_number": 150, "eval_PERSON_precision": 0.85625, "eval_PERSON_recall": 0.9133333333333333, "eval_QUANTITY_f1": 0.7428571428571429, "eval_QUANTITY_number": 33, "eval_QUANTITY_precision": 0.7027027027027027, "eval_QUANTITY_recall": 0.7878787878787878, "eval_TIME_f1": 0.8620689655172413, "eval_TIME_number": 28, "eval_TIME_precision": 0.8333333333333334, "eval_TIME_recall": 0.8928571428571429, "eval_loss": 0.19124767184257507, "eval_overall_accuracy": 0.9587778855480117, "eval_overall_f1": 0.8247978436657682, "eval_overall_precision": 0.7746835443037975, "eval_overall_recall": 0.8818443804034583, "eval_runtime": 0.3884, "eval_samples_per_second": 481.417, "eval_steps_per_second": 7.723, "step": 9116 }, { "epoch": 87.0, "grad_norm": 1.295188546180725, "learning_rate": 6.5000000000000004e-06, "loss": 0.0267, "step": 9222 }, { "epoch": 87.0, "eval_LOCATION_f1": 0.782051282051282, "eval_LOCATION_number": 71, "eval_LOCATION_precision": 0.7176470588235294, "eval_LOCATION_recall": 0.8591549295774648, "eval_ORGANIZATION_f1": 0.7466666666666668, "eval_ORGANIZATION_number": 65, "eval_ORGANIZATION_precision": 0.6588235294117647, "eval_ORGANIZATION_recall": 0.8615384615384616, "eval_PERSON_f1": 0.896774193548387, "eval_PERSON_number": 150, "eval_PERSON_precision": 0.86875, "eval_PERSON_recall": 0.9266666666666666, "eval_QUANTITY_f1": 0.7428571428571429, "eval_QUANTITY_number": 33, "eval_QUANTITY_precision": 0.7027027027027027, "eval_QUANTITY_recall": 0.7878787878787878, "eval_TIME_f1": 0.8474576271186439, "eval_TIME_number": 28, "eval_TIME_precision": 0.8064516129032258, "eval_TIME_recall": 0.8928571428571429, "eval_loss": 0.1960640400648117, "eval_overall_accuracy": 0.9575654704170709, "eval_overall_f1": 0.8241610738255033, "eval_overall_precision": 0.7713567839195979, "eval_overall_recall": 0.8847262247838616, "eval_runtime": 0.3903, "eval_samples_per_second": 479.159, "eval_steps_per_second": 7.687, "step": 9222 }, { "epoch": 88.0, "grad_norm": 0.27405989170074463, "learning_rate": 6e-06, "loss": 0.0282, "step": 9328 }, { "epoch": 88.0, "eval_LOCATION_f1": 0.782051282051282, "eval_LOCATION_number": 71, "eval_LOCATION_precision": 0.7176470588235294, "eval_LOCATION_recall": 0.8591549295774648, "eval_ORGANIZATION_f1": 0.7567567567567568, "eval_ORGANIZATION_number": 65, "eval_ORGANIZATION_precision": 0.6746987951807228, "eval_ORGANIZATION_recall": 0.8615384615384616, "eval_PERSON_f1": 0.8867313915857605, "eval_PERSON_number": 150, "eval_PERSON_precision": 0.8616352201257862, "eval_PERSON_recall": 0.9133333333333333, "eval_QUANTITY_f1": 0.6849315068493151, "eval_QUANTITY_number": 33, "eval_QUANTITY_precision": 0.625, "eval_QUANTITY_recall": 0.7575757575757576, "eval_TIME_f1": 0.8333333333333334, "eval_TIME_number": 28, "eval_TIME_precision": 0.78125, "eval_TIME_recall": 0.8928571428571429, "eval_loss": 0.19417804479599, "eval_overall_accuracy": 0.9570805043646945, "eval_overall_f1": 0.8150134048257373, "eval_overall_precision": 0.7619047619047619, "eval_overall_recall": 0.8760806916426513, "eval_runtime": 0.3895, "eval_samples_per_second": 480.08, "eval_steps_per_second": 7.702, "step": 9328 }, { "epoch": 89.0, "grad_norm": 0.466235876083374, "learning_rate": 5.500000000000001e-06, "loss": 0.0251, "step": 9434 }, { "epoch": 89.0, "eval_LOCATION_f1": 0.7948717948717949, "eval_LOCATION_number": 71, "eval_LOCATION_precision": 0.7294117647058823, "eval_LOCATION_recall": 0.8732394366197183, "eval_ORGANIZATION_f1": 0.7619047619047619, "eval_ORGANIZATION_number": 65, "eval_ORGANIZATION_precision": 0.6829268292682927, "eval_ORGANIZATION_recall": 0.8615384615384616, "eval_PERSON_f1": 0.8903225806451613, "eval_PERSON_number": 150, "eval_PERSON_precision": 0.8625, "eval_PERSON_recall": 0.92, "eval_QUANTITY_f1": 0.6849315068493151, "eval_QUANTITY_number": 33, "eval_QUANTITY_precision": 0.625, "eval_QUANTITY_recall": 0.7575757575757576, "eval_TIME_f1": 0.8333333333333334, "eval_TIME_number": 28, "eval_TIME_precision": 0.78125, "eval_TIME_recall": 0.8928571428571429, "eval_loss": 0.2023736834526062, "eval_overall_accuracy": 0.95635305528613, "eval_overall_f1": 0.8203753351206434, "eval_overall_precision": 0.7669172932330827, "eval_overall_recall": 0.8818443804034583, "eval_runtime": 0.388, "eval_samples_per_second": 481.997, "eval_steps_per_second": 7.733, "step": 9434 }, { "epoch": 90.0, "grad_norm": 0.620521068572998, "learning_rate": 5e-06, "loss": 0.027, "step": 9540 }, { "epoch": 90.0, "eval_LOCATION_f1": 0.8051948051948051, "eval_LOCATION_number": 71, "eval_LOCATION_precision": 0.7469879518072289, "eval_LOCATION_recall": 0.8732394366197183, "eval_ORGANIZATION_f1": 0.7567567567567568, "eval_ORGANIZATION_number": 65, "eval_ORGANIZATION_precision": 0.6746987951807228, "eval_ORGANIZATION_recall": 0.8615384615384616, "eval_PERSON_f1": 0.8838709677419355, "eval_PERSON_number": 150, "eval_PERSON_precision": 0.85625, "eval_PERSON_recall": 0.9133333333333333, "eval_QUANTITY_f1": 0.7714285714285715, "eval_QUANTITY_number": 33, "eval_QUANTITY_precision": 0.7297297297297297, "eval_QUANTITY_recall": 0.8181818181818182, "eval_TIME_f1": 0.8620689655172413, "eval_TIME_number": 28, "eval_TIME_precision": 0.8333333333333334, "eval_TIME_recall": 0.8928571428571429, "eval_loss": 0.19653601944446564, "eval_overall_accuracy": 0.9582929194956353, "eval_overall_f1": 0.8297297297297298, "eval_overall_precision": 0.7811704834605598, "eval_overall_recall": 0.8847262247838616, "eval_runtime": 0.3866, "eval_samples_per_second": 483.702, "eval_steps_per_second": 7.76, "step": 9540 }, { "epoch": 91.0, "grad_norm": 1.394244909286499, "learning_rate": 4.5e-06, "loss": 0.0268, "step": 9646 }, { "epoch": 91.0, "eval_LOCATION_f1": 0.7741935483870968, "eval_LOCATION_number": 71, "eval_LOCATION_precision": 0.7142857142857143, "eval_LOCATION_recall": 0.8450704225352113, "eval_ORGANIZATION_f1": 0.7567567567567568, "eval_ORGANIZATION_number": 65, "eval_ORGANIZATION_precision": 0.6746987951807228, "eval_ORGANIZATION_recall": 0.8615384615384616, "eval_PERSON_f1": 0.887459807073955, "eval_PERSON_number": 150, "eval_PERSON_precision": 0.8571428571428571, "eval_PERSON_recall": 0.92, "eval_QUANTITY_f1": 0.7605633802816901, "eval_QUANTITY_number": 33, "eval_QUANTITY_precision": 0.7105263157894737, "eval_QUANTITY_recall": 0.8181818181818182, "eval_TIME_f1": 0.8620689655172413, "eval_TIME_number": 28, "eval_TIME_precision": 0.8333333333333334, "eval_TIME_recall": 0.8928571428571429, "eval_loss": 0.2078668475151062, "eval_overall_accuracy": 0.9561105722599418, "eval_overall_f1": 0.8236877523553162, "eval_overall_precision": 0.7727272727272727, "eval_overall_recall": 0.8818443804034583, "eval_runtime": 0.3925, "eval_samples_per_second": 476.384, "eval_steps_per_second": 7.643, "step": 9646 }, { "epoch": 92.0, "grad_norm": 0.33064666390419006, "learning_rate": 4.000000000000001e-06, "loss": 0.0256, "step": 9752 }, { "epoch": 92.0, "eval_LOCATION_f1": 0.8076923076923077, "eval_LOCATION_number": 71, "eval_LOCATION_precision": 0.7411764705882353, "eval_LOCATION_recall": 0.8873239436619719, "eval_ORGANIZATION_f1": 0.7466666666666668, "eval_ORGANIZATION_number": 65, "eval_ORGANIZATION_precision": 0.6588235294117647, "eval_ORGANIZATION_recall": 0.8615384615384616, "eval_PERSON_f1": 0.8903225806451613, "eval_PERSON_number": 150, "eval_PERSON_precision": 0.8625, "eval_PERSON_recall": 0.92, "eval_QUANTITY_f1": 0.7428571428571429, "eval_QUANTITY_number": 33, "eval_QUANTITY_precision": 0.7027027027027027, "eval_QUANTITY_recall": 0.7878787878787878, "eval_TIME_f1": 0.8333333333333334, "eval_TIME_number": 28, "eval_TIME_precision": 0.78125, "eval_TIME_recall": 0.8928571428571429, "eval_loss": 0.19762425124645233, "eval_overall_accuracy": 0.957807953443259, "eval_overall_f1": 0.8257372654155496, "eval_overall_precision": 0.7719298245614035, "eval_overall_recall": 0.8876080691642652, "eval_runtime": 0.3867, "eval_samples_per_second": 483.56, "eval_steps_per_second": 7.758, "step": 9752 }, { "epoch": 93.0, "grad_norm": 0.47633665800094604, "learning_rate": 3.5000000000000004e-06, "loss": 0.0258, "step": 9858 }, { "epoch": 93.0, "eval_LOCATION_f1": 0.8051948051948051, "eval_LOCATION_number": 71, "eval_LOCATION_precision": 0.7469879518072289, "eval_LOCATION_recall": 0.8732394366197183, "eval_ORGANIZATION_f1": 0.7417218543046358, "eval_ORGANIZATION_number": 65, "eval_ORGANIZATION_precision": 0.6511627906976745, "eval_ORGANIZATION_recall": 0.8615384615384616, "eval_PERSON_f1": 0.8838709677419355, "eval_PERSON_number": 150, "eval_PERSON_precision": 0.85625, "eval_PERSON_recall": 0.9133333333333333, "eval_QUANTITY_f1": 0.7428571428571429, "eval_QUANTITY_number": 33, "eval_QUANTITY_precision": 0.7027027027027027, "eval_QUANTITY_recall": 0.7878787878787878, "eval_TIME_f1": 0.8333333333333334, "eval_TIME_number": 28, "eval_TIME_precision": 0.78125, "eval_TIME_recall": 0.8928571428571429, "eval_loss": 0.1961781531572342, "eval_overall_accuracy": 0.957807953443259, "eval_overall_f1": 0.8214765100671141, "eval_overall_precision": 0.7688442211055276, "eval_overall_recall": 0.8818443804034583, "eval_runtime": 0.3869, "eval_samples_per_second": 483.349, "eval_steps_per_second": 7.754, "step": 9858 }, { "epoch": 94.0, "grad_norm": 0.8689398169517517, "learning_rate": 3e-06, "loss": 0.0233, "step": 9964 }, { "epoch": 94.0, "eval_LOCATION_f1": 0.8, "eval_LOCATION_number": 71, "eval_LOCATION_precision": 0.7380952380952381, "eval_LOCATION_recall": 0.8732394366197183, "eval_ORGANIZATION_f1": 0.7466666666666668, "eval_ORGANIZATION_number": 65, "eval_ORGANIZATION_precision": 0.6588235294117647, "eval_ORGANIZATION_recall": 0.8615384615384616, "eval_PERSON_f1": 0.8838709677419355, "eval_PERSON_number": 150, "eval_PERSON_precision": 0.85625, "eval_PERSON_recall": 0.9133333333333333, "eval_QUANTITY_f1": 0.7428571428571429, "eval_QUANTITY_number": 33, "eval_QUANTITY_precision": 0.7027027027027027, "eval_QUANTITY_recall": 0.7878787878787878, "eval_TIME_f1": 0.8333333333333334, "eval_TIME_number": 28, "eval_TIME_precision": 0.78125, "eval_TIME_recall": 0.8928571428571429, "eval_loss": 0.19755157828330994, "eval_overall_accuracy": 0.9570805043646945, "eval_overall_f1": 0.8214765100671141, "eval_overall_precision": 0.7688442211055276, "eval_overall_recall": 0.8818443804034583, "eval_runtime": 0.3876, "eval_samples_per_second": 482.46, "eval_steps_per_second": 7.74, "step": 9964 }, { "epoch": 95.0, "grad_norm": 0.12069670855998993, "learning_rate": 2.5e-06, "loss": 0.0259, "step": 10070 }, { "epoch": 95.0, "eval_LOCATION_f1": 0.8, "eval_LOCATION_number": 71, "eval_LOCATION_precision": 0.7380952380952381, "eval_LOCATION_recall": 0.8732394366197183, "eval_ORGANIZATION_f1": 0.7482993197278912, "eval_ORGANIZATION_number": 65, "eval_ORGANIZATION_precision": 0.6707317073170732, "eval_ORGANIZATION_recall": 0.8461538461538461, "eval_PERSON_f1": 0.8838709677419355, "eval_PERSON_number": 150, "eval_PERSON_precision": 0.85625, "eval_PERSON_recall": 0.9133333333333333, "eval_QUANTITY_f1": 0.7428571428571429, "eval_QUANTITY_number": 33, "eval_QUANTITY_precision": 0.7027027027027027, "eval_QUANTITY_recall": 0.7878787878787878, "eval_TIME_f1": 0.8333333333333334, "eval_TIME_number": 28, "eval_TIME_precision": 0.78125, "eval_TIME_recall": 0.8928571428571429, "eval_loss": 0.19969353079795837, "eval_overall_accuracy": 0.9582929194956353, "eval_overall_f1": 0.8221024258760108, "eval_overall_precision": 0.7721518987341772, "eval_overall_recall": 0.8789625360230547, "eval_runtime": 0.3888, "eval_samples_per_second": 480.915, "eval_steps_per_second": 7.715, "step": 10070 }, { "epoch": 96.0, "grad_norm": 0.6587622761726379, "learning_rate": 2.0000000000000003e-06, "loss": 0.0253, "step": 10176 }, { "epoch": 96.0, "eval_LOCATION_f1": 0.782051282051282, "eval_LOCATION_number": 71, "eval_LOCATION_precision": 0.7176470588235294, "eval_LOCATION_recall": 0.8591549295774648, "eval_ORGANIZATION_f1": 0.7516778523489933, "eval_ORGANIZATION_number": 65, "eval_ORGANIZATION_precision": 0.6666666666666666, "eval_ORGANIZATION_recall": 0.8615384615384616, "eval_PERSON_f1": 0.887459807073955, "eval_PERSON_number": 150, "eval_PERSON_precision": 0.8571428571428571, "eval_PERSON_recall": 0.92, "eval_QUANTITY_f1": 0.7428571428571429, "eval_QUANTITY_number": 33, "eval_QUANTITY_precision": 0.7027027027027027, "eval_QUANTITY_recall": 0.7878787878787878, "eval_TIME_f1": 0.8333333333333334, "eval_TIME_number": 28, "eval_TIME_precision": 0.78125, "eval_TIME_recall": 0.8928571428571429, "eval_loss": 0.20329639315605164, "eval_overall_accuracy": 0.95635305528613, "eval_overall_f1": 0.8203753351206434, "eval_overall_precision": 0.7669172932330827, "eval_overall_recall": 0.8818443804034583, "eval_runtime": 0.3887, "eval_samples_per_second": 481.079, "eval_steps_per_second": 7.718, "step": 10176 }, { "epoch": 97.0, "grad_norm": 0.5734129548072815, "learning_rate": 1.5e-06, "loss": 0.0251, "step": 10282 }, { "epoch": 97.0, "eval_LOCATION_f1": 0.7870967741935485, "eval_LOCATION_number": 71, "eval_LOCATION_precision": 0.7261904761904762, "eval_LOCATION_recall": 0.8591549295774648, "eval_ORGANIZATION_f1": 0.7516778523489933, "eval_ORGANIZATION_number": 65, "eval_ORGANIZATION_precision": 0.6666666666666666, "eval_ORGANIZATION_recall": 0.8615384615384616, "eval_PERSON_f1": 0.8903225806451613, "eval_PERSON_number": 150, "eval_PERSON_precision": 0.8625, "eval_PERSON_recall": 0.92, "eval_QUANTITY_f1": 0.7428571428571429, "eval_QUANTITY_number": 33, "eval_QUANTITY_precision": 0.7027027027027027, "eval_QUANTITY_recall": 0.7878787878787878, "eval_TIME_f1": 0.8333333333333334, "eval_TIME_number": 28, "eval_TIME_precision": 0.78125, "eval_TIME_recall": 0.8928571428571429, "eval_loss": 0.20106351375579834, "eval_overall_accuracy": 0.9573229873908826, "eval_overall_f1": 0.8225806451612904, "eval_overall_precision": 0.7707808564231738, "eval_overall_recall": 0.8818443804034583, "eval_runtime": 0.3868, "eval_samples_per_second": 483.477, "eval_steps_per_second": 7.756, "step": 10282 }, { "epoch": 98.0, "grad_norm": 0.6452818512916565, "learning_rate": 1.0000000000000002e-06, "loss": 0.0237, "step": 10388 }, { "epoch": 98.0, "eval_LOCATION_f1": 0.7948717948717949, "eval_LOCATION_number": 71, "eval_LOCATION_precision": 0.7294117647058823, "eval_LOCATION_recall": 0.8732394366197183, "eval_ORGANIZATION_f1": 0.7417218543046358, "eval_ORGANIZATION_number": 65, "eval_ORGANIZATION_precision": 0.6511627906976745, "eval_ORGANIZATION_recall": 0.8615384615384616, "eval_PERSON_f1": 0.8938906752411575, "eval_PERSON_number": 150, "eval_PERSON_precision": 0.8633540372670807, "eval_PERSON_recall": 0.9266666666666666, "eval_QUANTITY_f1": 0.7428571428571429, "eval_QUANTITY_number": 33, "eval_QUANTITY_precision": 0.7027027027027027, "eval_QUANTITY_recall": 0.7878787878787878, "eval_TIME_f1": 0.8333333333333334, "eval_TIME_number": 28, "eval_TIME_precision": 0.78125, "eval_TIME_recall": 0.8928571428571429, "eval_loss": 0.20484283566474915, "eval_overall_accuracy": 0.9565955383123181, "eval_overall_f1": 0.823529411764706, "eval_overall_precision": 0.7680798004987531, "eval_overall_recall": 0.8876080691642652, "eval_runtime": 0.3875, "eval_samples_per_second": 482.528, "eval_steps_per_second": 7.741, "step": 10388 }, { "epoch": 99.0, "grad_norm": 0.052759163081645966, "learning_rate": 5.000000000000001e-07, "loss": 0.024, "step": 10494 }, { "epoch": 99.0, "eval_LOCATION_f1": 0.8, "eval_LOCATION_number": 71, "eval_LOCATION_precision": 0.7380952380952381, "eval_LOCATION_recall": 0.8732394366197183, "eval_ORGANIZATION_f1": 0.7516778523489933, "eval_ORGANIZATION_number": 65, "eval_ORGANIZATION_precision": 0.6666666666666666, "eval_ORGANIZATION_recall": 0.8615384615384616, "eval_PERSON_f1": 0.8938906752411575, "eval_PERSON_number": 150, "eval_PERSON_precision": 0.8633540372670807, "eval_PERSON_recall": 0.9266666666666666, "eval_QUANTITY_f1": 0.7428571428571429, "eval_QUANTITY_number": 33, "eval_QUANTITY_precision": 0.7027027027027027, "eval_QUANTITY_recall": 0.7878787878787878, "eval_TIME_f1": 0.8333333333333334, "eval_TIME_number": 28, "eval_TIME_precision": 0.78125, "eval_TIME_recall": 0.8928571428571429, "eval_loss": 0.20229747891426086, "eval_overall_accuracy": 0.9573229873908826, "eval_overall_f1": 0.8268456375838926, "eval_overall_precision": 0.7738693467336684, "eval_overall_recall": 0.8876080691642652, "eval_runtime": 0.3867, "eval_samples_per_second": 483.518, "eval_steps_per_second": 7.757, "step": 10494 }, { "epoch": 100.0, "grad_norm": 0.5731909871101379, "learning_rate": 0.0, "loss": 0.0257, "step": 10600 }, { "epoch": 100.0, "eval_LOCATION_f1": 0.8, "eval_LOCATION_number": 71, "eval_LOCATION_precision": 0.7380952380952381, "eval_LOCATION_recall": 0.8732394366197183, "eval_ORGANIZATION_f1": 0.7567567567567568, "eval_ORGANIZATION_number": 65, "eval_ORGANIZATION_precision": 0.6746987951807228, "eval_ORGANIZATION_recall": 0.8615384615384616, "eval_PERSON_f1": 0.8938906752411575, "eval_PERSON_number": 150, "eval_PERSON_precision": 0.8633540372670807, "eval_PERSON_recall": 0.9266666666666666, "eval_QUANTITY_f1": 0.7428571428571429, "eval_QUANTITY_number": 33, "eval_QUANTITY_precision": 0.7027027027027027, "eval_QUANTITY_recall": 0.7878787878787878, "eval_TIME_f1": 0.8333333333333334, "eval_TIME_number": 28, "eval_TIME_precision": 0.78125, "eval_TIME_recall": 0.8928571428571429, "eval_loss": 0.2022850662469864, "eval_overall_accuracy": 0.9575654704170709, "eval_overall_f1": 0.8279569892473119, "eval_overall_precision": 0.7758186397984886, "eval_overall_recall": 0.8876080691642652, "eval_runtime": 0.3873, "eval_samples_per_second": 482.826, "eval_steps_per_second": 7.746, "step": 10600 }, { "epoch": 100.0, "step": 10600, "total_flos": 5123217774191952.0, "train_loss": 0.07238403747666557, "train_runtime": 624.3551, "train_samples_per_second": 270.359, "train_steps_per_second": 16.978 } ], "logging_steps": 500, "max_steps": 10600, "num_input_tokens_seen": 0, "num_train_epochs": 100, "save_steps": 500, "total_flos": 5123217774191952.0, "train_batch_size": 16, "trial_name": null, "trial_params": null }