{ "best_metric": null, "best_model_checkpoint": null, "epoch": 100.0, "eval_steps": 500, "global_step": 10600, "is_hyper_param_search": false, "is_local_process_zero": true, "is_world_process_zero": true, "log_history": [ { "epoch": 1.0, "grad_norm": 0.8392817974090576, "learning_rate": 4.9500000000000004e-05, "loss": 0.9688, "step": 106 }, { "epoch": 1.0, "eval_LOCATION_f1": 0.0, "eval_LOCATION_number": 69, "eval_LOCATION_precision": 0.0, "eval_LOCATION_recall": 0.0, "eval_ORGANIZATION_f1": 0.0, "eval_ORGANIZATION_number": 58, "eval_ORGANIZATION_precision": 0.0, "eval_ORGANIZATION_recall": 0.0, "eval_PERSON_f1": 0.0879120879120879, "eval_PERSON_number": 152, "eval_PERSON_precision": 0.26666666666666666, "eval_PERSON_recall": 0.05263157894736842, "eval_QUANTITY_f1": 0.0, "eval_QUANTITY_number": 30, "eval_QUANTITY_precision": 0.0, "eval_QUANTITY_recall": 0.0, "eval_TIME_f1": 0.0, "eval_TIME_number": 29, "eval_TIME_precision": 0.0, "eval_TIME_recall": 0.0, "eval_loss": 0.5576337575912476, "eval_overall_accuracy": 0.8432778489116517, "eval_overall_f1": 0.042666666666666665, "eval_overall_precision": 0.21621621621621623, "eval_overall_recall": 0.023668639053254437, "eval_runtime": 0.3335, "eval_samples_per_second": 560.647, "eval_steps_per_second": 8.994, "step": 106 }, { "epoch": 2.0, "grad_norm": 1.1076773405075073, "learning_rate": 4.9e-05, "loss": 0.4767, "step": 212 }, { "epoch": 2.0, "eval_LOCATION_f1": 0.288659793814433, "eval_LOCATION_number": 69, "eval_LOCATION_precision": 0.5, "eval_LOCATION_recall": 0.2028985507246377, "eval_ORGANIZATION_f1": 0.07058823529411765, "eval_ORGANIZATION_number": 58, "eval_ORGANIZATION_precision": 0.1111111111111111, "eval_ORGANIZATION_recall": 0.05172413793103448, "eval_PERSON_f1": 0.5936739659367396, "eval_PERSON_number": 152, "eval_PERSON_precision": 0.47104247104247104, "eval_PERSON_recall": 0.8026315789473685, "eval_QUANTITY_f1": 0.11111111111111112, "eval_QUANTITY_number": 30, "eval_QUANTITY_precision": 0.125, "eval_QUANTITY_recall": 0.1, "eval_TIME_f1": 0.523076923076923, "eval_TIME_number": 29, "eval_TIME_precision": 0.4722222222222222, "eval_TIME_recall": 0.5862068965517241, "eval_loss": 0.31268012523651123, "eval_overall_accuracy": 0.8991037131882202, "eval_overall_f1": 0.44662921348314605, "eval_overall_precision": 0.42513368983957217, "eval_overall_recall": 0.47041420118343197, "eval_runtime": 0.3348, "eval_samples_per_second": 558.483, "eval_steps_per_second": 8.96, "step": 212 }, { "epoch": 3.0, "grad_norm": 1.2600445747375488, "learning_rate": 4.85e-05, "loss": 0.2969, "step": 318 }, { "epoch": 3.0, "eval_LOCATION_f1": 0.6303030303030303, "eval_LOCATION_number": 69, "eval_LOCATION_precision": 0.5416666666666666, "eval_LOCATION_recall": 0.7536231884057971, "eval_ORGANIZATION_f1": 0.4605263157894736, "eval_ORGANIZATION_number": 58, "eval_ORGANIZATION_precision": 0.3723404255319149, "eval_ORGANIZATION_recall": 0.603448275862069, "eval_PERSON_f1": 0.8085106382978723, "eval_PERSON_number": 152, "eval_PERSON_precision": 0.751412429378531, "eval_PERSON_recall": 0.875, "eval_QUANTITY_f1": 0.7027027027027029, "eval_QUANTITY_number": 30, "eval_QUANTITY_precision": 0.5909090909090909, "eval_QUANTITY_recall": 0.8666666666666667, "eval_TIME_f1": 0.7301587301587301, "eval_TIME_number": 29, "eval_TIME_precision": 0.6764705882352942, "eval_TIME_recall": 0.7931034482758621, "eval_loss": 0.22261539101600647, "eval_overall_accuracy": 0.9275288092189501, "eval_overall_f1": 0.6871008939974458, "eval_overall_precision": 0.604494382022472, "eval_overall_recall": 0.7958579881656804, "eval_runtime": 0.333, "eval_samples_per_second": 561.501, "eval_steps_per_second": 9.008, "step": 318 }, { "epoch": 4.0, "grad_norm": 1.1735649108886719, "learning_rate": 4.8e-05, "loss": 0.2125, "step": 424 }, { "epoch": 4.0, "eval_LOCATION_f1": 0.7346938775510203, "eval_LOCATION_number": 69, "eval_LOCATION_precision": 0.6923076923076923, "eval_LOCATION_recall": 0.782608695652174, "eval_ORGANIZATION_f1": 0.5354330708661417, "eval_ORGANIZATION_number": 58, "eval_ORGANIZATION_precision": 0.4927536231884058, "eval_ORGANIZATION_recall": 0.5862068965517241, "eval_PERSON_f1": 0.8288288288288289, "eval_PERSON_number": 152, "eval_PERSON_precision": 0.7624309392265194, "eval_PERSON_recall": 0.9078947368421053, "eval_QUANTITY_f1": 0.6944444444444444, "eval_QUANTITY_number": 30, "eval_QUANTITY_precision": 0.5952380952380952, "eval_QUANTITY_recall": 0.8333333333333334, "eval_TIME_f1": 0.7076923076923076, "eval_TIME_number": 29, "eval_TIME_precision": 0.6388888888888888, "eval_TIME_recall": 0.7931034482758621, "eval_loss": 0.17351830005645752, "eval_overall_accuracy": 0.9400768245838669, "eval_overall_f1": 0.7365591397849461, "eval_overall_precision": 0.6748768472906403, "eval_overall_recall": 0.8106508875739645, "eval_runtime": 0.3365, "eval_samples_per_second": 555.787, "eval_steps_per_second": 8.916, "step": 424 }, { "epoch": 5.0, "grad_norm": 1.4631017446517944, "learning_rate": 4.75e-05, "loss": 0.1759, "step": 530 }, { "epoch": 5.0, "eval_LOCATION_f1": 0.6762589928057554, "eval_LOCATION_number": 69, "eval_LOCATION_precision": 0.6714285714285714, "eval_LOCATION_recall": 0.6811594202898551, "eval_ORGANIZATION_f1": 0.6056338028169014, "eval_ORGANIZATION_number": 58, "eval_ORGANIZATION_precision": 0.5119047619047619, "eval_ORGANIZATION_recall": 0.7413793103448276, "eval_PERSON_f1": 0.8466257668711656, "eval_PERSON_number": 152, "eval_PERSON_precision": 0.7931034482758621, "eval_PERSON_recall": 0.9078947368421053, "eval_QUANTITY_f1": 0.7164179104477612, "eval_QUANTITY_number": 30, "eval_QUANTITY_precision": 0.6486486486486487, "eval_QUANTITY_recall": 0.8, "eval_TIME_f1": 0.8275862068965517, "eval_TIME_number": 29, "eval_TIME_precision": 0.8275862068965517, "eval_TIME_recall": 0.8275862068965517, "eval_loss": 0.14357861876487732, "eval_overall_accuracy": 0.9475032010243278, "eval_overall_f1": 0.7540983606557377, "eval_overall_precision": 0.700507614213198, "eval_overall_recall": 0.8165680473372781, "eval_runtime": 0.3351, "eval_samples_per_second": 558.08, "eval_steps_per_second": 8.953, "step": 530 }, { "epoch": 6.0, "grad_norm": 0.8950690627098083, "learning_rate": 4.7e-05, "loss": 0.1548, "step": 636 }, { "epoch": 6.0, "eval_LOCATION_f1": 0.7922077922077921, "eval_LOCATION_number": 69, "eval_LOCATION_precision": 0.7176470588235294, "eval_LOCATION_recall": 0.8840579710144928, "eval_ORGANIZATION_f1": 0.6811594202898551, "eval_ORGANIZATION_number": 58, "eval_ORGANIZATION_precision": 0.5875, "eval_ORGANIZATION_recall": 0.8103448275862069, "eval_PERSON_f1": 0.8518518518518517, "eval_PERSON_number": 152, "eval_PERSON_precision": 0.8023255813953488, "eval_PERSON_recall": 0.9078947368421053, "eval_QUANTITY_f1": 0.7142857142857143, "eval_QUANTITY_number": 30, "eval_QUANTITY_precision": 0.625, "eval_QUANTITY_recall": 0.8333333333333334, "eval_TIME_f1": 0.75, "eval_TIME_number": 29, "eval_TIME_precision": 0.6857142857142857, "eval_TIME_recall": 0.8275862068965517, "eval_loss": 0.14464175701141357, "eval_overall_accuracy": 0.952112676056338, "eval_overall_f1": 0.7866666666666666, "eval_overall_precision": 0.7160194174757282, "eval_overall_recall": 0.8727810650887574, "eval_runtime": 0.3323, "eval_samples_per_second": 562.696, "eval_steps_per_second": 9.027, "step": 636 }, { "epoch": 7.0, "grad_norm": 0.48694196343421936, "learning_rate": 4.6500000000000005e-05, "loss": 0.1452, "step": 742 }, { "epoch": 7.0, "eval_LOCATION_f1": 0.8289473684210527, "eval_LOCATION_number": 69, "eval_LOCATION_precision": 0.7590361445783133, "eval_LOCATION_recall": 0.9130434782608695, "eval_ORGANIZATION_f1": 0.6870229007633589, "eval_ORGANIZATION_number": 58, "eval_ORGANIZATION_precision": 0.6164383561643836, "eval_ORGANIZATION_recall": 0.7758620689655172, "eval_PERSON_f1": 0.875, "eval_PERSON_number": 152, "eval_PERSON_precision": 0.8333333333333334, "eval_PERSON_recall": 0.9210526315789473, "eval_QUANTITY_f1": 0.6153846153846154, "eval_QUANTITY_number": 30, "eval_QUANTITY_precision": 0.5, "eval_QUANTITY_recall": 0.8, "eval_TIME_f1": 0.7741935483870968, "eval_TIME_number": 29, "eval_TIME_precision": 0.7272727272727273, "eval_TIME_recall": 0.8275862068965517, "eval_loss": 0.14724624156951904, "eval_overall_accuracy": 0.9510883482714468, "eval_overall_f1": 0.7967698519515478, "eval_overall_precision": 0.7308641975308642, "eval_overall_recall": 0.8757396449704142, "eval_runtime": 0.3323, "eval_samples_per_second": 562.777, "eval_steps_per_second": 9.029, "step": 742 }, { "epoch": 8.0, "grad_norm": 0.39879658818244934, "learning_rate": 4.600000000000001e-05, "loss": 0.1368, "step": 848 }, { "epoch": 8.0, "eval_LOCATION_f1": 0.8378378378378378, "eval_LOCATION_number": 69, "eval_LOCATION_precision": 0.7848101265822784, "eval_LOCATION_recall": 0.8985507246376812, "eval_ORGANIZATION_f1": 0.7142857142857144, "eval_ORGANIZATION_number": 58, "eval_ORGANIZATION_precision": 0.6097560975609756, "eval_ORGANIZATION_recall": 0.8620689655172413, "eval_PERSON_f1": 0.8722741433021807, "eval_PERSON_number": 152, "eval_PERSON_precision": 0.8284023668639053, "eval_PERSON_recall": 0.9210526315789473, "eval_QUANTITY_f1": 0.746268656716418, "eval_QUANTITY_number": 30, "eval_QUANTITY_precision": 0.6756756756756757, "eval_QUANTITY_recall": 0.8333333333333334, "eval_TIME_f1": 0.6376811594202898, "eval_TIME_number": 29, "eval_TIME_precision": 0.55, "eval_TIME_recall": 0.7586206896551724, "eval_loss": 0.1397438496351242, "eval_overall_accuracy": 0.9539052496798975, "eval_overall_f1": 0.8026845637583893, "eval_overall_precision": 0.7346437346437347, "eval_overall_recall": 0.8846153846153846, "eval_runtime": 0.3334, "eval_samples_per_second": 560.876, "eval_steps_per_second": 8.998, "step": 848 }, { "epoch": 9.0, "grad_norm": 1.2802802324295044, "learning_rate": 4.55e-05, "loss": 0.1278, "step": 954 }, { "epoch": 9.0, "eval_LOCATION_f1": 0.8258064516129032, "eval_LOCATION_number": 69, "eval_LOCATION_precision": 0.7441860465116279, "eval_LOCATION_recall": 0.927536231884058, "eval_ORGANIZATION_f1": 0.5950413223140496, "eval_ORGANIZATION_number": 58, "eval_ORGANIZATION_precision": 0.5714285714285714, "eval_ORGANIZATION_recall": 0.6206896551724138, "eval_PERSON_f1": 0.8623853211009175, "eval_PERSON_number": 152, "eval_PERSON_precision": 0.8057142857142857, "eval_PERSON_recall": 0.9276315789473685, "eval_QUANTITY_f1": 0.7352941176470588, "eval_QUANTITY_number": 30, "eval_QUANTITY_precision": 0.6578947368421053, "eval_QUANTITY_recall": 0.8333333333333334, "eval_TIME_f1": 0.6571428571428573, "eval_TIME_number": 29, "eval_TIME_precision": 0.5609756097560976, "eval_TIME_recall": 0.7931034482758621, "eval_loss": 0.14592860639095306, "eval_overall_accuracy": 0.9528809218950064, "eval_overall_f1": 0.7800269905533064, "eval_overall_precision": 0.71712158808933, "eval_overall_recall": 0.8550295857988166, "eval_runtime": 0.3343, "eval_samples_per_second": 559.31, "eval_steps_per_second": 8.973, "step": 954 }, { "epoch": 10.0, "grad_norm": 1.4159973859786987, "learning_rate": 4.5e-05, "loss": 0.1202, "step": 1060 }, { "epoch": 10.0, "eval_LOCATION_f1": 0.7999999999999999, "eval_LOCATION_number": 69, "eval_LOCATION_precision": 0.7209302325581395, "eval_LOCATION_recall": 0.8985507246376812, "eval_ORGANIZATION_f1": 0.6614173228346457, "eval_ORGANIZATION_number": 58, "eval_ORGANIZATION_precision": 0.6086956521739131, "eval_ORGANIZATION_recall": 0.7241379310344828, "eval_PERSON_f1": 0.877742946708464, "eval_PERSON_number": 152, "eval_PERSON_precision": 0.8383233532934131, "eval_PERSON_recall": 0.9210526315789473, "eval_QUANTITY_f1": 0.6944444444444444, "eval_QUANTITY_number": 30, "eval_QUANTITY_precision": 0.5952380952380952, "eval_QUANTITY_recall": 0.8333333333333334, "eval_TIME_f1": 0.8064516129032258, "eval_TIME_number": 29, "eval_TIME_precision": 0.7575757575757576, "eval_TIME_recall": 0.8620689655172413, "eval_loss": 0.13962122797966003, "eval_overall_accuracy": 0.9559539052496799, "eval_overall_f1": 0.8, "eval_overall_precision": 0.7405541561712846, "eval_overall_recall": 0.8698224852071006, "eval_runtime": 0.3332, "eval_samples_per_second": 561.16, "eval_steps_per_second": 9.003, "step": 1060 }, { "epoch": 11.0, "grad_norm": 1.0556025505065918, "learning_rate": 4.4500000000000004e-05, "loss": 0.1166, "step": 1166 }, { "epoch": 11.0, "eval_LOCATION_f1": 0.8552631578947367, "eval_LOCATION_number": 69, "eval_LOCATION_precision": 0.7831325301204819, "eval_LOCATION_recall": 0.9420289855072463, "eval_ORGANIZATION_f1": 0.6515151515151516, "eval_ORGANIZATION_number": 58, "eval_ORGANIZATION_precision": 0.581081081081081, "eval_ORGANIZATION_recall": 0.7413793103448276, "eval_PERSON_f1": 0.88125, "eval_PERSON_number": 152, "eval_PERSON_precision": 0.8392857142857143, "eval_PERSON_recall": 0.9276315789473685, "eval_QUANTITY_f1": 0.6944444444444444, "eval_QUANTITY_number": 30, "eval_QUANTITY_precision": 0.5952380952380952, "eval_QUANTITY_recall": 0.8333333333333334, "eval_TIME_f1": 0.75, "eval_TIME_number": 29, "eval_TIME_precision": 0.6857142857142857, "eval_TIME_recall": 0.8275862068965517, "eval_loss": 0.13871203362941742, "eval_overall_accuracy": 0.9556978233034571, "eval_overall_f1": 0.8054054054054053, "eval_overall_precision": 0.7412935323383084, "eval_overall_recall": 0.8816568047337278, "eval_runtime": 0.3363, "eval_samples_per_second": 556.023, "eval_steps_per_second": 8.92, "step": 1166 }, { "epoch": 12.0, "grad_norm": 1.1935970783233643, "learning_rate": 4.4000000000000006e-05, "loss": 0.1108, "step": 1272 }, { "epoch": 12.0, "eval_LOCATION_f1": 0.8571428571428572, "eval_LOCATION_number": 69, "eval_LOCATION_precision": 0.8076923076923077, "eval_LOCATION_recall": 0.9130434782608695, "eval_ORGANIZATION_f1": 0.5641025641025641, "eval_ORGANIZATION_number": 58, "eval_ORGANIZATION_precision": 0.559322033898305, "eval_ORGANIZATION_recall": 0.5689655172413793, "eval_PERSON_f1": 0.888888888888889, "eval_PERSON_number": 152, "eval_PERSON_precision": 0.8588957055214724, "eval_PERSON_recall": 0.9210526315789473, "eval_QUANTITY_f1": 0.7352941176470588, "eval_QUANTITY_number": 30, "eval_QUANTITY_precision": 0.6578947368421053, "eval_QUANTITY_recall": 0.8333333333333334, "eval_TIME_f1": 0.7999999999999999, "eval_TIME_number": 29, "eval_TIME_precision": 0.7741935483870968, "eval_TIME_recall": 0.8275862068965517, "eval_loss": 0.13067495822906494, "eval_overall_accuracy": 0.9580025608194622, "eval_overall_f1": 0.8062234794908061, "eval_overall_precision": 0.7723577235772358, "eval_overall_recall": 0.8431952662721893, "eval_runtime": 0.3341, "eval_samples_per_second": 559.688, "eval_steps_per_second": 8.979, "step": 1272 }, { "epoch": 13.0, "grad_norm": 0.38182273507118225, "learning_rate": 4.35e-05, "loss": 0.1052, "step": 1378 }, { "epoch": 13.0, "eval_LOCATION_f1": 0.8476821192052981, "eval_LOCATION_number": 69, "eval_LOCATION_precision": 0.7804878048780488, "eval_LOCATION_recall": 0.927536231884058, "eval_ORGANIZATION_f1": 0.71875, "eval_ORGANIZATION_number": 58, "eval_ORGANIZATION_precision": 0.6571428571428571, "eval_ORGANIZATION_recall": 0.7931034482758621, "eval_PERSON_f1": 0.8952380952380953, "eval_PERSON_number": 152, "eval_PERSON_precision": 0.8650306748466258, "eval_PERSON_recall": 0.9276315789473685, "eval_QUANTITY_f1": 0.7384615384615385, "eval_QUANTITY_number": 30, "eval_QUANTITY_precision": 0.6857142857142857, "eval_QUANTITY_recall": 0.8, "eval_TIME_f1": 0.7619047619047619, "eval_TIME_number": 29, "eval_TIME_precision": 0.7058823529411765, "eval_TIME_recall": 0.8275862068965517, "eval_loss": 0.13124220073223114, "eval_overall_accuracy": 0.9613316261203585, "eval_overall_f1": 0.8282548476454293, "eval_overall_precision": 0.7786458333333334, "eval_overall_recall": 0.8846153846153846, "eval_runtime": 0.3361, "eval_samples_per_second": 556.458, "eval_steps_per_second": 8.927, "step": 1378 }, { "epoch": 14.0, "grad_norm": 1.8100732564926147, "learning_rate": 4.3e-05, "loss": 0.104, "step": 1484 }, { "epoch": 14.0, "eval_LOCATION_f1": 0.863013698630137, "eval_LOCATION_number": 69, "eval_LOCATION_precision": 0.8181818181818182, "eval_LOCATION_recall": 0.9130434782608695, "eval_ORGANIZATION_f1": 0.6991869918699186, "eval_ORGANIZATION_number": 58, "eval_ORGANIZATION_precision": 0.6615384615384615, "eval_ORGANIZATION_recall": 0.7413793103448276, "eval_PERSON_f1": 0.9085173501577286, "eval_PERSON_number": 152, "eval_PERSON_precision": 0.8727272727272727, "eval_PERSON_recall": 0.9473684210526315, "eval_QUANTITY_f1": 0.6956521739130435, "eval_QUANTITY_number": 30, "eval_QUANTITY_precision": 0.6153846153846154, "eval_QUANTITY_recall": 0.8, "eval_TIME_f1": 0.7419354838709677, "eval_TIME_number": 29, "eval_TIME_precision": 0.696969696969697, "eval_TIME_recall": 0.7931034482758621, "eval_loss": 0.13739244639873505, "eval_overall_accuracy": 0.9608194622279129, "eval_overall_f1": 0.8284518828451882, "eval_overall_precision": 0.783641160949868, "eval_overall_recall": 0.878698224852071, "eval_runtime": 0.3335, "eval_samples_per_second": 560.761, "eval_steps_per_second": 8.996, "step": 1484 }, { "epoch": 15.0, "grad_norm": 1.0627801418304443, "learning_rate": 4.25e-05, "loss": 0.0963, "step": 1590 }, { "epoch": 15.0, "eval_LOCATION_f1": 0.8366013071895425, "eval_LOCATION_number": 69, "eval_LOCATION_precision": 0.7619047619047619, "eval_LOCATION_recall": 0.927536231884058, "eval_ORGANIZATION_f1": 0.6610169491525424, "eval_ORGANIZATION_number": 58, "eval_ORGANIZATION_precision": 0.65, "eval_ORGANIZATION_recall": 0.6724137931034483, "eval_PERSON_f1": 0.9102564102564101, "eval_PERSON_number": 152, "eval_PERSON_precision": 0.8875, "eval_PERSON_recall": 0.9342105263157895, "eval_QUANTITY_f1": 0.6233766233766233, "eval_QUANTITY_number": 30, "eval_QUANTITY_precision": 0.5106382978723404, "eval_QUANTITY_recall": 0.8, "eval_TIME_f1": 0.7741935483870968, "eval_TIME_number": 29, "eval_TIME_precision": 0.7272727272727273, "eval_TIME_recall": 0.8275862068965517, "eval_loss": 0.13979628682136536, "eval_overall_accuracy": 0.9572343149807938, "eval_overall_f1": 0.8116343490304708, "eval_overall_precision": 0.7630208333333334, "eval_overall_recall": 0.8668639053254438, "eval_runtime": 0.3344, "eval_samples_per_second": 559.247, "eval_steps_per_second": 8.972, "step": 1590 }, { "epoch": 16.0, "grad_norm": 0.8222811222076416, "learning_rate": 4.2e-05, "loss": 0.0952, "step": 1696 }, { "epoch": 16.0, "eval_LOCATION_f1": 0.8311688311688311, "eval_LOCATION_number": 69, "eval_LOCATION_precision": 0.7529411764705882, "eval_LOCATION_recall": 0.927536231884058, "eval_ORGANIZATION_f1": 0.7343749999999999, "eval_ORGANIZATION_number": 58, "eval_ORGANIZATION_precision": 0.6714285714285714, "eval_ORGANIZATION_recall": 0.8103448275862069, "eval_PERSON_f1": 0.9067524115755626, "eval_PERSON_number": 152, "eval_PERSON_precision": 0.8867924528301887, "eval_PERSON_recall": 0.9276315789473685, "eval_QUANTITY_f1": 0.676056338028169, "eval_QUANTITY_number": 30, "eval_QUANTITY_precision": 0.5853658536585366, "eval_QUANTITY_recall": 0.8, "eval_TIME_f1": 0.7999999999999999, "eval_TIME_number": 29, "eval_TIME_precision": 0.7741935483870968, "eval_TIME_recall": 0.8275862068965517, "eval_loss": 0.14147908985614777, "eval_overall_accuracy": 0.9580025608194622, "eval_overall_f1": 0.8287292817679558, "eval_overall_precision": 0.7772020725388601, "eval_overall_recall": 0.8875739644970414, "eval_runtime": 0.3348, "eval_samples_per_second": 558.612, "eval_steps_per_second": 8.962, "step": 1696 }, { "epoch": 17.0, "grad_norm": 0.7422318458557129, "learning_rate": 4.15e-05, "loss": 0.0902, "step": 1802 }, { "epoch": 17.0, "eval_LOCATION_f1": 0.8533333333333333, "eval_LOCATION_number": 69, "eval_LOCATION_precision": 0.7901234567901234, "eval_LOCATION_recall": 0.927536231884058, "eval_ORGANIZATION_f1": 0.7000000000000001, "eval_ORGANIZATION_number": 58, "eval_ORGANIZATION_precision": 0.5975609756097561, "eval_ORGANIZATION_recall": 0.8448275862068966, "eval_PERSON_f1": 0.89171974522293, "eval_PERSON_number": 152, "eval_PERSON_precision": 0.8641975308641975, "eval_PERSON_recall": 0.9210526315789473, "eval_QUANTITY_f1": 0.6315789473684211, "eval_QUANTITY_number": 30, "eval_QUANTITY_precision": 0.5217391304347826, "eval_QUANTITY_recall": 0.8, "eval_TIME_f1": 0.7540983606557378, "eval_TIME_number": 29, "eval_TIME_precision": 0.71875, "eval_TIME_recall": 0.7931034482758621, "eval_loss": 0.14226044714450836, "eval_overall_accuracy": 0.9580025608194622, "eval_overall_f1": 0.8097165991902834, "eval_overall_precision": 0.7444168734491315, "eval_overall_recall": 0.8875739644970414, "eval_runtime": 0.3343, "eval_samples_per_second": 559.424, "eval_steps_per_second": 8.975, "step": 1802 }, { "epoch": 18.0, "grad_norm": 0.5720771551132202, "learning_rate": 4.1e-05, "loss": 0.0919, "step": 1908 }, { "epoch": 18.0, "eval_LOCATION_f1": 0.8767123287671235, "eval_LOCATION_number": 69, "eval_LOCATION_precision": 0.8311688311688312, "eval_LOCATION_recall": 0.927536231884058, "eval_ORGANIZATION_f1": 0.6976744186046512, "eval_ORGANIZATION_number": 58, "eval_ORGANIZATION_precision": 0.6338028169014085, "eval_ORGANIZATION_recall": 0.7758620689655172, "eval_PERSON_f1": 0.9113924050632912, "eval_PERSON_number": 152, "eval_PERSON_precision": 0.8780487804878049, "eval_PERSON_recall": 0.9473684210526315, "eval_QUANTITY_f1": 0.676056338028169, "eval_QUANTITY_number": 30, "eval_QUANTITY_precision": 0.5853658536585366, "eval_QUANTITY_recall": 0.8, "eval_TIME_f1": 0.7301587301587301, "eval_TIME_number": 29, "eval_TIME_precision": 0.6764705882352942, "eval_TIME_recall": 0.7931034482758621, "eval_loss": 0.14349369704723358, "eval_overall_accuracy": 0.9623559539052496, "eval_overall_f1": 0.8275862068965517, "eval_overall_precision": 0.7751937984496124, "eval_overall_recall": 0.8875739644970414, "eval_runtime": 0.3339, "eval_samples_per_second": 560.088, "eval_steps_per_second": 8.985, "step": 1908 }, { "epoch": 19.0, "grad_norm": 1.00640070438385, "learning_rate": 4.05e-05, "loss": 0.0864, "step": 2014 }, { "epoch": 19.0, "eval_LOCATION_f1": 0.8571428571428572, "eval_LOCATION_number": 69, "eval_LOCATION_precision": 0.8076923076923077, "eval_LOCATION_recall": 0.9130434782608695, "eval_ORGANIZATION_f1": 0.6885245901639345, "eval_ORGANIZATION_number": 58, "eval_ORGANIZATION_precision": 0.65625, "eval_ORGANIZATION_recall": 0.7241379310344828, "eval_PERSON_f1": 0.9050632911392406, "eval_PERSON_number": 152, "eval_PERSON_precision": 0.8719512195121951, "eval_PERSON_recall": 0.9407894736842105, "eval_QUANTITY_f1": 0.64, "eval_QUANTITY_number": 30, "eval_QUANTITY_precision": 0.5333333333333333, "eval_QUANTITY_recall": 0.8, "eval_TIME_f1": 0.7796610169491527, "eval_TIME_number": 29, "eval_TIME_precision": 0.7666666666666667, "eval_TIME_recall": 0.7931034482758621, "eval_loss": 0.14329810440540314, "eval_overall_accuracy": 0.9582586427656851, "eval_overall_f1": 0.8205841446453407, "eval_overall_precision": 0.7742782152230971, "eval_overall_recall": 0.8727810650887574, "eval_runtime": 0.338, "eval_samples_per_second": 553.255, "eval_steps_per_second": 8.876, "step": 2014 }, { "epoch": 20.0, "grad_norm": 0.7463036179542542, "learning_rate": 4e-05, "loss": 0.0853, "step": 2120 }, { "epoch": 20.0, "eval_LOCATION_f1": 0.8749999999999999, "eval_LOCATION_number": 69, "eval_LOCATION_precision": 0.84, "eval_LOCATION_recall": 0.9130434782608695, "eval_ORGANIZATION_f1": 0.7230769230769231, "eval_ORGANIZATION_number": 58, "eval_ORGANIZATION_precision": 0.6527777777777778, "eval_ORGANIZATION_recall": 0.8103448275862069, "eval_PERSON_f1": 0.9137380191693291, "eval_PERSON_number": 152, "eval_PERSON_precision": 0.8881987577639752, "eval_PERSON_recall": 0.9407894736842105, "eval_QUANTITY_f1": 0.7575757575757577, "eval_QUANTITY_number": 30, "eval_QUANTITY_precision": 0.6944444444444444, "eval_QUANTITY_recall": 0.8333333333333334, "eval_TIME_f1": 0.7540983606557378, "eval_TIME_number": 29, "eval_TIME_precision": 0.71875, "eval_TIME_recall": 0.7931034482758621, "eval_loss": 0.13515153527259827, "eval_overall_accuracy": 0.963124199743918, "eval_overall_f1": 0.8431372549019608, "eval_overall_precision": 0.800531914893617, "eval_overall_recall": 0.8905325443786982, "eval_runtime": 0.3312, "eval_samples_per_second": 564.613, "eval_steps_per_second": 9.058, "step": 2120 }, { "epoch": 21.0, "grad_norm": 0.4474703073501587, "learning_rate": 3.9500000000000005e-05, "loss": 0.0782, "step": 2226 }, { "epoch": 21.0, "eval_LOCATION_f1": 0.8322147651006713, "eval_LOCATION_number": 69, "eval_LOCATION_precision": 0.775, "eval_LOCATION_recall": 0.8985507246376812, "eval_ORGANIZATION_f1": 0.696969696969697, "eval_ORGANIZATION_number": 58, "eval_ORGANIZATION_precision": 0.6216216216216216, "eval_ORGANIZATION_recall": 0.7931034482758621, "eval_PERSON_f1": 0.9050632911392406, "eval_PERSON_number": 152, "eval_PERSON_precision": 0.8719512195121951, "eval_PERSON_recall": 0.9407894736842105, "eval_QUANTITY_f1": 0.746268656716418, "eval_QUANTITY_number": 30, "eval_QUANTITY_precision": 0.6756756756756757, "eval_QUANTITY_recall": 0.8333333333333334, "eval_TIME_f1": 0.75, "eval_TIME_number": 29, "eval_TIME_precision": 0.6857142857142857, "eval_TIME_recall": 0.8275862068965517, "eval_loss": 0.1520513892173767, "eval_overall_accuracy": 0.9574903969270167, "eval_overall_f1": 0.8241758241758241, "eval_overall_precision": 0.7692307692307693, "eval_overall_recall": 0.8875739644970414, "eval_runtime": 0.3358, "eval_samples_per_second": 556.946, "eval_steps_per_second": 8.935, "step": 2226 }, { "epoch": 22.0, "grad_norm": 0.46933385729789734, "learning_rate": 3.9000000000000006e-05, "loss": 0.0778, "step": 2332 }, { "epoch": 22.0, "eval_LOCATION_f1": 0.8533333333333333, "eval_LOCATION_number": 69, "eval_LOCATION_precision": 0.7901234567901234, "eval_LOCATION_recall": 0.927536231884058, "eval_ORGANIZATION_f1": 0.7259259259259259, "eval_ORGANIZATION_number": 58, "eval_ORGANIZATION_precision": 0.6363636363636364, "eval_ORGANIZATION_recall": 0.8448275862068966, "eval_PERSON_f1": 0.8952380952380953, "eval_PERSON_number": 152, "eval_PERSON_precision": 0.8650306748466258, "eval_PERSON_recall": 0.9276315789473685, "eval_QUANTITY_f1": 0.7272727272727272, "eval_QUANTITY_number": 30, "eval_QUANTITY_precision": 0.6666666666666666, "eval_QUANTITY_recall": 0.8, "eval_TIME_f1": 0.7868852459016394, "eval_TIME_number": 29, "eval_TIME_precision": 0.75, "eval_TIME_recall": 0.8275862068965517, "eval_loss": 0.14189890027046204, "eval_overall_accuracy": 0.9618437900128041, "eval_overall_f1": 0.8308115543328748, "eval_overall_precision": 0.7763496143958869, "eval_overall_recall": 0.893491124260355, "eval_runtime": 0.3349, "eval_samples_per_second": 558.354, "eval_steps_per_second": 8.958, "step": 2332 }, { "epoch": 23.0, "grad_norm": 0.5191448330879211, "learning_rate": 3.85e-05, "loss": 0.0751, "step": 2438 }, { "epoch": 23.0, "eval_LOCATION_f1": 0.8513513513513514, "eval_LOCATION_number": 69, "eval_LOCATION_precision": 0.7974683544303798, "eval_LOCATION_recall": 0.9130434782608695, "eval_ORGANIZATION_f1": 0.6976744186046512, "eval_ORGANIZATION_number": 58, "eval_ORGANIZATION_precision": 0.6338028169014085, "eval_ORGANIZATION_recall": 0.7758620689655172, "eval_PERSON_f1": 0.9015873015873016, "eval_PERSON_number": 152, "eval_PERSON_precision": 0.8711656441717791, "eval_PERSON_recall": 0.9342105263157895, "eval_QUANTITY_f1": 0.7058823529411765, "eval_QUANTITY_number": 30, "eval_QUANTITY_precision": 0.631578947368421, "eval_QUANTITY_recall": 0.8, "eval_TIME_f1": 0.7619047619047619, "eval_TIME_number": 29, "eval_TIME_precision": 0.7058823529411765, "eval_TIME_recall": 0.8275862068965517, "eval_loss": 0.1431107521057129, "eval_overall_accuracy": 0.9600512163892445, "eval_overall_f1": 0.8243430152143846, "eval_overall_precision": 0.7740259740259741, "eval_overall_recall": 0.8816568047337278, "eval_runtime": 0.3347, "eval_samples_per_second": 558.691, "eval_steps_per_second": 8.963, "step": 2438 }, { "epoch": 24.0, "grad_norm": 1.5136590003967285, "learning_rate": 3.8e-05, "loss": 0.0761, "step": 2544 }, { "epoch": 24.0, "eval_LOCATION_f1": 0.870748299319728, "eval_LOCATION_number": 69, "eval_LOCATION_precision": 0.8205128205128205, "eval_LOCATION_recall": 0.927536231884058, "eval_ORGANIZATION_f1": 0.6935483870967741, "eval_ORGANIZATION_number": 58, "eval_ORGANIZATION_precision": 0.6515151515151515, "eval_ORGANIZATION_recall": 0.7413793103448276, "eval_PERSON_f1": 0.9079365079365079, "eval_PERSON_number": 152, "eval_PERSON_precision": 0.8773006134969326, "eval_PERSON_recall": 0.9407894736842105, "eval_QUANTITY_f1": 0.7500000000000001, "eval_QUANTITY_number": 30, "eval_QUANTITY_precision": 0.7058823529411765, "eval_QUANTITY_recall": 0.8, "eval_TIME_f1": 0.7999999999999999, "eval_TIME_number": 29, "eval_TIME_precision": 0.7741935483870968, "eval_TIME_recall": 0.8275862068965517, "eval_loss": 0.1410786360502243, "eval_overall_accuracy": 0.9633802816901409, "eval_overall_f1": 0.8394366197183097, "eval_overall_precision": 0.8010752688172043, "eval_overall_recall": 0.8816568047337278, "eval_runtime": 0.3473, "eval_samples_per_second": 538.469, "eval_steps_per_second": 8.639, "step": 2544 }, { "epoch": 25.0, "grad_norm": 0.8224151134490967, "learning_rate": 3.7500000000000003e-05, "loss": 0.0718, "step": 2650 }, { "epoch": 25.0, "eval_LOCATION_f1": 0.8571428571428572, "eval_LOCATION_number": 69, "eval_LOCATION_precision": 0.8076923076923077, "eval_LOCATION_recall": 0.9130434782608695, "eval_ORGANIZATION_f1": 0.6923076923076923, "eval_ORGANIZATION_number": 58, "eval_ORGANIZATION_precision": 0.625, "eval_ORGANIZATION_recall": 0.7758620689655172, "eval_PERSON_f1": 0.9079365079365079, "eval_PERSON_number": 152, "eval_PERSON_precision": 0.8773006134969326, "eval_PERSON_recall": 0.9407894736842105, "eval_QUANTITY_f1": 0.64, "eval_QUANTITY_number": 30, "eval_QUANTITY_precision": 0.5333333333333333, "eval_QUANTITY_recall": 0.8, "eval_TIME_f1": 0.7301587301587301, "eval_TIME_number": 29, "eval_TIME_precision": 0.6764705882352942, "eval_TIME_recall": 0.7931034482758621, "eval_loss": 0.15752357244491577, "eval_overall_accuracy": 0.9577464788732394, "eval_overall_f1": 0.8164383561643835, "eval_overall_precision": 0.7602040816326531, "eval_overall_recall": 0.8816568047337278, "eval_runtime": 0.3326, "eval_samples_per_second": 562.261, "eval_steps_per_second": 9.02, "step": 2650 }, { "epoch": 26.0, "grad_norm": 1.1950877904891968, "learning_rate": 3.7e-05, "loss": 0.0706, "step": 2756 }, { "epoch": 26.0, "eval_LOCATION_f1": 0.8551724137931034, "eval_LOCATION_number": 69, "eval_LOCATION_precision": 0.8157894736842105, "eval_LOCATION_recall": 0.8985507246376812, "eval_ORGANIZATION_f1": 0.7213114754098361, "eval_ORGANIZATION_number": 58, "eval_ORGANIZATION_precision": 0.6875, "eval_ORGANIZATION_recall": 0.7586206896551724, "eval_PERSON_f1": 0.9166666666666667, "eval_PERSON_number": 152, "eval_PERSON_precision": 0.89375, "eval_PERSON_recall": 0.9407894736842105, "eval_QUANTITY_f1": 0.7058823529411765, "eval_QUANTITY_number": 30, "eval_QUANTITY_precision": 0.631578947368421, "eval_QUANTITY_recall": 0.8, "eval_TIME_f1": 0.7868852459016394, "eval_TIME_number": 29, "eval_TIME_precision": 0.75, "eval_TIME_recall": 0.8275862068965517, "eval_loss": 0.14247971773147583, "eval_overall_accuracy": 0.9623559539052496, "eval_overall_f1": 0.8389830508474576, "eval_overall_precision": 0.8027027027027027, "eval_overall_recall": 0.878698224852071, "eval_runtime": 0.3335, "eval_samples_per_second": 560.748, "eval_steps_per_second": 8.996, "step": 2756 }, { "epoch": 27.0, "grad_norm": 0.48883256316185, "learning_rate": 3.65e-05, "loss": 0.0675, "step": 2862 }, { "epoch": 27.0, "eval_LOCATION_f1": 0.8571428571428572, "eval_LOCATION_number": 69, "eval_LOCATION_precision": 0.8076923076923077, "eval_LOCATION_recall": 0.9130434782608695, "eval_ORGANIZATION_f1": 0.7101449275362319, "eval_ORGANIZATION_number": 58, "eval_ORGANIZATION_precision": 0.6125, "eval_ORGANIZATION_recall": 0.8448275862068966, "eval_PERSON_f1": 0.890282131661442, "eval_PERSON_number": 152, "eval_PERSON_precision": 0.8502994011976048, "eval_PERSON_recall": 0.9342105263157895, "eval_QUANTITY_f1": 0.6857142857142857, "eval_QUANTITY_number": 30, "eval_QUANTITY_precision": 0.6, "eval_QUANTITY_recall": 0.8, "eval_TIME_f1": 0.7619047619047619, "eval_TIME_number": 29, "eval_TIME_precision": 0.7058823529411765, "eval_TIME_recall": 0.8275862068965517, "eval_loss": 0.16071684658527374, "eval_overall_accuracy": 0.9559539052496799, "eval_overall_f1": 0.819538670284939, "eval_overall_precision": 0.7568922305764411, "eval_overall_recall": 0.893491124260355, "eval_runtime": 0.3357, "eval_samples_per_second": 557.057, "eval_steps_per_second": 8.937, "step": 2862 }, { "epoch": 28.0, "grad_norm": 5.45798397064209, "learning_rate": 3.6e-05, "loss": 0.0692, "step": 2968 }, { "epoch": 28.0, "eval_LOCATION_f1": 0.8571428571428572, "eval_LOCATION_number": 69, "eval_LOCATION_precision": 0.8076923076923077, "eval_LOCATION_recall": 0.9130434782608695, "eval_ORGANIZATION_f1": 0.688, "eval_ORGANIZATION_number": 58, "eval_ORGANIZATION_precision": 0.6417910447761194, "eval_ORGANIZATION_recall": 0.7413793103448276, "eval_PERSON_f1": 0.8832807570977917, "eval_PERSON_number": 152, "eval_PERSON_precision": 0.8484848484848485, "eval_PERSON_recall": 0.9210526315789473, "eval_QUANTITY_f1": 0.7761194029850748, "eval_QUANTITY_number": 30, "eval_QUANTITY_precision": 0.7027027027027027, "eval_QUANTITY_recall": 0.8666666666666667, "eval_TIME_f1": 0.7301587301587301, "eval_TIME_number": 29, "eval_TIME_precision": 0.6764705882352942, "eval_TIME_recall": 0.7931034482758621, "eval_loss": 0.14975115656852722, "eval_overall_accuracy": 0.9592829705505762, "eval_overall_f1": 0.8205841446453407, "eval_overall_precision": 0.7742782152230971, "eval_overall_recall": 0.8727810650887574, "eval_runtime": 0.3351, "eval_samples_per_second": 558.088, "eval_steps_per_second": 8.953, "step": 2968 }, { "epoch": 29.0, "grad_norm": 0.3084903359413147, "learning_rate": 3.55e-05, "loss": 0.0663, "step": 3074 }, { "epoch": 29.0, "eval_LOCATION_f1": 0.84, "eval_LOCATION_number": 69, "eval_LOCATION_precision": 0.7777777777777778, "eval_LOCATION_recall": 0.9130434782608695, "eval_ORGANIZATION_f1": 0.7000000000000001, "eval_ORGANIZATION_number": 58, "eval_ORGANIZATION_precision": 0.5975609756097561, "eval_ORGANIZATION_recall": 0.8448275862068966, "eval_PERSON_f1": 0.8924050632911392, "eval_PERSON_number": 152, "eval_PERSON_precision": 0.8597560975609756, "eval_PERSON_recall": 0.9276315789473685, "eval_QUANTITY_f1": 0.7272727272727272, "eval_QUANTITY_number": 30, "eval_QUANTITY_precision": 0.6666666666666666, "eval_QUANTITY_recall": 0.8, "eval_TIME_f1": 0.7741935483870968, "eval_TIME_number": 29, "eval_TIME_precision": 0.7272727272727273, "eval_TIME_recall": 0.8275862068965517, "eval_loss": 0.148148775100708, "eval_overall_accuracy": 0.9592829705505762, "eval_overall_f1": 0.8201634877384196, "eval_overall_precision": 0.76010101010101, "eval_overall_recall": 0.8905325443786982, "eval_runtime": 0.3329, "eval_samples_per_second": 561.66, "eval_steps_per_second": 9.011, "step": 3074 }, { "epoch": 30.0, "grad_norm": 1.554962396621704, "learning_rate": 3.5e-05, "loss": 0.0642, "step": 3180 }, { "epoch": 30.0, "eval_LOCATION_f1": 0.8689655172413793, "eval_LOCATION_number": 69, "eval_LOCATION_precision": 0.8289473684210527, "eval_LOCATION_recall": 0.9130434782608695, "eval_ORGANIZATION_f1": 0.6612903225806452, "eval_ORGANIZATION_number": 58, "eval_ORGANIZATION_precision": 0.6212121212121212, "eval_ORGANIZATION_recall": 0.7068965517241379, "eval_PERSON_f1": 0.889589905362776, "eval_PERSON_number": 152, "eval_PERSON_precision": 0.8545454545454545, "eval_PERSON_recall": 0.9276315789473685, "eval_QUANTITY_f1": 0.8253968253968254, "eval_QUANTITY_number": 30, "eval_QUANTITY_precision": 0.7878787878787878, "eval_QUANTITY_recall": 0.8666666666666667, "eval_TIME_f1": 0.8196721311475409, "eval_TIME_number": 29, "eval_TIME_precision": 0.78125, "eval_TIME_recall": 0.8620689655172413, "eval_loss": 0.14457598328590393, "eval_overall_accuracy": 0.963124199743918, "eval_overall_f1": 0.8338028169014083, "eval_overall_precision": 0.7956989247311828, "eval_overall_recall": 0.8757396449704142, "eval_runtime": 0.3355, "eval_samples_per_second": 557.403, "eval_steps_per_second": 8.942, "step": 3180 }, { "epoch": 31.0, "grad_norm": 0.40657302737236023, "learning_rate": 3.45e-05, "loss": 0.0602, "step": 3286 }, { "epoch": 31.0, "eval_LOCATION_f1": 0.8689655172413793, "eval_LOCATION_number": 69, "eval_LOCATION_precision": 0.8289473684210527, "eval_LOCATION_recall": 0.9130434782608695, "eval_ORGANIZATION_f1": 0.65625, "eval_ORGANIZATION_number": 58, "eval_ORGANIZATION_precision": 0.6, "eval_ORGANIZATION_recall": 0.7241379310344828, "eval_PERSON_f1": 0.8924050632911392, "eval_PERSON_number": 152, "eval_PERSON_precision": 0.8597560975609756, "eval_PERSON_recall": 0.9276315789473685, "eval_QUANTITY_f1": 0.7272727272727272, "eval_QUANTITY_number": 30, "eval_QUANTITY_precision": 0.6666666666666666, "eval_QUANTITY_recall": 0.8, "eval_TIME_f1": 0.7619047619047619, "eval_TIME_number": 29, "eval_TIME_precision": 0.7058823529411765, "eval_TIME_recall": 0.8275862068965517, "eval_loss": 0.1596260815858841, "eval_overall_accuracy": 0.9590268886043534, "eval_overall_f1": 0.8189415041782729, "eval_overall_precision": 0.7736842105263158, "eval_overall_recall": 0.8698224852071006, "eval_runtime": 0.3328, "eval_samples_per_second": 561.9, "eval_steps_per_second": 9.014, "step": 3286 }, { "epoch": 32.0, "grad_norm": 0.3220694363117218, "learning_rate": 3.4000000000000007e-05, "loss": 0.0618, "step": 3392 }, { "epoch": 32.0, "eval_LOCATION_f1": 0.8456375838926175, "eval_LOCATION_number": 69, "eval_LOCATION_precision": 0.7875, "eval_LOCATION_recall": 0.9130434782608695, "eval_ORGANIZATION_f1": 0.7258064516129032, "eval_ORGANIZATION_number": 58, "eval_ORGANIZATION_precision": 0.6818181818181818, "eval_ORGANIZATION_recall": 0.7758620689655172, "eval_PERSON_f1": 0.8980891719745223, "eval_PERSON_number": 152, "eval_PERSON_precision": 0.8703703703703703, "eval_PERSON_recall": 0.9276315789473685, "eval_QUANTITY_f1": 0.676056338028169, "eval_QUANTITY_number": 30, "eval_QUANTITY_precision": 0.5853658536585366, "eval_QUANTITY_recall": 0.8, "eval_TIME_f1": 0.7540983606557378, "eval_TIME_number": 29, "eval_TIME_precision": 0.71875, "eval_TIME_recall": 0.7931034482758621, "eval_loss": 0.15103064477443695, "eval_overall_accuracy": 0.9605633802816902, "eval_overall_f1": 0.82336578581363, "eval_overall_precision": 0.7769028871391076, "eval_overall_recall": 0.8757396449704142, "eval_runtime": 0.336, "eval_samples_per_second": 556.607, "eval_steps_per_second": 8.93, "step": 3392 }, { "epoch": 33.0, "grad_norm": 1.0746521949768066, "learning_rate": 3.35e-05, "loss": 0.0587, "step": 3498 }, { "epoch": 33.0, "eval_LOCATION_f1": 0.882758620689655, "eval_LOCATION_number": 69, "eval_LOCATION_precision": 0.8421052631578947, "eval_LOCATION_recall": 0.927536231884058, "eval_ORGANIZATION_f1": 0.6976744186046512, "eval_ORGANIZATION_number": 58, "eval_ORGANIZATION_precision": 0.6338028169014085, "eval_ORGANIZATION_recall": 0.7758620689655172, "eval_PERSON_f1": 0.9050632911392406, "eval_PERSON_number": 152, "eval_PERSON_precision": 0.8719512195121951, "eval_PERSON_recall": 0.9407894736842105, "eval_QUANTITY_f1": 0.78125, "eval_QUANTITY_number": 30, "eval_QUANTITY_precision": 0.7352941176470589, "eval_QUANTITY_recall": 0.8333333333333334, "eval_TIME_f1": 0.7741935483870968, "eval_TIME_number": 29, "eval_TIME_precision": 0.7272727272727273, "eval_TIME_recall": 0.8275862068965517, "eval_loss": 0.15125295519828796, "eval_overall_accuracy": 0.9636363636363636, "eval_overall_f1": 0.840782122905028, "eval_overall_precision": 0.7962962962962963, "eval_overall_recall": 0.8905325443786982, "eval_runtime": 0.3377, "eval_samples_per_second": 553.74, "eval_steps_per_second": 8.884, "step": 3498 }, { "epoch": 34.0, "grad_norm": 1.5852210521697998, "learning_rate": 3.3e-05, "loss": 0.0575, "step": 3604 }, { "epoch": 34.0, "eval_LOCATION_f1": 0.8435374149659864, "eval_LOCATION_number": 69, "eval_LOCATION_precision": 0.7948717948717948, "eval_LOCATION_recall": 0.8985507246376812, "eval_ORGANIZATION_f1": 0.7175572519083969, "eval_ORGANIZATION_number": 58, "eval_ORGANIZATION_precision": 0.6438356164383562, "eval_ORGANIZATION_recall": 0.8103448275862069, "eval_PERSON_f1": 0.8924050632911392, "eval_PERSON_number": 152, "eval_PERSON_precision": 0.8597560975609756, "eval_PERSON_recall": 0.9276315789473685, "eval_QUANTITY_f1": 0.6857142857142857, "eval_QUANTITY_number": 30, "eval_QUANTITY_precision": 0.6, "eval_QUANTITY_recall": 0.8, "eval_TIME_f1": 0.696969696969697, "eval_TIME_number": 29, "eval_TIME_precision": 0.6216216216216216, "eval_TIME_recall": 0.7931034482758621, "eval_loss": 0.17214131355285645, "eval_overall_accuracy": 0.9574903969270167, "eval_overall_f1": 0.8136986301369863, "eval_overall_precision": 0.7576530612244898, "eval_overall_recall": 0.878698224852071, "eval_runtime": 0.332, "eval_samples_per_second": 563.205, "eval_steps_per_second": 9.035, "step": 3604 }, { "epoch": 35.0, "grad_norm": 0.709221601486206, "learning_rate": 3.2500000000000004e-05, "loss": 0.0568, "step": 3710 }, { "epoch": 35.0, "eval_LOCATION_f1": 0.8767123287671235, "eval_LOCATION_number": 69, "eval_LOCATION_precision": 0.8311688311688312, "eval_LOCATION_recall": 0.927536231884058, "eval_ORGANIZATION_f1": 0.736, "eval_ORGANIZATION_number": 58, "eval_ORGANIZATION_precision": 0.6865671641791045, "eval_ORGANIZATION_recall": 0.7931034482758621, "eval_PERSON_f1": 0.889589905362776, "eval_PERSON_number": 152, "eval_PERSON_precision": 0.8545454545454545, "eval_PERSON_recall": 0.9276315789473685, "eval_QUANTITY_f1": 0.6956521739130435, "eval_QUANTITY_number": 30, "eval_QUANTITY_precision": 0.6153846153846154, "eval_QUANTITY_recall": 0.8, "eval_TIME_f1": 0.7666666666666667, "eval_TIME_number": 29, "eval_TIME_precision": 0.7419354838709677, "eval_TIME_recall": 0.7931034482758621, "eval_loss": 0.16309089958667755, "eval_overall_accuracy": 0.9605633802816902, "eval_overall_f1": 0.8312412831241283, "eval_overall_precision": 0.7862796833773087, "eval_overall_recall": 0.8816568047337278, "eval_runtime": 0.3342, "eval_samples_per_second": 559.545, "eval_steps_per_second": 8.977, "step": 3710 }, { "epoch": 36.0, "grad_norm": 0.5662766098976135, "learning_rate": 3.2000000000000005e-05, "loss": 0.058, "step": 3816 }, { "epoch": 36.0, "eval_LOCATION_f1": 0.8671328671328672, "eval_LOCATION_number": 69, "eval_LOCATION_precision": 0.8378378378378378, "eval_LOCATION_recall": 0.8985507246376812, "eval_ORGANIZATION_f1": 0.711111111111111, "eval_ORGANIZATION_number": 58, "eval_ORGANIZATION_precision": 0.6233766233766234, "eval_ORGANIZATION_recall": 0.8275862068965517, "eval_PERSON_f1": 0.9079365079365079, "eval_PERSON_number": 152, "eval_PERSON_precision": 0.8773006134969326, "eval_PERSON_recall": 0.9407894736842105, "eval_QUANTITY_f1": 0.78125, "eval_QUANTITY_number": 30, "eval_QUANTITY_precision": 0.7352941176470589, "eval_QUANTITY_recall": 0.8333333333333334, "eval_TIME_f1": 0.7868852459016394, "eval_TIME_number": 29, "eval_TIME_precision": 0.75, "eval_TIME_recall": 0.8275862068965517, "eval_loss": 0.15275219082832336, "eval_overall_accuracy": 0.9618437900128041, "eval_overall_f1": 0.8412256267409471, "eval_overall_precision": 0.7947368421052632, "eval_overall_recall": 0.893491124260355, "eval_runtime": 0.3343, "eval_samples_per_second": 559.388, "eval_steps_per_second": 8.974, "step": 3816 }, { "epoch": 37.0, "grad_norm": 0.11498302221298218, "learning_rate": 3.15e-05, "loss": 0.0542, "step": 3922 }, { "epoch": 37.0, "eval_LOCATION_f1": 0.8571428571428572, "eval_LOCATION_number": 69, "eval_LOCATION_precision": 0.8076923076923077, "eval_LOCATION_recall": 0.9130434782608695, "eval_ORGANIZATION_f1": 0.6875, "eval_ORGANIZATION_number": 58, "eval_ORGANIZATION_precision": 0.6285714285714286, "eval_ORGANIZATION_recall": 0.7586206896551724, "eval_PERSON_f1": 0.9015873015873016, "eval_PERSON_number": 152, "eval_PERSON_precision": 0.8711656441717791, "eval_PERSON_recall": 0.9342105263157895, "eval_QUANTITY_f1": 0.7384615384615385, "eval_QUANTITY_number": 30, "eval_QUANTITY_precision": 0.6857142857142857, "eval_QUANTITY_recall": 0.8, "eval_TIME_f1": 0.7619047619047619, "eval_TIME_number": 29, "eval_TIME_precision": 0.7058823529411765, "eval_TIME_recall": 0.8275862068965517, "eval_loss": 0.1606374979019165, "eval_overall_accuracy": 0.9597951344430218, "eval_overall_f1": 0.8272980501392758, "eval_overall_precision": 0.781578947368421, "eval_overall_recall": 0.878698224852071, "eval_runtime": 0.334, "eval_samples_per_second": 559.858, "eval_steps_per_second": 8.982, "step": 3922 }, { "epoch": 38.0, "grad_norm": 0.5296043157577515, "learning_rate": 3.1e-05, "loss": 0.0543, "step": 4028 }, { "epoch": 38.0, "eval_LOCATION_f1": 0.8456375838926175, "eval_LOCATION_number": 69, "eval_LOCATION_precision": 0.7875, "eval_LOCATION_recall": 0.9130434782608695, "eval_ORGANIZATION_f1": 0.7058823529411765, "eval_ORGANIZATION_number": 58, "eval_ORGANIZATION_precision": 0.6153846153846154, "eval_ORGANIZATION_recall": 0.8275862068965517, "eval_PERSON_f1": 0.9038461538461539, "eval_PERSON_number": 152, "eval_PERSON_precision": 0.88125, "eval_PERSON_recall": 0.9276315789473685, "eval_QUANTITY_f1": 0.6666666666666666, "eval_QUANTITY_number": 30, "eval_QUANTITY_precision": 0.5714285714285714, "eval_QUANTITY_recall": 0.8, "eval_TIME_f1": 0.7741935483870968, "eval_TIME_number": 29, "eval_TIME_precision": 0.7272727272727273, "eval_TIME_recall": 0.8275862068965517, "eval_loss": 0.16339102387428284, "eval_overall_accuracy": 0.9582586427656851, "eval_overall_f1": 0.8207934336525308, "eval_overall_precision": 0.7633587786259542, "eval_overall_recall": 0.8875739644970414, "eval_runtime": 0.3345, "eval_samples_per_second": 559.005, "eval_steps_per_second": 8.968, "step": 4028 }, { "epoch": 39.0, "grad_norm": 0.7791297435760498, "learning_rate": 3.05e-05, "loss": 0.0545, "step": 4134 }, { "epoch": 39.0, "eval_LOCATION_f1": 0.882758620689655, "eval_LOCATION_number": 69, "eval_LOCATION_precision": 0.8421052631578947, "eval_LOCATION_recall": 0.927536231884058, "eval_ORGANIZATION_f1": 0.6929133858267716, "eval_ORGANIZATION_number": 58, "eval_ORGANIZATION_precision": 0.6376811594202898, "eval_ORGANIZATION_recall": 0.7586206896551724, "eval_PERSON_f1": 0.8853503184713376, "eval_PERSON_number": 152, "eval_PERSON_precision": 0.8580246913580247, "eval_PERSON_recall": 0.9144736842105263, "eval_QUANTITY_f1": 0.78125, "eval_QUANTITY_number": 30, "eval_QUANTITY_precision": 0.7352941176470589, "eval_QUANTITY_recall": 0.8333333333333334, "eval_TIME_f1": 0.7619047619047619, "eval_TIME_number": 29, "eval_TIME_precision": 0.7058823529411765, "eval_TIME_recall": 0.8275862068965517, "eval_loss": 0.15971286594867706, "eval_overall_accuracy": 0.9590268886043534, "eval_overall_f1": 0.8302945301542777, "eval_overall_precision": 0.7893333333333333, "eval_overall_recall": 0.8757396449704142, "eval_runtime": 0.3358, "eval_samples_per_second": 556.857, "eval_steps_per_second": 8.934, "step": 4134 }, { "epoch": 40.0, "grad_norm": 1.3748724460601807, "learning_rate": 3e-05, "loss": 0.0522, "step": 4240 }, { "epoch": 40.0, "eval_LOCATION_f1": 0.8571428571428572, "eval_LOCATION_number": 69, "eval_LOCATION_precision": 0.8076923076923077, "eval_LOCATION_recall": 0.9130434782608695, "eval_ORGANIZATION_f1": 0.7166666666666668, "eval_ORGANIZATION_number": 58, "eval_ORGANIZATION_precision": 0.6935483870967742, "eval_ORGANIZATION_recall": 0.7413793103448276, "eval_PERSON_f1": 0.8945686900958467, "eval_PERSON_number": 152, "eval_PERSON_precision": 0.8695652173913043, "eval_PERSON_recall": 0.9210526315789473, "eval_QUANTITY_f1": 0.8059701492537312, "eval_QUANTITY_number": 30, "eval_QUANTITY_precision": 0.7297297297297297, "eval_QUANTITY_recall": 0.9, "eval_TIME_f1": 0.7619047619047619, "eval_TIME_number": 29, "eval_TIME_precision": 0.7058823529411765, "eval_TIME_recall": 0.8275862068965517, "eval_loss": 0.15032222867012024, "eval_overall_accuracy": 0.9626120358514725, "eval_overall_f1": 0.8366197183098592, "eval_overall_precision": 0.7983870967741935, "eval_overall_recall": 0.878698224852071, "eval_runtime": 0.3322, "eval_samples_per_second": 562.995, "eval_steps_per_second": 9.032, "step": 4240 }, { "epoch": 41.0, "grad_norm": 0.5511608719825745, "learning_rate": 2.95e-05, "loss": 0.0484, "step": 4346 }, { "epoch": 41.0, "eval_LOCATION_f1": 0.863013698630137, "eval_LOCATION_number": 69, "eval_LOCATION_precision": 0.8181818181818182, "eval_LOCATION_recall": 0.9130434782608695, "eval_ORGANIZATION_f1": 0.6984126984126984, "eval_ORGANIZATION_number": 58, "eval_ORGANIZATION_precision": 0.6470588235294118, "eval_ORGANIZATION_recall": 0.7586206896551724, "eval_PERSON_f1": 0.888888888888889, "eval_PERSON_number": 152, "eval_PERSON_precision": 0.8588957055214724, "eval_PERSON_recall": 0.9210526315789473, "eval_QUANTITY_f1": 0.7575757575757577, "eval_QUANTITY_number": 30, "eval_QUANTITY_precision": 0.6944444444444444, "eval_QUANTITY_recall": 0.8333333333333334, "eval_TIME_f1": 0.7540983606557378, "eval_TIME_number": 29, "eval_TIME_precision": 0.71875, "eval_TIME_recall": 0.7931034482758621, "eval_loss": 0.16514161229133606, "eval_overall_accuracy": 0.9592829705505762, "eval_overall_f1": 0.8263305322128851, "eval_overall_precision": 0.7845744680851063, "eval_overall_recall": 0.8727810650887574, "eval_runtime": 0.3352, "eval_samples_per_second": 557.858, "eval_steps_per_second": 8.95, "step": 4346 }, { "epoch": 42.0, "grad_norm": 0.6805091500282288, "learning_rate": 2.9e-05, "loss": 0.0472, "step": 4452 }, { "epoch": 42.0, "eval_LOCATION_f1": 0.8671328671328672, "eval_LOCATION_number": 69, "eval_LOCATION_precision": 0.8378378378378378, "eval_LOCATION_recall": 0.8985507246376812, "eval_ORGANIZATION_f1": 0.6984126984126984, "eval_ORGANIZATION_number": 58, "eval_ORGANIZATION_precision": 0.6470588235294118, "eval_ORGANIZATION_recall": 0.7586206896551724, "eval_PERSON_f1": 0.9096774193548387, "eval_PERSON_number": 152, "eval_PERSON_precision": 0.8924050632911392, "eval_PERSON_recall": 0.9276315789473685, "eval_QUANTITY_f1": 0.7272727272727272, "eval_QUANTITY_number": 30, "eval_QUANTITY_precision": 0.6666666666666666, "eval_QUANTITY_recall": 0.8, "eval_TIME_f1": 0.75, "eval_TIME_number": 29, "eval_TIME_precision": 0.6857142857142857, "eval_TIME_recall": 0.8275862068965517, "eval_loss": 0.16605274379253387, "eval_overall_accuracy": 0.9600512163892445, "eval_overall_f1": 0.8321579689703809, "eval_overall_precision": 0.7951482479784366, "eval_overall_recall": 0.8727810650887574, "eval_runtime": 0.3329, "eval_samples_per_second": 561.686, "eval_steps_per_second": 9.011, "step": 4452 }, { "epoch": 43.0, "grad_norm": 3.199406147003174, "learning_rate": 2.8499999999999998e-05, "loss": 0.0498, "step": 4558 }, { "epoch": 43.0, "eval_LOCATION_f1": 0.8749999999999999, "eval_LOCATION_number": 69, "eval_LOCATION_precision": 0.84, "eval_LOCATION_recall": 0.9130434782608695, "eval_ORGANIZATION_f1": 0.7040000000000001, "eval_ORGANIZATION_number": 58, "eval_ORGANIZATION_precision": 0.6567164179104478, "eval_ORGANIZATION_recall": 0.7586206896551724, "eval_PERSON_f1": 0.9067524115755626, "eval_PERSON_number": 152, "eval_PERSON_precision": 0.8867924528301887, "eval_PERSON_recall": 0.9276315789473685, "eval_QUANTITY_f1": 0.8059701492537312, "eval_QUANTITY_number": 30, "eval_QUANTITY_precision": 0.7297297297297297, "eval_QUANTITY_recall": 0.9, "eval_TIME_f1": 0.7619047619047619, "eval_TIME_number": 29, "eval_TIME_precision": 0.7058823529411765, "eval_TIME_recall": 0.8275862068965517, "eval_loss": 0.155135378241539, "eval_overall_accuracy": 0.9628681177976952, "eval_overall_f1": 0.8422535211267606, "eval_overall_precision": 0.803763440860215, "eval_overall_recall": 0.8846153846153846, "eval_runtime": 0.3322, "eval_samples_per_second": 562.861, "eval_steps_per_second": 9.03, "step": 4558 }, { "epoch": 44.0, "grad_norm": 1.2136147022247314, "learning_rate": 2.8000000000000003e-05, "loss": 0.0474, "step": 4664 }, { "epoch": 44.0, "eval_LOCATION_f1": 0.8749999999999999, "eval_LOCATION_number": 69, "eval_LOCATION_precision": 0.84, "eval_LOCATION_recall": 0.9130434782608695, "eval_ORGANIZATION_f1": 0.7154471544715447, "eval_ORGANIZATION_number": 58, "eval_ORGANIZATION_precision": 0.676923076923077, "eval_ORGANIZATION_recall": 0.7586206896551724, "eval_PERSON_f1": 0.8867924528301887, "eval_PERSON_number": 152, "eval_PERSON_precision": 0.8493975903614458, "eval_PERSON_recall": 0.9276315789473685, "eval_QUANTITY_f1": 0.7384615384615385, "eval_QUANTITY_number": 30, "eval_QUANTITY_precision": 0.6857142857142857, "eval_QUANTITY_recall": 0.8, "eval_TIME_f1": 0.7741935483870968, "eval_TIME_number": 29, "eval_TIME_precision": 0.7272727272727273, "eval_TIME_recall": 0.8275862068965517, "eval_loss": 0.1694120317697525, "eval_overall_accuracy": 0.9600512163892445, "eval_overall_f1": 0.8314606741573034, "eval_overall_precision": 0.7914438502673797, "eval_overall_recall": 0.8757396449704142, "eval_runtime": 0.3337, "eval_samples_per_second": 560.411, "eval_steps_per_second": 8.991, "step": 4664 }, { "epoch": 45.0, "grad_norm": 1.1127651929855347, "learning_rate": 2.7500000000000004e-05, "loss": 0.0483, "step": 4770 }, { "epoch": 45.0, "eval_LOCATION_f1": 0.8551724137931034, "eval_LOCATION_number": 69, "eval_LOCATION_precision": 0.8157894736842105, "eval_LOCATION_recall": 0.8985507246376812, "eval_ORGANIZATION_f1": 0.6929133858267716, "eval_ORGANIZATION_number": 58, "eval_ORGANIZATION_precision": 0.6376811594202898, "eval_ORGANIZATION_recall": 0.7586206896551724, "eval_PERSON_f1": 0.888888888888889, "eval_PERSON_number": 152, "eval_PERSON_precision": 0.8588957055214724, "eval_PERSON_recall": 0.9210526315789473, "eval_QUANTITY_f1": 0.6388888888888888, "eval_QUANTITY_number": 30, "eval_QUANTITY_precision": 0.5476190476190477, "eval_QUANTITY_recall": 0.7666666666666667, "eval_TIME_f1": 0.7868852459016394, "eval_TIME_number": 29, "eval_TIME_precision": 0.75, "eval_TIME_recall": 0.8275862068965517, "eval_loss": 0.17468813061714172, "eval_overall_accuracy": 0.954673495518566, "eval_overall_f1": 0.8138888888888889, "eval_overall_precision": 0.7670157068062827, "eval_overall_recall": 0.8668639053254438, "eval_runtime": 0.3348, "eval_samples_per_second": 558.469, "eval_steps_per_second": 8.959, "step": 4770 }, { "epoch": 46.0, "grad_norm": 0.21913494169712067, "learning_rate": 2.7000000000000002e-05, "loss": 0.045, "step": 4876 }, { "epoch": 46.0, "eval_LOCATION_f1": 0.8513513513513514, "eval_LOCATION_number": 69, "eval_LOCATION_precision": 0.7974683544303798, "eval_LOCATION_recall": 0.9130434782608695, "eval_ORGANIZATION_f1": 0.6942148760330579, "eval_ORGANIZATION_number": 58, "eval_ORGANIZATION_precision": 0.6666666666666666, "eval_ORGANIZATION_recall": 0.7241379310344828, "eval_PERSON_f1": 0.89171974522293, "eval_PERSON_number": 152, "eval_PERSON_precision": 0.8641975308641975, "eval_PERSON_recall": 0.9210526315789473, "eval_QUANTITY_f1": 0.7352941176470588, "eval_QUANTITY_number": 30, "eval_QUANTITY_precision": 0.6578947368421053, "eval_QUANTITY_recall": 0.8333333333333334, "eval_TIME_f1": 0.7272727272727273, "eval_TIME_number": 29, "eval_TIME_precision": 0.6486486486486487, "eval_TIME_recall": 0.8275862068965517, "eval_loss": 0.1735159456729889, "eval_overall_accuracy": 0.9577464788732394, "eval_overall_f1": 0.8200836820083682, "eval_overall_precision": 0.7757255936675461, "eval_overall_recall": 0.8698224852071006, "eval_runtime": 0.3358, "eval_samples_per_second": 556.961, "eval_steps_per_second": 8.935, "step": 4876 }, { "epoch": 47.0, "grad_norm": 0.8087287545204163, "learning_rate": 2.6500000000000004e-05, "loss": 0.0431, "step": 4982 }, { "epoch": 47.0, "eval_LOCATION_f1": 0.8689655172413793, "eval_LOCATION_number": 69, "eval_LOCATION_precision": 0.8289473684210527, "eval_LOCATION_recall": 0.9130434782608695, "eval_ORGANIZATION_f1": 0.6829268292682927, "eval_ORGANIZATION_number": 58, "eval_ORGANIZATION_precision": 0.6461538461538462, "eval_ORGANIZATION_recall": 0.7241379310344828, "eval_PERSON_f1": 0.8860759493670887, "eval_PERSON_number": 152, "eval_PERSON_precision": 0.8536585365853658, "eval_PERSON_recall": 0.9210526315789473, "eval_QUANTITY_f1": 0.7164179104477612, "eval_QUANTITY_number": 30, "eval_QUANTITY_precision": 0.6486486486486487, "eval_QUANTITY_recall": 0.8, "eval_TIME_f1": 0.7619047619047619, "eval_TIME_number": 29, "eval_TIME_precision": 0.7058823529411765, "eval_TIME_recall": 0.8275862068965517, "eval_loss": 0.17915095388889313, "eval_overall_accuracy": 0.9585147247119078, "eval_overall_f1": 0.8207282913165266, "eval_overall_precision": 0.7792553191489362, "eval_overall_recall": 0.8668639053254438, "eval_runtime": 0.3356, "eval_samples_per_second": 557.259, "eval_steps_per_second": 8.94, "step": 4982 }, { "epoch": 48.0, "grad_norm": 1.3942605257034302, "learning_rate": 2.6000000000000002e-05, "loss": 0.0424, "step": 5088 }, { "epoch": 48.0, "eval_LOCATION_f1": 0.8648648648648648, "eval_LOCATION_number": 69, "eval_LOCATION_precision": 0.810126582278481, "eval_LOCATION_recall": 0.927536231884058, "eval_ORGANIZATION_f1": 0.7419354838709677, "eval_ORGANIZATION_number": 58, "eval_ORGANIZATION_precision": 0.696969696969697, "eval_ORGANIZATION_recall": 0.7931034482758621, "eval_PERSON_f1": 0.8924050632911392, "eval_PERSON_number": 152, "eval_PERSON_precision": 0.8597560975609756, "eval_PERSON_recall": 0.9276315789473685, "eval_QUANTITY_f1": 0.7058823529411765, "eval_QUANTITY_number": 30, "eval_QUANTITY_precision": 0.631578947368421, "eval_QUANTITY_recall": 0.8, "eval_TIME_f1": 0.7868852459016394, "eval_TIME_number": 29, "eval_TIME_precision": 0.75, "eval_TIME_recall": 0.8275862068965517, "eval_loss": 0.1734819859266281, "eval_overall_accuracy": 0.9605633802816902, "eval_overall_f1": 0.8340306834030683, "eval_overall_precision": 0.7889182058047494, "eval_overall_recall": 0.8846153846153846, "eval_runtime": 0.335, "eval_samples_per_second": 558.27, "eval_steps_per_second": 8.956, "step": 5088 }, { "epoch": 49.0, "grad_norm": 0.8996381759643555, "learning_rate": 2.5500000000000003e-05, "loss": 0.0426, "step": 5194 }, { "epoch": 49.0, "eval_LOCATION_f1": 0.863013698630137, "eval_LOCATION_number": 69, "eval_LOCATION_precision": 0.8181818181818182, "eval_LOCATION_recall": 0.9130434782608695, "eval_ORGANIZATION_f1": 0.7441860465116279, "eval_ORGANIZATION_number": 58, "eval_ORGANIZATION_precision": 0.676056338028169, "eval_ORGANIZATION_recall": 0.8275862068965517, "eval_PERSON_f1": 0.8867924528301887, "eval_PERSON_number": 152, "eval_PERSON_precision": 0.8493975903614458, "eval_PERSON_recall": 0.9276315789473685, "eval_QUANTITY_f1": 0.8181818181818182, "eval_QUANTITY_number": 30, "eval_QUANTITY_precision": 0.75, "eval_QUANTITY_recall": 0.9, "eval_TIME_f1": 0.75, "eval_TIME_number": 29, "eval_TIME_precision": 0.6857142857142857, "eval_TIME_recall": 0.8275862068965517, "eval_loss": 0.17559018731117249, "eval_overall_accuracy": 0.9597951344430218, "eval_overall_f1": 0.8381742738589212, "eval_overall_precision": 0.787012987012987, "eval_overall_recall": 0.8964497041420119, "eval_runtime": 0.3329, "eval_samples_per_second": 561.775, "eval_steps_per_second": 9.012, "step": 5194 }, { "epoch": 50.0, "grad_norm": 0.22222945094108582, "learning_rate": 2.5e-05, "loss": 0.0412, "step": 5300 }, { "epoch": 50.0, "eval_LOCATION_f1": 0.8767123287671235, "eval_LOCATION_number": 69, "eval_LOCATION_precision": 0.8311688311688312, "eval_LOCATION_recall": 0.927536231884058, "eval_ORGANIZATION_f1": 0.6548672566371682, "eval_ORGANIZATION_number": 58, "eval_ORGANIZATION_precision": 0.6727272727272727, "eval_ORGANIZATION_recall": 0.6379310344827587, "eval_PERSON_f1": 0.8832807570977917, "eval_PERSON_number": 152, "eval_PERSON_precision": 0.8484848484848485, "eval_PERSON_recall": 0.9210526315789473, "eval_QUANTITY_f1": 0.7761194029850748, "eval_QUANTITY_number": 30, "eval_QUANTITY_precision": 0.7027027027027027, "eval_QUANTITY_recall": 0.8666666666666667, "eval_TIME_f1": 0.8196721311475409, "eval_TIME_number": 29, "eval_TIME_precision": 0.78125, "eval_TIME_recall": 0.8620689655172413, "eval_loss": 0.16795222461223602, "eval_overall_accuracy": 0.9597951344430218, "eval_overall_f1": 0.8295454545454545, "eval_overall_precision": 0.7978142076502732, "eval_overall_recall": 0.863905325443787, "eval_runtime": 0.3341, "eval_samples_per_second": 559.727, "eval_steps_per_second": 8.98, "step": 5300 }, { "epoch": 51.0, "grad_norm": 0.7834493517875671, "learning_rate": 2.45e-05, "loss": 0.0407, "step": 5406 }, { "epoch": 51.0, "eval_LOCATION_f1": 0.870748299319728, "eval_LOCATION_number": 69, "eval_LOCATION_precision": 0.8205128205128205, "eval_LOCATION_recall": 0.927536231884058, "eval_ORGANIZATION_f1": 0.6557377049180328, "eval_ORGANIZATION_number": 58, "eval_ORGANIZATION_precision": 0.625, "eval_ORGANIZATION_recall": 0.6896551724137931, "eval_PERSON_f1": 0.9015873015873016, "eval_PERSON_number": 152, "eval_PERSON_precision": 0.8711656441717791, "eval_PERSON_recall": 0.9342105263157895, "eval_QUANTITY_f1": 0.746268656716418, "eval_QUANTITY_number": 30, "eval_QUANTITY_precision": 0.6756756756756757, "eval_QUANTITY_recall": 0.8333333333333334, "eval_TIME_f1": 0.7868852459016394, "eval_TIME_number": 29, "eval_TIME_precision": 0.75, "eval_TIME_recall": 0.8275862068965517, "eval_loss": 0.17565281689167023, "eval_overall_accuracy": 0.9595390524967989, "eval_overall_f1": 0.8286516853932584, "eval_overall_precision": 0.7887700534759359, "eval_overall_recall": 0.8727810650887574, "eval_runtime": 0.3349, "eval_samples_per_second": 558.379, "eval_steps_per_second": 8.958, "step": 5406 }, { "epoch": 52.0, "grad_norm": 0.5259361863136292, "learning_rate": 2.4e-05, "loss": 0.0421, "step": 5512 }, { "epoch": 52.0, "eval_LOCATION_f1": 0.863013698630137, "eval_LOCATION_number": 69, "eval_LOCATION_precision": 0.8181818181818182, "eval_LOCATION_recall": 0.9130434782608695, "eval_ORGANIZATION_f1": 0.7142857142857142, "eval_ORGANIZATION_number": 58, "eval_ORGANIZATION_precision": 0.6617647058823529, "eval_ORGANIZATION_recall": 0.7758620689655172, "eval_PERSON_f1": 0.888888888888889, "eval_PERSON_number": 152, "eval_PERSON_precision": 0.8588957055214724, "eval_PERSON_recall": 0.9210526315789473, "eval_QUANTITY_f1": 0.7761194029850748, "eval_QUANTITY_number": 30, "eval_QUANTITY_precision": 0.7027027027027027, "eval_QUANTITY_recall": 0.8666666666666667, "eval_TIME_f1": 0.75, "eval_TIME_number": 29, "eval_TIME_precision": 0.6857142857142857, "eval_TIME_recall": 0.8275862068965517, "eval_loss": 0.18448342382907867, "eval_overall_accuracy": 0.9587708066581306, "eval_overall_f1": 0.83008356545961, "eval_overall_precision": 0.7842105263157895, "eval_overall_recall": 0.8816568047337278, "eval_runtime": 0.3359, "eval_samples_per_second": 556.686, "eval_steps_per_second": 8.931, "step": 5512 }, { "epoch": 53.0, "grad_norm": 1.3698176145553589, "learning_rate": 2.35e-05, "loss": 0.0415, "step": 5618 }, { "epoch": 53.0, "eval_LOCATION_f1": 0.882758620689655, "eval_LOCATION_number": 69, "eval_LOCATION_precision": 0.8421052631578947, "eval_LOCATION_recall": 0.927536231884058, "eval_ORGANIZATION_f1": 0.7142857142857142, "eval_ORGANIZATION_number": 58, "eval_ORGANIZATION_precision": 0.6617647058823529, "eval_ORGANIZATION_recall": 0.7758620689655172, "eval_PERSON_f1": 0.888888888888889, "eval_PERSON_number": 152, "eval_PERSON_precision": 0.8588957055214724, "eval_PERSON_recall": 0.9210526315789473, "eval_QUANTITY_f1": 0.7941176470588235, "eval_QUANTITY_number": 30, "eval_QUANTITY_precision": 0.7105263157894737, "eval_QUANTITY_recall": 0.9, "eval_TIME_f1": 0.7741935483870968, "eval_TIME_number": 29, "eval_TIME_precision": 0.7272727272727273, "eval_TIME_recall": 0.8275862068965517, "eval_loss": 0.180740624666214, "eval_overall_accuracy": 0.9603072983354674, "eval_overall_f1": 0.8379888268156425, "eval_overall_precision": 0.7936507936507936, "eval_overall_recall": 0.8875739644970414, "eval_runtime": 0.3346, "eval_samples_per_second": 558.915, "eval_steps_per_second": 8.967, "step": 5618 }, { "epoch": 54.0, "grad_norm": 0.6899826526641846, "learning_rate": 2.3000000000000003e-05, "loss": 0.0378, "step": 5724 }, { "epoch": 54.0, "eval_LOCATION_f1": 0.8689655172413793, "eval_LOCATION_number": 69, "eval_LOCATION_precision": 0.8289473684210527, "eval_LOCATION_recall": 0.9130434782608695, "eval_ORGANIZATION_f1": 0.6615384615384615, "eval_ORGANIZATION_number": 58, "eval_ORGANIZATION_precision": 0.5972222222222222, "eval_ORGANIZATION_recall": 0.7413793103448276, "eval_PERSON_f1": 0.888888888888889, "eval_PERSON_number": 152, "eval_PERSON_precision": 0.8588957055214724, "eval_PERSON_recall": 0.9210526315789473, "eval_QUANTITY_f1": 0.8059701492537312, "eval_QUANTITY_number": 30, "eval_QUANTITY_precision": 0.7297297297297297, "eval_QUANTITY_recall": 0.9, "eval_TIME_f1": 0.7619047619047619, "eval_TIME_number": 29, "eval_TIME_precision": 0.7058823529411765, "eval_TIME_recall": 0.8275862068965517, "eval_loss": 0.1903461366891861, "eval_overall_accuracy": 0.9587708066581306, "eval_overall_f1": 0.8250000000000001, "eval_overall_precision": 0.7774869109947644, "eval_overall_recall": 0.878698224852071, "eval_runtime": 0.3444, "eval_samples_per_second": 542.946, "eval_steps_per_second": 8.71, "step": 5724 }, { "epoch": 55.0, "grad_norm": 1.0006171464920044, "learning_rate": 2.25e-05, "loss": 0.0388, "step": 5830 }, { "epoch": 55.0, "eval_LOCATION_f1": 0.8767123287671235, "eval_LOCATION_number": 69, "eval_LOCATION_precision": 0.8311688311688312, "eval_LOCATION_recall": 0.927536231884058, "eval_ORGANIZATION_f1": 0.7166666666666668, "eval_ORGANIZATION_number": 58, "eval_ORGANIZATION_precision": 0.6935483870967742, "eval_ORGANIZATION_recall": 0.7413793103448276, "eval_PERSON_f1": 0.8980891719745223, "eval_PERSON_number": 152, "eval_PERSON_precision": 0.8703703703703703, "eval_PERSON_recall": 0.9276315789473685, "eval_QUANTITY_f1": 0.7164179104477612, "eval_QUANTITY_number": 30, "eval_QUANTITY_precision": 0.6486486486486487, "eval_QUANTITY_recall": 0.8, "eval_TIME_f1": 0.75, "eval_TIME_number": 29, "eval_TIME_precision": 0.6857142857142857, "eval_TIME_recall": 0.8275862068965517, "eval_loss": 0.18361018598079681, "eval_overall_accuracy": 0.9592829705505762, "eval_overall_f1": 0.8326300984528833, "eval_overall_precision": 0.7935656836461126, "eval_overall_recall": 0.8757396449704142, "eval_runtime": 0.3373, "eval_samples_per_second": 554.414, "eval_steps_per_second": 8.894, "step": 5830 }, { "epoch": 56.0, "grad_norm": 0.8649386167526245, "learning_rate": 2.2000000000000003e-05, "loss": 0.0381, "step": 5936 }, { "epoch": 56.0, "eval_LOCATION_f1": 0.8689655172413793, "eval_LOCATION_number": 69, "eval_LOCATION_precision": 0.8289473684210527, "eval_LOCATION_recall": 0.9130434782608695, "eval_ORGANIZATION_f1": 0.688, "eval_ORGANIZATION_number": 58, "eval_ORGANIZATION_precision": 0.6417910447761194, "eval_ORGANIZATION_recall": 0.7413793103448276, "eval_PERSON_f1": 0.89171974522293, "eval_PERSON_number": 152, "eval_PERSON_precision": 0.8641975308641975, "eval_PERSON_recall": 0.9210526315789473, "eval_QUANTITY_f1": 0.7647058823529413, "eval_QUANTITY_number": 30, "eval_QUANTITY_precision": 0.6842105263157895, "eval_QUANTITY_recall": 0.8666666666666667, "eval_TIME_f1": 0.8813559322033899, "eval_TIME_number": 29, "eval_TIME_precision": 0.8666666666666667, "eval_TIME_recall": 0.896551724137931, "eval_loss": 0.17993959784507751, "eval_overall_accuracy": 0.9595390524967989, "eval_overall_f1": 0.8382559774964837, "eval_overall_precision": 0.7989276139410187, "eval_overall_recall": 0.8816568047337278, "eval_runtime": 0.3352, "eval_samples_per_second": 557.898, "eval_steps_per_second": 8.95, "step": 5936 }, { "epoch": 57.0, "grad_norm": 0.5134249925613403, "learning_rate": 2.15e-05, "loss": 0.0377, "step": 6042 }, { "epoch": 57.0, "eval_LOCATION_f1": 0.8689655172413793, "eval_LOCATION_number": 69, "eval_LOCATION_precision": 0.8289473684210527, "eval_LOCATION_recall": 0.9130434782608695, "eval_ORGANIZATION_f1": 0.6451612903225807, "eval_ORGANIZATION_number": 58, "eval_ORGANIZATION_precision": 0.6060606060606061, "eval_ORGANIZATION_recall": 0.6896551724137931, "eval_PERSON_f1": 0.8797468354430381, "eval_PERSON_number": 152, "eval_PERSON_precision": 0.8475609756097561, "eval_PERSON_recall": 0.9144736842105263, "eval_QUANTITY_f1": 0.7941176470588235, "eval_QUANTITY_number": 30, "eval_QUANTITY_precision": 0.7105263157894737, "eval_QUANTITY_recall": 0.9, "eval_TIME_f1": 0.7692307692307692, "eval_TIME_number": 29, "eval_TIME_precision": 0.6944444444444444, "eval_TIME_recall": 0.8620689655172413, "eval_loss": 0.1980062872171402, "eval_overall_accuracy": 0.9554417413572344, "eval_overall_f1": 0.8189415041782729, "eval_overall_precision": 0.7736842105263158, "eval_overall_recall": 0.8698224852071006, "eval_runtime": 0.3364, "eval_samples_per_second": 555.829, "eval_steps_per_second": 8.917, "step": 6042 }, { "epoch": 58.0, "grad_norm": 1.7326457500457764, "learning_rate": 2.1e-05, "loss": 0.0382, "step": 6148 }, { "epoch": 58.0, "eval_LOCATION_f1": 0.8671328671328672, "eval_LOCATION_number": 69, "eval_LOCATION_precision": 0.8378378378378378, "eval_LOCATION_recall": 0.8985507246376812, "eval_ORGANIZATION_f1": 0.688, "eval_ORGANIZATION_number": 58, "eval_ORGANIZATION_precision": 0.6417910447761194, "eval_ORGANIZATION_recall": 0.7413793103448276, "eval_PERSON_f1": 0.8980891719745223, "eval_PERSON_number": 152, "eval_PERSON_precision": 0.8703703703703703, "eval_PERSON_recall": 0.9276315789473685, "eval_QUANTITY_f1": 0.7352941176470588, "eval_QUANTITY_number": 30, "eval_QUANTITY_precision": 0.6578947368421053, "eval_QUANTITY_recall": 0.8333333333333334, "eval_TIME_f1": 0.7619047619047619, "eval_TIME_number": 29, "eval_TIME_precision": 0.7058823529411765, "eval_TIME_recall": 0.8275862068965517, "eval_loss": 0.1960817277431488, "eval_overall_accuracy": 0.9562099871959027, "eval_overall_f1": 0.8274894810659188, "eval_overall_precision": 0.7866666666666666, "eval_overall_recall": 0.8727810650887574, "eval_runtime": 0.3347, "eval_samples_per_second": 558.716, "eval_steps_per_second": 8.963, "step": 6148 }, { "epoch": 59.0, "grad_norm": 0.785622239112854, "learning_rate": 2.05e-05, "loss": 0.0358, "step": 6254 }, { "epoch": 59.0, "eval_LOCATION_f1": 0.8689655172413793, "eval_LOCATION_number": 69, "eval_LOCATION_precision": 0.8289473684210527, "eval_LOCATION_recall": 0.9130434782608695, "eval_ORGANIZATION_f1": 0.6984126984126984, "eval_ORGANIZATION_number": 58, "eval_ORGANIZATION_precision": 0.6470588235294118, "eval_ORGANIZATION_recall": 0.7586206896551724, "eval_PERSON_f1": 0.8952380952380953, "eval_PERSON_number": 152, "eval_PERSON_precision": 0.8650306748466258, "eval_PERSON_recall": 0.9276315789473685, "eval_QUANTITY_f1": 0.7536231884057971, "eval_QUANTITY_number": 30, "eval_QUANTITY_precision": 0.6666666666666666, "eval_QUANTITY_recall": 0.8666666666666667, "eval_TIME_f1": 0.8196721311475409, "eval_TIME_number": 29, "eval_TIME_precision": 0.78125, "eval_TIME_recall": 0.8620689655172413, "eval_loss": 0.1875164657831192, "eval_overall_accuracy": 0.9600512163892445, "eval_overall_f1": 0.835195530726257, "eval_overall_precision": 0.791005291005291, "eval_overall_recall": 0.8846153846153846, "eval_runtime": 0.3334, "eval_samples_per_second": 560.851, "eval_steps_per_second": 8.998, "step": 6254 }, { "epoch": 60.0, "grad_norm": 0.8723583221435547, "learning_rate": 2e-05, "loss": 0.0355, "step": 6360 }, { "epoch": 60.0, "eval_LOCATION_f1": 0.8689655172413793, "eval_LOCATION_number": 69, "eval_LOCATION_precision": 0.8289473684210527, "eval_LOCATION_recall": 0.9130434782608695, "eval_ORGANIZATION_f1": 0.703125, "eval_ORGANIZATION_number": 58, "eval_ORGANIZATION_precision": 0.6428571428571429, "eval_ORGANIZATION_recall": 0.7758620689655172, "eval_PERSON_f1": 0.8938906752411576, "eval_PERSON_number": 152, "eval_PERSON_precision": 0.8742138364779874, "eval_PERSON_recall": 0.9144736842105263, "eval_QUANTITY_f1": 0.7164179104477612, "eval_QUANTITY_number": 30, "eval_QUANTITY_precision": 0.6486486486486487, "eval_QUANTITY_recall": 0.8, "eval_TIME_f1": 0.8196721311475409, "eval_TIME_number": 29, "eval_TIME_precision": 0.78125, "eval_TIME_recall": 0.8620689655172413, "eval_loss": 0.19338777661323547, "eval_overall_accuracy": 0.9577464788732394, "eval_overall_f1": 0.8314606741573034, "eval_overall_precision": 0.7914438502673797, "eval_overall_recall": 0.8757396449704142, "eval_runtime": 0.3431, "eval_samples_per_second": 544.973, "eval_steps_per_second": 8.743, "step": 6360 }, { "epoch": 61.0, "grad_norm": 1.1464908123016357, "learning_rate": 1.9500000000000003e-05, "loss": 0.037, "step": 6466 }, { "epoch": 61.0, "eval_LOCATION_f1": 0.8749999999999999, "eval_LOCATION_number": 69, "eval_LOCATION_precision": 0.84, "eval_LOCATION_recall": 0.9130434782608695, "eval_ORGANIZATION_f1": 0.6929133858267716, "eval_ORGANIZATION_number": 58, "eval_ORGANIZATION_precision": 0.6376811594202898, "eval_ORGANIZATION_recall": 0.7586206896551724, "eval_PERSON_f1": 0.8945686900958467, "eval_PERSON_number": 152, "eval_PERSON_precision": 0.8695652173913043, "eval_PERSON_recall": 0.9210526315789473, "eval_QUANTITY_f1": 0.7647058823529413, "eval_QUANTITY_number": 30, "eval_QUANTITY_precision": 0.6842105263157895, "eval_QUANTITY_recall": 0.8666666666666667, "eval_TIME_f1": 0.75, "eval_TIME_number": 29, "eval_TIME_precision": 0.6857142857142857, "eval_TIME_recall": 0.8275862068965517, "eval_loss": 0.18568746745586395, "eval_overall_accuracy": 0.9592829705505762, "eval_overall_f1": 0.829608938547486, "eval_overall_precision": 0.7857142857142857, "eval_overall_recall": 0.878698224852071, "eval_runtime": 0.3342, "eval_samples_per_second": 559.582, "eval_steps_per_second": 8.977, "step": 6466 }, { "epoch": 62.0, "grad_norm": 0.577111542224884, "learning_rate": 1.9e-05, "loss": 0.0342, "step": 6572 }, { "epoch": 62.0, "eval_LOCATION_f1": 0.8689655172413793, "eval_LOCATION_number": 69, "eval_LOCATION_precision": 0.8289473684210527, "eval_LOCATION_recall": 0.9130434782608695, "eval_ORGANIZATION_f1": 0.671875, "eval_ORGANIZATION_number": 58, "eval_ORGANIZATION_precision": 0.6142857142857143, "eval_ORGANIZATION_recall": 0.7413793103448276, "eval_PERSON_f1": 0.8853503184713376, "eval_PERSON_number": 152, "eval_PERSON_precision": 0.8580246913580247, "eval_PERSON_recall": 0.9144736842105263, "eval_QUANTITY_f1": 0.7272727272727272, "eval_QUANTITY_number": 30, "eval_QUANTITY_precision": 0.6666666666666666, "eval_QUANTITY_recall": 0.8, "eval_TIME_f1": 0.7619047619047619, "eval_TIME_number": 29, "eval_TIME_precision": 0.7058823529411765, "eval_TIME_recall": 0.8275862068965517, "eval_loss": 0.19420312345027924, "eval_overall_accuracy": 0.9564660691421255, "eval_overall_f1": 0.8184357541899442, "eval_overall_precision": 0.7751322751322751, "eval_overall_recall": 0.8668639053254438, "eval_runtime": 0.3361, "eval_samples_per_second": 556.377, "eval_steps_per_second": 8.926, "step": 6572 }, { "epoch": 63.0, "grad_norm": 0.4379956126213074, "learning_rate": 1.85e-05, "loss": 0.0349, "step": 6678 }, { "epoch": 63.0, "eval_LOCATION_f1": 0.888888888888889, "eval_LOCATION_number": 69, "eval_LOCATION_precision": 0.8533333333333334, "eval_LOCATION_recall": 0.927536231884058, "eval_ORGANIZATION_f1": 0.6942148760330579, "eval_ORGANIZATION_number": 58, "eval_ORGANIZATION_precision": 0.6666666666666666, "eval_ORGANIZATION_recall": 0.7241379310344828, "eval_PERSON_f1": 0.8924050632911392, "eval_PERSON_number": 152, "eval_PERSON_precision": 0.8597560975609756, "eval_PERSON_recall": 0.9276315789473685, "eval_QUANTITY_f1": 0.8059701492537312, "eval_QUANTITY_number": 30, "eval_QUANTITY_precision": 0.7297297297297297, "eval_QUANTITY_recall": 0.9, "eval_TIME_f1": 0.8387096774193549, "eval_TIME_number": 29, "eval_TIME_precision": 0.7878787878787878, "eval_TIME_recall": 0.896551724137931, "eval_loss": 0.18639543652534485, "eval_overall_accuracy": 0.9603072983354674, "eval_overall_f1": 0.8450704225352114, "eval_overall_precision": 0.8064516129032258, "eval_overall_recall": 0.8875739644970414, "eval_runtime": 0.339, "eval_samples_per_second": 551.625, "eval_steps_per_second": 8.85, "step": 6678 }, { "epoch": 64.0, "grad_norm": 1.331531286239624, "learning_rate": 1.8e-05, "loss": 0.0316, "step": 6784 }, { "epoch": 64.0, "eval_LOCATION_f1": 0.8689655172413793, "eval_LOCATION_number": 69, "eval_LOCATION_precision": 0.8289473684210527, "eval_LOCATION_recall": 0.9130434782608695, "eval_ORGANIZATION_f1": 0.6814814814814815, "eval_ORGANIZATION_number": 58, "eval_ORGANIZATION_precision": 0.5974025974025974, "eval_ORGANIZATION_recall": 0.7931034482758621, "eval_PERSON_f1": 0.8825396825396825, "eval_PERSON_number": 152, "eval_PERSON_precision": 0.852760736196319, "eval_PERSON_recall": 0.9144736842105263, "eval_QUANTITY_f1": 0.7647058823529413, "eval_QUANTITY_number": 30, "eval_QUANTITY_precision": 0.6842105263157895, "eval_QUANTITY_recall": 0.8666666666666667, "eval_TIME_f1": 0.7619047619047619, "eval_TIME_number": 29, "eval_TIME_precision": 0.7058823529411765, "eval_TIME_recall": 0.8275862068965517, "eval_loss": 0.19557389616966248, "eval_overall_accuracy": 0.9554417413572344, "eval_overall_f1": 0.8209366391184573, "eval_overall_precision": 0.7680412371134021, "eval_overall_recall": 0.8816568047337278, "eval_runtime": 0.3402, "eval_samples_per_second": 549.599, "eval_steps_per_second": 8.817, "step": 6784 }, { "epoch": 65.0, "grad_norm": 0.3099250793457031, "learning_rate": 1.75e-05, "loss": 0.0358, "step": 6890 }, { "epoch": 65.0, "eval_LOCATION_f1": 0.882758620689655, "eval_LOCATION_number": 69, "eval_LOCATION_precision": 0.8421052631578947, "eval_LOCATION_recall": 0.927536231884058, "eval_ORGANIZATION_f1": 0.6808510638297872, "eval_ORGANIZATION_number": 58, "eval_ORGANIZATION_precision": 0.5783132530120482, "eval_ORGANIZATION_recall": 0.8275862068965517, "eval_PERSON_f1": 0.9015873015873016, "eval_PERSON_number": 152, "eval_PERSON_precision": 0.8711656441717791, "eval_PERSON_recall": 0.9342105263157895, "eval_QUANTITY_f1": 0.7575757575757577, "eval_QUANTITY_number": 30, "eval_QUANTITY_precision": 0.6944444444444444, "eval_QUANTITY_recall": 0.8333333333333334, "eval_TIME_f1": 0.75, "eval_TIME_number": 29, "eval_TIME_precision": 0.6857142857142857, "eval_TIME_recall": 0.8275862068965517, "eval_loss": 0.19938279688358307, "eval_overall_accuracy": 0.9567221510883482, "eval_overall_f1": 0.8290013679890562, "eval_overall_precision": 0.7709923664122137, "eval_overall_recall": 0.8964497041420119, "eval_runtime": 0.3388, "eval_samples_per_second": 551.909, "eval_steps_per_second": 8.854, "step": 6890 }, { "epoch": 66.0, "grad_norm": 0.5862748026847839, "learning_rate": 1.7000000000000003e-05, "loss": 0.0317, "step": 6996 }, { "epoch": 66.0, "eval_LOCATION_f1": 0.882758620689655, "eval_LOCATION_number": 69, "eval_LOCATION_precision": 0.8421052631578947, "eval_LOCATION_recall": 0.927536231884058, "eval_ORGANIZATION_f1": 0.6559999999999999, "eval_ORGANIZATION_number": 58, "eval_ORGANIZATION_precision": 0.6119402985074627, "eval_ORGANIZATION_recall": 0.7068965517241379, "eval_PERSON_f1": 0.8952380952380953, "eval_PERSON_number": 152, "eval_PERSON_precision": 0.8650306748466258, "eval_PERSON_recall": 0.9276315789473685, "eval_QUANTITY_f1": 0.7058823529411765, "eval_QUANTITY_number": 30, "eval_QUANTITY_precision": 0.631578947368421, "eval_QUANTITY_recall": 0.8, "eval_TIME_f1": 0.75, "eval_TIME_number": 29, "eval_TIME_precision": 0.6857142857142857, "eval_TIME_recall": 0.8275862068965517, "eval_loss": 0.21487130224704742, "eval_overall_accuracy": 0.9556978233034571, "eval_overall_f1": 0.8200836820083682, "eval_overall_precision": 0.7757255936675461, "eval_overall_recall": 0.8698224852071006, "eval_runtime": 0.3359, "eval_samples_per_second": 556.74, "eval_steps_per_second": 8.932, "step": 6996 }, { "epoch": 67.0, "grad_norm": 0.5351269841194153, "learning_rate": 1.65e-05, "loss": 0.0335, "step": 7102 }, { "epoch": 67.0, "eval_LOCATION_f1": 0.863013698630137, "eval_LOCATION_number": 69, "eval_LOCATION_precision": 0.8181818181818182, "eval_LOCATION_recall": 0.9130434782608695, "eval_ORGANIZATION_f1": 0.7040000000000001, "eval_ORGANIZATION_number": 58, "eval_ORGANIZATION_precision": 0.6567164179104478, "eval_ORGANIZATION_recall": 0.7586206896551724, "eval_PERSON_f1": 0.9079365079365079, "eval_PERSON_number": 152, "eval_PERSON_precision": 0.8773006134969326, "eval_PERSON_recall": 0.9407894736842105, "eval_QUANTITY_f1": 0.7272727272727272, "eval_QUANTITY_number": 30, "eval_QUANTITY_precision": 0.6666666666666666, "eval_QUANTITY_recall": 0.8, "eval_TIME_f1": 0.8253968253968255, "eval_TIME_number": 29, "eval_TIME_precision": 0.7647058823529411, "eval_TIME_recall": 0.896551724137931, "eval_loss": 0.1979534924030304, "eval_overall_accuracy": 0.9603072983354674, "eval_overall_f1": 0.8391608391608392, "eval_overall_precision": 0.7957559681697612, "eval_overall_recall": 0.8875739644970414, "eval_runtime": 0.3372, "eval_samples_per_second": 554.49, "eval_steps_per_second": 8.896, "step": 7102 }, { "epoch": 68.0, "grad_norm": 0.3918878138065338, "learning_rate": 1.6000000000000003e-05, "loss": 0.0333, "step": 7208 }, { "epoch": 68.0, "eval_LOCATION_f1": 0.863013698630137, "eval_LOCATION_number": 69, "eval_LOCATION_precision": 0.8181818181818182, "eval_LOCATION_recall": 0.9130434782608695, "eval_ORGANIZATION_f1": 0.688, "eval_ORGANIZATION_number": 58, "eval_ORGANIZATION_precision": 0.6417910447761194, "eval_ORGANIZATION_recall": 0.7413793103448276, "eval_PERSON_f1": 0.889589905362776, "eval_PERSON_number": 152, "eval_PERSON_precision": 0.8545454545454545, "eval_PERSON_recall": 0.9276315789473685, "eval_QUANTITY_f1": 0.746268656716418, "eval_QUANTITY_number": 30, "eval_QUANTITY_precision": 0.6756756756756757, "eval_QUANTITY_recall": 0.8333333333333334, "eval_TIME_f1": 0.7384615384615385, "eval_TIME_number": 29, "eval_TIME_precision": 0.6666666666666666, "eval_TIME_recall": 0.8275862068965517, "eval_loss": 0.1945626586675644, "eval_overall_accuracy": 0.9580025608194622, "eval_overall_f1": 0.8222222222222222, "eval_overall_precision": 0.774869109947644, "eval_overall_recall": 0.8757396449704142, "eval_runtime": 0.3368, "eval_samples_per_second": 555.197, "eval_steps_per_second": 8.907, "step": 7208 }, { "epoch": 69.0, "grad_norm": 0.9337367415428162, "learning_rate": 1.55e-05, "loss": 0.0311, "step": 7314 }, { "epoch": 69.0, "eval_LOCATION_f1": 0.8767123287671235, "eval_LOCATION_number": 69, "eval_LOCATION_precision": 0.8311688311688312, "eval_LOCATION_recall": 0.927536231884058, "eval_ORGANIZATION_f1": 0.6991869918699186, "eval_ORGANIZATION_number": 58, "eval_ORGANIZATION_precision": 0.6615384615384615, "eval_ORGANIZATION_recall": 0.7413793103448276, "eval_PERSON_f1": 0.8945686900958467, "eval_PERSON_number": 152, "eval_PERSON_precision": 0.8695652173913043, "eval_PERSON_recall": 0.9210526315789473, "eval_QUANTITY_f1": 0.7878787878787877, "eval_QUANTITY_number": 30, "eval_QUANTITY_precision": 0.7222222222222222, "eval_QUANTITY_recall": 0.8666666666666667, "eval_TIME_f1": 0.896551724137931, "eval_TIME_number": 29, "eval_TIME_precision": 0.896551724137931, "eval_TIME_recall": 0.896551724137931, "eval_loss": 0.19715982675552368, "eval_overall_accuracy": 0.9605633802816902, "eval_overall_f1": 0.8470254957507082, "eval_overall_precision": 0.8125, "eval_overall_recall": 0.8846153846153846, "eval_runtime": 0.3336, "eval_samples_per_second": 560.63, "eval_steps_per_second": 8.994, "step": 7314 }, { "epoch": 70.0, "grad_norm": 1.763173222541809, "learning_rate": 1.5e-05, "loss": 0.0314, "step": 7420 }, { "epoch": 70.0, "eval_LOCATION_f1": 0.8689655172413793, "eval_LOCATION_number": 69, "eval_LOCATION_precision": 0.8289473684210527, "eval_LOCATION_recall": 0.9130434782608695, "eval_ORGANIZATION_f1": 0.7049180327868853, "eval_ORGANIZATION_number": 58, "eval_ORGANIZATION_precision": 0.671875, "eval_ORGANIZATION_recall": 0.7413793103448276, "eval_PERSON_f1": 0.8980891719745223, "eval_PERSON_number": 152, "eval_PERSON_precision": 0.8703703703703703, "eval_PERSON_recall": 0.9276315789473685, "eval_QUANTITY_f1": 0.7761194029850748, "eval_QUANTITY_number": 30, "eval_QUANTITY_precision": 0.7027027027027027, "eval_QUANTITY_recall": 0.8666666666666667, "eval_TIME_f1": 0.75, "eval_TIME_number": 29, "eval_TIME_precision": 0.6857142857142857, "eval_TIME_recall": 0.8275862068965517, "eval_loss": 0.2073572725057602, "eval_overall_accuracy": 0.9572343149807938, "eval_overall_f1": 0.8342696629213484, "eval_overall_precision": 0.7941176470588235, "eval_overall_recall": 0.878698224852071, "eval_runtime": 0.3343, "eval_samples_per_second": 559.3, "eval_steps_per_second": 8.973, "step": 7420 }, { "epoch": 71.0, "grad_norm": 0.9943879842758179, "learning_rate": 1.45e-05, "loss": 0.0317, "step": 7526 }, { "epoch": 71.0, "eval_LOCATION_f1": 0.863013698630137, "eval_LOCATION_number": 69, "eval_LOCATION_precision": 0.8181818181818182, "eval_LOCATION_recall": 0.9130434782608695, "eval_ORGANIZATION_f1": 0.7301587301587301, "eval_ORGANIZATION_number": 58, "eval_ORGANIZATION_precision": 0.6764705882352942, "eval_ORGANIZATION_recall": 0.7931034482758621, "eval_PERSON_f1": 0.9044585987261147, "eval_PERSON_number": 152, "eval_PERSON_precision": 0.8765432098765432, "eval_PERSON_recall": 0.9342105263157895, "eval_QUANTITY_f1": 0.746268656716418, "eval_QUANTITY_number": 30, "eval_QUANTITY_precision": 0.6756756756756757, "eval_QUANTITY_recall": 0.8333333333333334, "eval_TIME_f1": 0.7272727272727273, "eval_TIME_number": 29, "eval_TIME_precision": 0.6486486486486487, "eval_TIME_recall": 0.8275862068965517, "eval_loss": 0.21239928901195526, "eval_overall_accuracy": 0.9577464788732394, "eval_overall_f1": 0.8344923504867873, "eval_overall_precision": 0.7874015748031497, "eval_overall_recall": 0.8875739644970414, "eval_runtime": 0.3359, "eval_samples_per_second": 556.631, "eval_steps_per_second": 8.93, "step": 7526 }, { "epoch": 72.0, "grad_norm": 0.39654669165611267, "learning_rate": 1.4000000000000001e-05, "loss": 0.0297, "step": 7632 }, { "epoch": 72.0, "eval_LOCATION_f1": 0.881118881118881, "eval_LOCATION_number": 69, "eval_LOCATION_precision": 0.8513513513513513, "eval_LOCATION_recall": 0.9130434782608695, "eval_ORGANIZATION_f1": 0.6379310344827587, "eval_ORGANIZATION_number": 58, "eval_ORGANIZATION_precision": 0.6379310344827587, "eval_ORGANIZATION_recall": 0.6379310344827587, "eval_PERSON_f1": 0.9009584664536742, "eval_PERSON_number": 152, "eval_PERSON_precision": 0.8757763975155279, "eval_PERSON_recall": 0.9276315789473685, "eval_QUANTITY_f1": 0.7272727272727272, "eval_QUANTITY_number": 30, "eval_QUANTITY_precision": 0.6666666666666666, "eval_QUANTITY_recall": 0.8, "eval_TIME_f1": 0.75, "eval_TIME_number": 29, "eval_TIME_precision": 0.6857142857142857, "eval_TIME_recall": 0.8275862068965517, "eval_loss": 0.2062947303056717, "eval_overall_accuracy": 0.9567221510883482, "eval_overall_f1": 0.8233618233618234, "eval_overall_precision": 0.7939560439560439, "eval_overall_recall": 0.8550295857988166, "eval_runtime": 0.3343, "eval_samples_per_second": 559.346, "eval_steps_per_second": 8.973, "step": 7632 }, { "epoch": 73.0, "grad_norm": 0.2321532964706421, "learning_rate": 1.3500000000000001e-05, "loss": 0.0293, "step": 7738 }, { "epoch": 73.0, "eval_LOCATION_f1": 0.8767123287671235, "eval_LOCATION_number": 69, "eval_LOCATION_precision": 0.8311688311688312, "eval_LOCATION_recall": 0.927536231884058, "eval_ORGANIZATION_f1": 0.6825396825396826, "eval_ORGANIZATION_number": 58, "eval_ORGANIZATION_precision": 0.6323529411764706, "eval_ORGANIZATION_recall": 0.7413793103448276, "eval_PERSON_f1": 0.9015873015873016, "eval_PERSON_number": 152, "eval_PERSON_precision": 0.8711656441717791, "eval_PERSON_recall": 0.9342105263157895, "eval_QUANTITY_f1": 0.8059701492537312, "eval_QUANTITY_number": 30, "eval_QUANTITY_precision": 0.7297297297297297, "eval_QUANTITY_recall": 0.9, "eval_TIME_f1": 0.8387096774193549, "eval_TIME_number": 29, "eval_TIME_precision": 0.7878787878787878, "eval_TIME_recall": 0.896551724137931, "eval_loss": 0.20541173219680786, "eval_overall_accuracy": 0.9603072983354674, "eval_overall_f1": 0.8435754189944134, "eval_overall_precision": 0.798941798941799, "eval_overall_recall": 0.893491124260355, "eval_runtime": 0.3355, "eval_samples_per_second": 557.322, "eval_steps_per_second": 8.941, "step": 7738 }, { "epoch": 74.0, "grad_norm": 2.329578399658203, "learning_rate": 1.3000000000000001e-05, "loss": 0.0303, "step": 7844 }, { "epoch": 74.0, "eval_LOCATION_f1": 0.863013698630137, "eval_LOCATION_number": 69, "eval_LOCATION_precision": 0.8181818181818182, "eval_LOCATION_recall": 0.9130434782608695, "eval_ORGANIZATION_f1": 0.6666666666666667, "eval_ORGANIZATION_number": 58, "eval_ORGANIZATION_precision": 0.6176470588235294, "eval_ORGANIZATION_recall": 0.7241379310344828, "eval_PERSON_f1": 0.8980891719745223, "eval_PERSON_number": 152, "eval_PERSON_precision": 0.8703703703703703, "eval_PERSON_recall": 0.9276315789473685, "eval_QUANTITY_f1": 0.746268656716418, "eval_QUANTITY_number": 30, "eval_QUANTITY_precision": 0.6756756756756757, "eval_QUANTITY_recall": 0.8333333333333334, "eval_TIME_f1": 0.7619047619047619, "eval_TIME_number": 29, "eval_TIME_precision": 0.7058823529411765, "eval_TIME_recall": 0.8275862068965517, "eval_loss": 0.20924483239650726, "eval_overall_accuracy": 0.9582586427656851, "eval_overall_f1": 0.8240223463687152, "eval_overall_precision": 0.7804232804232805, "eval_overall_recall": 0.8727810650887574, "eval_runtime": 0.3356, "eval_samples_per_second": 557.229, "eval_steps_per_second": 8.939, "step": 7844 }, { "epoch": 75.0, "grad_norm": 0.4096578359603882, "learning_rate": 1.25e-05, "loss": 0.0319, "step": 7950 }, { "epoch": 75.0, "eval_LOCATION_f1": 0.8689655172413793, "eval_LOCATION_number": 69, "eval_LOCATION_precision": 0.8289473684210527, "eval_LOCATION_recall": 0.9130434782608695, "eval_ORGANIZATION_f1": 0.6829268292682927, "eval_ORGANIZATION_number": 58, "eval_ORGANIZATION_precision": 0.6461538461538462, "eval_ORGANIZATION_recall": 0.7241379310344828, "eval_PERSON_f1": 0.89171974522293, "eval_PERSON_number": 152, "eval_PERSON_precision": 0.8641975308641975, "eval_PERSON_recall": 0.9210526315789473, "eval_QUANTITY_f1": 0.7384615384615385, "eval_QUANTITY_number": 30, "eval_QUANTITY_precision": 0.6857142857142857, "eval_QUANTITY_recall": 0.8, "eval_TIME_f1": 0.7384615384615385, "eval_TIME_number": 29, "eval_TIME_precision": 0.6666666666666666, "eval_TIME_recall": 0.8275862068965517, "eval_loss": 0.21165302395820618, "eval_overall_accuracy": 0.9567221510883482, "eval_overall_f1": 0.8230337078651686, "eval_overall_precision": 0.7834224598930482, "eval_overall_recall": 0.8668639053254438, "eval_runtime": 0.3352, "eval_samples_per_second": 557.866, "eval_steps_per_second": 8.95, "step": 7950 }, { "epoch": 76.0, "grad_norm": 0.22333945333957672, "learning_rate": 1.2e-05, "loss": 0.0294, "step": 8056 }, { "epoch": 76.0, "eval_LOCATION_f1": 0.863013698630137, "eval_LOCATION_number": 69, "eval_LOCATION_precision": 0.8181818181818182, "eval_LOCATION_recall": 0.9130434782608695, "eval_ORGANIZATION_f1": 0.6829268292682927, "eval_ORGANIZATION_number": 58, "eval_ORGANIZATION_precision": 0.6461538461538462, "eval_ORGANIZATION_recall": 0.7241379310344828, "eval_PERSON_f1": 0.8974358974358975, "eval_PERSON_number": 152, "eval_PERSON_precision": 0.875, "eval_PERSON_recall": 0.9210526315789473, "eval_QUANTITY_f1": 0.746268656716418, "eval_QUANTITY_number": 30, "eval_QUANTITY_precision": 0.6756756756756757, "eval_QUANTITY_recall": 0.8333333333333334, "eval_TIME_f1": 0.75, "eval_TIME_number": 29, "eval_TIME_precision": 0.6857142857142857, "eval_TIME_recall": 0.8275862068965517, "eval_loss": 0.20302210748195648, "eval_overall_accuracy": 0.9577464788732394, "eval_overall_f1": 0.8258426966292135, "eval_overall_precision": 0.786096256684492, "eval_overall_recall": 0.8698224852071006, "eval_runtime": 0.3339, "eval_samples_per_second": 560.02, "eval_steps_per_second": 8.984, "step": 8056 }, { "epoch": 77.0, "grad_norm": 0.893441915512085, "learning_rate": 1.1500000000000002e-05, "loss": 0.0282, "step": 8162 }, { "epoch": 77.0, "eval_LOCATION_f1": 0.8689655172413793, "eval_LOCATION_number": 69, "eval_LOCATION_precision": 0.8289473684210527, "eval_LOCATION_recall": 0.9130434782608695, "eval_ORGANIZATION_f1": 0.6721311475409836, "eval_ORGANIZATION_number": 58, "eval_ORGANIZATION_precision": 0.640625, "eval_ORGANIZATION_recall": 0.7068965517241379, "eval_PERSON_f1": 0.89171974522293, "eval_PERSON_number": 152, "eval_PERSON_precision": 0.8641975308641975, "eval_PERSON_recall": 0.9210526315789473, "eval_QUANTITY_f1": 0.7761194029850748, "eval_QUANTITY_number": 30, "eval_QUANTITY_precision": 0.7027027027027027, "eval_QUANTITY_recall": 0.8666666666666667, "eval_TIME_f1": 0.7936507936507937, "eval_TIME_number": 29, "eval_TIME_precision": 0.7352941176470589, "eval_TIME_recall": 0.8620689655172413, "eval_loss": 0.20604942739009857, "eval_overall_accuracy": 0.9585147247119078, "eval_overall_f1": 0.829817158931083, "eval_overall_precision": 0.7908847184986595, "eval_overall_recall": 0.8727810650887574, "eval_runtime": 0.3381, "eval_samples_per_second": 553.156, "eval_steps_per_second": 8.874, "step": 8162 }, { "epoch": 78.0, "grad_norm": 1.8298670053482056, "learning_rate": 1.1000000000000001e-05, "loss": 0.0298, "step": 8268 }, { "epoch": 78.0, "eval_LOCATION_f1": 0.8689655172413793, "eval_LOCATION_number": 69, "eval_LOCATION_precision": 0.8289473684210527, "eval_LOCATION_recall": 0.9130434782608695, "eval_ORGANIZATION_f1": 0.6610169491525424, "eval_ORGANIZATION_number": 58, "eval_ORGANIZATION_precision": 0.65, "eval_ORGANIZATION_recall": 0.6724137931034483, "eval_PERSON_f1": 0.8945686900958467, "eval_PERSON_number": 152, "eval_PERSON_precision": 0.8695652173913043, "eval_PERSON_recall": 0.9210526315789473, "eval_QUANTITY_f1": 0.7272727272727272, "eval_QUANTITY_number": 30, "eval_QUANTITY_precision": 0.6666666666666666, "eval_QUANTITY_recall": 0.8, "eval_TIME_f1": 0.7741935483870968, "eval_TIME_number": 29, "eval_TIME_precision": 0.7272727272727273, "eval_TIME_recall": 0.8275862068965517, "eval_loss": 0.20402812957763672, "eval_overall_accuracy": 0.9585147247119078, "eval_overall_f1": 0.8238636363636365, "eval_overall_precision": 0.7923497267759563, "eval_overall_recall": 0.8579881656804734, "eval_runtime": 0.3363, "eval_samples_per_second": 556.081, "eval_steps_per_second": 8.921, "step": 8268 }, { "epoch": 79.0, "grad_norm": 0.38677918910980225, "learning_rate": 1.05e-05, "loss": 0.0296, "step": 8374 }, { "epoch": 79.0, "eval_LOCATION_f1": 0.882758620689655, "eval_LOCATION_number": 69, "eval_LOCATION_precision": 0.8421052631578947, "eval_LOCATION_recall": 0.927536231884058, "eval_ORGANIZATION_f1": 0.6991869918699186, "eval_ORGANIZATION_number": 58, "eval_ORGANIZATION_precision": 0.6615384615384615, "eval_ORGANIZATION_recall": 0.7413793103448276, "eval_PERSON_f1": 0.9009584664536742, "eval_PERSON_number": 152, "eval_PERSON_precision": 0.8757763975155279, "eval_PERSON_recall": 0.9276315789473685, "eval_QUANTITY_f1": 0.7878787878787877, "eval_QUANTITY_number": 30, "eval_QUANTITY_precision": 0.7222222222222222, "eval_QUANTITY_recall": 0.8666666666666667, "eval_TIME_f1": 0.8524590163934426, "eval_TIME_number": 29, "eval_TIME_precision": 0.8125, "eval_TIME_recall": 0.896551724137931, "eval_loss": 0.1978691667318344, "eval_overall_accuracy": 0.9608194622279129, "eval_overall_f1": 0.8474576271186441, "eval_overall_precision": 0.8108108108108109, "eval_overall_recall": 0.8875739644970414, "eval_runtime": 0.3358, "eval_samples_per_second": 556.894, "eval_steps_per_second": 8.934, "step": 8374 }, { "epoch": 80.0, "grad_norm": 0.18261797726154327, "learning_rate": 1e-05, "loss": 0.0281, "step": 8480 }, { "epoch": 80.0, "eval_LOCATION_f1": 0.882758620689655, "eval_LOCATION_number": 69, "eval_LOCATION_precision": 0.8421052631578947, "eval_LOCATION_recall": 0.927536231884058, "eval_ORGANIZATION_f1": 0.7107438016528926, "eval_ORGANIZATION_number": 58, "eval_ORGANIZATION_precision": 0.6825396825396826, "eval_ORGANIZATION_recall": 0.7413793103448276, "eval_PERSON_f1": 0.8945686900958467, "eval_PERSON_number": 152, "eval_PERSON_precision": 0.8695652173913043, "eval_PERSON_recall": 0.9210526315789473, "eval_QUANTITY_f1": 0.7384615384615385, "eval_QUANTITY_number": 30, "eval_QUANTITY_precision": 0.6857142857142857, "eval_QUANTITY_recall": 0.8, "eval_TIME_f1": 0.8125, "eval_TIME_number": 29, "eval_TIME_precision": 0.7428571428571429, "eval_TIME_recall": 0.896551724137931, "eval_loss": 0.2115841805934906, "eval_overall_accuracy": 0.9580025608194622, "eval_overall_f1": 0.8389830508474576, "eval_overall_precision": 0.8027027027027027, "eval_overall_recall": 0.878698224852071, "eval_runtime": 0.3347, "eval_samples_per_second": 558.764, "eval_steps_per_second": 8.964, "step": 8480 }, { "epoch": 81.0, "grad_norm": 0.5827004909515381, "learning_rate": 9.5e-06, "loss": 0.0285, "step": 8586 }, { "epoch": 81.0, "eval_LOCATION_f1": 0.8767123287671235, "eval_LOCATION_number": 69, "eval_LOCATION_precision": 0.8311688311688312, "eval_LOCATION_recall": 0.927536231884058, "eval_ORGANIZATION_f1": 0.6721311475409836, "eval_ORGANIZATION_number": 58, "eval_ORGANIZATION_precision": 0.640625, "eval_ORGANIZATION_recall": 0.7068965517241379, "eval_PERSON_f1": 0.8945686900958467, "eval_PERSON_number": 152, "eval_PERSON_precision": 0.8695652173913043, "eval_PERSON_recall": 0.9210526315789473, "eval_QUANTITY_f1": 0.7272727272727272, "eval_QUANTITY_number": 30, "eval_QUANTITY_precision": 0.6666666666666666, "eval_QUANTITY_recall": 0.8, "eval_TIME_f1": 0.7692307692307692, "eval_TIME_number": 29, "eval_TIME_precision": 0.6944444444444444, "eval_TIME_recall": 0.8620689655172413, "eval_loss": 0.20784814655780792, "eval_overall_accuracy": 0.9569782330345711, "eval_overall_f1": 0.8258426966292135, "eval_overall_precision": 0.786096256684492, "eval_overall_recall": 0.8698224852071006, "eval_runtime": 0.3341, "eval_samples_per_second": 559.746, "eval_steps_per_second": 8.98, "step": 8586 }, { "epoch": 82.0, "grad_norm": 0.163285493850708, "learning_rate": 9e-06, "loss": 0.0248, "step": 8692 }, { "epoch": 82.0, "eval_LOCATION_f1": 0.8689655172413793, "eval_LOCATION_number": 69, "eval_LOCATION_precision": 0.8289473684210527, "eval_LOCATION_recall": 0.9130434782608695, "eval_ORGANIZATION_f1": 0.6612903225806452, "eval_ORGANIZATION_number": 58, "eval_ORGANIZATION_precision": 0.6212121212121212, "eval_ORGANIZATION_recall": 0.7068965517241379, "eval_PERSON_f1": 0.888888888888889, "eval_PERSON_number": 152, "eval_PERSON_precision": 0.8588957055214724, "eval_PERSON_recall": 0.9210526315789473, "eval_QUANTITY_f1": 0.7692307692307692, "eval_QUANTITY_number": 30, "eval_QUANTITY_precision": 0.7142857142857143, "eval_QUANTITY_recall": 0.8333333333333334, "eval_TIME_f1": 0.7352941176470588, "eval_TIME_number": 29, "eval_TIME_precision": 0.6410256410256411, "eval_TIME_recall": 0.8620689655172413, "eval_loss": 0.22002604603767395, "eval_overall_accuracy": 0.9541613316261204, "eval_overall_f1": 0.8200836820083682, "eval_overall_precision": 0.7757255936675461, "eval_overall_recall": 0.8698224852071006, "eval_runtime": 0.3337, "eval_samples_per_second": 560.445, "eval_steps_per_second": 8.991, "step": 8692 }, { "epoch": 83.0, "grad_norm": 0.5999857783317566, "learning_rate": 8.500000000000002e-06, "loss": 0.026, "step": 8798 }, { "epoch": 83.0, "eval_LOCATION_f1": 0.888888888888889, "eval_LOCATION_number": 69, "eval_LOCATION_precision": 0.8533333333333334, "eval_LOCATION_recall": 0.927536231884058, "eval_ORGANIZATION_f1": 0.6666666666666667, "eval_ORGANIZATION_number": 58, "eval_ORGANIZATION_precision": 0.6451612903225806, "eval_ORGANIZATION_recall": 0.6896551724137931, "eval_PERSON_f1": 0.8974358974358975, "eval_PERSON_number": 152, "eval_PERSON_precision": 0.875, "eval_PERSON_recall": 0.9210526315789473, "eval_QUANTITY_f1": 0.7692307692307692, "eval_QUANTITY_number": 30, "eval_QUANTITY_precision": 0.7142857142857143, "eval_QUANTITY_recall": 0.8333333333333334, "eval_TIME_f1": 0.8524590163934426, "eval_TIME_number": 29, "eval_TIME_precision": 0.8125, "eval_TIME_recall": 0.896551724137931, "eval_loss": 0.20526228845119476, "eval_overall_accuracy": 0.9590268886043534, "eval_overall_f1": 0.8404558404558404, "eval_overall_precision": 0.8104395604395604, "eval_overall_recall": 0.8727810650887574, "eval_runtime": 0.3329, "eval_samples_per_second": 561.768, "eval_steps_per_second": 9.012, "step": 8798 }, { "epoch": 84.0, "grad_norm": 0.8914698362350464, "learning_rate": 8.000000000000001e-06, "loss": 0.0267, "step": 8904 }, { "epoch": 84.0, "eval_LOCATION_f1": 0.8767123287671235, "eval_LOCATION_number": 69, "eval_LOCATION_precision": 0.8311688311688312, "eval_LOCATION_recall": 0.927536231884058, "eval_ORGANIZATION_f1": 0.6829268292682927, "eval_ORGANIZATION_number": 58, "eval_ORGANIZATION_precision": 0.6461538461538462, "eval_ORGANIZATION_recall": 0.7241379310344828, "eval_PERSON_f1": 0.8980891719745223, "eval_PERSON_number": 152, "eval_PERSON_precision": 0.8703703703703703, "eval_PERSON_recall": 0.9276315789473685, "eval_QUANTITY_f1": 0.7692307692307692, "eval_QUANTITY_number": 30, "eval_QUANTITY_precision": 0.7142857142857143, "eval_QUANTITY_recall": 0.8333333333333334, "eval_TIME_f1": 0.7999999999999999, "eval_TIME_number": 29, "eval_TIME_precision": 0.7222222222222222, "eval_TIME_recall": 0.896551724137931, "eval_loss": 0.20852600038051605, "eval_overall_accuracy": 0.9585147247119078, "eval_overall_f1": 0.8359046283309958, "eval_overall_precision": 0.7946666666666666, "eval_overall_recall": 0.8816568047337278, "eval_runtime": 0.3353, "eval_samples_per_second": 557.656, "eval_steps_per_second": 8.946, "step": 8904 }, { "epoch": 85.0, "grad_norm": 0.07933935523033142, "learning_rate": 7.5e-06, "loss": 0.0256, "step": 9010 }, { "epoch": 85.0, "eval_LOCATION_f1": 0.8767123287671235, "eval_LOCATION_number": 69, "eval_LOCATION_precision": 0.8311688311688312, "eval_LOCATION_recall": 0.927536231884058, "eval_ORGANIZATION_f1": 0.6774193548387097, "eval_ORGANIZATION_number": 58, "eval_ORGANIZATION_precision": 0.6363636363636364, "eval_ORGANIZATION_recall": 0.7241379310344828, "eval_PERSON_f1": 0.89171974522293, "eval_PERSON_number": 152, "eval_PERSON_precision": 0.8641975308641975, "eval_PERSON_recall": 0.9210526315789473, "eval_QUANTITY_f1": 0.7878787878787877, "eval_QUANTITY_number": 30, "eval_QUANTITY_precision": 0.7222222222222222, "eval_QUANTITY_recall": 0.8666666666666667, "eval_TIME_f1": 0.7999999999999999, "eval_TIME_number": 29, "eval_TIME_precision": 0.7222222222222222, "eval_TIME_recall": 0.896551724137931, "eval_loss": 0.21233612298965454, "eval_overall_accuracy": 0.9582586427656851, "eval_overall_f1": 0.8335664335664336, "eval_overall_precision": 0.7904509283819628, "eval_overall_recall": 0.8816568047337278, "eval_runtime": 0.3363, "eval_samples_per_second": 556.087, "eval_steps_per_second": 8.921, "step": 9010 }, { "epoch": 86.0, "grad_norm": 1.2923147678375244, "learning_rate": 7.000000000000001e-06, "loss": 0.0258, "step": 9116 }, { "epoch": 86.0, "eval_LOCATION_f1": 0.8767123287671235, "eval_LOCATION_number": 69, "eval_LOCATION_precision": 0.8311688311688312, "eval_LOCATION_recall": 0.927536231884058, "eval_ORGANIZATION_f1": 0.7, "eval_ORGANIZATION_number": 58, "eval_ORGANIZATION_precision": 0.6774193548387096, "eval_ORGANIZATION_recall": 0.7241379310344828, "eval_PERSON_f1": 0.8945686900958467, "eval_PERSON_number": 152, "eval_PERSON_precision": 0.8695652173913043, "eval_PERSON_recall": 0.9210526315789473, "eval_QUANTITY_f1": 0.7575757575757577, "eval_QUANTITY_number": 30, "eval_QUANTITY_precision": 0.6944444444444444, "eval_QUANTITY_recall": 0.8333333333333334, "eval_TIME_f1": 0.7692307692307692, "eval_TIME_number": 29, "eval_TIME_precision": 0.6944444444444444, "eval_TIME_recall": 0.8620689655172413, "eval_loss": 0.20847661793231964, "eval_overall_accuracy": 0.9572343149807938, "eval_overall_f1": 0.8338028169014083, "eval_overall_precision": 0.7956989247311828, "eval_overall_recall": 0.8757396449704142, "eval_runtime": 0.3331, "eval_samples_per_second": 561.331, "eval_steps_per_second": 9.005, "step": 9116 }, { "epoch": 87.0, "grad_norm": 0.8602144718170166, "learning_rate": 6.5000000000000004e-06, "loss": 0.0278, "step": 9222 }, { "epoch": 87.0, "eval_LOCATION_f1": 0.8767123287671235, "eval_LOCATION_number": 69, "eval_LOCATION_precision": 0.8311688311688312, "eval_LOCATION_recall": 0.927536231884058, "eval_ORGANIZATION_f1": 0.6984126984126984, "eval_ORGANIZATION_number": 58, "eval_ORGANIZATION_precision": 0.6470588235294118, "eval_ORGANIZATION_recall": 0.7586206896551724, "eval_PERSON_f1": 0.8945686900958467, "eval_PERSON_number": 152, "eval_PERSON_precision": 0.8695652173913043, "eval_PERSON_recall": 0.9210526315789473, "eval_QUANTITY_f1": 0.7384615384615385, "eval_QUANTITY_number": 30, "eval_QUANTITY_precision": 0.6857142857142857, "eval_QUANTITY_recall": 0.8, "eval_TIME_f1": 0.7575757575757576, "eval_TIME_number": 29, "eval_TIME_precision": 0.6756756756756757, "eval_TIME_recall": 0.8620689655172413, "eval_loss": 0.2143712192773819, "eval_overall_accuracy": 0.9582586427656851, "eval_overall_f1": 0.829608938547486, "eval_overall_precision": 0.7857142857142857, "eval_overall_recall": 0.878698224852071, "eval_runtime": 0.3343, "eval_samples_per_second": 559.33, "eval_steps_per_second": 8.973, "step": 9222 }, { "epoch": 88.0, "grad_norm": 3.9535341262817383, "learning_rate": 6e-06, "loss": 0.0266, "step": 9328 }, { "epoch": 88.0, "eval_LOCATION_f1": 0.8767123287671235, "eval_LOCATION_number": 69, "eval_LOCATION_precision": 0.8311688311688312, "eval_LOCATION_recall": 0.927536231884058, "eval_ORGANIZATION_f1": 0.672, "eval_ORGANIZATION_number": 58, "eval_ORGANIZATION_precision": 0.6268656716417911, "eval_ORGANIZATION_recall": 0.7241379310344828, "eval_PERSON_f1": 0.8945686900958467, "eval_PERSON_number": 152, "eval_PERSON_precision": 0.8695652173913043, "eval_PERSON_recall": 0.9210526315789473, "eval_QUANTITY_f1": 0.7384615384615385, "eval_QUANTITY_number": 30, "eval_QUANTITY_precision": 0.6857142857142857, "eval_QUANTITY_recall": 0.8, "eval_TIME_f1": 0.8253968253968255, "eval_TIME_number": 29, "eval_TIME_precision": 0.7647058823529411, "eval_TIME_recall": 0.896551724137931, "eval_loss": 0.21172450482845306, "eval_overall_accuracy": 0.9585147247119078, "eval_overall_f1": 0.8314606741573034, "eval_overall_precision": 0.7914438502673797, "eval_overall_recall": 0.8757396449704142, "eval_runtime": 0.3355, "eval_samples_per_second": 557.315, "eval_steps_per_second": 8.941, "step": 9328 }, { "epoch": 89.0, "grad_norm": 0.6084784865379333, "learning_rate": 5.500000000000001e-06, "loss": 0.0277, "step": 9434 }, { "epoch": 89.0, "eval_LOCATION_f1": 0.882758620689655, "eval_LOCATION_number": 69, "eval_LOCATION_precision": 0.8421052631578947, "eval_LOCATION_recall": 0.927536231884058, "eval_ORGANIZATION_f1": 0.6774193548387097, "eval_ORGANIZATION_number": 58, "eval_ORGANIZATION_precision": 0.6363636363636364, "eval_ORGANIZATION_recall": 0.7241379310344828, "eval_PERSON_f1": 0.89171974522293, "eval_PERSON_number": 152, "eval_PERSON_precision": 0.8641975308641975, "eval_PERSON_recall": 0.9210526315789473, "eval_QUANTITY_f1": 0.7761194029850748, "eval_QUANTITY_number": 30, "eval_QUANTITY_precision": 0.7027027027027027, "eval_QUANTITY_recall": 0.8666666666666667, "eval_TIME_f1": 0.7999999999999999, "eval_TIME_number": 29, "eval_TIME_precision": 0.7222222222222222, "eval_TIME_recall": 0.896551724137931, "eval_loss": 0.21649378538131714, "eval_overall_accuracy": 0.9574903969270167, "eval_overall_f1": 0.8335664335664336, "eval_overall_precision": 0.7904509283819628, "eval_overall_recall": 0.8816568047337278, "eval_runtime": 0.3329, "eval_samples_per_second": 561.77, "eval_steps_per_second": 9.012, "step": 9434 }, { "epoch": 90.0, "grad_norm": 3.59494686126709, "learning_rate": 5e-06, "loss": 0.0263, "step": 9540 }, { "epoch": 90.0, "eval_LOCATION_f1": 0.8767123287671235, "eval_LOCATION_number": 69, "eval_LOCATION_precision": 0.8311688311688312, "eval_LOCATION_recall": 0.927536231884058, "eval_ORGANIZATION_f1": 0.6935483870967741, "eval_ORGANIZATION_number": 58, "eval_ORGANIZATION_precision": 0.6515151515151515, "eval_ORGANIZATION_recall": 0.7413793103448276, "eval_PERSON_f1": 0.888888888888889, "eval_PERSON_number": 152, "eval_PERSON_precision": 0.8588957055214724, "eval_PERSON_recall": 0.9210526315789473, "eval_QUANTITY_f1": 0.746268656716418, "eval_QUANTITY_number": 30, "eval_QUANTITY_precision": 0.6756756756756757, "eval_QUANTITY_recall": 0.8333333333333334, "eval_TIME_f1": 0.7692307692307692, "eval_TIME_number": 29, "eval_TIME_precision": 0.6944444444444444, "eval_TIME_recall": 0.8620689655172413, "eval_loss": 0.21574969589710236, "eval_overall_accuracy": 0.9572343149807938, "eval_overall_f1": 0.8284518828451882, "eval_overall_precision": 0.783641160949868, "eval_overall_recall": 0.878698224852071, "eval_runtime": 0.336, "eval_samples_per_second": 556.623, "eval_steps_per_second": 8.93, "step": 9540 }, { "epoch": 91.0, "grad_norm": 0.6815735697746277, "learning_rate": 4.5e-06, "loss": 0.0249, "step": 9646 }, { "epoch": 91.0, "eval_LOCATION_f1": 0.8767123287671235, "eval_LOCATION_number": 69, "eval_LOCATION_precision": 0.8311688311688312, "eval_LOCATION_recall": 0.927536231884058, "eval_ORGANIZATION_f1": 0.6666666666666666, "eval_ORGANIZATION_number": 58, "eval_ORGANIZATION_precision": 0.6307692307692307, "eval_ORGANIZATION_recall": 0.7068965517241379, "eval_PERSON_f1": 0.89171974522293, "eval_PERSON_number": 152, "eval_PERSON_precision": 0.8641975308641975, "eval_PERSON_recall": 0.9210526315789473, "eval_QUANTITY_f1": 0.8, "eval_QUANTITY_number": 30, "eval_QUANTITY_precision": 0.7428571428571429, "eval_QUANTITY_recall": 0.8666666666666667, "eval_TIME_f1": 0.8125, "eval_TIME_number": 29, "eval_TIME_precision": 0.7428571428571429, "eval_TIME_recall": 0.896551724137931, "eval_loss": 0.21547271311283112, "eval_overall_accuracy": 0.9574903969270167, "eval_overall_f1": 0.8342696629213484, "eval_overall_precision": 0.7941176470588235, "eval_overall_recall": 0.878698224852071, "eval_runtime": 0.3337, "eval_samples_per_second": 560.443, "eval_steps_per_second": 8.991, "step": 9646 }, { "epoch": 92.0, "grad_norm": 0.9203242063522339, "learning_rate": 4.000000000000001e-06, "loss": 0.026, "step": 9752 }, { "epoch": 92.0, "eval_LOCATION_f1": 0.8689655172413793, "eval_LOCATION_number": 69, "eval_LOCATION_precision": 0.8289473684210527, "eval_LOCATION_recall": 0.9130434782608695, "eval_ORGANIZATION_f1": 0.688, "eval_ORGANIZATION_number": 58, "eval_ORGANIZATION_precision": 0.6417910447761194, "eval_ORGANIZATION_recall": 0.7413793103448276, "eval_PERSON_f1": 0.8945686900958467, "eval_PERSON_number": 152, "eval_PERSON_precision": 0.8695652173913043, "eval_PERSON_recall": 0.9210526315789473, "eval_QUANTITY_f1": 0.7575757575757577, "eval_QUANTITY_number": 30, "eval_QUANTITY_precision": 0.6944444444444444, "eval_QUANTITY_recall": 0.8333333333333334, "eval_TIME_f1": 0.8253968253968255, "eval_TIME_number": 29, "eval_TIME_precision": 0.7647058823529411, "eval_TIME_recall": 0.896551724137931, "eval_loss": 0.21566654741764069, "eval_overall_accuracy": 0.9580025608194622, "eval_overall_f1": 0.8342696629213484, "eval_overall_precision": 0.7941176470588235, "eval_overall_recall": 0.878698224852071, "eval_runtime": 0.3342, "eval_samples_per_second": 559.523, "eval_steps_per_second": 8.976, "step": 9752 }, { "epoch": 93.0, "grad_norm": 1.3422565460205078, "learning_rate": 3.5000000000000004e-06, "loss": 0.0246, "step": 9858 }, { "epoch": 93.0, "eval_LOCATION_f1": 0.863013698630137, "eval_LOCATION_number": 69, "eval_LOCATION_precision": 0.8181818181818182, "eval_LOCATION_recall": 0.9130434782608695, "eval_ORGANIZATION_f1": 0.6935483870967741, "eval_ORGANIZATION_number": 58, "eval_ORGANIZATION_precision": 0.6515151515151515, "eval_ORGANIZATION_recall": 0.7413793103448276, "eval_PERSON_f1": 0.8945686900958467, "eval_PERSON_number": 152, "eval_PERSON_precision": 0.8695652173913043, "eval_PERSON_recall": 0.9210526315789473, "eval_QUANTITY_f1": 0.746268656716418, "eval_QUANTITY_number": 30, "eval_QUANTITY_precision": 0.6756756756756757, "eval_QUANTITY_recall": 0.8333333333333334, "eval_TIME_f1": 0.8125, "eval_TIME_number": 29, "eval_TIME_precision": 0.7428571428571429, "eval_TIME_recall": 0.896551724137931, "eval_loss": 0.21777355670928955, "eval_overall_accuracy": 0.9574903969270167, "eval_overall_f1": 0.8319327731092437, "eval_overall_precision": 0.7898936170212766, "eval_overall_recall": 0.878698224852071, "eval_runtime": 0.3325, "eval_samples_per_second": 562.463, "eval_steps_per_second": 9.023, "step": 9858 }, { "epoch": 94.0, "grad_norm": 0.5304462909698486, "learning_rate": 3e-06, "loss": 0.0228, "step": 9964 }, { "epoch": 94.0, "eval_LOCATION_f1": 0.863013698630137, "eval_LOCATION_number": 69, "eval_LOCATION_precision": 0.8181818181818182, "eval_LOCATION_recall": 0.9130434782608695, "eval_ORGANIZATION_f1": 0.6666666666666667, "eval_ORGANIZATION_number": 58, "eval_ORGANIZATION_precision": 0.6056338028169014, "eval_ORGANIZATION_recall": 0.7413793103448276, "eval_PERSON_f1": 0.8945686900958467, "eval_PERSON_number": 152, "eval_PERSON_precision": 0.8695652173913043, "eval_PERSON_recall": 0.9210526315789473, "eval_QUANTITY_f1": 0.7878787878787877, "eval_QUANTITY_number": 30, "eval_QUANTITY_precision": 0.7222222222222222, "eval_QUANTITY_recall": 0.8666666666666667, "eval_TIME_f1": 0.8125, "eval_TIME_number": 29, "eval_TIME_precision": 0.7428571428571429, "eval_TIME_recall": 0.896551724137931, "eval_loss": 0.21389849483966827, "eval_overall_accuracy": 0.9577464788732394, "eval_overall_f1": 0.83008356545961, "eval_overall_precision": 0.7842105263157895, "eval_overall_recall": 0.8816568047337278, "eval_runtime": 0.3334, "eval_samples_per_second": 560.952, "eval_steps_per_second": 8.999, "step": 9964 }, { "epoch": 95.0, "grad_norm": 0.9430941343307495, "learning_rate": 2.5e-06, "loss": 0.0239, "step": 10070 }, { "epoch": 95.0, "eval_LOCATION_f1": 0.863013698630137, "eval_LOCATION_number": 69, "eval_LOCATION_precision": 0.8181818181818182, "eval_LOCATION_recall": 0.9130434782608695, "eval_ORGANIZATION_f1": 0.688, "eval_ORGANIZATION_number": 58, "eval_ORGANIZATION_precision": 0.6417910447761194, "eval_ORGANIZATION_recall": 0.7413793103448276, "eval_PERSON_f1": 0.8945686900958467, "eval_PERSON_number": 152, "eval_PERSON_precision": 0.8695652173913043, "eval_PERSON_recall": 0.9210526315789473, "eval_QUANTITY_f1": 0.7878787878787877, "eval_QUANTITY_number": 30, "eval_QUANTITY_precision": 0.7222222222222222, "eval_QUANTITY_recall": 0.8666666666666667, "eval_TIME_f1": 0.8253968253968255, "eval_TIME_number": 29, "eval_TIME_precision": 0.7647058823529411, "eval_TIME_recall": 0.896551724137931, "eval_loss": 0.2171957641839981, "eval_overall_accuracy": 0.9580025608194622, "eval_overall_f1": 0.8359046283309958, "eval_overall_precision": 0.7946666666666666, "eval_overall_recall": 0.8816568047337278, "eval_runtime": 0.3342, "eval_samples_per_second": 559.517, "eval_steps_per_second": 8.976, "step": 10070 }, { "epoch": 96.0, "grad_norm": 0.5671630501747131, "learning_rate": 2.0000000000000003e-06, "loss": 0.0246, "step": 10176 }, { "epoch": 96.0, "eval_LOCATION_f1": 0.882758620689655, "eval_LOCATION_number": 69, "eval_LOCATION_precision": 0.8421052631578947, "eval_LOCATION_recall": 0.927536231884058, "eval_ORGANIZATION_f1": 0.6771653543307088, "eval_ORGANIZATION_number": 58, "eval_ORGANIZATION_precision": 0.6231884057971014, "eval_ORGANIZATION_recall": 0.7413793103448276, "eval_PERSON_f1": 0.8945686900958467, "eval_PERSON_number": 152, "eval_PERSON_precision": 0.8695652173913043, "eval_PERSON_recall": 0.9210526315789473, "eval_QUANTITY_f1": 0.7761194029850748, "eval_QUANTITY_number": 30, "eval_QUANTITY_precision": 0.7027027027027027, "eval_QUANTITY_recall": 0.8666666666666667, "eval_TIME_f1": 0.8125, "eval_TIME_number": 29, "eval_TIME_precision": 0.7428571428571429, "eval_TIME_recall": 0.896551724137931, "eval_loss": 0.21604588627815247, "eval_overall_accuracy": 0.9585147247119078, "eval_overall_f1": 0.835195530726257, "eval_overall_precision": 0.791005291005291, "eval_overall_recall": 0.8846153846153846, "eval_runtime": 0.3336, "eval_samples_per_second": 560.484, "eval_steps_per_second": 8.992, "step": 10176 }, { "epoch": 97.0, "grad_norm": 2.1864192485809326, "learning_rate": 1.5e-06, "loss": 0.0263, "step": 10282 }, { "epoch": 97.0, "eval_LOCATION_f1": 0.888888888888889, "eval_LOCATION_number": 69, "eval_LOCATION_precision": 0.8533333333333334, "eval_LOCATION_recall": 0.927536231884058, "eval_ORGANIZATION_f1": 0.6829268292682927, "eval_ORGANIZATION_number": 58, "eval_ORGANIZATION_precision": 0.6461538461538462, "eval_ORGANIZATION_recall": 0.7241379310344828, "eval_PERSON_f1": 0.8945686900958467, "eval_PERSON_number": 152, "eval_PERSON_precision": 0.8695652173913043, "eval_PERSON_recall": 0.9210526315789473, "eval_QUANTITY_f1": 0.7692307692307692, "eval_QUANTITY_number": 30, "eval_QUANTITY_precision": 0.7142857142857143, "eval_QUANTITY_recall": 0.8333333333333334, "eval_TIME_f1": 0.8253968253968255, "eval_TIME_number": 29, "eval_TIME_precision": 0.7647058823529411, "eval_TIME_recall": 0.896551724137931, "eval_loss": 0.2144096940755844, "eval_overall_accuracy": 0.9585147247119078, "eval_overall_f1": 0.8389830508474576, "eval_overall_precision": 0.8027027027027027, "eval_overall_recall": 0.878698224852071, "eval_runtime": 0.3344, "eval_samples_per_second": 559.208, "eval_steps_per_second": 8.971, "step": 10282 }, { "epoch": 98.0, "grad_norm": 0.35259944200515747, "learning_rate": 1.0000000000000002e-06, "loss": 0.0243, "step": 10388 }, { "epoch": 98.0, "eval_LOCATION_f1": 0.8749999999999999, "eval_LOCATION_number": 69, "eval_LOCATION_precision": 0.84, "eval_LOCATION_recall": 0.9130434782608695, "eval_ORGANIZATION_f1": 0.688, "eval_ORGANIZATION_number": 58, "eval_ORGANIZATION_precision": 0.6417910447761194, "eval_ORGANIZATION_recall": 0.7413793103448276, "eval_PERSON_f1": 0.8945686900958467, "eval_PERSON_number": 152, "eval_PERSON_precision": 0.8695652173913043, "eval_PERSON_recall": 0.9210526315789473, "eval_QUANTITY_f1": 0.7878787878787877, "eval_QUANTITY_number": 30, "eval_QUANTITY_precision": 0.7222222222222222, "eval_QUANTITY_recall": 0.8666666666666667, "eval_TIME_f1": 0.8125, "eval_TIME_number": 29, "eval_TIME_precision": 0.7428571428571429, "eval_TIME_recall": 0.896551724137931, "eval_loss": 0.21475861966609955, "eval_overall_accuracy": 0.9582586427656851, "eval_overall_f1": 0.8370786516853933, "eval_overall_precision": 0.7967914438502673, "eval_overall_recall": 0.8816568047337278, "eval_runtime": 0.3334, "eval_samples_per_second": 560.934, "eval_steps_per_second": 8.999, "step": 10388 }, { "epoch": 99.0, "grad_norm": 1.3611903190612793, "learning_rate": 5.000000000000001e-07, "loss": 0.0232, "step": 10494 }, { "epoch": 99.0, "eval_LOCATION_f1": 0.8749999999999999, "eval_LOCATION_number": 69, "eval_LOCATION_precision": 0.84, "eval_LOCATION_recall": 0.9130434782608695, "eval_ORGANIZATION_f1": 0.6935483870967741, "eval_ORGANIZATION_number": 58, "eval_ORGANIZATION_precision": 0.6515151515151515, "eval_ORGANIZATION_recall": 0.7413793103448276, "eval_PERSON_f1": 0.8945686900958467, "eval_PERSON_number": 152, "eval_PERSON_precision": 0.8695652173913043, "eval_PERSON_recall": 0.9210526315789473, "eval_QUANTITY_f1": 0.7878787878787877, "eval_QUANTITY_number": 30, "eval_QUANTITY_precision": 0.7222222222222222, "eval_QUANTITY_recall": 0.8666666666666667, "eval_TIME_f1": 0.8125, "eval_TIME_number": 29, "eval_TIME_precision": 0.7428571428571429, "eval_TIME_recall": 0.896551724137931, "eval_loss": 0.2144315391778946, "eval_overall_accuracy": 0.9580025608194622, "eval_overall_f1": 0.8382559774964837, "eval_overall_precision": 0.7989276139410187, "eval_overall_recall": 0.8816568047337278, "eval_runtime": 0.334, "eval_samples_per_second": 559.885, "eval_steps_per_second": 8.982, "step": 10494 }, { "epoch": 100.0, "grad_norm": 0.2549450397491455, "learning_rate": 0.0, "loss": 0.0224, "step": 10600 }, { "epoch": 100.0, "eval_LOCATION_f1": 0.8749999999999999, "eval_LOCATION_number": 69, "eval_LOCATION_precision": 0.84, "eval_LOCATION_recall": 0.9130434782608695, "eval_ORGANIZATION_f1": 0.6935483870967741, "eval_ORGANIZATION_number": 58, "eval_ORGANIZATION_precision": 0.6515151515151515, "eval_ORGANIZATION_recall": 0.7413793103448276, "eval_PERSON_f1": 0.8945686900958467, "eval_PERSON_number": 152, "eval_PERSON_precision": 0.8695652173913043, "eval_PERSON_recall": 0.9210526315789473, "eval_QUANTITY_f1": 0.7878787878787877, "eval_QUANTITY_number": 30, "eval_QUANTITY_precision": 0.7222222222222222, "eval_QUANTITY_recall": 0.8666666666666667, "eval_TIME_f1": 0.8125, "eval_TIME_number": 29, "eval_TIME_precision": 0.7428571428571429, "eval_TIME_recall": 0.896551724137931, "eval_loss": 0.21471820771694183, "eval_overall_accuracy": 0.9580025608194622, "eval_overall_f1": 0.8382559774964837, "eval_overall_precision": 0.7989276139410187, "eval_overall_recall": 0.8816568047337278, "eval_runtime": 0.336, "eval_samples_per_second": 556.48, "eval_steps_per_second": 8.927, "step": 10600 }, { "epoch": 100.0, "step": 10600, "total_flos": 5008141811675874.0, "train_loss": 0.0706503679617396, "train_runtime": 608.9849, "train_samples_per_second": 277.018, "train_steps_per_second": 17.406 } ], "logging_steps": 500, "max_steps": 10600, "num_input_tokens_seen": 0, "num_train_epochs": 100, "save_steps": 500, "total_flos": 5008141811675874.0, "train_batch_size": 16, "trial_name": null, "trial_params": null }