{ "best_metric": null, "best_model_checkpoint": null, "epoch": 100.0, "eval_steps": 500, "global_step": 10600, "is_hyper_param_search": false, "is_local_process_zero": true, "is_world_process_zero": true, "log_history": [ { "epoch": 1.0, "grad_norm": 2.502664804458618, "learning_rate": 4.9500000000000004e-05, "loss": 0.9512, "step": 106 }, { "epoch": 1.0, "eval_LOCATION_f1": 0.0, "eval_LOCATION_number": 71, "eval_LOCATION_precision": 0.0, "eval_LOCATION_recall": 0.0, "eval_ORGANIZATION_f1": 0.0, "eval_ORGANIZATION_number": 65, "eval_ORGANIZATION_precision": 0.0, "eval_ORGANIZATION_recall": 0.0, "eval_PERSON_f1": 0.013071895424836602, "eval_PERSON_number": 150, "eval_PERSON_precision": 0.3333333333333333, "eval_PERSON_recall": 0.006666666666666667, "eval_QUANTITY_f1": 0.0, "eval_QUANTITY_number": 33, "eval_QUANTITY_precision": 0.0, "eval_QUANTITY_recall": 0.0, "eval_TIME_f1": 0.0, "eval_TIME_number": 28, "eval_TIME_precision": 0.0, "eval_TIME_recall": 0.0, "eval_loss": 0.6040259599685669, "eval_overall_accuracy": 0.8411736178467507, "eval_overall_f1": 0.005714285714285714, "eval_overall_precision": 0.3333333333333333, "eval_overall_recall": 0.002881844380403458, "eval_runtime": 0.4042, "eval_samples_per_second": 462.684, "eval_steps_per_second": 7.423, "step": 106 }, { "epoch": 2.0, "grad_norm": 1.1181972026824951, "learning_rate": 4.9e-05, "loss": 0.5021, "step": 212 }, { "epoch": 2.0, "eval_LOCATION_f1": 0.467741935483871, "eval_LOCATION_number": 71, "eval_LOCATION_precision": 0.5471698113207547, "eval_LOCATION_recall": 0.4084507042253521, "eval_ORGANIZATION_f1": 0.203125, "eval_ORGANIZATION_number": 65, "eval_ORGANIZATION_precision": 0.20634920634920634, "eval_ORGANIZATION_recall": 0.2, "eval_PERSON_f1": 0.6997084548104956, "eval_PERSON_number": 150, "eval_PERSON_precision": 0.6217616580310881, "eval_PERSON_recall": 0.8, "eval_QUANTITY_f1": 0.1904761904761905, "eval_QUANTITY_number": 33, "eval_QUANTITY_precision": 0.2, "eval_QUANTITY_recall": 0.18181818181818182, "eval_TIME_f1": 0.49180327868852464, "eval_TIME_number": 28, "eval_TIME_precision": 0.45454545454545453, "eval_TIME_recall": 0.5357142857142857, "eval_loss": 0.3378148674964905, "eval_overall_accuracy": 0.9076139670223085, "eval_overall_f1": 0.5090403337969402, "eval_overall_precision": 0.49193548387096775, "eval_overall_recall": 0.5273775216138329, "eval_runtime": 0.4075, "eval_samples_per_second": 458.866, "eval_steps_per_second": 7.361, "step": 212 }, { "epoch": 3.0, "grad_norm": 1.0774222612380981, "learning_rate": 4.85e-05, "loss": 0.2912, "step": 318 }, { "epoch": 3.0, "eval_LOCATION_f1": 0.6289308176100629, "eval_LOCATION_number": 71, "eval_LOCATION_precision": 0.5681818181818182, "eval_LOCATION_recall": 0.704225352112676, "eval_ORGANIZATION_f1": 0.5970149253731344, "eval_ORGANIZATION_number": 65, "eval_ORGANIZATION_precision": 0.5797101449275363, "eval_ORGANIZATION_recall": 0.6153846153846154, "eval_PERSON_f1": 0.8291139240506329, "eval_PERSON_number": 150, "eval_PERSON_precision": 0.7891566265060241, "eval_PERSON_recall": 0.8733333333333333, "eval_QUANTITY_f1": 0.5405405405405406, "eval_QUANTITY_number": 33, "eval_QUANTITY_precision": 0.4878048780487805, "eval_QUANTITY_recall": 0.6060606060606061, "eval_TIME_f1": 0.830188679245283, "eval_TIME_number": 28, "eval_TIME_precision": 0.88, "eval_TIME_recall": 0.7857142857142857, "eval_loss": 0.18643514811992645, "eval_overall_accuracy": 0.9376818622696411, "eval_overall_f1": 0.7146739130434783, "eval_overall_precision": 0.6760925449871465, "eval_overall_recall": 0.7579250720461095, "eval_runtime": 0.4093, "eval_samples_per_second": 456.848, "eval_steps_per_second": 7.329, "step": 318 }, { "epoch": 4.0, "grad_norm": 1.0147018432617188, "learning_rate": 4.8e-05, "loss": 0.1943, "step": 424 }, { "epoch": 4.0, "eval_LOCATION_f1": 0.7142857142857142, "eval_LOCATION_number": 71, "eval_LOCATION_precision": 0.6185567010309279, "eval_LOCATION_recall": 0.8450704225352113, "eval_ORGANIZATION_f1": 0.6790123456790124, "eval_ORGANIZATION_number": 65, "eval_ORGANIZATION_precision": 0.5670103092783505, "eval_ORGANIZATION_recall": 0.8461538461538461, "eval_PERSON_f1": 0.85625, "eval_PERSON_number": 150, "eval_PERSON_precision": 0.8058823529411765, "eval_PERSON_recall": 0.9133333333333333, "eval_QUANTITY_f1": 0.6829268292682927, "eval_QUANTITY_number": 33, "eval_QUANTITY_precision": 0.5714285714285714, "eval_QUANTITY_recall": 0.8484848484848485, "eval_TIME_f1": 0.8571428571428571, "eval_TIME_number": 28, "eval_TIME_precision": 0.8571428571428571, "eval_TIME_recall": 0.8571428571428571, "eval_loss": 0.1579989790916443, "eval_overall_accuracy": 0.9478661493695442, "eval_overall_f1": 0.7715736040609138, "eval_overall_precision": 0.6893424036281179, "eval_overall_recall": 0.8760806916426513, "eval_runtime": 0.4082, "eval_samples_per_second": 458.117, "eval_steps_per_second": 7.349, "step": 424 }, { "epoch": 5.0, "grad_norm": 1.6936546564102173, "learning_rate": 4.75e-05, "loss": 0.1653, "step": 530 }, { "epoch": 5.0, "eval_LOCATION_f1": 0.7228915662650601, "eval_LOCATION_number": 71, "eval_LOCATION_precision": 0.631578947368421, "eval_LOCATION_recall": 0.8450704225352113, "eval_ORGANIZATION_f1": 0.6712328767123288, "eval_ORGANIZATION_number": 65, "eval_ORGANIZATION_precision": 0.6049382716049383, "eval_ORGANIZATION_recall": 0.7538461538461538, "eval_PERSON_f1": 0.8626198083067093, "eval_PERSON_number": 150, "eval_PERSON_precision": 0.8282208588957055, "eval_PERSON_recall": 0.9, "eval_QUANTITY_f1": 0.8, "eval_QUANTITY_number": 33, "eval_QUANTITY_precision": 0.7142857142857143, "eval_QUANTITY_recall": 0.9090909090909091, "eval_TIME_f1": 0.7999999999999999, "eval_TIME_number": 28, "eval_TIME_precision": 0.75, "eval_TIME_recall": 0.8571428571428571, "eval_loss": 0.13640257716178894, "eval_overall_accuracy": 0.9524733268671193, "eval_overall_f1": 0.7842105263157895, "eval_overall_precision": 0.7215496368038741, "eval_overall_recall": 0.8587896253602305, "eval_runtime": 0.4066, "eval_samples_per_second": 459.951, "eval_steps_per_second": 7.379, "step": 530 }, { "epoch": 6.0, "grad_norm": 1.5403629541397095, "learning_rate": 4.7e-05, "loss": 0.152, "step": 636 }, { "epoch": 6.0, "eval_LOCATION_f1": 0.7272727272727273, "eval_LOCATION_number": 71, "eval_LOCATION_precision": 0.6382978723404256, "eval_LOCATION_recall": 0.8450704225352113, "eval_ORGANIZATION_f1": 0.6666666666666667, "eval_ORGANIZATION_number": 65, "eval_ORGANIZATION_precision": 0.5567010309278351, "eval_ORGANIZATION_recall": 0.8307692307692308, "eval_PERSON_f1": 0.8553846153846154, "eval_PERSON_number": 150, "eval_PERSON_precision": 0.7942857142857143, "eval_PERSON_recall": 0.9266666666666666, "eval_QUANTITY_f1": 0.7088607594936709, "eval_QUANTITY_number": 33, "eval_QUANTITY_precision": 0.6086956521739131, "eval_QUANTITY_recall": 0.8484848484848485, "eval_TIME_f1": 0.6969696969696969, "eval_TIME_number": 28, "eval_TIME_precision": 0.6052631578947368, "eval_TIME_recall": 0.8214285714285714, "eval_loss": 0.15786363184452057, "eval_overall_accuracy": 0.944713870029098, "eval_overall_f1": 0.7628607277289837, "eval_overall_precision": 0.6755555555555556, "eval_overall_recall": 0.8760806916426513, "eval_runtime": 0.408, "eval_samples_per_second": 458.337, "eval_steps_per_second": 7.353, "step": 636 }, { "epoch": 7.0, "grad_norm": 2.2046146392822266, "learning_rate": 4.6500000000000005e-05, "loss": 0.1379, "step": 742 }, { "epoch": 7.0, "eval_LOCATION_f1": 0.7439024390243902, "eval_LOCATION_number": 71, "eval_LOCATION_precision": 0.6559139784946236, "eval_LOCATION_recall": 0.8591549295774648, "eval_ORGANIZATION_f1": 0.7012987012987013, "eval_ORGANIZATION_number": 65, "eval_ORGANIZATION_precision": 0.6067415730337079, "eval_ORGANIZATION_recall": 0.8307692307692308, "eval_PERSON_f1": 0.8553846153846154, "eval_PERSON_number": 150, "eval_PERSON_precision": 0.7942857142857143, "eval_PERSON_recall": 0.9266666666666666, "eval_QUANTITY_f1": 0.6341463414634148, "eval_QUANTITY_number": 33, "eval_QUANTITY_precision": 0.5306122448979592, "eval_QUANTITY_recall": 0.7878787878787878, "eval_TIME_f1": 0.7076923076923075, "eval_TIME_number": 28, "eval_TIME_precision": 0.6216216216216216, "eval_TIME_recall": 0.8214285714285714, "eval_loss": 0.15319040417671204, "eval_overall_accuracy": 0.9464112512124151, "eval_overall_f1": 0.7670886075949368, "eval_overall_precision": 0.6839729119638827, "eval_overall_recall": 0.8731988472622478, "eval_runtime": 0.4079, "eval_samples_per_second": 458.417, "eval_steps_per_second": 7.354, "step": 742 }, { "epoch": 8.0, "grad_norm": 0.8930031061172485, "learning_rate": 4.600000000000001e-05, "loss": 0.125, "step": 848 }, { "epoch": 8.0, "eval_LOCATION_f1": 0.7425149700598803, "eval_LOCATION_number": 71, "eval_LOCATION_precision": 0.6458333333333334, "eval_LOCATION_recall": 0.8732394366197183, "eval_ORGANIZATION_f1": 0.6962025316455697, "eval_ORGANIZATION_number": 65, "eval_ORGANIZATION_precision": 0.5913978494623656, "eval_ORGANIZATION_recall": 0.8461538461538461, "eval_PERSON_f1": 0.887459807073955, "eval_PERSON_number": 150, "eval_PERSON_precision": 0.8571428571428571, "eval_PERSON_recall": 0.92, "eval_QUANTITY_f1": 0.7605633802816901, "eval_QUANTITY_number": 33, "eval_QUANTITY_precision": 0.7105263157894737, "eval_QUANTITY_recall": 0.8181818181818182, "eval_TIME_f1": 0.7999999999999999, "eval_TIME_number": 28, "eval_TIME_precision": 0.75, "eval_TIME_recall": 0.8571428571428571, "eval_loss": 0.12710979580879211, "eval_overall_accuracy": 0.9561105722599418, "eval_overall_f1": 0.7979139504563234, "eval_overall_precision": 0.7285714285714285, "eval_overall_recall": 0.8818443804034583, "eval_runtime": 0.4046, "eval_samples_per_second": 462.173, "eval_steps_per_second": 7.415, "step": 848 }, { "epoch": 9.0, "grad_norm": 1.0148112773895264, "learning_rate": 4.55e-05, "loss": 0.1161, "step": 954 }, { "epoch": 9.0, "eval_LOCATION_f1": 0.7320261437908497, "eval_LOCATION_number": 71, "eval_LOCATION_precision": 0.6829268292682927, "eval_LOCATION_recall": 0.7887323943661971, "eval_ORGANIZATION_f1": 0.6707317073170732, "eval_ORGANIZATION_number": 65, "eval_ORGANIZATION_precision": 0.5555555555555556, "eval_ORGANIZATION_recall": 0.8461538461538461, "eval_PERSON_f1": 0.8846153846153846, "eval_PERSON_number": 150, "eval_PERSON_precision": 0.8518518518518519, "eval_PERSON_recall": 0.92, "eval_QUANTITY_f1": 0.7777777777777778, "eval_QUANTITY_number": 33, "eval_QUANTITY_precision": 0.717948717948718, "eval_QUANTITY_recall": 0.8484848484848485, "eval_TIME_f1": 0.8275862068965518, "eval_TIME_number": 28, "eval_TIME_precision": 0.8, "eval_TIME_recall": 0.8571428571428571, "eval_loss": 0.12680365145206451, "eval_overall_accuracy": 0.954898157129001, "eval_overall_f1": 0.793148880105402, "eval_overall_precision": 0.7305825242718447, "eval_overall_recall": 0.8674351585014409, "eval_runtime": 0.4068, "eval_samples_per_second": 459.728, "eval_steps_per_second": 7.375, "step": 954 }, { "epoch": 10.0, "grad_norm": 1.5242857933044434, "learning_rate": 4.5e-05, "loss": 0.1124, "step": 1060 }, { "epoch": 10.0, "eval_LOCATION_f1": 0.7532467532467533, "eval_LOCATION_number": 71, "eval_LOCATION_precision": 0.6987951807228916, "eval_LOCATION_recall": 0.8169014084507042, "eval_ORGANIZATION_f1": 0.7272727272727272, "eval_ORGANIZATION_number": 65, "eval_ORGANIZATION_precision": 0.6666666666666666, "eval_ORGANIZATION_recall": 0.8, "eval_PERSON_f1": 0.8860759493670886, "eval_PERSON_number": 150, "eval_PERSON_precision": 0.8433734939759037, "eval_PERSON_recall": 0.9333333333333333, "eval_QUANTITY_f1": 0.7567567567567567, "eval_QUANTITY_number": 33, "eval_QUANTITY_precision": 0.6829268292682927, "eval_QUANTITY_recall": 0.8484848484848485, "eval_TIME_f1": 0.7868852459016394, "eval_TIME_number": 28, "eval_TIME_precision": 0.7272727272727273, "eval_TIME_recall": 0.8571428571428571, "eval_loss": 0.12313192337751389, "eval_overall_accuracy": 0.9592628516003879, "eval_overall_f1": 0.8074866310160428, "eval_overall_precision": 0.7531172069825436, "eval_overall_recall": 0.8703170028818443, "eval_runtime": 0.4064, "eval_samples_per_second": 460.091, "eval_steps_per_second": 7.381, "step": 1060 }, { "epoch": 11.0, "grad_norm": 0.9723674058914185, "learning_rate": 4.4500000000000004e-05, "loss": 0.1059, "step": 1166 }, { "epoch": 11.0, "eval_LOCATION_f1": 0.7532467532467533, "eval_LOCATION_number": 71, "eval_LOCATION_precision": 0.6987951807228916, "eval_LOCATION_recall": 0.8169014084507042, "eval_ORGANIZATION_f1": 0.7142857142857142, "eval_ORGANIZATION_number": 65, "eval_ORGANIZATION_precision": 0.6666666666666666, "eval_ORGANIZATION_recall": 0.7692307692307693, "eval_PERSON_f1": 0.8903225806451613, "eval_PERSON_number": 150, "eval_PERSON_precision": 0.8625, "eval_PERSON_recall": 0.92, "eval_QUANTITY_f1": 0.7397260273972603, "eval_QUANTITY_number": 33, "eval_QUANTITY_precision": 0.675, "eval_QUANTITY_recall": 0.8181818181818182, "eval_TIME_f1": 0.7868852459016394, "eval_TIME_number": 28, "eval_TIME_precision": 0.7272727272727273, "eval_TIME_recall": 0.8571428571428571, "eval_loss": 0.1203012615442276, "eval_overall_accuracy": 0.9592628516003879, "eval_overall_f1": 0.8048780487804879, "eval_overall_precision": 0.7595907928388747, "eval_overall_recall": 0.8559077809798271, "eval_runtime": 0.4057, "eval_samples_per_second": 460.934, "eval_steps_per_second": 7.395, "step": 1166 }, { "epoch": 12.0, "grad_norm": 1.34227454662323, "learning_rate": 4.4000000000000006e-05, "loss": 0.0975, "step": 1272 }, { "epoch": 12.0, "eval_LOCATION_f1": 0.7341772151898733, "eval_LOCATION_number": 71, "eval_LOCATION_precision": 0.6666666666666666, "eval_LOCATION_recall": 0.8169014084507042, "eval_ORGANIZATION_f1": 0.6956521739130436, "eval_ORGANIZATION_number": 65, "eval_ORGANIZATION_precision": 0.5833333333333334, "eval_ORGANIZATION_recall": 0.8615384615384616, "eval_PERSON_f1": 0.86875, "eval_PERSON_number": 150, "eval_PERSON_precision": 0.8176470588235294, "eval_PERSON_recall": 0.9266666666666666, "eval_QUANTITY_f1": 0.7887323943661972, "eval_QUANTITY_number": 33, "eval_QUANTITY_precision": 0.7368421052631579, "eval_QUANTITY_recall": 0.8484848484848485, "eval_TIME_f1": 0.78125, "eval_TIME_number": 28, "eval_TIME_precision": 0.6944444444444444, "eval_TIME_recall": 0.8928571428571429, "eval_loss": 0.1370622217655182, "eval_overall_accuracy": 0.9527158098933075, "eval_overall_f1": 0.7906976744186047, "eval_overall_precision": 0.7166276346604216, "eval_overall_recall": 0.8818443804034583, "eval_runtime": 0.4061, "eval_samples_per_second": 460.527, "eval_steps_per_second": 7.388, "step": 1272 }, { "epoch": 13.0, "grad_norm": 0.8592511415481567, "learning_rate": 4.35e-05, "loss": 0.0915, "step": 1378 }, { "epoch": 13.0, "eval_LOCATION_f1": 0.7712418300653594, "eval_LOCATION_number": 71, "eval_LOCATION_precision": 0.7195121951219512, "eval_LOCATION_recall": 0.8309859154929577, "eval_ORGANIZATION_f1": 0.7199999999999999, "eval_ORGANIZATION_number": 65, "eval_ORGANIZATION_precision": 0.6352941176470588, "eval_ORGANIZATION_recall": 0.8307692307692308, "eval_PERSON_f1": 0.8952380952380952, "eval_PERSON_number": 150, "eval_PERSON_precision": 0.8545454545454545, "eval_PERSON_recall": 0.94, "eval_QUANTITY_f1": 0.7605633802816901, "eval_QUANTITY_number": 33, "eval_QUANTITY_precision": 0.7105263157894737, "eval_QUANTITY_recall": 0.8181818181818182, "eval_TIME_f1": 0.9090909090909091, "eval_TIME_number": 28, "eval_TIME_precision": 0.9259259259259259, "eval_TIME_recall": 0.8928571428571429, "eval_loss": 0.12159363925457001, "eval_overall_accuracy": 0.9609602327837051, "eval_overall_f1": 0.8225806451612904, "eval_overall_precision": 0.7707808564231738, "eval_overall_recall": 0.8818443804034583, "eval_runtime": 0.4059, "eval_samples_per_second": 460.692, "eval_steps_per_second": 7.391, "step": 1378 }, { "epoch": 14.0, "grad_norm": 3.151130437850952, "learning_rate": 4.3e-05, "loss": 0.0913, "step": 1484 }, { "epoch": 14.0, "eval_LOCATION_f1": 0.76, "eval_LOCATION_number": 71, "eval_LOCATION_precision": 0.7215189873417721, "eval_LOCATION_recall": 0.8028169014084507, "eval_ORGANIZATION_f1": 0.7464788732394366, "eval_ORGANIZATION_number": 65, "eval_ORGANIZATION_precision": 0.6883116883116883, "eval_ORGANIZATION_recall": 0.8153846153846154, "eval_PERSON_f1": 0.9032258064516129, "eval_PERSON_number": 150, "eval_PERSON_precision": 0.875, "eval_PERSON_recall": 0.9333333333333333, "eval_QUANTITY_f1": 0.8169014084507042, "eval_QUANTITY_number": 33, "eval_QUANTITY_precision": 0.7631578947368421, "eval_QUANTITY_recall": 0.8787878787878788, "eval_TIME_f1": 0.888888888888889, "eval_TIME_number": 28, "eval_TIME_precision": 0.9230769230769231, "eval_TIME_recall": 0.8571428571428571, "eval_loss": 0.11676321178674698, "eval_overall_accuracy": 0.9629000969932104, "eval_overall_f1": 0.8335625859697388, "eval_overall_precision": 0.7973684210526316, "eval_overall_recall": 0.8731988472622478, "eval_runtime": 0.4073, "eval_samples_per_second": 459.097, "eval_steps_per_second": 7.365, "step": 1484 }, { "epoch": 15.0, "grad_norm": 1.3836969137191772, "learning_rate": 4.25e-05, "loss": 0.0853, "step": 1590 }, { "epoch": 15.0, "eval_LOCATION_f1": 0.794701986754967, "eval_LOCATION_number": 71, "eval_LOCATION_precision": 0.75, "eval_LOCATION_recall": 0.8450704225352113, "eval_ORGANIZATION_f1": 0.738255033557047, "eval_ORGANIZATION_number": 65, "eval_ORGANIZATION_precision": 0.6547619047619048, "eval_ORGANIZATION_recall": 0.8461538461538461, "eval_PERSON_f1": 0.887459807073955, "eval_PERSON_number": 150, "eval_PERSON_precision": 0.8571428571428571, "eval_PERSON_recall": 0.92, "eval_QUANTITY_f1": 0.7837837837837839, "eval_QUANTITY_number": 33, "eval_QUANTITY_precision": 0.7073170731707317, "eval_QUANTITY_recall": 0.8787878787878788, "eval_TIME_f1": 0.8333333333333334, "eval_TIME_number": 28, "eval_TIME_precision": 0.78125, "eval_TIME_recall": 0.8928571428571429, "eval_loss": 0.12170998007059097, "eval_overall_accuracy": 0.9604752667313288, "eval_overall_f1": 0.8241610738255033, "eval_overall_precision": 0.7713567839195979, "eval_overall_recall": 0.8847262247838616, "eval_runtime": 0.412, "eval_samples_per_second": 453.856, "eval_steps_per_second": 7.281, "step": 1590 }, { "epoch": 16.0, "grad_norm": 1.1944974660873413, "learning_rate": 4.2e-05, "loss": 0.0809, "step": 1696 }, { "epoch": 16.0, "eval_LOCATION_f1": 0.782051282051282, "eval_LOCATION_number": 71, "eval_LOCATION_precision": 0.7176470588235294, "eval_LOCATION_recall": 0.8591549295774648, "eval_ORGANIZATION_f1": 0.7516778523489933, "eval_ORGANIZATION_number": 65, "eval_ORGANIZATION_precision": 0.6666666666666666, "eval_ORGANIZATION_recall": 0.8615384615384616, "eval_PERSON_f1": 0.8853503184713376, "eval_PERSON_number": 150, "eval_PERSON_precision": 0.8475609756097561, "eval_PERSON_recall": 0.9266666666666666, "eval_QUANTITY_f1": 0.7200000000000001, "eval_QUANTITY_number": 33, "eval_QUANTITY_precision": 0.6428571428571429, "eval_QUANTITY_recall": 0.8181818181818182, "eval_TIME_f1": 0.8474576271186439, "eval_TIME_number": 28, "eval_TIME_precision": 0.8064516129032258, "eval_TIME_recall": 0.8928571428571429, "eval_loss": 0.13052447140216827, "eval_overall_accuracy": 0.9590203685741998, "eval_overall_f1": 0.8180610889774237, "eval_overall_precision": 0.7586206896551724, "eval_overall_recall": 0.8876080691642652, "eval_runtime": 0.4077, "eval_samples_per_second": 458.719, "eval_steps_per_second": 7.359, "step": 1696 }, { "epoch": 17.0, "grad_norm": 1.1874595880508423, "learning_rate": 4.15e-05, "loss": 0.0773, "step": 1802 }, { "epoch": 17.0, "eval_LOCATION_f1": 0.7692307692307694, "eval_LOCATION_number": 71, "eval_LOCATION_precision": 0.7058823529411765, "eval_LOCATION_recall": 0.8450704225352113, "eval_ORGANIZATION_f1": 0.7058823529411765, "eval_ORGANIZATION_number": 65, "eval_ORGANIZATION_precision": 0.6136363636363636, "eval_ORGANIZATION_recall": 0.8307692307692308, "eval_PERSON_f1": 0.8980891719745222, "eval_PERSON_number": 150, "eval_PERSON_precision": 0.8597560975609756, "eval_PERSON_recall": 0.94, "eval_QUANTITY_f1": 0.7777777777777778, "eval_QUANTITY_number": 33, "eval_QUANTITY_precision": 0.717948717948718, "eval_QUANTITY_recall": 0.8484848484848485, "eval_TIME_f1": 0.819672131147541, "eval_TIME_number": 28, "eval_TIME_precision": 0.7575757575757576, "eval_TIME_recall": 0.8928571428571429, "eval_loss": 0.12760519981384277, "eval_overall_accuracy": 0.9590203685741998, "eval_overall_f1": 0.8148148148148148, "eval_overall_precision": 0.7530562347188264, "eval_overall_recall": 0.8876080691642652, "eval_runtime": 0.4077, "eval_samples_per_second": 458.725, "eval_steps_per_second": 7.359, "step": 1802 }, { "epoch": 18.0, "grad_norm": 1.0034806728363037, "learning_rate": 4.1e-05, "loss": 0.0737, "step": 1908 }, { "epoch": 18.0, "eval_LOCATION_f1": 0.7407407407407407, "eval_LOCATION_number": 71, "eval_LOCATION_precision": 0.6593406593406593, "eval_LOCATION_recall": 0.8450704225352113, "eval_ORGANIZATION_f1": 0.6967741935483871, "eval_ORGANIZATION_number": 65, "eval_ORGANIZATION_precision": 0.6, "eval_ORGANIZATION_recall": 0.8307692307692308, "eval_PERSON_f1": 0.8840125391849529, "eval_PERSON_number": 150, "eval_PERSON_precision": 0.834319526627219, "eval_PERSON_recall": 0.94, "eval_QUANTITY_f1": 0.7105263157894738, "eval_QUANTITY_number": 33, "eval_QUANTITY_precision": 0.627906976744186, "eval_QUANTITY_recall": 0.8181818181818182, "eval_TIME_f1": 0.7796610169491526, "eval_TIME_number": 28, "eval_TIME_precision": 0.7419354838709677, "eval_TIME_recall": 0.8214285714285714, "eval_loss": 0.15325599908828735, "eval_overall_accuracy": 0.9493210475266731, "eval_overall_f1": 0.7911802853437095, "eval_overall_precision": 0.7193396226415094, "eval_overall_recall": 0.8789625360230547, "eval_runtime": 0.4065, "eval_samples_per_second": 460.02, "eval_steps_per_second": 7.38, "step": 1908 }, { "epoch": 19.0, "grad_norm": 1.108689785003662, "learning_rate": 4.05e-05, "loss": 0.0703, "step": 2014 }, { "epoch": 19.0, "eval_LOCATION_f1": 0.778523489932886, "eval_LOCATION_number": 71, "eval_LOCATION_precision": 0.7435897435897436, "eval_LOCATION_recall": 0.8169014084507042, "eval_ORGANIZATION_f1": 0.7534246575342466, "eval_ORGANIZATION_number": 65, "eval_ORGANIZATION_precision": 0.6790123456790124, "eval_ORGANIZATION_recall": 0.8461538461538461, "eval_PERSON_f1": 0.8990228013029316, "eval_PERSON_number": 150, "eval_PERSON_precision": 0.8789808917197452, "eval_PERSON_recall": 0.92, "eval_QUANTITY_f1": 0.7671232876712328, "eval_QUANTITY_number": 33, "eval_QUANTITY_precision": 0.7, "eval_QUANTITY_recall": 0.8484848484848485, "eval_TIME_f1": 0.8571428571428571, "eval_TIME_number": 28, "eval_TIME_precision": 0.8571428571428571, "eval_TIME_recall": 0.8571428571428571, "eval_loss": 0.1193038821220398, "eval_overall_accuracy": 0.9631425800193987, "eval_overall_f1": 0.8290013679890561, "eval_overall_precision": 0.7890625, "eval_overall_recall": 0.8731988472622478, "eval_runtime": 0.408, "eval_samples_per_second": 458.324, "eval_steps_per_second": 7.353, "step": 2014 }, { "epoch": 20.0, "grad_norm": 1.1755281686782837, "learning_rate": 4e-05, "loss": 0.0713, "step": 2120 }, { "epoch": 20.0, "eval_LOCATION_f1": 0.7922077922077921, "eval_LOCATION_number": 71, "eval_LOCATION_precision": 0.7349397590361446, "eval_LOCATION_recall": 0.8591549295774648, "eval_ORGANIZATION_f1": 0.7236842105263158, "eval_ORGANIZATION_number": 65, "eval_ORGANIZATION_precision": 0.632183908045977, "eval_ORGANIZATION_recall": 0.8461538461538461, "eval_PERSON_f1": 0.912621359223301, "eval_PERSON_number": 150, "eval_PERSON_precision": 0.8867924528301887, "eval_PERSON_recall": 0.94, "eval_QUANTITY_f1": 0.7105263157894738, "eval_QUANTITY_number": 33, "eval_QUANTITY_precision": 0.627906976744186, "eval_QUANTITY_recall": 0.8181818181818182, "eval_TIME_f1": 0.9259259259259259, "eval_TIME_number": 28, "eval_TIME_precision": 0.9615384615384616, "eval_TIME_recall": 0.8928571428571429, "eval_loss": 0.12470389902591705, "eval_overall_accuracy": 0.9624151309408342, "eval_overall_f1": 0.829530201342282, "eval_overall_precision": 0.7763819095477387, "eval_overall_recall": 0.8904899135446686, "eval_runtime": 0.4074, "eval_samples_per_second": 458.981, "eval_steps_per_second": 7.363, "step": 2120 }, { "epoch": 21.0, "grad_norm": 1.2563973665237427, "learning_rate": 3.9500000000000005e-05, "loss": 0.0649, "step": 2226 }, { "epoch": 21.0, "eval_LOCATION_f1": 0.7770700636942676, "eval_LOCATION_number": 71, "eval_LOCATION_precision": 0.7093023255813954, "eval_LOCATION_recall": 0.8591549295774648, "eval_ORGANIZATION_f1": 0.7, "eval_ORGANIZATION_number": 65, "eval_ORGANIZATION_precision": 0.5894736842105263, "eval_ORGANIZATION_recall": 0.8615384615384616, "eval_PERSON_f1": 0.896774193548387, "eval_PERSON_number": 150, "eval_PERSON_precision": 0.86875, "eval_PERSON_recall": 0.9266666666666666, "eval_QUANTITY_f1": 0.7466666666666666, "eval_QUANTITY_number": 33, "eval_QUANTITY_precision": 0.6666666666666666, "eval_QUANTITY_recall": 0.8484848484848485, "eval_TIME_f1": 0.8135593220338982, "eval_TIME_number": 28, "eval_TIME_precision": 0.7741935483870968, "eval_TIME_recall": 0.8571428571428571, "eval_loss": 0.13802851736545563, "eval_overall_accuracy": 0.95635305528613, "eval_overall_f1": 0.80946123521682, "eval_overall_precision": 0.7439613526570048, "eval_overall_recall": 0.8876080691642652, "eval_runtime": 0.4074, "eval_samples_per_second": 459.06, "eval_steps_per_second": 7.365, "step": 2226 }, { "epoch": 22.0, "grad_norm": 0.8472046852111816, "learning_rate": 3.9000000000000006e-05, "loss": 0.0645, "step": 2332 }, { "epoch": 22.0, "eval_LOCATION_f1": 0.75, "eval_LOCATION_number": 71, "eval_LOCATION_precision": 0.7037037037037037, "eval_LOCATION_recall": 0.8028169014084507, "eval_ORGANIZATION_f1": 0.738255033557047, "eval_ORGANIZATION_number": 65, "eval_ORGANIZATION_precision": 0.6547619047619048, "eval_ORGANIZATION_recall": 0.8461538461538461, "eval_PERSON_f1": 0.9155844155844156, "eval_PERSON_number": 150, "eval_PERSON_precision": 0.8924050632911392, "eval_PERSON_recall": 0.94, "eval_QUANTITY_f1": 0.7200000000000001, "eval_QUANTITY_number": 33, "eval_QUANTITY_precision": 0.6428571428571429, "eval_QUANTITY_recall": 0.8181818181818182, "eval_TIME_f1": 0.8620689655172413, "eval_TIME_number": 28, "eval_TIME_precision": 0.8333333333333334, "eval_TIME_recall": 0.8928571428571429, "eval_loss": 0.14445021748542786, "eval_overall_accuracy": 0.9587778855480117, "eval_overall_f1": 0.8221024258760108, "eval_overall_precision": 0.7721518987341772, "eval_overall_recall": 0.8789625360230547, "eval_runtime": 0.4092, "eval_samples_per_second": 456.965, "eval_steps_per_second": 7.331, "step": 2332 }, { "epoch": 23.0, "grad_norm": 1.0579193830490112, "learning_rate": 3.85e-05, "loss": 0.0595, "step": 2438 }, { "epoch": 23.0, "eval_LOCATION_f1": 0.759493670886076, "eval_LOCATION_number": 71, "eval_LOCATION_precision": 0.6896551724137931, "eval_LOCATION_recall": 0.8450704225352113, "eval_ORGANIZATION_f1": 0.7058823529411765, "eval_ORGANIZATION_number": 65, "eval_ORGANIZATION_precision": 0.6136363636363636, "eval_ORGANIZATION_recall": 0.8307692307692308, "eval_PERSON_f1": 0.9155844155844156, "eval_PERSON_number": 150, "eval_PERSON_precision": 0.8924050632911392, "eval_PERSON_recall": 0.94, "eval_QUANTITY_f1": 0.8055555555555556, "eval_QUANTITY_number": 33, "eval_QUANTITY_precision": 0.7435897435897436, "eval_QUANTITY_recall": 0.8787878787878788, "eval_TIME_f1": 0.9090909090909091, "eval_TIME_number": 28, "eval_TIME_precision": 0.9259259259259259, "eval_TIME_recall": 0.8928571428571429, "eval_loss": 0.13738445937633514, "eval_overall_accuracy": 0.962172647914646, "eval_overall_f1": 0.8284182305630027, "eval_overall_precision": 0.7744360902255639, "eval_overall_recall": 0.8904899135446686, "eval_runtime": 0.4089, "eval_samples_per_second": 457.323, "eval_steps_per_second": 7.337, "step": 2438 }, { "epoch": 24.0, "grad_norm": 1.30304753780365, "learning_rate": 3.8e-05, "loss": 0.0576, "step": 2544 }, { "epoch": 24.0, "eval_LOCATION_f1": 0.7692307692307694, "eval_LOCATION_number": 71, "eval_LOCATION_precision": 0.7058823529411765, "eval_LOCATION_recall": 0.8450704225352113, "eval_ORGANIZATION_f1": 0.7172413793103448, "eval_ORGANIZATION_number": 65, "eval_ORGANIZATION_precision": 0.65, "eval_ORGANIZATION_recall": 0.8, "eval_PERSON_f1": 0.90032154340836, "eval_PERSON_number": 150, "eval_PERSON_precision": 0.8695652173913043, "eval_PERSON_recall": 0.9333333333333333, "eval_QUANTITY_f1": 0.8000000000000002, "eval_QUANTITY_number": 33, "eval_QUANTITY_precision": 0.7567567567567568, "eval_QUANTITY_recall": 0.8484848484848485, "eval_TIME_f1": 0.9090909090909091, "eval_TIME_number": 28, "eval_TIME_precision": 0.9259259259259259, "eval_TIME_recall": 0.8928571428571429, "eval_loss": 0.14021030068397522, "eval_overall_accuracy": 0.9590203685741998, "eval_overall_f1": 0.8276797829036635, "eval_overall_precision": 0.782051282051282, "eval_overall_recall": 0.8789625360230547, "eval_runtime": 0.408, "eval_samples_per_second": 458.303, "eval_steps_per_second": 7.352, "step": 2544 }, { "epoch": 25.0, "grad_norm": 0.7619758248329163, "learning_rate": 3.7500000000000003e-05, "loss": 0.0562, "step": 2650 }, { "epoch": 25.0, "eval_LOCATION_f1": 0.7692307692307694, "eval_LOCATION_number": 71, "eval_LOCATION_precision": 0.7058823529411765, "eval_LOCATION_recall": 0.8450704225352113, "eval_ORGANIZATION_f1": 0.708860759493671, "eval_ORGANIZATION_number": 65, "eval_ORGANIZATION_precision": 0.6021505376344086, "eval_ORGANIZATION_recall": 0.8615384615384616, "eval_PERSON_f1": 0.9032258064516129, "eval_PERSON_number": 150, "eval_PERSON_precision": 0.875, "eval_PERSON_recall": 0.9333333333333333, "eval_QUANTITY_f1": 0.7105263157894738, "eval_QUANTITY_number": 33, "eval_QUANTITY_precision": 0.627906976744186, "eval_QUANTITY_recall": 0.8181818181818182, "eval_TIME_f1": 0.819672131147541, "eval_TIME_number": 28, "eval_TIME_precision": 0.7575757575757576, "eval_TIME_recall": 0.8928571428571429, "eval_loss": 0.15844029188156128, "eval_overall_accuracy": 0.9553831231813773, "eval_overall_f1": 0.80946123521682, "eval_overall_precision": 0.7439613526570048, "eval_overall_recall": 0.8876080691642652, "eval_runtime": 0.4076, "eval_samples_per_second": 458.809, "eval_steps_per_second": 7.361, "step": 2650 }, { "epoch": 26.0, "grad_norm": 0.3145362138748169, "learning_rate": 3.7e-05, "loss": 0.0533, "step": 2756 }, { "epoch": 26.0, "eval_LOCATION_f1": 0.7466666666666666, "eval_LOCATION_number": 71, "eval_LOCATION_precision": 0.7088607594936709, "eval_LOCATION_recall": 0.7887323943661971, "eval_ORGANIZATION_f1": 0.7248322147651007, "eval_ORGANIZATION_number": 65, "eval_ORGANIZATION_precision": 0.6428571428571429, "eval_ORGANIZATION_recall": 0.8307692307692308, "eval_PERSON_f1": 0.888888888888889, "eval_PERSON_number": 150, "eval_PERSON_precision": 0.8484848484848485, "eval_PERSON_recall": 0.9333333333333333, "eval_QUANTITY_f1": 0.6842105263157895, "eval_QUANTITY_number": 33, "eval_QUANTITY_precision": 0.6046511627906976, "eval_QUANTITY_recall": 0.7878787878787878, "eval_TIME_f1": 0.8771929824561403, "eval_TIME_number": 28, "eval_TIME_precision": 0.8620689655172413, "eval_TIME_recall": 0.8928571428571429, "eval_loss": 0.1501431167125702, "eval_overall_accuracy": 0.9539282250242483, "eval_overall_f1": 0.8058902275769746, "eval_overall_precision": 0.7525, "eval_overall_recall": 0.8674351585014409, "eval_runtime": 0.4072, "eval_samples_per_second": 459.248, "eval_steps_per_second": 7.368, "step": 2756 }, { "epoch": 27.0, "grad_norm": 1.4819648265838623, "learning_rate": 3.65e-05, "loss": 0.0529, "step": 2862 }, { "epoch": 27.0, "eval_LOCATION_f1": 0.7770700636942676, "eval_LOCATION_number": 71, "eval_LOCATION_precision": 0.7093023255813954, "eval_LOCATION_recall": 0.8591549295774648, "eval_ORGANIZATION_f1": 0.7320261437908497, "eval_ORGANIZATION_number": 65, "eval_ORGANIZATION_precision": 0.6363636363636364, "eval_ORGANIZATION_recall": 0.8615384615384616, "eval_PERSON_f1": 0.896774193548387, "eval_PERSON_number": 150, "eval_PERSON_precision": 0.86875, "eval_PERSON_recall": 0.9266666666666666, "eval_QUANTITY_f1": 0.7466666666666666, "eval_QUANTITY_number": 33, "eval_QUANTITY_precision": 0.6666666666666666, "eval_QUANTITY_recall": 0.8484848484848485, "eval_TIME_f1": 0.8928571428571429, "eval_TIME_number": 28, "eval_TIME_precision": 0.8928571428571429, "eval_TIME_recall": 0.8928571428571429, "eval_loss": 0.15187156200408936, "eval_overall_accuracy": 0.9575654704170709, "eval_overall_f1": 0.8229027962716378, "eval_overall_precision": 0.7648514851485149, "eval_overall_recall": 0.8904899135446686, "eval_runtime": 0.4068, "eval_samples_per_second": 459.716, "eval_steps_per_second": 7.375, "step": 2862 }, { "epoch": 28.0, "grad_norm": 0.8129953145980835, "learning_rate": 3.6e-05, "loss": 0.0531, "step": 2968 }, { "epoch": 28.0, "eval_LOCATION_f1": 0.802721088435374, "eval_LOCATION_number": 71, "eval_LOCATION_precision": 0.7763157894736842, "eval_LOCATION_recall": 0.8309859154929577, "eval_ORGANIZATION_f1": 0.7702702702702702, "eval_ORGANIZATION_number": 65, "eval_ORGANIZATION_precision": 0.6867469879518072, "eval_ORGANIZATION_recall": 0.8769230769230769, "eval_PERSON_f1": 0.8903225806451613, "eval_PERSON_number": 150, "eval_PERSON_precision": 0.8625, "eval_PERSON_recall": 0.92, "eval_QUANTITY_f1": 0.7605633802816901, "eval_QUANTITY_number": 33, "eval_QUANTITY_precision": 0.7105263157894737, "eval_QUANTITY_recall": 0.8181818181818182, "eval_TIME_f1": 0.9090909090909091, "eval_TIME_number": 28, "eval_TIME_precision": 0.9259259259259259, "eval_TIME_recall": 0.8928571428571429, "eval_loss": 0.13637924194335938, "eval_overall_accuracy": 0.9641125121241513, "eval_overall_f1": 0.8372093023255814, "eval_overall_precision": 0.796875, "eval_overall_recall": 0.8818443804034583, "eval_runtime": 0.406, "eval_samples_per_second": 460.578, "eval_steps_per_second": 7.389, "step": 2968 }, { "epoch": 29.0, "grad_norm": 0.46542084217071533, "learning_rate": 3.55e-05, "loss": 0.0463, "step": 3074 }, { "epoch": 29.0, "eval_LOCATION_f1": 0.7702702702702703, "eval_LOCATION_number": 71, "eval_LOCATION_precision": 0.7402597402597403, "eval_LOCATION_recall": 0.8028169014084507, "eval_ORGANIZATION_f1": 0.75, "eval_ORGANIZATION_number": 65, "eval_ORGANIZATION_precision": 0.6551724137931034, "eval_ORGANIZATION_recall": 0.8769230769230769, "eval_PERSON_f1": 0.9038461538461539, "eval_PERSON_number": 150, "eval_PERSON_precision": 0.8703703703703703, "eval_PERSON_recall": 0.94, "eval_QUANTITY_f1": 0.8405797101449276, "eval_QUANTITY_number": 33, "eval_QUANTITY_precision": 0.8055555555555556, "eval_QUANTITY_recall": 0.8787878787878788, "eval_TIME_f1": 0.8571428571428571, "eval_TIME_number": 28, "eval_TIME_precision": 0.8571428571428571, "eval_TIME_recall": 0.8571428571428571, "eval_loss": 0.13960041105747223, "eval_overall_accuracy": 0.9624151309408342, "eval_overall_f1": 0.835820895522388, "eval_overall_precision": 0.7897435897435897, "eval_overall_recall": 0.8876080691642652, "eval_runtime": 0.4068, "eval_samples_per_second": 459.668, "eval_steps_per_second": 7.374, "step": 3074 }, { "epoch": 30.0, "grad_norm": 0.8071898818016052, "learning_rate": 3.5e-05, "loss": 0.0466, "step": 3180 }, { "epoch": 30.0, "eval_LOCATION_f1": 0.7919463087248323, "eval_LOCATION_number": 71, "eval_LOCATION_precision": 0.7564102564102564, "eval_LOCATION_recall": 0.8309859154929577, "eval_ORGANIZATION_f1": 0.7261146496815286, "eval_ORGANIZATION_number": 65, "eval_ORGANIZATION_precision": 0.6195652173913043, "eval_ORGANIZATION_recall": 0.8769230769230769, "eval_PERSON_f1": 0.90032154340836, "eval_PERSON_number": 150, "eval_PERSON_precision": 0.8695652173913043, "eval_PERSON_recall": 0.9333333333333333, "eval_QUANTITY_f1": 0.7397260273972603, "eval_QUANTITY_number": 33, "eval_QUANTITY_precision": 0.675, "eval_QUANTITY_recall": 0.8181818181818182, "eval_TIME_f1": 0.8771929824561403, "eval_TIME_number": 28, "eval_TIME_precision": 0.8620689655172413, "eval_TIME_recall": 0.8928571428571429, "eval_loss": 0.1534765511751175, "eval_overall_accuracy": 0.9585354025218235, "eval_overall_f1": 0.824631860776439, "eval_overall_precision": 0.77, "eval_overall_recall": 0.8876080691642652, "eval_runtime": 0.4052, "eval_samples_per_second": 461.503, "eval_steps_per_second": 7.404, "step": 3180 }, { "epoch": 31.0, "grad_norm": 0.7920342087745667, "learning_rate": 3.45e-05, "loss": 0.0449, "step": 3286 }, { "epoch": 31.0, "eval_LOCATION_f1": 0.7770700636942676, "eval_LOCATION_number": 71, "eval_LOCATION_precision": 0.7093023255813954, "eval_LOCATION_recall": 0.8591549295774648, "eval_ORGANIZATION_f1": 0.75, "eval_ORGANIZATION_number": 65, "eval_ORGANIZATION_precision": 0.6835443037974683, "eval_ORGANIZATION_recall": 0.8307692307692308, "eval_PERSON_f1": 0.9102564102564102, "eval_PERSON_number": 150, "eval_PERSON_precision": 0.8765432098765432, "eval_PERSON_recall": 0.9466666666666667, "eval_QUANTITY_f1": 0.7567567567567567, "eval_QUANTITY_number": 33, "eval_QUANTITY_precision": 0.6829268292682927, "eval_QUANTITY_recall": 0.8484848484848485, "eval_TIME_f1": 0.8421052631578947, "eval_TIME_number": 28, "eval_TIME_precision": 0.8275862068965517, "eval_TIME_recall": 0.8571428571428571, "eval_loss": 0.16083230078220367, "eval_overall_accuracy": 0.9592628516003879, "eval_overall_f1": 0.8306451612903226, "eval_overall_precision": 0.7783375314861462, "eval_overall_recall": 0.8904899135446686, "eval_runtime": 0.4039, "eval_samples_per_second": 462.994, "eval_steps_per_second": 7.428, "step": 3286 }, { "epoch": 32.0, "grad_norm": 0.9836466908454895, "learning_rate": 3.4000000000000007e-05, "loss": 0.043, "step": 3392 }, { "epoch": 32.0, "eval_LOCATION_f1": 0.751592356687898, "eval_LOCATION_number": 71, "eval_LOCATION_precision": 0.686046511627907, "eval_LOCATION_recall": 0.8309859154929577, "eval_ORGANIZATION_f1": 0.7058823529411765, "eval_ORGANIZATION_number": 65, "eval_ORGANIZATION_precision": 0.6136363636363636, "eval_ORGANIZATION_recall": 0.8307692307692308, "eval_PERSON_f1": 0.9102564102564102, "eval_PERSON_number": 150, "eval_PERSON_precision": 0.8765432098765432, "eval_PERSON_recall": 0.9466666666666667, "eval_QUANTITY_f1": 0.6933333333333334, "eval_QUANTITY_number": 33, "eval_QUANTITY_precision": 0.6190476190476191, "eval_QUANTITY_recall": 0.7878787878787878, "eval_TIME_f1": 0.8474576271186439, "eval_TIME_number": 28, "eval_TIME_precision": 0.8064516129032258, "eval_TIME_recall": 0.8928571428571429, "eval_loss": 0.16350191831588745, "eval_overall_accuracy": 0.9556256062075654, "eval_overall_f1": 0.8095238095238096, "eval_overall_precision": 0.7481662591687042, "eval_overall_recall": 0.8818443804034583, "eval_runtime": 0.4041, "eval_samples_per_second": 462.793, "eval_steps_per_second": 7.424, "step": 3392 }, { "epoch": 33.0, "grad_norm": 0.8012641668319702, "learning_rate": 3.35e-05, "loss": 0.0394, "step": 3498 }, { "epoch": 33.0, "eval_LOCATION_f1": 0.7755102040816326, "eval_LOCATION_number": 71, "eval_LOCATION_precision": 0.75, "eval_LOCATION_recall": 0.8028169014084507, "eval_ORGANIZATION_f1": 0.726027397260274, "eval_ORGANIZATION_number": 65, "eval_ORGANIZATION_precision": 0.654320987654321, "eval_ORGANIZATION_recall": 0.8153846153846154, "eval_PERSON_f1": 0.9220779220779222, "eval_PERSON_number": 150, "eval_PERSON_precision": 0.8987341772151899, "eval_PERSON_recall": 0.9466666666666667, "eval_QUANTITY_f1": 0.8285714285714285, "eval_QUANTITY_number": 33, "eval_QUANTITY_precision": 0.7837837837837838, "eval_QUANTITY_recall": 0.8787878787878788, "eval_TIME_f1": 0.8727272727272727, "eval_TIME_number": 28, "eval_TIME_precision": 0.8888888888888888, "eval_TIME_recall": 0.8571428571428571, "eval_loss": 0.15030378103256226, "eval_overall_accuracy": 0.9641125121241513, "eval_overall_f1": 0.8402203856749312, "eval_overall_precision": 0.8047493403693932, "eval_overall_recall": 0.8789625360230547, "eval_runtime": 0.4047, "eval_samples_per_second": 462.071, "eval_steps_per_second": 7.413, "step": 3498 }, { "epoch": 34.0, "grad_norm": 0.9052590727806091, "learning_rate": 3.3e-05, "loss": 0.0412, "step": 3604 }, { "epoch": 34.0, "eval_LOCATION_f1": 0.7972972972972973, "eval_LOCATION_number": 71, "eval_LOCATION_precision": 0.7662337662337663, "eval_LOCATION_recall": 0.8309859154929577, "eval_ORGANIZATION_f1": 0.7755102040816327, "eval_ORGANIZATION_number": 65, "eval_ORGANIZATION_precision": 0.6951219512195121, "eval_ORGANIZATION_recall": 0.8769230769230769, "eval_PERSON_f1": 0.9220779220779222, "eval_PERSON_number": 150, "eval_PERSON_precision": 0.8987341772151899, "eval_PERSON_recall": 0.9466666666666667, "eval_QUANTITY_f1": 0.7671232876712328, "eval_QUANTITY_number": 33, "eval_QUANTITY_precision": 0.7, "eval_QUANTITY_recall": 0.8484848484848485, "eval_TIME_f1": 0.8727272727272727, "eval_TIME_number": 28, "eval_TIME_precision": 0.8888888888888888, "eval_TIME_recall": 0.8571428571428571, "eval_loss": 0.1466250866651535, "eval_overall_accuracy": 0.9645974781765276, "eval_overall_f1": 0.8481532147742818, "eval_overall_precision": 0.8072916666666666, "eval_overall_recall": 0.8933717579250721, "eval_runtime": 0.4032, "eval_samples_per_second": 463.733, "eval_steps_per_second": 7.44, "step": 3604 }, { "epoch": 35.0, "grad_norm": 0.42126646637916565, "learning_rate": 3.2500000000000004e-05, "loss": 0.0403, "step": 3710 }, { "epoch": 35.0, "eval_LOCATION_f1": 0.7741935483870968, "eval_LOCATION_number": 71, "eval_LOCATION_precision": 0.7142857142857143, "eval_LOCATION_recall": 0.8450704225352113, "eval_ORGANIZATION_f1": 0.7448275862068966, "eval_ORGANIZATION_number": 65, "eval_ORGANIZATION_precision": 0.675, "eval_ORGANIZATION_recall": 0.8307692307692308, "eval_PERSON_f1": 0.9102564102564102, "eval_PERSON_number": 150, "eval_PERSON_precision": 0.8765432098765432, "eval_PERSON_recall": 0.9466666666666667, "eval_QUANTITY_f1": 0.7297297297297297, "eval_QUANTITY_number": 33, "eval_QUANTITY_precision": 0.6585365853658537, "eval_QUANTITY_recall": 0.8181818181818182, "eval_TIME_f1": 0.8474576271186439, "eval_TIME_number": 28, "eval_TIME_precision": 0.8064516129032258, "eval_TIME_recall": 0.8928571428571429, "eval_loss": 0.15250608325004578, "eval_overall_accuracy": 0.9619301648884578, "eval_overall_f1": 0.8268456375838926, "eval_overall_precision": 0.7738693467336684, "eval_overall_recall": 0.8876080691642652, "eval_runtime": 0.4038, "eval_samples_per_second": 463.06, "eval_steps_per_second": 7.429, "step": 3710 }, { "epoch": 36.0, "grad_norm": 1.7094526290893555, "learning_rate": 3.2000000000000005e-05, "loss": 0.0385, "step": 3816 }, { "epoch": 36.0, "eval_LOCATION_f1": 0.7919463087248323, "eval_LOCATION_number": 71, "eval_LOCATION_precision": 0.7564102564102564, "eval_LOCATION_recall": 0.8309859154929577, "eval_ORGANIZATION_f1": 0.7354838709677419, "eval_ORGANIZATION_number": 65, "eval_ORGANIZATION_precision": 0.6333333333333333, "eval_ORGANIZATION_recall": 0.8769230769230769, "eval_PERSON_f1": 0.8958990536277603, "eval_PERSON_number": 150, "eval_PERSON_precision": 0.8502994011976048, "eval_PERSON_recall": 0.9466666666666667, "eval_QUANTITY_f1": 0.7105263157894738, "eval_QUANTITY_number": 33, "eval_QUANTITY_precision": 0.627906976744186, "eval_QUANTITY_recall": 0.8181818181818182, "eval_TIME_f1": 0.8928571428571429, "eval_TIME_number": 28, "eval_TIME_precision": 0.8928571428571429, "eval_TIME_recall": 0.8928571428571429, "eval_loss": 0.1817101240158081, "eval_overall_accuracy": 0.9551406401551892, "eval_overall_f1": 0.8233731739707836, "eval_overall_precision": 0.7635467980295566, "eval_overall_recall": 0.8933717579250721, "eval_runtime": 0.4033, "eval_samples_per_second": 463.63, "eval_steps_per_second": 7.438, "step": 3816 }, { "epoch": 37.0, "grad_norm": 1.976254940032959, "learning_rate": 3.15e-05, "loss": 0.037, "step": 3922 }, { "epoch": 37.0, "eval_LOCATION_f1": 0.7435897435897436, "eval_LOCATION_number": 71, "eval_LOCATION_precision": 0.6823529411764706, "eval_LOCATION_recall": 0.8169014084507042, "eval_ORGANIZATION_f1": 0.7152317880794703, "eval_ORGANIZATION_number": 65, "eval_ORGANIZATION_precision": 0.627906976744186, "eval_ORGANIZATION_recall": 0.8307692307692308, "eval_PERSON_f1": 0.89937106918239, "eval_PERSON_number": 150, "eval_PERSON_precision": 0.8511904761904762, "eval_PERSON_recall": 0.9533333333333334, "eval_QUANTITY_f1": 0.6582278481012658, "eval_QUANTITY_number": 33, "eval_QUANTITY_precision": 0.5652173913043478, "eval_QUANTITY_recall": 0.7878787878787878, "eval_TIME_f1": 0.8135593220338982, "eval_TIME_number": 28, "eval_TIME_precision": 0.7741935483870968, "eval_TIME_recall": 0.8571428571428571, "eval_loss": 0.2011863738298416, "eval_overall_accuracy": 0.9517458777885548, "eval_overall_f1": 0.799475753604194, "eval_overall_precision": 0.7331730769230769, "eval_overall_recall": 0.8789625360230547, "eval_runtime": 0.4048, "eval_samples_per_second": 461.918, "eval_steps_per_second": 7.41, "step": 3922 }, { "epoch": 38.0, "grad_norm": 1.1307073831558228, "learning_rate": 3.1e-05, "loss": 0.037, "step": 4028 }, { "epoch": 38.0, "eval_LOCATION_f1": 0.7837837837837838, "eval_LOCATION_number": 71, "eval_LOCATION_precision": 0.7532467532467533, "eval_LOCATION_recall": 0.8169014084507042, "eval_ORGANIZATION_f1": 0.7681159420289856, "eval_ORGANIZATION_number": 65, "eval_ORGANIZATION_precision": 0.726027397260274, "eval_ORGANIZATION_recall": 0.8153846153846154, "eval_PERSON_f1": 0.896774193548387, "eval_PERSON_number": 150, "eval_PERSON_precision": 0.86875, "eval_PERSON_recall": 0.9266666666666666, "eval_QUANTITY_f1": 0.7671232876712328, "eval_QUANTITY_number": 33, "eval_QUANTITY_precision": 0.7, "eval_QUANTITY_recall": 0.8484848484848485, "eval_TIME_f1": 0.9259259259259259, "eval_TIME_number": 28, "eval_TIME_precision": 0.9615384615384616, "eval_TIME_recall": 0.8928571428571429, "eval_loss": 0.1582067906856537, "eval_overall_accuracy": 0.960717749757517, "eval_overall_f1": 0.8381742738589211, "eval_overall_precision": 0.8058510638297872, "eval_overall_recall": 0.8731988472622478, "eval_runtime": 0.4045, "eval_samples_per_second": 462.274, "eval_steps_per_second": 7.416, "step": 4028 }, { "epoch": 39.0, "grad_norm": 0.8394156694412231, "learning_rate": 3.05e-05, "loss": 0.0332, "step": 4134 }, { "epoch": 39.0, "eval_LOCATION_f1": 0.794701986754967, "eval_LOCATION_number": 71, "eval_LOCATION_precision": 0.75, "eval_LOCATION_recall": 0.8450704225352113, "eval_ORGANIZATION_f1": 0.76, "eval_ORGANIZATION_number": 65, "eval_ORGANIZATION_precision": 0.6705882352941176, "eval_ORGANIZATION_recall": 0.8769230769230769, "eval_PERSON_f1": 0.9108280254777071, "eval_PERSON_number": 150, "eval_PERSON_precision": 0.8719512195121951, "eval_PERSON_recall": 0.9533333333333334, "eval_QUANTITY_f1": 0.7397260273972603, "eval_QUANTITY_number": 33, "eval_QUANTITY_precision": 0.675, "eval_QUANTITY_recall": 0.8181818181818182, "eval_TIME_f1": 0.8571428571428571, "eval_TIME_number": 28, "eval_TIME_precision": 0.8571428571428571, "eval_TIME_recall": 0.8571428571428571, "eval_loss": 0.16989700496196747, "eval_overall_accuracy": 0.9609602327837051, "eval_overall_f1": 0.8360215053763441, "eval_overall_precision": 0.783375314861461, "eval_overall_recall": 0.8962536023054755, "eval_runtime": 0.4173, "eval_samples_per_second": 448.072, "eval_steps_per_second": 7.188, "step": 4134 }, { "epoch": 40.0, "grad_norm": 0.8886793255805969, "learning_rate": 3e-05, "loss": 0.0354, "step": 4240 }, { "epoch": 40.0, "eval_LOCATION_f1": 0.794701986754967, "eval_LOCATION_number": 71, "eval_LOCATION_precision": 0.75, "eval_LOCATION_recall": 0.8450704225352113, "eval_ORGANIZATION_f1": 0.7412587412587412, "eval_ORGANIZATION_number": 65, "eval_ORGANIZATION_precision": 0.6794871794871795, "eval_ORGANIZATION_recall": 0.8153846153846154, "eval_PERSON_f1": 0.9073482428115016, "eval_PERSON_number": 150, "eval_PERSON_precision": 0.8711656441717791, "eval_PERSON_recall": 0.9466666666666667, "eval_QUANTITY_f1": 0.7671232876712328, "eval_QUANTITY_number": 33, "eval_QUANTITY_precision": 0.7, "eval_QUANTITY_recall": 0.8484848484848485, "eval_TIME_f1": 0.7741935483870968, "eval_TIME_number": 28, "eval_TIME_precision": 0.7058823529411765, "eval_TIME_recall": 0.8571428571428571, "eval_loss": 0.1586233377456665, "eval_overall_accuracy": 0.9612027158098934, "eval_overall_f1": 0.8274932614555257, "eval_overall_precision": 0.7772151898734178, "eval_overall_recall": 0.8847262247838616, "eval_runtime": 0.4013, "eval_samples_per_second": 465.977, "eval_steps_per_second": 7.476, "step": 4240 }, { "epoch": 41.0, "grad_norm": 0.6773855686187744, "learning_rate": 2.95e-05, "loss": 0.0331, "step": 4346 }, { "epoch": 41.0, "eval_LOCATION_f1": 0.7741935483870968, "eval_LOCATION_number": 71, "eval_LOCATION_precision": 0.7142857142857143, "eval_LOCATION_recall": 0.8450704225352113, "eval_ORGANIZATION_f1": 0.7619047619047619, "eval_ORGANIZATION_number": 65, "eval_ORGANIZATION_precision": 0.6829268292682927, "eval_ORGANIZATION_recall": 0.8615384615384616, "eval_PERSON_f1": 0.9025974025974027, "eval_PERSON_number": 150, "eval_PERSON_precision": 0.879746835443038, "eval_PERSON_recall": 0.9266666666666666, "eval_QUANTITY_f1": 0.7671232876712328, "eval_QUANTITY_number": 33, "eval_QUANTITY_precision": 0.7, "eval_QUANTITY_recall": 0.8484848484848485, "eval_TIME_f1": 0.8275862068965518, "eval_TIME_number": 28, "eval_TIME_precision": 0.8, "eval_TIME_recall": 0.8571428571428571, "eval_loss": 0.16328278183937073, "eval_overall_accuracy": 0.960717749757517, "eval_overall_f1": 0.8286099865047233, "eval_overall_precision": 0.7791878172588832, "eval_overall_recall": 0.8847262247838616, "eval_runtime": 0.4108, "eval_samples_per_second": 455.24, "eval_steps_per_second": 7.303, "step": 4346 }, { "epoch": 42.0, "grad_norm": 0.5810602903366089, "learning_rate": 2.9e-05, "loss": 0.0312, "step": 4452 }, { "epoch": 42.0, "eval_LOCATION_f1": 0.778523489932886, "eval_LOCATION_number": 71, "eval_LOCATION_precision": 0.7435897435897436, "eval_LOCATION_recall": 0.8169014084507042, "eval_ORGANIZATION_f1": 0.7448275862068966, "eval_ORGANIZATION_number": 65, "eval_ORGANIZATION_precision": 0.675, "eval_ORGANIZATION_recall": 0.8307692307692308, "eval_PERSON_f1": 0.9009584664536742, "eval_PERSON_number": 150, "eval_PERSON_precision": 0.8650306748466258, "eval_PERSON_recall": 0.94, "eval_QUANTITY_f1": 0.7123287671232875, "eval_QUANTITY_number": 33, "eval_QUANTITY_precision": 0.65, "eval_QUANTITY_recall": 0.7878787878787878, "eval_TIME_f1": 0.8771929824561403, "eval_TIME_number": 28, "eval_TIME_precision": 0.8620689655172413, "eval_TIME_recall": 0.8928571428571429, "eval_loss": 0.1705748438835144, "eval_overall_accuracy": 0.9595053346265762, "eval_overall_f1": 0.824966078697422, "eval_overall_precision": 0.7794871794871795, "eval_overall_recall": 0.8760806916426513, "eval_runtime": 0.4042, "eval_samples_per_second": 462.62, "eval_steps_per_second": 7.422, "step": 4452 }, { "epoch": 43.0, "grad_norm": 1.03245210647583, "learning_rate": 2.8499999999999998e-05, "loss": 0.031, "step": 4558 }, { "epoch": 43.0, "eval_LOCATION_f1": 0.782051282051282, "eval_LOCATION_number": 71, "eval_LOCATION_precision": 0.7176470588235294, "eval_LOCATION_recall": 0.8591549295774648, "eval_ORGANIZATION_f1": 0.7482014388489208, "eval_ORGANIZATION_number": 65, "eval_ORGANIZATION_precision": 0.7027027027027027, "eval_ORGANIZATION_recall": 0.8, "eval_PERSON_f1": 0.9073482428115016, "eval_PERSON_number": 150, "eval_PERSON_precision": 0.8711656441717791, "eval_PERSON_recall": 0.9466666666666667, "eval_QUANTITY_f1": 0.821917808219178, "eval_QUANTITY_number": 33, "eval_QUANTITY_precision": 0.75, "eval_QUANTITY_recall": 0.9090909090909091, "eval_TIME_f1": 0.8275862068965518, "eval_TIME_number": 28, "eval_TIME_precision": 0.8, "eval_TIME_recall": 0.8571428571428571, "eval_loss": 0.16453760862350464, "eval_overall_accuracy": 0.9619301648884578, "eval_overall_f1": 0.8362652232746954, "eval_overall_precision": 0.7882653061224489, "eval_overall_recall": 0.8904899135446686, "eval_runtime": 0.4028, "eval_samples_per_second": 464.207, "eval_steps_per_second": 7.447, "step": 4558 }, { "epoch": 44.0, "grad_norm": 1.3175857067108154, "learning_rate": 2.8000000000000003e-05, "loss": 0.0305, "step": 4664 }, { "epoch": 44.0, "eval_LOCATION_f1": 0.7843137254901961, "eval_LOCATION_number": 71, "eval_LOCATION_precision": 0.7317073170731707, "eval_LOCATION_recall": 0.8450704225352113, "eval_ORGANIZATION_f1": 0.7549668874172185, "eval_ORGANIZATION_number": 65, "eval_ORGANIZATION_precision": 0.6627906976744186, "eval_ORGANIZATION_recall": 0.8769230769230769, "eval_PERSON_f1": 0.9044585987261147, "eval_PERSON_number": 150, "eval_PERSON_precision": 0.8658536585365854, "eval_PERSON_recall": 0.9466666666666667, "eval_QUANTITY_f1": 0.7397260273972603, "eval_QUANTITY_number": 33, "eval_QUANTITY_precision": 0.675, "eval_QUANTITY_recall": 0.8181818181818182, "eval_TIME_f1": 0.8928571428571429, "eval_TIME_number": 28, "eval_TIME_precision": 0.8928571428571429, "eval_TIME_recall": 0.8928571428571429, "eval_loss": 0.1853325217962265, "eval_overall_accuracy": 0.9609602327837051, "eval_overall_f1": 0.8326639892904953, "eval_overall_precision": 0.7775, "eval_overall_recall": 0.8962536023054755, "eval_runtime": 0.4048, "eval_samples_per_second": 462.013, "eval_steps_per_second": 7.412, "step": 4664 }, { "epoch": 45.0, "grad_norm": 2.4794533252716064, "learning_rate": 2.7500000000000004e-05, "loss": 0.0284, "step": 4770 }, { "epoch": 45.0, "eval_LOCATION_f1": 0.7866666666666666, "eval_LOCATION_number": 71, "eval_LOCATION_precision": 0.7468354430379747, "eval_LOCATION_recall": 0.8309859154929577, "eval_ORGANIZATION_f1": 0.757142857142857, "eval_ORGANIZATION_number": 65, "eval_ORGANIZATION_precision": 0.7066666666666667, "eval_ORGANIZATION_recall": 0.8153846153846154, "eval_PERSON_f1": 0.9025974025974027, "eval_PERSON_number": 150, "eval_PERSON_precision": 0.879746835443038, "eval_PERSON_recall": 0.9266666666666666, "eval_QUANTITY_f1": 0.7397260273972603, "eval_QUANTITY_number": 33, "eval_QUANTITY_precision": 0.675, "eval_QUANTITY_recall": 0.8181818181818182, "eval_TIME_f1": 0.8571428571428571, "eval_TIME_number": 28, "eval_TIME_precision": 0.8571428571428571, "eval_TIME_recall": 0.8571428571428571, "eval_loss": 0.16584299504756927, "eval_overall_accuracy": 0.9633850630455868, "eval_overall_f1": 0.8308115543328748, "eval_overall_precision": 0.7947368421052632, "eval_overall_recall": 0.8703170028818443, "eval_runtime": 0.4049, "eval_samples_per_second": 461.854, "eval_steps_per_second": 7.409, "step": 4770 }, { "epoch": 46.0, "grad_norm": 1.2760629653930664, "learning_rate": 2.7000000000000002e-05, "loss": 0.028, "step": 4876 }, { "epoch": 46.0, "eval_LOCATION_f1": 0.7581699346405228, "eval_LOCATION_number": 71, "eval_LOCATION_precision": 0.7073170731707317, "eval_LOCATION_recall": 0.8169014084507042, "eval_ORGANIZATION_f1": 0.7210884353741497, "eval_ORGANIZATION_number": 65, "eval_ORGANIZATION_precision": 0.6463414634146342, "eval_ORGANIZATION_recall": 0.8153846153846154, "eval_PERSON_f1": 0.912621359223301, "eval_PERSON_number": 150, "eval_PERSON_precision": 0.8867924528301887, "eval_PERSON_recall": 0.94, "eval_QUANTITY_f1": 0.7397260273972603, "eval_QUANTITY_number": 33, "eval_QUANTITY_precision": 0.675, "eval_QUANTITY_recall": 0.8181818181818182, "eval_TIME_f1": 0.8928571428571429, "eval_TIME_number": 28, "eval_TIME_precision": 0.8928571428571429, "eval_TIME_recall": 0.8928571428571429, "eval_loss": 0.17332231998443604, "eval_overall_accuracy": 0.9599903006789525, "eval_overall_f1": 0.8238482384823849, "eval_overall_precision": 0.7774936061381074, "eval_overall_recall": 0.8760806916426513, "eval_runtime": 0.4033, "eval_samples_per_second": 463.665, "eval_steps_per_second": 7.438, "step": 4876 }, { "epoch": 47.0, "grad_norm": 0.9426093101501465, "learning_rate": 2.6500000000000004e-05, "loss": 0.0257, "step": 4982 }, { "epoch": 47.0, "eval_LOCATION_f1": 0.802721088435374, "eval_LOCATION_number": 71, "eval_LOCATION_precision": 0.7763157894736842, "eval_LOCATION_recall": 0.8309859154929577, "eval_ORGANIZATION_f1": 0.7368421052631579, "eval_ORGANIZATION_number": 65, "eval_ORGANIZATION_precision": 0.6436781609195402, "eval_ORGANIZATION_recall": 0.8615384615384616, "eval_PERSON_f1": 0.9073482428115016, "eval_PERSON_number": 150, "eval_PERSON_precision": 0.8711656441717791, "eval_PERSON_recall": 0.9466666666666667, "eval_QUANTITY_f1": 0.7500000000000001, "eval_QUANTITY_number": 33, "eval_QUANTITY_precision": 0.6923076923076923, "eval_QUANTITY_recall": 0.8181818181818182, "eval_TIME_f1": 0.8771929824561403, "eval_TIME_number": 28, "eval_TIME_precision": 0.8620689655172413, "eval_TIME_recall": 0.8928571428571429, "eval_loss": 0.18327540159225464, "eval_overall_accuracy": 0.9590203685741998, "eval_overall_f1": 0.834008097165992, "eval_overall_precision": 0.7842639593908629, "eval_overall_recall": 0.8904899135446686, "eval_runtime": 0.4078, "eval_samples_per_second": 458.511, "eval_steps_per_second": 7.356, "step": 4982 }, { "epoch": 48.0, "grad_norm": 0.6249455213546753, "learning_rate": 2.6000000000000002e-05, "loss": 0.0281, "step": 5088 }, { "epoch": 48.0, "eval_LOCATION_f1": 0.7837837837837838, "eval_LOCATION_number": 71, "eval_LOCATION_precision": 0.7532467532467533, "eval_LOCATION_recall": 0.8169014084507042, "eval_ORGANIZATION_f1": 0.7310344827586207, "eval_ORGANIZATION_number": 65, "eval_ORGANIZATION_precision": 0.6625, "eval_ORGANIZATION_recall": 0.8153846153846154, "eval_PERSON_f1": 0.8910256410256411, "eval_PERSON_number": 150, "eval_PERSON_precision": 0.8580246913580247, "eval_PERSON_recall": 0.9266666666666666, "eval_QUANTITY_f1": 0.7777777777777778, "eval_QUANTITY_number": 33, "eval_QUANTITY_precision": 0.717948717948718, "eval_QUANTITY_recall": 0.8484848484848485, "eval_TIME_f1": 0.8518518518518519, "eval_TIME_number": 28, "eval_TIME_precision": 0.8846153846153846, "eval_TIME_recall": 0.8214285714285714, "eval_loss": 0.17024332284927368, "eval_overall_accuracy": 0.960717749757517, "eval_overall_f1": 0.823529411764706, "eval_overall_precision": 0.7838541666666666, "eval_overall_recall": 0.8674351585014409, "eval_runtime": 0.4064, "eval_samples_per_second": 460.192, "eval_steps_per_second": 7.383, "step": 5088 }, { "epoch": 49.0, "grad_norm": 0.06978233903646469, "learning_rate": 2.5500000000000003e-05, "loss": 0.0245, "step": 5194 }, { "epoch": 49.0, "eval_LOCATION_f1": 0.7741935483870968, "eval_LOCATION_number": 71, "eval_LOCATION_precision": 0.7142857142857143, "eval_LOCATION_recall": 0.8450704225352113, "eval_ORGANIZATION_f1": 0.7346938775510204, "eval_ORGANIZATION_number": 65, "eval_ORGANIZATION_precision": 0.6585365853658537, "eval_ORGANIZATION_recall": 0.8307692307692308, "eval_PERSON_f1": 0.9131832797427653, "eval_PERSON_number": 150, "eval_PERSON_precision": 0.8819875776397516, "eval_PERSON_recall": 0.9466666666666667, "eval_QUANTITY_f1": 0.7397260273972603, "eval_QUANTITY_number": 33, "eval_QUANTITY_precision": 0.675, "eval_QUANTITY_recall": 0.8181818181818182, "eval_TIME_f1": 0.8620689655172413, "eval_TIME_number": 28, "eval_TIME_precision": 0.8333333333333334, "eval_TIME_recall": 0.8928571428571429, "eval_loss": 0.18626831471920013, "eval_overall_accuracy": 0.9614451988360815, "eval_overall_f1": 0.8279569892473119, "eval_overall_precision": 0.7758186397984886, "eval_overall_recall": 0.8876080691642652, "eval_runtime": 0.4028, "eval_samples_per_second": 464.25, "eval_steps_per_second": 7.448, "step": 5194 }, { "epoch": 50.0, "grad_norm": 2.4998741149902344, "learning_rate": 2.5e-05, "loss": 0.0251, "step": 5300 }, { "epoch": 50.0, "eval_LOCATION_f1": 0.7866666666666666, "eval_LOCATION_number": 71, "eval_LOCATION_precision": 0.7468354430379747, "eval_LOCATION_recall": 0.8309859154929577, "eval_ORGANIZATION_f1": 0.7536231884057971, "eval_ORGANIZATION_number": 65, "eval_ORGANIZATION_precision": 0.7123287671232876, "eval_ORGANIZATION_recall": 0.8, "eval_PERSON_f1": 0.9084967320261438, "eval_PERSON_number": 150, "eval_PERSON_precision": 0.8910256410256411, "eval_PERSON_recall": 0.9266666666666666, "eval_QUANTITY_f1": 0.7777777777777778, "eval_QUANTITY_number": 33, "eval_QUANTITY_precision": 0.717948717948718, "eval_QUANTITY_recall": 0.8484848484848485, "eval_TIME_f1": 0.8928571428571429, "eval_TIME_number": 28, "eval_TIME_precision": 0.8928571428571429, "eval_TIME_recall": 0.8928571428571429, "eval_loss": 0.16275979578495026, "eval_overall_accuracy": 0.9638700290979632, "eval_overall_f1": 0.8393351800554018, "eval_overall_precision": 0.808, "eval_overall_recall": 0.8731988472622478, "eval_runtime": 0.4053, "eval_samples_per_second": 461.392, "eval_steps_per_second": 7.402, "step": 5300 }, { "epoch": 51.0, "grad_norm": 1.0746209621429443, "learning_rate": 2.45e-05, "loss": 0.0251, "step": 5406 }, { "epoch": 51.0, "eval_LOCATION_f1": 0.7763157894736843, "eval_LOCATION_number": 71, "eval_LOCATION_precision": 0.7283950617283951, "eval_LOCATION_recall": 0.8309859154929577, "eval_ORGANIZATION_f1": 0.7819548872180452, "eval_ORGANIZATION_number": 65, "eval_ORGANIZATION_precision": 0.7647058823529411, "eval_ORGANIZATION_recall": 0.8, "eval_PERSON_f1": 0.9155844155844156, "eval_PERSON_number": 150, "eval_PERSON_precision": 0.8924050632911392, "eval_PERSON_recall": 0.94, "eval_QUANTITY_f1": 0.7777777777777778, "eval_QUANTITY_number": 33, "eval_QUANTITY_precision": 0.717948717948718, "eval_QUANTITY_recall": 0.8484848484848485, "eval_TIME_f1": 0.8727272727272727, "eval_TIME_number": 28, "eval_TIME_precision": 0.8888888888888888, "eval_TIME_recall": 0.8571428571428571, "eval_loss": 0.16527943313121796, "eval_overall_accuracy": 0.9662948593598448, "eval_overall_f1": 0.8444444444444444, "eval_overall_precision": 0.8150134048257373, "eval_overall_recall": 0.8760806916426513, "eval_runtime": 0.4037, "eval_samples_per_second": 463.197, "eval_steps_per_second": 7.431, "step": 5406 }, { "epoch": 52.0, "grad_norm": 1.7756356000900269, "learning_rate": 2.4e-05, "loss": 0.0245, "step": 5512 }, { "epoch": 52.0, "eval_LOCATION_f1": 0.7866666666666666, "eval_LOCATION_number": 71, "eval_LOCATION_precision": 0.7468354430379747, "eval_LOCATION_recall": 0.8309859154929577, "eval_ORGANIZATION_f1": 0.76, "eval_ORGANIZATION_number": 65, "eval_ORGANIZATION_precision": 0.6705882352941176, "eval_ORGANIZATION_recall": 0.8769230769230769, "eval_PERSON_f1": 0.9044585987261147, "eval_PERSON_number": 150, "eval_PERSON_precision": 0.8658536585365854, "eval_PERSON_recall": 0.9466666666666667, "eval_QUANTITY_f1": 0.7397260273972603, "eval_QUANTITY_number": 33, "eval_QUANTITY_precision": 0.675, "eval_QUANTITY_recall": 0.8181818181818182, "eval_TIME_f1": 0.8421052631578947, "eval_TIME_number": 28, "eval_TIME_precision": 0.8275862068965517, "eval_TIME_recall": 0.8571428571428571, "eval_loss": 0.18333446979522705, "eval_overall_accuracy": 0.9602327837051406, "eval_overall_f1": 0.8306451612903226, "eval_overall_precision": 0.7783375314861462, "eval_overall_recall": 0.8904899135446686, "eval_runtime": 0.4031, "eval_samples_per_second": 463.928, "eval_steps_per_second": 7.443, "step": 5512 }, { "epoch": 53.0, "grad_norm": 0.80136638879776, "learning_rate": 2.35e-05, "loss": 0.0222, "step": 5618 }, { "epoch": 53.0, "eval_LOCATION_f1": 0.759493670886076, "eval_LOCATION_number": 71, "eval_LOCATION_precision": 0.6896551724137931, "eval_LOCATION_recall": 0.8450704225352113, "eval_ORGANIZATION_f1": 0.7346938775510204, "eval_ORGANIZATION_number": 65, "eval_ORGANIZATION_precision": 0.6585365853658537, "eval_ORGANIZATION_recall": 0.8307692307692308, "eval_PERSON_f1": 0.9102564102564102, "eval_PERSON_number": 150, "eval_PERSON_precision": 0.8765432098765432, "eval_PERSON_recall": 0.9466666666666667, "eval_QUANTITY_f1": 0.7397260273972603, "eval_QUANTITY_number": 33, "eval_QUANTITY_precision": 0.675, "eval_QUANTITY_recall": 0.8181818181818182, "eval_TIME_f1": 0.8771929824561403, "eval_TIME_number": 28, "eval_TIME_precision": 0.8620689655172413, "eval_TIME_recall": 0.8928571428571429, "eval_loss": 0.1887245774269104, "eval_overall_accuracy": 0.9595053346265762, "eval_overall_f1": 0.824631860776439, "eval_overall_precision": 0.77, "eval_overall_recall": 0.8876080691642652, "eval_runtime": 0.4031, "eval_samples_per_second": 463.882, "eval_steps_per_second": 7.442, "step": 5618 }, { "epoch": 54.0, "grad_norm": 1.39556086063385, "learning_rate": 2.3000000000000003e-05, "loss": 0.024, "step": 5724 }, { "epoch": 54.0, "eval_LOCATION_f1": 0.7919463087248323, "eval_LOCATION_number": 71, "eval_LOCATION_precision": 0.7564102564102564, "eval_LOCATION_recall": 0.8309859154929577, "eval_ORGANIZATION_f1": 0.7682119205298013, "eval_ORGANIZATION_number": 65, "eval_ORGANIZATION_precision": 0.6744186046511628, "eval_ORGANIZATION_recall": 0.8923076923076924, "eval_PERSON_f1": 0.9131832797427653, "eval_PERSON_number": 150, "eval_PERSON_precision": 0.8819875776397516, "eval_PERSON_recall": 0.9466666666666667, "eval_QUANTITY_f1": 0.8055555555555556, "eval_QUANTITY_number": 33, "eval_QUANTITY_precision": 0.7435897435897436, "eval_QUANTITY_recall": 0.8787878787878788, "eval_TIME_f1": 0.8771929824561403, "eval_TIME_number": 28, "eval_TIME_precision": 0.8620689655172413, "eval_TIME_recall": 0.8928571428571429, "eval_loss": 0.17654088139533997, "eval_overall_accuracy": 0.9633850630455868, "eval_overall_f1": 0.8459459459459459, "eval_overall_precision": 0.7964376590330788, "eval_overall_recall": 0.9020172910662824, "eval_runtime": 0.4024, "eval_samples_per_second": 464.697, "eval_steps_per_second": 7.455, "step": 5724 }, { "epoch": 55.0, "grad_norm": 1.3348910808563232, "learning_rate": 2.25e-05, "loss": 0.0238, "step": 5830 }, { "epoch": 55.0, "eval_LOCATION_f1": 0.7866666666666666, "eval_LOCATION_number": 71, "eval_LOCATION_precision": 0.7468354430379747, "eval_LOCATION_recall": 0.8309859154929577, "eval_ORGANIZATION_f1": 0.7755102040816327, "eval_ORGANIZATION_number": 65, "eval_ORGANIZATION_precision": 0.6951219512195121, "eval_ORGANIZATION_recall": 0.8769230769230769, "eval_PERSON_f1": 0.9190938511326862, "eval_PERSON_number": 150, "eval_PERSON_precision": 0.8930817610062893, "eval_PERSON_recall": 0.9466666666666667, "eval_QUANTITY_f1": 0.7671232876712328, "eval_QUANTITY_number": 33, "eval_QUANTITY_precision": 0.7, "eval_QUANTITY_recall": 0.8484848484848485, "eval_TIME_f1": 0.9259259259259259, "eval_TIME_number": 28, "eval_TIME_precision": 0.9615384615384616, "eval_TIME_recall": 0.8928571428571429, "eval_loss": 0.1749105155467987, "eval_overall_accuracy": 0.9645974781765276, "eval_overall_f1": 0.8485675306957708, "eval_overall_precision": 0.805699481865285, "eval_overall_recall": 0.8962536023054755, "eval_runtime": 0.4051, "eval_samples_per_second": 461.622, "eval_steps_per_second": 7.406, "step": 5830 }, { "epoch": 56.0, "grad_norm": 0.7062710523605347, "learning_rate": 2.2000000000000003e-05, "loss": 0.021, "step": 5936 }, { "epoch": 56.0, "eval_LOCATION_f1": 0.7483870967741935, "eval_LOCATION_number": 71, "eval_LOCATION_precision": 0.6904761904761905, "eval_LOCATION_recall": 0.8169014084507042, "eval_ORGANIZATION_f1": 0.7397260273972603, "eval_ORGANIZATION_number": 65, "eval_ORGANIZATION_precision": 0.6666666666666666, "eval_ORGANIZATION_recall": 0.8307692307692308, "eval_PERSON_f1": 0.9096774193548387, "eval_PERSON_number": 150, "eval_PERSON_precision": 0.88125, "eval_PERSON_recall": 0.94, "eval_QUANTITY_f1": 0.7777777777777778, "eval_QUANTITY_number": 33, "eval_QUANTITY_precision": 0.717948717948718, "eval_QUANTITY_recall": 0.8484848484848485, "eval_TIME_f1": 0.8620689655172413, "eval_TIME_number": 28, "eval_TIME_precision": 0.8333333333333334, "eval_TIME_recall": 0.8928571428571429, "eval_loss": 0.17994269728660583, "eval_overall_accuracy": 0.9602327837051406, "eval_overall_f1": 0.8259109311740891, "eval_overall_precision": 0.7766497461928934, "eval_overall_recall": 0.8818443804034583, "eval_runtime": 0.4031, "eval_samples_per_second": 463.918, "eval_steps_per_second": 7.443, "step": 5936 }, { "epoch": 57.0, "grad_norm": 0.6525917053222656, "learning_rate": 2.15e-05, "loss": 0.0199, "step": 6042 }, { "epoch": 57.0, "eval_LOCATION_f1": 0.7763157894736843, "eval_LOCATION_number": 71, "eval_LOCATION_precision": 0.7283950617283951, "eval_LOCATION_recall": 0.8309859154929577, "eval_ORGANIZATION_f1": 0.7536231884057971, "eval_ORGANIZATION_number": 65, "eval_ORGANIZATION_precision": 0.7123287671232876, "eval_ORGANIZATION_recall": 0.8, "eval_PERSON_f1": 0.9102564102564102, "eval_PERSON_number": 150, "eval_PERSON_precision": 0.8765432098765432, "eval_PERSON_recall": 0.9466666666666667, "eval_QUANTITY_f1": 0.8055555555555556, "eval_QUANTITY_number": 33, "eval_QUANTITY_precision": 0.7435897435897436, "eval_QUANTITY_recall": 0.8787878787878788, "eval_TIME_f1": 0.9090909090909091, "eval_TIME_number": 28, "eval_TIME_precision": 0.9259259259259259, "eval_TIME_recall": 0.8928571428571429, "eval_loss": 0.19421829283237457, "eval_overall_accuracy": 0.9619301648884578, "eval_overall_f1": 0.8422496570644719, "eval_overall_precision": 0.8036649214659686, "eval_overall_recall": 0.8847262247838616, "eval_runtime": 0.4031, "eval_samples_per_second": 463.878, "eval_steps_per_second": 7.442, "step": 6042 }, { "epoch": 58.0, "grad_norm": 1.2534284591674805, "learning_rate": 2.1e-05, "loss": 0.0187, "step": 6148 }, { "epoch": 58.0, "eval_LOCATION_f1": 0.75, "eval_LOCATION_number": 71, "eval_LOCATION_precision": 0.7037037037037037, "eval_LOCATION_recall": 0.8028169014084507, "eval_ORGANIZATION_f1": 0.7536231884057971, "eval_ORGANIZATION_number": 65, "eval_ORGANIZATION_precision": 0.7123287671232876, "eval_ORGANIZATION_recall": 0.8, "eval_PERSON_f1": 0.9055374592833875, "eval_PERSON_number": 150, "eval_PERSON_precision": 0.8853503184713376, "eval_PERSON_recall": 0.9266666666666666, "eval_QUANTITY_f1": 0.7500000000000001, "eval_QUANTITY_number": 33, "eval_QUANTITY_precision": 0.6923076923076923, "eval_QUANTITY_recall": 0.8181818181818182, "eval_TIME_f1": 0.8771929824561403, "eval_TIME_number": 28, "eval_TIME_precision": 0.8620689655172413, "eval_TIME_recall": 0.8928571428571429, "eval_loss": 0.19052091240882874, "eval_overall_accuracy": 0.9609602327837051, "eval_overall_f1": 0.8264462809917356, "eval_overall_precision": 0.7915567282321899, "eval_overall_recall": 0.8645533141210374, "eval_runtime": 0.4084, "eval_samples_per_second": 457.931, "eval_steps_per_second": 7.346, "step": 6148 }, { "epoch": 59.0, "grad_norm": 0.5067676305770874, "learning_rate": 2.05e-05, "loss": 0.0199, "step": 6254 }, { "epoch": 59.0, "eval_LOCATION_f1": 0.7581699346405228, "eval_LOCATION_number": 71, "eval_LOCATION_precision": 0.7073170731707317, "eval_LOCATION_recall": 0.8169014084507042, "eval_ORGANIZATION_f1": 0.7464788732394366, "eval_ORGANIZATION_number": 65, "eval_ORGANIZATION_precision": 0.6883116883116883, "eval_ORGANIZATION_recall": 0.8153846153846154, "eval_PERSON_f1": 0.9019607843137256, "eval_PERSON_number": 150, "eval_PERSON_precision": 0.8846153846153846, "eval_PERSON_recall": 0.92, "eval_QUANTITY_f1": 0.8055555555555556, "eval_QUANTITY_number": 33, "eval_QUANTITY_precision": 0.7435897435897436, "eval_QUANTITY_recall": 0.8787878787878788, "eval_TIME_f1": 0.8070175438596492, "eval_TIME_number": 28, "eval_TIME_precision": 0.7931034482758621, "eval_TIME_recall": 0.8214285714285714, "eval_loss": 0.19398272037506104, "eval_overall_accuracy": 0.9592628516003879, "eval_overall_f1": 0.8246575342465754, "eval_overall_precision": 0.7859007832898173, "eval_overall_recall": 0.8674351585014409, "eval_runtime": 0.404, "eval_samples_per_second": 462.903, "eval_steps_per_second": 7.426, "step": 6254 }, { "epoch": 60.0, "grad_norm": 0.6053163409233093, "learning_rate": 2e-05, "loss": 0.0183, "step": 6360 }, { "epoch": 60.0, "eval_LOCATION_f1": 0.778523489932886, "eval_LOCATION_number": 71, "eval_LOCATION_precision": 0.7435897435897436, "eval_LOCATION_recall": 0.8169014084507042, "eval_ORGANIZATION_f1": 0.7417218543046358, "eval_ORGANIZATION_number": 65, "eval_ORGANIZATION_precision": 0.6511627906976745, "eval_ORGANIZATION_recall": 0.8615384615384616, "eval_PERSON_f1": 0.9061488673139159, "eval_PERSON_number": 150, "eval_PERSON_precision": 0.8805031446540881, "eval_PERSON_recall": 0.9333333333333333, "eval_QUANTITY_f1": 0.7500000000000001, "eval_QUANTITY_number": 33, "eval_QUANTITY_precision": 0.6923076923076923, "eval_QUANTITY_recall": 0.8181818181818182, "eval_TIME_f1": 0.8571428571428571, "eval_TIME_number": 28, "eval_TIME_precision": 0.8571428571428571, "eval_TIME_recall": 0.8571428571428571, "eval_loss": 0.1951519399881363, "eval_overall_accuracy": 0.9599903006789525, "eval_overall_f1": 0.8276797829036635, "eval_overall_precision": 0.782051282051282, "eval_overall_recall": 0.8789625360230547, "eval_runtime": 0.4039, "eval_samples_per_second": 463.014, "eval_steps_per_second": 7.428, "step": 6360 }, { "epoch": 61.0, "grad_norm": 0.19502782821655273, "learning_rate": 1.9500000000000003e-05, "loss": 0.0178, "step": 6466 }, { "epoch": 61.0, "eval_LOCATION_f1": 0.7638888888888888, "eval_LOCATION_number": 71, "eval_LOCATION_precision": 0.7534246575342466, "eval_LOCATION_recall": 0.7746478873239436, "eval_ORGANIZATION_f1": 0.7724137931034483, "eval_ORGANIZATION_number": 65, "eval_ORGANIZATION_precision": 0.7, "eval_ORGANIZATION_recall": 0.8615384615384616, "eval_PERSON_f1": 0.9055374592833875, "eval_PERSON_number": 150, "eval_PERSON_precision": 0.8853503184713376, "eval_PERSON_recall": 0.9266666666666666, "eval_QUANTITY_f1": 0.8450704225352113, "eval_QUANTITY_number": 33, "eval_QUANTITY_precision": 0.7894736842105263, "eval_QUANTITY_recall": 0.9090909090909091, "eval_TIME_f1": 0.8275862068965518, "eval_TIME_number": 28, "eval_TIME_precision": 0.8, "eval_TIME_recall": 0.8571428571428571, "eval_loss": 0.190224289894104, "eval_overall_accuracy": 0.962172647914646, "eval_overall_f1": 0.8386206896551723, "eval_overall_precision": 0.8042328042328042, "eval_overall_recall": 0.8760806916426513, "eval_runtime": 0.4062, "eval_samples_per_second": 460.355, "eval_steps_per_second": 7.385, "step": 6466 }, { "epoch": 62.0, "grad_norm": 0.6164102554321289, "learning_rate": 1.9e-05, "loss": 0.0196, "step": 6572 }, { "epoch": 62.0, "eval_LOCATION_f1": 0.778523489932886, "eval_LOCATION_number": 71, "eval_LOCATION_precision": 0.7435897435897436, "eval_LOCATION_recall": 0.8169014084507042, "eval_ORGANIZATION_f1": 0.75, "eval_ORGANIZATION_number": 65, "eval_ORGANIZATION_precision": 0.6835443037974683, "eval_ORGANIZATION_recall": 0.8307692307692308, "eval_PERSON_f1": 0.8925081433224756, "eval_PERSON_number": 150, "eval_PERSON_precision": 0.8726114649681529, "eval_PERSON_recall": 0.9133333333333333, "eval_QUANTITY_f1": 0.8055555555555556, "eval_QUANTITY_number": 33, "eval_QUANTITY_precision": 0.7435897435897436, "eval_QUANTITY_recall": 0.8787878787878788, "eval_TIME_f1": 0.8214285714285714, "eval_TIME_number": 28, "eval_TIME_precision": 0.8214285714285714, "eval_TIME_recall": 0.8214285714285714, "eval_loss": 0.18320535123348236, "eval_overall_accuracy": 0.962172647914646, "eval_overall_f1": 0.8269230769230769, "eval_overall_precision": 0.7900262467191601, "eval_overall_recall": 0.8674351585014409, "eval_runtime": 0.4026, "eval_samples_per_second": 464.456, "eval_steps_per_second": 7.451, "step": 6572 }, { "epoch": 63.0, "grad_norm": 1.624141812324524, "learning_rate": 1.85e-05, "loss": 0.0182, "step": 6678 }, { "epoch": 63.0, "eval_LOCATION_f1": 0.7651006711409397, "eval_LOCATION_number": 71, "eval_LOCATION_precision": 0.7307692307692307, "eval_LOCATION_recall": 0.8028169014084507, "eval_ORGANIZATION_f1": 0.7619047619047619, "eval_ORGANIZATION_number": 65, "eval_ORGANIZATION_precision": 0.6829268292682927, "eval_ORGANIZATION_recall": 0.8615384615384616, "eval_PERSON_f1": 0.8925081433224756, "eval_PERSON_number": 150, "eval_PERSON_precision": 0.8726114649681529, "eval_PERSON_recall": 0.9133333333333333, "eval_QUANTITY_f1": 0.7500000000000001, "eval_QUANTITY_number": 33, "eval_QUANTITY_precision": 0.6923076923076923, "eval_QUANTITY_recall": 0.8181818181818182, "eval_TIME_f1": 0.8421052631578947, "eval_TIME_number": 28, "eval_TIME_precision": 0.8275862068965517, "eval_TIME_recall": 0.8571428571428571, "eval_loss": 0.187962144613266, "eval_overall_accuracy": 0.9616876818622696, "eval_overall_f1": 0.8224043715846995, "eval_overall_precision": 0.7818181818181819, "eval_overall_recall": 0.8674351585014409, "eval_runtime": 0.4039, "eval_samples_per_second": 462.956, "eval_steps_per_second": 7.427, "step": 6678 }, { "epoch": 64.0, "grad_norm": 1.540419340133667, "learning_rate": 1.8e-05, "loss": 0.0181, "step": 6784 }, { "epoch": 64.0, "eval_LOCATION_f1": 0.7682119205298014, "eval_LOCATION_number": 71, "eval_LOCATION_precision": 0.725, "eval_LOCATION_recall": 0.8169014084507042, "eval_ORGANIZATION_f1": 0.7586206896551724, "eval_ORGANIZATION_number": 65, "eval_ORGANIZATION_precision": 0.6875, "eval_ORGANIZATION_recall": 0.8461538461538461, "eval_PERSON_f1": 0.8903225806451613, "eval_PERSON_number": 150, "eval_PERSON_precision": 0.8625, "eval_PERSON_recall": 0.92, "eval_QUANTITY_f1": 0.7777777777777778, "eval_QUANTITY_number": 33, "eval_QUANTITY_precision": 0.717948717948718, "eval_QUANTITY_recall": 0.8484848484848485, "eval_TIME_f1": 0.8275862068965518, "eval_TIME_number": 28, "eval_TIME_precision": 0.8, "eval_TIME_recall": 0.8571428571428571, "eval_loss": 0.19288307428359985, "eval_overall_accuracy": 0.9590203685741998, "eval_overall_f1": 0.8233695652173914, "eval_overall_precision": 0.7789203084832905, "eval_overall_recall": 0.8731988472622478, "eval_runtime": 0.4048, "eval_samples_per_second": 461.933, "eval_steps_per_second": 7.411, "step": 6784 }, { "epoch": 65.0, "grad_norm": 0.8278260231018066, "learning_rate": 1.75e-05, "loss": 0.0187, "step": 6890 }, { "epoch": 65.0, "eval_LOCATION_f1": 0.7763157894736843, "eval_LOCATION_number": 71, "eval_LOCATION_precision": 0.7283950617283951, "eval_LOCATION_recall": 0.8309859154929577, "eval_ORGANIZATION_f1": 0.7681159420289856, "eval_ORGANIZATION_number": 65, "eval_ORGANIZATION_precision": 0.726027397260274, "eval_ORGANIZATION_recall": 0.8153846153846154, "eval_PERSON_f1": 0.8990228013029316, "eval_PERSON_number": 150, "eval_PERSON_precision": 0.8789808917197452, "eval_PERSON_recall": 0.92, "eval_QUANTITY_f1": 0.7500000000000001, "eval_QUANTITY_number": 33, "eval_QUANTITY_precision": 0.6923076923076923, "eval_QUANTITY_recall": 0.8181818181818182, "eval_TIME_f1": 0.8928571428571429, "eval_TIME_number": 28, "eval_TIME_precision": 0.8928571428571429, "eval_TIME_recall": 0.8928571428571429, "eval_loss": 0.19136402010917664, "eval_overall_accuracy": 0.9614451988360815, "eval_overall_f1": 0.8331034482758621, "eval_overall_precision": 0.798941798941799, "eval_overall_recall": 0.8703170028818443, "eval_runtime": 0.4041, "eval_samples_per_second": 462.729, "eval_steps_per_second": 7.423, "step": 6890 }, { "epoch": 66.0, "grad_norm": 1.0269757509231567, "learning_rate": 1.7000000000000003e-05, "loss": 0.016, "step": 6996 }, { "epoch": 66.0, "eval_LOCATION_f1": 0.7712418300653594, "eval_LOCATION_number": 71, "eval_LOCATION_precision": 0.7195121951219512, "eval_LOCATION_recall": 0.8309859154929577, "eval_ORGANIZATION_f1": 0.7552447552447553, "eval_ORGANIZATION_number": 65, "eval_ORGANIZATION_precision": 0.6923076923076923, "eval_ORGANIZATION_recall": 0.8307692307692308, "eval_PERSON_f1": 0.9025974025974027, "eval_PERSON_number": 150, "eval_PERSON_precision": 0.879746835443038, "eval_PERSON_recall": 0.9266666666666666, "eval_QUANTITY_f1": 0.7397260273972603, "eval_QUANTITY_number": 33, "eval_QUANTITY_precision": 0.675, "eval_QUANTITY_recall": 0.8181818181818182, "eval_TIME_f1": 0.8275862068965518, "eval_TIME_number": 28, "eval_TIME_precision": 0.8, "eval_TIME_recall": 0.8571428571428571, "eval_loss": 0.20218557119369507, "eval_overall_accuracy": 0.9602327837051406, "eval_overall_f1": 0.8244897959183674, "eval_overall_precision": 0.7809278350515464, "eval_overall_recall": 0.8731988472622478, "eval_runtime": 0.4034, "eval_samples_per_second": 463.539, "eval_steps_per_second": 7.436, "step": 6996 }, { "epoch": 67.0, "grad_norm": 0.6365354061126709, "learning_rate": 1.65e-05, "loss": 0.0153, "step": 7102 }, { "epoch": 67.0, "eval_LOCATION_f1": 0.7549668874172185, "eval_LOCATION_number": 71, "eval_LOCATION_precision": 0.7125, "eval_LOCATION_recall": 0.8028169014084507, "eval_ORGANIZATION_f1": 0.757142857142857, "eval_ORGANIZATION_number": 65, "eval_ORGANIZATION_precision": 0.7066666666666667, "eval_ORGANIZATION_recall": 0.8153846153846154, "eval_PERSON_f1": 0.9096774193548387, "eval_PERSON_number": 150, "eval_PERSON_precision": 0.88125, "eval_PERSON_recall": 0.94, "eval_QUANTITY_f1": 0.8055555555555556, "eval_QUANTITY_number": 33, "eval_QUANTITY_precision": 0.7435897435897436, "eval_QUANTITY_recall": 0.8787878787878788, "eval_TIME_f1": 0.8275862068965518, "eval_TIME_number": 28, "eval_TIME_precision": 0.8, "eval_TIME_recall": 0.8571428571428571, "eval_loss": 0.19219978153705597, "eval_overall_accuracy": 0.960717749757517, "eval_overall_f1": 0.8317373461012312, "eval_overall_precision": 0.7916666666666666, "eval_overall_recall": 0.8760806916426513, "eval_runtime": 0.4029, "eval_samples_per_second": 464.137, "eval_steps_per_second": 7.446, "step": 7102 }, { "epoch": 68.0, "grad_norm": 3.532707691192627, "learning_rate": 1.6000000000000003e-05, "loss": 0.0165, "step": 7208 }, { "epoch": 68.0, "eval_LOCATION_f1": 0.76, "eval_LOCATION_number": 71, "eval_LOCATION_precision": 0.7215189873417721, "eval_LOCATION_recall": 0.8028169014084507, "eval_ORGANIZATION_f1": 0.7567567567567568, "eval_ORGANIZATION_number": 65, "eval_ORGANIZATION_precision": 0.6746987951807228, "eval_ORGANIZATION_recall": 0.8615384615384616, "eval_PERSON_f1": 0.9055374592833875, "eval_PERSON_number": 150, "eval_PERSON_precision": 0.8853503184713376, "eval_PERSON_recall": 0.9266666666666666, "eval_QUANTITY_f1": 0.7397260273972603, "eval_QUANTITY_number": 33, "eval_QUANTITY_precision": 0.675, "eval_QUANTITY_recall": 0.8181818181818182, "eval_TIME_f1": 0.8571428571428571, "eval_TIME_number": 28, "eval_TIME_precision": 0.8571428571428571, "eval_TIME_recall": 0.8571428571428571, "eval_loss": 0.20774675905704498, "eval_overall_accuracy": 0.9609602327837051, "eval_overall_f1": 0.8256130790190734, "eval_overall_precision": 0.7829457364341085, "eval_overall_recall": 0.8731988472622478, "eval_runtime": 0.4026, "eval_samples_per_second": 464.494, "eval_steps_per_second": 7.452, "step": 7208 }, { "epoch": 69.0, "grad_norm": 1.3800381422042847, "learning_rate": 1.55e-05, "loss": 0.0159, "step": 7314 }, { "epoch": 69.0, "eval_LOCATION_f1": 0.7549668874172185, "eval_LOCATION_number": 71, "eval_LOCATION_precision": 0.7125, "eval_LOCATION_recall": 0.8028169014084507, "eval_ORGANIZATION_f1": 0.75, "eval_ORGANIZATION_number": 65, "eval_ORGANIZATION_precision": 0.6835443037974683, "eval_ORGANIZATION_recall": 0.8307692307692308, "eval_PERSON_f1": 0.9090909090909091, "eval_PERSON_number": 150, "eval_PERSON_precision": 0.8860759493670886, "eval_PERSON_recall": 0.9333333333333333, "eval_QUANTITY_f1": 0.7945205479452054, "eval_QUANTITY_number": 33, "eval_QUANTITY_precision": 0.725, "eval_QUANTITY_recall": 0.8787878787878788, "eval_TIME_f1": 0.8771929824561403, "eval_TIME_number": 28, "eval_TIME_precision": 0.8620689655172413, "eval_TIME_recall": 0.8928571428571429, "eval_loss": 0.20177708566188812, "eval_overall_accuracy": 0.9619301648884578, "eval_overall_f1": 0.8321964529331515, "eval_overall_precision": 0.7901554404145078, "eval_overall_recall": 0.8789625360230547, "eval_runtime": 0.4055, "eval_samples_per_second": 461.121, "eval_steps_per_second": 7.398, "step": 7314 }, { "epoch": 70.0, "grad_norm": 0.4369199573993683, "learning_rate": 1.5e-05, "loss": 0.0151, "step": 7420 }, { "epoch": 70.0, "eval_LOCATION_f1": 0.7402597402597403, "eval_LOCATION_number": 71, "eval_LOCATION_precision": 0.6867469879518072, "eval_LOCATION_recall": 0.8028169014084507, "eval_ORGANIZATION_f1": 0.76056338028169, "eval_ORGANIZATION_number": 65, "eval_ORGANIZATION_precision": 0.7012987012987013, "eval_ORGANIZATION_recall": 0.8307692307692308, "eval_PERSON_f1": 0.9084967320261438, "eval_PERSON_number": 150, "eval_PERSON_precision": 0.8910256410256411, "eval_PERSON_recall": 0.9266666666666666, "eval_QUANTITY_f1": 0.7397260273972603, "eval_QUANTITY_number": 33, "eval_QUANTITY_precision": 0.675, "eval_QUANTITY_recall": 0.8181818181818182, "eval_TIME_f1": 0.8275862068965518, "eval_TIME_number": 28, "eval_TIME_precision": 0.8, "eval_TIME_recall": 0.8571428571428571, "eval_loss": 0.21934795379638672, "eval_overall_accuracy": 0.9587778855480117, "eval_overall_f1": 0.8212824010914053, "eval_overall_precision": 0.7797927461139896, "eval_overall_recall": 0.8674351585014409, "eval_runtime": 0.4045, "eval_samples_per_second": 462.289, "eval_steps_per_second": 7.416, "step": 7420 }, { "epoch": 71.0, "grad_norm": 0.6564136743545532, "learning_rate": 1.45e-05, "loss": 0.0149, "step": 7526 }, { "epoch": 71.0, "eval_LOCATION_f1": 0.7763157894736843, "eval_LOCATION_number": 71, "eval_LOCATION_precision": 0.7283950617283951, "eval_LOCATION_recall": 0.8309859154929577, "eval_ORGANIZATION_f1": 0.7671232876712328, "eval_ORGANIZATION_number": 65, "eval_ORGANIZATION_precision": 0.691358024691358, "eval_ORGANIZATION_recall": 0.8615384615384616, "eval_PERSON_f1": 0.9090909090909091, "eval_PERSON_number": 150, "eval_PERSON_precision": 0.8860759493670886, "eval_PERSON_recall": 0.9333333333333333, "eval_QUANTITY_f1": 0.7777777777777778, "eval_QUANTITY_number": 33, "eval_QUANTITY_precision": 0.717948717948718, "eval_QUANTITY_recall": 0.8484848484848485, "eval_TIME_f1": 0.8421052631578947, "eval_TIME_number": 28, "eval_TIME_precision": 0.8275862068965517, "eval_TIME_recall": 0.8571428571428571, "eval_loss": 0.21174688637256622, "eval_overall_accuracy": 0.9614451988360815, "eval_overall_f1": 0.8353741496598639, "eval_overall_precision": 0.7912371134020618, "eval_overall_recall": 0.8847262247838616, "eval_runtime": 0.4036, "eval_samples_per_second": 463.368, "eval_steps_per_second": 7.434, "step": 7526 }, { "epoch": 72.0, "grad_norm": 1.1040197610855103, "learning_rate": 1.4000000000000001e-05, "loss": 0.0152, "step": 7632 }, { "epoch": 72.0, "eval_LOCATION_f1": 0.7733333333333333, "eval_LOCATION_number": 71, "eval_LOCATION_precision": 0.7341772151898734, "eval_LOCATION_recall": 0.8169014084507042, "eval_ORGANIZATION_f1": 0.7746478873239436, "eval_ORGANIZATION_number": 65, "eval_ORGANIZATION_precision": 0.7142857142857143, "eval_ORGANIZATION_recall": 0.8461538461538461, "eval_PERSON_f1": 0.9019607843137256, "eval_PERSON_number": 150, "eval_PERSON_precision": 0.8846153846153846, "eval_PERSON_recall": 0.92, "eval_QUANTITY_f1": 0.8169014084507042, "eval_QUANTITY_number": 33, "eval_QUANTITY_precision": 0.7631578947368421, "eval_QUANTITY_recall": 0.8787878787878788, "eval_TIME_f1": 0.8363636363636364, "eval_TIME_number": 28, "eval_TIME_precision": 0.8518518518518519, "eval_TIME_recall": 0.8214285714285714, "eval_loss": 0.19948169589042664, "eval_overall_accuracy": 0.9624151309408342, "eval_overall_f1": 0.8370165745856354, "eval_overall_precision": 0.8037135278514589, "eval_overall_recall": 0.8731988472622478, "eval_runtime": 0.4055, "eval_samples_per_second": 461.114, "eval_steps_per_second": 7.398, "step": 7632 }, { "epoch": 73.0, "grad_norm": 0.12047336250543594, "learning_rate": 1.3500000000000001e-05, "loss": 0.0149, "step": 7738 }, { "epoch": 73.0, "eval_LOCATION_f1": 0.7612903225806451, "eval_LOCATION_number": 71, "eval_LOCATION_precision": 0.7023809523809523, "eval_LOCATION_recall": 0.8309859154929577, "eval_ORGANIZATION_f1": 0.7619047619047619, "eval_ORGANIZATION_number": 65, "eval_ORGANIZATION_precision": 0.6829268292682927, "eval_ORGANIZATION_recall": 0.8615384615384616, "eval_PERSON_f1": 0.912621359223301, "eval_PERSON_number": 150, "eval_PERSON_precision": 0.8867924528301887, "eval_PERSON_recall": 0.94, "eval_QUANTITY_f1": 0.7777777777777778, "eval_QUANTITY_number": 33, "eval_QUANTITY_precision": 0.717948717948718, "eval_QUANTITY_recall": 0.8484848484848485, "eval_TIME_f1": 0.8421052631578947, "eval_TIME_number": 28, "eval_TIME_precision": 0.8275862068965517, "eval_TIME_recall": 0.8571428571428571, "eval_loss": 0.2207670509815216, "eval_overall_accuracy": 0.9609602327837051, "eval_overall_f1": 0.8324324324324324, "eval_overall_precision": 0.7837150127226463, "eval_overall_recall": 0.8876080691642652, "eval_runtime": 0.4058, "eval_samples_per_second": 460.775, "eval_steps_per_second": 7.392, "step": 7738 }, { "epoch": 74.0, "grad_norm": 1.3887410163879395, "learning_rate": 1.3000000000000001e-05, "loss": 0.0141, "step": 7844 }, { "epoch": 74.0, "eval_LOCATION_f1": 0.7567567567567568, "eval_LOCATION_number": 71, "eval_LOCATION_precision": 0.7272727272727273, "eval_LOCATION_recall": 0.7887323943661971, "eval_ORGANIZATION_f1": 0.7769784172661871, "eval_ORGANIZATION_number": 65, "eval_ORGANIZATION_precision": 0.7297297297297297, "eval_ORGANIZATION_recall": 0.8307692307692308, "eval_PERSON_f1": 0.9155844155844156, "eval_PERSON_number": 150, "eval_PERSON_precision": 0.8924050632911392, "eval_PERSON_recall": 0.94, "eval_QUANTITY_f1": 0.7777777777777778, "eval_QUANTITY_number": 33, "eval_QUANTITY_precision": 0.717948717948718, "eval_QUANTITY_recall": 0.8484848484848485, "eval_TIME_f1": 0.8421052631578947, "eval_TIME_number": 28, "eval_TIME_precision": 0.8275862068965517, "eval_TIME_recall": 0.8571428571428571, "eval_loss": 0.2141115963459015, "eval_overall_accuracy": 0.9624151309408342, "eval_overall_f1": 0.8370165745856354, "eval_overall_precision": 0.8037135278514589, "eval_overall_recall": 0.8731988472622478, "eval_runtime": 0.4026, "eval_samples_per_second": 464.486, "eval_steps_per_second": 7.452, "step": 7844 }, { "epoch": 75.0, "grad_norm": 0.22892561554908752, "learning_rate": 1.25e-05, "loss": 0.0142, "step": 7950 }, { "epoch": 75.0, "eval_LOCATION_f1": 0.7662337662337662, "eval_LOCATION_number": 71, "eval_LOCATION_precision": 0.7108433734939759, "eval_LOCATION_recall": 0.8309859154929577, "eval_ORGANIZATION_f1": 0.7222222222222222, "eval_ORGANIZATION_number": 65, "eval_ORGANIZATION_precision": 0.6582278481012658, "eval_ORGANIZATION_recall": 0.8, "eval_PERSON_f1": 0.9055374592833875, "eval_PERSON_number": 150, "eval_PERSON_precision": 0.8853503184713376, "eval_PERSON_recall": 0.9266666666666666, "eval_QUANTITY_f1": 0.8055555555555556, "eval_QUANTITY_number": 33, "eval_QUANTITY_precision": 0.7435897435897436, "eval_QUANTITY_recall": 0.8787878787878788, "eval_TIME_f1": 0.8771929824561403, "eval_TIME_number": 28, "eval_TIME_precision": 0.8620689655172413, "eval_TIME_recall": 0.8928571428571429, "eval_loss": 0.20973996818065643, "eval_overall_accuracy": 0.9609602327837051, "eval_overall_f1": 0.8283378746594005, "eval_overall_precision": 0.7855297157622739, "eval_overall_recall": 0.8760806916426513, "eval_runtime": 0.4054, "eval_samples_per_second": 461.245, "eval_steps_per_second": 7.4, "step": 7950 }, { "epoch": 76.0, "grad_norm": 0.28838738799095154, "learning_rate": 1.2e-05, "loss": 0.0132, "step": 8056 }, { "epoch": 76.0, "eval_LOCATION_f1": 0.7631578947368421, "eval_LOCATION_number": 71, "eval_LOCATION_precision": 0.7160493827160493, "eval_LOCATION_recall": 0.8169014084507042, "eval_ORGANIZATION_f1": 0.7517730496453899, "eval_ORGANIZATION_number": 65, "eval_ORGANIZATION_precision": 0.6973684210526315, "eval_ORGANIZATION_recall": 0.8153846153846154, "eval_PERSON_f1": 0.9096774193548387, "eval_PERSON_number": 150, "eval_PERSON_precision": 0.88125, "eval_PERSON_recall": 0.94, "eval_QUANTITY_f1": 0.8055555555555556, "eval_QUANTITY_number": 33, "eval_QUANTITY_precision": 0.7435897435897436, "eval_QUANTITY_recall": 0.8787878787878788, "eval_TIME_f1": 0.8421052631578947, "eval_TIME_number": 28, "eval_TIME_precision": 0.8275862068965517, "eval_TIME_recall": 0.8571428571428571, "eval_loss": 0.2148653268814087, "eval_overall_accuracy": 0.9619301648884578, "eval_overall_f1": 0.8333333333333333, "eval_overall_precision": 0.7922077922077922, "eval_overall_recall": 0.8789625360230547, "eval_runtime": 0.405, "eval_samples_per_second": 461.757, "eval_steps_per_second": 7.408, "step": 8056 }, { "epoch": 77.0, "grad_norm": 0.2209300547838211, "learning_rate": 1.1500000000000002e-05, "loss": 0.0132, "step": 8162 }, { "epoch": 77.0, "eval_LOCATION_f1": 0.7483870967741935, "eval_LOCATION_number": 71, "eval_LOCATION_precision": 0.6904761904761905, "eval_LOCATION_recall": 0.8169014084507042, "eval_ORGANIZATION_f1": 0.7659574468085107, "eval_ORGANIZATION_number": 65, "eval_ORGANIZATION_precision": 0.7105263157894737, "eval_ORGANIZATION_recall": 0.8307692307692308, "eval_PERSON_f1": 0.912621359223301, "eval_PERSON_number": 150, "eval_PERSON_precision": 0.8867924528301887, "eval_PERSON_recall": 0.94, "eval_QUANTITY_f1": 0.7500000000000001, "eval_QUANTITY_number": 33, "eval_QUANTITY_precision": 0.6923076923076923, "eval_QUANTITY_recall": 0.8181818181818182, "eval_TIME_f1": 0.8928571428571429, "eval_TIME_number": 28, "eval_TIME_precision": 0.8928571428571429, "eval_TIME_recall": 0.8928571428571429, "eval_loss": 0.21584409475326538, "eval_overall_accuracy": 0.960717749757517, "eval_overall_f1": 0.8321964529331515, "eval_overall_precision": 0.7901554404145078, "eval_overall_recall": 0.8789625360230547, "eval_runtime": 0.4041, "eval_samples_per_second": 462.714, "eval_steps_per_second": 7.423, "step": 8162 }, { "epoch": 78.0, "grad_norm": 0.5461943745613098, "learning_rate": 1.1000000000000001e-05, "loss": 0.0141, "step": 8268 }, { "epoch": 78.0, "eval_LOCATION_f1": 0.7549668874172185, "eval_LOCATION_number": 71, "eval_LOCATION_precision": 0.7125, "eval_LOCATION_recall": 0.8028169014084507, "eval_ORGANIZATION_f1": 0.76056338028169, "eval_ORGANIZATION_number": 65, "eval_ORGANIZATION_precision": 0.7012987012987013, "eval_ORGANIZATION_recall": 0.8307692307692308, "eval_PERSON_f1": 0.9019607843137256, "eval_PERSON_number": 150, "eval_PERSON_precision": 0.8846153846153846, "eval_PERSON_recall": 0.92, "eval_QUANTITY_f1": 0.7671232876712328, "eval_QUANTITY_number": 33, "eval_QUANTITY_precision": 0.7, "eval_QUANTITY_recall": 0.8484848484848485, "eval_TIME_f1": 0.8421052631578947, "eval_TIME_number": 28, "eval_TIME_precision": 0.8275862068965517, "eval_TIME_recall": 0.8571428571428571, "eval_loss": 0.20878075063228607, "eval_overall_accuracy": 0.960717749757517, "eval_overall_f1": 0.8257887517146777, "eval_overall_precision": 0.7879581151832461, "eval_overall_recall": 0.8674351585014409, "eval_runtime": 0.4053, "eval_samples_per_second": 461.363, "eval_steps_per_second": 7.402, "step": 8268 }, { "epoch": 79.0, "grad_norm": 0.6024172902107239, "learning_rate": 1.05e-05, "loss": 0.0117, "step": 8374 }, { "epoch": 79.0, "eval_LOCATION_f1": 0.7549668874172185, "eval_LOCATION_number": 71, "eval_LOCATION_precision": 0.7125, "eval_LOCATION_recall": 0.8028169014084507, "eval_ORGANIZATION_f1": 0.7737226277372263, "eval_ORGANIZATION_number": 65, "eval_ORGANIZATION_precision": 0.7361111111111112, "eval_ORGANIZATION_recall": 0.8153846153846154, "eval_PERSON_f1": 0.9090909090909091, "eval_PERSON_number": 150, "eval_PERSON_precision": 0.8860759493670886, "eval_PERSON_recall": 0.9333333333333333, "eval_QUANTITY_f1": 0.8055555555555556, "eval_QUANTITY_number": 33, "eval_QUANTITY_precision": 0.7435897435897436, "eval_QUANTITY_recall": 0.8787878787878788, "eval_TIME_f1": 0.8421052631578947, "eval_TIME_number": 28, "eval_TIME_precision": 0.8275862068965517, "eval_TIME_recall": 0.8571428571428571, "eval_loss": 0.20918363332748413, "eval_overall_accuracy": 0.9614451988360815, "eval_overall_f1": 0.8358620689655172, "eval_overall_precision": 0.8015873015873016, "eval_overall_recall": 0.8731988472622478, "eval_runtime": 0.4026, "eval_samples_per_second": 464.472, "eval_steps_per_second": 7.451, "step": 8374 }, { "epoch": 80.0, "grad_norm": 1.4614003896713257, "learning_rate": 1e-05, "loss": 0.0127, "step": 8480 }, { "epoch": 80.0, "eval_LOCATION_f1": 0.7417218543046357, "eval_LOCATION_number": 71, "eval_LOCATION_precision": 0.7, "eval_LOCATION_recall": 0.7887323943661971, "eval_ORGANIZATION_f1": 0.75, "eval_ORGANIZATION_number": 65, "eval_ORGANIZATION_precision": 0.6835443037974683, "eval_ORGANIZATION_recall": 0.8307692307692308, "eval_PERSON_f1": 0.9090909090909091, "eval_PERSON_number": 150, "eval_PERSON_precision": 0.8860759493670886, "eval_PERSON_recall": 0.9333333333333333, "eval_QUANTITY_f1": 0.7777777777777778, "eval_QUANTITY_number": 33, "eval_QUANTITY_precision": 0.717948717948718, "eval_QUANTITY_recall": 0.8484848484848485, "eval_TIME_f1": 0.8727272727272727, "eval_TIME_number": 28, "eval_TIME_precision": 0.8888888888888888, "eval_TIME_recall": 0.8571428571428571, "eval_loss": 0.2205442190170288, "eval_overall_accuracy": 0.9587778855480117, "eval_overall_f1": 0.8273972602739728, "eval_overall_precision": 0.7885117493472585, "eval_overall_recall": 0.8703170028818443, "eval_runtime": 0.4027, "eval_samples_per_second": 464.311, "eval_steps_per_second": 7.449, "step": 8480 }, { "epoch": 81.0, "grad_norm": 1.915273666381836, "learning_rate": 9.5e-06, "loss": 0.0134, "step": 8586 }, { "epoch": 81.0, "eval_LOCATION_f1": 0.76, "eval_LOCATION_number": 71, "eval_LOCATION_precision": 0.7215189873417721, "eval_LOCATION_recall": 0.8028169014084507, "eval_ORGANIZATION_f1": 0.7737226277372263, "eval_ORGANIZATION_number": 65, "eval_ORGANIZATION_precision": 0.7361111111111112, "eval_ORGANIZATION_recall": 0.8153846153846154, "eval_PERSON_f1": 0.9090909090909091, "eval_PERSON_number": 150, "eval_PERSON_precision": 0.8860759493670886, "eval_PERSON_recall": 0.9333333333333333, "eval_QUANTITY_f1": 0.8055555555555556, "eval_QUANTITY_number": 33, "eval_QUANTITY_precision": 0.7435897435897436, "eval_QUANTITY_recall": 0.8787878787878788, "eval_TIME_f1": 0.8421052631578947, "eval_TIME_number": 28, "eval_TIME_precision": 0.8275862068965517, "eval_TIME_recall": 0.8571428571428571, "eval_loss": 0.20929260551929474, "eval_overall_accuracy": 0.9631425800193987, "eval_overall_f1": 0.8370165745856354, "eval_overall_precision": 0.8037135278514589, "eval_overall_recall": 0.8731988472622478, "eval_runtime": 0.4028, "eval_samples_per_second": 464.264, "eval_steps_per_second": 7.448, "step": 8586 }, { "epoch": 82.0, "grad_norm": 1.0925920009613037, "learning_rate": 9e-06, "loss": 0.0138, "step": 8692 }, { "epoch": 82.0, "eval_LOCATION_f1": 0.7682119205298014, "eval_LOCATION_number": 71, "eval_LOCATION_precision": 0.725, "eval_LOCATION_recall": 0.8169014084507042, "eval_ORGANIZATION_f1": 0.7659574468085107, "eval_ORGANIZATION_number": 65, "eval_ORGANIZATION_precision": 0.7105263157894737, "eval_ORGANIZATION_recall": 0.8307692307692308, "eval_PERSON_f1": 0.9055374592833875, "eval_PERSON_number": 150, "eval_PERSON_precision": 0.8853503184713376, "eval_PERSON_recall": 0.9266666666666666, "eval_QUANTITY_f1": 0.8055555555555556, "eval_QUANTITY_number": 33, "eval_QUANTITY_precision": 0.7435897435897436, "eval_QUANTITY_recall": 0.8787878787878788, "eval_TIME_f1": 0.8421052631578947, "eval_TIME_number": 28, "eval_TIME_precision": 0.8275862068965517, "eval_TIME_recall": 0.8571428571428571, "eval_loss": 0.20777982473373413, "eval_overall_accuracy": 0.9612027158098934, "eval_overall_f1": 0.8351648351648351, "eval_overall_precision": 0.7979002624671916, "eval_overall_recall": 0.8760806916426513, "eval_runtime": 0.404, "eval_samples_per_second": 462.894, "eval_steps_per_second": 7.426, "step": 8692 }, { "epoch": 83.0, "grad_norm": 1.2260353565216064, "learning_rate": 8.500000000000002e-06, "loss": 0.0129, "step": 8798 }, { "epoch": 83.0, "eval_LOCATION_f1": 0.7417218543046357, "eval_LOCATION_number": 71, "eval_LOCATION_precision": 0.7, "eval_LOCATION_recall": 0.7887323943661971, "eval_ORGANIZATION_f1": 0.7692307692307693, "eval_ORGANIZATION_number": 65, "eval_ORGANIZATION_precision": 0.7051282051282052, "eval_ORGANIZATION_recall": 0.8461538461538461, "eval_PERSON_f1": 0.8996763754045306, "eval_PERSON_number": 150, "eval_PERSON_precision": 0.8742138364779874, "eval_PERSON_recall": 0.9266666666666666, "eval_QUANTITY_f1": 0.7777777777777778, "eval_QUANTITY_number": 33, "eval_QUANTITY_precision": 0.717948717948718, "eval_QUANTITY_recall": 0.8484848484848485, "eval_TIME_f1": 0.8421052631578947, "eval_TIME_number": 28, "eval_TIME_precision": 0.8275862068965517, "eval_TIME_recall": 0.8571428571428571, "eval_loss": 0.21702027320861816, "eval_overall_accuracy": 0.9599903006789525, "eval_overall_f1": 0.825136612021858, "eval_overall_precision": 0.7844155844155845, "eval_overall_recall": 0.8703170028818443, "eval_runtime": 0.4043, "eval_samples_per_second": 462.499, "eval_steps_per_second": 7.42, "step": 8798 }, { "epoch": 84.0, "grad_norm": 0.29825663566589355, "learning_rate": 8.000000000000001e-06, "loss": 0.0119, "step": 8904 }, { "epoch": 84.0, "eval_LOCATION_f1": 0.7712418300653594, "eval_LOCATION_number": 71, "eval_LOCATION_precision": 0.7195121951219512, "eval_LOCATION_recall": 0.8309859154929577, "eval_ORGANIZATION_f1": 0.757142857142857, "eval_ORGANIZATION_number": 65, "eval_ORGANIZATION_precision": 0.7066666666666667, "eval_ORGANIZATION_recall": 0.8153846153846154, "eval_PERSON_f1": 0.896103896103896, "eval_PERSON_number": 150, "eval_PERSON_precision": 0.8734177215189873, "eval_PERSON_recall": 0.92, "eval_QUANTITY_f1": 0.8055555555555556, "eval_QUANTITY_number": 33, "eval_QUANTITY_precision": 0.7435897435897436, "eval_QUANTITY_recall": 0.8787878787878788, "eval_TIME_f1": 0.8421052631578947, "eval_TIME_number": 28, "eval_TIME_precision": 0.8275862068965517, "eval_TIME_recall": 0.8571428571428571, "eval_loss": 0.2102896124124527, "eval_overall_accuracy": 0.9612027158098934, "eval_overall_f1": 0.8301369863013699, "eval_overall_precision": 0.7911227154046997, "eval_overall_recall": 0.8731988472622478, "eval_runtime": 0.4038, "eval_samples_per_second": 463.06, "eval_steps_per_second": 7.429, "step": 8904 }, { "epoch": 85.0, "grad_norm": 2.5998857021331787, "learning_rate": 7.5e-06, "loss": 0.0117, "step": 9010 }, { "epoch": 85.0, "eval_LOCATION_f1": 0.7631578947368421, "eval_LOCATION_number": 71, "eval_LOCATION_precision": 0.7160493827160493, "eval_LOCATION_recall": 0.8169014084507042, "eval_ORGANIZATION_f1": 0.7755102040816327, "eval_ORGANIZATION_number": 65, "eval_ORGANIZATION_precision": 0.6951219512195121, "eval_ORGANIZATION_recall": 0.8769230769230769, "eval_PERSON_f1": 0.912621359223301, "eval_PERSON_number": 150, "eval_PERSON_precision": 0.8867924528301887, "eval_PERSON_recall": 0.94, "eval_QUANTITY_f1": 0.7945205479452054, "eval_QUANTITY_number": 33, "eval_QUANTITY_precision": 0.725, "eval_QUANTITY_recall": 0.8787878787878788, "eval_TIME_f1": 0.8070175438596492, "eval_TIME_number": 28, "eval_TIME_precision": 0.7931034482758621, "eval_TIME_recall": 0.8214285714285714, "eval_loss": 0.22094765305519104, "eval_overall_accuracy": 0.9597478176527643, "eval_overall_f1": 0.8346883468834688, "eval_overall_precision": 0.7877237851662404, "eval_overall_recall": 0.8876080691642652, "eval_runtime": 0.4049, "eval_samples_per_second": 461.865, "eval_steps_per_second": 7.41, "step": 9010 }, { "epoch": 86.0, "grad_norm": 1.0339630842208862, "learning_rate": 7.000000000000001e-06, "loss": 0.0129, "step": 9116 }, { "epoch": 86.0, "eval_LOCATION_f1": 0.7631578947368421, "eval_LOCATION_number": 71, "eval_LOCATION_precision": 0.7160493827160493, "eval_LOCATION_recall": 0.8169014084507042, "eval_ORGANIZATION_f1": 0.7659574468085107, "eval_ORGANIZATION_number": 65, "eval_ORGANIZATION_precision": 0.7105263157894737, "eval_ORGANIZATION_recall": 0.8307692307692308, "eval_PERSON_f1": 0.9155844155844156, "eval_PERSON_number": 150, "eval_PERSON_precision": 0.8924050632911392, "eval_PERSON_recall": 0.94, "eval_QUANTITY_f1": 0.8055555555555556, "eval_QUANTITY_number": 33, "eval_QUANTITY_precision": 0.7435897435897436, "eval_QUANTITY_recall": 0.8787878787878788, "eval_TIME_f1": 0.8275862068965518, "eval_TIME_number": 28, "eval_TIME_precision": 0.8, "eval_TIME_recall": 0.8571428571428571, "eval_loss": 0.2100267857313156, "eval_overall_accuracy": 0.9619301648884578, "eval_overall_f1": 0.8372093023255814, "eval_overall_precision": 0.796875, "eval_overall_recall": 0.8818443804034583, "eval_runtime": 0.4047, "eval_samples_per_second": 462.12, "eval_steps_per_second": 7.414, "step": 9116 }, { "epoch": 87.0, "grad_norm": 0.0695308968424797, "learning_rate": 6.5000000000000004e-06, "loss": 0.0107, "step": 9222 }, { "epoch": 87.0, "eval_LOCATION_f1": 0.7549668874172185, "eval_LOCATION_number": 71, "eval_LOCATION_precision": 0.7125, "eval_LOCATION_recall": 0.8028169014084507, "eval_ORGANIZATION_f1": 0.7692307692307693, "eval_ORGANIZATION_number": 65, "eval_ORGANIZATION_precision": 0.7051282051282052, "eval_ORGANIZATION_recall": 0.8461538461538461, "eval_PERSON_f1": 0.9155844155844156, "eval_PERSON_number": 150, "eval_PERSON_precision": 0.8924050632911392, "eval_PERSON_recall": 0.94, "eval_QUANTITY_f1": 0.8055555555555556, "eval_QUANTITY_number": 33, "eval_QUANTITY_precision": 0.7435897435897436, "eval_QUANTITY_recall": 0.8787878787878788, "eval_TIME_f1": 0.8421052631578947, "eval_TIME_number": 28, "eval_TIME_precision": 0.8275862068965517, "eval_TIME_recall": 0.8571428571428571, "eval_loss": 0.21508151292800903, "eval_overall_accuracy": 0.9616876818622696, "eval_overall_f1": 0.8372093023255814, "eval_overall_precision": 0.796875, "eval_overall_recall": 0.8818443804034583, "eval_runtime": 0.407, "eval_samples_per_second": 459.502, "eval_steps_per_second": 7.372, "step": 9222 }, { "epoch": 88.0, "grad_norm": 1.1862696409225464, "learning_rate": 6e-06, "loss": 0.0121, "step": 9328 }, { "epoch": 88.0, "eval_LOCATION_f1": 0.7733333333333333, "eval_LOCATION_number": 71, "eval_LOCATION_precision": 0.7341772151898734, "eval_LOCATION_recall": 0.8169014084507042, "eval_ORGANIZATION_f1": 0.7659574468085107, "eval_ORGANIZATION_number": 65, "eval_ORGANIZATION_precision": 0.7105263157894737, "eval_ORGANIZATION_recall": 0.8307692307692308, "eval_PERSON_f1": 0.8990228013029316, "eval_PERSON_number": 150, "eval_PERSON_precision": 0.8789808917197452, "eval_PERSON_recall": 0.92, "eval_QUANTITY_f1": 0.7777777777777778, "eval_QUANTITY_number": 33, "eval_QUANTITY_precision": 0.717948717948718, "eval_QUANTITY_recall": 0.8484848484848485, "eval_TIME_f1": 0.8571428571428571, "eval_TIME_number": 28, "eval_TIME_precision": 0.8571428571428571, "eval_TIME_recall": 0.8571428571428571, "eval_loss": 0.21262787282466888, "eval_overall_accuracy": 0.9614451988360815, "eval_overall_f1": 0.8319559228650137, "eval_overall_precision": 0.7968337730870713, "eval_overall_recall": 0.8703170028818443, "eval_runtime": 0.4061, "eval_samples_per_second": 460.423, "eval_steps_per_second": 7.386, "step": 9328 }, { "epoch": 89.0, "grad_norm": 1.132206678390503, "learning_rate": 5.500000000000001e-06, "loss": 0.0104, "step": 9434 }, { "epoch": 89.0, "eval_LOCATION_f1": 0.7733333333333333, "eval_LOCATION_number": 71, "eval_LOCATION_precision": 0.7341772151898734, "eval_LOCATION_recall": 0.8169014084507042, "eval_ORGANIZATION_f1": 0.7857142857142856, "eval_ORGANIZATION_number": 65, "eval_ORGANIZATION_precision": 0.7333333333333333, "eval_ORGANIZATION_recall": 0.8461538461538461, "eval_PERSON_f1": 0.9090909090909091, "eval_PERSON_number": 150, "eval_PERSON_precision": 0.8860759493670886, "eval_PERSON_recall": 0.9333333333333333, "eval_QUANTITY_f1": 0.7887323943661972, "eval_QUANTITY_number": 33, "eval_QUANTITY_precision": 0.7368421052631579, "eval_QUANTITY_recall": 0.8484848484848485, "eval_TIME_f1": 0.8421052631578947, "eval_TIME_number": 28, "eval_TIME_precision": 0.8275862068965517, "eval_TIME_recall": 0.8571428571428571, "eval_loss": 0.21018344163894653, "eval_overall_accuracy": 0.9631425800193987, "eval_overall_f1": 0.8402203856749312, "eval_overall_precision": 0.8047493403693932, "eval_overall_recall": 0.8789625360230547, "eval_runtime": 0.4076, "eval_samples_per_second": 458.732, "eval_steps_per_second": 7.359, "step": 9434 }, { "epoch": 90.0, "grad_norm": 0.5784242749214172, "learning_rate": 5e-06, "loss": 0.0114, "step": 9540 }, { "epoch": 90.0, "eval_LOCATION_f1": 0.7682119205298014, "eval_LOCATION_number": 71, "eval_LOCATION_precision": 0.725, "eval_LOCATION_recall": 0.8169014084507042, "eval_ORGANIZATION_f1": 0.7826086956521738, "eval_ORGANIZATION_number": 65, "eval_ORGANIZATION_precision": 0.7397260273972602, "eval_ORGANIZATION_recall": 0.8307692307692308, "eval_PERSON_f1": 0.9061488673139159, "eval_PERSON_number": 150, "eval_PERSON_precision": 0.8805031446540881, "eval_PERSON_recall": 0.9333333333333333, "eval_QUANTITY_f1": 0.7777777777777778, "eval_QUANTITY_number": 33, "eval_QUANTITY_precision": 0.717948717948718, "eval_QUANTITY_recall": 0.8484848484848485, "eval_TIME_f1": 0.8571428571428571, "eval_TIME_number": 28, "eval_TIME_precision": 0.8571428571428571, "eval_TIME_recall": 0.8571428571428571, "eval_loss": 0.21030160784721375, "eval_overall_accuracy": 0.9629000969932104, "eval_overall_f1": 0.837465564738292, "eval_overall_precision": 0.8021108179419525, "eval_overall_recall": 0.8760806916426513, "eval_runtime": 0.4106, "eval_samples_per_second": 455.383, "eval_steps_per_second": 7.306, "step": 9540 }, { "epoch": 91.0, "grad_norm": 0.3709010183811188, "learning_rate": 4.5e-06, "loss": 0.0105, "step": 9646 }, { "epoch": 91.0, "eval_LOCATION_f1": 0.7631578947368421, "eval_LOCATION_number": 71, "eval_LOCATION_precision": 0.7160493827160493, "eval_LOCATION_recall": 0.8169014084507042, "eval_ORGANIZATION_f1": 0.7769784172661871, "eval_ORGANIZATION_number": 65, "eval_ORGANIZATION_precision": 0.7297297297297297, "eval_ORGANIZATION_recall": 0.8307692307692308, "eval_PERSON_f1": 0.9061488673139159, "eval_PERSON_number": 150, "eval_PERSON_precision": 0.8805031446540881, "eval_PERSON_recall": 0.9333333333333333, "eval_QUANTITY_f1": 0.8055555555555556, "eval_QUANTITY_number": 33, "eval_QUANTITY_precision": 0.7435897435897436, "eval_QUANTITY_recall": 0.8787878787878788, "eval_TIME_f1": 0.8421052631578947, "eval_TIME_number": 28, "eval_TIME_precision": 0.8275862068965517, "eval_TIME_recall": 0.8571428571428571, "eval_loss": 0.2143879383802414, "eval_overall_accuracy": 0.9629000969932104, "eval_overall_f1": 0.8367626886145404, "eval_overall_precision": 0.7984293193717278, "eval_overall_recall": 0.8789625360230547, "eval_runtime": 0.4069, "eval_samples_per_second": 459.523, "eval_steps_per_second": 7.372, "step": 9646 }, { "epoch": 92.0, "grad_norm": 0.19695152342319489, "learning_rate": 4.000000000000001e-06, "loss": 0.011, "step": 9752 }, { "epoch": 92.0, "eval_LOCATION_f1": 0.75, "eval_LOCATION_number": 71, "eval_LOCATION_precision": 0.7037037037037037, "eval_LOCATION_recall": 0.8028169014084507, "eval_ORGANIZATION_f1": 0.7692307692307693, "eval_ORGANIZATION_number": 65, "eval_ORGANIZATION_precision": 0.7051282051282052, "eval_ORGANIZATION_recall": 0.8461538461538461, "eval_PERSON_f1": 0.9155844155844156, "eval_PERSON_number": 150, "eval_PERSON_precision": 0.8924050632911392, "eval_PERSON_recall": 0.94, "eval_QUANTITY_f1": 0.8055555555555556, "eval_QUANTITY_number": 33, "eval_QUANTITY_precision": 0.7435897435897436, "eval_QUANTITY_recall": 0.8787878787878788, "eval_TIME_f1": 0.8275862068965518, "eval_TIME_number": 28, "eval_TIME_precision": 0.8, "eval_TIME_recall": 0.8571428571428571, "eval_loss": 0.22280381619930267, "eval_overall_accuracy": 0.960717749757517, "eval_overall_f1": 0.834924965893588, "eval_overall_precision": 0.7927461139896373, "eval_overall_recall": 0.8818443804034583, "eval_runtime": 0.4088, "eval_samples_per_second": 457.432, "eval_steps_per_second": 7.338, "step": 9752 }, { "epoch": 93.0, "grad_norm": 0.30122533440589905, "learning_rate": 3.5000000000000004e-06, "loss": 0.0107, "step": 9858 }, { "epoch": 93.0, "eval_LOCATION_f1": 0.7631578947368421, "eval_LOCATION_number": 71, "eval_LOCATION_precision": 0.7160493827160493, "eval_LOCATION_recall": 0.8169014084507042, "eval_ORGANIZATION_f1": 0.7552447552447553, "eval_ORGANIZATION_number": 65, "eval_ORGANIZATION_precision": 0.6923076923076923, "eval_ORGANIZATION_recall": 0.8307692307692308, "eval_PERSON_f1": 0.9155844155844156, "eval_PERSON_number": 150, "eval_PERSON_precision": 0.8924050632911392, "eval_PERSON_recall": 0.94, "eval_QUANTITY_f1": 0.8055555555555556, "eval_QUANTITY_number": 33, "eval_QUANTITY_precision": 0.7435897435897436, "eval_QUANTITY_recall": 0.8787878787878788, "eval_TIME_f1": 0.8275862068965518, "eval_TIME_number": 28, "eval_TIME_precision": 0.8, "eval_TIME_recall": 0.8571428571428571, "eval_loss": 0.2211771309375763, "eval_overall_accuracy": 0.9609602327837051, "eval_overall_f1": 0.834924965893588, "eval_overall_precision": 0.7927461139896373, "eval_overall_recall": 0.8818443804034583, "eval_runtime": 0.4094, "eval_samples_per_second": 456.814, "eval_steps_per_second": 7.329, "step": 9858 }, { "epoch": 94.0, "grad_norm": 0.1013573631644249, "learning_rate": 3e-06, "loss": 0.009, "step": 9964 }, { "epoch": 94.0, "eval_LOCATION_f1": 0.7631578947368421, "eval_LOCATION_number": 71, "eval_LOCATION_precision": 0.7160493827160493, "eval_LOCATION_recall": 0.8169014084507042, "eval_ORGANIZATION_f1": 0.7586206896551724, "eval_ORGANIZATION_number": 65, "eval_ORGANIZATION_precision": 0.6875, "eval_ORGANIZATION_recall": 0.8461538461538461, "eval_PERSON_f1": 0.9155844155844156, "eval_PERSON_number": 150, "eval_PERSON_precision": 0.8924050632911392, "eval_PERSON_recall": 0.94, "eval_QUANTITY_f1": 0.8055555555555556, "eval_QUANTITY_number": 33, "eval_QUANTITY_precision": 0.7435897435897436, "eval_QUANTITY_recall": 0.8787878787878788, "eval_TIME_f1": 0.8275862068965518, "eval_TIME_number": 28, "eval_TIME_precision": 0.8, "eval_TIME_recall": 0.8571428571428571, "eval_loss": 0.2232343554496765, "eval_overall_accuracy": 0.9619301648884578, "eval_overall_f1": 0.8353741496598639, "eval_overall_precision": 0.7912371134020618, "eval_overall_recall": 0.8847262247838616, "eval_runtime": 0.4075, "eval_samples_per_second": 458.923, "eval_steps_per_second": 7.362, "step": 9964 }, { "epoch": 95.0, "grad_norm": 1.0435041189193726, "learning_rate": 2.5e-06, "loss": 0.0109, "step": 10070 }, { "epoch": 95.0, "eval_LOCATION_f1": 0.7450980392156863, "eval_LOCATION_number": 71, "eval_LOCATION_precision": 0.6951219512195121, "eval_LOCATION_recall": 0.8028169014084507, "eval_ORGANIZATION_f1": 0.7552447552447553, "eval_ORGANIZATION_number": 65, "eval_ORGANIZATION_precision": 0.6923076923076923, "eval_ORGANIZATION_recall": 0.8307692307692308, "eval_PERSON_f1": 0.9120521172638437, "eval_PERSON_number": 150, "eval_PERSON_precision": 0.89171974522293, "eval_PERSON_recall": 0.9333333333333333, "eval_QUANTITY_f1": 0.7777777777777778, "eval_QUANTITY_number": 33, "eval_QUANTITY_precision": 0.717948717948718, "eval_QUANTITY_recall": 0.8484848484848485, "eval_TIME_f1": 0.8771929824561403, "eval_TIME_number": 28, "eval_TIME_precision": 0.8620689655172413, "eval_TIME_recall": 0.8928571428571429, "eval_loss": 0.22744058072566986, "eval_overall_accuracy": 0.9592628516003879, "eval_overall_f1": 0.8306010928961749, "eval_overall_precision": 0.7896103896103897, "eval_overall_recall": 0.8760806916426513, "eval_runtime": 0.407, "eval_samples_per_second": 459.405, "eval_steps_per_second": 7.37, "step": 10070 }, { "epoch": 96.0, "grad_norm": 4.114624500274658, "learning_rate": 2.0000000000000003e-06, "loss": 0.0098, "step": 10176 }, { "epoch": 96.0, "eval_LOCATION_f1": 0.7631578947368421, "eval_LOCATION_number": 71, "eval_LOCATION_precision": 0.7160493827160493, "eval_LOCATION_recall": 0.8169014084507042, "eval_ORGANIZATION_f1": 0.7692307692307693, "eval_ORGANIZATION_number": 65, "eval_ORGANIZATION_precision": 0.7051282051282052, "eval_ORGANIZATION_recall": 0.8461538461538461, "eval_PERSON_f1": 0.9155844155844156, "eval_PERSON_number": 150, "eval_PERSON_precision": 0.8924050632911392, "eval_PERSON_recall": 0.94, "eval_QUANTITY_f1": 0.7777777777777778, "eval_QUANTITY_number": 33, "eval_QUANTITY_precision": 0.717948717948718, "eval_QUANTITY_recall": 0.8484848484848485, "eval_TIME_f1": 0.8771929824561403, "eval_TIME_number": 28, "eval_TIME_precision": 0.8620689655172413, "eval_TIME_recall": 0.8928571428571429, "eval_loss": 0.22330667078495026, "eval_overall_accuracy": 0.9614451988360815, "eval_overall_f1": 0.8387978142076504, "eval_overall_precision": 0.7974025974025974, "eval_overall_recall": 0.8847262247838616, "eval_runtime": 0.4058, "eval_samples_per_second": 460.857, "eval_steps_per_second": 7.393, "step": 10176 }, { "epoch": 97.0, "grad_norm": 0.8480021953582764, "learning_rate": 1.5e-06, "loss": 0.0103, "step": 10282 }, { "epoch": 97.0, "eval_LOCATION_f1": 0.7549668874172185, "eval_LOCATION_number": 71, "eval_LOCATION_precision": 0.7125, "eval_LOCATION_recall": 0.8028169014084507, "eval_ORGANIZATION_f1": 0.763888888888889, "eval_ORGANIZATION_number": 65, "eval_ORGANIZATION_precision": 0.6962025316455697, "eval_ORGANIZATION_recall": 0.8461538461538461, "eval_PERSON_f1": 0.9061488673139159, "eval_PERSON_number": 150, "eval_PERSON_precision": 0.8805031446540881, "eval_PERSON_recall": 0.9333333333333333, "eval_QUANTITY_f1": 0.7777777777777778, "eval_QUANTITY_number": 33, "eval_QUANTITY_precision": 0.717948717948718, "eval_QUANTITY_recall": 0.8484848484848485, "eval_TIME_f1": 0.8275862068965518, "eval_TIME_number": 28, "eval_TIME_precision": 0.8, "eval_TIME_recall": 0.8571428571428571, "eval_loss": 0.22035245597362518, "eval_overall_accuracy": 0.9609602327837051, "eval_overall_f1": 0.8283378746594005, "eval_overall_precision": 0.7855297157622739, "eval_overall_recall": 0.8760806916426513, "eval_runtime": 0.4072, "eval_samples_per_second": 459.182, "eval_steps_per_second": 7.367, "step": 10282 }, { "epoch": 98.0, "grad_norm": 0.7559491395950317, "learning_rate": 1.0000000000000002e-06, "loss": 0.0102, "step": 10388 }, { "epoch": 98.0, "eval_LOCATION_f1": 0.7682119205298014, "eval_LOCATION_number": 71, "eval_LOCATION_precision": 0.725, "eval_LOCATION_recall": 0.8169014084507042, "eval_ORGANIZATION_f1": 0.763888888888889, "eval_ORGANIZATION_number": 65, "eval_ORGANIZATION_precision": 0.6962025316455697, "eval_ORGANIZATION_recall": 0.8461538461538461, "eval_PERSON_f1": 0.9155844155844156, "eval_PERSON_number": 150, "eval_PERSON_precision": 0.8924050632911392, "eval_PERSON_recall": 0.94, "eval_QUANTITY_f1": 0.7777777777777778, "eval_QUANTITY_number": 33, "eval_QUANTITY_precision": 0.717948717948718, "eval_QUANTITY_recall": 0.8484848484848485, "eval_TIME_f1": 0.8275862068965518, "eval_TIME_number": 28, "eval_TIME_precision": 0.8, "eval_TIME_recall": 0.8571428571428571, "eval_loss": 0.2218533307313919, "eval_overall_accuracy": 0.9612027158098934, "eval_overall_f1": 0.834924965893588, "eval_overall_precision": 0.7927461139896373, "eval_overall_recall": 0.8818443804034583, "eval_runtime": 0.4081, "eval_samples_per_second": 458.203, "eval_steps_per_second": 7.351, "step": 10388 }, { "epoch": 99.0, "grad_norm": 0.24367158114910126, "learning_rate": 5.000000000000001e-07, "loss": 0.0094, "step": 10494 }, { "epoch": 99.0, "eval_LOCATION_f1": 0.7549668874172185, "eval_LOCATION_number": 71, "eval_LOCATION_precision": 0.7125, "eval_LOCATION_recall": 0.8028169014084507, "eval_ORGANIZATION_f1": 0.763888888888889, "eval_ORGANIZATION_number": 65, "eval_ORGANIZATION_precision": 0.6962025316455697, "eval_ORGANIZATION_recall": 0.8461538461538461, "eval_PERSON_f1": 0.9155844155844156, "eval_PERSON_number": 150, "eval_PERSON_precision": 0.8924050632911392, "eval_PERSON_recall": 0.94, "eval_QUANTITY_f1": 0.7777777777777778, "eval_QUANTITY_number": 33, "eval_QUANTITY_precision": 0.717948717948718, "eval_QUANTITY_recall": 0.8484848484848485, "eval_TIME_f1": 0.8275862068965518, "eval_TIME_number": 28, "eval_TIME_precision": 0.8, "eval_TIME_recall": 0.8571428571428571, "eval_loss": 0.22336292266845703, "eval_overall_accuracy": 0.9609602327837051, "eval_overall_f1": 0.8321964529331515, "eval_overall_precision": 0.7901554404145078, "eval_overall_recall": 0.8789625360230547, "eval_runtime": 0.4081, "eval_samples_per_second": 458.197, "eval_steps_per_second": 7.351, "step": 10494 }, { "epoch": 100.0, "grad_norm": 0.0760447159409523, "learning_rate": 0.0, "loss": 0.0098, "step": 10600 }, { "epoch": 100.0, "eval_LOCATION_f1": 0.7682119205298014, "eval_LOCATION_number": 71, "eval_LOCATION_precision": 0.725, "eval_LOCATION_recall": 0.8169014084507042, "eval_ORGANIZATION_f1": 0.763888888888889, "eval_ORGANIZATION_number": 65, "eval_ORGANIZATION_precision": 0.6962025316455697, "eval_ORGANIZATION_recall": 0.8461538461538461, "eval_PERSON_f1": 0.9155844155844156, "eval_PERSON_number": 150, "eval_PERSON_precision": 0.8924050632911392, "eval_PERSON_recall": 0.94, "eval_QUANTITY_f1": 0.7777777777777778, "eval_QUANTITY_number": 33, "eval_QUANTITY_precision": 0.717948717948718, "eval_QUANTITY_recall": 0.8484848484848485, "eval_TIME_f1": 0.8275862068965518, "eval_TIME_number": 28, "eval_TIME_precision": 0.8, "eval_TIME_recall": 0.8571428571428571, "eval_loss": 0.22373317182064056, "eval_overall_accuracy": 0.9612027158098934, "eval_overall_f1": 0.834924965893588, "eval_overall_precision": 0.7927461139896373, "eval_overall_recall": 0.8818443804034583, "eval_runtime": 0.4055, "eval_samples_per_second": 461.127, "eval_steps_per_second": 7.398, "step": 10600 }, { "epoch": 100.0, "step": 10600, "total_flos": 5189413292285520.0, "train_loss": 0.055730826843459653, "train_runtime": 962.8691, "train_samples_per_second": 175.309, "train_steps_per_second": 11.009 } ], "logging_steps": 500, "max_steps": 10600, "num_input_tokens_seen": 0, "num_train_epochs": 100, "save_steps": 500, "total_flos": 5189413292285520.0, "train_batch_size": 16, "trial_name": null, "trial_params": null }