|
{ |
|
"best_metric": null, |
|
"best_model_checkpoint": null, |
|
"epoch": 100.0, |
|
"eval_steps": 500, |
|
"global_step": 10600, |
|
"is_hyper_param_search": false, |
|
"is_local_process_zero": true, |
|
"is_world_process_zero": true, |
|
"log_history": [ |
|
{ |
|
"epoch": 1.0, |
|
"grad_norm": 2.502664804458618, |
|
"learning_rate": 4.9500000000000004e-05, |
|
"loss": 0.9512, |
|
"step": 106 |
|
}, |
|
{ |
|
"epoch": 1.0, |
|
"eval_LOCATION_f1": 0.0, |
|
"eval_LOCATION_number": 71, |
|
"eval_LOCATION_precision": 0.0, |
|
"eval_LOCATION_recall": 0.0, |
|
"eval_ORGANIZATION_f1": 0.0, |
|
"eval_ORGANIZATION_number": 65, |
|
"eval_ORGANIZATION_precision": 0.0, |
|
"eval_ORGANIZATION_recall": 0.0, |
|
"eval_PERSON_f1": 0.013071895424836602, |
|
"eval_PERSON_number": 150, |
|
"eval_PERSON_precision": 0.3333333333333333, |
|
"eval_PERSON_recall": 0.006666666666666667, |
|
"eval_QUANTITY_f1": 0.0, |
|
"eval_QUANTITY_number": 33, |
|
"eval_QUANTITY_precision": 0.0, |
|
"eval_QUANTITY_recall": 0.0, |
|
"eval_TIME_f1": 0.0, |
|
"eval_TIME_number": 28, |
|
"eval_TIME_precision": 0.0, |
|
"eval_TIME_recall": 0.0, |
|
"eval_loss": 0.6040259599685669, |
|
"eval_overall_accuracy": 0.8411736178467507, |
|
"eval_overall_f1": 0.005714285714285714, |
|
"eval_overall_precision": 0.3333333333333333, |
|
"eval_overall_recall": 0.002881844380403458, |
|
"eval_runtime": 0.4042, |
|
"eval_samples_per_second": 462.684, |
|
"eval_steps_per_second": 7.423, |
|
"step": 106 |
|
}, |
|
{ |
|
"epoch": 2.0, |
|
"grad_norm": 1.1181972026824951, |
|
"learning_rate": 4.9e-05, |
|
"loss": 0.5021, |
|
"step": 212 |
|
}, |
|
{ |
|
"epoch": 2.0, |
|
"eval_LOCATION_f1": 0.467741935483871, |
|
"eval_LOCATION_number": 71, |
|
"eval_LOCATION_precision": 0.5471698113207547, |
|
"eval_LOCATION_recall": 0.4084507042253521, |
|
"eval_ORGANIZATION_f1": 0.203125, |
|
"eval_ORGANIZATION_number": 65, |
|
"eval_ORGANIZATION_precision": 0.20634920634920634, |
|
"eval_ORGANIZATION_recall": 0.2, |
|
"eval_PERSON_f1": 0.6997084548104956, |
|
"eval_PERSON_number": 150, |
|
"eval_PERSON_precision": 0.6217616580310881, |
|
"eval_PERSON_recall": 0.8, |
|
"eval_QUANTITY_f1": 0.1904761904761905, |
|
"eval_QUANTITY_number": 33, |
|
"eval_QUANTITY_precision": 0.2, |
|
"eval_QUANTITY_recall": 0.18181818181818182, |
|
"eval_TIME_f1": 0.49180327868852464, |
|
"eval_TIME_number": 28, |
|
"eval_TIME_precision": 0.45454545454545453, |
|
"eval_TIME_recall": 0.5357142857142857, |
|
"eval_loss": 0.3378148674964905, |
|
"eval_overall_accuracy": 0.9076139670223085, |
|
"eval_overall_f1": 0.5090403337969402, |
|
"eval_overall_precision": 0.49193548387096775, |
|
"eval_overall_recall": 0.5273775216138329, |
|
"eval_runtime": 0.4075, |
|
"eval_samples_per_second": 458.866, |
|
"eval_steps_per_second": 7.361, |
|
"step": 212 |
|
}, |
|
{ |
|
"epoch": 3.0, |
|
"grad_norm": 1.0774222612380981, |
|
"learning_rate": 4.85e-05, |
|
"loss": 0.2912, |
|
"step": 318 |
|
}, |
|
{ |
|
"epoch": 3.0, |
|
"eval_LOCATION_f1": 0.6289308176100629, |
|
"eval_LOCATION_number": 71, |
|
"eval_LOCATION_precision": 0.5681818181818182, |
|
"eval_LOCATION_recall": 0.704225352112676, |
|
"eval_ORGANIZATION_f1": 0.5970149253731344, |
|
"eval_ORGANIZATION_number": 65, |
|
"eval_ORGANIZATION_precision": 0.5797101449275363, |
|
"eval_ORGANIZATION_recall": 0.6153846153846154, |
|
"eval_PERSON_f1": 0.8291139240506329, |
|
"eval_PERSON_number": 150, |
|
"eval_PERSON_precision": 0.7891566265060241, |
|
"eval_PERSON_recall": 0.8733333333333333, |
|
"eval_QUANTITY_f1": 0.5405405405405406, |
|
"eval_QUANTITY_number": 33, |
|
"eval_QUANTITY_precision": 0.4878048780487805, |
|
"eval_QUANTITY_recall": 0.6060606060606061, |
|
"eval_TIME_f1": 0.830188679245283, |
|
"eval_TIME_number": 28, |
|
"eval_TIME_precision": 0.88, |
|
"eval_TIME_recall": 0.7857142857142857, |
|
"eval_loss": 0.18643514811992645, |
|
"eval_overall_accuracy": 0.9376818622696411, |
|
"eval_overall_f1": 0.7146739130434783, |
|
"eval_overall_precision": 0.6760925449871465, |
|
"eval_overall_recall": 0.7579250720461095, |
|
"eval_runtime": 0.4093, |
|
"eval_samples_per_second": 456.848, |
|
"eval_steps_per_second": 7.329, |
|
"step": 318 |
|
}, |
|
{ |
|
"epoch": 4.0, |
|
"grad_norm": 1.0147018432617188, |
|
"learning_rate": 4.8e-05, |
|
"loss": 0.1943, |
|
"step": 424 |
|
}, |
|
{ |
|
"epoch": 4.0, |
|
"eval_LOCATION_f1": 0.7142857142857142, |
|
"eval_LOCATION_number": 71, |
|
"eval_LOCATION_precision": 0.6185567010309279, |
|
"eval_LOCATION_recall": 0.8450704225352113, |
|
"eval_ORGANIZATION_f1": 0.6790123456790124, |
|
"eval_ORGANIZATION_number": 65, |
|
"eval_ORGANIZATION_precision": 0.5670103092783505, |
|
"eval_ORGANIZATION_recall": 0.8461538461538461, |
|
"eval_PERSON_f1": 0.85625, |
|
"eval_PERSON_number": 150, |
|
"eval_PERSON_precision": 0.8058823529411765, |
|
"eval_PERSON_recall": 0.9133333333333333, |
|
"eval_QUANTITY_f1": 0.6829268292682927, |
|
"eval_QUANTITY_number": 33, |
|
"eval_QUANTITY_precision": 0.5714285714285714, |
|
"eval_QUANTITY_recall": 0.8484848484848485, |
|
"eval_TIME_f1": 0.8571428571428571, |
|
"eval_TIME_number": 28, |
|
"eval_TIME_precision": 0.8571428571428571, |
|
"eval_TIME_recall": 0.8571428571428571, |
|
"eval_loss": 0.1579989790916443, |
|
"eval_overall_accuracy": 0.9478661493695442, |
|
"eval_overall_f1": 0.7715736040609138, |
|
"eval_overall_precision": 0.6893424036281179, |
|
"eval_overall_recall": 0.8760806916426513, |
|
"eval_runtime": 0.4082, |
|
"eval_samples_per_second": 458.117, |
|
"eval_steps_per_second": 7.349, |
|
"step": 424 |
|
}, |
|
{ |
|
"epoch": 5.0, |
|
"grad_norm": 1.6936546564102173, |
|
"learning_rate": 4.75e-05, |
|
"loss": 0.1653, |
|
"step": 530 |
|
}, |
|
{ |
|
"epoch": 5.0, |
|
"eval_LOCATION_f1": 0.7228915662650601, |
|
"eval_LOCATION_number": 71, |
|
"eval_LOCATION_precision": 0.631578947368421, |
|
"eval_LOCATION_recall": 0.8450704225352113, |
|
"eval_ORGANIZATION_f1": 0.6712328767123288, |
|
"eval_ORGANIZATION_number": 65, |
|
"eval_ORGANIZATION_precision": 0.6049382716049383, |
|
"eval_ORGANIZATION_recall": 0.7538461538461538, |
|
"eval_PERSON_f1": 0.8626198083067093, |
|
"eval_PERSON_number": 150, |
|
"eval_PERSON_precision": 0.8282208588957055, |
|
"eval_PERSON_recall": 0.9, |
|
"eval_QUANTITY_f1": 0.8, |
|
"eval_QUANTITY_number": 33, |
|
"eval_QUANTITY_precision": 0.7142857142857143, |
|
"eval_QUANTITY_recall": 0.9090909090909091, |
|
"eval_TIME_f1": 0.7999999999999999, |
|
"eval_TIME_number": 28, |
|
"eval_TIME_precision": 0.75, |
|
"eval_TIME_recall": 0.8571428571428571, |
|
"eval_loss": 0.13640257716178894, |
|
"eval_overall_accuracy": 0.9524733268671193, |
|
"eval_overall_f1": 0.7842105263157895, |
|
"eval_overall_precision": 0.7215496368038741, |
|
"eval_overall_recall": 0.8587896253602305, |
|
"eval_runtime": 0.4066, |
|
"eval_samples_per_second": 459.951, |
|
"eval_steps_per_second": 7.379, |
|
"step": 530 |
|
}, |
|
{ |
|
"epoch": 6.0, |
|
"grad_norm": 1.5403629541397095, |
|
"learning_rate": 4.7e-05, |
|
"loss": 0.152, |
|
"step": 636 |
|
}, |
|
{ |
|
"epoch": 6.0, |
|
"eval_LOCATION_f1": 0.7272727272727273, |
|
"eval_LOCATION_number": 71, |
|
"eval_LOCATION_precision": 0.6382978723404256, |
|
"eval_LOCATION_recall": 0.8450704225352113, |
|
"eval_ORGANIZATION_f1": 0.6666666666666667, |
|
"eval_ORGANIZATION_number": 65, |
|
"eval_ORGANIZATION_precision": 0.5567010309278351, |
|
"eval_ORGANIZATION_recall": 0.8307692307692308, |
|
"eval_PERSON_f1": 0.8553846153846154, |
|
"eval_PERSON_number": 150, |
|
"eval_PERSON_precision": 0.7942857142857143, |
|
"eval_PERSON_recall": 0.9266666666666666, |
|
"eval_QUANTITY_f1": 0.7088607594936709, |
|
"eval_QUANTITY_number": 33, |
|
"eval_QUANTITY_precision": 0.6086956521739131, |
|
"eval_QUANTITY_recall": 0.8484848484848485, |
|
"eval_TIME_f1": 0.6969696969696969, |
|
"eval_TIME_number": 28, |
|
"eval_TIME_precision": 0.6052631578947368, |
|
"eval_TIME_recall": 0.8214285714285714, |
|
"eval_loss": 0.15786363184452057, |
|
"eval_overall_accuracy": 0.944713870029098, |
|
"eval_overall_f1": 0.7628607277289837, |
|
"eval_overall_precision": 0.6755555555555556, |
|
"eval_overall_recall": 0.8760806916426513, |
|
"eval_runtime": 0.408, |
|
"eval_samples_per_second": 458.337, |
|
"eval_steps_per_second": 7.353, |
|
"step": 636 |
|
}, |
|
{ |
|
"epoch": 7.0, |
|
"grad_norm": 2.2046146392822266, |
|
"learning_rate": 4.6500000000000005e-05, |
|
"loss": 0.1379, |
|
"step": 742 |
|
}, |
|
{ |
|
"epoch": 7.0, |
|
"eval_LOCATION_f1": 0.7439024390243902, |
|
"eval_LOCATION_number": 71, |
|
"eval_LOCATION_precision": 0.6559139784946236, |
|
"eval_LOCATION_recall": 0.8591549295774648, |
|
"eval_ORGANIZATION_f1": 0.7012987012987013, |
|
"eval_ORGANIZATION_number": 65, |
|
"eval_ORGANIZATION_precision": 0.6067415730337079, |
|
"eval_ORGANIZATION_recall": 0.8307692307692308, |
|
"eval_PERSON_f1": 0.8553846153846154, |
|
"eval_PERSON_number": 150, |
|
"eval_PERSON_precision": 0.7942857142857143, |
|
"eval_PERSON_recall": 0.9266666666666666, |
|
"eval_QUANTITY_f1": 0.6341463414634148, |
|
"eval_QUANTITY_number": 33, |
|
"eval_QUANTITY_precision": 0.5306122448979592, |
|
"eval_QUANTITY_recall": 0.7878787878787878, |
|
"eval_TIME_f1": 0.7076923076923075, |
|
"eval_TIME_number": 28, |
|
"eval_TIME_precision": 0.6216216216216216, |
|
"eval_TIME_recall": 0.8214285714285714, |
|
"eval_loss": 0.15319040417671204, |
|
"eval_overall_accuracy": 0.9464112512124151, |
|
"eval_overall_f1": 0.7670886075949368, |
|
"eval_overall_precision": 0.6839729119638827, |
|
"eval_overall_recall": 0.8731988472622478, |
|
"eval_runtime": 0.4079, |
|
"eval_samples_per_second": 458.417, |
|
"eval_steps_per_second": 7.354, |
|
"step": 742 |
|
}, |
|
{ |
|
"epoch": 8.0, |
|
"grad_norm": 0.8930031061172485, |
|
"learning_rate": 4.600000000000001e-05, |
|
"loss": 0.125, |
|
"step": 848 |
|
}, |
|
{ |
|
"epoch": 8.0, |
|
"eval_LOCATION_f1": 0.7425149700598803, |
|
"eval_LOCATION_number": 71, |
|
"eval_LOCATION_precision": 0.6458333333333334, |
|
"eval_LOCATION_recall": 0.8732394366197183, |
|
"eval_ORGANIZATION_f1": 0.6962025316455697, |
|
"eval_ORGANIZATION_number": 65, |
|
"eval_ORGANIZATION_precision": 0.5913978494623656, |
|
"eval_ORGANIZATION_recall": 0.8461538461538461, |
|
"eval_PERSON_f1": 0.887459807073955, |
|
"eval_PERSON_number": 150, |
|
"eval_PERSON_precision": 0.8571428571428571, |
|
"eval_PERSON_recall": 0.92, |
|
"eval_QUANTITY_f1": 0.7605633802816901, |
|
"eval_QUANTITY_number": 33, |
|
"eval_QUANTITY_precision": 0.7105263157894737, |
|
"eval_QUANTITY_recall": 0.8181818181818182, |
|
"eval_TIME_f1": 0.7999999999999999, |
|
"eval_TIME_number": 28, |
|
"eval_TIME_precision": 0.75, |
|
"eval_TIME_recall": 0.8571428571428571, |
|
"eval_loss": 0.12710979580879211, |
|
"eval_overall_accuracy": 0.9561105722599418, |
|
"eval_overall_f1": 0.7979139504563234, |
|
"eval_overall_precision": 0.7285714285714285, |
|
"eval_overall_recall": 0.8818443804034583, |
|
"eval_runtime": 0.4046, |
|
"eval_samples_per_second": 462.173, |
|
"eval_steps_per_second": 7.415, |
|
"step": 848 |
|
}, |
|
{ |
|
"epoch": 9.0, |
|
"grad_norm": 1.0148112773895264, |
|
"learning_rate": 4.55e-05, |
|
"loss": 0.1161, |
|
"step": 954 |
|
}, |
|
{ |
|
"epoch": 9.0, |
|
"eval_LOCATION_f1": 0.7320261437908497, |
|
"eval_LOCATION_number": 71, |
|
"eval_LOCATION_precision": 0.6829268292682927, |
|
"eval_LOCATION_recall": 0.7887323943661971, |
|
"eval_ORGANIZATION_f1": 0.6707317073170732, |
|
"eval_ORGANIZATION_number": 65, |
|
"eval_ORGANIZATION_precision": 0.5555555555555556, |
|
"eval_ORGANIZATION_recall": 0.8461538461538461, |
|
"eval_PERSON_f1": 0.8846153846153846, |
|
"eval_PERSON_number": 150, |
|
"eval_PERSON_precision": 0.8518518518518519, |
|
"eval_PERSON_recall": 0.92, |
|
"eval_QUANTITY_f1": 0.7777777777777778, |
|
"eval_QUANTITY_number": 33, |
|
"eval_QUANTITY_precision": 0.717948717948718, |
|
"eval_QUANTITY_recall": 0.8484848484848485, |
|
"eval_TIME_f1": 0.8275862068965518, |
|
"eval_TIME_number": 28, |
|
"eval_TIME_precision": 0.8, |
|
"eval_TIME_recall": 0.8571428571428571, |
|
"eval_loss": 0.12680365145206451, |
|
"eval_overall_accuracy": 0.954898157129001, |
|
"eval_overall_f1": 0.793148880105402, |
|
"eval_overall_precision": 0.7305825242718447, |
|
"eval_overall_recall": 0.8674351585014409, |
|
"eval_runtime": 0.4068, |
|
"eval_samples_per_second": 459.728, |
|
"eval_steps_per_second": 7.375, |
|
"step": 954 |
|
}, |
|
{ |
|
"epoch": 10.0, |
|
"grad_norm": 1.5242857933044434, |
|
"learning_rate": 4.5e-05, |
|
"loss": 0.1124, |
|
"step": 1060 |
|
}, |
|
{ |
|
"epoch": 10.0, |
|
"eval_LOCATION_f1": 0.7532467532467533, |
|
"eval_LOCATION_number": 71, |
|
"eval_LOCATION_precision": 0.6987951807228916, |
|
"eval_LOCATION_recall": 0.8169014084507042, |
|
"eval_ORGANIZATION_f1": 0.7272727272727272, |
|
"eval_ORGANIZATION_number": 65, |
|
"eval_ORGANIZATION_precision": 0.6666666666666666, |
|
"eval_ORGANIZATION_recall": 0.8, |
|
"eval_PERSON_f1": 0.8860759493670886, |
|
"eval_PERSON_number": 150, |
|
"eval_PERSON_precision": 0.8433734939759037, |
|
"eval_PERSON_recall": 0.9333333333333333, |
|
"eval_QUANTITY_f1": 0.7567567567567567, |
|
"eval_QUANTITY_number": 33, |
|
"eval_QUANTITY_precision": 0.6829268292682927, |
|
"eval_QUANTITY_recall": 0.8484848484848485, |
|
"eval_TIME_f1": 0.7868852459016394, |
|
"eval_TIME_number": 28, |
|
"eval_TIME_precision": 0.7272727272727273, |
|
"eval_TIME_recall": 0.8571428571428571, |
|
"eval_loss": 0.12313192337751389, |
|
"eval_overall_accuracy": 0.9592628516003879, |
|
"eval_overall_f1": 0.8074866310160428, |
|
"eval_overall_precision": 0.7531172069825436, |
|
"eval_overall_recall": 0.8703170028818443, |
|
"eval_runtime": 0.4064, |
|
"eval_samples_per_second": 460.091, |
|
"eval_steps_per_second": 7.381, |
|
"step": 1060 |
|
}, |
|
{ |
|
"epoch": 11.0, |
|
"grad_norm": 0.9723674058914185, |
|
"learning_rate": 4.4500000000000004e-05, |
|
"loss": 0.1059, |
|
"step": 1166 |
|
}, |
|
{ |
|
"epoch": 11.0, |
|
"eval_LOCATION_f1": 0.7532467532467533, |
|
"eval_LOCATION_number": 71, |
|
"eval_LOCATION_precision": 0.6987951807228916, |
|
"eval_LOCATION_recall": 0.8169014084507042, |
|
"eval_ORGANIZATION_f1": 0.7142857142857142, |
|
"eval_ORGANIZATION_number": 65, |
|
"eval_ORGANIZATION_precision": 0.6666666666666666, |
|
"eval_ORGANIZATION_recall": 0.7692307692307693, |
|
"eval_PERSON_f1": 0.8903225806451613, |
|
"eval_PERSON_number": 150, |
|
"eval_PERSON_precision": 0.8625, |
|
"eval_PERSON_recall": 0.92, |
|
"eval_QUANTITY_f1": 0.7397260273972603, |
|
"eval_QUANTITY_number": 33, |
|
"eval_QUANTITY_precision": 0.675, |
|
"eval_QUANTITY_recall": 0.8181818181818182, |
|
"eval_TIME_f1": 0.7868852459016394, |
|
"eval_TIME_number": 28, |
|
"eval_TIME_precision": 0.7272727272727273, |
|
"eval_TIME_recall": 0.8571428571428571, |
|
"eval_loss": 0.1203012615442276, |
|
"eval_overall_accuracy": 0.9592628516003879, |
|
"eval_overall_f1": 0.8048780487804879, |
|
"eval_overall_precision": 0.7595907928388747, |
|
"eval_overall_recall": 0.8559077809798271, |
|
"eval_runtime": 0.4057, |
|
"eval_samples_per_second": 460.934, |
|
"eval_steps_per_second": 7.395, |
|
"step": 1166 |
|
}, |
|
{ |
|
"epoch": 12.0, |
|
"grad_norm": 1.34227454662323, |
|
"learning_rate": 4.4000000000000006e-05, |
|
"loss": 0.0975, |
|
"step": 1272 |
|
}, |
|
{ |
|
"epoch": 12.0, |
|
"eval_LOCATION_f1": 0.7341772151898733, |
|
"eval_LOCATION_number": 71, |
|
"eval_LOCATION_precision": 0.6666666666666666, |
|
"eval_LOCATION_recall": 0.8169014084507042, |
|
"eval_ORGANIZATION_f1": 0.6956521739130436, |
|
"eval_ORGANIZATION_number": 65, |
|
"eval_ORGANIZATION_precision": 0.5833333333333334, |
|
"eval_ORGANIZATION_recall": 0.8615384615384616, |
|
"eval_PERSON_f1": 0.86875, |
|
"eval_PERSON_number": 150, |
|
"eval_PERSON_precision": 0.8176470588235294, |
|
"eval_PERSON_recall": 0.9266666666666666, |
|
"eval_QUANTITY_f1": 0.7887323943661972, |
|
"eval_QUANTITY_number": 33, |
|
"eval_QUANTITY_precision": 0.7368421052631579, |
|
"eval_QUANTITY_recall": 0.8484848484848485, |
|
"eval_TIME_f1": 0.78125, |
|
"eval_TIME_number": 28, |
|
"eval_TIME_precision": 0.6944444444444444, |
|
"eval_TIME_recall": 0.8928571428571429, |
|
"eval_loss": 0.1370622217655182, |
|
"eval_overall_accuracy": 0.9527158098933075, |
|
"eval_overall_f1": 0.7906976744186047, |
|
"eval_overall_precision": 0.7166276346604216, |
|
"eval_overall_recall": 0.8818443804034583, |
|
"eval_runtime": 0.4061, |
|
"eval_samples_per_second": 460.527, |
|
"eval_steps_per_second": 7.388, |
|
"step": 1272 |
|
}, |
|
{ |
|
"epoch": 13.0, |
|
"grad_norm": 0.8592511415481567, |
|
"learning_rate": 4.35e-05, |
|
"loss": 0.0915, |
|
"step": 1378 |
|
}, |
|
{ |
|
"epoch": 13.0, |
|
"eval_LOCATION_f1": 0.7712418300653594, |
|
"eval_LOCATION_number": 71, |
|
"eval_LOCATION_precision": 0.7195121951219512, |
|
"eval_LOCATION_recall": 0.8309859154929577, |
|
"eval_ORGANIZATION_f1": 0.7199999999999999, |
|
"eval_ORGANIZATION_number": 65, |
|
"eval_ORGANIZATION_precision": 0.6352941176470588, |
|
"eval_ORGANIZATION_recall": 0.8307692307692308, |
|
"eval_PERSON_f1": 0.8952380952380952, |
|
"eval_PERSON_number": 150, |
|
"eval_PERSON_precision": 0.8545454545454545, |
|
"eval_PERSON_recall": 0.94, |
|
"eval_QUANTITY_f1": 0.7605633802816901, |
|
"eval_QUANTITY_number": 33, |
|
"eval_QUANTITY_precision": 0.7105263157894737, |
|
"eval_QUANTITY_recall": 0.8181818181818182, |
|
"eval_TIME_f1": 0.9090909090909091, |
|
"eval_TIME_number": 28, |
|
"eval_TIME_precision": 0.9259259259259259, |
|
"eval_TIME_recall": 0.8928571428571429, |
|
"eval_loss": 0.12159363925457001, |
|
"eval_overall_accuracy": 0.9609602327837051, |
|
"eval_overall_f1": 0.8225806451612904, |
|
"eval_overall_precision": 0.7707808564231738, |
|
"eval_overall_recall": 0.8818443804034583, |
|
"eval_runtime": 0.4059, |
|
"eval_samples_per_second": 460.692, |
|
"eval_steps_per_second": 7.391, |
|
"step": 1378 |
|
}, |
|
{ |
|
"epoch": 14.0, |
|
"grad_norm": 3.151130437850952, |
|
"learning_rate": 4.3e-05, |
|
"loss": 0.0913, |
|
"step": 1484 |
|
}, |
|
{ |
|
"epoch": 14.0, |
|
"eval_LOCATION_f1": 0.76, |
|
"eval_LOCATION_number": 71, |
|
"eval_LOCATION_precision": 0.7215189873417721, |
|
"eval_LOCATION_recall": 0.8028169014084507, |
|
"eval_ORGANIZATION_f1": 0.7464788732394366, |
|
"eval_ORGANIZATION_number": 65, |
|
"eval_ORGANIZATION_precision": 0.6883116883116883, |
|
"eval_ORGANIZATION_recall": 0.8153846153846154, |
|
"eval_PERSON_f1": 0.9032258064516129, |
|
"eval_PERSON_number": 150, |
|
"eval_PERSON_precision": 0.875, |
|
"eval_PERSON_recall": 0.9333333333333333, |
|
"eval_QUANTITY_f1": 0.8169014084507042, |
|
"eval_QUANTITY_number": 33, |
|
"eval_QUANTITY_precision": 0.7631578947368421, |
|
"eval_QUANTITY_recall": 0.8787878787878788, |
|
"eval_TIME_f1": 0.888888888888889, |
|
"eval_TIME_number": 28, |
|
"eval_TIME_precision": 0.9230769230769231, |
|
"eval_TIME_recall": 0.8571428571428571, |
|
"eval_loss": 0.11676321178674698, |
|
"eval_overall_accuracy": 0.9629000969932104, |
|
"eval_overall_f1": 0.8335625859697388, |
|
"eval_overall_precision": 0.7973684210526316, |
|
"eval_overall_recall": 0.8731988472622478, |
|
"eval_runtime": 0.4073, |
|
"eval_samples_per_second": 459.097, |
|
"eval_steps_per_second": 7.365, |
|
"step": 1484 |
|
}, |
|
{ |
|
"epoch": 15.0, |
|
"grad_norm": 1.3836969137191772, |
|
"learning_rate": 4.25e-05, |
|
"loss": 0.0853, |
|
"step": 1590 |
|
}, |
|
{ |
|
"epoch": 15.0, |
|
"eval_LOCATION_f1": 0.794701986754967, |
|
"eval_LOCATION_number": 71, |
|
"eval_LOCATION_precision": 0.75, |
|
"eval_LOCATION_recall": 0.8450704225352113, |
|
"eval_ORGANIZATION_f1": 0.738255033557047, |
|
"eval_ORGANIZATION_number": 65, |
|
"eval_ORGANIZATION_precision": 0.6547619047619048, |
|
"eval_ORGANIZATION_recall": 0.8461538461538461, |
|
"eval_PERSON_f1": 0.887459807073955, |
|
"eval_PERSON_number": 150, |
|
"eval_PERSON_precision": 0.8571428571428571, |
|
"eval_PERSON_recall": 0.92, |
|
"eval_QUANTITY_f1": 0.7837837837837839, |
|
"eval_QUANTITY_number": 33, |
|
"eval_QUANTITY_precision": 0.7073170731707317, |
|
"eval_QUANTITY_recall": 0.8787878787878788, |
|
"eval_TIME_f1": 0.8333333333333334, |
|
"eval_TIME_number": 28, |
|
"eval_TIME_precision": 0.78125, |
|
"eval_TIME_recall": 0.8928571428571429, |
|
"eval_loss": 0.12170998007059097, |
|
"eval_overall_accuracy": 0.9604752667313288, |
|
"eval_overall_f1": 0.8241610738255033, |
|
"eval_overall_precision": 0.7713567839195979, |
|
"eval_overall_recall": 0.8847262247838616, |
|
"eval_runtime": 0.412, |
|
"eval_samples_per_second": 453.856, |
|
"eval_steps_per_second": 7.281, |
|
"step": 1590 |
|
}, |
|
{ |
|
"epoch": 16.0, |
|
"grad_norm": 1.1944974660873413, |
|
"learning_rate": 4.2e-05, |
|
"loss": 0.0809, |
|
"step": 1696 |
|
}, |
|
{ |
|
"epoch": 16.0, |
|
"eval_LOCATION_f1": 0.782051282051282, |
|
"eval_LOCATION_number": 71, |
|
"eval_LOCATION_precision": 0.7176470588235294, |
|
"eval_LOCATION_recall": 0.8591549295774648, |
|
"eval_ORGANIZATION_f1": 0.7516778523489933, |
|
"eval_ORGANIZATION_number": 65, |
|
"eval_ORGANIZATION_precision": 0.6666666666666666, |
|
"eval_ORGANIZATION_recall": 0.8615384615384616, |
|
"eval_PERSON_f1": 0.8853503184713376, |
|
"eval_PERSON_number": 150, |
|
"eval_PERSON_precision": 0.8475609756097561, |
|
"eval_PERSON_recall": 0.9266666666666666, |
|
"eval_QUANTITY_f1": 0.7200000000000001, |
|
"eval_QUANTITY_number": 33, |
|
"eval_QUANTITY_precision": 0.6428571428571429, |
|
"eval_QUANTITY_recall": 0.8181818181818182, |
|
"eval_TIME_f1": 0.8474576271186439, |
|
"eval_TIME_number": 28, |
|
"eval_TIME_precision": 0.8064516129032258, |
|
"eval_TIME_recall": 0.8928571428571429, |
|
"eval_loss": 0.13052447140216827, |
|
"eval_overall_accuracy": 0.9590203685741998, |
|
"eval_overall_f1": 0.8180610889774237, |
|
"eval_overall_precision": 0.7586206896551724, |
|
"eval_overall_recall": 0.8876080691642652, |
|
"eval_runtime": 0.4077, |
|
"eval_samples_per_second": 458.719, |
|
"eval_steps_per_second": 7.359, |
|
"step": 1696 |
|
}, |
|
{ |
|
"epoch": 17.0, |
|
"grad_norm": 1.1874595880508423, |
|
"learning_rate": 4.15e-05, |
|
"loss": 0.0773, |
|
"step": 1802 |
|
}, |
|
{ |
|
"epoch": 17.0, |
|
"eval_LOCATION_f1": 0.7692307692307694, |
|
"eval_LOCATION_number": 71, |
|
"eval_LOCATION_precision": 0.7058823529411765, |
|
"eval_LOCATION_recall": 0.8450704225352113, |
|
"eval_ORGANIZATION_f1": 0.7058823529411765, |
|
"eval_ORGANIZATION_number": 65, |
|
"eval_ORGANIZATION_precision": 0.6136363636363636, |
|
"eval_ORGANIZATION_recall": 0.8307692307692308, |
|
"eval_PERSON_f1": 0.8980891719745222, |
|
"eval_PERSON_number": 150, |
|
"eval_PERSON_precision": 0.8597560975609756, |
|
"eval_PERSON_recall": 0.94, |
|
"eval_QUANTITY_f1": 0.7777777777777778, |
|
"eval_QUANTITY_number": 33, |
|
"eval_QUANTITY_precision": 0.717948717948718, |
|
"eval_QUANTITY_recall": 0.8484848484848485, |
|
"eval_TIME_f1": 0.819672131147541, |
|
"eval_TIME_number": 28, |
|
"eval_TIME_precision": 0.7575757575757576, |
|
"eval_TIME_recall": 0.8928571428571429, |
|
"eval_loss": 0.12760519981384277, |
|
"eval_overall_accuracy": 0.9590203685741998, |
|
"eval_overall_f1": 0.8148148148148148, |
|
"eval_overall_precision": 0.7530562347188264, |
|
"eval_overall_recall": 0.8876080691642652, |
|
"eval_runtime": 0.4077, |
|
"eval_samples_per_second": 458.725, |
|
"eval_steps_per_second": 7.359, |
|
"step": 1802 |
|
}, |
|
{ |
|
"epoch": 18.0, |
|
"grad_norm": 1.0034806728363037, |
|
"learning_rate": 4.1e-05, |
|
"loss": 0.0737, |
|
"step": 1908 |
|
}, |
|
{ |
|
"epoch": 18.0, |
|
"eval_LOCATION_f1": 0.7407407407407407, |
|
"eval_LOCATION_number": 71, |
|
"eval_LOCATION_precision": 0.6593406593406593, |
|
"eval_LOCATION_recall": 0.8450704225352113, |
|
"eval_ORGANIZATION_f1": 0.6967741935483871, |
|
"eval_ORGANIZATION_number": 65, |
|
"eval_ORGANIZATION_precision": 0.6, |
|
"eval_ORGANIZATION_recall": 0.8307692307692308, |
|
"eval_PERSON_f1": 0.8840125391849529, |
|
"eval_PERSON_number": 150, |
|
"eval_PERSON_precision": 0.834319526627219, |
|
"eval_PERSON_recall": 0.94, |
|
"eval_QUANTITY_f1": 0.7105263157894738, |
|
"eval_QUANTITY_number": 33, |
|
"eval_QUANTITY_precision": 0.627906976744186, |
|
"eval_QUANTITY_recall": 0.8181818181818182, |
|
"eval_TIME_f1": 0.7796610169491526, |
|
"eval_TIME_number": 28, |
|
"eval_TIME_precision": 0.7419354838709677, |
|
"eval_TIME_recall": 0.8214285714285714, |
|
"eval_loss": 0.15325599908828735, |
|
"eval_overall_accuracy": 0.9493210475266731, |
|
"eval_overall_f1": 0.7911802853437095, |
|
"eval_overall_precision": 0.7193396226415094, |
|
"eval_overall_recall": 0.8789625360230547, |
|
"eval_runtime": 0.4065, |
|
"eval_samples_per_second": 460.02, |
|
"eval_steps_per_second": 7.38, |
|
"step": 1908 |
|
}, |
|
{ |
|
"epoch": 19.0, |
|
"grad_norm": 1.108689785003662, |
|
"learning_rate": 4.05e-05, |
|
"loss": 0.0703, |
|
"step": 2014 |
|
}, |
|
{ |
|
"epoch": 19.0, |
|
"eval_LOCATION_f1": 0.778523489932886, |
|
"eval_LOCATION_number": 71, |
|
"eval_LOCATION_precision": 0.7435897435897436, |
|
"eval_LOCATION_recall": 0.8169014084507042, |
|
"eval_ORGANIZATION_f1": 0.7534246575342466, |
|
"eval_ORGANIZATION_number": 65, |
|
"eval_ORGANIZATION_precision": 0.6790123456790124, |
|
"eval_ORGANIZATION_recall": 0.8461538461538461, |
|
"eval_PERSON_f1": 0.8990228013029316, |
|
"eval_PERSON_number": 150, |
|
"eval_PERSON_precision": 0.8789808917197452, |
|
"eval_PERSON_recall": 0.92, |
|
"eval_QUANTITY_f1": 0.7671232876712328, |
|
"eval_QUANTITY_number": 33, |
|
"eval_QUANTITY_precision": 0.7, |
|
"eval_QUANTITY_recall": 0.8484848484848485, |
|
"eval_TIME_f1": 0.8571428571428571, |
|
"eval_TIME_number": 28, |
|
"eval_TIME_precision": 0.8571428571428571, |
|
"eval_TIME_recall": 0.8571428571428571, |
|
"eval_loss": 0.1193038821220398, |
|
"eval_overall_accuracy": 0.9631425800193987, |
|
"eval_overall_f1": 0.8290013679890561, |
|
"eval_overall_precision": 0.7890625, |
|
"eval_overall_recall": 0.8731988472622478, |
|
"eval_runtime": 0.408, |
|
"eval_samples_per_second": 458.324, |
|
"eval_steps_per_second": 7.353, |
|
"step": 2014 |
|
}, |
|
{ |
|
"epoch": 20.0, |
|
"grad_norm": 1.1755281686782837, |
|
"learning_rate": 4e-05, |
|
"loss": 0.0713, |
|
"step": 2120 |
|
}, |
|
{ |
|
"epoch": 20.0, |
|
"eval_LOCATION_f1": 0.7922077922077921, |
|
"eval_LOCATION_number": 71, |
|
"eval_LOCATION_precision": 0.7349397590361446, |
|
"eval_LOCATION_recall": 0.8591549295774648, |
|
"eval_ORGANIZATION_f1": 0.7236842105263158, |
|
"eval_ORGANIZATION_number": 65, |
|
"eval_ORGANIZATION_precision": 0.632183908045977, |
|
"eval_ORGANIZATION_recall": 0.8461538461538461, |
|
"eval_PERSON_f1": 0.912621359223301, |
|
"eval_PERSON_number": 150, |
|
"eval_PERSON_precision": 0.8867924528301887, |
|
"eval_PERSON_recall": 0.94, |
|
"eval_QUANTITY_f1": 0.7105263157894738, |
|
"eval_QUANTITY_number": 33, |
|
"eval_QUANTITY_precision": 0.627906976744186, |
|
"eval_QUANTITY_recall": 0.8181818181818182, |
|
"eval_TIME_f1": 0.9259259259259259, |
|
"eval_TIME_number": 28, |
|
"eval_TIME_precision": 0.9615384615384616, |
|
"eval_TIME_recall": 0.8928571428571429, |
|
"eval_loss": 0.12470389902591705, |
|
"eval_overall_accuracy": 0.9624151309408342, |
|
"eval_overall_f1": 0.829530201342282, |
|
"eval_overall_precision": 0.7763819095477387, |
|
"eval_overall_recall": 0.8904899135446686, |
|
"eval_runtime": 0.4074, |
|
"eval_samples_per_second": 458.981, |
|
"eval_steps_per_second": 7.363, |
|
"step": 2120 |
|
}, |
|
{ |
|
"epoch": 21.0, |
|
"grad_norm": 1.2563973665237427, |
|
"learning_rate": 3.9500000000000005e-05, |
|
"loss": 0.0649, |
|
"step": 2226 |
|
}, |
|
{ |
|
"epoch": 21.0, |
|
"eval_LOCATION_f1": 0.7770700636942676, |
|
"eval_LOCATION_number": 71, |
|
"eval_LOCATION_precision": 0.7093023255813954, |
|
"eval_LOCATION_recall": 0.8591549295774648, |
|
"eval_ORGANIZATION_f1": 0.7, |
|
"eval_ORGANIZATION_number": 65, |
|
"eval_ORGANIZATION_precision": 0.5894736842105263, |
|
"eval_ORGANIZATION_recall": 0.8615384615384616, |
|
"eval_PERSON_f1": 0.896774193548387, |
|
"eval_PERSON_number": 150, |
|
"eval_PERSON_precision": 0.86875, |
|
"eval_PERSON_recall": 0.9266666666666666, |
|
"eval_QUANTITY_f1": 0.7466666666666666, |
|
"eval_QUANTITY_number": 33, |
|
"eval_QUANTITY_precision": 0.6666666666666666, |
|
"eval_QUANTITY_recall": 0.8484848484848485, |
|
"eval_TIME_f1": 0.8135593220338982, |
|
"eval_TIME_number": 28, |
|
"eval_TIME_precision": 0.7741935483870968, |
|
"eval_TIME_recall": 0.8571428571428571, |
|
"eval_loss": 0.13802851736545563, |
|
"eval_overall_accuracy": 0.95635305528613, |
|
"eval_overall_f1": 0.80946123521682, |
|
"eval_overall_precision": 0.7439613526570048, |
|
"eval_overall_recall": 0.8876080691642652, |
|
"eval_runtime": 0.4074, |
|
"eval_samples_per_second": 459.06, |
|
"eval_steps_per_second": 7.365, |
|
"step": 2226 |
|
}, |
|
{ |
|
"epoch": 22.0, |
|
"grad_norm": 0.8472046852111816, |
|
"learning_rate": 3.9000000000000006e-05, |
|
"loss": 0.0645, |
|
"step": 2332 |
|
}, |
|
{ |
|
"epoch": 22.0, |
|
"eval_LOCATION_f1": 0.75, |
|
"eval_LOCATION_number": 71, |
|
"eval_LOCATION_precision": 0.7037037037037037, |
|
"eval_LOCATION_recall": 0.8028169014084507, |
|
"eval_ORGANIZATION_f1": 0.738255033557047, |
|
"eval_ORGANIZATION_number": 65, |
|
"eval_ORGANIZATION_precision": 0.6547619047619048, |
|
"eval_ORGANIZATION_recall": 0.8461538461538461, |
|
"eval_PERSON_f1": 0.9155844155844156, |
|
"eval_PERSON_number": 150, |
|
"eval_PERSON_precision": 0.8924050632911392, |
|
"eval_PERSON_recall": 0.94, |
|
"eval_QUANTITY_f1": 0.7200000000000001, |
|
"eval_QUANTITY_number": 33, |
|
"eval_QUANTITY_precision": 0.6428571428571429, |
|
"eval_QUANTITY_recall": 0.8181818181818182, |
|
"eval_TIME_f1": 0.8620689655172413, |
|
"eval_TIME_number": 28, |
|
"eval_TIME_precision": 0.8333333333333334, |
|
"eval_TIME_recall": 0.8928571428571429, |
|
"eval_loss": 0.14445021748542786, |
|
"eval_overall_accuracy": 0.9587778855480117, |
|
"eval_overall_f1": 0.8221024258760108, |
|
"eval_overall_precision": 0.7721518987341772, |
|
"eval_overall_recall": 0.8789625360230547, |
|
"eval_runtime": 0.4092, |
|
"eval_samples_per_second": 456.965, |
|
"eval_steps_per_second": 7.331, |
|
"step": 2332 |
|
}, |
|
{ |
|
"epoch": 23.0, |
|
"grad_norm": 1.0579193830490112, |
|
"learning_rate": 3.85e-05, |
|
"loss": 0.0595, |
|
"step": 2438 |
|
}, |
|
{ |
|
"epoch": 23.0, |
|
"eval_LOCATION_f1": 0.759493670886076, |
|
"eval_LOCATION_number": 71, |
|
"eval_LOCATION_precision": 0.6896551724137931, |
|
"eval_LOCATION_recall": 0.8450704225352113, |
|
"eval_ORGANIZATION_f1": 0.7058823529411765, |
|
"eval_ORGANIZATION_number": 65, |
|
"eval_ORGANIZATION_precision": 0.6136363636363636, |
|
"eval_ORGANIZATION_recall": 0.8307692307692308, |
|
"eval_PERSON_f1": 0.9155844155844156, |
|
"eval_PERSON_number": 150, |
|
"eval_PERSON_precision": 0.8924050632911392, |
|
"eval_PERSON_recall": 0.94, |
|
"eval_QUANTITY_f1": 0.8055555555555556, |
|
"eval_QUANTITY_number": 33, |
|
"eval_QUANTITY_precision": 0.7435897435897436, |
|
"eval_QUANTITY_recall": 0.8787878787878788, |
|
"eval_TIME_f1": 0.9090909090909091, |
|
"eval_TIME_number": 28, |
|
"eval_TIME_precision": 0.9259259259259259, |
|
"eval_TIME_recall": 0.8928571428571429, |
|
"eval_loss": 0.13738445937633514, |
|
"eval_overall_accuracy": 0.962172647914646, |
|
"eval_overall_f1": 0.8284182305630027, |
|
"eval_overall_precision": 0.7744360902255639, |
|
"eval_overall_recall": 0.8904899135446686, |
|
"eval_runtime": 0.4089, |
|
"eval_samples_per_second": 457.323, |
|
"eval_steps_per_second": 7.337, |
|
"step": 2438 |
|
}, |
|
{ |
|
"epoch": 24.0, |
|
"grad_norm": 1.30304753780365, |
|
"learning_rate": 3.8e-05, |
|
"loss": 0.0576, |
|
"step": 2544 |
|
}, |
|
{ |
|
"epoch": 24.0, |
|
"eval_LOCATION_f1": 0.7692307692307694, |
|
"eval_LOCATION_number": 71, |
|
"eval_LOCATION_precision": 0.7058823529411765, |
|
"eval_LOCATION_recall": 0.8450704225352113, |
|
"eval_ORGANIZATION_f1": 0.7172413793103448, |
|
"eval_ORGANIZATION_number": 65, |
|
"eval_ORGANIZATION_precision": 0.65, |
|
"eval_ORGANIZATION_recall": 0.8, |
|
"eval_PERSON_f1": 0.90032154340836, |
|
"eval_PERSON_number": 150, |
|
"eval_PERSON_precision": 0.8695652173913043, |
|
"eval_PERSON_recall": 0.9333333333333333, |
|
"eval_QUANTITY_f1": 0.8000000000000002, |
|
"eval_QUANTITY_number": 33, |
|
"eval_QUANTITY_precision": 0.7567567567567568, |
|
"eval_QUANTITY_recall": 0.8484848484848485, |
|
"eval_TIME_f1": 0.9090909090909091, |
|
"eval_TIME_number": 28, |
|
"eval_TIME_precision": 0.9259259259259259, |
|
"eval_TIME_recall": 0.8928571428571429, |
|
"eval_loss": 0.14021030068397522, |
|
"eval_overall_accuracy": 0.9590203685741998, |
|
"eval_overall_f1": 0.8276797829036635, |
|
"eval_overall_precision": 0.782051282051282, |
|
"eval_overall_recall": 0.8789625360230547, |
|
"eval_runtime": 0.408, |
|
"eval_samples_per_second": 458.303, |
|
"eval_steps_per_second": 7.352, |
|
"step": 2544 |
|
}, |
|
{ |
|
"epoch": 25.0, |
|
"grad_norm": 0.7619758248329163, |
|
"learning_rate": 3.7500000000000003e-05, |
|
"loss": 0.0562, |
|
"step": 2650 |
|
}, |
|
{ |
|
"epoch": 25.0, |
|
"eval_LOCATION_f1": 0.7692307692307694, |
|
"eval_LOCATION_number": 71, |
|
"eval_LOCATION_precision": 0.7058823529411765, |
|
"eval_LOCATION_recall": 0.8450704225352113, |
|
"eval_ORGANIZATION_f1": 0.708860759493671, |
|
"eval_ORGANIZATION_number": 65, |
|
"eval_ORGANIZATION_precision": 0.6021505376344086, |
|
"eval_ORGANIZATION_recall": 0.8615384615384616, |
|
"eval_PERSON_f1": 0.9032258064516129, |
|
"eval_PERSON_number": 150, |
|
"eval_PERSON_precision": 0.875, |
|
"eval_PERSON_recall": 0.9333333333333333, |
|
"eval_QUANTITY_f1": 0.7105263157894738, |
|
"eval_QUANTITY_number": 33, |
|
"eval_QUANTITY_precision": 0.627906976744186, |
|
"eval_QUANTITY_recall": 0.8181818181818182, |
|
"eval_TIME_f1": 0.819672131147541, |
|
"eval_TIME_number": 28, |
|
"eval_TIME_precision": 0.7575757575757576, |
|
"eval_TIME_recall": 0.8928571428571429, |
|
"eval_loss": 0.15844029188156128, |
|
"eval_overall_accuracy": 0.9553831231813773, |
|
"eval_overall_f1": 0.80946123521682, |
|
"eval_overall_precision": 0.7439613526570048, |
|
"eval_overall_recall": 0.8876080691642652, |
|
"eval_runtime": 0.4076, |
|
"eval_samples_per_second": 458.809, |
|
"eval_steps_per_second": 7.361, |
|
"step": 2650 |
|
}, |
|
{ |
|
"epoch": 26.0, |
|
"grad_norm": 0.3145362138748169, |
|
"learning_rate": 3.7e-05, |
|
"loss": 0.0533, |
|
"step": 2756 |
|
}, |
|
{ |
|
"epoch": 26.0, |
|
"eval_LOCATION_f1": 0.7466666666666666, |
|
"eval_LOCATION_number": 71, |
|
"eval_LOCATION_precision": 0.7088607594936709, |
|
"eval_LOCATION_recall": 0.7887323943661971, |
|
"eval_ORGANIZATION_f1": 0.7248322147651007, |
|
"eval_ORGANIZATION_number": 65, |
|
"eval_ORGANIZATION_precision": 0.6428571428571429, |
|
"eval_ORGANIZATION_recall": 0.8307692307692308, |
|
"eval_PERSON_f1": 0.888888888888889, |
|
"eval_PERSON_number": 150, |
|
"eval_PERSON_precision": 0.8484848484848485, |
|
"eval_PERSON_recall": 0.9333333333333333, |
|
"eval_QUANTITY_f1": 0.6842105263157895, |
|
"eval_QUANTITY_number": 33, |
|
"eval_QUANTITY_precision": 0.6046511627906976, |
|
"eval_QUANTITY_recall": 0.7878787878787878, |
|
"eval_TIME_f1": 0.8771929824561403, |
|
"eval_TIME_number": 28, |
|
"eval_TIME_precision": 0.8620689655172413, |
|
"eval_TIME_recall": 0.8928571428571429, |
|
"eval_loss": 0.1501431167125702, |
|
"eval_overall_accuracy": 0.9539282250242483, |
|
"eval_overall_f1": 0.8058902275769746, |
|
"eval_overall_precision": 0.7525, |
|
"eval_overall_recall": 0.8674351585014409, |
|
"eval_runtime": 0.4072, |
|
"eval_samples_per_second": 459.248, |
|
"eval_steps_per_second": 7.368, |
|
"step": 2756 |
|
}, |
|
{ |
|
"epoch": 27.0, |
|
"grad_norm": 1.4819648265838623, |
|
"learning_rate": 3.65e-05, |
|
"loss": 0.0529, |
|
"step": 2862 |
|
}, |
|
{ |
|
"epoch": 27.0, |
|
"eval_LOCATION_f1": 0.7770700636942676, |
|
"eval_LOCATION_number": 71, |
|
"eval_LOCATION_precision": 0.7093023255813954, |
|
"eval_LOCATION_recall": 0.8591549295774648, |
|
"eval_ORGANIZATION_f1": 0.7320261437908497, |
|
"eval_ORGANIZATION_number": 65, |
|
"eval_ORGANIZATION_precision": 0.6363636363636364, |
|
"eval_ORGANIZATION_recall": 0.8615384615384616, |
|
"eval_PERSON_f1": 0.896774193548387, |
|
"eval_PERSON_number": 150, |
|
"eval_PERSON_precision": 0.86875, |
|
"eval_PERSON_recall": 0.9266666666666666, |
|
"eval_QUANTITY_f1": 0.7466666666666666, |
|
"eval_QUANTITY_number": 33, |
|
"eval_QUANTITY_precision": 0.6666666666666666, |
|
"eval_QUANTITY_recall": 0.8484848484848485, |
|
"eval_TIME_f1": 0.8928571428571429, |
|
"eval_TIME_number": 28, |
|
"eval_TIME_precision": 0.8928571428571429, |
|
"eval_TIME_recall": 0.8928571428571429, |
|
"eval_loss": 0.15187156200408936, |
|
"eval_overall_accuracy": 0.9575654704170709, |
|
"eval_overall_f1": 0.8229027962716378, |
|
"eval_overall_precision": 0.7648514851485149, |
|
"eval_overall_recall": 0.8904899135446686, |
|
"eval_runtime": 0.4068, |
|
"eval_samples_per_second": 459.716, |
|
"eval_steps_per_second": 7.375, |
|
"step": 2862 |
|
}, |
|
{ |
|
"epoch": 28.0, |
|
"grad_norm": 0.8129953145980835, |
|
"learning_rate": 3.6e-05, |
|
"loss": 0.0531, |
|
"step": 2968 |
|
}, |
|
{ |
|
"epoch": 28.0, |
|
"eval_LOCATION_f1": 0.802721088435374, |
|
"eval_LOCATION_number": 71, |
|
"eval_LOCATION_precision": 0.7763157894736842, |
|
"eval_LOCATION_recall": 0.8309859154929577, |
|
"eval_ORGANIZATION_f1": 0.7702702702702702, |
|
"eval_ORGANIZATION_number": 65, |
|
"eval_ORGANIZATION_precision": 0.6867469879518072, |
|
"eval_ORGANIZATION_recall": 0.8769230769230769, |
|
"eval_PERSON_f1": 0.8903225806451613, |
|
"eval_PERSON_number": 150, |
|
"eval_PERSON_precision": 0.8625, |
|
"eval_PERSON_recall": 0.92, |
|
"eval_QUANTITY_f1": 0.7605633802816901, |
|
"eval_QUANTITY_number": 33, |
|
"eval_QUANTITY_precision": 0.7105263157894737, |
|
"eval_QUANTITY_recall": 0.8181818181818182, |
|
"eval_TIME_f1": 0.9090909090909091, |
|
"eval_TIME_number": 28, |
|
"eval_TIME_precision": 0.9259259259259259, |
|
"eval_TIME_recall": 0.8928571428571429, |
|
"eval_loss": 0.13637924194335938, |
|
"eval_overall_accuracy": 0.9641125121241513, |
|
"eval_overall_f1": 0.8372093023255814, |
|
"eval_overall_precision": 0.796875, |
|
"eval_overall_recall": 0.8818443804034583, |
|
"eval_runtime": 0.406, |
|
"eval_samples_per_second": 460.578, |
|
"eval_steps_per_second": 7.389, |
|
"step": 2968 |
|
}, |
|
{ |
|
"epoch": 29.0, |
|
"grad_norm": 0.46542084217071533, |
|
"learning_rate": 3.55e-05, |
|
"loss": 0.0463, |
|
"step": 3074 |
|
}, |
|
{ |
|
"epoch": 29.0, |
|
"eval_LOCATION_f1": 0.7702702702702703, |
|
"eval_LOCATION_number": 71, |
|
"eval_LOCATION_precision": 0.7402597402597403, |
|
"eval_LOCATION_recall": 0.8028169014084507, |
|
"eval_ORGANIZATION_f1": 0.75, |
|
"eval_ORGANIZATION_number": 65, |
|
"eval_ORGANIZATION_precision": 0.6551724137931034, |
|
"eval_ORGANIZATION_recall": 0.8769230769230769, |
|
"eval_PERSON_f1": 0.9038461538461539, |
|
"eval_PERSON_number": 150, |
|
"eval_PERSON_precision": 0.8703703703703703, |
|
"eval_PERSON_recall": 0.94, |
|
"eval_QUANTITY_f1": 0.8405797101449276, |
|
"eval_QUANTITY_number": 33, |
|
"eval_QUANTITY_precision": 0.8055555555555556, |
|
"eval_QUANTITY_recall": 0.8787878787878788, |
|
"eval_TIME_f1": 0.8571428571428571, |
|
"eval_TIME_number": 28, |
|
"eval_TIME_precision": 0.8571428571428571, |
|
"eval_TIME_recall": 0.8571428571428571, |
|
"eval_loss": 0.13960041105747223, |
|
"eval_overall_accuracy": 0.9624151309408342, |
|
"eval_overall_f1": 0.835820895522388, |
|
"eval_overall_precision": 0.7897435897435897, |
|
"eval_overall_recall": 0.8876080691642652, |
|
"eval_runtime": 0.4068, |
|
"eval_samples_per_second": 459.668, |
|
"eval_steps_per_second": 7.374, |
|
"step": 3074 |
|
}, |
|
{ |
|
"epoch": 30.0, |
|
"grad_norm": 0.8071898818016052, |
|
"learning_rate": 3.5e-05, |
|
"loss": 0.0466, |
|
"step": 3180 |
|
}, |
|
{ |
|
"epoch": 30.0, |
|
"eval_LOCATION_f1": 0.7919463087248323, |
|
"eval_LOCATION_number": 71, |
|
"eval_LOCATION_precision": 0.7564102564102564, |
|
"eval_LOCATION_recall": 0.8309859154929577, |
|
"eval_ORGANIZATION_f1": 0.7261146496815286, |
|
"eval_ORGANIZATION_number": 65, |
|
"eval_ORGANIZATION_precision": 0.6195652173913043, |
|
"eval_ORGANIZATION_recall": 0.8769230769230769, |
|
"eval_PERSON_f1": 0.90032154340836, |
|
"eval_PERSON_number": 150, |
|
"eval_PERSON_precision": 0.8695652173913043, |
|
"eval_PERSON_recall": 0.9333333333333333, |
|
"eval_QUANTITY_f1": 0.7397260273972603, |
|
"eval_QUANTITY_number": 33, |
|
"eval_QUANTITY_precision": 0.675, |
|
"eval_QUANTITY_recall": 0.8181818181818182, |
|
"eval_TIME_f1": 0.8771929824561403, |
|
"eval_TIME_number": 28, |
|
"eval_TIME_precision": 0.8620689655172413, |
|
"eval_TIME_recall": 0.8928571428571429, |
|
"eval_loss": 0.1534765511751175, |
|
"eval_overall_accuracy": 0.9585354025218235, |
|
"eval_overall_f1": 0.824631860776439, |
|
"eval_overall_precision": 0.77, |
|
"eval_overall_recall": 0.8876080691642652, |
|
"eval_runtime": 0.4052, |
|
"eval_samples_per_second": 461.503, |
|
"eval_steps_per_second": 7.404, |
|
"step": 3180 |
|
}, |
|
{ |
|
"epoch": 31.0, |
|
"grad_norm": 0.7920342087745667, |
|
"learning_rate": 3.45e-05, |
|
"loss": 0.0449, |
|
"step": 3286 |
|
}, |
|
{ |
|
"epoch": 31.0, |
|
"eval_LOCATION_f1": 0.7770700636942676, |
|
"eval_LOCATION_number": 71, |
|
"eval_LOCATION_precision": 0.7093023255813954, |
|
"eval_LOCATION_recall": 0.8591549295774648, |
|
"eval_ORGANIZATION_f1": 0.75, |
|
"eval_ORGANIZATION_number": 65, |
|
"eval_ORGANIZATION_precision": 0.6835443037974683, |
|
"eval_ORGANIZATION_recall": 0.8307692307692308, |
|
"eval_PERSON_f1": 0.9102564102564102, |
|
"eval_PERSON_number": 150, |
|
"eval_PERSON_precision": 0.8765432098765432, |
|
"eval_PERSON_recall": 0.9466666666666667, |
|
"eval_QUANTITY_f1": 0.7567567567567567, |
|
"eval_QUANTITY_number": 33, |
|
"eval_QUANTITY_precision": 0.6829268292682927, |
|
"eval_QUANTITY_recall": 0.8484848484848485, |
|
"eval_TIME_f1": 0.8421052631578947, |
|
"eval_TIME_number": 28, |
|
"eval_TIME_precision": 0.8275862068965517, |
|
"eval_TIME_recall": 0.8571428571428571, |
|
"eval_loss": 0.16083230078220367, |
|
"eval_overall_accuracy": 0.9592628516003879, |
|
"eval_overall_f1": 0.8306451612903226, |
|
"eval_overall_precision": 0.7783375314861462, |
|
"eval_overall_recall": 0.8904899135446686, |
|
"eval_runtime": 0.4039, |
|
"eval_samples_per_second": 462.994, |
|
"eval_steps_per_second": 7.428, |
|
"step": 3286 |
|
}, |
|
{ |
|
"epoch": 32.0, |
|
"grad_norm": 0.9836466908454895, |
|
"learning_rate": 3.4000000000000007e-05, |
|
"loss": 0.043, |
|
"step": 3392 |
|
}, |
|
{ |
|
"epoch": 32.0, |
|
"eval_LOCATION_f1": 0.751592356687898, |
|
"eval_LOCATION_number": 71, |
|
"eval_LOCATION_precision": 0.686046511627907, |
|
"eval_LOCATION_recall": 0.8309859154929577, |
|
"eval_ORGANIZATION_f1": 0.7058823529411765, |
|
"eval_ORGANIZATION_number": 65, |
|
"eval_ORGANIZATION_precision": 0.6136363636363636, |
|
"eval_ORGANIZATION_recall": 0.8307692307692308, |
|
"eval_PERSON_f1": 0.9102564102564102, |
|
"eval_PERSON_number": 150, |
|
"eval_PERSON_precision": 0.8765432098765432, |
|
"eval_PERSON_recall": 0.9466666666666667, |
|
"eval_QUANTITY_f1": 0.6933333333333334, |
|
"eval_QUANTITY_number": 33, |
|
"eval_QUANTITY_precision": 0.6190476190476191, |
|
"eval_QUANTITY_recall": 0.7878787878787878, |
|
"eval_TIME_f1": 0.8474576271186439, |
|
"eval_TIME_number": 28, |
|
"eval_TIME_precision": 0.8064516129032258, |
|
"eval_TIME_recall": 0.8928571428571429, |
|
"eval_loss": 0.16350191831588745, |
|
"eval_overall_accuracy": 0.9556256062075654, |
|
"eval_overall_f1": 0.8095238095238096, |
|
"eval_overall_precision": 0.7481662591687042, |
|
"eval_overall_recall": 0.8818443804034583, |
|
"eval_runtime": 0.4041, |
|
"eval_samples_per_second": 462.793, |
|
"eval_steps_per_second": 7.424, |
|
"step": 3392 |
|
}, |
|
{ |
|
"epoch": 33.0, |
|
"grad_norm": 0.8012641668319702, |
|
"learning_rate": 3.35e-05, |
|
"loss": 0.0394, |
|
"step": 3498 |
|
}, |
|
{ |
|
"epoch": 33.0, |
|
"eval_LOCATION_f1": 0.7755102040816326, |
|
"eval_LOCATION_number": 71, |
|
"eval_LOCATION_precision": 0.75, |
|
"eval_LOCATION_recall": 0.8028169014084507, |
|
"eval_ORGANIZATION_f1": 0.726027397260274, |
|
"eval_ORGANIZATION_number": 65, |
|
"eval_ORGANIZATION_precision": 0.654320987654321, |
|
"eval_ORGANIZATION_recall": 0.8153846153846154, |
|
"eval_PERSON_f1": 0.9220779220779222, |
|
"eval_PERSON_number": 150, |
|
"eval_PERSON_precision": 0.8987341772151899, |
|
"eval_PERSON_recall": 0.9466666666666667, |
|
"eval_QUANTITY_f1": 0.8285714285714285, |
|
"eval_QUANTITY_number": 33, |
|
"eval_QUANTITY_precision": 0.7837837837837838, |
|
"eval_QUANTITY_recall": 0.8787878787878788, |
|
"eval_TIME_f1": 0.8727272727272727, |
|
"eval_TIME_number": 28, |
|
"eval_TIME_precision": 0.8888888888888888, |
|
"eval_TIME_recall": 0.8571428571428571, |
|
"eval_loss": 0.15030378103256226, |
|
"eval_overall_accuracy": 0.9641125121241513, |
|
"eval_overall_f1": 0.8402203856749312, |
|
"eval_overall_precision": 0.8047493403693932, |
|
"eval_overall_recall": 0.8789625360230547, |
|
"eval_runtime": 0.4047, |
|
"eval_samples_per_second": 462.071, |
|
"eval_steps_per_second": 7.413, |
|
"step": 3498 |
|
}, |
|
{ |
|
"epoch": 34.0, |
|
"grad_norm": 0.9052590727806091, |
|
"learning_rate": 3.3e-05, |
|
"loss": 0.0412, |
|
"step": 3604 |
|
}, |
|
{ |
|
"epoch": 34.0, |
|
"eval_LOCATION_f1": 0.7972972972972973, |
|
"eval_LOCATION_number": 71, |
|
"eval_LOCATION_precision": 0.7662337662337663, |
|
"eval_LOCATION_recall": 0.8309859154929577, |
|
"eval_ORGANIZATION_f1": 0.7755102040816327, |
|
"eval_ORGANIZATION_number": 65, |
|
"eval_ORGANIZATION_precision": 0.6951219512195121, |
|
"eval_ORGANIZATION_recall": 0.8769230769230769, |
|
"eval_PERSON_f1": 0.9220779220779222, |
|
"eval_PERSON_number": 150, |
|
"eval_PERSON_precision": 0.8987341772151899, |
|
"eval_PERSON_recall": 0.9466666666666667, |
|
"eval_QUANTITY_f1": 0.7671232876712328, |
|
"eval_QUANTITY_number": 33, |
|
"eval_QUANTITY_precision": 0.7, |
|
"eval_QUANTITY_recall": 0.8484848484848485, |
|
"eval_TIME_f1": 0.8727272727272727, |
|
"eval_TIME_number": 28, |
|
"eval_TIME_precision": 0.8888888888888888, |
|
"eval_TIME_recall": 0.8571428571428571, |
|
"eval_loss": 0.1466250866651535, |
|
"eval_overall_accuracy": 0.9645974781765276, |
|
"eval_overall_f1": 0.8481532147742818, |
|
"eval_overall_precision": 0.8072916666666666, |
|
"eval_overall_recall": 0.8933717579250721, |
|
"eval_runtime": 0.4032, |
|
"eval_samples_per_second": 463.733, |
|
"eval_steps_per_second": 7.44, |
|
"step": 3604 |
|
}, |
|
{ |
|
"epoch": 35.0, |
|
"grad_norm": 0.42126646637916565, |
|
"learning_rate": 3.2500000000000004e-05, |
|
"loss": 0.0403, |
|
"step": 3710 |
|
}, |
|
{ |
|
"epoch": 35.0, |
|
"eval_LOCATION_f1": 0.7741935483870968, |
|
"eval_LOCATION_number": 71, |
|
"eval_LOCATION_precision": 0.7142857142857143, |
|
"eval_LOCATION_recall": 0.8450704225352113, |
|
"eval_ORGANIZATION_f1": 0.7448275862068966, |
|
"eval_ORGANIZATION_number": 65, |
|
"eval_ORGANIZATION_precision": 0.675, |
|
"eval_ORGANIZATION_recall": 0.8307692307692308, |
|
"eval_PERSON_f1": 0.9102564102564102, |
|
"eval_PERSON_number": 150, |
|
"eval_PERSON_precision": 0.8765432098765432, |
|
"eval_PERSON_recall": 0.9466666666666667, |
|
"eval_QUANTITY_f1": 0.7297297297297297, |
|
"eval_QUANTITY_number": 33, |
|
"eval_QUANTITY_precision": 0.6585365853658537, |
|
"eval_QUANTITY_recall": 0.8181818181818182, |
|
"eval_TIME_f1": 0.8474576271186439, |
|
"eval_TIME_number": 28, |
|
"eval_TIME_precision": 0.8064516129032258, |
|
"eval_TIME_recall": 0.8928571428571429, |
|
"eval_loss": 0.15250608325004578, |
|
"eval_overall_accuracy": 0.9619301648884578, |
|
"eval_overall_f1": 0.8268456375838926, |
|
"eval_overall_precision": 0.7738693467336684, |
|
"eval_overall_recall": 0.8876080691642652, |
|
"eval_runtime": 0.4038, |
|
"eval_samples_per_second": 463.06, |
|
"eval_steps_per_second": 7.429, |
|
"step": 3710 |
|
}, |
|
{ |
|
"epoch": 36.0, |
|
"grad_norm": 1.7094526290893555, |
|
"learning_rate": 3.2000000000000005e-05, |
|
"loss": 0.0385, |
|
"step": 3816 |
|
}, |
|
{ |
|
"epoch": 36.0, |
|
"eval_LOCATION_f1": 0.7919463087248323, |
|
"eval_LOCATION_number": 71, |
|
"eval_LOCATION_precision": 0.7564102564102564, |
|
"eval_LOCATION_recall": 0.8309859154929577, |
|
"eval_ORGANIZATION_f1": 0.7354838709677419, |
|
"eval_ORGANIZATION_number": 65, |
|
"eval_ORGANIZATION_precision": 0.6333333333333333, |
|
"eval_ORGANIZATION_recall": 0.8769230769230769, |
|
"eval_PERSON_f1": 0.8958990536277603, |
|
"eval_PERSON_number": 150, |
|
"eval_PERSON_precision": 0.8502994011976048, |
|
"eval_PERSON_recall": 0.9466666666666667, |
|
"eval_QUANTITY_f1": 0.7105263157894738, |
|
"eval_QUANTITY_number": 33, |
|
"eval_QUANTITY_precision": 0.627906976744186, |
|
"eval_QUANTITY_recall": 0.8181818181818182, |
|
"eval_TIME_f1": 0.8928571428571429, |
|
"eval_TIME_number": 28, |
|
"eval_TIME_precision": 0.8928571428571429, |
|
"eval_TIME_recall": 0.8928571428571429, |
|
"eval_loss": 0.1817101240158081, |
|
"eval_overall_accuracy": 0.9551406401551892, |
|
"eval_overall_f1": 0.8233731739707836, |
|
"eval_overall_precision": 0.7635467980295566, |
|
"eval_overall_recall": 0.8933717579250721, |
|
"eval_runtime": 0.4033, |
|
"eval_samples_per_second": 463.63, |
|
"eval_steps_per_second": 7.438, |
|
"step": 3816 |
|
}, |
|
{ |
|
"epoch": 37.0, |
|
"grad_norm": 1.976254940032959, |
|
"learning_rate": 3.15e-05, |
|
"loss": 0.037, |
|
"step": 3922 |
|
}, |
|
{ |
|
"epoch": 37.0, |
|
"eval_LOCATION_f1": 0.7435897435897436, |
|
"eval_LOCATION_number": 71, |
|
"eval_LOCATION_precision": 0.6823529411764706, |
|
"eval_LOCATION_recall": 0.8169014084507042, |
|
"eval_ORGANIZATION_f1": 0.7152317880794703, |
|
"eval_ORGANIZATION_number": 65, |
|
"eval_ORGANIZATION_precision": 0.627906976744186, |
|
"eval_ORGANIZATION_recall": 0.8307692307692308, |
|
"eval_PERSON_f1": 0.89937106918239, |
|
"eval_PERSON_number": 150, |
|
"eval_PERSON_precision": 0.8511904761904762, |
|
"eval_PERSON_recall": 0.9533333333333334, |
|
"eval_QUANTITY_f1": 0.6582278481012658, |
|
"eval_QUANTITY_number": 33, |
|
"eval_QUANTITY_precision": 0.5652173913043478, |
|
"eval_QUANTITY_recall": 0.7878787878787878, |
|
"eval_TIME_f1": 0.8135593220338982, |
|
"eval_TIME_number": 28, |
|
"eval_TIME_precision": 0.7741935483870968, |
|
"eval_TIME_recall": 0.8571428571428571, |
|
"eval_loss": 0.2011863738298416, |
|
"eval_overall_accuracy": 0.9517458777885548, |
|
"eval_overall_f1": 0.799475753604194, |
|
"eval_overall_precision": 0.7331730769230769, |
|
"eval_overall_recall": 0.8789625360230547, |
|
"eval_runtime": 0.4048, |
|
"eval_samples_per_second": 461.918, |
|
"eval_steps_per_second": 7.41, |
|
"step": 3922 |
|
}, |
|
{ |
|
"epoch": 38.0, |
|
"grad_norm": 1.1307073831558228, |
|
"learning_rate": 3.1e-05, |
|
"loss": 0.037, |
|
"step": 4028 |
|
}, |
|
{ |
|
"epoch": 38.0, |
|
"eval_LOCATION_f1": 0.7837837837837838, |
|
"eval_LOCATION_number": 71, |
|
"eval_LOCATION_precision": 0.7532467532467533, |
|
"eval_LOCATION_recall": 0.8169014084507042, |
|
"eval_ORGANIZATION_f1": 0.7681159420289856, |
|
"eval_ORGANIZATION_number": 65, |
|
"eval_ORGANIZATION_precision": 0.726027397260274, |
|
"eval_ORGANIZATION_recall": 0.8153846153846154, |
|
"eval_PERSON_f1": 0.896774193548387, |
|
"eval_PERSON_number": 150, |
|
"eval_PERSON_precision": 0.86875, |
|
"eval_PERSON_recall": 0.9266666666666666, |
|
"eval_QUANTITY_f1": 0.7671232876712328, |
|
"eval_QUANTITY_number": 33, |
|
"eval_QUANTITY_precision": 0.7, |
|
"eval_QUANTITY_recall": 0.8484848484848485, |
|
"eval_TIME_f1": 0.9259259259259259, |
|
"eval_TIME_number": 28, |
|
"eval_TIME_precision": 0.9615384615384616, |
|
"eval_TIME_recall": 0.8928571428571429, |
|
"eval_loss": 0.1582067906856537, |
|
"eval_overall_accuracy": 0.960717749757517, |
|
"eval_overall_f1": 0.8381742738589211, |
|
"eval_overall_precision": 0.8058510638297872, |
|
"eval_overall_recall": 0.8731988472622478, |
|
"eval_runtime": 0.4045, |
|
"eval_samples_per_second": 462.274, |
|
"eval_steps_per_second": 7.416, |
|
"step": 4028 |
|
}, |
|
{ |
|
"epoch": 39.0, |
|
"grad_norm": 0.8394156694412231, |
|
"learning_rate": 3.05e-05, |
|
"loss": 0.0332, |
|
"step": 4134 |
|
}, |
|
{ |
|
"epoch": 39.0, |
|
"eval_LOCATION_f1": 0.794701986754967, |
|
"eval_LOCATION_number": 71, |
|
"eval_LOCATION_precision": 0.75, |
|
"eval_LOCATION_recall": 0.8450704225352113, |
|
"eval_ORGANIZATION_f1": 0.76, |
|
"eval_ORGANIZATION_number": 65, |
|
"eval_ORGANIZATION_precision": 0.6705882352941176, |
|
"eval_ORGANIZATION_recall": 0.8769230769230769, |
|
"eval_PERSON_f1": 0.9108280254777071, |
|
"eval_PERSON_number": 150, |
|
"eval_PERSON_precision": 0.8719512195121951, |
|
"eval_PERSON_recall": 0.9533333333333334, |
|
"eval_QUANTITY_f1": 0.7397260273972603, |
|
"eval_QUANTITY_number": 33, |
|
"eval_QUANTITY_precision": 0.675, |
|
"eval_QUANTITY_recall": 0.8181818181818182, |
|
"eval_TIME_f1": 0.8571428571428571, |
|
"eval_TIME_number": 28, |
|
"eval_TIME_precision": 0.8571428571428571, |
|
"eval_TIME_recall": 0.8571428571428571, |
|
"eval_loss": 0.16989700496196747, |
|
"eval_overall_accuracy": 0.9609602327837051, |
|
"eval_overall_f1": 0.8360215053763441, |
|
"eval_overall_precision": 0.783375314861461, |
|
"eval_overall_recall": 0.8962536023054755, |
|
"eval_runtime": 0.4173, |
|
"eval_samples_per_second": 448.072, |
|
"eval_steps_per_second": 7.188, |
|
"step": 4134 |
|
}, |
|
{ |
|
"epoch": 40.0, |
|
"grad_norm": 0.8886793255805969, |
|
"learning_rate": 3e-05, |
|
"loss": 0.0354, |
|
"step": 4240 |
|
}, |
|
{ |
|
"epoch": 40.0, |
|
"eval_LOCATION_f1": 0.794701986754967, |
|
"eval_LOCATION_number": 71, |
|
"eval_LOCATION_precision": 0.75, |
|
"eval_LOCATION_recall": 0.8450704225352113, |
|
"eval_ORGANIZATION_f1": 0.7412587412587412, |
|
"eval_ORGANIZATION_number": 65, |
|
"eval_ORGANIZATION_precision": 0.6794871794871795, |
|
"eval_ORGANIZATION_recall": 0.8153846153846154, |
|
"eval_PERSON_f1": 0.9073482428115016, |
|
"eval_PERSON_number": 150, |
|
"eval_PERSON_precision": 0.8711656441717791, |
|
"eval_PERSON_recall": 0.9466666666666667, |
|
"eval_QUANTITY_f1": 0.7671232876712328, |
|
"eval_QUANTITY_number": 33, |
|
"eval_QUANTITY_precision": 0.7, |
|
"eval_QUANTITY_recall": 0.8484848484848485, |
|
"eval_TIME_f1": 0.7741935483870968, |
|
"eval_TIME_number": 28, |
|
"eval_TIME_precision": 0.7058823529411765, |
|
"eval_TIME_recall": 0.8571428571428571, |
|
"eval_loss": 0.1586233377456665, |
|
"eval_overall_accuracy": 0.9612027158098934, |
|
"eval_overall_f1": 0.8274932614555257, |
|
"eval_overall_precision": 0.7772151898734178, |
|
"eval_overall_recall": 0.8847262247838616, |
|
"eval_runtime": 0.4013, |
|
"eval_samples_per_second": 465.977, |
|
"eval_steps_per_second": 7.476, |
|
"step": 4240 |
|
}, |
|
{ |
|
"epoch": 41.0, |
|
"grad_norm": 0.6773855686187744, |
|
"learning_rate": 2.95e-05, |
|
"loss": 0.0331, |
|
"step": 4346 |
|
}, |
|
{ |
|
"epoch": 41.0, |
|
"eval_LOCATION_f1": 0.7741935483870968, |
|
"eval_LOCATION_number": 71, |
|
"eval_LOCATION_precision": 0.7142857142857143, |
|
"eval_LOCATION_recall": 0.8450704225352113, |
|
"eval_ORGANIZATION_f1": 0.7619047619047619, |
|
"eval_ORGANIZATION_number": 65, |
|
"eval_ORGANIZATION_precision": 0.6829268292682927, |
|
"eval_ORGANIZATION_recall": 0.8615384615384616, |
|
"eval_PERSON_f1": 0.9025974025974027, |
|
"eval_PERSON_number": 150, |
|
"eval_PERSON_precision": 0.879746835443038, |
|
"eval_PERSON_recall": 0.9266666666666666, |
|
"eval_QUANTITY_f1": 0.7671232876712328, |
|
"eval_QUANTITY_number": 33, |
|
"eval_QUANTITY_precision": 0.7, |
|
"eval_QUANTITY_recall": 0.8484848484848485, |
|
"eval_TIME_f1": 0.8275862068965518, |
|
"eval_TIME_number": 28, |
|
"eval_TIME_precision": 0.8, |
|
"eval_TIME_recall": 0.8571428571428571, |
|
"eval_loss": 0.16328278183937073, |
|
"eval_overall_accuracy": 0.960717749757517, |
|
"eval_overall_f1": 0.8286099865047233, |
|
"eval_overall_precision": 0.7791878172588832, |
|
"eval_overall_recall": 0.8847262247838616, |
|
"eval_runtime": 0.4108, |
|
"eval_samples_per_second": 455.24, |
|
"eval_steps_per_second": 7.303, |
|
"step": 4346 |
|
}, |
|
{ |
|
"epoch": 42.0, |
|
"grad_norm": 0.5810602903366089, |
|
"learning_rate": 2.9e-05, |
|
"loss": 0.0312, |
|
"step": 4452 |
|
}, |
|
{ |
|
"epoch": 42.0, |
|
"eval_LOCATION_f1": 0.778523489932886, |
|
"eval_LOCATION_number": 71, |
|
"eval_LOCATION_precision": 0.7435897435897436, |
|
"eval_LOCATION_recall": 0.8169014084507042, |
|
"eval_ORGANIZATION_f1": 0.7448275862068966, |
|
"eval_ORGANIZATION_number": 65, |
|
"eval_ORGANIZATION_precision": 0.675, |
|
"eval_ORGANIZATION_recall": 0.8307692307692308, |
|
"eval_PERSON_f1": 0.9009584664536742, |
|
"eval_PERSON_number": 150, |
|
"eval_PERSON_precision": 0.8650306748466258, |
|
"eval_PERSON_recall": 0.94, |
|
"eval_QUANTITY_f1": 0.7123287671232875, |
|
"eval_QUANTITY_number": 33, |
|
"eval_QUANTITY_precision": 0.65, |
|
"eval_QUANTITY_recall": 0.7878787878787878, |
|
"eval_TIME_f1": 0.8771929824561403, |
|
"eval_TIME_number": 28, |
|
"eval_TIME_precision": 0.8620689655172413, |
|
"eval_TIME_recall": 0.8928571428571429, |
|
"eval_loss": 0.1705748438835144, |
|
"eval_overall_accuracy": 0.9595053346265762, |
|
"eval_overall_f1": 0.824966078697422, |
|
"eval_overall_precision": 0.7794871794871795, |
|
"eval_overall_recall": 0.8760806916426513, |
|
"eval_runtime": 0.4042, |
|
"eval_samples_per_second": 462.62, |
|
"eval_steps_per_second": 7.422, |
|
"step": 4452 |
|
}, |
|
{ |
|
"epoch": 43.0, |
|
"grad_norm": 1.03245210647583, |
|
"learning_rate": 2.8499999999999998e-05, |
|
"loss": 0.031, |
|
"step": 4558 |
|
}, |
|
{ |
|
"epoch": 43.0, |
|
"eval_LOCATION_f1": 0.782051282051282, |
|
"eval_LOCATION_number": 71, |
|
"eval_LOCATION_precision": 0.7176470588235294, |
|
"eval_LOCATION_recall": 0.8591549295774648, |
|
"eval_ORGANIZATION_f1": 0.7482014388489208, |
|
"eval_ORGANIZATION_number": 65, |
|
"eval_ORGANIZATION_precision": 0.7027027027027027, |
|
"eval_ORGANIZATION_recall": 0.8, |
|
"eval_PERSON_f1": 0.9073482428115016, |
|
"eval_PERSON_number": 150, |
|
"eval_PERSON_precision": 0.8711656441717791, |
|
"eval_PERSON_recall": 0.9466666666666667, |
|
"eval_QUANTITY_f1": 0.821917808219178, |
|
"eval_QUANTITY_number": 33, |
|
"eval_QUANTITY_precision": 0.75, |
|
"eval_QUANTITY_recall": 0.9090909090909091, |
|
"eval_TIME_f1": 0.8275862068965518, |
|
"eval_TIME_number": 28, |
|
"eval_TIME_precision": 0.8, |
|
"eval_TIME_recall": 0.8571428571428571, |
|
"eval_loss": 0.16453760862350464, |
|
"eval_overall_accuracy": 0.9619301648884578, |
|
"eval_overall_f1": 0.8362652232746954, |
|
"eval_overall_precision": 0.7882653061224489, |
|
"eval_overall_recall": 0.8904899135446686, |
|
"eval_runtime": 0.4028, |
|
"eval_samples_per_second": 464.207, |
|
"eval_steps_per_second": 7.447, |
|
"step": 4558 |
|
}, |
|
{ |
|
"epoch": 44.0, |
|
"grad_norm": 1.3175857067108154, |
|
"learning_rate": 2.8000000000000003e-05, |
|
"loss": 0.0305, |
|
"step": 4664 |
|
}, |
|
{ |
|
"epoch": 44.0, |
|
"eval_LOCATION_f1": 0.7843137254901961, |
|
"eval_LOCATION_number": 71, |
|
"eval_LOCATION_precision": 0.7317073170731707, |
|
"eval_LOCATION_recall": 0.8450704225352113, |
|
"eval_ORGANIZATION_f1": 0.7549668874172185, |
|
"eval_ORGANIZATION_number": 65, |
|
"eval_ORGANIZATION_precision": 0.6627906976744186, |
|
"eval_ORGANIZATION_recall": 0.8769230769230769, |
|
"eval_PERSON_f1": 0.9044585987261147, |
|
"eval_PERSON_number": 150, |
|
"eval_PERSON_precision": 0.8658536585365854, |
|
"eval_PERSON_recall": 0.9466666666666667, |
|
"eval_QUANTITY_f1": 0.7397260273972603, |
|
"eval_QUANTITY_number": 33, |
|
"eval_QUANTITY_precision": 0.675, |
|
"eval_QUANTITY_recall": 0.8181818181818182, |
|
"eval_TIME_f1": 0.8928571428571429, |
|
"eval_TIME_number": 28, |
|
"eval_TIME_precision": 0.8928571428571429, |
|
"eval_TIME_recall": 0.8928571428571429, |
|
"eval_loss": 0.1853325217962265, |
|
"eval_overall_accuracy": 0.9609602327837051, |
|
"eval_overall_f1": 0.8326639892904953, |
|
"eval_overall_precision": 0.7775, |
|
"eval_overall_recall": 0.8962536023054755, |
|
"eval_runtime": 0.4048, |
|
"eval_samples_per_second": 462.013, |
|
"eval_steps_per_second": 7.412, |
|
"step": 4664 |
|
}, |
|
{ |
|
"epoch": 45.0, |
|
"grad_norm": 2.4794533252716064, |
|
"learning_rate": 2.7500000000000004e-05, |
|
"loss": 0.0284, |
|
"step": 4770 |
|
}, |
|
{ |
|
"epoch": 45.0, |
|
"eval_LOCATION_f1": 0.7866666666666666, |
|
"eval_LOCATION_number": 71, |
|
"eval_LOCATION_precision": 0.7468354430379747, |
|
"eval_LOCATION_recall": 0.8309859154929577, |
|
"eval_ORGANIZATION_f1": 0.757142857142857, |
|
"eval_ORGANIZATION_number": 65, |
|
"eval_ORGANIZATION_precision": 0.7066666666666667, |
|
"eval_ORGANIZATION_recall": 0.8153846153846154, |
|
"eval_PERSON_f1": 0.9025974025974027, |
|
"eval_PERSON_number": 150, |
|
"eval_PERSON_precision": 0.879746835443038, |
|
"eval_PERSON_recall": 0.9266666666666666, |
|
"eval_QUANTITY_f1": 0.7397260273972603, |
|
"eval_QUANTITY_number": 33, |
|
"eval_QUANTITY_precision": 0.675, |
|
"eval_QUANTITY_recall": 0.8181818181818182, |
|
"eval_TIME_f1": 0.8571428571428571, |
|
"eval_TIME_number": 28, |
|
"eval_TIME_precision": 0.8571428571428571, |
|
"eval_TIME_recall": 0.8571428571428571, |
|
"eval_loss": 0.16584299504756927, |
|
"eval_overall_accuracy": 0.9633850630455868, |
|
"eval_overall_f1": 0.8308115543328748, |
|
"eval_overall_precision": 0.7947368421052632, |
|
"eval_overall_recall": 0.8703170028818443, |
|
"eval_runtime": 0.4049, |
|
"eval_samples_per_second": 461.854, |
|
"eval_steps_per_second": 7.409, |
|
"step": 4770 |
|
}, |
|
{ |
|
"epoch": 46.0, |
|
"grad_norm": 1.2760629653930664, |
|
"learning_rate": 2.7000000000000002e-05, |
|
"loss": 0.028, |
|
"step": 4876 |
|
}, |
|
{ |
|
"epoch": 46.0, |
|
"eval_LOCATION_f1": 0.7581699346405228, |
|
"eval_LOCATION_number": 71, |
|
"eval_LOCATION_precision": 0.7073170731707317, |
|
"eval_LOCATION_recall": 0.8169014084507042, |
|
"eval_ORGANIZATION_f1": 0.7210884353741497, |
|
"eval_ORGANIZATION_number": 65, |
|
"eval_ORGANIZATION_precision": 0.6463414634146342, |
|
"eval_ORGANIZATION_recall": 0.8153846153846154, |
|
"eval_PERSON_f1": 0.912621359223301, |
|
"eval_PERSON_number": 150, |
|
"eval_PERSON_precision": 0.8867924528301887, |
|
"eval_PERSON_recall": 0.94, |
|
"eval_QUANTITY_f1": 0.7397260273972603, |
|
"eval_QUANTITY_number": 33, |
|
"eval_QUANTITY_precision": 0.675, |
|
"eval_QUANTITY_recall": 0.8181818181818182, |
|
"eval_TIME_f1": 0.8928571428571429, |
|
"eval_TIME_number": 28, |
|
"eval_TIME_precision": 0.8928571428571429, |
|
"eval_TIME_recall": 0.8928571428571429, |
|
"eval_loss": 0.17332231998443604, |
|
"eval_overall_accuracy": 0.9599903006789525, |
|
"eval_overall_f1": 0.8238482384823849, |
|
"eval_overall_precision": 0.7774936061381074, |
|
"eval_overall_recall": 0.8760806916426513, |
|
"eval_runtime": 0.4033, |
|
"eval_samples_per_second": 463.665, |
|
"eval_steps_per_second": 7.438, |
|
"step": 4876 |
|
}, |
|
{ |
|
"epoch": 47.0, |
|
"grad_norm": 0.9426093101501465, |
|
"learning_rate": 2.6500000000000004e-05, |
|
"loss": 0.0257, |
|
"step": 4982 |
|
}, |
|
{ |
|
"epoch": 47.0, |
|
"eval_LOCATION_f1": 0.802721088435374, |
|
"eval_LOCATION_number": 71, |
|
"eval_LOCATION_precision": 0.7763157894736842, |
|
"eval_LOCATION_recall": 0.8309859154929577, |
|
"eval_ORGANIZATION_f1": 0.7368421052631579, |
|
"eval_ORGANIZATION_number": 65, |
|
"eval_ORGANIZATION_precision": 0.6436781609195402, |
|
"eval_ORGANIZATION_recall": 0.8615384615384616, |
|
"eval_PERSON_f1": 0.9073482428115016, |
|
"eval_PERSON_number": 150, |
|
"eval_PERSON_precision": 0.8711656441717791, |
|
"eval_PERSON_recall": 0.9466666666666667, |
|
"eval_QUANTITY_f1": 0.7500000000000001, |
|
"eval_QUANTITY_number": 33, |
|
"eval_QUANTITY_precision": 0.6923076923076923, |
|
"eval_QUANTITY_recall": 0.8181818181818182, |
|
"eval_TIME_f1": 0.8771929824561403, |
|
"eval_TIME_number": 28, |
|
"eval_TIME_precision": 0.8620689655172413, |
|
"eval_TIME_recall": 0.8928571428571429, |
|
"eval_loss": 0.18327540159225464, |
|
"eval_overall_accuracy": 0.9590203685741998, |
|
"eval_overall_f1": 0.834008097165992, |
|
"eval_overall_precision": 0.7842639593908629, |
|
"eval_overall_recall": 0.8904899135446686, |
|
"eval_runtime": 0.4078, |
|
"eval_samples_per_second": 458.511, |
|
"eval_steps_per_second": 7.356, |
|
"step": 4982 |
|
}, |
|
{ |
|
"epoch": 48.0, |
|
"grad_norm": 0.6249455213546753, |
|
"learning_rate": 2.6000000000000002e-05, |
|
"loss": 0.0281, |
|
"step": 5088 |
|
}, |
|
{ |
|
"epoch": 48.0, |
|
"eval_LOCATION_f1": 0.7837837837837838, |
|
"eval_LOCATION_number": 71, |
|
"eval_LOCATION_precision": 0.7532467532467533, |
|
"eval_LOCATION_recall": 0.8169014084507042, |
|
"eval_ORGANIZATION_f1": 0.7310344827586207, |
|
"eval_ORGANIZATION_number": 65, |
|
"eval_ORGANIZATION_precision": 0.6625, |
|
"eval_ORGANIZATION_recall": 0.8153846153846154, |
|
"eval_PERSON_f1": 0.8910256410256411, |
|
"eval_PERSON_number": 150, |
|
"eval_PERSON_precision": 0.8580246913580247, |
|
"eval_PERSON_recall": 0.9266666666666666, |
|
"eval_QUANTITY_f1": 0.7777777777777778, |
|
"eval_QUANTITY_number": 33, |
|
"eval_QUANTITY_precision": 0.717948717948718, |
|
"eval_QUANTITY_recall": 0.8484848484848485, |
|
"eval_TIME_f1": 0.8518518518518519, |
|
"eval_TIME_number": 28, |
|
"eval_TIME_precision": 0.8846153846153846, |
|
"eval_TIME_recall": 0.8214285714285714, |
|
"eval_loss": 0.17024332284927368, |
|
"eval_overall_accuracy": 0.960717749757517, |
|
"eval_overall_f1": 0.823529411764706, |
|
"eval_overall_precision": 0.7838541666666666, |
|
"eval_overall_recall": 0.8674351585014409, |
|
"eval_runtime": 0.4064, |
|
"eval_samples_per_second": 460.192, |
|
"eval_steps_per_second": 7.383, |
|
"step": 5088 |
|
}, |
|
{ |
|
"epoch": 49.0, |
|
"grad_norm": 0.06978233903646469, |
|
"learning_rate": 2.5500000000000003e-05, |
|
"loss": 0.0245, |
|
"step": 5194 |
|
}, |
|
{ |
|
"epoch": 49.0, |
|
"eval_LOCATION_f1": 0.7741935483870968, |
|
"eval_LOCATION_number": 71, |
|
"eval_LOCATION_precision": 0.7142857142857143, |
|
"eval_LOCATION_recall": 0.8450704225352113, |
|
"eval_ORGANIZATION_f1": 0.7346938775510204, |
|
"eval_ORGANIZATION_number": 65, |
|
"eval_ORGANIZATION_precision": 0.6585365853658537, |
|
"eval_ORGANIZATION_recall": 0.8307692307692308, |
|
"eval_PERSON_f1": 0.9131832797427653, |
|
"eval_PERSON_number": 150, |
|
"eval_PERSON_precision": 0.8819875776397516, |
|
"eval_PERSON_recall": 0.9466666666666667, |
|
"eval_QUANTITY_f1": 0.7397260273972603, |
|
"eval_QUANTITY_number": 33, |
|
"eval_QUANTITY_precision": 0.675, |
|
"eval_QUANTITY_recall": 0.8181818181818182, |
|
"eval_TIME_f1": 0.8620689655172413, |
|
"eval_TIME_number": 28, |
|
"eval_TIME_precision": 0.8333333333333334, |
|
"eval_TIME_recall": 0.8928571428571429, |
|
"eval_loss": 0.18626831471920013, |
|
"eval_overall_accuracy": 0.9614451988360815, |
|
"eval_overall_f1": 0.8279569892473119, |
|
"eval_overall_precision": 0.7758186397984886, |
|
"eval_overall_recall": 0.8876080691642652, |
|
"eval_runtime": 0.4028, |
|
"eval_samples_per_second": 464.25, |
|
"eval_steps_per_second": 7.448, |
|
"step": 5194 |
|
}, |
|
{ |
|
"epoch": 50.0, |
|
"grad_norm": 2.4998741149902344, |
|
"learning_rate": 2.5e-05, |
|
"loss": 0.0251, |
|
"step": 5300 |
|
}, |
|
{ |
|
"epoch": 50.0, |
|
"eval_LOCATION_f1": 0.7866666666666666, |
|
"eval_LOCATION_number": 71, |
|
"eval_LOCATION_precision": 0.7468354430379747, |
|
"eval_LOCATION_recall": 0.8309859154929577, |
|
"eval_ORGANIZATION_f1": 0.7536231884057971, |
|
"eval_ORGANIZATION_number": 65, |
|
"eval_ORGANIZATION_precision": 0.7123287671232876, |
|
"eval_ORGANIZATION_recall": 0.8, |
|
"eval_PERSON_f1": 0.9084967320261438, |
|
"eval_PERSON_number": 150, |
|
"eval_PERSON_precision": 0.8910256410256411, |
|
"eval_PERSON_recall": 0.9266666666666666, |
|
"eval_QUANTITY_f1": 0.7777777777777778, |
|
"eval_QUANTITY_number": 33, |
|
"eval_QUANTITY_precision": 0.717948717948718, |
|
"eval_QUANTITY_recall": 0.8484848484848485, |
|
"eval_TIME_f1": 0.8928571428571429, |
|
"eval_TIME_number": 28, |
|
"eval_TIME_precision": 0.8928571428571429, |
|
"eval_TIME_recall": 0.8928571428571429, |
|
"eval_loss": 0.16275979578495026, |
|
"eval_overall_accuracy": 0.9638700290979632, |
|
"eval_overall_f1": 0.8393351800554018, |
|
"eval_overall_precision": 0.808, |
|
"eval_overall_recall": 0.8731988472622478, |
|
"eval_runtime": 0.4053, |
|
"eval_samples_per_second": 461.392, |
|
"eval_steps_per_second": 7.402, |
|
"step": 5300 |
|
}, |
|
{ |
|
"epoch": 51.0, |
|
"grad_norm": 1.0746209621429443, |
|
"learning_rate": 2.45e-05, |
|
"loss": 0.0251, |
|
"step": 5406 |
|
}, |
|
{ |
|
"epoch": 51.0, |
|
"eval_LOCATION_f1": 0.7763157894736843, |
|
"eval_LOCATION_number": 71, |
|
"eval_LOCATION_precision": 0.7283950617283951, |
|
"eval_LOCATION_recall": 0.8309859154929577, |
|
"eval_ORGANIZATION_f1": 0.7819548872180452, |
|
"eval_ORGANIZATION_number": 65, |
|
"eval_ORGANIZATION_precision": 0.7647058823529411, |
|
"eval_ORGANIZATION_recall": 0.8, |
|
"eval_PERSON_f1": 0.9155844155844156, |
|
"eval_PERSON_number": 150, |
|
"eval_PERSON_precision": 0.8924050632911392, |
|
"eval_PERSON_recall": 0.94, |
|
"eval_QUANTITY_f1": 0.7777777777777778, |
|
"eval_QUANTITY_number": 33, |
|
"eval_QUANTITY_precision": 0.717948717948718, |
|
"eval_QUANTITY_recall": 0.8484848484848485, |
|
"eval_TIME_f1": 0.8727272727272727, |
|
"eval_TIME_number": 28, |
|
"eval_TIME_precision": 0.8888888888888888, |
|
"eval_TIME_recall": 0.8571428571428571, |
|
"eval_loss": 0.16527943313121796, |
|
"eval_overall_accuracy": 0.9662948593598448, |
|
"eval_overall_f1": 0.8444444444444444, |
|
"eval_overall_precision": 0.8150134048257373, |
|
"eval_overall_recall": 0.8760806916426513, |
|
"eval_runtime": 0.4037, |
|
"eval_samples_per_second": 463.197, |
|
"eval_steps_per_second": 7.431, |
|
"step": 5406 |
|
}, |
|
{ |
|
"epoch": 52.0, |
|
"grad_norm": 1.7756356000900269, |
|
"learning_rate": 2.4e-05, |
|
"loss": 0.0245, |
|
"step": 5512 |
|
}, |
|
{ |
|
"epoch": 52.0, |
|
"eval_LOCATION_f1": 0.7866666666666666, |
|
"eval_LOCATION_number": 71, |
|
"eval_LOCATION_precision": 0.7468354430379747, |
|
"eval_LOCATION_recall": 0.8309859154929577, |
|
"eval_ORGANIZATION_f1": 0.76, |
|
"eval_ORGANIZATION_number": 65, |
|
"eval_ORGANIZATION_precision": 0.6705882352941176, |
|
"eval_ORGANIZATION_recall": 0.8769230769230769, |
|
"eval_PERSON_f1": 0.9044585987261147, |
|
"eval_PERSON_number": 150, |
|
"eval_PERSON_precision": 0.8658536585365854, |
|
"eval_PERSON_recall": 0.9466666666666667, |
|
"eval_QUANTITY_f1": 0.7397260273972603, |
|
"eval_QUANTITY_number": 33, |
|
"eval_QUANTITY_precision": 0.675, |
|
"eval_QUANTITY_recall": 0.8181818181818182, |
|
"eval_TIME_f1": 0.8421052631578947, |
|
"eval_TIME_number": 28, |
|
"eval_TIME_precision": 0.8275862068965517, |
|
"eval_TIME_recall": 0.8571428571428571, |
|
"eval_loss": 0.18333446979522705, |
|
"eval_overall_accuracy": 0.9602327837051406, |
|
"eval_overall_f1": 0.8306451612903226, |
|
"eval_overall_precision": 0.7783375314861462, |
|
"eval_overall_recall": 0.8904899135446686, |
|
"eval_runtime": 0.4031, |
|
"eval_samples_per_second": 463.928, |
|
"eval_steps_per_second": 7.443, |
|
"step": 5512 |
|
}, |
|
{ |
|
"epoch": 53.0, |
|
"grad_norm": 0.80136638879776, |
|
"learning_rate": 2.35e-05, |
|
"loss": 0.0222, |
|
"step": 5618 |
|
}, |
|
{ |
|
"epoch": 53.0, |
|
"eval_LOCATION_f1": 0.759493670886076, |
|
"eval_LOCATION_number": 71, |
|
"eval_LOCATION_precision": 0.6896551724137931, |
|
"eval_LOCATION_recall": 0.8450704225352113, |
|
"eval_ORGANIZATION_f1": 0.7346938775510204, |
|
"eval_ORGANIZATION_number": 65, |
|
"eval_ORGANIZATION_precision": 0.6585365853658537, |
|
"eval_ORGANIZATION_recall": 0.8307692307692308, |
|
"eval_PERSON_f1": 0.9102564102564102, |
|
"eval_PERSON_number": 150, |
|
"eval_PERSON_precision": 0.8765432098765432, |
|
"eval_PERSON_recall": 0.9466666666666667, |
|
"eval_QUANTITY_f1": 0.7397260273972603, |
|
"eval_QUANTITY_number": 33, |
|
"eval_QUANTITY_precision": 0.675, |
|
"eval_QUANTITY_recall": 0.8181818181818182, |
|
"eval_TIME_f1": 0.8771929824561403, |
|
"eval_TIME_number": 28, |
|
"eval_TIME_precision": 0.8620689655172413, |
|
"eval_TIME_recall": 0.8928571428571429, |
|
"eval_loss": 0.1887245774269104, |
|
"eval_overall_accuracy": 0.9595053346265762, |
|
"eval_overall_f1": 0.824631860776439, |
|
"eval_overall_precision": 0.77, |
|
"eval_overall_recall": 0.8876080691642652, |
|
"eval_runtime": 0.4031, |
|
"eval_samples_per_second": 463.882, |
|
"eval_steps_per_second": 7.442, |
|
"step": 5618 |
|
}, |
|
{ |
|
"epoch": 54.0, |
|
"grad_norm": 1.39556086063385, |
|
"learning_rate": 2.3000000000000003e-05, |
|
"loss": 0.024, |
|
"step": 5724 |
|
}, |
|
{ |
|
"epoch": 54.0, |
|
"eval_LOCATION_f1": 0.7919463087248323, |
|
"eval_LOCATION_number": 71, |
|
"eval_LOCATION_precision": 0.7564102564102564, |
|
"eval_LOCATION_recall": 0.8309859154929577, |
|
"eval_ORGANIZATION_f1": 0.7682119205298013, |
|
"eval_ORGANIZATION_number": 65, |
|
"eval_ORGANIZATION_precision": 0.6744186046511628, |
|
"eval_ORGANIZATION_recall": 0.8923076923076924, |
|
"eval_PERSON_f1": 0.9131832797427653, |
|
"eval_PERSON_number": 150, |
|
"eval_PERSON_precision": 0.8819875776397516, |
|
"eval_PERSON_recall": 0.9466666666666667, |
|
"eval_QUANTITY_f1": 0.8055555555555556, |
|
"eval_QUANTITY_number": 33, |
|
"eval_QUANTITY_precision": 0.7435897435897436, |
|
"eval_QUANTITY_recall": 0.8787878787878788, |
|
"eval_TIME_f1": 0.8771929824561403, |
|
"eval_TIME_number": 28, |
|
"eval_TIME_precision": 0.8620689655172413, |
|
"eval_TIME_recall": 0.8928571428571429, |
|
"eval_loss": 0.17654088139533997, |
|
"eval_overall_accuracy": 0.9633850630455868, |
|
"eval_overall_f1": 0.8459459459459459, |
|
"eval_overall_precision": 0.7964376590330788, |
|
"eval_overall_recall": 0.9020172910662824, |
|
"eval_runtime": 0.4024, |
|
"eval_samples_per_second": 464.697, |
|
"eval_steps_per_second": 7.455, |
|
"step": 5724 |
|
}, |
|
{ |
|
"epoch": 55.0, |
|
"grad_norm": 1.3348910808563232, |
|
"learning_rate": 2.25e-05, |
|
"loss": 0.0238, |
|
"step": 5830 |
|
}, |
|
{ |
|
"epoch": 55.0, |
|
"eval_LOCATION_f1": 0.7866666666666666, |
|
"eval_LOCATION_number": 71, |
|
"eval_LOCATION_precision": 0.7468354430379747, |
|
"eval_LOCATION_recall": 0.8309859154929577, |
|
"eval_ORGANIZATION_f1": 0.7755102040816327, |
|
"eval_ORGANIZATION_number": 65, |
|
"eval_ORGANIZATION_precision": 0.6951219512195121, |
|
"eval_ORGANIZATION_recall": 0.8769230769230769, |
|
"eval_PERSON_f1": 0.9190938511326862, |
|
"eval_PERSON_number": 150, |
|
"eval_PERSON_precision": 0.8930817610062893, |
|
"eval_PERSON_recall": 0.9466666666666667, |
|
"eval_QUANTITY_f1": 0.7671232876712328, |
|
"eval_QUANTITY_number": 33, |
|
"eval_QUANTITY_precision": 0.7, |
|
"eval_QUANTITY_recall": 0.8484848484848485, |
|
"eval_TIME_f1": 0.9259259259259259, |
|
"eval_TIME_number": 28, |
|
"eval_TIME_precision": 0.9615384615384616, |
|
"eval_TIME_recall": 0.8928571428571429, |
|
"eval_loss": 0.1749105155467987, |
|
"eval_overall_accuracy": 0.9645974781765276, |
|
"eval_overall_f1": 0.8485675306957708, |
|
"eval_overall_precision": 0.805699481865285, |
|
"eval_overall_recall": 0.8962536023054755, |
|
"eval_runtime": 0.4051, |
|
"eval_samples_per_second": 461.622, |
|
"eval_steps_per_second": 7.406, |
|
"step": 5830 |
|
}, |
|
{ |
|
"epoch": 56.0, |
|
"grad_norm": 0.7062710523605347, |
|
"learning_rate": 2.2000000000000003e-05, |
|
"loss": 0.021, |
|
"step": 5936 |
|
}, |
|
{ |
|
"epoch": 56.0, |
|
"eval_LOCATION_f1": 0.7483870967741935, |
|
"eval_LOCATION_number": 71, |
|
"eval_LOCATION_precision": 0.6904761904761905, |
|
"eval_LOCATION_recall": 0.8169014084507042, |
|
"eval_ORGANIZATION_f1": 0.7397260273972603, |
|
"eval_ORGANIZATION_number": 65, |
|
"eval_ORGANIZATION_precision": 0.6666666666666666, |
|
"eval_ORGANIZATION_recall": 0.8307692307692308, |
|
"eval_PERSON_f1": 0.9096774193548387, |
|
"eval_PERSON_number": 150, |
|
"eval_PERSON_precision": 0.88125, |
|
"eval_PERSON_recall": 0.94, |
|
"eval_QUANTITY_f1": 0.7777777777777778, |
|
"eval_QUANTITY_number": 33, |
|
"eval_QUANTITY_precision": 0.717948717948718, |
|
"eval_QUANTITY_recall": 0.8484848484848485, |
|
"eval_TIME_f1": 0.8620689655172413, |
|
"eval_TIME_number": 28, |
|
"eval_TIME_precision": 0.8333333333333334, |
|
"eval_TIME_recall": 0.8928571428571429, |
|
"eval_loss": 0.17994269728660583, |
|
"eval_overall_accuracy": 0.9602327837051406, |
|
"eval_overall_f1": 0.8259109311740891, |
|
"eval_overall_precision": 0.7766497461928934, |
|
"eval_overall_recall": 0.8818443804034583, |
|
"eval_runtime": 0.4031, |
|
"eval_samples_per_second": 463.918, |
|
"eval_steps_per_second": 7.443, |
|
"step": 5936 |
|
}, |
|
{ |
|
"epoch": 57.0, |
|
"grad_norm": 0.6525917053222656, |
|
"learning_rate": 2.15e-05, |
|
"loss": 0.0199, |
|
"step": 6042 |
|
}, |
|
{ |
|
"epoch": 57.0, |
|
"eval_LOCATION_f1": 0.7763157894736843, |
|
"eval_LOCATION_number": 71, |
|
"eval_LOCATION_precision": 0.7283950617283951, |
|
"eval_LOCATION_recall": 0.8309859154929577, |
|
"eval_ORGANIZATION_f1": 0.7536231884057971, |
|
"eval_ORGANIZATION_number": 65, |
|
"eval_ORGANIZATION_precision": 0.7123287671232876, |
|
"eval_ORGANIZATION_recall": 0.8, |
|
"eval_PERSON_f1": 0.9102564102564102, |
|
"eval_PERSON_number": 150, |
|
"eval_PERSON_precision": 0.8765432098765432, |
|
"eval_PERSON_recall": 0.9466666666666667, |
|
"eval_QUANTITY_f1": 0.8055555555555556, |
|
"eval_QUANTITY_number": 33, |
|
"eval_QUANTITY_precision": 0.7435897435897436, |
|
"eval_QUANTITY_recall": 0.8787878787878788, |
|
"eval_TIME_f1": 0.9090909090909091, |
|
"eval_TIME_number": 28, |
|
"eval_TIME_precision": 0.9259259259259259, |
|
"eval_TIME_recall": 0.8928571428571429, |
|
"eval_loss": 0.19421829283237457, |
|
"eval_overall_accuracy": 0.9619301648884578, |
|
"eval_overall_f1": 0.8422496570644719, |
|
"eval_overall_precision": 0.8036649214659686, |
|
"eval_overall_recall": 0.8847262247838616, |
|
"eval_runtime": 0.4031, |
|
"eval_samples_per_second": 463.878, |
|
"eval_steps_per_second": 7.442, |
|
"step": 6042 |
|
}, |
|
{ |
|
"epoch": 58.0, |
|
"grad_norm": 1.2534284591674805, |
|
"learning_rate": 2.1e-05, |
|
"loss": 0.0187, |
|
"step": 6148 |
|
}, |
|
{ |
|
"epoch": 58.0, |
|
"eval_LOCATION_f1": 0.75, |
|
"eval_LOCATION_number": 71, |
|
"eval_LOCATION_precision": 0.7037037037037037, |
|
"eval_LOCATION_recall": 0.8028169014084507, |
|
"eval_ORGANIZATION_f1": 0.7536231884057971, |
|
"eval_ORGANIZATION_number": 65, |
|
"eval_ORGANIZATION_precision": 0.7123287671232876, |
|
"eval_ORGANIZATION_recall": 0.8, |
|
"eval_PERSON_f1": 0.9055374592833875, |
|
"eval_PERSON_number": 150, |
|
"eval_PERSON_precision": 0.8853503184713376, |
|
"eval_PERSON_recall": 0.9266666666666666, |
|
"eval_QUANTITY_f1": 0.7500000000000001, |
|
"eval_QUANTITY_number": 33, |
|
"eval_QUANTITY_precision": 0.6923076923076923, |
|
"eval_QUANTITY_recall": 0.8181818181818182, |
|
"eval_TIME_f1": 0.8771929824561403, |
|
"eval_TIME_number": 28, |
|
"eval_TIME_precision": 0.8620689655172413, |
|
"eval_TIME_recall": 0.8928571428571429, |
|
"eval_loss": 0.19052091240882874, |
|
"eval_overall_accuracy": 0.9609602327837051, |
|
"eval_overall_f1": 0.8264462809917356, |
|
"eval_overall_precision": 0.7915567282321899, |
|
"eval_overall_recall": 0.8645533141210374, |
|
"eval_runtime": 0.4084, |
|
"eval_samples_per_second": 457.931, |
|
"eval_steps_per_second": 7.346, |
|
"step": 6148 |
|
}, |
|
{ |
|
"epoch": 59.0, |
|
"grad_norm": 0.5067676305770874, |
|
"learning_rate": 2.05e-05, |
|
"loss": 0.0199, |
|
"step": 6254 |
|
}, |
|
{ |
|
"epoch": 59.0, |
|
"eval_LOCATION_f1": 0.7581699346405228, |
|
"eval_LOCATION_number": 71, |
|
"eval_LOCATION_precision": 0.7073170731707317, |
|
"eval_LOCATION_recall": 0.8169014084507042, |
|
"eval_ORGANIZATION_f1": 0.7464788732394366, |
|
"eval_ORGANIZATION_number": 65, |
|
"eval_ORGANIZATION_precision": 0.6883116883116883, |
|
"eval_ORGANIZATION_recall": 0.8153846153846154, |
|
"eval_PERSON_f1": 0.9019607843137256, |
|
"eval_PERSON_number": 150, |
|
"eval_PERSON_precision": 0.8846153846153846, |
|
"eval_PERSON_recall": 0.92, |
|
"eval_QUANTITY_f1": 0.8055555555555556, |
|
"eval_QUANTITY_number": 33, |
|
"eval_QUANTITY_precision": 0.7435897435897436, |
|
"eval_QUANTITY_recall": 0.8787878787878788, |
|
"eval_TIME_f1": 0.8070175438596492, |
|
"eval_TIME_number": 28, |
|
"eval_TIME_precision": 0.7931034482758621, |
|
"eval_TIME_recall": 0.8214285714285714, |
|
"eval_loss": 0.19398272037506104, |
|
"eval_overall_accuracy": 0.9592628516003879, |
|
"eval_overall_f1": 0.8246575342465754, |
|
"eval_overall_precision": 0.7859007832898173, |
|
"eval_overall_recall": 0.8674351585014409, |
|
"eval_runtime": 0.404, |
|
"eval_samples_per_second": 462.903, |
|
"eval_steps_per_second": 7.426, |
|
"step": 6254 |
|
}, |
|
{ |
|
"epoch": 60.0, |
|
"grad_norm": 0.6053163409233093, |
|
"learning_rate": 2e-05, |
|
"loss": 0.0183, |
|
"step": 6360 |
|
}, |
|
{ |
|
"epoch": 60.0, |
|
"eval_LOCATION_f1": 0.778523489932886, |
|
"eval_LOCATION_number": 71, |
|
"eval_LOCATION_precision": 0.7435897435897436, |
|
"eval_LOCATION_recall": 0.8169014084507042, |
|
"eval_ORGANIZATION_f1": 0.7417218543046358, |
|
"eval_ORGANIZATION_number": 65, |
|
"eval_ORGANIZATION_precision": 0.6511627906976745, |
|
"eval_ORGANIZATION_recall": 0.8615384615384616, |
|
"eval_PERSON_f1": 0.9061488673139159, |
|
"eval_PERSON_number": 150, |
|
"eval_PERSON_precision": 0.8805031446540881, |
|
"eval_PERSON_recall": 0.9333333333333333, |
|
"eval_QUANTITY_f1": 0.7500000000000001, |
|
"eval_QUANTITY_number": 33, |
|
"eval_QUANTITY_precision": 0.6923076923076923, |
|
"eval_QUANTITY_recall": 0.8181818181818182, |
|
"eval_TIME_f1": 0.8571428571428571, |
|
"eval_TIME_number": 28, |
|
"eval_TIME_precision": 0.8571428571428571, |
|
"eval_TIME_recall": 0.8571428571428571, |
|
"eval_loss": 0.1951519399881363, |
|
"eval_overall_accuracy": 0.9599903006789525, |
|
"eval_overall_f1": 0.8276797829036635, |
|
"eval_overall_precision": 0.782051282051282, |
|
"eval_overall_recall": 0.8789625360230547, |
|
"eval_runtime": 0.4039, |
|
"eval_samples_per_second": 463.014, |
|
"eval_steps_per_second": 7.428, |
|
"step": 6360 |
|
}, |
|
{ |
|
"epoch": 61.0, |
|
"grad_norm": 0.19502782821655273, |
|
"learning_rate": 1.9500000000000003e-05, |
|
"loss": 0.0178, |
|
"step": 6466 |
|
}, |
|
{ |
|
"epoch": 61.0, |
|
"eval_LOCATION_f1": 0.7638888888888888, |
|
"eval_LOCATION_number": 71, |
|
"eval_LOCATION_precision": 0.7534246575342466, |
|
"eval_LOCATION_recall": 0.7746478873239436, |
|
"eval_ORGANIZATION_f1": 0.7724137931034483, |
|
"eval_ORGANIZATION_number": 65, |
|
"eval_ORGANIZATION_precision": 0.7, |
|
"eval_ORGANIZATION_recall": 0.8615384615384616, |
|
"eval_PERSON_f1": 0.9055374592833875, |
|
"eval_PERSON_number": 150, |
|
"eval_PERSON_precision": 0.8853503184713376, |
|
"eval_PERSON_recall": 0.9266666666666666, |
|
"eval_QUANTITY_f1": 0.8450704225352113, |
|
"eval_QUANTITY_number": 33, |
|
"eval_QUANTITY_precision": 0.7894736842105263, |
|
"eval_QUANTITY_recall": 0.9090909090909091, |
|
"eval_TIME_f1": 0.8275862068965518, |
|
"eval_TIME_number": 28, |
|
"eval_TIME_precision": 0.8, |
|
"eval_TIME_recall": 0.8571428571428571, |
|
"eval_loss": 0.190224289894104, |
|
"eval_overall_accuracy": 0.962172647914646, |
|
"eval_overall_f1": 0.8386206896551723, |
|
"eval_overall_precision": 0.8042328042328042, |
|
"eval_overall_recall": 0.8760806916426513, |
|
"eval_runtime": 0.4062, |
|
"eval_samples_per_second": 460.355, |
|
"eval_steps_per_second": 7.385, |
|
"step": 6466 |
|
}, |
|
{ |
|
"epoch": 62.0, |
|
"grad_norm": 0.6164102554321289, |
|
"learning_rate": 1.9e-05, |
|
"loss": 0.0196, |
|
"step": 6572 |
|
}, |
|
{ |
|
"epoch": 62.0, |
|
"eval_LOCATION_f1": 0.778523489932886, |
|
"eval_LOCATION_number": 71, |
|
"eval_LOCATION_precision": 0.7435897435897436, |
|
"eval_LOCATION_recall": 0.8169014084507042, |
|
"eval_ORGANIZATION_f1": 0.75, |
|
"eval_ORGANIZATION_number": 65, |
|
"eval_ORGANIZATION_precision": 0.6835443037974683, |
|
"eval_ORGANIZATION_recall": 0.8307692307692308, |
|
"eval_PERSON_f1": 0.8925081433224756, |
|
"eval_PERSON_number": 150, |
|
"eval_PERSON_precision": 0.8726114649681529, |
|
"eval_PERSON_recall": 0.9133333333333333, |
|
"eval_QUANTITY_f1": 0.8055555555555556, |
|
"eval_QUANTITY_number": 33, |
|
"eval_QUANTITY_precision": 0.7435897435897436, |
|
"eval_QUANTITY_recall": 0.8787878787878788, |
|
"eval_TIME_f1": 0.8214285714285714, |
|
"eval_TIME_number": 28, |
|
"eval_TIME_precision": 0.8214285714285714, |
|
"eval_TIME_recall": 0.8214285714285714, |
|
"eval_loss": 0.18320535123348236, |
|
"eval_overall_accuracy": 0.962172647914646, |
|
"eval_overall_f1": 0.8269230769230769, |
|
"eval_overall_precision": 0.7900262467191601, |
|
"eval_overall_recall": 0.8674351585014409, |
|
"eval_runtime": 0.4026, |
|
"eval_samples_per_second": 464.456, |
|
"eval_steps_per_second": 7.451, |
|
"step": 6572 |
|
}, |
|
{ |
|
"epoch": 63.0, |
|
"grad_norm": 1.624141812324524, |
|
"learning_rate": 1.85e-05, |
|
"loss": 0.0182, |
|
"step": 6678 |
|
}, |
|
{ |
|
"epoch": 63.0, |
|
"eval_LOCATION_f1": 0.7651006711409397, |
|
"eval_LOCATION_number": 71, |
|
"eval_LOCATION_precision": 0.7307692307692307, |
|
"eval_LOCATION_recall": 0.8028169014084507, |
|
"eval_ORGANIZATION_f1": 0.7619047619047619, |
|
"eval_ORGANIZATION_number": 65, |
|
"eval_ORGANIZATION_precision": 0.6829268292682927, |
|
"eval_ORGANIZATION_recall": 0.8615384615384616, |
|
"eval_PERSON_f1": 0.8925081433224756, |
|
"eval_PERSON_number": 150, |
|
"eval_PERSON_precision": 0.8726114649681529, |
|
"eval_PERSON_recall": 0.9133333333333333, |
|
"eval_QUANTITY_f1": 0.7500000000000001, |
|
"eval_QUANTITY_number": 33, |
|
"eval_QUANTITY_precision": 0.6923076923076923, |
|
"eval_QUANTITY_recall": 0.8181818181818182, |
|
"eval_TIME_f1": 0.8421052631578947, |
|
"eval_TIME_number": 28, |
|
"eval_TIME_precision": 0.8275862068965517, |
|
"eval_TIME_recall": 0.8571428571428571, |
|
"eval_loss": 0.187962144613266, |
|
"eval_overall_accuracy": 0.9616876818622696, |
|
"eval_overall_f1": 0.8224043715846995, |
|
"eval_overall_precision": 0.7818181818181819, |
|
"eval_overall_recall": 0.8674351585014409, |
|
"eval_runtime": 0.4039, |
|
"eval_samples_per_second": 462.956, |
|
"eval_steps_per_second": 7.427, |
|
"step": 6678 |
|
}, |
|
{ |
|
"epoch": 64.0, |
|
"grad_norm": 1.540419340133667, |
|
"learning_rate": 1.8e-05, |
|
"loss": 0.0181, |
|
"step": 6784 |
|
}, |
|
{ |
|
"epoch": 64.0, |
|
"eval_LOCATION_f1": 0.7682119205298014, |
|
"eval_LOCATION_number": 71, |
|
"eval_LOCATION_precision": 0.725, |
|
"eval_LOCATION_recall": 0.8169014084507042, |
|
"eval_ORGANIZATION_f1": 0.7586206896551724, |
|
"eval_ORGANIZATION_number": 65, |
|
"eval_ORGANIZATION_precision": 0.6875, |
|
"eval_ORGANIZATION_recall": 0.8461538461538461, |
|
"eval_PERSON_f1": 0.8903225806451613, |
|
"eval_PERSON_number": 150, |
|
"eval_PERSON_precision": 0.8625, |
|
"eval_PERSON_recall": 0.92, |
|
"eval_QUANTITY_f1": 0.7777777777777778, |
|
"eval_QUANTITY_number": 33, |
|
"eval_QUANTITY_precision": 0.717948717948718, |
|
"eval_QUANTITY_recall": 0.8484848484848485, |
|
"eval_TIME_f1": 0.8275862068965518, |
|
"eval_TIME_number": 28, |
|
"eval_TIME_precision": 0.8, |
|
"eval_TIME_recall": 0.8571428571428571, |
|
"eval_loss": 0.19288307428359985, |
|
"eval_overall_accuracy": 0.9590203685741998, |
|
"eval_overall_f1": 0.8233695652173914, |
|
"eval_overall_precision": 0.7789203084832905, |
|
"eval_overall_recall": 0.8731988472622478, |
|
"eval_runtime": 0.4048, |
|
"eval_samples_per_second": 461.933, |
|
"eval_steps_per_second": 7.411, |
|
"step": 6784 |
|
}, |
|
{ |
|
"epoch": 65.0, |
|
"grad_norm": 0.8278260231018066, |
|
"learning_rate": 1.75e-05, |
|
"loss": 0.0187, |
|
"step": 6890 |
|
}, |
|
{ |
|
"epoch": 65.0, |
|
"eval_LOCATION_f1": 0.7763157894736843, |
|
"eval_LOCATION_number": 71, |
|
"eval_LOCATION_precision": 0.7283950617283951, |
|
"eval_LOCATION_recall": 0.8309859154929577, |
|
"eval_ORGANIZATION_f1": 0.7681159420289856, |
|
"eval_ORGANIZATION_number": 65, |
|
"eval_ORGANIZATION_precision": 0.726027397260274, |
|
"eval_ORGANIZATION_recall": 0.8153846153846154, |
|
"eval_PERSON_f1": 0.8990228013029316, |
|
"eval_PERSON_number": 150, |
|
"eval_PERSON_precision": 0.8789808917197452, |
|
"eval_PERSON_recall": 0.92, |
|
"eval_QUANTITY_f1": 0.7500000000000001, |
|
"eval_QUANTITY_number": 33, |
|
"eval_QUANTITY_precision": 0.6923076923076923, |
|
"eval_QUANTITY_recall": 0.8181818181818182, |
|
"eval_TIME_f1": 0.8928571428571429, |
|
"eval_TIME_number": 28, |
|
"eval_TIME_precision": 0.8928571428571429, |
|
"eval_TIME_recall": 0.8928571428571429, |
|
"eval_loss": 0.19136402010917664, |
|
"eval_overall_accuracy": 0.9614451988360815, |
|
"eval_overall_f1": 0.8331034482758621, |
|
"eval_overall_precision": 0.798941798941799, |
|
"eval_overall_recall": 0.8703170028818443, |
|
"eval_runtime": 0.4041, |
|
"eval_samples_per_second": 462.729, |
|
"eval_steps_per_second": 7.423, |
|
"step": 6890 |
|
}, |
|
{ |
|
"epoch": 66.0, |
|
"grad_norm": 1.0269757509231567, |
|
"learning_rate": 1.7000000000000003e-05, |
|
"loss": 0.016, |
|
"step": 6996 |
|
}, |
|
{ |
|
"epoch": 66.0, |
|
"eval_LOCATION_f1": 0.7712418300653594, |
|
"eval_LOCATION_number": 71, |
|
"eval_LOCATION_precision": 0.7195121951219512, |
|
"eval_LOCATION_recall": 0.8309859154929577, |
|
"eval_ORGANIZATION_f1": 0.7552447552447553, |
|
"eval_ORGANIZATION_number": 65, |
|
"eval_ORGANIZATION_precision": 0.6923076923076923, |
|
"eval_ORGANIZATION_recall": 0.8307692307692308, |
|
"eval_PERSON_f1": 0.9025974025974027, |
|
"eval_PERSON_number": 150, |
|
"eval_PERSON_precision": 0.879746835443038, |
|
"eval_PERSON_recall": 0.9266666666666666, |
|
"eval_QUANTITY_f1": 0.7397260273972603, |
|
"eval_QUANTITY_number": 33, |
|
"eval_QUANTITY_precision": 0.675, |
|
"eval_QUANTITY_recall": 0.8181818181818182, |
|
"eval_TIME_f1": 0.8275862068965518, |
|
"eval_TIME_number": 28, |
|
"eval_TIME_precision": 0.8, |
|
"eval_TIME_recall": 0.8571428571428571, |
|
"eval_loss": 0.20218557119369507, |
|
"eval_overall_accuracy": 0.9602327837051406, |
|
"eval_overall_f1": 0.8244897959183674, |
|
"eval_overall_precision": 0.7809278350515464, |
|
"eval_overall_recall": 0.8731988472622478, |
|
"eval_runtime": 0.4034, |
|
"eval_samples_per_second": 463.539, |
|
"eval_steps_per_second": 7.436, |
|
"step": 6996 |
|
}, |
|
{ |
|
"epoch": 67.0, |
|
"grad_norm": 0.6365354061126709, |
|
"learning_rate": 1.65e-05, |
|
"loss": 0.0153, |
|
"step": 7102 |
|
}, |
|
{ |
|
"epoch": 67.0, |
|
"eval_LOCATION_f1": 0.7549668874172185, |
|
"eval_LOCATION_number": 71, |
|
"eval_LOCATION_precision": 0.7125, |
|
"eval_LOCATION_recall": 0.8028169014084507, |
|
"eval_ORGANIZATION_f1": 0.757142857142857, |
|
"eval_ORGANIZATION_number": 65, |
|
"eval_ORGANIZATION_precision": 0.7066666666666667, |
|
"eval_ORGANIZATION_recall": 0.8153846153846154, |
|
"eval_PERSON_f1": 0.9096774193548387, |
|
"eval_PERSON_number": 150, |
|
"eval_PERSON_precision": 0.88125, |
|
"eval_PERSON_recall": 0.94, |
|
"eval_QUANTITY_f1": 0.8055555555555556, |
|
"eval_QUANTITY_number": 33, |
|
"eval_QUANTITY_precision": 0.7435897435897436, |
|
"eval_QUANTITY_recall": 0.8787878787878788, |
|
"eval_TIME_f1": 0.8275862068965518, |
|
"eval_TIME_number": 28, |
|
"eval_TIME_precision": 0.8, |
|
"eval_TIME_recall": 0.8571428571428571, |
|
"eval_loss": 0.19219978153705597, |
|
"eval_overall_accuracy": 0.960717749757517, |
|
"eval_overall_f1": 0.8317373461012312, |
|
"eval_overall_precision": 0.7916666666666666, |
|
"eval_overall_recall": 0.8760806916426513, |
|
"eval_runtime": 0.4029, |
|
"eval_samples_per_second": 464.137, |
|
"eval_steps_per_second": 7.446, |
|
"step": 7102 |
|
}, |
|
{ |
|
"epoch": 68.0, |
|
"grad_norm": 3.532707691192627, |
|
"learning_rate": 1.6000000000000003e-05, |
|
"loss": 0.0165, |
|
"step": 7208 |
|
}, |
|
{ |
|
"epoch": 68.0, |
|
"eval_LOCATION_f1": 0.76, |
|
"eval_LOCATION_number": 71, |
|
"eval_LOCATION_precision": 0.7215189873417721, |
|
"eval_LOCATION_recall": 0.8028169014084507, |
|
"eval_ORGANIZATION_f1": 0.7567567567567568, |
|
"eval_ORGANIZATION_number": 65, |
|
"eval_ORGANIZATION_precision": 0.6746987951807228, |
|
"eval_ORGANIZATION_recall": 0.8615384615384616, |
|
"eval_PERSON_f1": 0.9055374592833875, |
|
"eval_PERSON_number": 150, |
|
"eval_PERSON_precision": 0.8853503184713376, |
|
"eval_PERSON_recall": 0.9266666666666666, |
|
"eval_QUANTITY_f1": 0.7397260273972603, |
|
"eval_QUANTITY_number": 33, |
|
"eval_QUANTITY_precision": 0.675, |
|
"eval_QUANTITY_recall": 0.8181818181818182, |
|
"eval_TIME_f1": 0.8571428571428571, |
|
"eval_TIME_number": 28, |
|
"eval_TIME_precision": 0.8571428571428571, |
|
"eval_TIME_recall": 0.8571428571428571, |
|
"eval_loss": 0.20774675905704498, |
|
"eval_overall_accuracy": 0.9609602327837051, |
|
"eval_overall_f1": 0.8256130790190734, |
|
"eval_overall_precision": 0.7829457364341085, |
|
"eval_overall_recall": 0.8731988472622478, |
|
"eval_runtime": 0.4026, |
|
"eval_samples_per_second": 464.494, |
|
"eval_steps_per_second": 7.452, |
|
"step": 7208 |
|
}, |
|
{ |
|
"epoch": 69.0, |
|
"grad_norm": 1.3800381422042847, |
|
"learning_rate": 1.55e-05, |
|
"loss": 0.0159, |
|
"step": 7314 |
|
}, |
|
{ |
|
"epoch": 69.0, |
|
"eval_LOCATION_f1": 0.7549668874172185, |
|
"eval_LOCATION_number": 71, |
|
"eval_LOCATION_precision": 0.7125, |
|
"eval_LOCATION_recall": 0.8028169014084507, |
|
"eval_ORGANIZATION_f1": 0.75, |
|
"eval_ORGANIZATION_number": 65, |
|
"eval_ORGANIZATION_precision": 0.6835443037974683, |
|
"eval_ORGANIZATION_recall": 0.8307692307692308, |
|
"eval_PERSON_f1": 0.9090909090909091, |
|
"eval_PERSON_number": 150, |
|
"eval_PERSON_precision": 0.8860759493670886, |
|
"eval_PERSON_recall": 0.9333333333333333, |
|
"eval_QUANTITY_f1": 0.7945205479452054, |
|
"eval_QUANTITY_number": 33, |
|
"eval_QUANTITY_precision": 0.725, |
|
"eval_QUANTITY_recall": 0.8787878787878788, |
|
"eval_TIME_f1": 0.8771929824561403, |
|
"eval_TIME_number": 28, |
|
"eval_TIME_precision": 0.8620689655172413, |
|
"eval_TIME_recall": 0.8928571428571429, |
|
"eval_loss": 0.20177708566188812, |
|
"eval_overall_accuracy": 0.9619301648884578, |
|
"eval_overall_f1": 0.8321964529331515, |
|
"eval_overall_precision": 0.7901554404145078, |
|
"eval_overall_recall": 0.8789625360230547, |
|
"eval_runtime": 0.4055, |
|
"eval_samples_per_second": 461.121, |
|
"eval_steps_per_second": 7.398, |
|
"step": 7314 |
|
}, |
|
{ |
|
"epoch": 70.0, |
|
"grad_norm": 0.4369199573993683, |
|
"learning_rate": 1.5e-05, |
|
"loss": 0.0151, |
|
"step": 7420 |
|
}, |
|
{ |
|
"epoch": 70.0, |
|
"eval_LOCATION_f1": 0.7402597402597403, |
|
"eval_LOCATION_number": 71, |
|
"eval_LOCATION_precision": 0.6867469879518072, |
|
"eval_LOCATION_recall": 0.8028169014084507, |
|
"eval_ORGANIZATION_f1": 0.76056338028169, |
|
"eval_ORGANIZATION_number": 65, |
|
"eval_ORGANIZATION_precision": 0.7012987012987013, |
|
"eval_ORGANIZATION_recall": 0.8307692307692308, |
|
"eval_PERSON_f1": 0.9084967320261438, |
|
"eval_PERSON_number": 150, |
|
"eval_PERSON_precision": 0.8910256410256411, |
|
"eval_PERSON_recall": 0.9266666666666666, |
|
"eval_QUANTITY_f1": 0.7397260273972603, |
|
"eval_QUANTITY_number": 33, |
|
"eval_QUANTITY_precision": 0.675, |
|
"eval_QUANTITY_recall": 0.8181818181818182, |
|
"eval_TIME_f1": 0.8275862068965518, |
|
"eval_TIME_number": 28, |
|
"eval_TIME_precision": 0.8, |
|
"eval_TIME_recall": 0.8571428571428571, |
|
"eval_loss": 0.21934795379638672, |
|
"eval_overall_accuracy": 0.9587778855480117, |
|
"eval_overall_f1": 0.8212824010914053, |
|
"eval_overall_precision": 0.7797927461139896, |
|
"eval_overall_recall": 0.8674351585014409, |
|
"eval_runtime": 0.4045, |
|
"eval_samples_per_second": 462.289, |
|
"eval_steps_per_second": 7.416, |
|
"step": 7420 |
|
}, |
|
{ |
|
"epoch": 71.0, |
|
"grad_norm": 0.6564136743545532, |
|
"learning_rate": 1.45e-05, |
|
"loss": 0.0149, |
|
"step": 7526 |
|
}, |
|
{ |
|
"epoch": 71.0, |
|
"eval_LOCATION_f1": 0.7763157894736843, |
|
"eval_LOCATION_number": 71, |
|
"eval_LOCATION_precision": 0.7283950617283951, |
|
"eval_LOCATION_recall": 0.8309859154929577, |
|
"eval_ORGANIZATION_f1": 0.7671232876712328, |
|
"eval_ORGANIZATION_number": 65, |
|
"eval_ORGANIZATION_precision": 0.691358024691358, |
|
"eval_ORGANIZATION_recall": 0.8615384615384616, |
|
"eval_PERSON_f1": 0.9090909090909091, |
|
"eval_PERSON_number": 150, |
|
"eval_PERSON_precision": 0.8860759493670886, |
|
"eval_PERSON_recall": 0.9333333333333333, |
|
"eval_QUANTITY_f1": 0.7777777777777778, |
|
"eval_QUANTITY_number": 33, |
|
"eval_QUANTITY_precision": 0.717948717948718, |
|
"eval_QUANTITY_recall": 0.8484848484848485, |
|
"eval_TIME_f1": 0.8421052631578947, |
|
"eval_TIME_number": 28, |
|
"eval_TIME_precision": 0.8275862068965517, |
|
"eval_TIME_recall": 0.8571428571428571, |
|
"eval_loss": 0.21174688637256622, |
|
"eval_overall_accuracy": 0.9614451988360815, |
|
"eval_overall_f1": 0.8353741496598639, |
|
"eval_overall_precision": 0.7912371134020618, |
|
"eval_overall_recall": 0.8847262247838616, |
|
"eval_runtime": 0.4036, |
|
"eval_samples_per_second": 463.368, |
|
"eval_steps_per_second": 7.434, |
|
"step": 7526 |
|
}, |
|
{ |
|
"epoch": 72.0, |
|
"grad_norm": 1.1040197610855103, |
|
"learning_rate": 1.4000000000000001e-05, |
|
"loss": 0.0152, |
|
"step": 7632 |
|
}, |
|
{ |
|
"epoch": 72.0, |
|
"eval_LOCATION_f1": 0.7733333333333333, |
|
"eval_LOCATION_number": 71, |
|
"eval_LOCATION_precision": 0.7341772151898734, |
|
"eval_LOCATION_recall": 0.8169014084507042, |
|
"eval_ORGANIZATION_f1": 0.7746478873239436, |
|
"eval_ORGANIZATION_number": 65, |
|
"eval_ORGANIZATION_precision": 0.7142857142857143, |
|
"eval_ORGANIZATION_recall": 0.8461538461538461, |
|
"eval_PERSON_f1": 0.9019607843137256, |
|
"eval_PERSON_number": 150, |
|
"eval_PERSON_precision": 0.8846153846153846, |
|
"eval_PERSON_recall": 0.92, |
|
"eval_QUANTITY_f1": 0.8169014084507042, |
|
"eval_QUANTITY_number": 33, |
|
"eval_QUANTITY_precision": 0.7631578947368421, |
|
"eval_QUANTITY_recall": 0.8787878787878788, |
|
"eval_TIME_f1": 0.8363636363636364, |
|
"eval_TIME_number": 28, |
|
"eval_TIME_precision": 0.8518518518518519, |
|
"eval_TIME_recall": 0.8214285714285714, |
|
"eval_loss": 0.19948169589042664, |
|
"eval_overall_accuracy": 0.9624151309408342, |
|
"eval_overall_f1": 0.8370165745856354, |
|
"eval_overall_precision": 0.8037135278514589, |
|
"eval_overall_recall": 0.8731988472622478, |
|
"eval_runtime": 0.4055, |
|
"eval_samples_per_second": 461.114, |
|
"eval_steps_per_second": 7.398, |
|
"step": 7632 |
|
}, |
|
{ |
|
"epoch": 73.0, |
|
"grad_norm": 0.12047336250543594, |
|
"learning_rate": 1.3500000000000001e-05, |
|
"loss": 0.0149, |
|
"step": 7738 |
|
}, |
|
{ |
|
"epoch": 73.0, |
|
"eval_LOCATION_f1": 0.7612903225806451, |
|
"eval_LOCATION_number": 71, |
|
"eval_LOCATION_precision": 0.7023809523809523, |
|
"eval_LOCATION_recall": 0.8309859154929577, |
|
"eval_ORGANIZATION_f1": 0.7619047619047619, |
|
"eval_ORGANIZATION_number": 65, |
|
"eval_ORGANIZATION_precision": 0.6829268292682927, |
|
"eval_ORGANIZATION_recall": 0.8615384615384616, |
|
"eval_PERSON_f1": 0.912621359223301, |
|
"eval_PERSON_number": 150, |
|
"eval_PERSON_precision": 0.8867924528301887, |
|
"eval_PERSON_recall": 0.94, |
|
"eval_QUANTITY_f1": 0.7777777777777778, |
|
"eval_QUANTITY_number": 33, |
|
"eval_QUANTITY_precision": 0.717948717948718, |
|
"eval_QUANTITY_recall": 0.8484848484848485, |
|
"eval_TIME_f1": 0.8421052631578947, |
|
"eval_TIME_number": 28, |
|
"eval_TIME_precision": 0.8275862068965517, |
|
"eval_TIME_recall": 0.8571428571428571, |
|
"eval_loss": 0.2207670509815216, |
|
"eval_overall_accuracy": 0.9609602327837051, |
|
"eval_overall_f1": 0.8324324324324324, |
|
"eval_overall_precision": 0.7837150127226463, |
|
"eval_overall_recall": 0.8876080691642652, |
|
"eval_runtime": 0.4058, |
|
"eval_samples_per_second": 460.775, |
|
"eval_steps_per_second": 7.392, |
|
"step": 7738 |
|
}, |
|
{ |
|
"epoch": 74.0, |
|
"grad_norm": 1.3887410163879395, |
|
"learning_rate": 1.3000000000000001e-05, |
|
"loss": 0.0141, |
|
"step": 7844 |
|
}, |
|
{ |
|
"epoch": 74.0, |
|
"eval_LOCATION_f1": 0.7567567567567568, |
|
"eval_LOCATION_number": 71, |
|
"eval_LOCATION_precision": 0.7272727272727273, |
|
"eval_LOCATION_recall": 0.7887323943661971, |
|
"eval_ORGANIZATION_f1": 0.7769784172661871, |
|
"eval_ORGANIZATION_number": 65, |
|
"eval_ORGANIZATION_precision": 0.7297297297297297, |
|
"eval_ORGANIZATION_recall": 0.8307692307692308, |
|
"eval_PERSON_f1": 0.9155844155844156, |
|
"eval_PERSON_number": 150, |
|
"eval_PERSON_precision": 0.8924050632911392, |
|
"eval_PERSON_recall": 0.94, |
|
"eval_QUANTITY_f1": 0.7777777777777778, |
|
"eval_QUANTITY_number": 33, |
|
"eval_QUANTITY_precision": 0.717948717948718, |
|
"eval_QUANTITY_recall": 0.8484848484848485, |
|
"eval_TIME_f1": 0.8421052631578947, |
|
"eval_TIME_number": 28, |
|
"eval_TIME_precision": 0.8275862068965517, |
|
"eval_TIME_recall": 0.8571428571428571, |
|
"eval_loss": 0.2141115963459015, |
|
"eval_overall_accuracy": 0.9624151309408342, |
|
"eval_overall_f1": 0.8370165745856354, |
|
"eval_overall_precision": 0.8037135278514589, |
|
"eval_overall_recall": 0.8731988472622478, |
|
"eval_runtime": 0.4026, |
|
"eval_samples_per_second": 464.486, |
|
"eval_steps_per_second": 7.452, |
|
"step": 7844 |
|
}, |
|
{ |
|
"epoch": 75.0, |
|
"grad_norm": 0.22892561554908752, |
|
"learning_rate": 1.25e-05, |
|
"loss": 0.0142, |
|
"step": 7950 |
|
}, |
|
{ |
|
"epoch": 75.0, |
|
"eval_LOCATION_f1": 0.7662337662337662, |
|
"eval_LOCATION_number": 71, |
|
"eval_LOCATION_precision": 0.7108433734939759, |
|
"eval_LOCATION_recall": 0.8309859154929577, |
|
"eval_ORGANIZATION_f1": 0.7222222222222222, |
|
"eval_ORGANIZATION_number": 65, |
|
"eval_ORGANIZATION_precision": 0.6582278481012658, |
|
"eval_ORGANIZATION_recall": 0.8, |
|
"eval_PERSON_f1": 0.9055374592833875, |
|
"eval_PERSON_number": 150, |
|
"eval_PERSON_precision": 0.8853503184713376, |
|
"eval_PERSON_recall": 0.9266666666666666, |
|
"eval_QUANTITY_f1": 0.8055555555555556, |
|
"eval_QUANTITY_number": 33, |
|
"eval_QUANTITY_precision": 0.7435897435897436, |
|
"eval_QUANTITY_recall": 0.8787878787878788, |
|
"eval_TIME_f1": 0.8771929824561403, |
|
"eval_TIME_number": 28, |
|
"eval_TIME_precision": 0.8620689655172413, |
|
"eval_TIME_recall": 0.8928571428571429, |
|
"eval_loss": 0.20973996818065643, |
|
"eval_overall_accuracy": 0.9609602327837051, |
|
"eval_overall_f1": 0.8283378746594005, |
|
"eval_overall_precision": 0.7855297157622739, |
|
"eval_overall_recall": 0.8760806916426513, |
|
"eval_runtime": 0.4054, |
|
"eval_samples_per_second": 461.245, |
|
"eval_steps_per_second": 7.4, |
|
"step": 7950 |
|
}, |
|
{ |
|
"epoch": 76.0, |
|
"grad_norm": 0.28838738799095154, |
|
"learning_rate": 1.2e-05, |
|
"loss": 0.0132, |
|
"step": 8056 |
|
}, |
|
{ |
|
"epoch": 76.0, |
|
"eval_LOCATION_f1": 0.7631578947368421, |
|
"eval_LOCATION_number": 71, |
|
"eval_LOCATION_precision": 0.7160493827160493, |
|
"eval_LOCATION_recall": 0.8169014084507042, |
|
"eval_ORGANIZATION_f1": 0.7517730496453899, |
|
"eval_ORGANIZATION_number": 65, |
|
"eval_ORGANIZATION_precision": 0.6973684210526315, |
|
"eval_ORGANIZATION_recall": 0.8153846153846154, |
|
"eval_PERSON_f1": 0.9096774193548387, |
|
"eval_PERSON_number": 150, |
|
"eval_PERSON_precision": 0.88125, |
|
"eval_PERSON_recall": 0.94, |
|
"eval_QUANTITY_f1": 0.8055555555555556, |
|
"eval_QUANTITY_number": 33, |
|
"eval_QUANTITY_precision": 0.7435897435897436, |
|
"eval_QUANTITY_recall": 0.8787878787878788, |
|
"eval_TIME_f1": 0.8421052631578947, |
|
"eval_TIME_number": 28, |
|
"eval_TIME_precision": 0.8275862068965517, |
|
"eval_TIME_recall": 0.8571428571428571, |
|
"eval_loss": 0.2148653268814087, |
|
"eval_overall_accuracy": 0.9619301648884578, |
|
"eval_overall_f1": 0.8333333333333333, |
|
"eval_overall_precision": 0.7922077922077922, |
|
"eval_overall_recall": 0.8789625360230547, |
|
"eval_runtime": 0.405, |
|
"eval_samples_per_second": 461.757, |
|
"eval_steps_per_second": 7.408, |
|
"step": 8056 |
|
}, |
|
{ |
|
"epoch": 77.0, |
|
"grad_norm": 0.2209300547838211, |
|
"learning_rate": 1.1500000000000002e-05, |
|
"loss": 0.0132, |
|
"step": 8162 |
|
}, |
|
{ |
|
"epoch": 77.0, |
|
"eval_LOCATION_f1": 0.7483870967741935, |
|
"eval_LOCATION_number": 71, |
|
"eval_LOCATION_precision": 0.6904761904761905, |
|
"eval_LOCATION_recall": 0.8169014084507042, |
|
"eval_ORGANIZATION_f1": 0.7659574468085107, |
|
"eval_ORGANIZATION_number": 65, |
|
"eval_ORGANIZATION_precision": 0.7105263157894737, |
|
"eval_ORGANIZATION_recall": 0.8307692307692308, |
|
"eval_PERSON_f1": 0.912621359223301, |
|
"eval_PERSON_number": 150, |
|
"eval_PERSON_precision": 0.8867924528301887, |
|
"eval_PERSON_recall": 0.94, |
|
"eval_QUANTITY_f1": 0.7500000000000001, |
|
"eval_QUANTITY_number": 33, |
|
"eval_QUANTITY_precision": 0.6923076923076923, |
|
"eval_QUANTITY_recall": 0.8181818181818182, |
|
"eval_TIME_f1": 0.8928571428571429, |
|
"eval_TIME_number": 28, |
|
"eval_TIME_precision": 0.8928571428571429, |
|
"eval_TIME_recall": 0.8928571428571429, |
|
"eval_loss": 0.21584409475326538, |
|
"eval_overall_accuracy": 0.960717749757517, |
|
"eval_overall_f1": 0.8321964529331515, |
|
"eval_overall_precision": 0.7901554404145078, |
|
"eval_overall_recall": 0.8789625360230547, |
|
"eval_runtime": 0.4041, |
|
"eval_samples_per_second": 462.714, |
|
"eval_steps_per_second": 7.423, |
|
"step": 8162 |
|
}, |
|
{ |
|
"epoch": 78.0, |
|
"grad_norm": 0.5461943745613098, |
|
"learning_rate": 1.1000000000000001e-05, |
|
"loss": 0.0141, |
|
"step": 8268 |
|
}, |
|
{ |
|
"epoch": 78.0, |
|
"eval_LOCATION_f1": 0.7549668874172185, |
|
"eval_LOCATION_number": 71, |
|
"eval_LOCATION_precision": 0.7125, |
|
"eval_LOCATION_recall": 0.8028169014084507, |
|
"eval_ORGANIZATION_f1": 0.76056338028169, |
|
"eval_ORGANIZATION_number": 65, |
|
"eval_ORGANIZATION_precision": 0.7012987012987013, |
|
"eval_ORGANIZATION_recall": 0.8307692307692308, |
|
"eval_PERSON_f1": 0.9019607843137256, |
|
"eval_PERSON_number": 150, |
|
"eval_PERSON_precision": 0.8846153846153846, |
|
"eval_PERSON_recall": 0.92, |
|
"eval_QUANTITY_f1": 0.7671232876712328, |
|
"eval_QUANTITY_number": 33, |
|
"eval_QUANTITY_precision": 0.7, |
|
"eval_QUANTITY_recall": 0.8484848484848485, |
|
"eval_TIME_f1": 0.8421052631578947, |
|
"eval_TIME_number": 28, |
|
"eval_TIME_precision": 0.8275862068965517, |
|
"eval_TIME_recall": 0.8571428571428571, |
|
"eval_loss": 0.20878075063228607, |
|
"eval_overall_accuracy": 0.960717749757517, |
|
"eval_overall_f1": 0.8257887517146777, |
|
"eval_overall_precision": 0.7879581151832461, |
|
"eval_overall_recall": 0.8674351585014409, |
|
"eval_runtime": 0.4053, |
|
"eval_samples_per_second": 461.363, |
|
"eval_steps_per_second": 7.402, |
|
"step": 8268 |
|
}, |
|
{ |
|
"epoch": 79.0, |
|
"grad_norm": 0.6024172902107239, |
|
"learning_rate": 1.05e-05, |
|
"loss": 0.0117, |
|
"step": 8374 |
|
}, |
|
{ |
|
"epoch": 79.0, |
|
"eval_LOCATION_f1": 0.7549668874172185, |
|
"eval_LOCATION_number": 71, |
|
"eval_LOCATION_precision": 0.7125, |
|
"eval_LOCATION_recall": 0.8028169014084507, |
|
"eval_ORGANIZATION_f1": 0.7737226277372263, |
|
"eval_ORGANIZATION_number": 65, |
|
"eval_ORGANIZATION_precision": 0.7361111111111112, |
|
"eval_ORGANIZATION_recall": 0.8153846153846154, |
|
"eval_PERSON_f1": 0.9090909090909091, |
|
"eval_PERSON_number": 150, |
|
"eval_PERSON_precision": 0.8860759493670886, |
|
"eval_PERSON_recall": 0.9333333333333333, |
|
"eval_QUANTITY_f1": 0.8055555555555556, |
|
"eval_QUANTITY_number": 33, |
|
"eval_QUANTITY_precision": 0.7435897435897436, |
|
"eval_QUANTITY_recall": 0.8787878787878788, |
|
"eval_TIME_f1": 0.8421052631578947, |
|
"eval_TIME_number": 28, |
|
"eval_TIME_precision": 0.8275862068965517, |
|
"eval_TIME_recall": 0.8571428571428571, |
|
"eval_loss": 0.20918363332748413, |
|
"eval_overall_accuracy": 0.9614451988360815, |
|
"eval_overall_f1": 0.8358620689655172, |
|
"eval_overall_precision": 0.8015873015873016, |
|
"eval_overall_recall": 0.8731988472622478, |
|
"eval_runtime": 0.4026, |
|
"eval_samples_per_second": 464.472, |
|
"eval_steps_per_second": 7.451, |
|
"step": 8374 |
|
}, |
|
{ |
|
"epoch": 80.0, |
|
"grad_norm": 1.4614003896713257, |
|
"learning_rate": 1e-05, |
|
"loss": 0.0127, |
|
"step": 8480 |
|
}, |
|
{ |
|
"epoch": 80.0, |
|
"eval_LOCATION_f1": 0.7417218543046357, |
|
"eval_LOCATION_number": 71, |
|
"eval_LOCATION_precision": 0.7, |
|
"eval_LOCATION_recall": 0.7887323943661971, |
|
"eval_ORGANIZATION_f1": 0.75, |
|
"eval_ORGANIZATION_number": 65, |
|
"eval_ORGANIZATION_precision": 0.6835443037974683, |
|
"eval_ORGANIZATION_recall": 0.8307692307692308, |
|
"eval_PERSON_f1": 0.9090909090909091, |
|
"eval_PERSON_number": 150, |
|
"eval_PERSON_precision": 0.8860759493670886, |
|
"eval_PERSON_recall": 0.9333333333333333, |
|
"eval_QUANTITY_f1": 0.7777777777777778, |
|
"eval_QUANTITY_number": 33, |
|
"eval_QUANTITY_precision": 0.717948717948718, |
|
"eval_QUANTITY_recall": 0.8484848484848485, |
|
"eval_TIME_f1": 0.8727272727272727, |
|
"eval_TIME_number": 28, |
|
"eval_TIME_precision": 0.8888888888888888, |
|
"eval_TIME_recall": 0.8571428571428571, |
|
"eval_loss": 0.2205442190170288, |
|
"eval_overall_accuracy": 0.9587778855480117, |
|
"eval_overall_f1": 0.8273972602739728, |
|
"eval_overall_precision": 0.7885117493472585, |
|
"eval_overall_recall": 0.8703170028818443, |
|
"eval_runtime": 0.4027, |
|
"eval_samples_per_second": 464.311, |
|
"eval_steps_per_second": 7.449, |
|
"step": 8480 |
|
}, |
|
{ |
|
"epoch": 81.0, |
|
"grad_norm": 1.915273666381836, |
|
"learning_rate": 9.5e-06, |
|
"loss": 0.0134, |
|
"step": 8586 |
|
}, |
|
{ |
|
"epoch": 81.0, |
|
"eval_LOCATION_f1": 0.76, |
|
"eval_LOCATION_number": 71, |
|
"eval_LOCATION_precision": 0.7215189873417721, |
|
"eval_LOCATION_recall": 0.8028169014084507, |
|
"eval_ORGANIZATION_f1": 0.7737226277372263, |
|
"eval_ORGANIZATION_number": 65, |
|
"eval_ORGANIZATION_precision": 0.7361111111111112, |
|
"eval_ORGANIZATION_recall": 0.8153846153846154, |
|
"eval_PERSON_f1": 0.9090909090909091, |
|
"eval_PERSON_number": 150, |
|
"eval_PERSON_precision": 0.8860759493670886, |
|
"eval_PERSON_recall": 0.9333333333333333, |
|
"eval_QUANTITY_f1": 0.8055555555555556, |
|
"eval_QUANTITY_number": 33, |
|
"eval_QUANTITY_precision": 0.7435897435897436, |
|
"eval_QUANTITY_recall": 0.8787878787878788, |
|
"eval_TIME_f1": 0.8421052631578947, |
|
"eval_TIME_number": 28, |
|
"eval_TIME_precision": 0.8275862068965517, |
|
"eval_TIME_recall": 0.8571428571428571, |
|
"eval_loss": 0.20929260551929474, |
|
"eval_overall_accuracy": 0.9631425800193987, |
|
"eval_overall_f1": 0.8370165745856354, |
|
"eval_overall_precision": 0.8037135278514589, |
|
"eval_overall_recall": 0.8731988472622478, |
|
"eval_runtime": 0.4028, |
|
"eval_samples_per_second": 464.264, |
|
"eval_steps_per_second": 7.448, |
|
"step": 8586 |
|
}, |
|
{ |
|
"epoch": 82.0, |
|
"grad_norm": 1.0925920009613037, |
|
"learning_rate": 9e-06, |
|
"loss": 0.0138, |
|
"step": 8692 |
|
}, |
|
{ |
|
"epoch": 82.0, |
|
"eval_LOCATION_f1": 0.7682119205298014, |
|
"eval_LOCATION_number": 71, |
|
"eval_LOCATION_precision": 0.725, |
|
"eval_LOCATION_recall": 0.8169014084507042, |
|
"eval_ORGANIZATION_f1": 0.7659574468085107, |
|
"eval_ORGANIZATION_number": 65, |
|
"eval_ORGANIZATION_precision": 0.7105263157894737, |
|
"eval_ORGANIZATION_recall": 0.8307692307692308, |
|
"eval_PERSON_f1": 0.9055374592833875, |
|
"eval_PERSON_number": 150, |
|
"eval_PERSON_precision": 0.8853503184713376, |
|
"eval_PERSON_recall": 0.9266666666666666, |
|
"eval_QUANTITY_f1": 0.8055555555555556, |
|
"eval_QUANTITY_number": 33, |
|
"eval_QUANTITY_precision": 0.7435897435897436, |
|
"eval_QUANTITY_recall": 0.8787878787878788, |
|
"eval_TIME_f1": 0.8421052631578947, |
|
"eval_TIME_number": 28, |
|
"eval_TIME_precision": 0.8275862068965517, |
|
"eval_TIME_recall": 0.8571428571428571, |
|
"eval_loss": 0.20777982473373413, |
|
"eval_overall_accuracy": 0.9612027158098934, |
|
"eval_overall_f1": 0.8351648351648351, |
|
"eval_overall_precision": 0.7979002624671916, |
|
"eval_overall_recall": 0.8760806916426513, |
|
"eval_runtime": 0.404, |
|
"eval_samples_per_second": 462.894, |
|
"eval_steps_per_second": 7.426, |
|
"step": 8692 |
|
}, |
|
{ |
|
"epoch": 83.0, |
|
"grad_norm": 1.2260353565216064, |
|
"learning_rate": 8.500000000000002e-06, |
|
"loss": 0.0129, |
|
"step": 8798 |
|
}, |
|
{ |
|
"epoch": 83.0, |
|
"eval_LOCATION_f1": 0.7417218543046357, |
|
"eval_LOCATION_number": 71, |
|
"eval_LOCATION_precision": 0.7, |
|
"eval_LOCATION_recall": 0.7887323943661971, |
|
"eval_ORGANIZATION_f1": 0.7692307692307693, |
|
"eval_ORGANIZATION_number": 65, |
|
"eval_ORGANIZATION_precision": 0.7051282051282052, |
|
"eval_ORGANIZATION_recall": 0.8461538461538461, |
|
"eval_PERSON_f1": 0.8996763754045306, |
|
"eval_PERSON_number": 150, |
|
"eval_PERSON_precision": 0.8742138364779874, |
|
"eval_PERSON_recall": 0.9266666666666666, |
|
"eval_QUANTITY_f1": 0.7777777777777778, |
|
"eval_QUANTITY_number": 33, |
|
"eval_QUANTITY_precision": 0.717948717948718, |
|
"eval_QUANTITY_recall": 0.8484848484848485, |
|
"eval_TIME_f1": 0.8421052631578947, |
|
"eval_TIME_number": 28, |
|
"eval_TIME_precision": 0.8275862068965517, |
|
"eval_TIME_recall": 0.8571428571428571, |
|
"eval_loss": 0.21702027320861816, |
|
"eval_overall_accuracy": 0.9599903006789525, |
|
"eval_overall_f1": 0.825136612021858, |
|
"eval_overall_precision": 0.7844155844155845, |
|
"eval_overall_recall": 0.8703170028818443, |
|
"eval_runtime": 0.4043, |
|
"eval_samples_per_second": 462.499, |
|
"eval_steps_per_second": 7.42, |
|
"step": 8798 |
|
}, |
|
{ |
|
"epoch": 84.0, |
|
"grad_norm": 0.29825663566589355, |
|
"learning_rate": 8.000000000000001e-06, |
|
"loss": 0.0119, |
|
"step": 8904 |
|
}, |
|
{ |
|
"epoch": 84.0, |
|
"eval_LOCATION_f1": 0.7712418300653594, |
|
"eval_LOCATION_number": 71, |
|
"eval_LOCATION_precision": 0.7195121951219512, |
|
"eval_LOCATION_recall": 0.8309859154929577, |
|
"eval_ORGANIZATION_f1": 0.757142857142857, |
|
"eval_ORGANIZATION_number": 65, |
|
"eval_ORGANIZATION_precision": 0.7066666666666667, |
|
"eval_ORGANIZATION_recall": 0.8153846153846154, |
|
"eval_PERSON_f1": 0.896103896103896, |
|
"eval_PERSON_number": 150, |
|
"eval_PERSON_precision": 0.8734177215189873, |
|
"eval_PERSON_recall": 0.92, |
|
"eval_QUANTITY_f1": 0.8055555555555556, |
|
"eval_QUANTITY_number": 33, |
|
"eval_QUANTITY_precision": 0.7435897435897436, |
|
"eval_QUANTITY_recall": 0.8787878787878788, |
|
"eval_TIME_f1": 0.8421052631578947, |
|
"eval_TIME_number": 28, |
|
"eval_TIME_precision": 0.8275862068965517, |
|
"eval_TIME_recall": 0.8571428571428571, |
|
"eval_loss": 0.2102896124124527, |
|
"eval_overall_accuracy": 0.9612027158098934, |
|
"eval_overall_f1": 0.8301369863013699, |
|
"eval_overall_precision": 0.7911227154046997, |
|
"eval_overall_recall": 0.8731988472622478, |
|
"eval_runtime": 0.4038, |
|
"eval_samples_per_second": 463.06, |
|
"eval_steps_per_second": 7.429, |
|
"step": 8904 |
|
}, |
|
{ |
|
"epoch": 85.0, |
|
"grad_norm": 2.5998857021331787, |
|
"learning_rate": 7.5e-06, |
|
"loss": 0.0117, |
|
"step": 9010 |
|
}, |
|
{ |
|
"epoch": 85.0, |
|
"eval_LOCATION_f1": 0.7631578947368421, |
|
"eval_LOCATION_number": 71, |
|
"eval_LOCATION_precision": 0.7160493827160493, |
|
"eval_LOCATION_recall": 0.8169014084507042, |
|
"eval_ORGANIZATION_f1": 0.7755102040816327, |
|
"eval_ORGANIZATION_number": 65, |
|
"eval_ORGANIZATION_precision": 0.6951219512195121, |
|
"eval_ORGANIZATION_recall": 0.8769230769230769, |
|
"eval_PERSON_f1": 0.912621359223301, |
|
"eval_PERSON_number": 150, |
|
"eval_PERSON_precision": 0.8867924528301887, |
|
"eval_PERSON_recall": 0.94, |
|
"eval_QUANTITY_f1": 0.7945205479452054, |
|
"eval_QUANTITY_number": 33, |
|
"eval_QUANTITY_precision": 0.725, |
|
"eval_QUANTITY_recall": 0.8787878787878788, |
|
"eval_TIME_f1": 0.8070175438596492, |
|
"eval_TIME_number": 28, |
|
"eval_TIME_precision": 0.7931034482758621, |
|
"eval_TIME_recall": 0.8214285714285714, |
|
"eval_loss": 0.22094765305519104, |
|
"eval_overall_accuracy": 0.9597478176527643, |
|
"eval_overall_f1": 0.8346883468834688, |
|
"eval_overall_precision": 0.7877237851662404, |
|
"eval_overall_recall": 0.8876080691642652, |
|
"eval_runtime": 0.4049, |
|
"eval_samples_per_second": 461.865, |
|
"eval_steps_per_second": 7.41, |
|
"step": 9010 |
|
}, |
|
{ |
|
"epoch": 86.0, |
|
"grad_norm": 1.0339630842208862, |
|
"learning_rate": 7.000000000000001e-06, |
|
"loss": 0.0129, |
|
"step": 9116 |
|
}, |
|
{ |
|
"epoch": 86.0, |
|
"eval_LOCATION_f1": 0.7631578947368421, |
|
"eval_LOCATION_number": 71, |
|
"eval_LOCATION_precision": 0.7160493827160493, |
|
"eval_LOCATION_recall": 0.8169014084507042, |
|
"eval_ORGANIZATION_f1": 0.7659574468085107, |
|
"eval_ORGANIZATION_number": 65, |
|
"eval_ORGANIZATION_precision": 0.7105263157894737, |
|
"eval_ORGANIZATION_recall": 0.8307692307692308, |
|
"eval_PERSON_f1": 0.9155844155844156, |
|
"eval_PERSON_number": 150, |
|
"eval_PERSON_precision": 0.8924050632911392, |
|
"eval_PERSON_recall": 0.94, |
|
"eval_QUANTITY_f1": 0.8055555555555556, |
|
"eval_QUANTITY_number": 33, |
|
"eval_QUANTITY_precision": 0.7435897435897436, |
|
"eval_QUANTITY_recall": 0.8787878787878788, |
|
"eval_TIME_f1": 0.8275862068965518, |
|
"eval_TIME_number": 28, |
|
"eval_TIME_precision": 0.8, |
|
"eval_TIME_recall": 0.8571428571428571, |
|
"eval_loss": 0.2100267857313156, |
|
"eval_overall_accuracy": 0.9619301648884578, |
|
"eval_overall_f1": 0.8372093023255814, |
|
"eval_overall_precision": 0.796875, |
|
"eval_overall_recall": 0.8818443804034583, |
|
"eval_runtime": 0.4047, |
|
"eval_samples_per_second": 462.12, |
|
"eval_steps_per_second": 7.414, |
|
"step": 9116 |
|
}, |
|
{ |
|
"epoch": 87.0, |
|
"grad_norm": 0.0695308968424797, |
|
"learning_rate": 6.5000000000000004e-06, |
|
"loss": 0.0107, |
|
"step": 9222 |
|
}, |
|
{ |
|
"epoch": 87.0, |
|
"eval_LOCATION_f1": 0.7549668874172185, |
|
"eval_LOCATION_number": 71, |
|
"eval_LOCATION_precision": 0.7125, |
|
"eval_LOCATION_recall": 0.8028169014084507, |
|
"eval_ORGANIZATION_f1": 0.7692307692307693, |
|
"eval_ORGANIZATION_number": 65, |
|
"eval_ORGANIZATION_precision": 0.7051282051282052, |
|
"eval_ORGANIZATION_recall": 0.8461538461538461, |
|
"eval_PERSON_f1": 0.9155844155844156, |
|
"eval_PERSON_number": 150, |
|
"eval_PERSON_precision": 0.8924050632911392, |
|
"eval_PERSON_recall": 0.94, |
|
"eval_QUANTITY_f1": 0.8055555555555556, |
|
"eval_QUANTITY_number": 33, |
|
"eval_QUANTITY_precision": 0.7435897435897436, |
|
"eval_QUANTITY_recall": 0.8787878787878788, |
|
"eval_TIME_f1": 0.8421052631578947, |
|
"eval_TIME_number": 28, |
|
"eval_TIME_precision": 0.8275862068965517, |
|
"eval_TIME_recall": 0.8571428571428571, |
|
"eval_loss": 0.21508151292800903, |
|
"eval_overall_accuracy": 0.9616876818622696, |
|
"eval_overall_f1": 0.8372093023255814, |
|
"eval_overall_precision": 0.796875, |
|
"eval_overall_recall": 0.8818443804034583, |
|
"eval_runtime": 0.407, |
|
"eval_samples_per_second": 459.502, |
|
"eval_steps_per_second": 7.372, |
|
"step": 9222 |
|
}, |
|
{ |
|
"epoch": 88.0, |
|
"grad_norm": 1.1862696409225464, |
|
"learning_rate": 6e-06, |
|
"loss": 0.0121, |
|
"step": 9328 |
|
}, |
|
{ |
|
"epoch": 88.0, |
|
"eval_LOCATION_f1": 0.7733333333333333, |
|
"eval_LOCATION_number": 71, |
|
"eval_LOCATION_precision": 0.7341772151898734, |
|
"eval_LOCATION_recall": 0.8169014084507042, |
|
"eval_ORGANIZATION_f1": 0.7659574468085107, |
|
"eval_ORGANIZATION_number": 65, |
|
"eval_ORGANIZATION_precision": 0.7105263157894737, |
|
"eval_ORGANIZATION_recall": 0.8307692307692308, |
|
"eval_PERSON_f1": 0.8990228013029316, |
|
"eval_PERSON_number": 150, |
|
"eval_PERSON_precision": 0.8789808917197452, |
|
"eval_PERSON_recall": 0.92, |
|
"eval_QUANTITY_f1": 0.7777777777777778, |
|
"eval_QUANTITY_number": 33, |
|
"eval_QUANTITY_precision": 0.717948717948718, |
|
"eval_QUANTITY_recall": 0.8484848484848485, |
|
"eval_TIME_f1": 0.8571428571428571, |
|
"eval_TIME_number": 28, |
|
"eval_TIME_precision": 0.8571428571428571, |
|
"eval_TIME_recall": 0.8571428571428571, |
|
"eval_loss": 0.21262787282466888, |
|
"eval_overall_accuracy": 0.9614451988360815, |
|
"eval_overall_f1": 0.8319559228650137, |
|
"eval_overall_precision": 0.7968337730870713, |
|
"eval_overall_recall": 0.8703170028818443, |
|
"eval_runtime": 0.4061, |
|
"eval_samples_per_second": 460.423, |
|
"eval_steps_per_second": 7.386, |
|
"step": 9328 |
|
}, |
|
{ |
|
"epoch": 89.0, |
|
"grad_norm": 1.132206678390503, |
|
"learning_rate": 5.500000000000001e-06, |
|
"loss": 0.0104, |
|
"step": 9434 |
|
}, |
|
{ |
|
"epoch": 89.0, |
|
"eval_LOCATION_f1": 0.7733333333333333, |
|
"eval_LOCATION_number": 71, |
|
"eval_LOCATION_precision": 0.7341772151898734, |
|
"eval_LOCATION_recall": 0.8169014084507042, |
|
"eval_ORGANIZATION_f1": 0.7857142857142856, |
|
"eval_ORGANIZATION_number": 65, |
|
"eval_ORGANIZATION_precision": 0.7333333333333333, |
|
"eval_ORGANIZATION_recall": 0.8461538461538461, |
|
"eval_PERSON_f1": 0.9090909090909091, |
|
"eval_PERSON_number": 150, |
|
"eval_PERSON_precision": 0.8860759493670886, |
|
"eval_PERSON_recall": 0.9333333333333333, |
|
"eval_QUANTITY_f1": 0.7887323943661972, |
|
"eval_QUANTITY_number": 33, |
|
"eval_QUANTITY_precision": 0.7368421052631579, |
|
"eval_QUANTITY_recall": 0.8484848484848485, |
|
"eval_TIME_f1": 0.8421052631578947, |
|
"eval_TIME_number": 28, |
|
"eval_TIME_precision": 0.8275862068965517, |
|
"eval_TIME_recall": 0.8571428571428571, |
|
"eval_loss": 0.21018344163894653, |
|
"eval_overall_accuracy": 0.9631425800193987, |
|
"eval_overall_f1": 0.8402203856749312, |
|
"eval_overall_precision": 0.8047493403693932, |
|
"eval_overall_recall": 0.8789625360230547, |
|
"eval_runtime": 0.4076, |
|
"eval_samples_per_second": 458.732, |
|
"eval_steps_per_second": 7.359, |
|
"step": 9434 |
|
}, |
|
{ |
|
"epoch": 90.0, |
|
"grad_norm": 0.5784242749214172, |
|
"learning_rate": 5e-06, |
|
"loss": 0.0114, |
|
"step": 9540 |
|
}, |
|
{ |
|
"epoch": 90.0, |
|
"eval_LOCATION_f1": 0.7682119205298014, |
|
"eval_LOCATION_number": 71, |
|
"eval_LOCATION_precision": 0.725, |
|
"eval_LOCATION_recall": 0.8169014084507042, |
|
"eval_ORGANIZATION_f1": 0.7826086956521738, |
|
"eval_ORGANIZATION_number": 65, |
|
"eval_ORGANIZATION_precision": 0.7397260273972602, |
|
"eval_ORGANIZATION_recall": 0.8307692307692308, |
|
"eval_PERSON_f1": 0.9061488673139159, |
|
"eval_PERSON_number": 150, |
|
"eval_PERSON_precision": 0.8805031446540881, |
|
"eval_PERSON_recall": 0.9333333333333333, |
|
"eval_QUANTITY_f1": 0.7777777777777778, |
|
"eval_QUANTITY_number": 33, |
|
"eval_QUANTITY_precision": 0.717948717948718, |
|
"eval_QUANTITY_recall": 0.8484848484848485, |
|
"eval_TIME_f1": 0.8571428571428571, |
|
"eval_TIME_number": 28, |
|
"eval_TIME_precision": 0.8571428571428571, |
|
"eval_TIME_recall": 0.8571428571428571, |
|
"eval_loss": 0.21030160784721375, |
|
"eval_overall_accuracy": 0.9629000969932104, |
|
"eval_overall_f1": 0.837465564738292, |
|
"eval_overall_precision": 0.8021108179419525, |
|
"eval_overall_recall": 0.8760806916426513, |
|
"eval_runtime": 0.4106, |
|
"eval_samples_per_second": 455.383, |
|
"eval_steps_per_second": 7.306, |
|
"step": 9540 |
|
}, |
|
{ |
|
"epoch": 91.0, |
|
"grad_norm": 0.3709010183811188, |
|
"learning_rate": 4.5e-06, |
|
"loss": 0.0105, |
|
"step": 9646 |
|
}, |
|
{ |
|
"epoch": 91.0, |
|
"eval_LOCATION_f1": 0.7631578947368421, |
|
"eval_LOCATION_number": 71, |
|
"eval_LOCATION_precision": 0.7160493827160493, |
|
"eval_LOCATION_recall": 0.8169014084507042, |
|
"eval_ORGANIZATION_f1": 0.7769784172661871, |
|
"eval_ORGANIZATION_number": 65, |
|
"eval_ORGANIZATION_precision": 0.7297297297297297, |
|
"eval_ORGANIZATION_recall": 0.8307692307692308, |
|
"eval_PERSON_f1": 0.9061488673139159, |
|
"eval_PERSON_number": 150, |
|
"eval_PERSON_precision": 0.8805031446540881, |
|
"eval_PERSON_recall": 0.9333333333333333, |
|
"eval_QUANTITY_f1": 0.8055555555555556, |
|
"eval_QUANTITY_number": 33, |
|
"eval_QUANTITY_precision": 0.7435897435897436, |
|
"eval_QUANTITY_recall": 0.8787878787878788, |
|
"eval_TIME_f1": 0.8421052631578947, |
|
"eval_TIME_number": 28, |
|
"eval_TIME_precision": 0.8275862068965517, |
|
"eval_TIME_recall": 0.8571428571428571, |
|
"eval_loss": 0.2143879383802414, |
|
"eval_overall_accuracy": 0.9629000969932104, |
|
"eval_overall_f1": 0.8367626886145404, |
|
"eval_overall_precision": 0.7984293193717278, |
|
"eval_overall_recall": 0.8789625360230547, |
|
"eval_runtime": 0.4069, |
|
"eval_samples_per_second": 459.523, |
|
"eval_steps_per_second": 7.372, |
|
"step": 9646 |
|
}, |
|
{ |
|
"epoch": 92.0, |
|
"grad_norm": 0.19695152342319489, |
|
"learning_rate": 4.000000000000001e-06, |
|
"loss": 0.011, |
|
"step": 9752 |
|
}, |
|
{ |
|
"epoch": 92.0, |
|
"eval_LOCATION_f1": 0.75, |
|
"eval_LOCATION_number": 71, |
|
"eval_LOCATION_precision": 0.7037037037037037, |
|
"eval_LOCATION_recall": 0.8028169014084507, |
|
"eval_ORGANIZATION_f1": 0.7692307692307693, |
|
"eval_ORGANIZATION_number": 65, |
|
"eval_ORGANIZATION_precision": 0.7051282051282052, |
|
"eval_ORGANIZATION_recall": 0.8461538461538461, |
|
"eval_PERSON_f1": 0.9155844155844156, |
|
"eval_PERSON_number": 150, |
|
"eval_PERSON_precision": 0.8924050632911392, |
|
"eval_PERSON_recall": 0.94, |
|
"eval_QUANTITY_f1": 0.8055555555555556, |
|
"eval_QUANTITY_number": 33, |
|
"eval_QUANTITY_precision": 0.7435897435897436, |
|
"eval_QUANTITY_recall": 0.8787878787878788, |
|
"eval_TIME_f1": 0.8275862068965518, |
|
"eval_TIME_number": 28, |
|
"eval_TIME_precision": 0.8, |
|
"eval_TIME_recall": 0.8571428571428571, |
|
"eval_loss": 0.22280381619930267, |
|
"eval_overall_accuracy": 0.960717749757517, |
|
"eval_overall_f1": 0.834924965893588, |
|
"eval_overall_precision": 0.7927461139896373, |
|
"eval_overall_recall": 0.8818443804034583, |
|
"eval_runtime": 0.4088, |
|
"eval_samples_per_second": 457.432, |
|
"eval_steps_per_second": 7.338, |
|
"step": 9752 |
|
}, |
|
{ |
|
"epoch": 93.0, |
|
"grad_norm": 0.30122533440589905, |
|
"learning_rate": 3.5000000000000004e-06, |
|
"loss": 0.0107, |
|
"step": 9858 |
|
}, |
|
{ |
|
"epoch": 93.0, |
|
"eval_LOCATION_f1": 0.7631578947368421, |
|
"eval_LOCATION_number": 71, |
|
"eval_LOCATION_precision": 0.7160493827160493, |
|
"eval_LOCATION_recall": 0.8169014084507042, |
|
"eval_ORGANIZATION_f1": 0.7552447552447553, |
|
"eval_ORGANIZATION_number": 65, |
|
"eval_ORGANIZATION_precision": 0.6923076923076923, |
|
"eval_ORGANIZATION_recall": 0.8307692307692308, |
|
"eval_PERSON_f1": 0.9155844155844156, |
|
"eval_PERSON_number": 150, |
|
"eval_PERSON_precision": 0.8924050632911392, |
|
"eval_PERSON_recall": 0.94, |
|
"eval_QUANTITY_f1": 0.8055555555555556, |
|
"eval_QUANTITY_number": 33, |
|
"eval_QUANTITY_precision": 0.7435897435897436, |
|
"eval_QUANTITY_recall": 0.8787878787878788, |
|
"eval_TIME_f1": 0.8275862068965518, |
|
"eval_TIME_number": 28, |
|
"eval_TIME_precision": 0.8, |
|
"eval_TIME_recall": 0.8571428571428571, |
|
"eval_loss": 0.2211771309375763, |
|
"eval_overall_accuracy": 0.9609602327837051, |
|
"eval_overall_f1": 0.834924965893588, |
|
"eval_overall_precision": 0.7927461139896373, |
|
"eval_overall_recall": 0.8818443804034583, |
|
"eval_runtime": 0.4094, |
|
"eval_samples_per_second": 456.814, |
|
"eval_steps_per_second": 7.329, |
|
"step": 9858 |
|
}, |
|
{ |
|
"epoch": 94.0, |
|
"grad_norm": 0.1013573631644249, |
|
"learning_rate": 3e-06, |
|
"loss": 0.009, |
|
"step": 9964 |
|
}, |
|
{ |
|
"epoch": 94.0, |
|
"eval_LOCATION_f1": 0.7631578947368421, |
|
"eval_LOCATION_number": 71, |
|
"eval_LOCATION_precision": 0.7160493827160493, |
|
"eval_LOCATION_recall": 0.8169014084507042, |
|
"eval_ORGANIZATION_f1": 0.7586206896551724, |
|
"eval_ORGANIZATION_number": 65, |
|
"eval_ORGANIZATION_precision": 0.6875, |
|
"eval_ORGANIZATION_recall": 0.8461538461538461, |
|
"eval_PERSON_f1": 0.9155844155844156, |
|
"eval_PERSON_number": 150, |
|
"eval_PERSON_precision": 0.8924050632911392, |
|
"eval_PERSON_recall": 0.94, |
|
"eval_QUANTITY_f1": 0.8055555555555556, |
|
"eval_QUANTITY_number": 33, |
|
"eval_QUANTITY_precision": 0.7435897435897436, |
|
"eval_QUANTITY_recall": 0.8787878787878788, |
|
"eval_TIME_f1": 0.8275862068965518, |
|
"eval_TIME_number": 28, |
|
"eval_TIME_precision": 0.8, |
|
"eval_TIME_recall": 0.8571428571428571, |
|
"eval_loss": 0.2232343554496765, |
|
"eval_overall_accuracy": 0.9619301648884578, |
|
"eval_overall_f1": 0.8353741496598639, |
|
"eval_overall_precision": 0.7912371134020618, |
|
"eval_overall_recall": 0.8847262247838616, |
|
"eval_runtime": 0.4075, |
|
"eval_samples_per_second": 458.923, |
|
"eval_steps_per_second": 7.362, |
|
"step": 9964 |
|
}, |
|
{ |
|
"epoch": 95.0, |
|
"grad_norm": 1.0435041189193726, |
|
"learning_rate": 2.5e-06, |
|
"loss": 0.0109, |
|
"step": 10070 |
|
}, |
|
{ |
|
"epoch": 95.0, |
|
"eval_LOCATION_f1": 0.7450980392156863, |
|
"eval_LOCATION_number": 71, |
|
"eval_LOCATION_precision": 0.6951219512195121, |
|
"eval_LOCATION_recall": 0.8028169014084507, |
|
"eval_ORGANIZATION_f1": 0.7552447552447553, |
|
"eval_ORGANIZATION_number": 65, |
|
"eval_ORGANIZATION_precision": 0.6923076923076923, |
|
"eval_ORGANIZATION_recall": 0.8307692307692308, |
|
"eval_PERSON_f1": 0.9120521172638437, |
|
"eval_PERSON_number": 150, |
|
"eval_PERSON_precision": 0.89171974522293, |
|
"eval_PERSON_recall": 0.9333333333333333, |
|
"eval_QUANTITY_f1": 0.7777777777777778, |
|
"eval_QUANTITY_number": 33, |
|
"eval_QUANTITY_precision": 0.717948717948718, |
|
"eval_QUANTITY_recall": 0.8484848484848485, |
|
"eval_TIME_f1": 0.8771929824561403, |
|
"eval_TIME_number": 28, |
|
"eval_TIME_precision": 0.8620689655172413, |
|
"eval_TIME_recall": 0.8928571428571429, |
|
"eval_loss": 0.22744058072566986, |
|
"eval_overall_accuracy": 0.9592628516003879, |
|
"eval_overall_f1": 0.8306010928961749, |
|
"eval_overall_precision": 0.7896103896103897, |
|
"eval_overall_recall": 0.8760806916426513, |
|
"eval_runtime": 0.407, |
|
"eval_samples_per_second": 459.405, |
|
"eval_steps_per_second": 7.37, |
|
"step": 10070 |
|
}, |
|
{ |
|
"epoch": 96.0, |
|
"grad_norm": 4.114624500274658, |
|
"learning_rate": 2.0000000000000003e-06, |
|
"loss": 0.0098, |
|
"step": 10176 |
|
}, |
|
{ |
|
"epoch": 96.0, |
|
"eval_LOCATION_f1": 0.7631578947368421, |
|
"eval_LOCATION_number": 71, |
|
"eval_LOCATION_precision": 0.7160493827160493, |
|
"eval_LOCATION_recall": 0.8169014084507042, |
|
"eval_ORGANIZATION_f1": 0.7692307692307693, |
|
"eval_ORGANIZATION_number": 65, |
|
"eval_ORGANIZATION_precision": 0.7051282051282052, |
|
"eval_ORGANIZATION_recall": 0.8461538461538461, |
|
"eval_PERSON_f1": 0.9155844155844156, |
|
"eval_PERSON_number": 150, |
|
"eval_PERSON_precision": 0.8924050632911392, |
|
"eval_PERSON_recall": 0.94, |
|
"eval_QUANTITY_f1": 0.7777777777777778, |
|
"eval_QUANTITY_number": 33, |
|
"eval_QUANTITY_precision": 0.717948717948718, |
|
"eval_QUANTITY_recall": 0.8484848484848485, |
|
"eval_TIME_f1": 0.8771929824561403, |
|
"eval_TIME_number": 28, |
|
"eval_TIME_precision": 0.8620689655172413, |
|
"eval_TIME_recall": 0.8928571428571429, |
|
"eval_loss": 0.22330667078495026, |
|
"eval_overall_accuracy": 0.9614451988360815, |
|
"eval_overall_f1": 0.8387978142076504, |
|
"eval_overall_precision": 0.7974025974025974, |
|
"eval_overall_recall": 0.8847262247838616, |
|
"eval_runtime": 0.4058, |
|
"eval_samples_per_second": 460.857, |
|
"eval_steps_per_second": 7.393, |
|
"step": 10176 |
|
}, |
|
{ |
|
"epoch": 97.0, |
|
"grad_norm": 0.8480021953582764, |
|
"learning_rate": 1.5e-06, |
|
"loss": 0.0103, |
|
"step": 10282 |
|
}, |
|
{ |
|
"epoch": 97.0, |
|
"eval_LOCATION_f1": 0.7549668874172185, |
|
"eval_LOCATION_number": 71, |
|
"eval_LOCATION_precision": 0.7125, |
|
"eval_LOCATION_recall": 0.8028169014084507, |
|
"eval_ORGANIZATION_f1": 0.763888888888889, |
|
"eval_ORGANIZATION_number": 65, |
|
"eval_ORGANIZATION_precision": 0.6962025316455697, |
|
"eval_ORGANIZATION_recall": 0.8461538461538461, |
|
"eval_PERSON_f1": 0.9061488673139159, |
|
"eval_PERSON_number": 150, |
|
"eval_PERSON_precision": 0.8805031446540881, |
|
"eval_PERSON_recall": 0.9333333333333333, |
|
"eval_QUANTITY_f1": 0.7777777777777778, |
|
"eval_QUANTITY_number": 33, |
|
"eval_QUANTITY_precision": 0.717948717948718, |
|
"eval_QUANTITY_recall": 0.8484848484848485, |
|
"eval_TIME_f1": 0.8275862068965518, |
|
"eval_TIME_number": 28, |
|
"eval_TIME_precision": 0.8, |
|
"eval_TIME_recall": 0.8571428571428571, |
|
"eval_loss": 0.22035245597362518, |
|
"eval_overall_accuracy": 0.9609602327837051, |
|
"eval_overall_f1": 0.8283378746594005, |
|
"eval_overall_precision": 0.7855297157622739, |
|
"eval_overall_recall": 0.8760806916426513, |
|
"eval_runtime": 0.4072, |
|
"eval_samples_per_second": 459.182, |
|
"eval_steps_per_second": 7.367, |
|
"step": 10282 |
|
}, |
|
{ |
|
"epoch": 98.0, |
|
"grad_norm": 0.7559491395950317, |
|
"learning_rate": 1.0000000000000002e-06, |
|
"loss": 0.0102, |
|
"step": 10388 |
|
}, |
|
{ |
|
"epoch": 98.0, |
|
"eval_LOCATION_f1": 0.7682119205298014, |
|
"eval_LOCATION_number": 71, |
|
"eval_LOCATION_precision": 0.725, |
|
"eval_LOCATION_recall": 0.8169014084507042, |
|
"eval_ORGANIZATION_f1": 0.763888888888889, |
|
"eval_ORGANIZATION_number": 65, |
|
"eval_ORGANIZATION_precision": 0.6962025316455697, |
|
"eval_ORGANIZATION_recall": 0.8461538461538461, |
|
"eval_PERSON_f1": 0.9155844155844156, |
|
"eval_PERSON_number": 150, |
|
"eval_PERSON_precision": 0.8924050632911392, |
|
"eval_PERSON_recall": 0.94, |
|
"eval_QUANTITY_f1": 0.7777777777777778, |
|
"eval_QUANTITY_number": 33, |
|
"eval_QUANTITY_precision": 0.717948717948718, |
|
"eval_QUANTITY_recall": 0.8484848484848485, |
|
"eval_TIME_f1": 0.8275862068965518, |
|
"eval_TIME_number": 28, |
|
"eval_TIME_precision": 0.8, |
|
"eval_TIME_recall": 0.8571428571428571, |
|
"eval_loss": 0.2218533307313919, |
|
"eval_overall_accuracy": 0.9612027158098934, |
|
"eval_overall_f1": 0.834924965893588, |
|
"eval_overall_precision": 0.7927461139896373, |
|
"eval_overall_recall": 0.8818443804034583, |
|
"eval_runtime": 0.4081, |
|
"eval_samples_per_second": 458.203, |
|
"eval_steps_per_second": 7.351, |
|
"step": 10388 |
|
}, |
|
{ |
|
"epoch": 99.0, |
|
"grad_norm": 0.24367158114910126, |
|
"learning_rate": 5.000000000000001e-07, |
|
"loss": 0.0094, |
|
"step": 10494 |
|
}, |
|
{ |
|
"epoch": 99.0, |
|
"eval_LOCATION_f1": 0.7549668874172185, |
|
"eval_LOCATION_number": 71, |
|
"eval_LOCATION_precision": 0.7125, |
|
"eval_LOCATION_recall": 0.8028169014084507, |
|
"eval_ORGANIZATION_f1": 0.763888888888889, |
|
"eval_ORGANIZATION_number": 65, |
|
"eval_ORGANIZATION_precision": 0.6962025316455697, |
|
"eval_ORGANIZATION_recall": 0.8461538461538461, |
|
"eval_PERSON_f1": 0.9155844155844156, |
|
"eval_PERSON_number": 150, |
|
"eval_PERSON_precision": 0.8924050632911392, |
|
"eval_PERSON_recall": 0.94, |
|
"eval_QUANTITY_f1": 0.7777777777777778, |
|
"eval_QUANTITY_number": 33, |
|
"eval_QUANTITY_precision": 0.717948717948718, |
|
"eval_QUANTITY_recall": 0.8484848484848485, |
|
"eval_TIME_f1": 0.8275862068965518, |
|
"eval_TIME_number": 28, |
|
"eval_TIME_precision": 0.8, |
|
"eval_TIME_recall": 0.8571428571428571, |
|
"eval_loss": 0.22336292266845703, |
|
"eval_overall_accuracy": 0.9609602327837051, |
|
"eval_overall_f1": 0.8321964529331515, |
|
"eval_overall_precision": 0.7901554404145078, |
|
"eval_overall_recall": 0.8789625360230547, |
|
"eval_runtime": 0.4081, |
|
"eval_samples_per_second": 458.197, |
|
"eval_steps_per_second": 7.351, |
|
"step": 10494 |
|
}, |
|
{ |
|
"epoch": 100.0, |
|
"grad_norm": 0.0760447159409523, |
|
"learning_rate": 0.0, |
|
"loss": 0.0098, |
|
"step": 10600 |
|
}, |
|
{ |
|
"epoch": 100.0, |
|
"eval_LOCATION_f1": 0.7682119205298014, |
|
"eval_LOCATION_number": 71, |
|
"eval_LOCATION_precision": 0.725, |
|
"eval_LOCATION_recall": 0.8169014084507042, |
|
"eval_ORGANIZATION_f1": 0.763888888888889, |
|
"eval_ORGANIZATION_number": 65, |
|
"eval_ORGANIZATION_precision": 0.6962025316455697, |
|
"eval_ORGANIZATION_recall": 0.8461538461538461, |
|
"eval_PERSON_f1": 0.9155844155844156, |
|
"eval_PERSON_number": 150, |
|
"eval_PERSON_precision": 0.8924050632911392, |
|
"eval_PERSON_recall": 0.94, |
|
"eval_QUANTITY_f1": 0.7777777777777778, |
|
"eval_QUANTITY_number": 33, |
|
"eval_QUANTITY_precision": 0.717948717948718, |
|
"eval_QUANTITY_recall": 0.8484848484848485, |
|
"eval_TIME_f1": 0.8275862068965518, |
|
"eval_TIME_number": 28, |
|
"eval_TIME_precision": 0.8, |
|
"eval_TIME_recall": 0.8571428571428571, |
|
"eval_loss": 0.22373317182064056, |
|
"eval_overall_accuracy": 0.9612027158098934, |
|
"eval_overall_f1": 0.834924965893588, |
|
"eval_overall_precision": 0.7927461139896373, |
|
"eval_overall_recall": 0.8818443804034583, |
|
"eval_runtime": 0.4055, |
|
"eval_samples_per_second": 461.127, |
|
"eval_steps_per_second": 7.398, |
|
"step": 10600 |
|
}, |
|
{ |
|
"epoch": 100.0, |
|
"step": 10600, |
|
"total_flos": 5189413292285520.0, |
|
"train_loss": 0.055730826843459653, |
|
"train_runtime": 962.8691, |
|
"train_samples_per_second": 175.309, |
|
"train_steps_per_second": 11.009 |
|
} |
|
], |
|
"logging_steps": 500, |
|
"max_steps": 10600, |
|
"num_input_tokens_seen": 0, |
|
"num_train_epochs": 100, |
|
"save_steps": 500, |
|
"total_flos": 5189413292285520.0, |
|
"train_batch_size": 16, |
|
"trial_name": null, |
|
"trial_params": null |
|
} |
|
|