|
{ |
|
"best_metric": null, |
|
"best_model_checkpoint": null, |
|
"epoch": 100.0, |
|
"eval_steps": 500, |
|
"global_step": 10600, |
|
"is_hyper_param_search": false, |
|
"is_local_process_zero": true, |
|
"is_world_process_zero": true, |
|
"log_history": [ |
|
{ |
|
"epoch": 1.0, |
|
"grad_norm": 0.9845661520957947, |
|
"learning_rate": 4.9500000000000004e-05, |
|
"loss": 0.9292, |
|
"step": 106 |
|
}, |
|
{ |
|
"epoch": 1.0, |
|
"eval_LOCATION_f1": 0.0, |
|
"eval_LOCATION_number": 69, |
|
"eval_LOCATION_precision": 0.0, |
|
"eval_LOCATION_recall": 0.0, |
|
"eval_ORGANIZATION_f1": 0.0, |
|
"eval_ORGANIZATION_number": 58, |
|
"eval_ORGANIZATION_precision": 0.0, |
|
"eval_ORGANIZATION_recall": 0.0, |
|
"eval_PERSON_f1": 0.012903225806451613, |
|
"eval_PERSON_number": 152, |
|
"eval_PERSON_precision": 0.3333333333333333, |
|
"eval_PERSON_recall": 0.006578947368421052, |
|
"eval_QUANTITY_f1": 0.0, |
|
"eval_QUANTITY_number": 30, |
|
"eval_QUANTITY_precision": 0.0, |
|
"eval_QUANTITY_recall": 0.0, |
|
"eval_TIME_f1": 0.0, |
|
"eval_TIME_number": 29, |
|
"eval_TIME_precision": 0.0, |
|
"eval_TIME_recall": 0.0, |
|
"eval_loss": 0.6127339601516724, |
|
"eval_overall_accuracy": 0.8399487836107554, |
|
"eval_overall_f1": 0.005865102639296187, |
|
"eval_overall_precision": 0.3333333333333333, |
|
"eval_overall_recall": 0.0029585798816568047, |
|
"eval_runtime": 0.7389, |
|
"eval_samples_per_second": 253.078, |
|
"eval_steps_per_second": 4.06, |
|
"step": 106 |
|
}, |
|
{ |
|
"epoch": 2.0, |
|
"grad_norm": 1.0367096662521362, |
|
"learning_rate": 4.9e-05, |
|
"loss": 0.5076, |
|
"step": 212 |
|
}, |
|
{ |
|
"epoch": 2.0, |
|
"eval_LOCATION_f1": 0.3577235772357724, |
|
"eval_LOCATION_number": 69, |
|
"eval_LOCATION_precision": 0.4074074074074074, |
|
"eval_LOCATION_recall": 0.3188405797101449, |
|
"eval_ORGANIZATION_f1": 0.11235955056179776, |
|
"eval_ORGANIZATION_number": 58, |
|
"eval_ORGANIZATION_precision": 0.16129032258064516, |
|
"eval_ORGANIZATION_recall": 0.08620689655172414, |
|
"eval_PERSON_f1": 0.6703601108033241, |
|
"eval_PERSON_number": 152, |
|
"eval_PERSON_precision": 0.5789473684210527, |
|
"eval_PERSON_recall": 0.7960526315789473, |
|
"eval_QUANTITY_f1": 0.0, |
|
"eval_QUANTITY_number": 30, |
|
"eval_QUANTITY_precision": 0.0, |
|
"eval_QUANTITY_recall": 0.0, |
|
"eval_TIME_f1": 0.4918032786885246, |
|
"eval_TIME_number": 29, |
|
"eval_TIME_precision": 0.46875, |
|
"eval_TIME_recall": 0.5172413793103449, |
|
"eval_loss": 0.33459725975990295, |
|
"eval_overall_accuracy": 0.9044814340588988, |
|
"eval_overall_f1": 0.48082595870206496, |
|
"eval_overall_precision": 0.47941176470588237, |
|
"eval_overall_recall": 0.4822485207100592, |
|
"eval_runtime": 0.7528, |
|
"eval_samples_per_second": 248.397, |
|
"eval_steps_per_second": 3.985, |
|
"step": 212 |
|
}, |
|
{ |
|
"epoch": 3.0, |
|
"grad_norm": 1.3818385601043701, |
|
"learning_rate": 4.85e-05, |
|
"loss": 0.2907, |
|
"step": 318 |
|
}, |
|
{ |
|
"epoch": 3.0, |
|
"eval_LOCATION_f1": 0.6705882352941176, |
|
"eval_LOCATION_number": 69, |
|
"eval_LOCATION_precision": 0.5643564356435643, |
|
"eval_LOCATION_recall": 0.8260869565217391, |
|
"eval_ORGANIZATION_f1": 0.39682539682539686, |
|
"eval_ORGANIZATION_number": 58, |
|
"eval_ORGANIZATION_precision": 0.36764705882352944, |
|
"eval_ORGANIZATION_recall": 0.43103448275862066, |
|
"eval_PERSON_f1": 0.8085106382978723, |
|
"eval_PERSON_number": 152, |
|
"eval_PERSON_precision": 0.751412429378531, |
|
"eval_PERSON_recall": 0.875, |
|
"eval_QUANTITY_f1": 0.605263157894737, |
|
"eval_QUANTITY_number": 30, |
|
"eval_QUANTITY_precision": 0.5, |
|
"eval_QUANTITY_recall": 0.7666666666666667, |
|
"eval_TIME_f1": 0.7999999999999999, |
|
"eval_TIME_number": 29, |
|
"eval_TIME_precision": 0.7741935483870968, |
|
"eval_TIME_recall": 0.8275862068965517, |
|
"eval_loss": 0.1991610825061798, |
|
"eval_overall_accuracy": 0.9323943661971831, |
|
"eval_overall_f1": 0.6885676741130091, |
|
"eval_overall_precision": 0.6193853427895981, |
|
"eval_overall_recall": 0.7751479289940828, |
|
"eval_runtime": 0.7451, |
|
"eval_samples_per_second": 250.989, |
|
"eval_steps_per_second": 4.027, |
|
"step": 318 |
|
}, |
|
{ |
|
"epoch": 4.0, |
|
"grad_norm": 2.382436513900757, |
|
"learning_rate": 4.8e-05, |
|
"loss": 0.1931, |
|
"step": 424 |
|
}, |
|
{ |
|
"epoch": 4.0, |
|
"eval_LOCATION_f1": 0.7875, |
|
"eval_LOCATION_number": 69, |
|
"eval_LOCATION_precision": 0.6923076923076923, |
|
"eval_LOCATION_recall": 0.9130434782608695, |
|
"eval_ORGANIZATION_f1": 0.6323529411764706, |
|
"eval_ORGANIZATION_number": 58, |
|
"eval_ORGANIZATION_precision": 0.5512820512820513, |
|
"eval_ORGANIZATION_recall": 0.7413793103448276, |
|
"eval_PERSON_f1": 0.7896253602305474, |
|
"eval_PERSON_number": 152, |
|
"eval_PERSON_precision": 0.7025641025641025, |
|
"eval_PERSON_recall": 0.9013157894736842, |
|
"eval_QUANTITY_f1": 0.6410256410256411, |
|
"eval_QUANTITY_number": 30, |
|
"eval_QUANTITY_precision": 0.5208333333333334, |
|
"eval_QUANTITY_recall": 0.8333333333333334, |
|
"eval_TIME_f1": 0.6133333333333334, |
|
"eval_TIME_number": 29, |
|
"eval_TIME_precision": 0.5, |
|
"eval_TIME_recall": 0.7931034482758621, |
|
"eval_loss": 0.190628781914711, |
|
"eval_overall_accuracy": 0.9352112676056338, |
|
"eval_overall_f1": 0.7311557788944725, |
|
"eval_overall_precision": 0.6353711790393013, |
|
"eval_overall_recall": 0.8609467455621301, |
|
"eval_runtime": 0.7563, |
|
"eval_samples_per_second": 247.259, |
|
"eval_steps_per_second": 3.967, |
|
"step": 424 |
|
}, |
|
{ |
|
"epoch": 5.0, |
|
"grad_norm": 1.9061810970306396, |
|
"learning_rate": 4.75e-05, |
|
"loss": 0.1671, |
|
"step": 530 |
|
}, |
|
{ |
|
"epoch": 5.0, |
|
"eval_LOCATION_f1": 0.7832167832167832, |
|
"eval_LOCATION_number": 69, |
|
"eval_LOCATION_precision": 0.7567567567567568, |
|
"eval_LOCATION_recall": 0.8115942028985508, |
|
"eval_ORGANIZATION_f1": 0.6714285714285714, |
|
"eval_ORGANIZATION_number": 58, |
|
"eval_ORGANIZATION_precision": 0.573170731707317, |
|
"eval_ORGANIZATION_recall": 0.8103448275862069, |
|
"eval_PERSON_f1": 0.8535825545171339, |
|
"eval_PERSON_number": 152, |
|
"eval_PERSON_precision": 0.8106508875739645, |
|
"eval_PERSON_recall": 0.9013157894736842, |
|
"eval_QUANTITY_f1": 0.7826086956521738, |
|
"eval_QUANTITY_number": 30, |
|
"eval_QUANTITY_precision": 0.6923076923076923, |
|
"eval_QUANTITY_recall": 0.9, |
|
"eval_TIME_f1": 0.847457627118644, |
|
"eval_TIME_number": 29, |
|
"eval_TIME_precision": 0.8333333333333334, |
|
"eval_TIME_recall": 0.8620689655172413, |
|
"eval_loss": 0.13657993078231812, |
|
"eval_overall_accuracy": 0.953393085787452, |
|
"eval_overall_f1": 0.7978142076502731, |
|
"eval_overall_precision": 0.7411167512690355, |
|
"eval_overall_recall": 0.863905325443787, |
|
"eval_runtime": 0.768, |
|
"eval_samples_per_second": 243.498, |
|
"eval_steps_per_second": 3.906, |
|
"step": 530 |
|
}, |
|
{ |
|
"epoch": 6.0, |
|
"grad_norm": 1.6724838018417358, |
|
"learning_rate": 4.7e-05, |
|
"loss": 0.1438, |
|
"step": 636 |
|
}, |
|
{ |
|
"epoch": 6.0, |
|
"eval_LOCATION_f1": 0.7564102564102564, |
|
"eval_LOCATION_number": 69, |
|
"eval_LOCATION_precision": 0.6781609195402298, |
|
"eval_LOCATION_recall": 0.855072463768116, |
|
"eval_ORGANIZATION_f1": 0.6231884057971016, |
|
"eval_ORGANIZATION_number": 58, |
|
"eval_ORGANIZATION_precision": 0.5375, |
|
"eval_ORGANIZATION_recall": 0.7413793103448276, |
|
"eval_PERSON_f1": 0.8430769230769231, |
|
"eval_PERSON_number": 152, |
|
"eval_PERSON_precision": 0.791907514450867, |
|
"eval_PERSON_recall": 0.9013157894736842, |
|
"eval_QUANTITY_f1": 0.7246376811594204, |
|
"eval_QUANTITY_number": 30, |
|
"eval_QUANTITY_precision": 0.6410256410256411, |
|
"eval_QUANTITY_recall": 0.8333333333333334, |
|
"eval_TIME_f1": 0.71875, |
|
"eval_TIME_number": 29, |
|
"eval_TIME_precision": 0.6571428571428571, |
|
"eval_TIME_recall": 0.7931034482758621, |
|
"eval_loss": 0.13694226741790771, |
|
"eval_overall_accuracy": 0.9528809218950064, |
|
"eval_overall_f1": 0.7632978723404256, |
|
"eval_overall_precision": 0.6932367149758454, |
|
"eval_overall_recall": 0.849112426035503, |
|
"eval_runtime": 0.846, |
|
"eval_samples_per_second": 221.028, |
|
"eval_steps_per_second": 3.546, |
|
"step": 636 |
|
}, |
|
{ |
|
"epoch": 7.0, |
|
"grad_norm": 0.49843528866767883, |
|
"learning_rate": 4.6500000000000005e-05, |
|
"loss": 0.1337, |
|
"step": 742 |
|
}, |
|
{ |
|
"epoch": 7.0, |
|
"eval_LOCATION_f1": 0.7712418300653594, |
|
"eval_LOCATION_number": 69, |
|
"eval_LOCATION_precision": 0.7023809523809523, |
|
"eval_LOCATION_recall": 0.855072463768116, |
|
"eval_ORGANIZATION_f1": 0.6557377049180328, |
|
"eval_ORGANIZATION_number": 58, |
|
"eval_ORGANIZATION_precision": 0.625, |
|
"eval_ORGANIZATION_recall": 0.6896551724137931, |
|
"eval_PERSON_f1": 0.8679245283018868, |
|
"eval_PERSON_number": 152, |
|
"eval_PERSON_precision": 0.8313253012048193, |
|
"eval_PERSON_recall": 0.9078947368421053, |
|
"eval_QUANTITY_f1": 0.7352941176470588, |
|
"eval_QUANTITY_number": 30, |
|
"eval_QUANTITY_precision": 0.6578947368421053, |
|
"eval_QUANTITY_recall": 0.8333333333333334, |
|
"eval_TIME_f1": 0.8333333333333334, |
|
"eval_TIME_number": 29, |
|
"eval_TIME_precision": 0.8064516129032258, |
|
"eval_TIME_recall": 0.8620689655172413, |
|
"eval_loss": 0.12538817524909973, |
|
"eval_overall_accuracy": 0.9585147247119078, |
|
"eval_overall_f1": 0.796116504854369, |
|
"eval_overall_precision": 0.7493472584856397, |
|
"eval_overall_recall": 0.849112426035503, |
|
"eval_runtime": 0.8252, |
|
"eval_samples_per_second": 226.607, |
|
"eval_steps_per_second": 3.635, |
|
"step": 742 |
|
}, |
|
{ |
|
"epoch": 8.0, |
|
"grad_norm": 0.4025654196739197, |
|
"learning_rate": 4.600000000000001e-05, |
|
"loss": 0.1244, |
|
"step": 848 |
|
}, |
|
{ |
|
"epoch": 8.0, |
|
"eval_LOCATION_f1": 0.8275862068965517, |
|
"eval_LOCATION_number": 69, |
|
"eval_LOCATION_precision": 0.7894736842105263, |
|
"eval_LOCATION_recall": 0.8695652173913043, |
|
"eval_ORGANIZATION_f1": 0.6825396825396826, |
|
"eval_ORGANIZATION_number": 58, |
|
"eval_ORGANIZATION_precision": 0.6323529411764706, |
|
"eval_ORGANIZATION_recall": 0.7413793103448276, |
|
"eval_PERSON_f1": 0.8769716088328074, |
|
"eval_PERSON_number": 152, |
|
"eval_PERSON_precision": 0.8424242424242424, |
|
"eval_PERSON_recall": 0.9144736842105263, |
|
"eval_QUANTITY_f1": 0.6875, |
|
"eval_QUANTITY_number": 30, |
|
"eval_QUANTITY_precision": 0.6470588235294118, |
|
"eval_QUANTITY_recall": 0.7333333333333333, |
|
"eval_TIME_f1": 0.7540983606557378, |
|
"eval_TIME_number": 29, |
|
"eval_TIME_precision": 0.71875, |
|
"eval_TIME_recall": 0.7931034482758621, |
|
"eval_loss": 0.12903648614883423, |
|
"eval_overall_accuracy": 0.9572343149807938, |
|
"eval_overall_f1": 0.8050490883590464, |
|
"eval_overall_precision": 0.7653333333333333, |
|
"eval_overall_recall": 0.849112426035503, |
|
"eval_runtime": 0.8305, |
|
"eval_samples_per_second": 225.153, |
|
"eval_steps_per_second": 3.612, |
|
"step": 848 |
|
}, |
|
{ |
|
"epoch": 9.0, |
|
"grad_norm": 1.2503007650375366, |
|
"learning_rate": 4.55e-05, |
|
"loss": 0.1195, |
|
"step": 954 |
|
}, |
|
{ |
|
"epoch": 9.0, |
|
"eval_LOCATION_f1": 0.8243243243243245, |
|
"eval_LOCATION_number": 69, |
|
"eval_LOCATION_precision": 0.7721518987341772, |
|
"eval_LOCATION_recall": 0.8840579710144928, |
|
"eval_ORGANIZATION_f1": 0.6875, |
|
"eval_ORGANIZATION_number": 58, |
|
"eval_ORGANIZATION_precision": 0.6285714285714286, |
|
"eval_ORGANIZATION_recall": 0.7586206896551724, |
|
"eval_PERSON_f1": 0.8598130841121495, |
|
"eval_PERSON_number": 152, |
|
"eval_PERSON_precision": 0.8165680473372781, |
|
"eval_PERSON_recall": 0.9078947368421053, |
|
"eval_QUANTITY_f1": 0.7692307692307692, |
|
"eval_QUANTITY_number": 30, |
|
"eval_QUANTITY_precision": 0.7142857142857143, |
|
"eval_QUANTITY_recall": 0.8333333333333334, |
|
"eval_TIME_f1": 0.8064516129032258, |
|
"eval_TIME_number": 29, |
|
"eval_TIME_precision": 0.7575757575757576, |
|
"eval_TIME_recall": 0.8620689655172413, |
|
"eval_loss": 0.12411422282457352, |
|
"eval_overall_accuracy": 0.9592829705505762, |
|
"eval_overall_f1": 0.8093922651933702, |
|
"eval_overall_precision": 0.7590673575129534, |
|
"eval_overall_recall": 0.8668639053254438, |
|
"eval_runtime": 0.8548, |
|
"eval_samples_per_second": 218.761, |
|
"eval_steps_per_second": 3.51, |
|
"step": 954 |
|
}, |
|
{ |
|
"epoch": 10.0, |
|
"grad_norm": 1.5948196649551392, |
|
"learning_rate": 4.5e-05, |
|
"loss": 0.1083, |
|
"step": 1060 |
|
}, |
|
{ |
|
"epoch": 10.0, |
|
"eval_LOCATION_f1": 0.7973856209150327, |
|
"eval_LOCATION_number": 69, |
|
"eval_LOCATION_precision": 0.7261904761904762, |
|
"eval_LOCATION_recall": 0.8840579710144928, |
|
"eval_ORGANIZATION_f1": 0.6875, |
|
"eval_ORGANIZATION_number": 58, |
|
"eval_ORGANIZATION_precision": 0.6285714285714286, |
|
"eval_ORGANIZATION_recall": 0.7586206896551724, |
|
"eval_PERSON_f1": 0.8761904761904762, |
|
"eval_PERSON_number": 152, |
|
"eval_PERSON_precision": 0.8466257668711656, |
|
"eval_PERSON_recall": 0.9078947368421053, |
|
"eval_QUANTITY_f1": 0.7575757575757577, |
|
"eval_QUANTITY_number": 30, |
|
"eval_QUANTITY_precision": 0.6944444444444444, |
|
"eval_QUANTITY_recall": 0.8333333333333334, |
|
"eval_TIME_f1": 0.8135593220338982, |
|
"eval_TIME_number": 29, |
|
"eval_TIME_precision": 0.8, |
|
"eval_TIME_recall": 0.8275862068965517, |
|
"eval_loss": 0.12625408172607422, |
|
"eval_overall_accuracy": 0.9592829705505762, |
|
"eval_overall_f1": 0.8099861303744799, |
|
"eval_overall_precision": 0.762402088772846, |
|
"eval_overall_recall": 0.863905325443787, |
|
"eval_runtime": 0.9354, |
|
"eval_samples_per_second": 199.908, |
|
"eval_steps_per_second": 3.207, |
|
"step": 1060 |
|
}, |
|
{ |
|
"epoch": 11.0, |
|
"grad_norm": 0.7792600393295288, |
|
"learning_rate": 4.4500000000000004e-05, |
|
"loss": 0.1025, |
|
"step": 1166 |
|
}, |
|
{ |
|
"epoch": 11.0, |
|
"eval_LOCATION_f1": 0.8258064516129032, |
|
"eval_LOCATION_number": 69, |
|
"eval_LOCATION_precision": 0.7441860465116279, |
|
"eval_LOCATION_recall": 0.927536231884058, |
|
"eval_ORGANIZATION_f1": 0.7040000000000001, |
|
"eval_ORGANIZATION_number": 58, |
|
"eval_ORGANIZATION_precision": 0.6567164179104478, |
|
"eval_ORGANIZATION_recall": 0.7586206896551724, |
|
"eval_PERSON_f1": 0.8853503184713376, |
|
"eval_PERSON_number": 152, |
|
"eval_PERSON_precision": 0.8580246913580247, |
|
"eval_PERSON_recall": 0.9144736842105263, |
|
"eval_QUANTITY_f1": 0.64, |
|
"eval_QUANTITY_number": 30, |
|
"eval_QUANTITY_precision": 0.5333333333333333, |
|
"eval_QUANTITY_recall": 0.8, |
|
"eval_TIME_f1": 0.7741935483870968, |
|
"eval_TIME_number": 29, |
|
"eval_TIME_precision": 0.7272727272727273, |
|
"eval_TIME_recall": 0.8275862068965517, |
|
"eval_loss": 0.14459605515003204, |
|
"eval_overall_accuracy": 0.9551856594110115, |
|
"eval_overall_f1": 0.8071135430916553, |
|
"eval_overall_precision": 0.7506361323155216, |
|
"eval_overall_recall": 0.8727810650887574, |
|
"eval_runtime": 0.9057, |
|
"eval_samples_per_second": 206.46, |
|
"eval_steps_per_second": 3.312, |
|
"step": 1166 |
|
}, |
|
{ |
|
"epoch": 12.0, |
|
"grad_norm": 1.0304011106491089, |
|
"learning_rate": 4.4000000000000006e-05, |
|
"loss": 0.0969, |
|
"step": 1272 |
|
}, |
|
{ |
|
"epoch": 12.0, |
|
"eval_LOCATION_f1": 0.7973856209150327, |
|
"eval_LOCATION_number": 69, |
|
"eval_LOCATION_precision": 0.7261904761904762, |
|
"eval_LOCATION_recall": 0.8840579710144928, |
|
"eval_ORGANIZATION_f1": 0.6991869918699186, |
|
"eval_ORGANIZATION_number": 58, |
|
"eval_ORGANIZATION_precision": 0.6615384615384615, |
|
"eval_ORGANIZATION_recall": 0.7413793103448276, |
|
"eval_PERSON_f1": 0.8789808917197451, |
|
"eval_PERSON_number": 152, |
|
"eval_PERSON_precision": 0.8518518518518519, |
|
"eval_PERSON_recall": 0.9078947368421053, |
|
"eval_QUANTITY_f1": 0.7384615384615385, |
|
"eval_QUANTITY_number": 30, |
|
"eval_QUANTITY_precision": 0.6857142857142857, |
|
"eval_QUANTITY_recall": 0.8, |
|
"eval_TIME_f1": 0.7999999999999999, |
|
"eval_TIME_number": 29, |
|
"eval_TIME_precision": 0.7741935483870968, |
|
"eval_TIME_recall": 0.8275862068965517, |
|
"eval_loss": 0.1326281726360321, |
|
"eval_overall_accuracy": 0.9595390524967989, |
|
"eval_overall_f1": 0.8111888111888113, |
|
"eval_overall_precision": 0.7692307692307693, |
|
"eval_overall_recall": 0.8579881656804734, |
|
"eval_runtime": 0.875, |
|
"eval_samples_per_second": 213.704, |
|
"eval_steps_per_second": 3.428, |
|
"step": 1272 |
|
}, |
|
{ |
|
"epoch": 13.0, |
|
"grad_norm": 0.34425103664398193, |
|
"learning_rate": 4.35e-05, |
|
"loss": 0.0885, |
|
"step": 1378 |
|
}, |
|
{ |
|
"epoch": 13.0, |
|
"eval_LOCATION_f1": 0.821917808219178, |
|
"eval_LOCATION_number": 69, |
|
"eval_LOCATION_precision": 0.7792207792207793, |
|
"eval_LOCATION_recall": 0.8695652173913043, |
|
"eval_ORGANIZATION_f1": 0.7040000000000001, |
|
"eval_ORGANIZATION_number": 58, |
|
"eval_ORGANIZATION_precision": 0.6567164179104478, |
|
"eval_ORGANIZATION_recall": 0.7586206896551724, |
|
"eval_PERSON_f1": 0.888888888888889, |
|
"eval_PERSON_number": 152, |
|
"eval_PERSON_precision": 0.8588957055214724, |
|
"eval_PERSON_recall": 0.9210526315789473, |
|
"eval_QUANTITY_f1": 0.7936507936507938, |
|
"eval_QUANTITY_number": 30, |
|
"eval_QUANTITY_precision": 0.7575757575757576, |
|
"eval_QUANTITY_recall": 0.8333333333333334, |
|
"eval_TIME_f1": 0.8620689655172413, |
|
"eval_TIME_number": 29, |
|
"eval_TIME_precision": 0.8620689655172413, |
|
"eval_TIME_recall": 0.8620689655172413, |
|
"eval_loss": 0.11661401391029358, |
|
"eval_overall_accuracy": 0.9626120358514725, |
|
"eval_overall_f1": 0.8316831683168318, |
|
"eval_overall_precision": 0.7967479674796748, |
|
"eval_overall_recall": 0.8698224852071006, |
|
"eval_runtime": 0.8754, |
|
"eval_samples_per_second": 213.615, |
|
"eval_steps_per_second": 3.427, |
|
"step": 1378 |
|
}, |
|
{ |
|
"epoch": 14.0, |
|
"grad_norm": 1.0210072994232178, |
|
"learning_rate": 4.3e-05, |
|
"loss": 0.0897, |
|
"step": 1484 |
|
}, |
|
{ |
|
"epoch": 14.0, |
|
"eval_LOCATION_f1": 0.8322147651006713, |
|
"eval_LOCATION_number": 69, |
|
"eval_LOCATION_precision": 0.775, |
|
"eval_LOCATION_recall": 0.8985507246376812, |
|
"eval_ORGANIZATION_f1": 0.6825396825396826, |
|
"eval_ORGANIZATION_number": 58, |
|
"eval_ORGANIZATION_precision": 0.6323529411764706, |
|
"eval_ORGANIZATION_recall": 0.7413793103448276, |
|
"eval_PERSON_f1": 0.8734177215189874, |
|
"eval_PERSON_number": 152, |
|
"eval_PERSON_precision": 0.8414634146341463, |
|
"eval_PERSON_recall": 0.9078947368421053, |
|
"eval_QUANTITY_f1": 0.78125, |
|
"eval_QUANTITY_number": 30, |
|
"eval_QUANTITY_precision": 0.7352941176470589, |
|
"eval_QUANTITY_recall": 0.8333333333333334, |
|
"eval_TIME_f1": 0.7272727272727273, |
|
"eval_TIME_number": 29, |
|
"eval_TIME_precision": 0.6486486486486487, |
|
"eval_TIME_recall": 0.8275862068965517, |
|
"eval_loss": 0.1263030618429184, |
|
"eval_overall_accuracy": 0.9603072983354674, |
|
"eval_overall_f1": 0.8099861303744799, |
|
"eval_overall_precision": 0.762402088772846, |
|
"eval_overall_recall": 0.863905325443787, |
|
"eval_runtime": 0.9149, |
|
"eval_samples_per_second": 204.387, |
|
"eval_steps_per_second": 3.279, |
|
"step": 1484 |
|
}, |
|
{ |
|
"epoch": 15.0, |
|
"grad_norm": 0.7929083704948425, |
|
"learning_rate": 4.25e-05, |
|
"loss": 0.0847, |
|
"step": 1590 |
|
}, |
|
{ |
|
"epoch": 15.0, |
|
"eval_LOCATION_f1": 0.863013698630137, |
|
"eval_LOCATION_number": 69, |
|
"eval_LOCATION_precision": 0.8181818181818182, |
|
"eval_LOCATION_recall": 0.9130434782608695, |
|
"eval_ORGANIZATION_f1": 0.6721311475409836, |
|
"eval_ORGANIZATION_number": 58, |
|
"eval_ORGANIZATION_precision": 0.640625, |
|
"eval_ORGANIZATION_recall": 0.7068965517241379, |
|
"eval_PERSON_f1": 0.8789808917197451, |
|
"eval_PERSON_number": 152, |
|
"eval_PERSON_precision": 0.8518518518518519, |
|
"eval_PERSON_recall": 0.9078947368421053, |
|
"eval_QUANTITY_f1": 0.7058823529411765, |
|
"eval_QUANTITY_number": 30, |
|
"eval_QUANTITY_precision": 0.631578947368421, |
|
"eval_QUANTITY_recall": 0.8, |
|
"eval_TIME_f1": 0.75, |
|
"eval_TIME_number": 29, |
|
"eval_TIME_precision": 0.6857142857142857, |
|
"eval_TIME_recall": 0.8275862068965517, |
|
"eval_loss": 0.12834492325782776, |
|
"eval_overall_accuracy": 0.9592829705505762, |
|
"eval_overall_f1": 0.8123249299719889, |
|
"eval_overall_precision": 0.7712765957446809, |
|
"eval_overall_recall": 0.8579881656804734, |
|
"eval_runtime": 0.8739, |
|
"eval_samples_per_second": 213.989, |
|
"eval_steps_per_second": 3.433, |
|
"step": 1590 |
|
}, |
|
{ |
|
"epoch": 16.0, |
|
"grad_norm": 0.8108320236206055, |
|
"learning_rate": 4.2e-05, |
|
"loss": 0.0808, |
|
"step": 1696 |
|
}, |
|
{ |
|
"epoch": 16.0, |
|
"eval_LOCATION_f1": 0.8299319727891156, |
|
"eval_LOCATION_number": 69, |
|
"eval_LOCATION_precision": 0.782051282051282, |
|
"eval_LOCATION_recall": 0.8840579710144928, |
|
"eval_ORGANIZATION_f1": 0.7040000000000001, |
|
"eval_ORGANIZATION_number": 58, |
|
"eval_ORGANIZATION_precision": 0.6567164179104478, |
|
"eval_ORGANIZATION_recall": 0.7586206896551724, |
|
"eval_PERSON_f1": 0.8874598070739551, |
|
"eval_PERSON_number": 152, |
|
"eval_PERSON_precision": 0.8679245283018868, |
|
"eval_PERSON_recall": 0.9078947368421053, |
|
"eval_QUANTITY_f1": 0.761904761904762, |
|
"eval_QUANTITY_number": 30, |
|
"eval_QUANTITY_precision": 0.7272727272727273, |
|
"eval_QUANTITY_recall": 0.8, |
|
"eval_TIME_f1": 0.8196721311475409, |
|
"eval_TIME_number": 29, |
|
"eval_TIME_precision": 0.78125, |
|
"eval_TIME_recall": 0.8620689655172413, |
|
"eval_loss": 0.12765684723854065, |
|
"eval_overall_accuracy": 0.9623559539052496, |
|
"eval_overall_f1": 0.826025459688826, |
|
"eval_overall_precision": 0.7913279132791328, |
|
"eval_overall_recall": 0.863905325443787, |
|
"eval_runtime": 0.8873, |
|
"eval_samples_per_second": 210.758, |
|
"eval_steps_per_second": 3.381, |
|
"step": 1696 |
|
}, |
|
{ |
|
"epoch": 17.0, |
|
"grad_norm": 0.31881314516067505, |
|
"learning_rate": 4.15e-05, |
|
"loss": 0.0746, |
|
"step": 1802 |
|
}, |
|
{ |
|
"epoch": 17.0, |
|
"eval_LOCATION_f1": 0.8266666666666668, |
|
"eval_LOCATION_number": 69, |
|
"eval_LOCATION_precision": 0.7654320987654321, |
|
"eval_LOCATION_recall": 0.8985507246376812, |
|
"eval_ORGANIZATION_f1": 0.7086614173228347, |
|
"eval_ORGANIZATION_number": 58, |
|
"eval_ORGANIZATION_precision": 0.6521739130434783, |
|
"eval_ORGANIZATION_recall": 0.7758620689655172, |
|
"eval_PERSON_f1": 0.8874598070739551, |
|
"eval_PERSON_number": 152, |
|
"eval_PERSON_precision": 0.8679245283018868, |
|
"eval_PERSON_recall": 0.9078947368421053, |
|
"eval_QUANTITY_f1": 0.7384615384615385, |
|
"eval_QUANTITY_number": 30, |
|
"eval_QUANTITY_precision": 0.6857142857142857, |
|
"eval_QUANTITY_recall": 0.8, |
|
"eval_TIME_f1": 0.7999999999999999, |
|
"eval_TIME_number": 29, |
|
"eval_TIME_precision": 0.7741935483870968, |
|
"eval_TIME_recall": 0.8275862068965517, |
|
"eval_loss": 0.13274899125099182, |
|
"eval_overall_accuracy": 0.9592829705505762, |
|
"eval_overall_f1": 0.8218793828892006, |
|
"eval_overall_precision": 0.7813333333333333, |
|
"eval_overall_recall": 0.8668639053254438, |
|
"eval_runtime": 0.8878, |
|
"eval_samples_per_second": 210.626, |
|
"eval_steps_per_second": 3.379, |
|
"step": 1802 |
|
}, |
|
{ |
|
"epoch": 18.0, |
|
"grad_norm": 1.1737678050994873, |
|
"learning_rate": 4.1e-05, |
|
"loss": 0.0715, |
|
"step": 1908 |
|
}, |
|
{ |
|
"epoch": 18.0, |
|
"eval_LOCATION_f1": 0.8671328671328672, |
|
"eval_LOCATION_number": 69, |
|
"eval_LOCATION_precision": 0.8378378378378378, |
|
"eval_LOCATION_recall": 0.8985507246376812, |
|
"eval_ORGANIZATION_f1": 0.688, |
|
"eval_ORGANIZATION_number": 58, |
|
"eval_ORGANIZATION_precision": 0.6417910447761194, |
|
"eval_ORGANIZATION_recall": 0.7413793103448276, |
|
"eval_PERSON_f1": 0.8726114649681528, |
|
"eval_PERSON_number": 152, |
|
"eval_PERSON_precision": 0.845679012345679, |
|
"eval_PERSON_recall": 0.9013157894736842, |
|
"eval_QUANTITY_f1": 0.7500000000000001, |
|
"eval_QUANTITY_number": 30, |
|
"eval_QUANTITY_precision": 0.7058823529411765, |
|
"eval_QUANTITY_recall": 0.8, |
|
"eval_TIME_f1": 0.7999999999999999, |
|
"eval_TIME_number": 29, |
|
"eval_TIME_precision": 0.7741935483870968, |
|
"eval_TIME_recall": 0.8275862068965517, |
|
"eval_loss": 0.1314823478460312, |
|
"eval_overall_accuracy": 0.9595390524967989, |
|
"eval_overall_f1": 0.8215297450424929, |
|
"eval_overall_precision": 0.7880434782608695, |
|
"eval_overall_recall": 0.8579881656804734, |
|
"eval_runtime": 0.8811, |
|
"eval_samples_per_second": 212.231, |
|
"eval_steps_per_second": 3.405, |
|
"step": 1908 |
|
}, |
|
{ |
|
"epoch": 19.0, |
|
"grad_norm": 0.9921818971633911, |
|
"learning_rate": 4.05e-05, |
|
"loss": 0.0695, |
|
"step": 2014 |
|
}, |
|
{ |
|
"epoch": 19.0, |
|
"eval_LOCATION_f1": 0.8378378378378378, |
|
"eval_LOCATION_number": 69, |
|
"eval_LOCATION_precision": 0.7848101265822784, |
|
"eval_LOCATION_recall": 0.8985507246376812, |
|
"eval_ORGANIZATION_f1": 0.7213114754098361, |
|
"eval_ORGANIZATION_number": 58, |
|
"eval_ORGANIZATION_precision": 0.6875, |
|
"eval_ORGANIZATION_recall": 0.7586206896551724, |
|
"eval_PERSON_f1": 0.8753993610223643, |
|
"eval_PERSON_number": 152, |
|
"eval_PERSON_precision": 0.8509316770186336, |
|
"eval_PERSON_recall": 0.9013157894736842, |
|
"eval_QUANTITY_f1": 0.7164179104477612, |
|
"eval_QUANTITY_number": 30, |
|
"eval_QUANTITY_precision": 0.6486486486486487, |
|
"eval_QUANTITY_recall": 0.8, |
|
"eval_TIME_f1": 0.7936507936507937, |
|
"eval_TIME_number": 29, |
|
"eval_TIME_precision": 0.7352941176470589, |
|
"eval_TIME_recall": 0.8620689655172413, |
|
"eval_loss": 0.1310775727033615, |
|
"eval_overall_accuracy": 0.9582586427656851, |
|
"eval_overall_f1": 0.8190743338008415, |
|
"eval_overall_precision": 0.7786666666666666, |
|
"eval_overall_recall": 0.863905325443787, |
|
"eval_runtime": 0.8843, |
|
"eval_samples_per_second": 211.462, |
|
"eval_steps_per_second": 3.392, |
|
"step": 2014 |
|
}, |
|
{ |
|
"epoch": 20.0, |
|
"grad_norm": 0.8729901909828186, |
|
"learning_rate": 4e-05, |
|
"loss": 0.0705, |
|
"step": 2120 |
|
}, |
|
{ |
|
"epoch": 20.0, |
|
"eval_LOCATION_f1": 0.851063829787234, |
|
"eval_LOCATION_number": 69, |
|
"eval_LOCATION_precision": 0.8333333333333334, |
|
"eval_LOCATION_recall": 0.8695652173913043, |
|
"eval_ORGANIZATION_f1": 0.688, |
|
"eval_ORGANIZATION_number": 58, |
|
"eval_ORGANIZATION_precision": 0.6417910447761194, |
|
"eval_ORGANIZATION_recall": 0.7413793103448276, |
|
"eval_PERSON_f1": 0.8761904761904762, |
|
"eval_PERSON_number": 152, |
|
"eval_PERSON_precision": 0.8466257668711656, |
|
"eval_PERSON_recall": 0.9078947368421053, |
|
"eval_QUANTITY_f1": 0.7500000000000001, |
|
"eval_QUANTITY_number": 30, |
|
"eval_QUANTITY_precision": 0.7058823529411765, |
|
"eval_QUANTITY_recall": 0.8, |
|
"eval_TIME_f1": 0.847457627118644, |
|
"eval_TIME_number": 29, |
|
"eval_TIME_precision": 0.8333333333333334, |
|
"eval_TIME_recall": 0.8620689655172413, |
|
"eval_loss": 0.13000606000423431, |
|
"eval_overall_accuracy": 0.9597951344430218, |
|
"eval_overall_f1": 0.8238636363636365, |
|
"eval_overall_precision": 0.7923497267759563, |
|
"eval_overall_recall": 0.8579881656804734, |
|
"eval_runtime": 0.87, |
|
"eval_samples_per_second": 214.936, |
|
"eval_steps_per_second": 3.448, |
|
"step": 2120 |
|
}, |
|
{ |
|
"epoch": 21.0, |
|
"grad_norm": 0.5570505857467651, |
|
"learning_rate": 3.9500000000000005e-05, |
|
"loss": 0.0623, |
|
"step": 2226 |
|
}, |
|
{ |
|
"epoch": 21.0, |
|
"eval_LOCATION_f1": 0.8590604026845639, |
|
"eval_LOCATION_number": 69, |
|
"eval_LOCATION_precision": 0.8, |
|
"eval_LOCATION_recall": 0.927536231884058, |
|
"eval_ORGANIZATION_f1": 0.7076923076923076, |
|
"eval_ORGANIZATION_number": 58, |
|
"eval_ORGANIZATION_precision": 0.6388888888888888, |
|
"eval_ORGANIZATION_recall": 0.7931034482758621, |
|
"eval_PERSON_f1": 0.9061488673139159, |
|
"eval_PERSON_number": 152, |
|
"eval_PERSON_precision": 0.89171974522293, |
|
"eval_PERSON_recall": 0.9210526315789473, |
|
"eval_QUANTITY_f1": 0.7500000000000001, |
|
"eval_QUANTITY_number": 30, |
|
"eval_QUANTITY_precision": 0.7058823529411765, |
|
"eval_QUANTITY_recall": 0.8, |
|
"eval_TIME_f1": 0.7741935483870968, |
|
"eval_TIME_number": 29, |
|
"eval_TIME_precision": 0.7272727272727273, |
|
"eval_TIME_recall": 0.8275862068965517, |
|
"eval_loss": 0.14154018461704254, |
|
"eval_overall_accuracy": 0.9608194622279129, |
|
"eval_overall_f1": 0.8347338935574229, |
|
"eval_overall_precision": 0.7925531914893617, |
|
"eval_overall_recall": 0.8816568047337278, |
|
"eval_runtime": 0.892, |
|
"eval_samples_per_second": 209.65, |
|
"eval_steps_per_second": 3.363, |
|
"step": 2226 |
|
}, |
|
{ |
|
"epoch": 22.0, |
|
"grad_norm": 0.4297601878643036, |
|
"learning_rate": 3.9000000000000006e-05, |
|
"loss": 0.0636, |
|
"step": 2332 |
|
}, |
|
{ |
|
"epoch": 22.0, |
|
"eval_LOCATION_f1": 0.8366013071895425, |
|
"eval_LOCATION_number": 69, |
|
"eval_LOCATION_precision": 0.7619047619047619, |
|
"eval_LOCATION_recall": 0.927536231884058, |
|
"eval_ORGANIZATION_f1": 0.706766917293233, |
|
"eval_ORGANIZATION_number": 58, |
|
"eval_ORGANIZATION_precision": 0.6266666666666667, |
|
"eval_ORGANIZATION_recall": 0.8103448275862069, |
|
"eval_PERSON_f1": 0.8761904761904762, |
|
"eval_PERSON_number": 152, |
|
"eval_PERSON_precision": 0.8466257668711656, |
|
"eval_PERSON_recall": 0.9078947368421053, |
|
"eval_QUANTITY_f1": 0.7500000000000001, |
|
"eval_QUANTITY_number": 30, |
|
"eval_QUANTITY_precision": 0.7058823529411765, |
|
"eval_QUANTITY_recall": 0.8, |
|
"eval_TIME_f1": 0.7812500000000001, |
|
"eval_TIME_number": 29, |
|
"eval_TIME_precision": 0.7142857142857143, |
|
"eval_TIME_recall": 0.8620689655172413, |
|
"eval_loss": 0.14867202937602997, |
|
"eval_overall_accuracy": 0.9590268886043534, |
|
"eval_overall_f1": 0.8175582990397806, |
|
"eval_overall_precision": 0.7621483375959079, |
|
"eval_overall_recall": 0.8816568047337278, |
|
"eval_runtime": 0.8724, |
|
"eval_samples_per_second": 214.362, |
|
"eval_steps_per_second": 3.439, |
|
"step": 2332 |
|
}, |
|
{ |
|
"epoch": 23.0, |
|
"grad_norm": 0.4904947876930237, |
|
"learning_rate": 3.85e-05, |
|
"loss": 0.0571, |
|
"step": 2438 |
|
}, |
|
{ |
|
"epoch": 23.0, |
|
"eval_LOCATION_f1": 0.8591549295774648, |
|
"eval_LOCATION_number": 69, |
|
"eval_LOCATION_precision": 0.8356164383561644, |
|
"eval_LOCATION_recall": 0.8840579710144928, |
|
"eval_ORGANIZATION_f1": 0.7131782945736435, |
|
"eval_ORGANIZATION_number": 58, |
|
"eval_ORGANIZATION_precision": 0.647887323943662, |
|
"eval_ORGANIZATION_recall": 0.7931034482758621, |
|
"eval_PERSON_f1": 0.8774193548387097, |
|
"eval_PERSON_number": 152, |
|
"eval_PERSON_precision": 0.8607594936708861, |
|
"eval_PERSON_recall": 0.8947368421052632, |
|
"eval_QUANTITY_f1": 0.7500000000000001, |
|
"eval_QUANTITY_number": 30, |
|
"eval_QUANTITY_precision": 0.7058823529411765, |
|
"eval_QUANTITY_recall": 0.8, |
|
"eval_TIME_f1": 0.8333333333333334, |
|
"eval_TIME_number": 29, |
|
"eval_TIME_precision": 0.8064516129032258, |
|
"eval_TIME_recall": 0.8620689655172413, |
|
"eval_loss": 0.1371629238128662, |
|
"eval_overall_accuracy": 0.9603072983354674, |
|
"eval_overall_f1": 0.8283687943262411, |
|
"eval_overall_precision": 0.7956403269754768, |
|
"eval_overall_recall": 0.863905325443787, |
|
"eval_runtime": 0.8758, |
|
"eval_samples_per_second": 213.508, |
|
"eval_steps_per_second": 3.425, |
|
"step": 2438 |
|
}, |
|
{ |
|
"epoch": 24.0, |
|
"grad_norm": 0.8735907673835754, |
|
"learning_rate": 3.8e-05, |
|
"loss": 0.0574, |
|
"step": 2544 |
|
}, |
|
{ |
|
"epoch": 24.0, |
|
"eval_LOCATION_f1": 0.8551724137931034, |
|
"eval_LOCATION_number": 69, |
|
"eval_LOCATION_precision": 0.8157894736842105, |
|
"eval_LOCATION_recall": 0.8985507246376812, |
|
"eval_ORGANIZATION_f1": 0.696969696969697, |
|
"eval_ORGANIZATION_number": 58, |
|
"eval_ORGANIZATION_precision": 0.6216216216216216, |
|
"eval_ORGANIZATION_recall": 0.7931034482758621, |
|
"eval_PERSON_f1": 0.8881789137380192, |
|
"eval_PERSON_number": 152, |
|
"eval_PERSON_precision": 0.8633540372670807, |
|
"eval_PERSON_recall": 0.9144736842105263, |
|
"eval_QUANTITY_f1": 0.7500000000000001, |
|
"eval_QUANTITY_number": 30, |
|
"eval_QUANTITY_precision": 0.7058823529411765, |
|
"eval_QUANTITY_recall": 0.8, |
|
"eval_TIME_f1": 0.8275862068965517, |
|
"eval_TIME_number": 29, |
|
"eval_TIME_precision": 0.8275862068965517, |
|
"eval_TIME_recall": 0.8275862068965517, |
|
"eval_loss": 0.14183317124843597, |
|
"eval_overall_accuracy": 0.9626120358514725, |
|
"eval_overall_f1": 0.8286516853932584, |
|
"eval_overall_precision": 0.7887700534759359, |
|
"eval_overall_recall": 0.8727810650887574, |
|
"eval_runtime": 0.876, |
|
"eval_samples_per_second": 213.47, |
|
"eval_steps_per_second": 3.425, |
|
"step": 2544 |
|
}, |
|
{ |
|
"epoch": 25.0, |
|
"grad_norm": 0.4508860409259796, |
|
"learning_rate": 3.7500000000000003e-05, |
|
"loss": 0.0542, |
|
"step": 2650 |
|
}, |
|
{ |
|
"epoch": 25.0, |
|
"eval_LOCATION_f1": 0.8671328671328672, |
|
"eval_LOCATION_number": 69, |
|
"eval_LOCATION_precision": 0.8378378378378378, |
|
"eval_LOCATION_recall": 0.8985507246376812, |
|
"eval_ORGANIZATION_f1": 0.7272727272727273, |
|
"eval_ORGANIZATION_number": 58, |
|
"eval_ORGANIZATION_precision": 0.6984126984126984, |
|
"eval_ORGANIZATION_recall": 0.7586206896551724, |
|
"eval_PERSON_f1": 0.8817891373801917, |
|
"eval_PERSON_number": 152, |
|
"eval_PERSON_precision": 0.8571428571428571, |
|
"eval_PERSON_recall": 0.9078947368421053, |
|
"eval_QUANTITY_f1": 0.7500000000000001, |
|
"eval_QUANTITY_number": 30, |
|
"eval_QUANTITY_precision": 0.7058823529411765, |
|
"eval_QUANTITY_recall": 0.8, |
|
"eval_TIME_f1": 0.8813559322033899, |
|
"eval_TIME_number": 29, |
|
"eval_TIME_precision": 0.8666666666666667, |
|
"eval_TIME_recall": 0.896551724137931, |
|
"eval_loss": 0.13426989316940308, |
|
"eval_overall_accuracy": 0.9633802816901409, |
|
"eval_overall_f1": 0.84, |
|
"eval_overall_precision": 0.8121546961325967, |
|
"eval_overall_recall": 0.8698224852071006, |
|
"eval_runtime": 0.8752, |
|
"eval_samples_per_second": 213.654, |
|
"eval_steps_per_second": 3.428, |
|
"step": 2650 |
|
}, |
|
{ |
|
"epoch": 26.0, |
|
"grad_norm": 0.8999614715576172, |
|
"learning_rate": 3.7e-05, |
|
"loss": 0.0526, |
|
"step": 2756 |
|
}, |
|
{ |
|
"epoch": 26.0, |
|
"eval_LOCATION_f1": 0.8652482269503546, |
|
"eval_LOCATION_number": 69, |
|
"eval_LOCATION_precision": 0.8472222222222222, |
|
"eval_LOCATION_recall": 0.8840579710144928, |
|
"eval_ORGANIZATION_f1": 0.7540983606557378, |
|
"eval_ORGANIZATION_number": 58, |
|
"eval_ORGANIZATION_precision": 0.71875, |
|
"eval_ORGANIZATION_recall": 0.7931034482758621, |
|
"eval_PERSON_f1": 0.8789808917197451, |
|
"eval_PERSON_number": 152, |
|
"eval_PERSON_precision": 0.8518518518518519, |
|
"eval_PERSON_recall": 0.9078947368421053, |
|
"eval_QUANTITY_f1": 0.761904761904762, |
|
"eval_QUANTITY_number": 30, |
|
"eval_QUANTITY_precision": 0.7272727272727273, |
|
"eval_QUANTITY_recall": 0.8, |
|
"eval_TIME_f1": 0.847457627118644, |
|
"eval_TIME_number": 29, |
|
"eval_TIME_precision": 0.8333333333333334, |
|
"eval_TIME_recall": 0.8620689655172413, |
|
"eval_loss": 0.1440158635377884, |
|
"eval_overall_accuracy": 0.963124199743918, |
|
"eval_overall_f1": 0.8412017167381973, |
|
"eval_overall_precision": 0.814404432132964, |
|
"eval_overall_recall": 0.8698224852071006, |
|
"eval_runtime": 0.8876, |
|
"eval_samples_per_second": 210.689, |
|
"eval_steps_per_second": 3.38, |
|
"step": 2756 |
|
}, |
|
{ |
|
"epoch": 27.0, |
|
"grad_norm": 0.6169599890708923, |
|
"learning_rate": 3.65e-05, |
|
"loss": 0.0477, |
|
"step": 2862 |
|
}, |
|
{ |
|
"epoch": 27.0, |
|
"eval_LOCATION_f1": 0.863013698630137, |
|
"eval_LOCATION_number": 69, |
|
"eval_LOCATION_precision": 0.8181818181818182, |
|
"eval_LOCATION_recall": 0.9130434782608695, |
|
"eval_ORGANIZATION_f1": 0.7142857142857142, |
|
"eval_ORGANIZATION_number": 58, |
|
"eval_ORGANIZATION_precision": 0.6617647058823529, |
|
"eval_ORGANIZATION_recall": 0.7758620689655172, |
|
"eval_PERSON_f1": 0.8662420382165605, |
|
"eval_PERSON_number": 152, |
|
"eval_PERSON_precision": 0.8395061728395061, |
|
"eval_PERSON_recall": 0.8947368421052632, |
|
"eval_QUANTITY_f1": 0.7500000000000001, |
|
"eval_QUANTITY_number": 30, |
|
"eval_QUANTITY_precision": 0.7058823529411765, |
|
"eval_QUANTITY_recall": 0.8, |
|
"eval_TIME_f1": 0.8196721311475409, |
|
"eval_TIME_number": 29, |
|
"eval_TIME_precision": 0.78125, |
|
"eval_TIME_recall": 0.8620689655172413, |
|
"eval_loss": 0.16048064827919006, |
|
"eval_overall_accuracy": 0.9592829705505762, |
|
"eval_overall_f1": 0.8241912798874824, |
|
"eval_overall_precision": 0.7855227882037533, |
|
"eval_overall_recall": 0.8668639053254438, |
|
"eval_runtime": 0.8784, |
|
"eval_samples_per_second": 212.876, |
|
"eval_steps_per_second": 3.415, |
|
"step": 2862 |
|
}, |
|
{ |
|
"epoch": 28.0, |
|
"grad_norm": 0.5325952768325806, |
|
"learning_rate": 3.6e-05, |
|
"loss": 0.048, |
|
"step": 2968 |
|
}, |
|
{ |
|
"epoch": 28.0, |
|
"eval_LOCATION_f1": 0.8671328671328672, |
|
"eval_LOCATION_number": 69, |
|
"eval_LOCATION_precision": 0.8378378378378378, |
|
"eval_LOCATION_recall": 0.8985507246376812, |
|
"eval_ORGANIZATION_f1": 0.7086614173228347, |
|
"eval_ORGANIZATION_number": 58, |
|
"eval_ORGANIZATION_precision": 0.6521739130434783, |
|
"eval_ORGANIZATION_recall": 0.7758620689655172, |
|
"eval_PERSON_f1": 0.8846153846153847, |
|
"eval_PERSON_number": 152, |
|
"eval_PERSON_precision": 0.8625, |
|
"eval_PERSON_recall": 0.9078947368421053, |
|
"eval_QUANTITY_f1": 0.7500000000000001, |
|
"eval_QUANTITY_number": 30, |
|
"eval_QUANTITY_precision": 0.7058823529411765, |
|
"eval_QUANTITY_recall": 0.8, |
|
"eval_TIME_f1": 0.7999999999999999, |
|
"eval_TIME_number": 29, |
|
"eval_TIME_precision": 0.7741935483870968, |
|
"eval_TIME_recall": 0.8275862068965517, |
|
"eval_loss": 0.1558757722377777, |
|
"eval_overall_accuracy": 0.9580025608194622, |
|
"eval_overall_f1": 0.830028328611898, |
|
"eval_overall_precision": 0.7961956521739131, |
|
"eval_overall_recall": 0.8668639053254438, |
|
"eval_runtime": 0.8788, |
|
"eval_samples_per_second": 212.794, |
|
"eval_steps_per_second": 3.414, |
|
"step": 2968 |
|
}, |
|
{ |
|
"epoch": 29.0, |
|
"grad_norm": 0.5985626578330994, |
|
"learning_rate": 3.55e-05, |
|
"loss": 0.0481, |
|
"step": 3074 |
|
}, |
|
{ |
|
"epoch": 29.0, |
|
"eval_LOCATION_f1": 0.8648648648648648, |
|
"eval_LOCATION_number": 69, |
|
"eval_LOCATION_precision": 0.810126582278481, |
|
"eval_LOCATION_recall": 0.927536231884058, |
|
"eval_ORGANIZATION_f1": 0.7007299270072993, |
|
"eval_ORGANIZATION_number": 58, |
|
"eval_ORGANIZATION_precision": 0.6075949367088608, |
|
"eval_ORGANIZATION_recall": 0.8275862068965517, |
|
"eval_PERSON_f1": 0.8846153846153847, |
|
"eval_PERSON_number": 152, |
|
"eval_PERSON_precision": 0.8625, |
|
"eval_PERSON_recall": 0.9078947368421053, |
|
"eval_QUANTITY_f1": 0.7500000000000001, |
|
"eval_QUANTITY_number": 30, |
|
"eval_QUANTITY_precision": 0.7058823529411765, |
|
"eval_QUANTITY_recall": 0.8, |
|
"eval_TIME_f1": 0.8196721311475409, |
|
"eval_TIME_number": 29, |
|
"eval_TIME_precision": 0.78125, |
|
"eval_TIME_recall": 0.8620689655172413, |
|
"eval_loss": 0.15555179119110107, |
|
"eval_overall_accuracy": 0.9595390524967989, |
|
"eval_overall_f1": 0.8282548476454293, |
|
"eval_overall_precision": 0.7786458333333334, |
|
"eval_overall_recall": 0.8846153846153846, |
|
"eval_runtime": 0.8856, |
|
"eval_samples_per_second": 211.154, |
|
"eval_steps_per_second": 3.387, |
|
"step": 3074 |
|
}, |
|
{ |
|
"epoch": 30.0, |
|
"grad_norm": 0.8177056908607483, |
|
"learning_rate": 3.5e-05, |
|
"loss": 0.045, |
|
"step": 3180 |
|
}, |
|
{ |
|
"epoch": 30.0, |
|
"eval_LOCATION_f1": 0.8648648648648648, |
|
"eval_LOCATION_number": 69, |
|
"eval_LOCATION_precision": 0.810126582278481, |
|
"eval_LOCATION_recall": 0.927536231884058, |
|
"eval_ORGANIZATION_f1": 0.7068965517241379, |
|
"eval_ORGANIZATION_number": 58, |
|
"eval_ORGANIZATION_precision": 0.7068965517241379, |
|
"eval_ORGANIZATION_recall": 0.7068965517241379, |
|
"eval_PERSON_f1": 0.8789808917197451, |
|
"eval_PERSON_number": 152, |
|
"eval_PERSON_precision": 0.8518518518518519, |
|
"eval_PERSON_recall": 0.9078947368421053, |
|
"eval_QUANTITY_f1": 0.761904761904762, |
|
"eval_QUANTITY_number": 30, |
|
"eval_QUANTITY_precision": 0.7272727272727273, |
|
"eval_QUANTITY_recall": 0.8, |
|
"eval_TIME_f1": 0.847457627118644, |
|
"eval_TIME_number": 29, |
|
"eval_TIME_precision": 0.8333333333333334, |
|
"eval_TIME_recall": 0.8620689655172413, |
|
"eval_loss": 0.1506585329771042, |
|
"eval_overall_accuracy": 0.9620998719590269, |
|
"eval_overall_f1": 0.8342857142857144, |
|
"eval_overall_precision": 0.8066298342541437, |
|
"eval_overall_recall": 0.863905325443787, |
|
"eval_runtime": 0.8833, |
|
"eval_samples_per_second": 211.711, |
|
"eval_steps_per_second": 3.396, |
|
"step": 3180 |
|
}, |
|
{ |
|
"epoch": 31.0, |
|
"grad_norm": 0.42287537455558777, |
|
"learning_rate": 3.45e-05, |
|
"loss": 0.0445, |
|
"step": 3286 |
|
}, |
|
{ |
|
"epoch": 31.0, |
|
"eval_LOCATION_f1": 0.8590604026845639, |
|
"eval_LOCATION_number": 69, |
|
"eval_LOCATION_precision": 0.8, |
|
"eval_LOCATION_recall": 0.927536231884058, |
|
"eval_ORGANIZATION_f1": 0.7343749999999999, |
|
"eval_ORGANIZATION_number": 58, |
|
"eval_ORGANIZATION_precision": 0.6714285714285714, |
|
"eval_ORGANIZATION_recall": 0.8103448275862069, |
|
"eval_PERSON_f1": 0.8874598070739551, |
|
"eval_PERSON_number": 152, |
|
"eval_PERSON_precision": 0.8679245283018868, |
|
"eval_PERSON_recall": 0.9078947368421053, |
|
"eval_QUANTITY_f1": 0.7500000000000001, |
|
"eval_QUANTITY_number": 30, |
|
"eval_QUANTITY_precision": 0.7058823529411765, |
|
"eval_QUANTITY_recall": 0.8, |
|
"eval_TIME_f1": 0.7868852459016394, |
|
"eval_TIME_number": 29, |
|
"eval_TIME_precision": 0.75, |
|
"eval_TIME_recall": 0.8275862068965517, |
|
"eval_loss": 0.15119028091430664, |
|
"eval_overall_accuracy": 0.9618437900128041, |
|
"eval_overall_f1": 0.8330995792426368, |
|
"eval_overall_precision": 0.792, |
|
"eval_overall_recall": 0.878698224852071, |
|
"eval_runtime": 0.8769, |
|
"eval_samples_per_second": 213.246, |
|
"eval_steps_per_second": 3.421, |
|
"step": 3286 |
|
}, |
|
{ |
|
"epoch": 32.0, |
|
"grad_norm": 0.3716237246990204, |
|
"learning_rate": 3.4000000000000007e-05, |
|
"loss": 0.042, |
|
"step": 3392 |
|
}, |
|
{ |
|
"epoch": 32.0, |
|
"eval_LOCATION_f1": 0.863013698630137, |
|
"eval_LOCATION_number": 69, |
|
"eval_LOCATION_precision": 0.8181818181818182, |
|
"eval_LOCATION_recall": 0.9130434782608695, |
|
"eval_ORGANIZATION_f1": 0.716417910447761, |
|
"eval_ORGANIZATION_number": 58, |
|
"eval_ORGANIZATION_precision": 0.631578947368421, |
|
"eval_ORGANIZATION_recall": 0.8275862068965517, |
|
"eval_PERSON_f1": 0.877742946708464, |
|
"eval_PERSON_number": 152, |
|
"eval_PERSON_precision": 0.8383233532934131, |
|
"eval_PERSON_recall": 0.9210526315789473, |
|
"eval_QUANTITY_f1": 0.78125, |
|
"eval_QUANTITY_number": 30, |
|
"eval_QUANTITY_precision": 0.7352941176470589, |
|
"eval_QUANTITY_recall": 0.8333333333333334, |
|
"eval_TIME_f1": 0.8064516129032258, |
|
"eval_TIME_number": 29, |
|
"eval_TIME_precision": 0.7575757575757576, |
|
"eval_TIME_recall": 0.8620689655172413, |
|
"eval_loss": 0.1590593457221985, |
|
"eval_overall_accuracy": 0.9595390524967989, |
|
"eval_overall_f1": 0.8303448275862069, |
|
"eval_overall_precision": 0.7777777777777778, |
|
"eval_overall_recall": 0.8905325443786982, |
|
"eval_runtime": 0.8744, |
|
"eval_samples_per_second": 213.872, |
|
"eval_steps_per_second": 3.431, |
|
"step": 3392 |
|
}, |
|
{ |
|
"epoch": 33.0, |
|
"grad_norm": 0.18944571912288666, |
|
"learning_rate": 3.35e-05, |
|
"loss": 0.0394, |
|
"step": 3498 |
|
}, |
|
{ |
|
"epoch": 33.0, |
|
"eval_LOCATION_f1": 0.8611111111111112, |
|
"eval_LOCATION_number": 69, |
|
"eval_LOCATION_precision": 0.8266666666666667, |
|
"eval_LOCATION_recall": 0.8985507246376812, |
|
"eval_ORGANIZATION_f1": 0.7040000000000001, |
|
"eval_ORGANIZATION_number": 58, |
|
"eval_ORGANIZATION_precision": 0.6567164179104478, |
|
"eval_ORGANIZATION_recall": 0.7586206896551724, |
|
"eval_PERSON_f1": 0.8853503184713376, |
|
"eval_PERSON_number": 152, |
|
"eval_PERSON_precision": 0.8580246913580247, |
|
"eval_PERSON_recall": 0.9144736842105263, |
|
"eval_QUANTITY_f1": 0.7500000000000001, |
|
"eval_QUANTITY_number": 30, |
|
"eval_QUANTITY_precision": 0.7058823529411765, |
|
"eval_QUANTITY_recall": 0.8, |
|
"eval_TIME_f1": 0.7868852459016394, |
|
"eval_TIME_number": 29, |
|
"eval_TIME_precision": 0.75, |
|
"eval_TIME_recall": 0.8275862068965517, |
|
"eval_loss": 0.1586446911096573, |
|
"eval_overall_accuracy": 0.9603072983354674, |
|
"eval_overall_f1": 0.8276836158192091, |
|
"eval_overall_precision": 0.7918918918918919, |
|
"eval_overall_recall": 0.8668639053254438, |
|
"eval_runtime": 0.8776, |
|
"eval_samples_per_second": 213.07, |
|
"eval_steps_per_second": 3.418, |
|
"step": 3498 |
|
}, |
|
{ |
|
"epoch": 34.0, |
|
"grad_norm": 1.3505786657333374, |
|
"learning_rate": 3.3e-05, |
|
"loss": 0.0378, |
|
"step": 3604 |
|
}, |
|
{ |
|
"epoch": 34.0, |
|
"eval_LOCATION_f1": 0.8571428571428572, |
|
"eval_LOCATION_number": 69, |
|
"eval_LOCATION_precision": 0.8076923076923077, |
|
"eval_LOCATION_recall": 0.9130434782608695, |
|
"eval_ORGANIZATION_f1": 0.7131782945736435, |
|
"eval_ORGANIZATION_number": 58, |
|
"eval_ORGANIZATION_precision": 0.647887323943662, |
|
"eval_ORGANIZATION_recall": 0.7931034482758621, |
|
"eval_PERSON_f1": 0.8789808917197451, |
|
"eval_PERSON_number": 152, |
|
"eval_PERSON_precision": 0.8518518518518519, |
|
"eval_PERSON_recall": 0.9078947368421053, |
|
"eval_QUANTITY_f1": 0.7500000000000001, |
|
"eval_QUANTITY_number": 30, |
|
"eval_QUANTITY_precision": 0.7058823529411765, |
|
"eval_QUANTITY_recall": 0.8, |
|
"eval_TIME_f1": 0.8333333333333334, |
|
"eval_TIME_number": 29, |
|
"eval_TIME_precision": 0.8064516129032258, |
|
"eval_TIME_recall": 0.8620689655172413, |
|
"eval_loss": 0.15407726168632507, |
|
"eval_overall_accuracy": 0.9618437900128041, |
|
"eval_overall_f1": 0.8291316526610645, |
|
"eval_overall_precision": 0.7872340425531915, |
|
"eval_overall_recall": 0.8757396449704142, |
|
"eval_runtime": 0.8762, |
|
"eval_samples_per_second": 213.42, |
|
"eval_steps_per_second": 3.424, |
|
"step": 3604 |
|
}, |
|
{ |
|
"epoch": 35.0, |
|
"grad_norm": 0.631050705909729, |
|
"learning_rate": 3.2500000000000004e-05, |
|
"loss": 0.0375, |
|
"step": 3710 |
|
}, |
|
{ |
|
"epoch": 35.0, |
|
"eval_LOCATION_f1": 0.8571428571428572, |
|
"eval_LOCATION_number": 69, |
|
"eval_LOCATION_precision": 0.8076923076923077, |
|
"eval_LOCATION_recall": 0.9130434782608695, |
|
"eval_ORGANIZATION_f1": 0.6725663716814159, |
|
"eval_ORGANIZATION_number": 58, |
|
"eval_ORGANIZATION_precision": 0.6909090909090909, |
|
"eval_ORGANIZATION_recall": 0.6551724137931034, |
|
"eval_PERSON_f1": 0.8945686900958467, |
|
"eval_PERSON_number": 152, |
|
"eval_PERSON_precision": 0.8695652173913043, |
|
"eval_PERSON_recall": 0.9210526315789473, |
|
"eval_QUANTITY_f1": 0.7692307692307692, |
|
"eval_QUANTITY_number": 30, |
|
"eval_QUANTITY_precision": 0.7142857142857143, |
|
"eval_QUANTITY_recall": 0.8333333333333334, |
|
"eval_TIME_f1": 0.7999999999999999, |
|
"eval_TIME_number": 29, |
|
"eval_TIME_precision": 0.7741935483870968, |
|
"eval_TIME_recall": 0.8275862068965517, |
|
"eval_loss": 0.15462984144687653, |
|
"eval_overall_accuracy": 0.9626120358514725, |
|
"eval_overall_f1": 0.8309455587392551, |
|
"eval_overall_precision": 0.8055555555555556, |
|
"eval_overall_recall": 0.8579881656804734, |
|
"eval_runtime": 0.8693, |
|
"eval_samples_per_second": 215.126, |
|
"eval_steps_per_second": 3.451, |
|
"step": 3710 |
|
}, |
|
{ |
|
"epoch": 36.0, |
|
"grad_norm": 0.13165172934532166, |
|
"learning_rate": 3.2000000000000005e-05, |
|
"loss": 0.0384, |
|
"step": 3816 |
|
}, |
|
{ |
|
"epoch": 36.0, |
|
"eval_LOCATION_f1": 0.8749999999999999, |
|
"eval_LOCATION_number": 69, |
|
"eval_LOCATION_precision": 0.84, |
|
"eval_LOCATION_recall": 0.9130434782608695, |
|
"eval_ORGANIZATION_f1": 0.71875, |
|
"eval_ORGANIZATION_number": 58, |
|
"eval_ORGANIZATION_precision": 0.6571428571428571, |
|
"eval_ORGANIZATION_recall": 0.7931034482758621, |
|
"eval_PERSON_f1": 0.896774193548387, |
|
"eval_PERSON_number": 152, |
|
"eval_PERSON_precision": 0.879746835443038, |
|
"eval_PERSON_recall": 0.9144736842105263, |
|
"eval_QUANTITY_f1": 0.761904761904762, |
|
"eval_QUANTITY_number": 30, |
|
"eval_QUANTITY_precision": 0.7272727272727273, |
|
"eval_QUANTITY_recall": 0.8, |
|
"eval_TIME_f1": 0.847457627118644, |
|
"eval_TIME_number": 29, |
|
"eval_TIME_precision": 0.8333333333333334, |
|
"eval_TIME_recall": 0.8620689655172413, |
|
"eval_loss": 0.16041359305381775, |
|
"eval_overall_accuracy": 0.9623559539052496, |
|
"eval_overall_f1": 0.84375, |
|
"eval_overall_precision": 0.8114754098360656, |
|
"eval_overall_recall": 0.878698224852071, |
|
"eval_runtime": 0.8806, |
|
"eval_samples_per_second": 212.356, |
|
"eval_steps_per_second": 3.407, |
|
"step": 3816 |
|
}, |
|
{ |
|
"epoch": 37.0, |
|
"grad_norm": 0.39163538813591003, |
|
"learning_rate": 3.15e-05, |
|
"loss": 0.0337, |
|
"step": 3922 |
|
}, |
|
{ |
|
"epoch": 37.0, |
|
"eval_LOCATION_f1": 0.870748299319728, |
|
"eval_LOCATION_number": 69, |
|
"eval_LOCATION_precision": 0.8205128205128205, |
|
"eval_LOCATION_recall": 0.927536231884058, |
|
"eval_ORGANIZATION_f1": 0.7166666666666668, |
|
"eval_ORGANIZATION_number": 58, |
|
"eval_ORGANIZATION_precision": 0.6935483870967742, |
|
"eval_ORGANIZATION_recall": 0.7413793103448276, |
|
"eval_PERSON_f1": 0.8789808917197451, |
|
"eval_PERSON_number": 152, |
|
"eval_PERSON_precision": 0.8518518518518519, |
|
"eval_PERSON_recall": 0.9078947368421053, |
|
"eval_QUANTITY_f1": 0.78125, |
|
"eval_QUANTITY_number": 30, |
|
"eval_QUANTITY_precision": 0.7352941176470589, |
|
"eval_QUANTITY_recall": 0.8333333333333334, |
|
"eval_TIME_f1": 0.896551724137931, |
|
"eval_TIME_number": 29, |
|
"eval_TIME_precision": 0.896551724137931, |
|
"eval_TIME_recall": 0.896551724137931, |
|
"eval_loss": 0.16409936547279358, |
|
"eval_overall_accuracy": 0.9623559539052496, |
|
"eval_overall_f1": 0.8421052631578948, |
|
"eval_overall_precision": 0.810958904109589, |
|
"eval_overall_recall": 0.8757396449704142, |
|
"eval_runtime": 0.8782, |
|
"eval_samples_per_second": 212.924, |
|
"eval_steps_per_second": 3.416, |
|
"step": 3922 |
|
}, |
|
{ |
|
"epoch": 38.0, |
|
"grad_norm": 1.8893556594848633, |
|
"learning_rate": 3.1e-05, |
|
"loss": 0.0327, |
|
"step": 4028 |
|
}, |
|
{ |
|
"epoch": 38.0, |
|
"eval_LOCATION_f1": 0.8571428571428572, |
|
"eval_LOCATION_number": 69, |
|
"eval_LOCATION_precision": 0.8076923076923077, |
|
"eval_LOCATION_recall": 0.9130434782608695, |
|
"eval_ORGANIZATION_f1": 0.7258064516129032, |
|
"eval_ORGANIZATION_number": 58, |
|
"eval_ORGANIZATION_precision": 0.6818181818181818, |
|
"eval_ORGANIZATION_recall": 0.7758620689655172, |
|
"eval_PERSON_f1": 0.8810289389067525, |
|
"eval_PERSON_number": 152, |
|
"eval_PERSON_precision": 0.8616352201257862, |
|
"eval_PERSON_recall": 0.9013157894736842, |
|
"eval_QUANTITY_f1": 0.78125, |
|
"eval_QUANTITY_number": 30, |
|
"eval_QUANTITY_precision": 0.7352941176470589, |
|
"eval_QUANTITY_recall": 0.8333333333333334, |
|
"eval_TIME_f1": 0.7868852459016394, |
|
"eval_TIME_number": 29, |
|
"eval_TIME_precision": 0.75, |
|
"eval_TIME_recall": 0.8275862068965517, |
|
"eval_loss": 0.1764567792415619, |
|
"eval_overall_accuracy": 0.9600512163892445, |
|
"eval_overall_f1": 0.8316831683168318, |
|
"eval_overall_precision": 0.7967479674796748, |
|
"eval_overall_recall": 0.8698224852071006, |
|
"eval_runtime": 0.8812, |
|
"eval_samples_per_second": 212.213, |
|
"eval_steps_per_second": 3.404, |
|
"step": 4028 |
|
}, |
|
{ |
|
"epoch": 39.0, |
|
"grad_norm": 1.0850064754486084, |
|
"learning_rate": 3.05e-05, |
|
"loss": 0.033, |
|
"step": 4134 |
|
}, |
|
{ |
|
"epoch": 39.0, |
|
"eval_LOCATION_f1": 0.8611111111111112, |
|
"eval_LOCATION_number": 69, |
|
"eval_LOCATION_precision": 0.8266666666666667, |
|
"eval_LOCATION_recall": 0.8985507246376812, |
|
"eval_ORGANIZATION_f1": 0.7258064516129032, |
|
"eval_ORGANIZATION_number": 58, |
|
"eval_ORGANIZATION_precision": 0.6818181818181818, |
|
"eval_ORGANIZATION_recall": 0.7758620689655172, |
|
"eval_PERSON_f1": 0.8810289389067525, |
|
"eval_PERSON_number": 152, |
|
"eval_PERSON_precision": 0.8616352201257862, |
|
"eval_PERSON_recall": 0.9013157894736842, |
|
"eval_QUANTITY_f1": 0.78125, |
|
"eval_QUANTITY_number": 30, |
|
"eval_QUANTITY_precision": 0.7352941176470589, |
|
"eval_QUANTITY_recall": 0.8333333333333334, |
|
"eval_TIME_f1": 0.7868852459016394, |
|
"eval_TIME_number": 29, |
|
"eval_TIME_precision": 0.75, |
|
"eval_TIME_recall": 0.8275862068965517, |
|
"eval_loss": 0.16998325288295746, |
|
"eval_overall_accuracy": 0.9600512163892445, |
|
"eval_overall_f1": 0.8323863636363636, |
|
"eval_overall_precision": 0.8005464480874317, |
|
"eval_overall_recall": 0.8668639053254438, |
|
"eval_runtime": 0.8888, |
|
"eval_samples_per_second": 210.391, |
|
"eval_steps_per_second": 3.375, |
|
"step": 4134 |
|
}, |
|
{ |
|
"epoch": 40.0, |
|
"grad_norm": 0.8192635774612427, |
|
"learning_rate": 3e-05, |
|
"loss": 0.0333, |
|
"step": 4240 |
|
}, |
|
{ |
|
"epoch": 40.0, |
|
"eval_LOCATION_f1": 0.8493150684931507, |
|
"eval_LOCATION_number": 69, |
|
"eval_LOCATION_precision": 0.8051948051948052, |
|
"eval_LOCATION_recall": 0.8985507246376812, |
|
"eval_ORGANIZATION_f1": 0.7200000000000001, |
|
"eval_ORGANIZATION_number": 58, |
|
"eval_ORGANIZATION_precision": 0.6716417910447762, |
|
"eval_ORGANIZATION_recall": 0.7758620689655172, |
|
"eval_PERSON_f1": 0.8810289389067525, |
|
"eval_PERSON_number": 152, |
|
"eval_PERSON_precision": 0.8616352201257862, |
|
"eval_PERSON_recall": 0.9013157894736842, |
|
"eval_QUANTITY_f1": 0.7936507936507938, |
|
"eval_QUANTITY_number": 30, |
|
"eval_QUANTITY_precision": 0.7575757575757576, |
|
"eval_QUANTITY_recall": 0.8333333333333334, |
|
"eval_TIME_f1": 0.7999999999999999, |
|
"eval_TIME_number": 29, |
|
"eval_TIME_precision": 0.7741935483870968, |
|
"eval_TIME_recall": 0.8275862068965517, |
|
"eval_loss": 0.17454804480075836, |
|
"eval_overall_accuracy": 0.9600512163892445, |
|
"eval_overall_f1": 0.8312056737588652, |
|
"eval_overall_precision": 0.7983651226158038, |
|
"eval_overall_recall": 0.8668639053254438, |
|
"eval_runtime": 0.8709, |
|
"eval_samples_per_second": 214.732, |
|
"eval_steps_per_second": 3.445, |
|
"step": 4240 |
|
}, |
|
{ |
|
"epoch": 41.0, |
|
"grad_norm": 1.14230477809906, |
|
"learning_rate": 2.95e-05, |
|
"loss": 0.0296, |
|
"step": 4346 |
|
}, |
|
{ |
|
"epoch": 41.0, |
|
"eval_LOCATION_f1": 0.851063829787234, |
|
"eval_LOCATION_number": 69, |
|
"eval_LOCATION_precision": 0.8333333333333334, |
|
"eval_LOCATION_recall": 0.8695652173913043, |
|
"eval_ORGANIZATION_f1": 0.7086614173228347, |
|
"eval_ORGANIZATION_number": 58, |
|
"eval_ORGANIZATION_precision": 0.6521739130434783, |
|
"eval_ORGANIZATION_recall": 0.7758620689655172, |
|
"eval_PERSON_f1": 0.8662420382165605, |
|
"eval_PERSON_number": 152, |
|
"eval_PERSON_precision": 0.8395061728395061, |
|
"eval_PERSON_recall": 0.8947368421052632, |
|
"eval_QUANTITY_f1": 0.7936507936507938, |
|
"eval_QUANTITY_number": 30, |
|
"eval_QUANTITY_precision": 0.7575757575757576, |
|
"eval_QUANTITY_recall": 0.8333333333333334, |
|
"eval_TIME_f1": 0.8666666666666666, |
|
"eval_TIME_number": 29, |
|
"eval_TIME_precision": 0.8387096774193549, |
|
"eval_TIME_recall": 0.896551724137931, |
|
"eval_loss": 0.17790456116199493, |
|
"eval_overall_accuracy": 0.9613316261203585, |
|
"eval_overall_f1": 0.8283687943262411, |
|
"eval_overall_precision": 0.7956403269754768, |
|
"eval_overall_recall": 0.863905325443787, |
|
"eval_runtime": 0.8959, |
|
"eval_samples_per_second": 208.739, |
|
"eval_steps_per_second": 3.349, |
|
"step": 4346 |
|
}, |
|
{ |
|
"epoch": 42.0, |
|
"grad_norm": 1.1531621217727661, |
|
"learning_rate": 2.9e-05, |
|
"loss": 0.0305, |
|
"step": 4452 |
|
}, |
|
{ |
|
"epoch": 42.0, |
|
"eval_LOCATION_f1": 0.851063829787234, |
|
"eval_LOCATION_number": 69, |
|
"eval_LOCATION_precision": 0.8333333333333334, |
|
"eval_LOCATION_recall": 0.8695652173913043, |
|
"eval_ORGANIZATION_f1": 0.6666666666666667, |
|
"eval_ORGANIZATION_number": 58, |
|
"eval_ORGANIZATION_precision": 0.6176470588235294, |
|
"eval_ORGANIZATION_recall": 0.7241379310344828, |
|
"eval_PERSON_f1": 0.8874598070739551, |
|
"eval_PERSON_number": 152, |
|
"eval_PERSON_precision": 0.8679245283018868, |
|
"eval_PERSON_recall": 0.9078947368421053, |
|
"eval_QUANTITY_f1": 0.7936507936507938, |
|
"eval_QUANTITY_number": 30, |
|
"eval_QUANTITY_precision": 0.7575757575757576, |
|
"eval_QUANTITY_recall": 0.8333333333333334, |
|
"eval_TIME_f1": 0.8620689655172413, |
|
"eval_TIME_number": 29, |
|
"eval_TIME_precision": 0.8620689655172413, |
|
"eval_TIME_recall": 0.8620689655172413, |
|
"eval_loss": 0.1733568161725998, |
|
"eval_overall_accuracy": 0.9618437900128041, |
|
"eval_overall_f1": 0.8297567954220315, |
|
"eval_overall_precision": 0.8033240997229917, |
|
"eval_overall_recall": 0.8579881656804734, |
|
"eval_runtime": 0.8898, |
|
"eval_samples_per_second": 210.16, |
|
"eval_steps_per_second": 3.372, |
|
"step": 4452 |
|
}, |
|
{ |
|
"epoch": 43.0, |
|
"grad_norm": 0.12765854597091675, |
|
"learning_rate": 2.8499999999999998e-05, |
|
"loss": 0.029, |
|
"step": 4558 |
|
}, |
|
{ |
|
"epoch": 43.0, |
|
"eval_LOCATION_f1": 0.8591549295774648, |
|
"eval_LOCATION_number": 69, |
|
"eval_LOCATION_precision": 0.8356164383561644, |
|
"eval_LOCATION_recall": 0.8840579710144928, |
|
"eval_ORGANIZATION_f1": 0.7401574803149606, |
|
"eval_ORGANIZATION_number": 58, |
|
"eval_ORGANIZATION_precision": 0.6811594202898551, |
|
"eval_ORGANIZATION_recall": 0.8103448275862069, |
|
"eval_PERSON_f1": 0.8782051282051281, |
|
"eval_PERSON_number": 152, |
|
"eval_PERSON_precision": 0.85625, |
|
"eval_PERSON_recall": 0.9013157894736842, |
|
"eval_QUANTITY_f1": 0.7936507936507938, |
|
"eval_QUANTITY_number": 30, |
|
"eval_QUANTITY_precision": 0.7575757575757576, |
|
"eval_QUANTITY_recall": 0.8333333333333334, |
|
"eval_TIME_f1": 0.8196721311475409, |
|
"eval_TIME_number": 29, |
|
"eval_TIME_precision": 0.78125, |
|
"eval_TIME_recall": 0.8620689655172413, |
|
"eval_loss": 0.18485189974308014, |
|
"eval_overall_accuracy": 0.9610755441741358, |
|
"eval_overall_f1": 0.8368794326241134, |
|
"eval_overall_precision": 0.8038147138964578, |
|
"eval_overall_recall": 0.8727810650887574, |
|
"eval_runtime": 0.8698, |
|
"eval_samples_per_second": 214.991, |
|
"eval_steps_per_second": 3.449, |
|
"step": 4558 |
|
}, |
|
{ |
|
"epoch": 44.0, |
|
"grad_norm": 0.6099337935447693, |
|
"learning_rate": 2.8000000000000003e-05, |
|
"loss": 0.0289, |
|
"step": 4664 |
|
}, |
|
{ |
|
"epoch": 44.0, |
|
"eval_LOCATION_f1": 0.8689655172413793, |
|
"eval_LOCATION_number": 69, |
|
"eval_LOCATION_precision": 0.8289473684210527, |
|
"eval_LOCATION_recall": 0.9130434782608695, |
|
"eval_ORGANIZATION_f1": 0.6942148760330579, |
|
"eval_ORGANIZATION_number": 58, |
|
"eval_ORGANIZATION_precision": 0.6666666666666666, |
|
"eval_ORGANIZATION_recall": 0.7241379310344828, |
|
"eval_PERSON_f1": 0.8745980707395499, |
|
"eval_PERSON_number": 152, |
|
"eval_PERSON_precision": 0.8553459119496856, |
|
"eval_PERSON_recall": 0.8947368421052632, |
|
"eval_QUANTITY_f1": 0.7936507936507938, |
|
"eval_QUANTITY_number": 30, |
|
"eval_QUANTITY_precision": 0.7575757575757576, |
|
"eval_QUANTITY_recall": 0.8333333333333334, |
|
"eval_TIME_f1": 0.8620689655172413, |
|
"eval_TIME_number": 29, |
|
"eval_TIME_precision": 0.8620689655172413, |
|
"eval_TIME_recall": 0.8620689655172413, |
|
"eval_loss": 0.170259490609169, |
|
"eval_overall_accuracy": 0.9610755441741358, |
|
"eval_overall_f1": 0.833810888252149, |
|
"eval_overall_precision": 0.8083333333333333, |
|
"eval_overall_recall": 0.8609467455621301, |
|
"eval_runtime": 0.8888, |
|
"eval_samples_per_second": 210.406, |
|
"eval_steps_per_second": 3.375, |
|
"step": 4664 |
|
}, |
|
{ |
|
"epoch": 45.0, |
|
"grad_norm": 1.0691465139389038, |
|
"learning_rate": 2.7500000000000004e-05, |
|
"loss": 0.0294, |
|
"step": 4770 |
|
}, |
|
{ |
|
"epoch": 45.0, |
|
"eval_LOCATION_f1": 0.8413793103448277, |
|
"eval_LOCATION_number": 69, |
|
"eval_LOCATION_precision": 0.8026315789473685, |
|
"eval_LOCATION_recall": 0.8840579710144928, |
|
"eval_ORGANIZATION_f1": 0.7540983606557378, |
|
"eval_ORGANIZATION_number": 58, |
|
"eval_ORGANIZATION_precision": 0.71875, |
|
"eval_ORGANIZATION_recall": 0.7931034482758621, |
|
"eval_PERSON_f1": 0.8782051282051281, |
|
"eval_PERSON_number": 152, |
|
"eval_PERSON_precision": 0.85625, |
|
"eval_PERSON_recall": 0.9013157894736842, |
|
"eval_QUANTITY_f1": 0.78125, |
|
"eval_QUANTITY_number": 30, |
|
"eval_QUANTITY_precision": 0.7352941176470589, |
|
"eval_QUANTITY_recall": 0.8333333333333334, |
|
"eval_TIME_f1": 0.8196721311475409, |
|
"eval_TIME_number": 29, |
|
"eval_TIME_precision": 0.78125, |
|
"eval_TIME_recall": 0.8620689655172413, |
|
"eval_loss": 0.1816970556974411, |
|
"eval_overall_accuracy": 0.9610755441741358, |
|
"eval_overall_f1": 0.8352272727272727, |
|
"eval_overall_precision": 0.8032786885245902, |
|
"eval_overall_recall": 0.8698224852071006, |
|
"eval_runtime": 0.8854, |
|
"eval_samples_per_second": 211.192, |
|
"eval_steps_per_second": 3.388, |
|
"step": 4770 |
|
}, |
|
{ |
|
"epoch": 46.0, |
|
"grad_norm": 0.2375423014163971, |
|
"learning_rate": 2.7000000000000002e-05, |
|
"loss": 0.0262, |
|
"step": 4876 |
|
}, |
|
{ |
|
"epoch": 46.0, |
|
"eval_LOCATION_f1": 0.863013698630137, |
|
"eval_LOCATION_number": 69, |
|
"eval_LOCATION_precision": 0.8181818181818182, |
|
"eval_LOCATION_recall": 0.9130434782608695, |
|
"eval_ORGANIZATION_f1": 0.7213114754098361, |
|
"eval_ORGANIZATION_number": 58, |
|
"eval_ORGANIZATION_precision": 0.6875, |
|
"eval_ORGANIZATION_recall": 0.7586206896551724, |
|
"eval_PERSON_f1": 0.8874598070739551, |
|
"eval_PERSON_number": 152, |
|
"eval_PERSON_precision": 0.8679245283018868, |
|
"eval_PERSON_recall": 0.9078947368421053, |
|
"eval_QUANTITY_f1": 0.7936507936507938, |
|
"eval_QUANTITY_number": 30, |
|
"eval_QUANTITY_precision": 0.7575757575757576, |
|
"eval_QUANTITY_recall": 0.8333333333333334, |
|
"eval_TIME_f1": 0.8196721311475409, |
|
"eval_TIME_number": 29, |
|
"eval_TIME_precision": 0.78125, |
|
"eval_TIME_recall": 0.8620689655172413, |
|
"eval_loss": 0.1889667958021164, |
|
"eval_overall_accuracy": 0.9626120358514725, |
|
"eval_overall_f1": 0.8392603129445234, |
|
"eval_overall_precision": 0.8082191780821918, |
|
"eval_overall_recall": 0.8727810650887574, |
|
"eval_runtime": 0.8885, |
|
"eval_samples_per_second": 210.463, |
|
"eval_steps_per_second": 3.376, |
|
"step": 4876 |
|
}, |
|
{ |
|
"epoch": 47.0, |
|
"grad_norm": 0.48538097739219666, |
|
"learning_rate": 2.6500000000000004e-05, |
|
"loss": 0.0261, |
|
"step": 4982 |
|
}, |
|
{ |
|
"epoch": 47.0, |
|
"eval_LOCATION_f1": 0.8611111111111112, |
|
"eval_LOCATION_number": 69, |
|
"eval_LOCATION_precision": 0.8266666666666667, |
|
"eval_LOCATION_recall": 0.8985507246376812, |
|
"eval_ORGANIZATION_f1": 0.7438016528925621, |
|
"eval_ORGANIZATION_number": 58, |
|
"eval_ORGANIZATION_precision": 0.7142857142857143, |
|
"eval_ORGANIZATION_recall": 0.7758620689655172, |
|
"eval_PERSON_f1": 0.8838709677419354, |
|
"eval_PERSON_number": 152, |
|
"eval_PERSON_precision": 0.8670886075949367, |
|
"eval_PERSON_recall": 0.9013157894736842, |
|
"eval_QUANTITY_f1": 0.7936507936507938, |
|
"eval_QUANTITY_number": 30, |
|
"eval_QUANTITY_precision": 0.7575757575757576, |
|
"eval_QUANTITY_recall": 0.8333333333333334, |
|
"eval_TIME_f1": 0.8813559322033899, |
|
"eval_TIME_number": 29, |
|
"eval_TIME_precision": 0.8666666666666667, |
|
"eval_TIME_recall": 0.896551724137931, |
|
"eval_loss": 0.18387795984745026, |
|
"eval_overall_accuracy": 0.9626120358514725, |
|
"eval_overall_f1": 0.8464849354375897, |
|
"eval_overall_precision": 0.8217270194986073, |
|
"eval_overall_recall": 0.8727810650887574, |
|
"eval_runtime": 0.8841, |
|
"eval_samples_per_second": 211.519, |
|
"eval_steps_per_second": 3.393, |
|
"step": 4982 |
|
}, |
|
{ |
|
"epoch": 48.0, |
|
"grad_norm": 1.2411327362060547, |
|
"learning_rate": 2.6000000000000002e-05, |
|
"loss": 0.027, |
|
"step": 5088 |
|
}, |
|
{ |
|
"epoch": 48.0, |
|
"eval_LOCATION_f1": 0.8648648648648648, |
|
"eval_LOCATION_number": 69, |
|
"eval_LOCATION_precision": 0.810126582278481, |
|
"eval_LOCATION_recall": 0.927536231884058, |
|
"eval_ORGANIZATION_f1": 0.7343749999999999, |
|
"eval_ORGANIZATION_number": 58, |
|
"eval_ORGANIZATION_precision": 0.6714285714285714, |
|
"eval_ORGANIZATION_recall": 0.8103448275862069, |
|
"eval_PERSON_f1": 0.8838709677419354, |
|
"eval_PERSON_number": 152, |
|
"eval_PERSON_precision": 0.8670886075949367, |
|
"eval_PERSON_recall": 0.9013157894736842, |
|
"eval_QUANTITY_f1": 0.7936507936507938, |
|
"eval_QUANTITY_number": 30, |
|
"eval_QUANTITY_precision": 0.7575757575757576, |
|
"eval_QUANTITY_recall": 0.8333333333333334, |
|
"eval_TIME_f1": 0.8135593220338982, |
|
"eval_TIME_number": 29, |
|
"eval_TIME_precision": 0.8, |
|
"eval_TIME_recall": 0.8275862068965517, |
|
"eval_loss": 0.18413321673870087, |
|
"eval_overall_accuracy": 0.9615877080665813, |
|
"eval_overall_f1": 0.8389830508474576, |
|
"eval_overall_precision": 0.8027027027027027, |
|
"eval_overall_recall": 0.878698224852071, |
|
"eval_runtime": 0.8687, |
|
"eval_samples_per_second": 215.275, |
|
"eval_steps_per_second": 3.454, |
|
"step": 5088 |
|
}, |
|
{ |
|
"epoch": 49.0, |
|
"grad_norm": 1.1320481300354004, |
|
"learning_rate": 2.5500000000000003e-05, |
|
"loss": 0.0243, |
|
"step": 5194 |
|
}, |
|
{ |
|
"epoch": 49.0, |
|
"eval_LOCATION_f1": 0.8652482269503546, |
|
"eval_LOCATION_number": 69, |
|
"eval_LOCATION_precision": 0.8472222222222222, |
|
"eval_LOCATION_recall": 0.8840579710144928, |
|
"eval_ORGANIZATION_f1": 0.717948717948718, |
|
"eval_ORGANIZATION_number": 58, |
|
"eval_ORGANIZATION_precision": 0.711864406779661, |
|
"eval_ORGANIZATION_recall": 0.7241379310344828, |
|
"eval_PERSON_f1": 0.8810289389067525, |
|
"eval_PERSON_number": 152, |
|
"eval_PERSON_precision": 0.8616352201257862, |
|
"eval_PERSON_recall": 0.9013157894736842, |
|
"eval_QUANTITY_f1": 0.7936507936507938, |
|
"eval_QUANTITY_number": 30, |
|
"eval_QUANTITY_precision": 0.7575757575757576, |
|
"eval_QUANTITY_recall": 0.8333333333333334, |
|
"eval_TIME_f1": 0.8620689655172413, |
|
"eval_TIME_number": 29, |
|
"eval_TIME_precision": 0.8620689655172413, |
|
"eval_TIME_recall": 0.8620689655172413, |
|
"eval_loss": 0.18021155893802643, |
|
"eval_overall_accuracy": 0.9628681177976952, |
|
"eval_overall_f1": 0.8405797101449276, |
|
"eval_overall_precision": 0.8238636363636364, |
|
"eval_overall_recall": 0.8579881656804734, |
|
"eval_runtime": 0.8873, |
|
"eval_samples_per_second": 210.759, |
|
"eval_steps_per_second": 3.381, |
|
"step": 5194 |
|
}, |
|
{ |
|
"epoch": 50.0, |
|
"grad_norm": 0.6338851451873779, |
|
"learning_rate": 2.5e-05, |
|
"loss": 0.0243, |
|
"step": 5300 |
|
}, |
|
{ |
|
"epoch": 50.0, |
|
"eval_LOCATION_f1": 0.8648648648648648, |
|
"eval_LOCATION_number": 69, |
|
"eval_LOCATION_precision": 0.810126582278481, |
|
"eval_LOCATION_recall": 0.927536231884058, |
|
"eval_ORGANIZATION_f1": 0.7040000000000001, |
|
"eval_ORGANIZATION_number": 58, |
|
"eval_ORGANIZATION_precision": 0.6567164179104478, |
|
"eval_ORGANIZATION_recall": 0.7586206896551724, |
|
"eval_PERSON_f1": 0.8846153846153847, |
|
"eval_PERSON_number": 152, |
|
"eval_PERSON_precision": 0.8625, |
|
"eval_PERSON_recall": 0.9078947368421053, |
|
"eval_QUANTITY_f1": 0.7936507936507938, |
|
"eval_QUANTITY_number": 30, |
|
"eval_QUANTITY_precision": 0.7575757575757576, |
|
"eval_QUANTITY_recall": 0.8333333333333334, |
|
"eval_TIME_f1": 0.8135593220338982, |
|
"eval_TIME_number": 29, |
|
"eval_TIME_precision": 0.8, |
|
"eval_TIME_recall": 0.8275862068965517, |
|
"eval_loss": 0.1869899332523346, |
|
"eval_overall_accuracy": 0.9613316261203585, |
|
"eval_overall_f1": 0.8345120226308346, |
|
"eval_overall_precision": 0.7994579945799458, |
|
"eval_overall_recall": 0.8727810650887574, |
|
"eval_runtime": 0.8731, |
|
"eval_samples_per_second": 214.182, |
|
"eval_steps_per_second": 3.436, |
|
"step": 5300 |
|
}, |
|
{ |
|
"epoch": 51.0, |
|
"grad_norm": 2.7834653854370117, |
|
"learning_rate": 2.45e-05, |
|
"loss": 0.0256, |
|
"step": 5406 |
|
}, |
|
{ |
|
"epoch": 51.0, |
|
"eval_LOCATION_f1": 0.8611111111111112, |
|
"eval_LOCATION_number": 69, |
|
"eval_LOCATION_precision": 0.8266666666666667, |
|
"eval_LOCATION_recall": 0.8985507246376812, |
|
"eval_ORGANIZATION_f1": 0.7022900763358779, |
|
"eval_ORGANIZATION_number": 58, |
|
"eval_ORGANIZATION_precision": 0.6301369863013698, |
|
"eval_ORGANIZATION_recall": 0.7931034482758621, |
|
"eval_PERSON_f1": 0.8838709677419354, |
|
"eval_PERSON_number": 152, |
|
"eval_PERSON_precision": 0.8670886075949367, |
|
"eval_PERSON_recall": 0.9013157894736842, |
|
"eval_QUANTITY_f1": 0.7936507936507938, |
|
"eval_QUANTITY_number": 30, |
|
"eval_QUANTITY_precision": 0.7575757575757576, |
|
"eval_QUANTITY_recall": 0.8333333333333334, |
|
"eval_TIME_f1": 0.8620689655172413, |
|
"eval_TIME_number": 29, |
|
"eval_TIME_precision": 0.8620689655172413, |
|
"eval_TIME_recall": 0.8620689655172413, |
|
"eval_loss": 0.19200466573238373, |
|
"eval_overall_accuracy": 0.9613316261203585, |
|
"eval_overall_f1": 0.8356940509915014, |
|
"eval_overall_precision": 0.8016304347826086, |
|
"eval_overall_recall": 0.8727810650887574, |
|
"eval_runtime": 0.8812, |
|
"eval_samples_per_second": 212.219, |
|
"eval_steps_per_second": 3.405, |
|
"step": 5406 |
|
}, |
|
{ |
|
"epoch": 52.0, |
|
"grad_norm": 0.22858576476573944, |
|
"learning_rate": 2.4e-05, |
|
"loss": 0.0233, |
|
"step": 5512 |
|
}, |
|
{ |
|
"epoch": 52.0, |
|
"eval_LOCATION_f1": 0.8611111111111112, |
|
"eval_LOCATION_number": 69, |
|
"eval_LOCATION_precision": 0.8266666666666667, |
|
"eval_LOCATION_recall": 0.8985507246376812, |
|
"eval_ORGANIZATION_f1": 0.716417910447761, |
|
"eval_ORGANIZATION_number": 58, |
|
"eval_ORGANIZATION_precision": 0.631578947368421, |
|
"eval_ORGANIZATION_recall": 0.8275862068965517, |
|
"eval_PERSON_f1": 0.8789808917197451, |
|
"eval_PERSON_number": 152, |
|
"eval_PERSON_precision": 0.8518518518518519, |
|
"eval_PERSON_recall": 0.9078947368421053, |
|
"eval_QUANTITY_f1": 0.7936507936507938, |
|
"eval_QUANTITY_number": 30, |
|
"eval_QUANTITY_precision": 0.7575757575757576, |
|
"eval_QUANTITY_recall": 0.8333333333333334, |
|
"eval_TIME_f1": 0.7931034482758621, |
|
"eval_TIME_number": 29, |
|
"eval_TIME_precision": 0.7931034482758621, |
|
"eval_TIME_recall": 0.7931034482758621, |
|
"eval_loss": 0.19999483227729797, |
|
"eval_overall_accuracy": 0.9590268886043534, |
|
"eval_overall_f1": 0.8302945301542777, |
|
"eval_overall_precision": 0.7893333333333333, |
|
"eval_overall_recall": 0.8757396449704142, |
|
"eval_runtime": 0.8802, |
|
"eval_samples_per_second": 212.441, |
|
"eval_steps_per_second": 3.408, |
|
"step": 5512 |
|
}, |
|
{ |
|
"epoch": 53.0, |
|
"grad_norm": 1.8902926445007324, |
|
"learning_rate": 2.35e-05, |
|
"loss": 0.0233, |
|
"step": 5618 |
|
}, |
|
{ |
|
"epoch": 53.0, |
|
"eval_LOCATION_f1": 0.853146853146853, |
|
"eval_LOCATION_number": 69, |
|
"eval_LOCATION_precision": 0.8243243243243243, |
|
"eval_LOCATION_recall": 0.8840579710144928, |
|
"eval_ORGANIZATION_f1": 0.6923076923076923, |
|
"eval_ORGANIZATION_number": 58, |
|
"eval_ORGANIZATION_precision": 0.625, |
|
"eval_ORGANIZATION_recall": 0.7758620689655172, |
|
"eval_PERSON_f1": 0.8846153846153847, |
|
"eval_PERSON_number": 152, |
|
"eval_PERSON_precision": 0.8625, |
|
"eval_PERSON_recall": 0.9078947368421053, |
|
"eval_QUANTITY_f1": 0.7500000000000001, |
|
"eval_QUANTITY_number": 30, |
|
"eval_QUANTITY_precision": 0.7058823529411765, |
|
"eval_QUANTITY_recall": 0.8, |
|
"eval_TIME_f1": 0.8333333333333334, |
|
"eval_TIME_number": 29, |
|
"eval_TIME_precision": 0.8064516129032258, |
|
"eval_TIME_recall": 0.8620689655172413, |
|
"eval_loss": 0.19701984524726868, |
|
"eval_overall_accuracy": 0.9608194622279129, |
|
"eval_overall_f1": 0.8265162200282087, |
|
"eval_overall_precision": 0.7897574123989218, |
|
"eval_overall_recall": 0.8668639053254438, |
|
"eval_runtime": 0.8753, |
|
"eval_samples_per_second": 213.637, |
|
"eval_steps_per_second": 3.427, |
|
"step": 5618 |
|
}, |
|
{ |
|
"epoch": 54.0, |
|
"grad_norm": 0.5953955054283142, |
|
"learning_rate": 2.3000000000000003e-05, |
|
"loss": 0.0211, |
|
"step": 5724 |
|
}, |
|
{ |
|
"epoch": 54.0, |
|
"eval_LOCATION_f1": 0.8571428571428572, |
|
"eval_LOCATION_number": 69, |
|
"eval_LOCATION_precision": 0.8076923076923077, |
|
"eval_LOCATION_recall": 0.9130434782608695, |
|
"eval_ORGANIZATION_f1": 0.7200000000000001, |
|
"eval_ORGANIZATION_number": 58, |
|
"eval_ORGANIZATION_precision": 0.6716417910447762, |
|
"eval_ORGANIZATION_recall": 0.7758620689655172, |
|
"eval_PERSON_f1": 0.860759493670886, |
|
"eval_PERSON_number": 152, |
|
"eval_PERSON_precision": 0.8292682926829268, |
|
"eval_PERSON_recall": 0.8947368421052632, |
|
"eval_QUANTITY_f1": 0.8064516129032259, |
|
"eval_QUANTITY_number": 30, |
|
"eval_QUANTITY_precision": 0.78125, |
|
"eval_QUANTITY_recall": 0.8333333333333334, |
|
"eval_TIME_f1": 0.847457627118644, |
|
"eval_TIME_number": 29, |
|
"eval_TIME_precision": 0.8333333333333334, |
|
"eval_TIME_recall": 0.8620689655172413, |
|
"eval_loss": 0.21723441779613495, |
|
"eval_overall_accuracy": 0.9595390524967989, |
|
"eval_overall_f1": 0.8293370944992947, |
|
"eval_overall_precision": 0.7924528301886793, |
|
"eval_overall_recall": 0.8698224852071006, |
|
"eval_runtime": 0.8826, |
|
"eval_samples_per_second": 211.865, |
|
"eval_steps_per_second": 3.399, |
|
"step": 5724 |
|
}, |
|
{ |
|
"epoch": 55.0, |
|
"grad_norm": 2.6492440700531006, |
|
"learning_rate": 2.25e-05, |
|
"loss": 0.0217, |
|
"step": 5830 |
|
}, |
|
{ |
|
"epoch": 55.0, |
|
"eval_LOCATION_f1": 0.8551724137931034, |
|
"eval_LOCATION_number": 69, |
|
"eval_LOCATION_precision": 0.8157894736842105, |
|
"eval_LOCATION_recall": 0.8985507246376812, |
|
"eval_ORGANIZATION_f1": 0.6507936507936507, |
|
"eval_ORGANIZATION_number": 58, |
|
"eval_ORGANIZATION_precision": 0.6029411764705882, |
|
"eval_ORGANIZATION_recall": 0.7068965517241379, |
|
"eval_PERSON_f1": 0.8838709677419354, |
|
"eval_PERSON_number": 152, |
|
"eval_PERSON_precision": 0.8670886075949367, |
|
"eval_PERSON_recall": 0.9013157894736842, |
|
"eval_QUANTITY_f1": 0.8064516129032259, |
|
"eval_QUANTITY_number": 30, |
|
"eval_QUANTITY_precision": 0.78125, |
|
"eval_QUANTITY_recall": 0.8333333333333334, |
|
"eval_TIME_f1": 0.8813559322033899, |
|
"eval_TIME_number": 29, |
|
"eval_TIME_precision": 0.8666666666666667, |
|
"eval_TIME_recall": 0.896551724137931, |
|
"eval_loss": 0.19644935429096222, |
|
"eval_overall_accuracy": 0.9608194622279129, |
|
"eval_overall_f1": 0.829059829059829, |
|
"eval_overall_precision": 0.7994505494505495, |
|
"eval_overall_recall": 0.8609467455621301, |
|
"eval_runtime": 0.8838, |
|
"eval_samples_per_second": 211.588, |
|
"eval_steps_per_second": 3.394, |
|
"step": 5830 |
|
}, |
|
{ |
|
"epoch": 56.0, |
|
"grad_norm": 0.8844048380851746, |
|
"learning_rate": 2.2000000000000003e-05, |
|
"loss": 0.0214, |
|
"step": 5936 |
|
}, |
|
{ |
|
"epoch": 56.0, |
|
"eval_LOCATION_f1": 0.8749999999999999, |
|
"eval_LOCATION_number": 69, |
|
"eval_LOCATION_precision": 0.84, |
|
"eval_LOCATION_recall": 0.9130434782608695, |
|
"eval_ORGANIZATION_f1": 0.7096774193548386, |
|
"eval_ORGANIZATION_number": 58, |
|
"eval_ORGANIZATION_precision": 0.6666666666666666, |
|
"eval_ORGANIZATION_recall": 0.7586206896551724, |
|
"eval_PERSON_f1": 0.8817891373801917, |
|
"eval_PERSON_number": 152, |
|
"eval_PERSON_precision": 0.8571428571428571, |
|
"eval_PERSON_recall": 0.9078947368421053, |
|
"eval_QUANTITY_f1": 0.8064516129032259, |
|
"eval_QUANTITY_number": 30, |
|
"eval_QUANTITY_precision": 0.78125, |
|
"eval_QUANTITY_recall": 0.8333333333333334, |
|
"eval_TIME_f1": 0.847457627118644, |
|
"eval_TIME_number": 29, |
|
"eval_TIME_precision": 0.8333333333333334, |
|
"eval_TIME_recall": 0.8620689655172413, |
|
"eval_loss": 0.20219193398952484, |
|
"eval_overall_accuracy": 0.9620998719590269, |
|
"eval_overall_f1": 0.8404558404558404, |
|
"eval_overall_precision": 0.8104395604395604, |
|
"eval_overall_recall": 0.8727810650887574, |
|
"eval_runtime": 0.8832, |
|
"eval_samples_per_second": 211.741, |
|
"eval_steps_per_second": 3.397, |
|
"step": 5936 |
|
}, |
|
{ |
|
"epoch": 57.0, |
|
"grad_norm": 0.3619399666786194, |
|
"learning_rate": 2.15e-05, |
|
"loss": 0.0197, |
|
"step": 6042 |
|
}, |
|
{ |
|
"epoch": 57.0, |
|
"eval_LOCATION_f1": 0.8493150684931507, |
|
"eval_LOCATION_number": 69, |
|
"eval_LOCATION_precision": 0.8051948051948052, |
|
"eval_LOCATION_recall": 0.8985507246376812, |
|
"eval_ORGANIZATION_f1": 0.7049180327868853, |
|
"eval_ORGANIZATION_number": 58, |
|
"eval_ORGANIZATION_precision": 0.671875, |
|
"eval_ORGANIZATION_recall": 0.7413793103448276, |
|
"eval_PERSON_f1": 0.8903225806451613, |
|
"eval_PERSON_number": 152, |
|
"eval_PERSON_precision": 0.8734177215189873, |
|
"eval_PERSON_recall": 0.9078947368421053, |
|
"eval_QUANTITY_f1": 0.78125, |
|
"eval_QUANTITY_number": 30, |
|
"eval_QUANTITY_precision": 0.7352941176470589, |
|
"eval_QUANTITY_recall": 0.8333333333333334, |
|
"eval_TIME_f1": 0.8135593220338982, |
|
"eval_TIME_number": 29, |
|
"eval_TIME_precision": 0.8, |
|
"eval_TIME_recall": 0.8275862068965517, |
|
"eval_loss": 0.20077820122241974, |
|
"eval_overall_accuracy": 0.9608194622279129, |
|
"eval_overall_f1": 0.8330955777460769, |
|
"eval_overall_precision": 0.8044077134986226, |
|
"eval_overall_recall": 0.863905325443787, |
|
"eval_runtime": 0.9531, |
|
"eval_samples_per_second": 196.195, |
|
"eval_steps_per_second": 3.148, |
|
"step": 6042 |
|
}, |
|
{ |
|
"epoch": 58.0, |
|
"grad_norm": 0.1735541820526123, |
|
"learning_rate": 2.1e-05, |
|
"loss": 0.0216, |
|
"step": 6148 |
|
}, |
|
{ |
|
"epoch": 58.0, |
|
"eval_LOCATION_f1": 0.8551724137931034, |
|
"eval_LOCATION_number": 69, |
|
"eval_LOCATION_precision": 0.8157894736842105, |
|
"eval_LOCATION_recall": 0.8985507246376812, |
|
"eval_ORGANIZATION_f1": 0.7131782945736435, |
|
"eval_ORGANIZATION_number": 58, |
|
"eval_ORGANIZATION_precision": 0.647887323943662, |
|
"eval_ORGANIZATION_recall": 0.7931034482758621, |
|
"eval_PERSON_f1": 0.8782051282051281, |
|
"eval_PERSON_number": 152, |
|
"eval_PERSON_precision": 0.85625, |
|
"eval_PERSON_recall": 0.9013157894736842, |
|
"eval_QUANTITY_f1": 0.7936507936507938, |
|
"eval_QUANTITY_number": 30, |
|
"eval_QUANTITY_precision": 0.7575757575757576, |
|
"eval_QUANTITY_recall": 0.8333333333333334, |
|
"eval_TIME_f1": 0.847457627118644, |
|
"eval_TIME_number": 29, |
|
"eval_TIME_precision": 0.8333333333333334, |
|
"eval_TIME_recall": 0.8620689655172413, |
|
"eval_loss": 0.21140815317630768, |
|
"eval_overall_accuracy": 0.9597951344430218, |
|
"eval_overall_f1": 0.8333333333333334, |
|
"eval_overall_precision": 0.7972972972972973, |
|
"eval_overall_recall": 0.8727810650887574, |
|
"eval_runtime": 0.8863, |
|
"eval_samples_per_second": 210.995, |
|
"eval_steps_per_second": 3.385, |
|
"step": 6148 |
|
}, |
|
{ |
|
"epoch": 59.0, |
|
"grad_norm": 0.837820291519165, |
|
"learning_rate": 2.05e-05, |
|
"loss": 0.0197, |
|
"step": 6254 |
|
}, |
|
{ |
|
"epoch": 59.0, |
|
"eval_LOCATION_f1": 0.863013698630137, |
|
"eval_LOCATION_number": 69, |
|
"eval_LOCATION_precision": 0.8181818181818182, |
|
"eval_LOCATION_recall": 0.9130434782608695, |
|
"eval_ORGANIZATION_f1": 0.7244094488188977, |
|
"eval_ORGANIZATION_number": 58, |
|
"eval_ORGANIZATION_precision": 0.6666666666666666, |
|
"eval_ORGANIZATION_recall": 0.7931034482758621, |
|
"eval_PERSON_f1": 0.8846153846153847, |
|
"eval_PERSON_number": 152, |
|
"eval_PERSON_precision": 0.8625, |
|
"eval_PERSON_recall": 0.9078947368421053, |
|
"eval_QUANTITY_f1": 0.7936507936507938, |
|
"eval_QUANTITY_number": 30, |
|
"eval_QUANTITY_precision": 0.7575757575757576, |
|
"eval_QUANTITY_recall": 0.8333333333333334, |
|
"eval_TIME_f1": 0.8333333333333334, |
|
"eval_TIME_number": 29, |
|
"eval_TIME_precision": 0.8064516129032258, |
|
"eval_TIME_recall": 0.8620689655172413, |
|
"eval_loss": 0.20840610563755035, |
|
"eval_overall_accuracy": 0.9600512163892445, |
|
"eval_overall_f1": 0.8389830508474576, |
|
"eval_overall_precision": 0.8027027027027027, |
|
"eval_overall_recall": 0.878698224852071, |
|
"eval_runtime": 0.8868, |
|
"eval_samples_per_second": 210.865, |
|
"eval_steps_per_second": 3.383, |
|
"step": 6254 |
|
}, |
|
{ |
|
"epoch": 60.0, |
|
"grad_norm": 0.5633171796798706, |
|
"learning_rate": 2e-05, |
|
"loss": 0.0182, |
|
"step": 6360 |
|
}, |
|
{ |
|
"epoch": 60.0, |
|
"eval_LOCATION_f1": 0.863013698630137, |
|
"eval_LOCATION_number": 69, |
|
"eval_LOCATION_precision": 0.8181818181818182, |
|
"eval_LOCATION_recall": 0.9130434782608695, |
|
"eval_ORGANIZATION_f1": 0.7286821705426356, |
|
"eval_ORGANIZATION_number": 58, |
|
"eval_ORGANIZATION_precision": 0.6619718309859155, |
|
"eval_ORGANIZATION_recall": 0.8103448275862069, |
|
"eval_PERSON_f1": 0.8726114649681528, |
|
"eval_PERSON_number": 152, |
|
"eval_PERSON_precision": 0.845679012345679, |
|
"eval_PERSON_recall": 0.9013157894736842, |
|
"eval_QUANTITY_f1": 0.7936507936507938, |
|
"eval_QUANTITY_number": 30, |
|
"eval_QUANTITY_precision": 0.7575757575757576, |
|
"eval_QUANTITY_recall": 0.8333333333333334, |
|
"eval_TIME_f1": 0.8666666666666666, |
|
"eval_TIME_number": 29, |
|
"eval_TIME_precision": 0.8387096774193549, |
|
"eval_TIME_recall": 0.896551724137931, |
|
"eval_loss": 0.21587228775024414, |
|
"eval_overall_accuracy": 0.9603072983354674, |
|
"eval_overall_f1": 0.8370786516853933, |
|
"eval_overall_precision": 0.7967914438502673, |
|
"eval_overall_recall": 0.8816568047337278, |
|
"eval_runtime": 0.8748, |
|
"eval_samples_per_second": 213.775, |
|
"eval_steps_per_second": 3.43, |
|
"step": 6360 |
|
}, |
|
{ |
|
"epoch": 61.0, |
|
"grad_norm": 0.4832909405231476, |
|
"learning_rate": 1.9500000000000003e-05, |
|
"loss": 0.0196, |
|
"step": 6466 |
|
}, |
|
{ |
|
"epoch": 61.0, |
|
"eval_LOCATION_f1": 0.863013698630137, |
|
"eval_LOCATION_number": 69, |
|
"eval_LOCATION_precision": 0.8181818181818182, |
|
"eval_LOCATION_recall": 0.9130434782608695, |
|
"eval_ORGANIZATION_f1": 0.7200000000000001, |
|
"eval_ORGANIZATION_number": 58, |
|
"eval_ORGANIZATION_precision": 0.6716417910447762, |
|
"eval_ORGANIZATION_recall": 0.7758620689655172, |
|
"eval_PERSON_f1": 0.8846153846153847, |
|
"eval_PERSON_number": 152, |
|
"eval_PERSON_precision": 0.8625, |
|
"eval_PERSON_recall": 0.9078947368421053, |
|
"eval_QUANTITY_f1": 0.7936507936507938, |
|
"eval_QUANTITY_number": 30, |
|
"eval_QUANTITY_precision": 0.7575757575757576, |
|
"eval_QUANTITY_recall": 0.8333333333333334, |
|
"eval_TIME_f1": 0.8813559322033899, |
|
"eval_TIME_number": 29, |
|
"eval_TIME_precision": 0.8666666666666667, |
|
"eval_TIME_recall": 0.896551724137931, |
|
"eval_loss": 0.20733201503753662, |
|
"eval_overall_accuracy": 0.9615877080665813, |
|
"eval_overall_f1": 0.8425531914893617, |
|
"eval_overall_precision": 0.8092643051771117, |
|
"eval_overall_recall": 0.878698224852071, |
|
"eval_runtime": 0.9535, |
|
"eval_samples_per_second": 196.123, |
|
"eval_steps_per_second": 3.146, |
|
"step": 6466 |
|
}, |
|
{ |
|
"epoch": 62.0, |
|
"grad_norm": 0.6487990617752075, |
|
"learning_rate": 1.9e-05, |
|
"loss": 0.0176, |
|
"step": 6572 |
|
}, |
|
{ |
|
"epoch": 62.0, |
|
"eval_LOCATION_f1": 0.8671328671328672, |
|
"eval_LOCATION_number": 69, |
|
"eval_LOCATION_precision": 0.8378378378378378, |
|
"eval_LOCATION_recall": 0.8985507246376812, |
|
"eval_ORGANIZATION_f1": 0.7213114754098361, |
|
"eval_ORGANIZATION_number": 58, |
|
"eval_ORGANIZATION_precision": 0.6875, |
|
"eval_ORGANIZATION_recall": 0.7586206896551724, |
|
"eval_PERSON_f1": 0.8769716088328074, |
|
"eval_PERSON_number": 152, |
|
"eval_PERSON_precision": 0.8424242424242424, |
|
"eval_PERSON_recall": 0.9144736842105263, |
|
"eval_QUANTITY_f1": 0.7936507936507938, |
|
"eval_QUANTITY_number": 30, |
|
"eval_QUANTITY_precision": 0.7575757575757576, |
|
"eval_QUANTITY_recall": 0.8333333333333334, |
|
"eval_TIME_f1": 0.7931034482758621, |
|
"eval_TIME_number": 29, |
|
"eval_TIME_precision": 0.7931034482758621, |
|
"eval_TIME_recall": 0.7931034482758621, |
|
"eval_loss": 0.20125307142734528, |
|
"eval_overall_accuracy": 0.9605633802816902, |
|
"eval_overall_f1": 0.8335704125177809, |
|
"eval_overall_precision": 0.8027397260273973, |
|
"eval_overall_recall": 0.8668639053254438, |
|
"eval_runtime": 0.8874, |
|
"eval_samples_per_second": 210.718, |
|
"eval_steps_per_second": 3.38, |
|
"step": 6572 |
|
}, |
|
{ |
|
"epoch": 63.0, |
|
"grad_norm": 0.8727775812149048, |
|
"learning_rate": 1.85e-05, |
|
"loss": 0.0157, |
|
"step": 6678 |
|
}, |
|
{ |
|
"epoch": 63.0, |
|
"eval_LOCATION_f1": 0.8356164383561644, |
|
"eval_LOCATION_number": 69, |
|
"eval_LOCATION_precision": 0.7922077922077922, |
|
"eval_LOCATION_recall": 0.8840579710144928, |
|
"eval_ORGANIZATION_f1": 0.6833333333333333, |
|
"eval_ORGANIZATION_number": 58, |
|
"eval_ORGANIZATION_precision": 0.6612903225806451, |
|
"eval_ORGANIZATION_recall": 0.7068965517241379, |
|
"eval_PERSON_f1": 0.8838709677419354, |
|
"eval_PERSON_number": 152, |
|
"eval_PERSON_precision": 0.8670886075949367, |
|
"eval_PERSON_recall": 0.9013157894736842, |
|
"eval_QUANTITY_f1": 0.8064516129032259, |
|
"eval_QUANTITY_number": 30, |
|
"eval_QUANTITY_precision": 0.78125, |
|
"eval_QUANTITY_recall": 0.8333333333333334, |
|
"eval_TIME_f1": 0.8333333333333334, |
|
"eval_TIME_number": 29, |
|
"eval_TIME_precision": 0.8064516129032258, |
|
"eval_TIME_recall": 0.8620689655172413, |
|
"eval_loss": 0.20443986356258392, |
|
"eval_overall_accuracy": 0.9600512163892445, |
|
"eval_overall_f1": 0.828080229226361, |
|
"eval_overall_precision": 0.8027777777777778, |
|
"eval_overall_recall": 0.8550295857988166, |
|
"eval_runtime": 0.8782, |
|
"eval_samples_per_second": 212.933, |
|
"eval_steps_per_second": 3.416, |
|
"step": 6678 |
|
}, |
|
{ |
|
"epoch": 64.0, |
|
"grad_norm": 1.5122424364089966, |
|
"learning_rate": 1.8e-05, |
|
"loss": 0.0177, |
|
"step": 6784 |
|
}, |
|
{ |
|
"epoch": 64.0, |
|
"eval_LOCATION_f1": 0.8476821192052981, |
|
"eval_LOCATION_number": 69, |
|
"eval_LOCATION_precision": 0.7804878048780488, |
|
"eval_LOCATION_recall": 0.927536231884058, |
|
"eval_ORGANIZATION_f1": 0.7175572519083969, |
|
"eval_ORGANIZATION_number": 58, |
|
"eval_ORGANIZATION_precision": 0.6438356164383562, |
|
"eval_ORGANIZATION_recall": 0.8103448275862069, |
|
"eval_PERSON_f1": 0.8652037617554859, |
|
"eval_PERSON_number": 152, |
|
"eval_PERSON_precision": 0.8263473053892215, |
|
"eval_PERSON_recall": 0.9078947368421053, |
|
"eval_QUANTITY_f1": 0.7936507936507938, |
|
"eval_QUANTITY_number": 30, |
|
"eval_QUANTITY_precision": 0.7575757575757576, |
|
"eval_QUANTITY_recall": 0.8333333333333334, |
|
"eval_TIME_f1": 0.8813559322033899, |
|
"eval_TIME_number": 29, |
|
"eval_TIME_precision": 0.8666666666666667, |
|
"eval_TIME_recall": 0.896551724137931, |
|
"eval_loss": 0.22791583836078644, |
|
"eval_overall_accuracy": 0.9590268886043534, |
|
"eval_overall_f1": 0.8298755186721992, |
|
"eval_overall_precision": 0.7792207792207793, |
|
"eval_overall_recall": 0.8875739644970414, |
|
"eval_runtime": 0.8723, |
|
"eval_samples_per_second": 214.372, |
|
"eval_steps_per_second": 3.439, |
|
"step": 6784 |
|
}, |
|
{ |
|
"epoch": 65.0, |
|
"grad_norm": 1.5700312852859497, |
|
"learning_rate": 1.75e-05, |
|
"loss": 0.0165, |
|
"step": 6890 |
|
}, |
|
{ |
|
"epoch": 65.0, |
|
"eval_LOCATION_f1": 0.8493150684931507, |
|
"eval_LOCATION_number": 69, |
|
"eval_LOCATION_precision": 0.8051948051948052, |
|
"eval_LOCATION_recall": 0.8985507246376812, |
|
"eval_ORGANIZATION_f1": 0.7301587301587301, |
|
"eval_ORGANIZATION_number": 58, |
|
"eval_ORGANIZATION_precision": 0.6764705882352942, |
|
"eval_ORGANIZATION_recall": 0.7931034482758621, |
|
"eval_PERSON_f1": 0.8698412698412699, |
|
"eval_PERSON_number": 152, |
|
"eval_PERSON_precision": 0.8404907975460123, |
|
"eval_PERSON_recall": 0.9013157894736842, |
|
"eval_QUANTITY_f1": 0.761904761904762, |
|
"eval_QUANTITY_number": 30, |
|
"eval_QUANTITY_precision": 0.7272727272727273, |
|
"eval_QUANTITY_recall": 0.8, |
|
"eval_TIME_f1": 0.8135593220338982, |
|
"eval_TIME_number": 29, |
|
"eval_TIME_precision": 0.8, |
|
"eval_TIME_recall": 0.8275862068965517, |
|
"eval_loss": 0.21637500822544098, |
|
"eval_overall_accuracy": 0.9585147247119078, |
|
"eval_overall_f1": 0.8265162200282087, |
|
"eval_overall_precision": 0.7897574123989218, |
|
"eval_overall_recall": 0.8668639053254438, |
|
"eval_runtime": 0.8725, |
|
"eval_samples_per_second": 214.338, |
|
"eval_steps_per_second": 3.439, |
|
"step": 6890 |
|
}, |
|
{ |
|
"epoch": 66.0, |
|
"grad_norm": 0.9781705737113953, |
|
"learning_rate": 1.7000000000000003e-05, |
|
"loss": 0.0171, |
|
"step": 6996 |
|
}, |
|
{ |
|
"epoch": 66.0, |
|
"eval_LOCATION_f1": 0.8648648648648648, |
|
"eval_LOCATION_number": 69, |
|
"eval_LOCATION_precision": 0.810126582278481, |
|
"eval_LOCATION_recall": 0.927536231884058, |
|
"eval_ORGANIZATION_f1": 0.746031746031746, |
|
"eval_ORGANIZATION_number": 58, |
|
"eval_ORGANIZATION_precision": 0.6911764705882353, |
|
"eval_ORGANIZATION_recall": 0.8103448275862069, |
|
"eval_PERSON_f1": 0.8734177215189874, |
|
"eval_PERSON_number": 152, |
|
"eval_PERSON_precision": 0.8414634146341463, |
|
"eval_PERSON_recall": 0.9078947368421053, |
|
"eval_QUANTITY_f1": 0.7936507936507938, |
|
"eval_QUANTITY_number": 30, |
|
"eval_QUANTITY_precision": 0.7575757575757576, |
|
"eval_QUANTITY_recall": 0.8333333333333334, |
|
"eval_TIME_f1": 0.8813559322033899, |
|
"eval_TIME_number": 29, |
|
"eval_TIME_precision": 0.8666666666666667, |
|
"eval_TIME_recall": 0.896551724137931, |
|
"eval_loss": 0.21887072920799255, |
|
"eval_overall_accuracy": 0.9620998719590269, |
|
"eval_overall_f1": 0.8426966292134831, |
|
"eval_overall_precision": 0.8021390374331551, |
|
"eval_overall_recall": 0.8875739644970414, |
|
"eval_runtime": 0.8649, |
|
"eval_samples_per_second": 216.219, |
|
"eval_steps_per_second": 3.469, |
|
"step": 6996 |
|
}, |
|
{ |
|
"epoch": 67.0, |
|
"grad_norm": 0.7777842879295349, |
|
"learning_rate": 1.65e-05, |
|
"loss": 0.0167, |
|
"step": 7102 |
|
}, |
|
{ |
|
"epoch": 67.0, |
|
"eval_LOCATION_f1": 0.8590604026845639, |
|
"eval_LOCATION_number": 69, |
|
"eval_LOCATION_precision": 0.8, |
|
"eval_LOCATION_recall": 0.927536231884058, |
|
"eval_ORGANIZATION_f1": 0.7286821705426356, |
|
"eval_ORGANIZATION_number": 58, |
|
"eval_ORGANIZATION_precision": 0.6619718309859155, |
|
"eval_ORGANIZATION_recall": 0.8103448275862069, |
|
"eval_PERSON_f1": 0.8832807570977917, |
|
"eval_PERSON_number": 152, |
|
"eval_PERSON_precision": 0.8484848484848485, |
|
"eval_PERSON_recall": 0.9210526315789473, |
|
"eval_QUANTITY_f1": 0.7936507936507938, |
|
"eval_QUANTITY_number": 30, |
|
"eval_QUANTITY_precision": 0.7575757575757576, |
|
"eval_QUANTITY_recall": 0.8333333333333334, |
|
"eval_TIME_f1": 0.7812500000000001, |
|
"eval_TIME_number": 29, |
|
"eval_TIME_precision": 0.7142857142857143, |
|
"eval_TIME_recall": 0.8620689655172413, |
|
"eval_loss": 0.23059594631195068, |
|
"eval_overall_accuracy": 0.9597951344430218, |
|
"eval_overall_f1": 0.8337950138504154, |
|
"eval_overall_precision": 0.7838541666666666, |
|
"eval_overall_recall": 0.8905325443786982, |
|
"eval_runtime": 0.8828, |
|
"eval_samples_per_second": 211.834, |
|
"eval_steps_per_second": 3.398, |
|
"step": 7102 |
|
}, |
|
{ |
|
"epoch": 68.0, |
|
"grad_norm": 0.42934471368789673, |
|
"learning_rate": 1.6000000000000003e-05, |
|
"loss": 0.0156, |
|
"step": 7208 |
|
}, |
|
{ |
|
"epoch": 68.0, |
|
"eval_LOCATION_f1": 0.863013698630137, |
|
"eval_LOCATION_number": 69, |
|
"eval_LOCATION_precision": 0.8181818181818182, |
|
"eval_LOCATION_recall": 0.9130434782608695, |
|
"eval_ORGANIZATION_f1": 0.7580645161290323, |
|
"eval_ORGANIZATION_number": 58, |
|
"eval_ORGANIZATION_precision": 0.7121212121212122, |
|
"eval_ORGANIZATION_recall": 0.8103448275862069, |
|
"eval_PERSON_f1": 0.8853503184713376, |
|
"eval_PERSON_number": 152, |
|
"eval_PERSON_precision": 0.8580246913580247, |
|
"eval_PERSON_recall": 0.9144736842105263, |
|
"eval_QUANTITY_f1": 0.8064516129032259, |
|
"eval_QUANTITY_number": 30, |
|
"eval_QUANTITY_precision": 0.78125, |
|
"eval_QUANTITY_recall": 0.8333333333333334, |
|
"eval_TIME_f1": 0.8666666666666666, |
|
"eval_TIME_number": 29, |
|
"eval_TIME_precision": 0.8387096774193549, |
|
"eval_TIME_recall": 0.896551724137931, |
|
"eval_loss": 0.21977542340755463, |
|
"eval_overall_accuracy": 0.9623559539052496, |
|
"eval_overall_f1": 0.8498583569405098, |
|
"eval_overall_precision": 0.8152173913043478, |
|
"eval_overall_recall": 0.8875739644970414, |
|
"eval_runtime": 0.8618, |
|
"eval_samples_per_second": 216.978, |
|
"eval_steps_per_second": 3.481, |
|
"step": 7208 |
|
}, |
|
{ |
|
"epoch": 69.0, |
|
"grad_norm": 1.0344369411468506, |
|
"learning_rate": 1.55e-05, |
|
"loss": 0.0156, |
|
"step": 7314 |
|
}, |
|
{ |
|
"epoch": 69.0, |
|
"eval_LOCATION_f1": 0.8590604026845639, |
|
"eval_LOCATION_number": 69, |
|
"eval_LOCATION_precision": 0.8, |
|
"eval_LOCATION_recall": 0.927536231884058, |
|
"eval_ORGANIZATION_f1": 0.7175572519083969, |
|
"eval_ORGANIZATION_number": 58, |
|
"eval_ORGANIZATION_precision": 0.6438356164383562, |
|
"eval_ORGANIZATION_recall": 0.8103448275862069, |
|
"eval_PERSON_f1": 0.8903225806451613, |
|
"eval_PERSON_number": 152, |
|
"eval_PERSON_precision": 0.8734177215189873, |
|
"eval_PERSON_recall": 0.9078947368421053, |
|
"eval_QUANTITY_f1": 0.7936507936507938, |
|
"eval_QUANTITY_number": 30, |
|
"eval_QUANTITY_precision": 0.7575757575757576, |
|
"eval_QUANTITY_recall": 0.8333333333333334, |
|
"eval_TIME_f1": 0.847457627118644, |
|
"eval_TIME_number": 29, |
|
"eval_TIME_precision": 0.8333333333333334, |
|
"eval_TIME_recall": 0.8620689655172413, |
|
"eval_loss": 0.21617823839187622, |
|
"eval_overall_accuracy": 0.9615877080665813, |
|
"eval_overall_f1": 0.8398876404494382, |
|
"eval_overall_precision": 0.7994652406417112, |
|
"eval_overall_recall": 0.8846153846153846, |
|
"eval_runtime": 0.8721, |
|
"eval_samples_per_second": 214.436, |
|
"eval_steps_per_second": 3.44, |
|
"step": 7314 |
|
}, |
|
{ |
|
"epoch": 70.0, |
|
"grad_norm": 1.9640426635742188, |
|
"learning_rate": 1.5e-05, |
|
"loss": 0.0155, |
|
"step": 7420 |
|
}, |
|
{ |
|
"epoch": 70.0, |
|
"eval_LOCATION_f1": 0.8421052631578948, |
|
"eval_LOCATION_number": 69, |
|
"eval_LOCATION_precision": 0.7710843373493976, |
|
"eval_LOCATION_recall": 0.927536231884058, |
|
"eval_ORGANIZATION_f1": 0.7086614173228347, |
|
"eval_ORGANIZATION_number": 58, |
|
"eval_ORGANIZATION_precision": 0.6521739130434783, |
|
"eval_ORGANIZATION_recall": 0.7758620689655172, |
|
"eval_PERSON_f1": 0.8797468354430381, |
|
"eval_PERSON_number": 152, |
|
"eval_PERSON_precision": 0.8475609756097561, |
|
"eval_PERSON_recall": 0.9144736842105263, |
|
"eval_QUANTITY_f1": 0.78125, |
|
"eval_QUANTITY_number": 30, |
|
"eval_QUANTITY_precision": 0.7352941176470589, |
|
"eval_QUANTITY_recall": 0.8333333333333334, |
|
"eval_TIME_f1": 0.847457627118644, |
|
"eval_TIME_number": 29, |
|
"eval_TIME_precision": 0.8333333333333334, |
|
"eval_TIME_recall": 0.8620689655172413, |
|
"eval_loss": 0.22830812633037567, |
|
"eval_overall_accuracy": 0.9592829705505762, |
|
"eval_overall_f1": 0.83008356545961, |
|
"eval_overall_precision": 0.7842105263157895, |
|
"eval_overall_recall": 0.8816568047337278, |
|
"eval_runtime": 0.8737, |
|
"eval_samples_per_second": 214.022, |
|
"eval_steps_per_second": 3.434, |
|
"step": 7420 |
|
}, |
|
{ |
|
"epoch": 71.0, |
|
"grad_norm": 0.16448061168193817, |
|
"learning_rate": 1.45e-05, |
|
"loss": 0.0142, |
|
"step": 7526 |
|
}, |
|
{ |
|
"epoch": 71.0, |
|
"eval_LOCATION_f1": 0.8513513513513514, |
|
"eval_LOCATION_number": 69, |
|
"eval_LOCATION_precision": 0.7974683544303798, |
|
"eval_LOCATION_recall": 0.9130434782608695, |
|
"eval_ORGANIZATION_f1": 0.6911764705882352, |
|
"eval_ORGANIZATION_number": 58, |
|
"eval_ORGANIZATION_precision": 0.6025641025641025, |
|
"eval_ORGANIZATION_recall": 0.8103448275862069, |
|
"eval_PERSON_f1": 0.8782051282051281, |
|
"eval_PERSON_number": 152, |
|
"eval_PERSON_precision": 0.85625, |
|
"eval_PERSON_recall": 0.9013157894736842, |
|
"eval_QUANTITY_f1": 0.7936507936507938, |
|
"eval_QUANTITY_number": 30, |
|
"eval_QUANTITY_precision": 0.7575757575757576, |
|
"eval_QUANTITY_recall": 0.8333333333333334, |
|
"eval_TIME_f1": 0.8813559322033899, |
|
"eval_TIME_number": 29, |
|
"eval_TIME_precision": 0.8666666666666667, |
|
"eval_TIME_recall": 0.896551724137931, |
|
"eval_loss": 0.2332638055086136, |
|
"eval_overall_accuracy": 0.9590268886043534, |
|
"eval_overall_f1": 0.83008356545961, |
|
"eval_overall_precision": 0.7842105263157895, |
|
"eval_overall_recall": 0.8816568047337278, |
|
"eval_runtime": 0.8749, |
|
"eval_samples_per_second": 213.733, |
|
"eval_steps_per_second": 3.429, |
|
"step": 7526 |
|
}, |
|
{ |
|
"epoch": 72.0, |
|
"grad_norm": 0.25591084361076355, |
|
"learning_rate": 1.4000000000000001e-05, |
|
"loss": 0.0165, |
|
"step": 7632 |
|
}, |
|
{ |
|
"epoch": 72.0, |
|
"eval_LOCATION_f1": 0.863013698630137, |
|
"eval_LOCATION_number": 69, |
|
"eval_LOCATION_precision": 0.8181818181818182, |
|
"eval_LOCATION_recall": 0.9130434782608695, |
|
"eval_ORGANIZATION_f1": 0.7401574803149606, |
|
"eval_ORGANIZATION_number": 58, |
|
"eval_ORGANIZATION_precision": 0.6811594202898551, |
|
"eval_ORGANIZATION_recall": 0.8103448275862069, |
|
"eval_PERSON_f1": 0.8745980707395499, |
|
"eval_PERSON_number": 152, |
|
"eval_PERSON_precision": 0.8553459119496856, |
|
"eval_PERSON_recall": 0.8947368421052632, |
|
"eval_QUANTITY_f1": 0.8253968253968254, |
|
"eval_QUANTITY_number": 30, |
|
"eval_QUANTITY_precision": 0.7878787878787878, |
|
"eval_QUANTITY_recall": 0.8666666666666667, |
|
"eval_TIME_f1": 0.8666666666666666, |
|
"eval_TIME_number": 29, |
|
"eval_TIME_precision": 0.8387096774193549, |
|
"eval_TIME_recall": 0.896551724137931, |
|
"eval_loss": 0.2185453474521637, |
|
"eval_overall_accuracy": 0.9620998719590269, |
|
"eval_overall_f1": 0.8429985855728428, |
|
"eval_overall_precision": 0.8075880758807588, |
|
"eval_overall_recall": 0.8816568047337278, |
|
"eval_runtime": 0.8809, |
|
"eval_samples_per_second": 212.292, |
|
"eval_steps_per_second": 3.406, |
|
"step": 7632 |
|
}, |
|
{ |
|
"epoch": 73.0, |
|
"grad_norm": 0.047924935817718506, |
|
"learning_rate": 1.3500000000000001e-05, |
|
"loss": 0.0145, |
|
"step": 7738 |
|
}, |
|
{ |
|
"epoch": 73.0, |
|
"eval_LOCATION_f1": 0.8378378378378378, |
|
"eval_LOCATION_number": 69, |
|
"eval_LOCATION_precision": 0.7848101265822784, |
|
"eval_LOCATION_recall": 0.8985507246376812, |
|
"eval_ORGANIZATION_f1": 0.7258064516129032, |
|
"eval_ORGANIZATION_number": 58, |
|
"eval_ORGANIZATION_precision": 0.6818181818181818, |
|
"eval_ORGANIZATION_recall": 0.7758620689655172, |
|
"eval_PERSON_f1": 0.8774193548387097, |
|
"eval_PERSON_number": 152, |
|
"eval_PERSON_precision": 0.8607594936708861, |
|
"eval_PERSON_recall": 0.8947368421052632, |
|
"eval_QUANTITY_f1": 0.8253968253968254, |
|
"eval_QUANTITY_number": 30, |
|
"eval_QUANTITY_precision": 0.7878787878787878, |
|
"eval_QUANTITY_recall": 0.8666666666666667, |
|
"eval_TIME_f1": 0.847457627118644, |
|
"eval_TIME_number": 29, |
|
"eval_TIME_precision": 0.8333333333333334, |
|
"eval_TIME_recall": 0.8620689655172413, |
|
"eval_loss": 0.22260642051696777, |
|
"eval_overall_accuracy": 0.9605633802816902, |
|
"eval_overall_f1": 0.8352272727272727, |
|
"eval_overall_precision": 0.8032786885245902, |
|
"eval_overall_recall": 0.8698224852071006, |
|
"eval_runtime": 0.8798, |
|
"eval_samples_per_second": 212.544, |
|
"eval_steps_per_second": 3.41, |
|
"step": 7738 |
|
}, |
|
{ |
|
"epoch": 74.0, |
|
"grad_norm": 0.29497218132019043, |
|
"learning_rate": 1.3000000000000001e-05, |
|
"loss": 0.0135, |
|
"step": 7844 |
|
}, |
|
{ |
|
"epoch": 74.0, |
|
"eval_LOCATION_f1": 0.8571428571428572, |
|
"eval_LOCATION_number": 69, |
|
"eval_LOCATION_precision": 0.8076923076923077, |
|
"eval_LOCATION_recall": 0.9130434782608695, |
|
"eval_ORGANIZATION_f1": 0.688, |
|
"eval_ORGANIZATION_number": 58, |
|
"eval_ORGANIZATION_precision": 0.6417910447761194, |
|
"eval_ORGANIZATION_recall": 0.7413793103448276, |
|
"eval_PERSON_f1": 0.8810289389067525, |
|
"eval_PERSON_number": 152, |
|
"eval_PERSON_precision": 0.8616352201257862, |
|
"eval_PERSON_recall": 0.9013157894736842, |
|
"eval_QUANTITY_f1": 0.7936507936507938, |
|
"eval_QUANTITY_number": 30, |
|
"eval_QUANTITY_precision": 0.7575757575757576, |
|
"eval_QUANTITY_recall": 0.8333333333333334, |
|
"eval_TIME_f1": 0.8524590163934426, |
|
"eval_TIME_number": 29, |
|
"eval_TIME_precision": 0.8125, |
|
"eval_TIME_recall": 0.896551724137931, |
|
"eval_loss": 0.2320089489221573, |
|
"eval_overall_accuracy": 0.9595390524967989, |
|
"eval_overall_f1": 0.8316831683168318, |
|
"eval_overall_precision": 0.7967479674796748, |
|
"eval_overall_recall": 0.8698224852071006, |
|
"eval_runtime": 0.8782, |
|
"eval_samples_per_second": 212.931, |
|
"eval_steps_per_second": 3.416, |
|
"step": 7844 |
|
}, |
|
{ |
|
"epoch": 75.0, |
|
"grad_norm": 0.01762392371892929, |
|
"learning_rate": 1.25e-05, |
|
"loss": 0.0138, |
|
"step": 7950 |
|
}, |
|
{ |
|
"epoch": 75.0, |
|
"eval_LOCATION_f1": 0.8456375838926175, |
|
"eval_LOCATION_number": 69, |
|
"eval_LOCATION_precision": 0.7875, |
|
"eval_LOCATION_recall": 0.9130434782608695, |
|
"eval_ORGANIZATION_f1": 0.7286821705426356, |
|
"eval_ORGANIZATION_number": 58, |
|
"eval_ORGANIZATION_precision": 0.6619718309859155, |
|
"eval_ORGANIZATION_recall": 0.8103448275862069, |
|
"eval_PERSON_f1": 0.8789808917197451, |
|
"eval_PERSON_number": 152, |
|
"eval_PERSON_precision": 0.8518518518518519, |
|
"eval_PERSON_recall": 0.9078947368421053, |
|
"eval_QUANTITY_f1": 0.7936507936507938, |
|
"eval_QUANTITY_number": 30, |
|
"eval_QUANTITY_precision": 0.7575757575757576, |
|
"eval_QUANTITY_recall": 0.8333333333333334, |
|
"eval_TIME_f1": 0.8196721311475409, |
|
"eval_TIME_number": 29, |
|
"eval_TIME_precision": 0.78125, |
|
"eval_TIME_recall": 0.8620689655172413, |
|
"eval_loss": 0.2413773536682129, |
|
"eval_overall_accuracy": 0.9585147247119078, |
|
"eval_overall_f1": 0.8324022346368716, |
|
"eval_overall_precision": 0.7883597883597884, |
|
"eval_overall_recall": 0.8816568047337278, |
|
"eval_runtime": 0.883, |
|
"eval_samples_per_second": 211.783, |
|
"eval_steps_per_second": 3.398, |
|
"step": 7950 |
|
}, |
|
{ |
|
"epoch": 76.0, |
|
"grad_norm": 0.21732616424560547, |
|
"learning_rate": 1.2e-05, |
|
"loss": 0.0129, |
|
"step": 8056 |
|
}, |
|
{ |
|
"epoch": 76.0, |
|
"eval_LOCATION_f1": 0.863013698630137, |
|
"eval_LOCATION_number": 69, |
|
"eval_LOCATION_precision": 0.8181818181818182, |
|
"eval_LOCATION_recall": 0.9130434782608695, |
|
"eval_ORGANIZATION_f1": 0.7213114754098361, |
|
"eval_ORGANIZATION_number": 58, |
|
"eval_ORGANIZATION_precision": 0.6875, |
|
"eval_ORGANIZATION_recall": 0.7586206896551724, |
|
"eval_PERSON_f1": 0.8846153846153847, |
|
"eval_PERSON_number": 152, |
|
"eval_PERSON_precision": 0.8625, |
|
"eval_PERSON_recall": 0.9078947368421053, |
|
"eval_QUANTITY_f1": 0.8387096774193549, |
|
"eval_QUANTITY_number": 30, |
|
"eval_QUANTITY_precision": 0.8125, |
|
"eval_QUANTITY_recall": 0.8666666666666667, |
|
"eval_TIME_f1": 0.8813559322033899, |
|
"eval_TIME_number": 29, |
|
"eval_TIME_precision": 0.8666666666666667, |
|
"eval_TIME_recall": 0.896551724137931, |
|
"eval_loss": 0.22952446341514587, |
|
"eval_overall_accuracy": 0.9615877080665813, |
|
"eval_overall_f1": 0.8473609129814551, |
|
"eval_overall_precision": 0.8181818181818182, |
|
"eval_overall_recall": 0.878698224852071, |
|
"eval_runtime": 0.8794, |
|
"eval_samples_per_second": 212.653, |
|
"eval_steps_per_second": 3.412, |
|
"step": 8056 |
|
}, |
|
{ |
|
"epoch": 77.0, |
|
"grad_norm": 0.42748743295669556, |
|
"learning_rate": 1.1500000000000002e-05, |
|
"loss": 0.0118, |
|
"step": 8162 |
|
}, |
|
{ |
|
"epoch": 77.0, |
|
"eval_LOCATION_f1": 0.8322147651006713, |
|
"eval_LOCATION_number": 69, |
|
"eval_LOCATION_precision": 0.775, |
|
"eval_LOCATION_recall": 0.8985507246376812, |
|
"eval_ORGANIZATION_f1": 0.7301587301587301, |
|
"eval_ORGANIZATION_number": 58, |
|
"eval_ORGANIZATION_precision": 0.6764705882352942, |
|
"eval_ORGANIZATION_recall": 0.7931034482758621, |
|
"eval_PERSON_f1": 0.8734177215189874, |
|
"eval_PERSON_number": 152, |
|
"eval_PERSON_precision": 0.8414634146341463, |
|
"eval_PERSON_recall": 0.9078947368421053, |
|
"eval_QUANTITY_f1": 0.7936507936507938, |
|
"eval_QUANTITY_number": 30, |
|
"eval_QUANTITY_precision": 0.7575757575757576, |
|
"eval_QUANTITY_recall": 0.8333333333333334, |
|
"eval_TIME_f1": 0.8666666666666666, |
|
"eval_TIME_number": 29, |
|
"eval_TIME_precision": 0.8387096774193549, |
|
"eval_TIME_recall": 0.896551724137931, |
|
"eval_loss": 0.23922854661941528, |
|
"eval_overall_accuracy": 0.9595390524967989, |
|
"eval_overall_f1": 0.8319327731092437, |
|
"eval_overall_precision": 0.7898936170212766, |
|
"eval_overall_recall": 0.878698224852071, |
|
"eval_runtime": 0.8708, |
|
"eval_samples_per_second": 214.745, |
|
"eval_steps_per_second": 3.445, |
|
"step": 8162 |
|
}, |
|
{ |
|
"epoch": 78.0, |
|
"grad_norm": 0.6394297480583191, |
|
"learning_rate": 1.1000000000000001e-05, |
|
"loss": 0.0127, |
|
"step": 8268 |
|
}, |
|
{ |
|
"epoch": 78.0, |
|
"eval_LOCATION_f1": 0.8689655172413793, |
|
"eval_LOCATION_number": 69, |
|
"eval_LOCATION_precision": 0.8289473684210527, |
|
"eval_LOCATION_recall": 0.9130434782608695, |
|
"eval_ORGANIZATION_f1": 0.736, |
|
"eval_ORGANIZATION_number": 58, |
|
"eval_ORGANIZATION_precision": 0.6865671641791045, |
|
"eval_ORGANIZATION_recall": 0.7931034482758621, |
|
"eval_PERSON_f1": 0.8810289389067525, |
|
"eval_PERSON_number": 152, |
|
"eval_PERSON_precision": 0.8616352201257862, |
|
"eval_PERSON_recall": 0.9013157894736842, |
|
"eval_QUANTITY_f1": 0.7936507936507938, |
|
"eval_QUANTITY_number": 30, |
|
"eval_QUANTITY_precision": 0.7575757575757576, |
|
"eval_QUANTITY_recall": 0.8333333333333334, |
|
"eval_TIME_f1": 0.8620689655172413, |
|
"eval_TIME_number": 29, |
|
"eval_TIME_precision": 0.8620689655172413, |
|
"eval_TIME_recall": 0.8620689655172413, |
|
"eval_loss": 0.2345399558544159, |
|
"eval_overall_accuracy": 0.9615877080665813, |
|
"eval_overall_f1": 0.8433048433048432, |
|
"eval_overall_precision": 0.8131868131868132, |
|
"eval_overall_recall": 0.8757396449704142, |
|
"eval_runtime": 0.8826, |
|
"eval_samples_per_second": 211.871, |
|
"eval_steps_per_second": 3.399, |
|
"step": 8268 |
|
}, |
|
{ |
|
"epoch": 79.0, |
|
"grad_norm": 0.5575834512710571, |
|
"learning_rate": 1.05e-05, |
|
"loss": 0.0122, |
|
"step": 8374 |
|
}, |
|
{ |
|
"epoch": 79.0, |
|
"eval_LOCATION_f1": 0.8456375838926175, |
|
"eval_LOCATION_number": 69, |
|
"eval_LOCATION_precision": 0.7875, |
|
"eval_LOCATION_recall": 0.9130434782608695, |
|
"eval_ORGANIZATION_f1": 0.746031746031746, |
|
"eval_ORGANIZATION_number": 58, |
|
"eval_ORGANIZATION_precision": 0.6911764705882353, |
|
"eval_ORGANIZATION_recall": 0.8103448275862069, |
|
"eval_PERSON_f1": 0.8825396825396825, |
|
"eval_PERSON_number": 152, |
|
"eval_PERSON_precision": 0.852760736196319, |
|
"eval_PERSON_recall": 0.9144736842105263, |
|
"eval_QUANTITY_f1": 0.7936507936507938, |
|
"eval_QUANTITY_number": 30, |
|
"eval_QUANTITY_precision": 0.7575757575757576, |
|
"eval_QUANTITY_recall": 0.8333333333333334, |
|
"eval_TIME_f1": 0.8620689655172413, |
|
"eval_TIME_number": 29, |
|
"eval_TIME_precision": 0.8620689655172413, |
|
"eval_TIME_recall": 0.8620689655172413, |
|
"eval_loss": 0.24232904613018036, |
|
"eval_overall_accuracy": 0.9608194622279129, |
|
"eval_overall_f1": 0.8410689170182841, |
|
"eval_overall_precision": 0.8016085790884718, |
|
"eval_overall_recall": 0.8846153846153846, |
|
"eval_runtime": 0.8823, |
|
"eval_samples_per_second": 211.957, |
|
"eval_steps_per_second": 3.4, |
|
"step": 8374 |
|
}, |
|
{ |
|
"epoch": 80.0, |
|
"grad_norm": 0.14352549612522125, |
|
"learning_rate": 1e-05, |
|
"loss": 0.0117, |
|
"step": 8480 |
|
}, |
|
{ |
|
"epoch": 80.0, |
|
"eval_LOCATION_f1": 0.881118881118881, |
|
"eval_LOCATION_number": 69, |
|
"eval_LOCATION_precision": 0.8513513513513513, |
|
"eval_LOCATION_recall": 0.9130434782608695, |
|
"eval_ORGANIZATION_f1": 0.7317073170731708, |
|
"eval_ORGANIZATION_number": 58, |
|
"eval_ORGANIZATION_precision": 0.6923076923076923, |
|
"eval_ORGANIZATION_recall": 0.7758620689655172, |
|
"eval_PERSON_f1": 0.8782051282051281, |
|
"eval_PERSON_number": 152, |
|
"eval_PERSON_precision": 0.85625, |
|
"eval_PERSON_recall": 0.9013157894736842, |
|
"eval_QUANTITY_f1": 0.7936507936507938, |
|
"eval_QUANTITY_number": 30, |
|
"eval_QUANTITY_precision": 0.7575757575757576, |
|
"eval_QUANTITY_recall": 0.8333333333333334, |
|
"eval_TIME_f1": 0.8275862068965517, |
|
"eval_TIME_number": 29, |
|
"eval_TIME_precision": 0.8275862068965517, |
|
"eval_TIME_recall": 0.8275862068965517, |
|
"eval_loss": 0.22932307422161102, |
|
"eval_overall_accuracy": 0.9623559539052496, |
|
"eval_overall_f1": 0.8412017167381973, |
|
"eval_overall_precision": 0.814404432132964, |
|
"eval_overall_recall": 0.8698224852071006, |
|
"eval_runtime": 0.882, |
|
"eval_samples_per_second": 212.026, |
|
"eval_steps_per_second": 3.401, |
|
"step": 8480 |
|
}, |
|
{ |
|
"epoch": 81.0, |
|
"grad_norm": 0.47307726740837097, |
|
"learning_rate": 9.5e-06, |
|
"loss": 0.012, |
|
"step": 8586 |
|
}, |
|
{ |
|
"epoch": 81.0, |
|
"eval_LOCATION_f1": 0.8456375838926175, |
|
"eval_LOCATION_number": 69, |
|
"eval_LOCATION_precision": 0.7875, |
|
"eval_LOCATION_recall": 0.9130434782608695, |
|
"eval_ORGANIZATION_f1": 0.71875, |
|
"eval_ORGANIZATION_number": 58, |
|
"eval_ORGANIZATION_precision": 0.6571428571428571, |
|
"eval_ORGANIZATION_recall": 0.7931034482758621, |
|
"eval_PERSON_f1": 0.8881789137380192, |
|
"eval_PERSON_number": 152, |
|
"eval_PERSON_precision": 0.8633540372670807, |
|
"eval_PERSON_recall": 0.9144736842105263, |
|
"eval_QUANTITY_f1": 0.761904761904762, |
|
"eval_QUANTITY_number": 30, |
|
"eval_QUANTITY_precision": 0.7272727272727273, |
|
"eval_QUANTITY_recall": 0.8, |
|
"eval_TIME_f1": 0.8813559322033899, |
|
"eval_TIME_number": 29, |
|
"eval_TIME_precision": 0.8666666666666667, |
|
"eval_TIME_recall": 0.896551724137931, |
|
"eval_loss": 0.23925283551216125, |
|
"eval_overall_accuracy": 0.9600512163892445, |
|
"eval_overall_f1": 0.8370786516853933, |
|
"eval_overall_precision": 0.7967914438502673, |
|
"eval_overall_recall": 0.8816568047337278, |
|
"eval_runtime": 0.8824, |
|
"eval_samples_per_second": 211.922, |
|
"eval_steps_per_second": 3.4, |
|
"step": 8586 |
|
}, |
|
{ |
|
"epoch": 82.0, |
|
"grad_norm": 1.2593061923980713, |
|
"learning_rate": 9e-06, |
|
"loss": 0.013, |
|
"step": 8692 |
|
}, |
|
{ |
|
"epoch": 82.0, |
|
"eval_LOCATION_f1": 0.8456375838926175, |
|
"eval_LOCATION_number": 69, |
|
"eval_LOCATION_precision": 0.7875, |
|
"eval_LOCATION_recall": 0.9130434782608695, |
|
"eval_ORGANIZATION_f1": 0.7333333333333333, |
|
"eval_ORGANIZATION_number": 58, |
|
"eval_ORGANIZATION_precision": 0.7096774193548387, |
|
"eval_ORGANIZATION_recall": 0.7586206896551724, |
|
"eval_PERSON_f1": 0.8846153846153847, |
|
"eval_PERSON_number": 152, |
|
"eval_PERSON_precision": 0.8625, |
|
"eval_PERSON_recall": 0.9078947368421053, |
|
"eval_QUANTITY_f1": 0.7936507936507938, |
|
"eval_QUANTITY_number": 30, |
|
"eval_QUANTITY_precision": 0.7575757575757576, |
|
"eval_QUANTITY_recall": 0.8333333333333334, |
|
"eval_TIME_f1": 0.8620689655172413, |
|
"eval_TIME_number": 29, |
|
"eval_TIME_precision": 0.8620689655172413, |
|
"eval_TIME_recall": 0.8620689655172413, |
|
"eval_loss": 0.23163729906082153, |
|
"eval_overall_accuracy": 0.9608194622279129, |
|
"eval_overall_f1": 0.8404558404558404, |
|
"eval_overall_precision": 0.8104395604395604, |
|
"eval_overall_recall": 0.8727810650887574, |
|
"eval_runtime": 0.8706, |
|
"eval_samples_per_second": 214.791, |
|
"eval_steps_per_second": 3.446, |
|
"step": 8692 |
|
}, |
|
{ |
|
"epoch": 83.0, |
|
"grad_norm": 0.8594510555267334, |
|
"learning_rate": 8.500000000000002e-06, |
|
"loss": 0.0115, |
|
"step": 8798 |
|
}, |
|
{ |
|
"epoch": 83.0, |
|
"eval_LOCATION_f1": 0.8435374149659864, |
|
"eval_LOCATION_number": 69, |
|
"eval_LOCATION_precision": 0.7948717948717948, |
|
"eval_LOCATION_recall": 0.8985507246376812, |
|
"eval_ORGANIZATION_f1": 0.7096774193548386, |
|
"eval_ORGANIZATION_number": 58, |
|
"eval_ORGANIZATION_precision": 0.6666666666666666, |
|
"eval_ORGANIZATION_recall": 0.7586206896551724, |
|
"eval_PERSON_f1": 0.8874598070739551, |
|
"eval_PERSON_number": 152, |
|
"eval_PERSON_precision": 0.8679245283018868, |
|
"eval_PERSON_recall": 0.9078947368421053, |
|
"eval_QUANTITY_f1": 0.7936507936507938, |
|
"eval_QUANTITY_number": 30, |
|
"eval_QUANTITY_precision": 0.7575757575757576, |
|
"eval_QUANTITY_recall": 0.8333333333333334, |
|
"eval_TIME_f1": 0.8813559322033899, |
|
"eval_TIME_number": 29, |
|
"eval_TIME_precision": 0.8666666666666667, |
|
"eval_TIME_recall": 0.896551724137931, |
|
"eval_loss": 0.23205186426639557, |
|
"eval_overall_accuracy": 0.9605633802816902, |
|
"eval_overall_f1": 0.8380681818181818, |
|
"eval_overall_precision": 0.8060109289617486, |
|
"eval_overall_recall": 0.8727810650887574, |
|
"eval_runtime": 0.8704, |
|
"eval_samples_per_second": 214.832, |
|
"eval_steps_per_second": 3.447, |
|
"step": 8798 |
|
}, |
|
{ |
|
"epoch": 84.0, |
|
"grad_norm": 0.06097917631268501, |
|
"learning_rate": 8.000000000000001e-06, |
|
"loss": 0.0124, |
|
"step": 8904 |
|
}, |
|
{ |
|
"epoch": 84.0, |
|
"eval_LOCATION_f1": 0.8571428571428572, |
|
"eval_LOCATION_number": 69, |
|
"eval_LOCATION_precision": 0.8076923076923077, |
|
"eval_LOCATION_recall": 0.9130434782608695, |
|
"eval_ORGANIZATION_f1": 0.7107438016528926, |
|
"eval_ORGANIZATION_number": 58, |
|
"eval_ORGANIZATION_precision": 0.6825396825396826, |
|
"eval_ORGANIZATION_recall": 0.7413793103448276, |
|
"eval_PERSON_f1": 0.891025641025641, |
|
"eval_PERSON_number": 152, |
|
"eval_PERSON_precision": 0.86875, |
|
"eval_PERSON_recall": 0.9144736842105263, |
|
"eval_QUANTITY_f1": 0.7936507936507938, |
|
"eval_QUANTITY_number": 30, |
|
"eval_QUANTITY_precision": 0.7575757575757576, |
|
"eval_QUANTITY_recall": 0.8333333333333334, |
|
"eval_TIME_f1": 0.8813559322033899, |
|
"eval_TIME_number": 29, |
|
"eval_TIME_precision": 0.8666666666666667, |
|
"eval_TIME_recall": 0.896551724137931, |
|
"eval_loss": 0.23106266558170319, |
|
"eval_overall_accuracy": 0.9615877080665813, |
|
"eval_overall_f1": 0.8433048433048432, |
|
"eval_overall_precision": 0.8131868131868132, |
|
"eval_overall_recall": 0.8757396449704142, |
|
"eval_runtime": 0.8817, |
|
"eval_samples_per_second": 212.094, |
|
"eval_steps_per_second": 3.403, |
|
"step": 8904 |
|
}, |
|
{ |
|
"epoch": 85.0, |
|
"grad_norm": 0.0979015976190567, |
|
"learning_rate": 7.5e-06, |
|
"loss": 0.0118, |
|
"step": 9010 |
|
}, |
|
{ |
|
"epoch": 85.0, |
|
"eval_LOCATION_f1": 0.8456375838926175, |
|
"eval_LOCATION_number": 69, |
|
"eval_LOCATION_precision": 0.7875, |
|
"eval_LOCATION_recall": 0.9130434782608695, |
|
"eval_ORGANIZATION_f1": 0.7096774193548386, |
|
"eval_ORGANIZATION_number": 58, |
|
"eval_ORGANIZATION_precision": 0.6666666666666666, |
|
"eval_ORGANIZATION_recall": 0.7586206896551724, |
|
"eval_PERSON_f1": 0.8810289389067525, |
|
"eval_PERSON_number": 152, |
|
"eval_PERSON_precision": 0.8616352201257862, |
|
"eval_PERSON_recall": 0.9013157894736842, |
|
"eval_QUANTITY_f1": 0.7936507936507938, |
|
"eval_QUANTITY_number": 30, |
|
"eval_QUANTITY_precision": 0.7575757575757576, |
|
"eval_QUANTITY_recall": 0.8333333333333334, |
|
"eval_TIME_f1": 0.847457627118644, |
|
"eval_TIME_number": 29, |
|
"eval_TIME_precision": 0.8333333333333334, |
|
"eval_TIME_recall": 0.8620689655172413, |
|
"eval_loss": 0.24057278037071228, |
|
"eval_overall_accuracy": 0.9603072983354674, |
|
"eval_overall_f1": 0.8328611898016997, |
|
"eval_overall_precision": 0.7989130434782609, |
|
"eval_overall_recall": 0.8698224852071006, |
|
"eval_runtime": 0.9001, |
|
"eval_samples_per_second": 207.748, |
|
"eval_steps_per_second": 3.333, |
|
"step": 9010 |
|
}, |
|
{ |
|
"epoch": 86.0, |
|
"grad_norm": 2.0524749755859375, |
|
"learning_rate": 7.000000000000001e-06, |
|
"loss": 0.0115, |
|
"step": 9116 |
|
}, |
|
{ |
|
"epoch": 86.0, |
|
"eval_LOCATION_f1": 0.8456375838926175, |
|
"eval_LOCATION_number": 69, |
|
"eval_LOCATION_precision": 0.7875, |
|
"eval_LOCATION_recall": 0.9130434782608695, |
|
"eval_ORGANIZATION_f1": 0.7317073170731708, |
|
"eval_ORGANIZATION_number": 58, |
|
"eval_ORGANIZATION_precision": 0.6923076923076923, |
|
"eval_ORGANIZATION_recall": 0.7758620689655172, |
|
"eval_PERSON_f1": 0.8817891373801917, |
|
"eval_PERSON_number": 152, |
|
"eval_PERSON_precision": 0.8571428571428571, |
|
"eval_PERSON_recall": 0.9078947368421053, |
|
"eval_QUANTITY_f1": 0.7936507936507938, |
|
"eval_QUANTITY_number": 30, |
|
"eval_QUANTITY_precision": 0.7575757575757576, |
|
"eval_QUANTITY_recall": 0.8333333333333334, |
|
"eval_TIME_f1": 0.847457627118644, |
|
"eval_TIME_number": 29, |
|
"eval_TIME_precision": 0.8333333333333334, |
|
"eval_TIME_recall": 0.8620689655172413, |
|
"eval_loss": 0.23790757358074188, |
|
"eval_overall_accuracy": 0.9610755441741358, |
|
"eval_overall_f1": 0.8373408769448374, |
|
"eval_overall_precision": 0.8021680216802168, |
|
"eval_overall_recall": 0.8757396449704142, |
|
"eval_runtime": 0.8768, |
|
"eval_samples_per_second": 213.284, |
|
"eval_steps_per_second": 3.422, |
|
"step": 9116 |
|
}, |
|
{ |
|
"epoch": 87.0, |
|
"grad_norm": 0.27762410044670105, |
|
"learning_rate": 6.5000000000000004e-06, |
|
"loss": 0.0116, |
|
"step": 9222 |
|
}, |
|
{ |
|
"epoch": 87.0, |
|
"eval_LOCATION_f1": 0.8513513513513514, |
|
"eval_LOCATION_number": 69, |
|
"eval_LOCATION_precision": 0.7974683544303798, |
|
"eval_LOCATION_recall": 0.9130434782608695, |
|
"eval_ORGANIZATION_f1": 0.7419354838709677, |
|
"eval_ORGANIZATION_number": 58, |
|
"eval_ORGANIZATION_precision": 0.696969696969697, |
|
"eval_ORGANIZATION_recall": 0.7931034482758621, |
|
"eval_PERSON_f1": 0.8846153846153847, |
|
"eval_PERSON_number": 152, |
|
"eval_PERSON_precision": 0.8625, |
|
"eval_PERSON_recall": 0.9078947368421053, |
|
"eval_QUANTITY_f1": 0.8064516129032259, |
|
"eval_QUANTITY_number": 30, |
|
"eval_QUANTITY_precision": 0.78125, |
|
"eval_QUANTITY_recall": 0.8333333333333334, |
|
"eval_TIME_f1": 0.8813559322033899, |
|
"eval_TIME_number": 29, |
|
"eval_TIME_precision": 0.8666666666666667, |
|
"eval_TIME_recall": 0.896551724137931, |
|
"eval_loss": 0.23644272983074188, |
|
"eval_overall_accuracy": 0.9623559539052496, |
|
"eval_overall_f1": 0.8453900709219858, |
|
"eval_overall_precision": 0.8119891008174387, |
|
"eval_overall_recall": 0.8816568047337278, |
|
"eval_runtime": 0.8829, |
|
"eval_samples_per_second": 211.807, |
|
"eval_steps_per_second": 3.398, |
|
"step": 9222 |
|
}, |
|
{ |
|
"epoch": 88.0, |
|
"grad_norm": 0.8406667709350586, |
|
"learning_rate": 6e-06, |
|
"loss": 0.0107, |
|
"step": 9328 |
|
}, |
|
{ |
|
"epoch": 88.0, |
|
"eval_LOCATION_f1": 0.8551724137931034, |
|
"eval_LOCATION_number": 69, |
|
"eval_LOCATION_precision": 0.8157894736842105, |
|
"eval_LOCATION_recall": 0.8985507246376812, |
|
"eval_ORGANIZATION_f1": 0.7272727272727273, |
|
"eval_ORGANIZATION_number": 58, |
|
"eval_ORGANIZATION_precision": 0.6984126984126984, |
|
"eval_ORGANIZATION_recall": 0.7586206896551724, |
|
"eval_PERSON_f1": 0.8810289389067525, |
|
"eval_PERSON_number": 152, |
|
"eval_PERSON_precision": 0.8616352201257862, |
|
"eval_PERSON_recall": 0.9013157894736842, |
|
"eval_QUANTITY_f1": 0.7936507936507938, |
|
"eval_QUANTITY_number": 30, |
|
"eval_QUANTITY_precision": 0.7575757575757576, |
|
"eval_QUANTITY_recall": 0.8333333333333334, |
|
"eval_TIME_f1": 0.8813559322033899, |
|
"eval_TIME_number": 29, |
|
"eval_TIME_precision": 0.8666666666666667, |
|
"eval_TIME_recall": 0.896551724137931, |
|
"eval_loss": 0.2356145679950714, |
|
"eval_overall_accuracy": 0.9618437900128041, |
|
"eval_overall_f1": 0.8412017167381973, |
|
"eval_overall_precision": 0.814404432132964, |
|
"eval_overall_recall": 0.8698224852071006, |
|
"eval_runtime": 0.8796, |
|
"eval_samples_per_second": 212.593, |
|
"eval_steps_per_second": 3.411, |
|
"step": 9328 |
|
}, |
|
{ |
|
"epoch": 89.0, |
|
"grad_norm": 0.5086352825164795, |
|
"learning_rate": 5.500000000000001e-06, |
|
"loss": 0.0099, |
|
"step": 9434 |
|
}, |
|
{ |
|
"epoch": 89.0, |
|
"eval_LOCATION_f1": 0.8456375838926175, |
|
"eval_LOCATION_number": 69, |
|
"eval_LOCATION_precision": 0.7875, |
|
"eval_LOCATION_recall": 0.9130434782608695, |
|
"eval_ORGANIZATION_f1": 0.7258064516129032, |
|
"eval_ORGANIZATION_number": 58, |
|
"eval_ORGANIZATION_precision": 0.6818181818181818, |
|
"eval_ORGANIZATION_recall": 0.7758620689655172, |
|
"eval_PERSON_f1": 0.8874598070739551, |
|
"eval_PERSON_number": 152, |
|
"eval_PERSON_precision": 0.8679245283018868, |
|
"eval_PERSON_recall": 0.9078947368421053, |
|
"eval_QUANTITY_f1": 0.7936507936507938, |
|
"eval_QUANTITY_number": 30, |
|
"eval_QUANTITY_precision": 0.7575757575757576, |
|
"eval_QUANTITY_recall": 0.8333333333333334, |
|
"eval_TIME_f1": 0.8813559322033899, |
|
"eval_TIME_number": 29, |
|
"eval_TIME_precision": 0.8666666666666667, |
|
"eval_TIME_recall": 0.896551724137931, |
|
"eval_loss": 0.2441495656967163, |
|
"eval_overall_accuracy": 0.9610755441741358, |
|
"eval_overall_f1": 0.8413597733711048, |
|
"eval_overall_precision": 0.8070652173913043, |
|
"eval_overall_recall": 0.878698224852071, |
|
"eval_runtime": 0.8816, |
|
"eval_samples_per_second": 212.126, |
|
"eval_steps_per_second": 3.403, |
|
"step": 9434 |
|
}, |
|
{ |
|
"epoch": 90.0, |
|
"grad_norm": 0.11222498118877411, |
|
"learning_rate": 5e-06, |
|
"loss": 0.0116, |
|
"step": 9540 |
|
}, |
|
{ |
|
"epoch": 90.0, |
|
"eval_LOCATION_f1": 0.8648648648648648, |
|
"eval_LOCATION_number": 69, |
|
"eval_LOCATION_precision": 0.810126582278481, |
|
"eval_LOCATION_recall": 0.927536231884058, |
|
"eval_ORGANIZATION_f1": 0.7301587301587301, |
|
"eval_ORGANIZATION_number": 58, |
|
"eval_ORGANIZATION_precision": 0.6764705882352942, |
|
"eval_ORGANIZATION_recall": 0.7931034482758621, |
|
"eval_PERSON_f1": 0.8846153846153847, |
|
"eval_PERSON_number": 152, |
|
"eval_PERSON_precision": 0.8625, |
|
"eval_PERSON_recall": 0.9078947368421053, |
|
"eval_QUANTITY_f1": 0.8064516129032259, |
|
"eval_QUANTITY_number": 30, |
|
"eval_QUANTITY_precision": 0.78125, |
|
"eval_QUANTITY_recall": 0.8333333333333334, |
|
"eval_TIME_f1": 0.896551724137931, |
|
"eval_TIME_number": 29, |
|
"eval_TIME_precision": 0.896551724137931, |
|
"eval_TIME_recall": 0.896551724137931, |
|
"eval_loss": 0.24032947421073914, |
|
"eval_overall_accuracy": 0.9618437900128041, |
|
"eval_overall_f1": 0.8470254957507082, |
|
"eval_overall_precision": 0.8125, |
|
"eval_overall_recall": 0.8846153846153846, |
|
"eval_runtime": 0.8666, |
|
"eval_samples_per_second": 215.798, |
|
"eval_steps_per_second": 3.462, |
|
"step": 9540 |
|
}, |
|
{ |
|
"epoch": 91.0, |
|
"grad_norm": 1.0016977787017822, |
|
"learning_rate": 4.5e-06, |
|
"loss": 0.0101, |
|
"step": 9646 |
|
}, |
|
{ |
|
"epoch": 91.0, |
|
"eval_LOCATION_f1": 0.863013698630137, |
|
"eval_LOCATION_number": 69, |
|
"eval_LOCATION_precision": 0.8181818181818182, |
|
"eval_LOCATION_recall": 0.9130434782608695, |
|
"eval_ORGANIZATION_f1": 0.736, |
|
"eval_ORGANIZATION_number": 58, |
|
"eval_ORGANIZATION_precision": 0.6865671641791045, |
|
"eval_ORGANIZATION_recall": 0.7931034482758621, |
|
"eval_PERSON_f1": 0.891025641025641, |
|
"eval_PERSON_number": 152, |
|
"eval_PERSON_precision": 0.86875, |
|
"eval_PERSON_recall": 0.9144736842105263, |
|
"eval_QUANTITY_f1": 0.7936507936507938, |
|
"eval_QUANTITY_number": 30, |
|
"eval_QUANTITY_precision": 0.7575757575757576, |
|
"eval_QUANTITY_recall": 0.8333333333333334, |
|
"eval_TIME_f1": 0.8813559322033899, |
|
"eval_TIME_number": 29, |
|
"eval_TIME_precision": 0.8666666666666667, |
|
"eval_TIME_recall": 0.896551724137931, |
|
"eval_loss": 0.24104949831962585, |
|
"eval_overall_accuracy": 0.9623559539052496, |
|
"eval_overall_f1": 0.84822695035461, |
|
"eval_overall_precision": 0.8147138964577657, |
|
"eval_overall_recall": 0.8846153846153846, |
|
"eval_runtime": 0.8925, |
|
"eval_samples_per_second": 209.524, |
|
"eval_steps_per_second": 3.361, |
|
"step": 9646 |
|
}, |
|
{ |
|
"epoch": 92.0, |
|
"grad_norm": 0.5980203151702881, |
|
"learning_rate": 4.000000000000001e-06, |
|
"loss": 0.0104, |
|
"step": 9752 |
|
}, |
|
{ |
|
"epoch": 92.0, |
|
"eval_LOCATION_f1": 0.8378378378378378, |
|
"eval_LOCATION_number": 69, |
|
"eval_LOCATION_precision": 0.7848101265822784, |
|
"eval_LOCATION_recall": 0.8985507246376812, |
|
"eval_ORGANIZATION_f1": 0.7377049180327868, |
|
"eval_ORGANIZATION_number": 58, |
|
"eval_ORGANIZATION_precision": 0.703125, |
|
"eval_ORGANIZATION_recall": 0.7758620689655172, |
|
"eval_PERSON_f1": 0.891025641025641, |
|
"eval_PERSON_number": 152, |
|
"eval_PERSON_precision": 0.86875, |
|
"eval_PERSON_recall": 0.9144736842105263, |
|
"eval_QUANTITY_f1": 0.7936507936507938, |
|
"eval_QUANTITY_number": 30, |
|
"eval_QUANTITY_precision": 0.7575757575757576, |
|
"eval_QUANTITY_recall": 0.8333333333333334, |
|
"eval_TIME_f1": 0.8620689655172413, |
|
"eval_TIME_number": 29, |
|
"eval_TIME_precision": 0.8620689655172413, |
|
"eval_TIME_recall": 0.8620689655172413, |
|
"eval_loss": 0.2380075305700302, |
|
"eval_overall_accuracy": 0.9615877080665813, |
|
"eval_overall_f1": 0.8421052631578948, |
|
"eval_overall_precision": 0.810958904109589, |
|
"eval_overall_recall": 0.8757396449704142, |
|
"eval_runtime": 0.9541, |
|
"eval_samples_per_second": 195.995, |
|
"eval_steps_per_second": 3.144, |
|
"step": 9752 |
|
}, |
|
{ |
|
"epoch": 93.0, |
|
"grad_norm": 0.1031588539481163, |
|
"learning_rate": 3.5000000000000004e-06, |
|
"loss": 0.0113, |
|
"step": 9858 |
|
}, |
|
{ |
|
"epoch": 93.0, |
|
"eval_LOCATION_f1": 0.8551724137931034, |
|
"eval_LOCATION_number": 69, |
|
"eval_LOCATION_precision": 0.8157894736842105, |
|
"eval_LOCATION_recall": 0.8985507246376812, |
|
"eval_ORGANIZATION_f1": 0.7301587301587301, |
|
"eval_ORGANIZATION_number": 58, |
|
"eval_ORGANIZATION_precision": 0.6764705882352942, |
|
"eval_ORGANIZATION_recall": 0.7931034482758621, |
|
"eval_PERSON_f1": 0.8846153846153847, |
|
"eval_PERSON_number": 152, |
|
"eval_PERSON_precision": 0.8625, |
|
"eval_PERSON_recall": 0.9078947368421053, |
|
"eval_QUANTITY_f1": 0.7936507936507938, |
|
"eval_QUANTITY_number": 30, |
|
"eval_QUANTITY_precision": 0.7575757575757576, |
|
"eval_QUANTITY_recall": 0.8333333333333334, |
|
"eval_TIME_f1": 0.8620689655172413, |
|
"eval_TIME_number": 29, |
|
"eval_TIME_precision": 0.8620689655172413, |
|
"eval_TIME_recall": 0.8620689655172413, |
|
"eval_loss": 0.23934581875801086, |
|
"eval_overall_accuracy": 0.9613316261203585, |
|
"eval_overall_f1": 0.8409090909090909, |
|
"eval_overall_precision": 0.8087431693989071, |
|
"eval_overall_recall": 0.8757396449704142, |
|
"eval_runtime": 0.9053, |
|
"eval_samples_per_second": 206.559, |
|
"eval_steps_per_second": 3.314, |
|
"step": 9858 |
|
}, |
|
{ |
|
"epoch": 94.0, |
|
"grad_norm": 1.1558283567428589, |
|
"learning_rate": 3e-06, |
|
"loss": 0.0104, |
|
"step": 9964 |
|
}, |
|
{ |
|
"epoch": 94.0, |
|
"eval_LOCATION_f1": 0.863013698630137, |
|
"eval_LOCATION_number": 69, |
|
"eval_LOCATION_precision": 0.8181818181818182, |
|
"eval_LOCATION_recall": 0.9130434782608695, |
|
"eval_ORGANIZATION_f1": 0.7258064516129032, |
|
"eval_ORGANIZATION_number": 58, |
|
"eval_ORGANIZATION_precision": 0.6818181818181818, |
|
"eval_ORGANIZATION_recall": 0.7758620689655172, |
|
"eval_PERSON_f1": 0.8846153846153847, |
|
"eval_PERSON_number": 152, |
|
"eval_PERSON_precision": 0.8625, |
|
"eval_PERSON_recall": 0.9078947368421053, |
|
"eval_QUANTITY_f1": 0.7936507936507938, |
|
"eval_QUANTITY_number": 30, |
|
"eval_QUANTITY_precision": 0.7575757575757576, |
|
"eval_QUANTITY_recall": 0.8333333333333334, |
|
"eval_TIME_f1": 0.8620689655172413, |
|
"eval_TIME_number": 29, |
|
"eval_TIME_precision": 0.8620689655172413, |
|
"eval_TIME_recall": 0.8620689655172413, |
|
"eval_loss": 0.2401016503572464, |
|
"eval_overall_accuracy": 0.9620998719590269, |
|
"eval_overall_f1": 0.8421052631578948, |
|
"eval_overall_precision": 0.810958904109589, |
|
"eval_overall_recall": 0.8757396449704142, |
|
"eval_runtime": 0.8815, |
|
"eval_samples_per_second": 212.144, |
|
"eval_steps_per_second": 3.403, |
|
"step": 9964 |
|
}, |
|
{ |
|
"epoch": 95.0, |
|
"grad_norm": 1.1983808279037476, |
|
"learning_rate": 2.5e-06, |
|
"loss": 0.0108, |
|
"step": 10070 |
|
}, |
|
{ |
|
"epoch": 95.0, |
|
"eval_LOCATION_f1": 0.8493150684931507, |
|
"eval_LOCATION_number": 69, |
|
"eval_LOCATION_precision": 0.8051948051948052, |
|
"eval_LOCATION_recall": 0.8985507246376812, |
|
"eval_ORGANIZATION_f1": 0.746031746031746, |
|
"eval_ORGANIZATION_number": 58, |
|
"eval_ORGANIZATION_precision": 0.6911764705882353, |
|
"eval_ORGANIZATION_recall": 0.8103448275862069, |
|
"eval_PERSON_f1": 0.8846153846153847, |
|
"eval_PERSON_number": 152, |
|
"eval_PERSON_precision": 0.8625, |
|
"eval_PERSON_recall": 0.9078947368421053, |
|
"eval_QUANTITY_f1": 0.7936507936507938, |
|
"eval_QUANTITY_number": 30, |
|
"eval_QUANTITY_precision": 0.7575757575757576, |
|
"eval_QUANTITY_recall": 0.8333333333333334, |
|
"eval_TIME_f1": 0.8620689655172413, |
|
"eval_TIME_number": 29, |
|
"eval_TIME_precision": 0.8620689655172413, |
|
"eval_TIME_recall": 0.8620689655172413, |
|
"eval_loss": 0.2409784197807312, |
|
"eval_overall_accuracy": 0.9618437900128041, |
|
"eval_overall_f1": 0.8425531914893617, |
|
"eval_overall_precision": 0.8092643051771117, |
|
"eval_overall_recall": 0.878698224852071, |
|
"eval_runtime": 0.8891, |
|
"eval_samples_per_second": 210.332, |
|
"eval_steps_per_second": 3.374, |
|
"step": 10070 |
|
}, |
|
{ |
|
"epoch": 96.0, |
|
"grad_norm": 1.2160520553588867, |
|
"learning_rate": 2.0000000000000003e-06, |
|
"loss": 0.0102, |
|
"step": 10176 |
|
}, |
|
{ |
|
"epoch": 96.0, |
|
"eval_LOCATION_f1": 0.8513513513513514, |
|
"eval_LOCATION_number": 69, |
|
"eval_LOCATION_precision": 0.7974683544303798, |
|
"eval_LOCATION_recall": 0.9130434782608695, |
|
"eval_ORGANIZATION_f1": 0.7200000000000001, |
|
"eval_ORGANIZATION_number": 58, |
|
"eval_ORGANIZATION_precision": 0.6716417910447762, |
|
"eval_ORGANIZATION_recall": 0.7758620689655172, |
|
"eval_PERSON_f1": 0.8853503184713376, |
|
"eval_PERSON_number": 152, |
|
"eval_PERSON_precision": 0.8580246913580247, |
|
"eval_PERSON_recall": 0.9144736842105263, |
|
"eval_QUANTITY_f1": 0.7936507936507938, |
|
"eval_QUANTITY_number": 30, |
|
"eval_QUANTITY_precision": 0.7575757575757576, |
|
"eval_QUANTITY_recall": 0.8333333333333334, |
|
"eval_TIME_f1": 0.8813559322033899, |
|
"eval_TIME_number": 29, |
|
"eval_TIME_precision": 0.8666666666666667, |
|
"eval_TIME_recall": 0.896551724137931, |
|
"eval_loss": 0.2440604716539383, |
|
"eval_overall_accuracy": 0.9613316261203585, |
|
"eval_overall_f1": 0.840620592383639, |
|
"eval_overall_precision": 0.8032345013477089, |
|
"eval_overall_recall": 0.8816568047337278, |
|
"eval_runtime": 0.9399, |
|
"eval_samples_per_second": 198.966, |
|
"eval_steps_per_second": 3.192, |
|
"step": 10176 |
|
}, |
|
{ |
|
"epoch": 97.0, |
|
"grad_norm": 1.8695564270019531, |
|
"learning_rate": 1.5e-06, |
|
"loss": 0.0099, |
|
"step": 10282 |
|
}, |
|
{ |
|
"epoch": 97.0, |
|
"eval_LOCATION_f1": 0.8571428571428572, |
|
"eval_LOCATION_number": 69, |
|
"eval_LOCATION_precision": 0.8076923076923077, |
|
"eval_LOCATION_recall": 0.9130434782608695, |
|
"eval_ORGANIZATION_f1": 0.7258064516129032, |
|
"eval_ORGANIZATION_number": 58, |
|
"eval_ORGANIZATION_precision": 0.6818181818181818, |
|
"eval_ORGANIZATION_recall": 0.7758620689655172, |
|
"eval_PERSON_f1": 0.891025641025641, |
|
"eval_PERSON_number": 152, |
|
"eval_PERSON_precision": 0.86875, |
|
"eval_PERSON_recall": 0.9144736842105263, |
|
"eval_QUANTITY_f1": 0.7936507936507938, |
|
"eval_QUANTITY_number": 30, |
|
"eval_QUANTITY_precision": 0.7575757575757576, |
|
"eval_QUANTITY_recall": 0.8333333333333334, |
|
"eval_TIME_f1": 0.8813559322033899, |
|
"eval_TIME_number": 29, |
|
"eval_TIME_precision": 0.8666666666666667, |
|
"eval_TIME_recall": 0.896551724137931, |
|
"eval_loss": 0.24207578599452972, |
|
"eval_overall_accuracy": 0.9615877080665813, |
|
"eval_overall_f1": 0.8453900709219858, |
|
"eval_overall_precision": 0.8119891008174387, |
|
"eval_overall_recall": 0.8816568047337278, |
|
"eval_runtime": 0.8801, |
|
"eval_samples_per_second": 212.469, |
|
"eval_steps_per_second": 3.409, |
|
"step": 10282 |
|
}, |
|
{ |
|
"epoch": 98.0, |
|
"grad_norm": 0.15321999788284302, |
|
"learning_rate": 1.0000000000000002e-06, |
|
"loss": 0.009, |
|
"step": 10388 |
|
}, |
|
{ |
|
"epoch": 98.0, |
|
"eval_LOCATION_f1": 0.863013698630137, |
|
"eval_LOCATION_number": 69, |
|
"eval_LOCATION_precision": 0.8181818181818182, |
|
"eval_LOCATION_recall": 0.9130434782608695, |
|
"eval_ORGANIZATION_f1": 0.7301587301587301, |
|
"eval_ORGANIZATION_number": 58, |
|
"eval_ORGANIZATION_precision": 0.6764705882352942, |
|
"eval_ORGANIZATION_recall": 0.7931034482758621, |
|
"eval_PERSON_f1": 0.891025641025641, |
|
"eval_PERSON_number": 152, |
|
"eval_PERSON_precision": 0.86875, |
|
"eval_PERSON_recall": 0.9144736842105263, |
|
"eval_QUANTITY_f1": 0.7936507936507938, |
|
"eval_QUANTITY_number": 30, |
|
"eval_QUANTITY_precision": 0.7575757575757576, |
|
"eval_QUANTITY_recall": 0.8333333333333334, |
|
"eval_TIME_f1": 0.8620689655172413, |
|
"eval_TIME_number": 29, |
|
"eval_TIME_precision": 0.8620689655172413, |
|
"eval_TIME_recall": 0.8620689655172413, |
|
"eval_loss": 0.24271713197231293, |
|
"eval_overall_accuracy": 0.9620998719590269, |
|
"eval_overall_f1": 0.8453900709219858, |
|
"eval_overall_precision": 0.8119891008174387, |
|
"eval_overall_recall": 0.8816568047337278, |
|
"eval_runtime": 0.8771, |
|
"eval_samples_per_second": 213.205, |
|
"eval_steps_per_second": 3.42, |
|
"step": 10388 |
|
}, |
|
{ |
|
"epoch": 99.0, |
|
"grad_norm": 0.49585482478141785, |
|
"learning_rate": 5.000000000000001e-07, |
|
"loss": 0.0096, |
|
"step": 10494 |
|
}, |
|
{ |
|
"epoch": 99.0, |
|
"eval_LOCATION_f1": 0.8513513513513514, |
|
"eval_LOCATION_number": 69, |
|
"eval_LOCATION_precision": 0.7974683544303798, |
|
"eval_LOCATION_recall": 0.9130434782608695, |
|
"eval_ORGANIZATION_f1": 0.7096774193548386, |
|
"eval_ORGANIZATION_number": 58, |
|
"eval_ORGANIZATION_precision": 0.6666666666666666, |
|
"eval_ORGANIZATION_recall": 0.7586206896551724, |
|
"eval_PERSON_f1": 0.891025641025641, |
|
"eval_PERSON_number": 152, |
|
"eval_PERSON_precision": 0.86875, |
|
"eval_PERSON_recall": 0.9144736842105263, |
|
"eval_QUANTITY_f1": 0.7936507936507938, |
|
"eval_QUANTITY_number": 30, |
|
"eval_QUANTITY_precision": 0.7575757575757576, |
|
"eval_QUANTITY_recall": 0.8333333333333334, |
|
"eval_TIME_f1": 0.8813559322033899, |
|
"eval_TIME_number": 29, |
|
"eval_TIME_precision": 0.8666666666666667, |
|
"eval_TIME_recall": 0.896551724137931, |
|
"eval_loss": 0.24335408210754395, |
|
"eval_overall_accuracy": 0.9613316261203585, |
|
"eval_overall_f1": 0.8413597733711048, |
|
"eval_overall_precision": 0.8070652173913043, |
|
"eval_overall_recall": 0.878698224852071, |
|
"eval_runtime": 0.8907, |
|
"eval_samples_per_second": 209.939, |
|
"eval_steps_per_second": 3.368, |
|
"step": 10494 |
|
}, |
|
{ |
|
"epoch": 100.0, |
|
"grad_norm": 0.202548086643219, |
|
"learning_rate": 0.0, |
|
"loss": 0.0099, |
|
"step": 10600 |
|
}, |
|
{ |
|
"epoch": 100.0, |
|
"eval_LOCATION_f1": 0.8513513513513514, |
|
"eval_LOCATION_number": 69, |
|
"eval_LOCATION_precision": 0.7974683544303798, |
|
"eval_LOCATION_recall": 0.9130434782608695, |
|
"eval_ORGANIZATION_f1": 0.7096774193548386, |
|
"eval_ORGANIZATION_number": 58, |
|
"eval_ORGANIZATION_precision": 0.6666666666666666, |
|
"eval_ORGANIZATION_recall": 0.7586206896551724, |
|
"eval_PERSON_f1": 0.8846153846153847, |
|
"eval_PERSON_number": 152, |
|
"eval_PERSON_precision": 0.8625, |
|
"eval_PERSON_recall": 0.9078947368421053, |
|
"eval_QUANTITY_f1": 0.7936507936507938, |
|
"eval_QUANTITY_number": 30, |
|
"eval_QUANTITY_precision": 0.7575757575757576, |
|
"eval_QUANTITY_recall": 0.8333333333333334, |
|
"eval_TIME_f1": 0.8813559322033899, |
|
"eval_TIME_number": 29, |
|
"eval_TIME_precision": 0.8666666666666667, |
|
"eval_TIME_recall": 0.896551724137931, |
|
"eval_loss": 0.24319376051425934, |
|
"eval_overall_accuracy": 0.9610755441741358, |
|
"eval_overall_f1": 0.8385269121813032, |
|
"eval_overall_precision": 0.8043478260869565, |
|
"eval_overall_recall": 0.8757396449704142, |
|
"eval_runtime": 0.8912, |
|
"eval_samples_per_second": 209.818, |
|
"eval_steps_per_second": 3.366, |
|
"step": 10600 |
|
}, |
|
{ |
|
"epoch": 100.0, |
|
"step": 10600, |
|
"total_flos": 5072850468719490.0, |
|
"train_loss": 0.05464491794694145, |
|
"train_runtime": 1550.8875, |
|
"train_samples_per_second": 108.776, |
|
"train_steps_per_second": 6.835 |
|
} |
|
], |
|
"logging_steps": 500, |
|
"max_steps": 10600, |
|
"num_input_tokens_seen": 0, |
|
"num_train_epochs": 100, |
|
"save_steps": 500, |
|
"total_flos": 5072850468719490.0, |
|
"train_batch_size": 16, |
|
"trial_name": null, |
|
"trial_params": null |
|
} |
|
|