|
{ |
|
"best_metric": null, |
|
"best_model_checkpoint": null, |
|
"epoch": 100.0, |
|
"eval_steps": 500, |
|
"global_step": 10600, |
|
"is_hyper_param_search": false, |
|
"is_local_process_zero": true, |
|
"is_world_process_zero": true, |
|
"log_history": [ |
|
{ |
|
"epoch": 1.0, |
|
"grad_norm": 0.9931251406669617, |
|
"learning_rate": 4.9500000000000004e-05, |
|
"loss": 1.1468, |
|
"step": 106 |
|
}, |
|
{ |
|
"epoch": 1.0, |
|
"eval_LOCATION_f1": 0.0, |
|
"eval_LOCATION_number": 69, |
|
"eval_LOCATION_precision": 0.0, |
|
"eval_LOCATION_recall": 0.0, |
|
"eval_ORGANIZATION_f1": 0.0, |
|
"eval_ORGANIZATION_number": 58, |
|
"eval_ORGANIZATION_precision": 0.0, |
|
"eval_ORGANIZATION_recall": 0.0, |
|
"eval_PERSON_f1": 0.0, |
|
"eval_PERSON_number": 152, |
|
"eval_PERSON_precision": 0.0, |
|
"eval_PERSON_recall": 0.0, |
|
"eval_QUANTITY_f1": 0.0, |
|
"eval_QUANTITY_number": 30, |
|
"eval_QUANTITY_precision": 0.0, |
|
"eval_QUANTITY_recall": 0.0, |
|
"eval_TIME_f1": 0.0, |
|
"eval_TIME_number": 29, |
|
"eval_TIME_precision": 0.0, |
|
"eval_TIME_recall": 0.0, |
|
"eval_loss": 0.6908976435661316, |
|
"eval_overall_accuracy": 0.8396927016645327, |
|
"eval_overall_f1": 0.0, |
|
"eval_overall_precision": 0.0, |
|
"eval_overall_recall": 0.0, |
|
"eval_runtime": 0.2964, |
|
"eval_samples_per_second": 630.963, |
|
"eval_steps_per_second": 10.122, |
|
"step": 106 |
|
}, |
|
{ |
|
"epoch": 2.0, |
|
"grad_norm": 1.672861933708191, |
|
"learning_rate": 4.9e-05, |
|
"loss": 0.6623, |
|
"step": 212 |
|
}, |
|
{ |
|
"epoch": 2.0, |
|
"eval_LOCATION_f1": 0.0, |
|
"eval_LOCATION_number": 69, |
|
"eval_LOCATION_precision": 0.0, |
|
"eval_LOCATION_recall": 0.0, |
|
"eval_ORGANIZATION_f1": 0.0, |
|
"eval_ORGANIZATION_number": 58, |
|
"eval_ORGANIZATION_precision": 0.0, |
|
"eval_ORGANIZATION_recall": 0.0, |
|
"eval_PERSON_f1": 0.08235294117647059, |
|
"eval_PERSON_number": 152, |
|
"eval_PERSON_precision": 0.3888888888888889, |
|
"eval_PERSON_recall": 0.046052631578947366, |
|
"eval_QUANTITY_f1": 0.0, |
|
"eval_QUANTITY_number": 30, |
|
"eval_QUANTITY_precision": 0.0, |
|
"eval_QUANTITY_recall": 0.0, |
|
"eval_TIME_f1": 0.0, |
|
"eval_TIME_number": 29, |
|
"eval_TIME_precision": 0.0, |
|
"eval_TIME_recall": 0.0, |
|
"eval_loss": 0.5531525015830994, |
|
"eval_overall_accuracy": 0.8432778489116517, |
|
"eval_overall_f1": 0.03921568627450981, |
|
"eval_overall_precision": 0.3684210526315789, |
|
"eval_overall_recall": 0.020710059171597635, |
|
"eval_runtime": 0.2895, |
|
"eval_samples_per_second": 645.874, |
|
"eval_steps_per_second": 10.362, |
|
"step": 212 |
|
}, |
|
{ |
|
"epoch": 3.0, |
|
"grad_norm": 1.7515860795974731, |
|
"learning_rate": 4.85e-05, |
|
"loss": 0.5401, |
|
"step": 318 |
|
}, |
|
{ |
|
"epoch": 3.0, |
|
"eval_LOCATION_f1": 0.05263157894736841, |
|
"eval_LOCATION_number": 69, |
|
"eval_LOCATION_precision": 0.2857142857142857, |
|
"eval_LOCATION_recall": 0.028985507246376812, |
|
"eval_ORGANIZATION_f1": 0.0, |
|
"eval_ORGANIZATION_number": 58, |
|
"eval_ORGANIZATION_precision": 0.0, |
|
"eval_ORGANIZATION_recall": 0.0, |
|
"eval_PERSON_f1": 0.37722419928825623, |
|
"eval_PERSON_number": 152, |
|
"eval_PERSON_precision": 0.4108527131782946, |
|
"eval_PERSON_recall": 0.34868421052631576, |
|
"eval_QUANTITY_f1": 0.0, |
|
"eval_QUANTITY_number": 30, |
|
"eval_QUANTITY_precision": 0.0, |
|
"eval_QUANTITY_recall": 0.0, |
|
"eval_TIME_f1": 0.2727272727272727, |
|
"eval_TIME_number": 29, |
|
"eval_TIME_precision": 0.4, |
|
"eval_TIME_recall": 0.20689655172413793, |
|
"eval_loss": 0.4444293677806854, |
|
"eval_overall_accuracy": 0.8747759282970551, |
|
"eval_overall_f1": 0.24206349206349204, |
|
"eval_overall_precision": 0.3674698795180723, |
|
"eval_overall_recall": 0.1804733727810651, |
|
"eval_runtime": 0.2905, |
|
"eval_samples_per_second": 643.756, |
|
"eval_steps_per_second": 10.328, |
|
"step": 318 |
|
}, |
|
{ |
|
"epoch": 4.0, |
|
"grad_norm": 1.807163953781128, |
|
"learning_rate": 4.8e-05, |
|
"loss": 0.4414, |
|
"step": 424 |
|
}, |
|
{ |
|
"epoch": 4.0, |
|
"eval_LOCATION_f1": 0.30630630630630634, |
|
"eval_LOCATION_number": 69, |
|
"eval_LOCATION_precision": 0.40476190476190477, |
|
"eval_LOCATION_recall": 0.2463768115942029, |
|
"eval_ORGANIZATION_f1": 0.022222222222222223, |
|
"eval_ORGANIZATION_number": 58, |
|
"eval_ORGANIZATION_precision": 0.03125, |
|
"eval_ORGANIZATION_recall": 0.017241379310344827, |
|
"eval_PERSON_f1": 0.5571030640668524, |
|
"eval_PERSON_number": 152, |
|
"eval_PERSON_precision": 0.4830917874396135, |
|
"eval_PERSON_recall": 0.6578947368421053, |
|
"eval_QUANTITY_f1": 0.0, |
|
"eval_QUANTITY_number": 30, |
|
"eval_QUANTITY_precision": 0.0, |
|
"eval_QUANTITY_recall": 0.0, |
|
"eval_TIME_f1": 0.509090909090909, |
|
"eval_TIME_number": 29, |
|
"eval_TIME_precision": 0.5384615384615384, |
|
"eval_TIME_recall": 0.4827586206896552, |
|
"eval_loss": 0.35881680250167847, |
|
"eval_overall_accuracy": 0.8988476312419974, |
|
"eval_overall_f1": 0.39759036144578314, |
|
"eval_overall_precision": 0.4049079754601227, |
|
"eval_overall_recall": 0.3905325443786982, |
|
"eval_runtime": 0.2928, |
|
"eval_samples_per_second": 638.765, |
|
"eval_steps_per_second": 10.248, |
|
"step": 424 |
|
}, |
|
{ |
|
"epoch": 5.0, |
|
"grad_norm": 1.5580129623413086, |
|
"learning_rate": 4.75e-05, |
|
"loss": 0.3745, |
|
"step": 530 |
|
}, |
|
{ |
|
"epoch": 5.0, |
|
"eval_LOCATION_f1": 0.4671532846715329, |
|
"eval_LOCATION_number": 69, |
|
"eval_LOCATION_precision": 0.47058823529411764, |
|
"eval_LOCATION_recall": 0.463768115942029, |
|
"eval_ORGANIZATION_f1": 0.16326530612244897, |
|
"eval_ORGANIZATION_number": 58, |
|
"eval_ORGANIZATION_precision": 0.2, |
|
"eval_ORGANIZATION_recall": 0.13793103448275862, |
|
"eval_PERSON_f1": 0.6477272727272728, |
|
"eval_PERSON_number": 152, |
|
"eval_PERSON_precision": 0.57, |
|
"eval_PERSON_recall": 0.75, |
|
"eval_QUANTITY_f1": 0.3125, |
|
"eval_QUANTITY_number": 30, |
|
"eval_QUANTITY_precision": 0.29411764705882354, |
|
"eval_QUANTITY_recall": 0.3333333333333333, |
|
"eval_TIME_f1": 0.5901639344262296, |
|
"eval_TIME_number": 29, |
|
"eval_TIME_precision": 0.5625, |
|
"eval_TIME_recall": 0.6206896551724138, |
|
"eval_loss": 0.31193920969963074, |
|
"eval_overall_accuracy": 0.9157490396927017, |
|
"eval_overall_f1": 0.5112359550561797, |
|
"eval_overall_precision": 0.48663101604278075, |
|
"eval_overall_recall": 0.5384615384615384, |
|
"eval_runtime": 0.2915, |
|
"eval_samples_per_second": 641.473, |
|
"eval_steps_per_second": 10.291, |
|
"step": 530 |
|
}, |
|
{ |
|
"epoch": 6.0, |
|
"grad_norm": 1.159395694732666, |
|
"learning_rate": 4.7e-05, |
|
"loss": 0.3306, |
|
"step": 636 |
|
}, |
|
{ |
|
"epoch": 6.0, |
|
"eval_LOCATION_f1": 0.576923076923077, |
|
"eval_LOCATION_number": 69, |
|
"eval_LOCATION_precision": 0.5172413793103449, |
|
"eval_LOCATION_recall": 0.6521739130434783, |
|
"eval_ORGANIZATION_f1": 0.3883495145631068, |
|
"eval_ORGANIZATION_number": 58, |
|
"eval_ORGANIZATION_precision": 0.4444444444444444, |
|
"eval_ORGANIZATION_recall": 0.3448275862068966, |
|
"eval_PERSON_f1": 0.696883852691218, |
|
"eval_PERSON_number": 152, |
|
"eval_PERSON_precision": 0.6119402985074627, |
|
"eval_PERSON_recall": 0.8092105263157895, |
|
"eval_QUANTITY_f1": 0.4117647058823529, |
|
"eval_QUANTITY_number": 30, |
|
"eval_QUANTITY_precision": 0.3684210526315789, |
|
"eval_QUANTITY_recall": 0.4666666666666667, |
|
"eval_TIME_f1": 0.7931034482758621, |
|
"eval_TIME_number": 29, |
|
"eval_TIME_precision": 0.7931034482758621, |
|
"eval_TIME_recall": 0.7931034482758621, |
|
"eval_loss": 0.275112509727478, |
|
"eval_overall_accuracy": 0.9270166453265045, |
|
"eval_overall_f1": 0.6097560975609756, |
|
"eval_overall_precision": 0.5625, |
|
"eval_overall_recall": 0.665680473372781, |
|
"eval_runtime": 0.2917, |
|
"eval_samples_per_second": 640.987, |
|
"eval_steps_per_second": 10.283, |
|
"step": 636 |
|
}, |
|
{ |
|
"epoch": 7.0, |
|
"grad_norm": 0.7062077522277832, |
|
"learning_rate": 4.6500000000000005e-05, |
|
"loss": 0.2898, |
|
"step": 742 |
|
}, |
|
{ |
|
"epoch": 7.0, |
|
"eval_LOCATION_f1": 0.6455696202531644, |
|
"eval_LOCATION_number": 69, |
|
"eval_LOCATION_precision": 0.5730337078651685, |
|
"eval_LOCATION_recall": 0.7391304347826086, |
|
"eval_ORGANIZATION_f1": 0.4761904761904762, |
|
"eval_ORGANIZATION_number": 58, |
|
"eval_ORGANIZATION_precision": 0.5319148936170213, |
|
"eval_ORGANIZATION_recall": 0.43103448275862066, |
|
"eval_PERSON_f1": 0.7624633431085044, |
|
"eval_PERSON_number": 152, |
|
"eval_PERSON_precision": 0.6878306878306878, |
|
"eval_PERSON_recall": 0.8552631578947368, |
|
"eval_QUANTITY_f1": 0.5142857142857143, |
|
"eval_QUANTITY_number": 30, |
|
"eval_QUANTITY_precision": 0.45, |
|
"eval_QUANTITY_recall": 0.6, |
|
"eval_TIME_f1": 0.8275862068965517, |
|
"eval_TIME_number": 29, |
|
"eval_TIME_precision": 0.8275862068965517, |
|
"eval_TIME_recall": 0.8275862068965517, |
|
"eval_loss": 0.24487873911857605, |
|
"eval_overall_accuracy": 0.9346991037131882, |
|
"eval_overall_f1": 0.6775956284153006, |
|
"eval_overall_precision": 0.6294416243654822, |
|
"eval_overall_recall": 0.7337278106508875, |
|
"eval_runtime": 0.2925, |
|
"eval_samples_per_second": 639.305, |
|
"eval_steps_per_second": 10.256, |
|
"step": 742 |
|
}, |
|
{ |
|
"epoch": 8.0, |
|
"grad_norm": 0.7220238447189331, |
|
"learning_rate": 4.600000000000001e-05, |
|
"loss": 0.2565, |
|
"step": 848 |
|
}, |
|
{ |
|
"epoch": 8.0, |
|
"eval_LOCATION_f1": 0.6540880503144654, |
|
"eval_LOCATION_number": 69, |
|
"eval_LOCATION_precision": 0.5777777777777777, |
|
"eval_LOCATION_recall": 0.7536231884057971, |
|
"eval_ORGANIZATION_f1": 0.47457627118644075, |
|
"eval_ORGANIZATION_number": 58, |
|
"eval_ORGANIZATION_precision": 0.4666666666666667, |
|
"eval_ORGANIZATION_recall": 0.4827586206896552, |
|
"eval_PERSON_f1": 0.7751479289940829, |
|
"eval_PERSON_number": 152, |
|
"eval_PERSON_precision": 0.7043010752688172, |
|
"eval_PERSON_recall": 0.8618421052631579, |
|
"eval_QUANTITY_f1": 0.5, |
|
"eval_QUANTITY_number": 30, |
|
"eval_QUANTITY_precision": 0.42857142857142855, |
|
"eval_QUANTITY_recall": 0.6, |
|
"eval_TIME_f1": 0.8421052631578947, |
|
"eval_TIME_number": 29, |
|
"eval_TIME_precision": 0.8571428571428571, |
|
"eval_TIME_recall": 0.8275862068965517, |
|
"eval_loss": 0.22170113027095795, |
|
"eval_overall_accuracy": 0.9357234314980793, |
|
"eval_overall_f1": 0.6801075268817205, |
|
"eval_overall_precision": 0.6231527093596059, |
|
"eval_overall_recall": 0.7485207100591716, |
|
"eval_runtime": 0.2922, |
|
"eval_samples_per_second": 639.883, |
|
"eval_steps_per_second": 10.266, |
|
"step": 848 |
|
}, |
|
{ |
|
"epoch": 9.0, |
|
"grad_norm": 1.7445695400238037, |
|
"learning_rate": 4.55e-05, |
|
"loss": 0.2355, |
|
"step": 954 |
|
}, |
|
{ |
|
"epoch": 9.0, |
|
"eval_LOCATION_f1": 0.7051282051282052, |
|
"eval_LOCATION_number": 69, |
|
"eval_LOCATION_precision": 0.632183908045977, |
|
"eval_LOCATION_recall": 0.7971014492753623, |
|
"eval_ORGANIZATION_f1": 0.4642857142857143, |
|
"eval_ORGANIZATION_number": 58, |
|
"eval_ORGANIZATION_precision": 0.48148148148148145, |
|
"eval_ORGANIZATION_recall": 0.4482758620689655, |
|
"eval_PERSON_f1": 0.8012048192771084, |
|
"eval_PERSON_number": 152, |
|
"eval_PERSON_precision": 0.7388888888888889, |
|
"eval_PERSON_recall": 0.875, |
|
"eval_QUANTITY_f1": 0.49315068493150693, |
|
"eval_QUANTITY_number": 30, |
|
"eval_QUANTITY_precision": 0.4186046511627907, |
|
"eval_QUANTITY_recall": 0.6, |
|
"eval_TIME_f1": 0.8421052631578947, |
|
"eval_TIME_number": 29, |
|
"eval_TIME_precision": 0.8571428571428571, |
|
"eval_TIME_recall": 0.8275862068965517, |
|
"eval_loss": 0.19788858294487, |
|
"eval_overall_accuracy": 0.9413572343149808, |
|
"eval_overall_f1": 0.7013698630136985, |
|
"eval_overall_precision": 0.6530612244897959, |
|
"eval_overall_recall": 0.757396449704142, |
|
"eval_runtime": 0.2915, |
|
"eval_samples_per_second": 641.404, |
|
"eval_steps_per_second": 10.29, |
|
"step": 954 |
|
}, |
|
{ |
|
"epoch": 10.0, |
|
"grad_norm": 1.1619913578033447, |
|
"learning_rate": 4.5e-05, |
|
"loss": 0.2102, |
|
"step": 1060 |
|
}, |
|
{ |
|
"epoch": 10.0, |
|
"eval_LOCATION_f1": 0.7272727272727274, |
|
"eval_LOCATION_number": 69, |
|
"eval_LOCATION_precision": 0.6588235294117647, |
|
"eval_LOCATION_recall": 0.8115942028985508, |
|
"eval_ORGANIZATION_f1": 0.4736842105263158, |
|
"eval_ORGANIZATION_number": 58, |
|
"eval_ORGANIZATION_precision": 0.48214285714285715, |
|
"eval_ORGANIZATION_recall": 0.46551724137931033, |
|
"eval_PERSON_f1": 0.8098159509202454, |
|
"eval_PERSON_number": 152, |
|
"eval_PERSON_precision": 0.7586206896551724, |
|
"eval_PERSON_recall": 0.868421052631579, |
|
"eval_QUANTITY_f1": 0.5142857142857143, |
|
"eval_QUANTITY_number": 30, |
|
"eval_QUANTITY_precision": 0.45, |
|
"eval_QUANTITY_recall": 0.6, |
|
"eval_TIME_f1": 0.8421052631578947, |
|
"eval_TIME_number": 29, |
|
"eval_TIME_precision": 0.8571428571428571, |
|
"eval_TIME_recall": 0.8275862068965517, |
|
"eval_loss": 0.18124544620513916, |
|
"eval_overall_accuracy": 0.9441741357234315, |
|
"eval_overall_f1": 0.7128987517337032, |
|
"eval_overall_precision": 0.6710182767624021, |
|
"eval_overall_recall": 0.7603550295857988, |
|
"eval_runtime": 0.2938, |
|
"eval_samples_per_second": 636.52, |
|
"eval_steps_per_second": 10.212, |
|
"step": 1060 |
|
}, |
|
{ |
|
"epoch": 11.0, |
|
"grad_norm": 1.1275286674499512, |
|
"learning_rate": 4.4500000000000004e-05, |
|
"loss": 0.1959, |
|
"step": 1166 |
|
}, |
|
{ |
|
"epoch": 11.0, |
|
"eval_LOCATION_f1": 0.7169811320754716, |
|
"eval_LOCATION_number": 69, |
|
"eval_LOCATION_precision": 0.6333333333333333, |
|
"eval_LOCATION_recall": 0.8260869565217391, |
|
"eval_ORGANIZATION_f1": 0.4833333333333333, |
|
"eval_ORGANIZATION_number": 58, |
|
"eval_ORGANIZATION_precision": 0.46774193548387094, |
|
"eval_ORGANIZATION_recall": 0.5, |
|
"eval_PERSON_f1": 0.7975830815709969, |
|
"eval_PERSON_number": 152, |
|
"eval_PERSON_precision": 0.7374301675977654, |
|
"eval_PERSON_recall": 0.868421052631579, |
|
"eval_QUANTITY_f1": 0.5428571428571427, |
|
"eval_QUANTITY_number": 30, |
|
"eval_QUANTITY_precision": 0.475, |
|
"eval_QUANTITY_recall": 0.6333333333333333, |
|
"eval_TIME_f1": 0.8666666666666666, |
|
"eval_TIME_number": 29, |
|
"eval_TIME_precision": 0.8387096774193549, |
|
"eval_TIME_recall": 0.896551724137931, |
|
"eval_loss": 0.1784009039402008, |
|
"eval_overall_accuracy": 0.9441741357234315, |
|
"eval_overall_f1": 0.7108108108108109, |
|
"eval_overall_precision": 0.654228855721393, |
|
"eval_overall_recall": 0.7781065088757396, |
|
"eval_runtime": 0.293, |
|
"eval_samples_per_second": 638.276, |
|
"eval_steps_per_second": 10.24, |
|
"step": 1166 |
|
}, |
|
{ |
|
"epoch": 12.0, |
|
"grad_norm": 2.0943050384521484, |
|
"learning_rate": 4.4000000000000006e-05, |
|
"loss": 0.1851, |
|
"step": 1272 |
|
}, |
|
{ |
|
"epoch": 12.0, |
|
"eval_LOCATION_f1": 0.7549668874172186, |
|
"eval_LOCATION_number": 69, |
|
"eval_LOCATION_precision": 0.6951219512195121, |
|
"eval_LOCATION_recall": 0.8260869565217391, |
|
"eval_ORGANIZATION_f1": 0.5, |
|
"eval_ORGANIZATION_number": 58, |
|
"eval_ORGANIZATION_precision": 0.5, |
|
"eval_ORGANIZATION_recall": 0.5, |
|
"eval_PERSON_f1": 0.8098159509202454, |
|
"eval_PERSON_number": 152, |
|
"eval_PERSON_precision": 0.7586206896551724, |
|
"eval_PERSON_recall": 0.868421052631579, |
|
"eval_QUANTITY_f1": 0.5428571428571427, |
|
"eval_QUANTITY_number": 30, |
|
"eval_QUANTITY_precision": 0.475, |
|
"eval_QUANTITY_recall": 0.6333333333333333, |
|
"eval_TIME_f1": 0.847457627118644, |
|
"eval_TIME_number": 29, |
|
"eval_TIME_precision": 0.8333333333333334, |
|
"eval_TIME_recall": 0.8620689655172413, |
|
"eval_loss": 0.1627739518880844, |
|
"eval_overall_accuracy": 0.9477592829705506, |
|
"eval_overall_f1": 0.7257617728531854, |
|
"eval_overall_precision": 0.6822916666666666, |
|
"eval_overall_recall": 0.7751479289940828, |
|
"eval_runtime": 0.2924, |
|
"eval_samples_per_second": 639.503, |
|
"eval_steps_per_second": 10.259, |
|
"step": 1272 |
|
}, |
|
{ |
|
"epoch": 13.0, |
|
"grad_norm": 0.8063132166862488, |
|
"learning_rate": 4.35e-05, |
|
"loss": 0.1722, |
|
"step": 1378 |
|
}, |
|
{ |
|
"epoch": 13.0, |
|
"eval_LOCATION_f1": 0.7763157894736842, |
|
"eval_LOCATION_number": 69, |
|
"eval_LOCATION_precision": 0.7108433734939759, |
|
"eval_LOCATION_recall": 0.855072463768116, |
|
"eval_ORGANIZATION_f1": 0.4869565217391304, |
|
"eval_ORGANIZATION_number": 58, |
|
"eval_ORGANIZATION_precision": 0.49122807017543857, |
|
"eval_ORGANIZATION_recall": 0.4827586206896552, |
|
"eval_PERSON_f1": 0.8024316109422492, |
|
"eval_PERSON_number": 152, |
|
"eval_PERSON_precision": 0.7457627118644068, |
|
"eval_PERSON_recall": 0.868421052631579, |
|
"eval_QUANTITY_f1": 0.6470588235294117, |
|
"eval_QUANTITY_number": 30, |
|
"eval_QUANTITY_precision": 0.5789473684210527, |
|
"eval_QUANTITY_recall": 0.7333333333333333, |
|
"eval_TIME_f1": 0.8666666666666666, |
|
"eval_TIME_number": 29, |
|
"eval_TIME_precision": 0.8387096774193549, |
|
"eval_TIME_recall": 0.896551724137931, |
|
"eval_loss": 0.15798519551753998, |
|
"eval_overall_accuracy": 0.9477592829705506, |
|
"eval_overall_f1": 0.7375690607734806, |
|
"eval_overall_precision": 0.6917098445595855, |
|
"eval_overall_recall": 0.7899408284023669, |
|
"eval_runtime": 0.2918, |
|
"eval_samples_per_second": 640.94, |
|
"eval_steps_per_second": 10.282, |
|
"step": 1378 |
|
}, |
|
{ |
|
"epoch": 14.0, |
|
"grad_norm": 1.4455363750457764, |
|
"learning_rate": 4.3e-05, |
|
"loss": 0.1681, |
|
"step": 1484 |
|
}, |
|
{ |
|
"epoch": 14.0, |
|
"eval_LOCATION_f1": 0.7581699346405228, |
|
"eval_LOCATION_number": 69, |
|
"eval_LOCATION_precision": 0.6904761904761905, |
|
"eval_LOCATION_recall": 0.8405797101449275, |
|
"eval_ORGANIZATION_f1": 0.5581395348837208, |
|
"eval_ORGANIZATION_number": 58, |
|
"eval_ORGANIZATION_precision": 0.5070422535211268, |
|
"eval_ORGANIZATION_recall": 0.6206896551724138, |
|
"eval_PERSON_f1": 0.8148148148148148, |
|
"eval_PERSON_number": 152, |
|
"eval_PERSON_precision": 0.7674418604651163, |
|
"eval_PERSON_recall": 0.868421052631579, |
|
"eval_QUANTITY_f1": 0.7246376811594204, |
|
"eval_QUANTITY_number": 30, |
|
"eval_QUANTITY_precision": 0.6410256410256411, |
|
"eval_QUANTITY_recall": 0.8333333333333334, |
|
"eval_TIME_f1": 0.8333333333333334, |
|
"eval_TIME_number": 29, |
|
"eval_TIME_precision": 0.8064516129032258, |
|
"eval_TIME_recall": 0.8620689655172413, |
|
"eval_loss": 0.16039857268333435, |
|
"eval_overall_accuracy": 0.9495518565941101, |
|
"eval_overall_f1": 0.7510204081632653, |
|
"eval_overall_precision": 0.6952141057934509, |
|
"eval_overall_recall": 0.8165680473372781, |
|
"eval_runtime": 0.2865, |
|
"eval_samples_per_second": 652.766, |
|
"eval_steps_per_second": 10.472, |
|
"step": 1484 |
|
}, |
|
{ |
|
"epoch": 15.0, |
|
"grad_norm": 1.1877578496932983, |
|
"learning_rate": 4.25e-05, |
|
"loss": 0.1581, |
|
"step": 1590 |
|
}, |
|
{ |
|
"epoch": 15.0, |
|
"eval_LOCATION_f1": 0.7814569536423841, |
|
"eval_LOCATION_number": 69, |
|
"eval_LOCATION_precision": 0.7195121951219512, |
|
"eval_LOCATION_recall": 0.855072463768116, |
|
"eval_ORGANIZATION_f1": 0.5499999999999999, |
|
"eval_ORGANIZATION_number": 58, |
|
"eval_ORGANIZATION_precision": 0.532258064516129, |
|
"eval_ORGANIZATION_recall": 0.5689655172413793, |
|
"eval_PERSON_f1": 0.8161993769470405, |
|
"eval_PERSON_number": 152, |
|
"eval_PERSON_precision": 0.7751479289940828, |
|
"eval_PERSON_recall": 0.8618421052631579, |
|
"eval_QUANTITY_f1": 0.7164179104477612, |
|
"eval_QUANTITY_number": 30, |
|
"eval_QUANTITY_precision": 0.6486486486486487, |
|
"eval_QUANTITY_recall": 0.8, |
|
"eval_TIME_f1": 0.847457627118644, |
|
"eval_TIME_number": 29, |
|
"eval_TIME_precision": 0.8333333333333334, |
|
"eval_TIME_recall": 0.8620689655172413, |
|
"eval_loss": 0.1485019475221634, |
|
"eval_overall_accuracy": 0.952112676056338, |
|
"eval_overall_f1": 0.7576601671309192, |
|
"eval_overall_precision": 0.7157894736842105, |
|
"eval_overall_recall": 0.8047337278106509, |
|
"eval_runtime": 0.2924, |
|
"eval_samples_per_second": 639.644, |
|
"eval_steps_per_second": 10.262, |
|
"step": 1590 |
|
}, |
|
{ |
|
"epoch": 16.0, |
|
"grad_norm": 0.9984870553016663, |
|
"learning_rate": 4.2e-05, |
|
"loss": 0.1542, |
|
"step": 1696 |
|
}, |
|
{ |
|
"epoch": 16.0, |
|
"eval_LOCATION_f1": 0.802721088435374, |
|
"eval_LOCATION_number": 69, |
|
"eval_LOCATION_precision": 0.7564102564102564, |
|
"eval_LOCATION_recall": 0.855072463768116, |
|
"eval_ORGANIZATION_f1": 0.5920000000000001, |
|
"eval_ORGANIZATION_number": 58, |
|
"eval_ORGANIZATION_precision": 0.5522388059701493, |
|
"eval_ORGANIZATION_recall": 0.6379310344827587, |
|
"eval_PERSON_f1": 0.8136645962732919, |
|
"eval_PERSON_number": 152, |
|
"eval_PERSON_precision": 0.7705882352941177, |
|
"eval_PERSON_recall": 0.8618421052631579, |
|
"eval_QUANTITY_f1": 0.6363636363636365, |
|
"eval_QUANTITY_number": 30, |
|
"eval_QUANTITY_precision": 0.5833333333333334, |
|
"eval_QUANTITY_recall": 0.7, |
|
"eval_TIME_f1": 0.8813559322033899, |
|
"eval_TIME_number": 29, |
|
"eval_TIME_precision": 0.8666666666666667, |
|
"eval_TIME_recall": 0.896551724137931, |
|
"eval_loss": 0.14613807201385498, |
|
"eval_overall_accuracy": 0.9523687580025608, |
|
"eval_overall_f1": 0.7621696801112657, |
|
"eval_overall_precision": 0.7191601049868767, |
|
"eval_overall_recall": 0.8106508875739645, |
|
"eval_runtime": 0.2921, |
|
"eval_samples_per_second": 640.177, |
|
"eval_steps_per_second": 10.27, |
|
"step": 1696 |
|
}, |
|
{ |
|
"epoch": 17.0, |
|
"grad_norm": 0.7401907444000244, |
|
"learning_rate": 4.15e-05, |
|
"loss": 0.1528, |
|
"step": 1802 |
|
}, |
|
{ |
|
"epoch": 17.0, |
|
"eval_LOCATION_f1": 0.7843137254901961, |
|
"eval_LOCATION_number": 69, |
|
"eval_LOCATION_precision": 0.7142857142857143, |
|
"eval_LOCATION_recall": 0.8695652173913043, |
|
"eval_ORGANIZATION_f1": 0.5737704918032787, |
|
"eval_ORGANIZATION_number": 58, |
|
"eval_ORGANIZATION_precision": 0.546875, |
|
"eval_ORGANIZATION_recall": 0.603448275862069, |
|
"eval_PERSON_f1": 0.8123076923076923, |
|
"eval_PERSON_number": 152, |
|
"eval_PERSON_precision": 0.7630057803468208, |
|
"eval_PERSON_recall": 0.868421052631579, |
|
"eval_QUANTITY_f1": 0.7246376811594204, |
|
"eval_QUANTITY_number": 30, |
|
"eval_QUANTITY_precision": 0.6410256410256411, |
|
"eval_QUANTITY_recall": 0.8333333333333334, |
|
"eval_TIME_f1": 0.7936507936507937, |
|
"eval_TIME_number": 29, |
|
"eval_TIME_precision": 0.7352941176470589, |
|
"eval_TIME_recall": 0.8620689655172413, |
|
"eval_loss": 0.1483771950006485, |
|
"eval_overall_accuracy": 0.9518565941101153, |
|
"eval_overall_f1": 0.7568306010928961, |
|
"eval_overall_precision": 0.7030456852791879, |
|
"eval_overall_recall": 0.8195266272189349, |
|
"eval_runtime": 0.2861, |
|
"eval_samples_per_second": 653.665, |
|
"eval_steps_per_second": 10.487, |
|
"step": 1802 |
|
}, |
|
{ |
|
"epoch": 18.0, |
|
"grad_norm": 2.5112438201904297, |
|
"learning_rate": 4.1e-05, |
|
"loss": 0.1498, |
|
"step": 1908 |
|
}, |
|
{ |
|
"epoch": 18.0, |
|
"eval_LOCATION_f1": 0.7792207792207793, |
|
"eval_LOCATION_number": 69, |
|
"eval_LOCATION_precision": 0.7058823529411765, |
|
"eval_LOCATION_recall": 0.8695652173913043, |
|
"eval_ORGANIZATION_f1": 0.5546218487394958, |
|
"eval_ORGANIZATION_number": 58, |
|
"eval_ORGANIZATION_precision": 0.5409836065573771, |
|
"eval_ORGANIZATION_recall": 0.5689655172413793, |
|
"eval_PERSON_f1": 0.8159509202453987, |
|
"eval_PERSON_number": 152, |
|
"eval_PERSON_precision": 0.764367816091954, |
|
"eval_PERSON_recall": 0.875, |
|
"eval_QUANTITY_f1": 0.6956521739130435, |
|
"eval_QUANTITY_number": 30, |
|
"eval_QUANTITY_precision": 0.6153846153846154, |
|
"eval_QUANTITY_recall": 0.8, |
|
"eval_TIME_f1": 0.8064516129032258, |
|
"eval_TIME_number": 29, |
|
"eval_TIME_precision": 0.7575757575757576, |
|
"eval_TIME_recall": 0.8620689655172413, |
|
"eval_loss": 0.14724135398864746, |
|
"eval_overall_accuracy": 0.9498079385403329, |
|
"eval_overall_f1": 0.7534246575342467, |
|
"eval_overall_precision": 0.701530612244898, |
|
"eval_overall_recall": 0.8136094674556213, |
|
"eval_runtime": 0.2864, |
|
"eval_samples_per_second": 652.903, |
|
"eval_steps_per_second": 10.474, |
|
"step": 1908 |
|
}, |
|
{ |
|
"epoch": 19.0, |
|
"grad_norm": 1.1626933813095093, |
|
"learning_rate": 4.05e-05, |
|
"loss": 0.1439, |
|
"step": 2014 |
|
}, |
|
{ |
|
"epoch": 19.0, |
|
"eval_LOCATION_f1": 0.7999999999999999, |
|
"eval_LOCATION_number": 69, |
|
"eval_LOCATION_precision": 0.7407407407407407, |
|
"eval_LOCATION_recall": 0.8695652173913043, |
|
"eval_ORGANIZATION_f1": 0.5438596491228069, |
|
"eval_ORGANIZATION_number": 58, |
|
"eval_ORGANIZATION_precision": 0.5535714285714286, |
|
"eval_ORGANIZATION_recall": 0.5344827586206896, |
|
"eval_PERSON_f1": 0.8161993769470405, |
|
"eval_PERSON_number": 152, |
|
"eval_PERSON_precision": 0.7751479289940828, |
|
"eval_PERSON_recall": 0.8618421052631579, |
|
"eval_QUANTITY_f1": 0.7352941176470588, |
|
"eval_QUANTITY_number": 30, |
|
"eval_QUANTITY_precision": 0.6578947368421053, |
|
"eval_QUANTITY_recall": 0.8333333333333334, |
|
"eval_TIME_f1": 0.8524590163934426, |
|
"eval_TIME_number": 29, |
|
"eval_TIME_precision": 0.8125, |
|
"eval_TIME_recall": 0.896551724137931, |
|
"eval_loss": 0.14064399898052216, |
|
"eval_overall_accuracy": 0.9526248399487837, |
|
"eval_overall_f1": 0.7647058823529411, |
|
"eval_overall_precision": 0.726063829787234, |
|
"eval_overall_recall": 0.8076923076923077, |
|
"eval_runtime": 0.2933, |
|
"eval_samples_per_second": 637.623, |
|
"eval_steps_per_second": 10.229, |
|
"step": 2014 |
|
}, |
|
{ |
|
"epoch": 20.0, |
|
"grad_norm": 0.9214287996292114, |
|
"learning_rate": 4e-05, |
|
"loss": 0.141, |
|
"step": 2120 |
|
}, |
|
{ |
|
"epoch": 20.0, |
|
"eval_LOCATION_f1": 0.8133333333333332, |
|
"eval_LOCATION_number": 69, |
|
"eval_LOCATION_precision": 0.7530864197530864, |
|
"eval_LOCATION_recall": 0.8840579710144928, |
|
"eval_ORGANIZATION_f1": 0.5833333333333335, |
|
"eval_ORGANIZATION_number": 58, |
|
"eval_ORGANIZATION_precision": 0.5645161290322581, |
|
"eval_ORGANIZATION_recall": 0.603448275862069, |
|
"eval_PERSON_f1": 0.822429906542056, |
|
"eval_PERSON_number": 152, |
|
"eval_PERSON_precision": 0.7810650887573964, |
|
"eval_PERSON_recall": 0.868421052631579, |
|
"eval_QUANTITY_f1": 0.7352941176470588, |
|
"eval_QUANTITY_number": 30, |
|
"eval_QUANTITY_precision": 0.6578947368421053, |
|
"eval_QUANTITY_recall": 0.8333333333333334, |
|
"eval_TIME_f1": 0.8064516129032258, |
|
"eval_TIME_number": 29, |
|
"eval_TIME_precision": 0.7575757575757576, |
|
"eval_TIME_recall": 0.8620689655172413, |
|
"eval_loss": 0.14049667119979858, |
|
"eval_overall_accuracy": 0.954673495518566, |
|
"eval_overall_f1": 0.7711511789181693, |
|
"eval_overall_precision": 0.7258485639686684, |
|
"eval_overall_recall": 0.8224852071005917, |
|
"eval_runtime": 0.2923, |
|
"eval_samples_per_second": 639.829, |
|
"eval_steps_per_second": 10.265, |
|
"step": 2120 |
|
}, |
|
{ |
|
"epoch": 21.0, |
|
"grad_norm": 0.5010473132133484, |
|
"learning_rate": 3.9500000000000005e-05, |
|
"loss": 0.1371, |
|
"step": 2226 |
|
}, |
|
{ |
|
"epoch": 21.0, |
|
"eval_LOCATION_f1": 0.8157894736842105, |
|
"eval_LOCATION_number": 69, |
|
"eval_LOCATION_precision": 0.7469879518072289, |
|
"eval_LOCATION_recall": 0.8985507246376812, |
|
"eval_ORGANIZATION_f1": 0.6315789473684211, |
|
"eval_ORGANIZATION_number": 58, |
|
"eval_ORGANIZATION_precision": 0.56, |
|
"eval_ORGANIZATION_recall": 0.7241379310344828, |
|
"eval_PERSON_f1": 0.823529411764706, |
|
"eval_PERSON_number": 152, |
|
"eval_PERSON_precision": 0.7777777777777778, |
|
"eval_PERSON_recall": 0.875, |
|
"eval_QUANTITY_f1": 0.7058823529411765, |
|
"eval_QUANTITY_number": 30, |
|
"eval_QUANTITY_precision": 0.631578947368421, |
|
"eval_QUANTITY_recall": 0.8, |
|
"eval_TIME_f1": 0.8196721311475409, |
|
"eval_TIME_number": 29, |
|
"eval_TIME_precision": 0.78125, |
|
"eval_TIME_recall": 0.8620689655172413, |
|
"eval_loss": 0.14421436190605164, |
|
"eval_overall_accuracy": 0.9539052496798975, |
|
"eval_overall_f1": 0.7761194029850746, |
|
"eval_overall_precision": 0.7167919799498746, |
|
"eval_overall_recall": 0.8461538461538461, |
|
"eval_runtime": 0.2914, |
|
"eval_samples_per_second": 641.695, |
|
"eval_steps_per_second": 10.295, |
|
"step": 2226 |
|
}, |
|
{ |
|
"epoch": 22.0, |
|
"grad_norm": 1.076838493347168, |
|
"learning_rate": 3.9000000000000006e-05, |
|
"loss": 0.1341, |
|
"step": 2332 |
|
}, |
|
{ |
|
"epoch": 22.0, |
|
"eval_LOCATION_f1": 0.8211920529801324, |
|
"eval_LOCATION_number": 69, |
|
"eval_LOCATION_precision": 0.7560975609756098, |
|
"eval_LOCATION_recall": 0.8985507246376812, |
|
"eval_ORGANIZATION_f1": 0.6046511627906976, |
|
"eval_ORGANIZATION_number": 58, |
|
"eval_ORGANIZATION_precision": 0.5492957746478874, |
|
"eval_ORGANIZATION_recall": 0.6724137931034483, |
|
"eval_PERSON_f1": 0.825, |
|
"eval_PERSON_number": 152, |
|
"eval_PERSON_precision": 0.7857142857142857, |
|
"eval_PERSON_recall": 0.868421052631579, |
|
"eval_QUANTITY_f1": 0.7164179104477612, |
|
"eval_QUANTITY_number": 30, |
|
"eval_QUANTITY_precision": 0.6486486486486487, |
|
"eval_QUANTITY_recall": 0.8, |
|
"eval_TIME_f1": 0.8524590163934426, |
|
"eval_TIME_number": 29, |
|
"eval_TIME_precision": 0.8125, |
|
"eval_TIME_recall": 0.896551724137931, |
|
"eval_loss": 0.13648565113544464, |
|
"eval_overall_accuracy": 0.9564660691421255, |
|
"eval_overall_f1": 0.7774725274725275, |
|
"eval_overall_precision": 0.7256410256410256, |
|
"eval_overall_recall": 0.8372781065088757, |
|
"eval_runtime": 0.292, |
|
"eval_samples_per_second": 640.416, |
|
"eval_steps_per_second": 10.274, |
|
"step": 2332 |
|
}, |
|
{ |
|
"epoch": 23.0, |
|
"grad_norm": 0.791005551815033, |
|
"learning_rate": 3.85e-05, |
|
"loss": 0.1304, |
|
"step": 2438 |
|
}, |
|
{ |
|
"epoch": 23.0, |
|
"eval_LOCATION_f1": 0.8187919463087248, |
|
"eval_LOCATION_number": 69, |
|
"eval_LOCATION_precision": 0.7625, |
|
"eval_LOCATION_recall": 0.8840579710144928, |
|
"eval_ORGANIZATION_f1": 0.625, |
|
"eval_ORGANIZATION_number": 58, |
|
"eval_ORGANIZATION_precision": 0.5714285714285714, |
|
"eval_ORGANIZATION_recall": 0.6896551724137931, |
|
"eval_PERSON_f1": 0.8297213622291022, |
|
"eval_PERSON_number": 152, |
|
"eval_PERSON_precision": 0.783625730994152, |
|
"eval_PERSON_recall": 0.881578947368421, |
|
"eval_QUANTITY_f1": 0.7352941176470588, |
|
"eval_QUANTITY_number": 30, |
|
"eval_QUANTITY_precision": 0.6578947368421053, |
|
"eval_QUANTITY_recall": 0.8333333333333334, |
|
"eval_TIME_f1": 0.8524590163934426, |
|
"eval_TIME_number": 29, |
|
"eval_TIME_precision": 0.8125, |
|
"eval_TIME_recall": 0.896551724137931, |
|
"eval_loss": 0.13903699815273285, |
|
"eval_overall_accuracy": 0.9551856594110115, |
|
"eval_overall_f1": 0.7846364883401921, |
|
"eval_overall_precision": 0.731457800511509, |
|
"eval_overall_recall": 0.8461538461538461, |
|
"eval_runtime": 0.2925, |
|
"eval_samples_per_second": 639.291, |
|
"eval_steps_per_second": 10.256, |
|
"step": 2438 |
|
}, |
|
{ |
|
"epoch": 24.0, |
|
"grad_norm": 1.3590947389602661, |
|
"learning_rate": 3.8e-05, |
|
"loss": 0.1318, |
|
"step": 2544 |
|
}, |
|
{ |
|
"epoch": 24.0, |
|
"eval_LOCATION_f1": 0.8104575163398693, |
|
"eval_LOCATION_number": 69, |
|
"eval_LOCATION_precision": 0.7380952380952381, |
|
"eval_LOCATION_recall": 0.8985507246376812, |
|
"eval_ORGANIZATION_f1": 0.65625, |
|
"eval_ORGANIZATION_number": 58, |
|
"eval_ORGANIZATION_precision": 0.6, |
|
"eval_ORGANIZATION_recall": 0.7241379310344828, |
|
"eval_PERSON_f1": 0.8267477203647415, |
|
"eval_PERSON_number": 152, |
|
"eval_PERSON_precision": 0.768361581920904, |
|
"eval_PERSON_recall": 0.8947368421052632, |
|
"eval_QUANTITY_f1": 0.6956521739130435, |
|
"eval_QUANTITY_number": 30, |
|
"eval_QUANTITY_precision": 0.6153846153846154, |
|
"eval_QUANTITY_recall": 0.8, |
|
"eval_TIME_f1": 0.75, |
|
"eval_TIME_number": 29, |
|
"eval_TIME_precision": 0.6857142857142857, |
|
"eval_TIME_recall": 0.8275862068965517, |
|
"eval_loss": 0.14613154530525208, |
|
"eval_overall_accuracy": 0.9513444302176697, |
|
"eval_overall_f1": 0.775235531628533, |
|
"eval_overall_precision": 0.7111111111111111, |
|
"eval_overall_recall": 0.8520710059171598, |
|
"eval_runtime": 0.2919, |
|
"eval_samples_per_second": 640.557, |
|
"eval_steps_per_second": 10.276, |
|
"step": 2544 |
|
}, |
|
{ |
|
"epoch": 25.0, |
|
"grad_norm": 1.1456764936447144, |
|
"learning_rate": 3.7500000000000003e-05, |
|
"loss": 0.1283, |
|
"step": 2650 |
|
}, |
|
{ |
|
"epoch": 25.0, |
|
"eval_LOCATION_f1": 0.8266666666666668, |
|
"eval_LOCATION_number": 69, |
|
"eval_LOCATION_precision": 0.7654320987654321, |
|
"eval_LOCATION_recall": 0.8985507246376812, |
|
"eval_ORGANIZATION_f1": 0.6511627906976745, |
|
"eval_ORGANIZATION_number": 58, |
|
"eval_ORGANIZATION_precision": 0.5915492957746479, |
|
"eval_ORGANIZATION_recall": 0.7241379310344828, |
|
"eval_PERSON_f1": 0.8553459119496855, |
|
"eval_PERSON_number": 152, |
|
"eval_PERSON_precision": 0.8192771084337349, |
|
"eval_PERSON_recall": 0.8947368421052632, |
|
"eval_QUANTITY_f1": 0.7058823529411765, |
|
"eval_QUANTITY_number": 30, |
|
"eval_QUANTITY_precision": 0.631578947368421, |
|
"eval_QUANTITY_recall": 0.8, |
|
"eval_TIME_f1": 0.7619047619047619, |
|
"eval_TIME_number": 29, |
|
"eval_TIME_precision": 0.7058823529411765, |
|
"eval_TIME_recall": 0.8275862068965517, |
|
"eval_loss": 0.13710016012191772, |
|
"eval_overall_accuracy": 0.9564660691421255, |
|
"eval_overall_f1": 0.7912087912087913, |
|
"eval_overall_precision": 0.7384615384615385, |
|
"eval_overall_recall": 0.8520710059171598, |
|
"eval_runtime": 0.2922, |
|
"eval_samples_per_second": 640.035, |
|
"eval_steps_per_second": 10.268, |
|
"step": 2650 |
|
}, |
|
{ |
|
"epoch": 26.0, |
|
"grad_norm": 1.2503166198730469, |
|
"learning_rate": 3.7e-05, |
|
"loss": 0.1235, |
|
"step": 2756 |
|
}, |
|
{ |
|
"epoch": 26.0, |
|
"eval_LOCATION_f1": 0.8266666666666668, |
|
"eval_LOCATION_number": 69, |
|
"eval_LOCATION_precision": 0.7654320987654321, |
|
"eval_LOCATION_recall": 0.8985507246376812, |
|
"eval_ORGANIZATION_f1": 0.6614173228346457, |
|
"eval_ORGANIZATION_number": 58, |
|
"eval_ORGANIZATION_precision": 0.6086956521739131, |
|
"eval_ORGANIZATION_recall": 0.7241379310344828, |
|
"eval_PERSON_f1": 0.8430769230769231, |
|
"eval_PERSON_number": 152, |
|
"eval_PERSON_precision": 0.791907514450867, |
|
"eval_PERSON_recall": 0.9013157894736842, |
|
"eval_QUANTITY_f1": 0.7352941176470588, |
|
"eval_QUANTITY_number": 30, |
|
"eval_QUANTITY_precision": 0.6578947368421053, |
|
"eval_QUANTITY_recall": 0.8333333333333334, |
|
"eval_TIME_f1": 0.75, |
|
"eval_TIME_number": 29, |
|
"eval_TIME_precision": 0.6857142857142857, |
|
"eval_TIME_recall": 0.8275862068965517, |
|
"eval_loss": 0.13993725180625916, |
|
"eval_overall_accuracy": 0.9554417413572344, |
|
"eval_overall_f1": 0.790190735694823, |
|
"eval_overall_precision": 0.7323232323232324, |
|
"eval_overall_recall": 0.8579881656804734, |
|
"eval_runtime": 0.2929, |
|
"eval_samples_per_second": 638.409, |
|
"eval_steps_per_second": 10.242, |
|
"step": 2756 |
|
}, |
|
{ |
|
"epoch": 27.0, |
|
"grad_norm": 0.5744267702102661, |
|
"learning_rate": 3.65e-05, |
|
"loss": 0.1227, |
|
"step": 2862 |
|
}, |
|
{ |
|
"epoch": 27.0, |
|
"eval_LOCATION_f1": 0.8322147651006713, |
|
"eval_LOCATION_number": 69, |
|
"eval_LOCATION_precision": 0.775, |
|
"eval_LOCATION_recall": 0.8985507246376812, |
|
"eval_ORGANIZATION_f1": 0.6206896551724138, |
|
"eval_ORGANIZATION_number": 58, |
|
"eval_ORGANIZATION_precision": 0.6206896551724138, |
|
"eval_ORGANIZATION_recall": 0.6206896551724138, |
|
"eval_PERSON_f1": 0.8500000000000001, |
|
"eval_PERSON_number": 152, |
|
"eval_PERSON_precision": 0.8095238095238095, |
|
"eval_PERSON_recall": 0.8947368421052632, |
|
"eval_QUANTITY_f1": 0.7164179104477612, |
|
"eval_QUANTITY_number": 30, |
|
"eval_QUANTITY_precision": 0.6486486486486487, |
|
"eval_QUANTITY_recall": 0.8, |
|
"eval_TIME_f1": 0.8196721311475409, |
|
"eval_TIME_number": 29, |
|
"eval_TIME_precision": 0.78125, |
|
"eval_TIME_recall": 0.8620689655172413, |
|
"eval_loss": 0.13400302827358246, |
|
"eval_overall_accuracy": 0.9559539052496799, |
|
"eval_overall_f1": 0.79382889200561, |
|
"eval_overall_precision": 0.7546666666666667, |
|
"eval_overall_recall": 0.8372781065088757, |
|
"eval_runtime": 0.2913, |
|
"eval_samples_per_second": 642.045, |
|
"eval_steps_per_second": 10.3, |
|
"step": 2862 |
|
}, |
|
{ |
|
"epoch": 28.0, |
|
"grad_norm": 2.922327995300293, |
|
"learning_rate": 3.6e-05, |
|
"loss": 0.1237, |
|
"step": 2968 |
|
}, |
|
{ |
|
"epoch": 28.0, |
|
"eval_LOCATION_f1": 0.8322147651006713, |
|
"eval_LOCATION_number": 69, |
|
"eval_LOCATION_precision": 0.775, |
|
"eval_LOCATION_recall": 0.8985507246376812, |
|
"eval_ORGANIZATION_f1": 0.6393442622950819, |
|
"eval_ORGANIZATION_number": 58, |
|
"eval_ORGANIZATION_precision": 0.609375, |
|
"eval_ORGANIZATION_recall": 0.6724137931034483, |
|
"eval_PERSON_f1": 0.8589341692789968, |
|
"eval_PERSON_number": 152, |
|
"eval_PERSON_precision": 0.8203592814371258, |
|
"eval_PERSON_recall": 0.9013157894736842, |
|
"eval_QUANTITY_f1": 0.7575757575757577, |
|
"eval_QUANTITY_number": 30, |
|
"eval_QUANTITY_precision": 0.6944444444444444, |
|
"eval_QUANTITY_recall": 0.8333333333333334, |
|
"eval_TIME_f1": 0.7741935483870968, |
|
"eval_TIME_number": 29, |
|
"eval_TIME_precision": 0.7272727272727273, |
|
"eval_TIME_recall": 0.8275862068965517, |
|
"eval_loss": 0.13434159755706787, |
|
"eval_overall_accuracy": 0.9574903969270167, |
|
"eval_overall_f1": 0.7994428969359332, |
|
"eval_overall_precision": 0.7552631578947369, |
|
"eval_overall_recall": 0.849112426035503, |
|
"eval_runtime": 0.2921, |
|
"eval_samples_per_second": 640.264, |
|
"eval_steps_per_second": 10.272, |
|
"step": 2968 |
|
}, |
|
{ |
|
"epoch": 29.0, |
|
"grad_norm": 0.862956702709198, |
|
"learning_rate": 3.55e-05, |
|
"loss": 0.1185, |
|
"step": 3074 |
|
}, |
|
{ |
|
"epoch": 29.0, |
|
"eval_LOCATION_f1": 0.8456375838926175, |
|
"eval_LOCATION_number": 69, |
|
"eval_LOCATION_precision": 0.7875, |
|
"eval_LOCATION_recall": 0.9130434782608695, |
|
"eval_ORGANIZATION_f1": 0.6324786324786326, |
|
"eval_ORGANIZATION_number": 58, |
|
"eval_ORGANIZATION_precision": 0.6271186440677966, |
|
"eval_ORGANIZATION_recall": 0.6379310344827587, |
|
"eval_PERSON_f1": 0.8589341692789968, |
|
"eval_PERSON_number": 152, |
|
"eval_PERSON_precision": 0.8203592814371258, |
|
"eval_PERSON_recall": 0.9013157894736842, |
|
"eval_QUANTITY_f1": 0.7384615384615385, |
|
"eval_QUANTITY_number": 30, |
|
"eval_QUANTITY_precision": 0.6857142857142857, |
|
"eval_QUANTITY_recall": 0.8, |
|
"eval_TIME_f1": 0.7741935483870968, |
|
"eval_TIME_number": 29, |
|
"eval_TIME_precision": 0.7272727272727273, |
|
"eval_TIME_recall": 0.8275862068965517, |
|
"eval_loss": 0.13340412080287933, |
|
"eval_overall_accuracy": 0.9574903969270167, |
|
"eval_overall_f1": 0.800561797752809, |
|
"eval_overall_precision": 0.7620320855614974, |
|
"eval_overall_recall": 0.8431952662721893, |
|
"eval_runtime": 0.2929, |
|
"eval_samples_per_second": 638.377, |
|
"eval_steps_per_second": 10.241, |
|
"step": 3074 |
|
}, |
|
{ |
|
"epoch": 30.0, |
|
"grad_norm": 1.2341248989105225, |
|
"learning_rate": 3.5e-05, |
|
"loss": 0.1188, |
|
"step": 3180 |
|
}, |
|
{ |
|
"epoch": 30.0, |
|
"eval_LOCATION_f1": 0.8378378378378378, |
|
"eval_LOCATION_number": 69, |
|
"eval_LOCATION_precision": 0.7848101265822784, |
|
"eval_LOCATION_recall": 0.8985507246376812, |
|
"eval_ORGANIZATION_f1": 0.6446280991735537, |
|
"eval_ORGANIZATION_number": 58, |
|
"eval_ORGANIZATION_precision": 0.6190476190476191, |
|
"eval_ORGANIZATION_recall": 0.6724137931034483, |
|
"eval_PERSON_f1": 0.8517350157728707, |
|
"eval_PERSON_number": 152, |
|
"eval_PERSON_precision": 0.8181818181818182, |
|
"eval_PERSON_recall": 0.8881578947368421, |
|
"eval_QUANTITY_f1": 0.7384615384615385, |
|
"eval_QUANTITY_number": 30, |
|
"eval_QUANTITY_precision": 0.6857142857142857, |
|
"eval_QUANTITY_recall": 0.8, |
|
"eval_TIME_f1": 0.8196721311475409, |
|
"eval_TIME_number": 29, |
|
"eval_TIME_precision": 0.78125, |
|
"eval_TIME_recall": 0.8620689655172413, |
|
"eval_loss": 0.12923994660377502, |
|
"eval_overall_accuracy": 0.9582586427656851, |
|
"eval_overall_f1": 0.800561797752809, |
|
"eval_overall_precision": 0.7620320855614974, |
|
"eval_overall_recall": 0.8431952662721893, |
|
"eval_runtime": 0.2916, |
|
"eval_samples_per_second": 641.346, |
|
"eval_steps_per_second": 10.289, |
|
"step": 3180 |
|
}, |
|
{ |
|
"epoch": 31.0, |
|
"grad_norm": 0.7088314890861511, |
|
"learning_rate": 3.45e-05, |
|
"loss": 0.1157, |
|
"step": 3286 |
|
}, |
|
{ |
|
"epoch": 31.0, |
|
"eval_LOCATION_f1": 0.8322147651006713, |
|
"eval_LOCATION_number": 69, |
|
"eval_LOCATION_precision": 0.775, |
|
"eval_LOCATION_recall": 0.8985507246376812, |
|
"eval_ORGANIZATION_f1": 0.6050420168067226, |
|
"eval_ORGANIZATION_number": 58, |
|
"eval_ORGANIZATION_precision": 0.5901639344262295, |
|
"eval_ORGANIZATION_recall": 0.6206896551724138, |
|
"eval_PERSON_f1": 0.8411214953271028, |
|
"eval_PERSON_number": 152, |
|
"eval_PERSON_precision": 0.7988165680473372, |
|
"eval_PERSON_recall": 0.8881578947368421, |
|
"eval_QUANTITY_f1": 0.7692307692307692, |
|
"eval_QUANTITY_number": 30, |
|
"eval_QUANTITY_precision": 0.7142857142857143, |
|
"eval_QUANTITY_recall": 0.8333333333333334, |
|
"eval_TIME_f1": 0.7741935483870968, |
|
"eval_TIME_number": 29, |
|
"eval_TIME_precision": 0.7272727272727273, |
|
"eval_TIME_recall": 0.8275862068965517, |
|
"eval_loss": 0.12962517142295837, |
|
"eval_overall_accuracy": 0.9580025608194622, |
|
"eval_overall_f1": 0.787709497206704, |
|
"eval_overall_precision": 0.746031746031746, |
|
"eval_overall_recall": 0.834319526627219, |
|
"eval_runtime": 0.2921, |
|
"eval_samples_per_second": 640.291, |
|
"eval_steps_per_second": 10.272, |
|
"step": 3286 |
|
}, |
|
{ |
|
"epoch": 32.0, |
|
"grad_norm": 1.4589393138885498, |
|
"learning_rate": 3.4000000000000007e-05, |
|
"loss": 0.1159, |
|
"step": 3392 |
|
}, |
|
{ |
|
"epoch": 32.0, |
|
"eval_LOCATION_f1": 0.8378378378378378, |
|
"eval_LOCATION_number": 69, |
|
"eval_LOCATION_precision": 0.7848101265822784, |
|
"eval_LOCATION_recall": 0.8985507246376812, |
|
"eval_ORGANIZATION_f1": 0.6166666666666667, |
|
"eval_ORGANIZATION_number": 58, |
|
"eval_ORGANIZATION_precision": 0.5967741935483871, |
|
"eval_ORGANIZATION_recall": 0.6379310344827587, |
|
"eval_PERSON_f1": 0.8427672955974843, |
|
"eval_PERSON_number": 152, |
|
"eval_PERSON_precision": 0.8072289156626506, |
|
"eval_PERSON_recall": 0.881578947368421, |
|
"eval_QUANTITY_f1": 0.7384615384615385, |
|
"eval_QUANTITY_number": 30, |
|
"eval_QUANTITY_precision": 0.6857142857142857, |
|
"eval_QUANTITY_recall": 0.8, |
|
"eval_TIME_f1": 0.8333333333333334, |
|
"eval_TIME_number": 29, |
|
"eval_TIME_precision": 0.8064516129032258, |
|
"eval_TIME_recall": 0.8620689655172413, |
|
"eval_loss": 0.12884514033794403, |
|
"eval_overall_accuracy": 0.9582586427656851, |
|
"eval_overall_f1": 0.7932489451476793, |
|
"eval_overall_precision": 0.7560321715817694, |
|
"eval_overall_recall": 0.834319526627219, |
|
"eval_runtime": 0.2858, |
|
"eval_samples_per_second": 654.233, |
|
"eval_steps_per_second": 10.496, |
|
"step": 3392 |
|
}, |
|
{ |
|
"epoch": 33.0, |
|
"grad_norm": 0.7174299955368042, |
|
"learning_rate": 3.35e-05, |
|
"loss": 0.1156, |
|
"step": 3498 |
|
}, |
|
{ |
|
"epoch": 33.0, |
|
"eval_LOCATION_f1": 0.8513513513513514, |
|
"eval_LOCATION_number": 69, |
|
"eval_LOCATION_precision": 0.7974683544303798, |
|
"eval_LOCATION_recall": 0.9130434782608695, |
|
"eval_ORGANIZATION_f1": 0.628099173553719, |
|
"eval_ORGANIZATION_number": 58, |
|
"eval_ORGANIZATION_precision": 0.6031746031746031, |
|
"eval_ORGANIZATION_recall": 0.6551724137931034, |
|
"eval_PERSON_f1": 0.8417721518987342, |
|
"eval_PERSON_number": 152, |
|
"eval_PERSON_precision": 0.8109756097560976, |
|
"eval_PERSON_recall": 0.875, |
|
"eval_QUANTITY_f1": 0.7692307692307692, |
|
"eval_QUANTITY_number": 30, |
|
"eval_QUANTITY_precision": 0.7142857142857143, |
|
"eval_QUANTITY_recall": 0.8333333333333334, |
|
"eval_TIME_f1": 0.7868852459016394, |
|
"eval_TIME_number": 29, |
|
"eval_TIME_precision": 0.75, |
|
"eval_TIME_recall": 0.8275862068965517, |
|
"eval_loss": 0.12961573898792267, |
|
"eval_overall_accuracy": 0.9582586427656851, |
|
"eval_overall_f1": 0.7960618846694796, |
|
"eval_overall_precision": 0.7587131367292225, |
|
"eval_overall_recall": 0.8372781065088757, |
|
"eval_runtime": 0.2928, |
|
"eval_samples_per_second": 638.6, |
|
"eval_steps_per_second": 10.245, |
|
"step": 3498 |
|
}, |
|
{ |
|
"epoch": 34.0, |
|
"grad_norm": 1.449804663658142, |
|
"learning_rate": 3.3e-05, |
|
"loss": 0.1105, |
|
"step": 3604 |
|
}, |
|
{ |
|
"epoch": 34.0, |
|
"eval_LOCATION_f1": 0.8435374149659864, |
|
"eval_LOCATION_number": 69, |
|
"eval_LOCATION_precision": 0.7948717948717948, |
|
"eval_LOCATION_recall": 0.8985507246376812, |
|
"eval_ORGANIZATION_f1": 0.6962962962962962, |
|
"eval_ORGANIZATION_number": 58, |
|
"eval_ORGANIZATION_precision": 0.6103896103896104, |
|
"eval_ORGANIZATION_recall": 0.8103448275862069, |
|
"eval_PERSON_f1": 0.8580441640378549, |
|
"eval_PERSON_number": 152, |
|
"eval_PERSON_precision": 0.8242424242424242, |
|
"eval_PERSON_recall": 0.8947368421052632, |
|
"eval_QUANTITY_f1": 0.746268656716418, |
|
"eval_QUANTITY_number": 30, |
|
"eval_QUANTITY_precision": 0.6756756756756757, |
|
"eval_QUANTITY_recall": 0.8333333333333334, |
|
"eval_TIME_f1": 0.7741935483870968, |
|
"eval_TIME_number": 29, |
|
"eval_TIME_precision": 0.7272727272727273, |
|
"eval_TIME_recall": 0.8275862068965517, |
|
"eval_loss": 0.13476641476154327, |
|
"eval_overall_accuracy": 0.9587708066581306, |
|
"eval_overall_f1": 0.8076923076923076, |
|
"eval_overall_precision": 0.7538461538461538, |
|
"eval_overall_recall": 0.8698224852071006, |
|
"eval_runtime": 0.2917, |
|
"eval_samples_per_second": 641.12, |
|
"eval_steps_per_second": 10.285, |
|
"step": 3604 |
|
}, |
|
{ |
|
"epoch": 35.0, |
|
"grad_norm": 1.4639244079589844, |
|
"learning_rate": 3.2500000000000004e-05, |
|
"loss": 0.1116, |
|
"step": 3710 |
|
}, |
|
{ |
|
"epoch": 35.0, |
|
"eval_LOCATION_f1": 0.8513513513513514, |
|
"eval_LOCATION_number": 69, |
|
"eval_LOCATION_precision": 0.7974683544303798, |
|
"eval_LOCATION_recall": 0.9130434782608695, |
|
"eval_ORGANIZATION_f1": 0.6440677966101694, |
|
"eval_ORGANIZATION_number": 58, |
|
"eval_ORGANIZATION_precision": 0.6333333333333333, |
|
"eval_ORGANIZATION_recall": 0.6551724137931034, |
|
"eval_PERSON_f1": 0.8500000000000001, |
|
"eval_PERSON_number": 152, |
|
"eval_PERSON_precision": 0.8095238095238095, |
|
"eval_PERSON_recall": 0.8947368421052632, |
|
"eval_QUANTITY_f1": 0.6956521739130435, |
|
"eval_QUANTITY_number": 30, |
|
"eval_QUANTITY_precision": 0.6153846153846154, |
|
"eval_QUANTITY_recall": 0.8, |
|
"eval_TIME_f1": 0.7741935483870968, |
|
"eval_TIME_number": 29, |
|
"eval_TIME_precision": 0.7272727272727273, |
|
"eval_TIME_recall": 0.8275862068965517, |
|
"eval_loss": 0.1330917477607727, |
|
"eval_overall_accuracy": 0.9572343149807938, |
|
"eval_overall_f1": 0.7949790794979079, |
|
"eval_overall_precision": 0.7519788918205804, |
|
"eval_overall_recall": 0.8431952662721893, |
|
"eval_runtime": 0.285, |
|
"eval_samples_per_second": 656.101, |
|
"eval_steps_per_second": 10.526, |
|
"step": 3710 |
|
}, |
|
{ |
|
"epoch": 36.0, |
|
"grad_norm": 0.7658966183662415, |
|
"learning_rate": 3.2000000000000005e-05, |
|
"loss": 0.1115, |
|
"step": 3816 |
|
}, |
|
{ |
|
"epoch": 36.0, |
|
"eval_LOCATION_f1": 0.8513513513513514, |
|
"eval_LOCATION_number": 69, |
|
"eval_LOCATION_precision": 0.7974683544303798, |
|
"eval_LOCATION_recall": 0.9130434782608695, |
|
"eval_ORGANIZATION_f1": 0.6393442622950819, |
|
"eval_ORGANIZATION_number": 58, |
|
"eval_ORGANIZATION_precision": 0.609375, |
|
"eval_ORGANIZATION_recall": 0.6724137931034483, |
|
"eval_PERSON_f1": 0.8454258675078864, |
|
"eval_PERSON_number": 152, |
|
"eval_PERSON_precision": 0.8121212121212121, |
|
"eval_PERSON_recall": 0.881578947368421, |
|
"eval_QUANTITY_f1": 0.7352941176470588, |
|
"eval_QUANTITY_number": 30, |
|
"eval_QUANTITY_precision": 0.6578947368421053, |
|
"eval_QUANTITY_recall": 0.8333333333333334, |
|
"eval_TIME_f1": 0.7741935483870968, |
|
"eval_TIME_number": 29, |
|
"eval_TIME_precision": 0.7272727272727273, |
|
"eval_TIME_recall": 0.8275862068965517, |
|
"eval_loss": 0.1309656947851181, |
|
"eval_overall_accuracy": 0.9574903969270167, |
|
"eval_overall_f1": 0.7949790794979079, |
|
"eval_overall_precision": 0.7519788918205804, |
|
"eval_overall_recall": 0.8431952662721893, |
|
"eval_runtime": 0.2923, |
|
"eval_samples_per_second": 639.654, |
|
"eval_steps_per_second": 10.262, |
|
"step": 3816 |
|
}, |
|
{ |
|
"epoch": 37.0, |
|
"grad_norm": 0.6558132767677307, |
|
"learning_rate": 3.15e-05, |
|
"loss": 0.1102, |
|
"step": 3922 |
|
}, |
|
{ |
|
"epoch": 37.0, |
|
"eval_LOCATION_f1": 0.8456375838926175, |
|
"eval_LOCATION_number": 69, |
|
"eval_LOCATION_precision": 0.7875, |
|
"eval_LOCATION_recall": 0.9130434782608695, |
|
"eval_ORGANIZATION_f1": 0.7049180327868853, |
|
"eval_ORGANIZATION_number": 58, |
|
"eval_ORGANIZATION_precision": 0.671875, |
|
"eval_ORGANIZATION_recall": 0.7413793103448276, |
|
"eval_PERSON_f1": 0.8463949843260188, |
|
"eval_PERSON_number": 152, |
|
"eval_PERSON_precision": 0.8083832335329342, |
|
"eval_PERSON_recall": 0.8881578947368421, |
|
"eval_QUANTITY_f1": 0.7246376811594204, |
|
"eval_QUANTITY_number": 30, |
|
"eval_QUANTITY_precision": 0.6410256410256411, |
|
"eval_QUANTITY_recall": 0.8333333333333334, |
|
"eval_TIME_f1": 0.7741935483870968, |
|
"eval_TIME_number": 29, |
|
"eval_TIME_precision": 0.7272727272727273, |
|
"eval_TIME_recall": 0.8275862068965517, |
|
"eval_loss": 0.13514076173305511, |
|
"eval_overall_accuracy": 0.9590268886043534, |
|
"eval_overall_f1": 0.8044382801664354, |
|
"eval_overall_precision": 0.7571801566579635, |
|
"eval_overall_recall": 0.8579881656804734, |
|
"eval_runtime": 0.2919, |
|
"eval_samples_per_second": 640.546, |
|
"eval_steps_per_second": 10.276, |
|
"step": 3922 |
|
}, |
|
{ |
|
"epoch": 38.0, |
|
"grad_norm": 1.0988456010818481, |
|
"learning_rate": 3.1e-05, |
|
"loss": 0.1082, |
|
"step": 4028 |
|
}, |
|
{ |
|
"epoch": 38.0, |
|
"eval_LOCATION_f1": 0.8571428571428572, |
|
"eval_LOCATION_number": 69, |
|
"eval_LOCATION_precision": 0.8076923076923077, |
|
"eval_LOCATION_recall": 0.9130434782608695, |
|
"eval_ORGANIZATION_f1": 0.7230769230769231, |
|
"eval_ORGANIZATION_number": 58, |
|
"eval_ORGANIZATION_precision": 0.6527777777777778, |
|
"eval_ORGANIZATION_recall": 0.8103448275862069, |
|
"eval_PERSON_f1": 0.85625, |
|
"eval_PERSON_number": 152, |
|
"eval_PERSON_precision": 0.8154761904761905, |
|
"eval_PERSON_recall": 0.9013157894736842, |
|
"eval_QUANTITY_f1": 0.7246376811594204, |
|
"eval_QUANTITY_number": 30, |
|
"eval_QUANTITY_precision": 0.6410256410256411, |
|
"eval_QUANTITY_recall": 0.8333333333333334, |
|
"eval_TIME_f1": 0.7741935483870968, |
|
"eval_TIME_number": 29, |
|
"eval_TIME_precision": 0.7272727272727273, |
|
"eval_TIME_recall": 0.8275862068965517, |
|
"eval_loss": 0.13633978366851807, |
|
"eval_overall_accuracy": 0.9595390524967989, |
|
"eval_overall_f1": 0.8131868131868132, |
|
"eval_overall_precision": 0.7589743589743589, |
|
"eval_overall_recall": 0.8757396449704142, |
|
"eval_runtime": 0.2917, |
|
"eval_samples_per_second": 640.963, |
|
"eval_steps_per_second": 10.283, |
|
"step": 4028 |
|
}, |
|
{ |
|
"epoch": 39.0, |
|
"grad_norm": 2.279130458831787, |
|
"learning_rate": 3.05e-05, |
|
"loss": 0.1055, |
|
"step": 4134 |
|
}, |
|
{ |
|
"epoch": 39.0, |
|
"eval_LOCATION_f1": 0.8571428571428572, |
|
"eval_LOCATION_number": 69, |
|
"eval_LOCATION_precision": 0.8076923076923077, |
|
"eval_LOCATION_recall": 0.9130434782608695, |
|
"eval_ORGANIZATION_f1": 0.7107438016528926, |
|
"eval_ORGANIZATION_number": 58, |
|
"eval_ORGANIZATION_precision": 0.6825396825396826, |
|
"eval_ORGANIZATION_recall": 0.7413793103448276, |
|
"eval_PERSON_f1": 0.8490566037735849, |
|
"eval_PERSON_number": 152, |
|
"eval_PERSON_precision": 0.8132530120481928, |
|
"eval_PERSON_recall": 0.8881578947368421, |
|
"eval_QUANTITY_f1": 0.746268656716418, |
|
"eval_QUANTITY_number": 30, |
|
"eval_QUANTITY_precision": 0.6756756756756757, |
|
"eval_QUANTITY_recall": 0.8333333333333334, |
|
"eval_TIME_f1": 0.7868852459016394, |
|
"eval_TIME_number": 29, |
|
"eval_TIME_precision": 0.75, |
|
"eval_TIME_recall": 0.8275862068965517, |
|
"eval_loss": 0.1300368756055832, |
|
"eval_overall_accuracy": 0.9600512163892445, |
|
"eval_overall_f1": 0.8123249299719889, |
|
"eval_overall_precision": 0.7712765957446809, |
|
"eval_overall_recall": 0.8579881656804734, |
|
"eval_runtime": 0.2909, |
|
"eval_samples_per_second": 642.755, |
|
"eval_steps_per_second": 10.312, |
|
"step": 4134 |
|
}, |
|
{ |
|
"epoch": 40.0, |
|
"grad_norm": 1.3240655660629272, |
|
"learning_rate": 3e-05, |
|
"loss": 0.1041, |
|
"step": 4240 |
|
}, |
|
{ |
|
"epoch": 40.0, |
|
"eval_LOCATION_f1": 0.8571428571428572, |
|
"eval_LOCATION_number": 69, |
|
"eval_LOCATION_precision": 0.8076923076923077, |
|
"eval_LOCATION_recall": 0.9130434782608695, |
|
"eval_ORGANIZATION_f1": 0.7107438016528926, |
|
"eval_ORGANIZATION_number": 58, |
|
"eval_ORGANIZATION_precision": 0.6825396825396826, |
|
"eval_ORGANIZATION_recall": 0.7413793103448276, |
|
"eval_PERSON_f1": 0.8526645768025078, |
|
"eval_PERSON_number": 152, |
|
"eval_PERSON_precision": 0.8143712574850299, |
|
"eval_PERSON_recall": 0.8947368421052632, |
|
"eval_QUANTITY_f1": 0.7058823529411765, |
|
"eval_QUANTITY_number": 30, |
|
"eval_QUANTITY_precision": 0.631578947368421, |
|
"eval_QUANTITY_recall": 0.8, |
|
"eval_TIME_f1": 0.7741935483870968, |
|
"eval_TIME_number": 29, |
|
"eval_TIME_precision": 0.7272727272727273, |
|
"eval_TIME_recall": 0.8275862068965517, |
|
"eval_loss": 0.1312866359949112, |
|
"eval_overall_accuracy": 0.9595390524967989, |
|
"eval_overall_f1": 0.8089260808926082, |
|
"eval_overall_precision": 0.7651715039577837, |
|
"eval_overall_recall": 0.8579881656804734, |
|
"eval_runtime": 0.2908, |
|
"eval_samples_per_second": 643.094, |
|
"eval_steps_per_second": 10.317, |
|
"step": 4240 |
|
}, |
|
{ |
|
"epoch": 41.0, |
|
"grad_norm": 0.6957283616065979, |
|
"learning_rate": 2.95e-05, |
|
"loss": 0.1046, |
|
"step": 4346 |
|
}, |
|
{ |
|
"epoch": 41.0, |
|
"eval_LOCATION_f1": 0.863013698630137, |
|
"eval_LOCATION_number": 69, |
|
"eval_LOCATION_precision": 0.8181818181818182, |
|
"eval_LOCATION_recall": 0.9130434782608695, |
|
"eval_ORGANIZATION_f1": 0.7068965517241379, |
|
"eval_ORGANIZATION_number": 58, |
|
"eval_ORGANIZATION_precision": 0.7068965517241379, |
|
"eval_ORGANIZATION_recall": 0.7068965517241379, |
|
"eval_PERSON_f1": 0.8535825545171339, |
|
"eval_PERSON_number": 152, |
|
"eval_PERSON_precision": 0.8106508875739645, |
|
"eval_PERSON_recall": 0.9013157894736842, |
|
"eval_QUANTITY_f1": 0.7692307692307692, |
|
"eval_QUANTITY_number": 30, |
|
"eval_QUANTITY_precision": 0.7142857142857143, |
|
"eval_QUANTITY_recall": 0.8333333333333334, |
|
"eval_TIME_f1": 0.8196721311475409, |
|
"eval_TIME_number": 29, |
|
"eval_TIME_precision": 0.78125, |
|
"eval_TIME_recall": 0.8620689655172413, |
|
"eval_loss": 0.12765058875083923, |
|
"eval_overall_accuracy": 0.9605633802816902, |
|
"eval_overall_f1": 0.8208744710860366, |
|
"eval_overall_precision": 0.784366576819407, |
|
"eval_overall_recall": 0.8609467455621301, |
|
"eval_runtime": 0.2916, |
|
"eval_samples_per_second": 641.373, |
|
"eval_steps_per_second": 10.289, |
|
"step": 4346 |
|
}, |
|
{ |
|
"epoch": 42.0, |
|
"grad_norm": 1.2302607297897339, |
|
"learning_rate": 2.9e-05, |
|
"loss": 0.1035, |
|
"step": 4452 |
|
}, |
|
{ |
|
"epoch": 42.0, |
|
"eval_LOCATION_f1": 0.8571428571428572, |
|
"eval_LOCATION_number": 69, |
|
"eval_LOCATION_precision": 0.8076923076923077, |
|
"eval_LOCATION_recall": 0.9130434782608695, |
|
"eval_ORGANIZATION_f1": 0.6666666666666666, |
|
"eval_ORGANIZATION_number": 58, |
|
"eval_ORGANIZATION_precision": 0.6610169491525424, |
|
"eval_ORGANIZATION_recall": 0.6724137931034483, |
|
"eval_PERSON_f1": 0.8589341692789968, |
|
"eval_PERSON_number": 152, |
|
"eval_PERSON_precision": 0.8203592814371258, |
|
"eval_PERSON_recall": 0.9013157894736842, |
|
"eval_QUANTITY_f1": 0.7692307692307692, |
|
"eval_QUANTITY_number": 30, |
|
"eval_QUANTITY_precision": 0.7142857142857143, |
|
"eval_QUANTITY_recall": 0.8333333333333334, |
|
"eval_TIME_f1": 0.8196721311475409, |
|
"eval_TIME_number": 29, |
|
"eval_TIME_precision": 0.78125, |
|
"eval_TIME_recall": 0.8620689655172413, |
|
"eval_loss": 0.1273678094148636, |
|
"eval_overall_accuracy": 0.9610755441741358, |
|
"eval_overall_f1": 0.8152327221438647, |
|
"eval_overall_precision": 0.7789757412398922, |
|
"eval_overall_recall": 0.8550295857988166, |
|
"eval_runtime": 0.2858, |
|
"eval_samples_per_second": 654.203, |
|
"eval_steps_per_second": 10.495, |
|
"step": 4452 |
|
}, |
|
{ |
|
"epoch": 43.0, |
|
"grad_norm": 1.3074296712875366, |
|
"learning_rate": 2.8499999999999998e-05, |
|
"loss": 0.1032, |
|
"step": 4558 |
|
}, |
|
{ |
|
"epoch": 43.0, |
|
"eval_LOCATION_f1": 0.8571428571428572, |
|
"eval_LOCATION_number": 69, |
|
"eval_LOCATION_precision": 0.8076923076923077, |
|
"eval_LOCATION_recall": 0.9130434782608695, |
|
"eval_ORGANIZATION_f1": 0.6984126984126984, |
|
"eval_ORGANIZATION_number": 58, |
|
"eval_ORGANIZATION_precision": 0.6470588235294118, |
|
"eval_ORGANIZATION_recall": 0.7586206896551724, |
|
"eval_PERSON_f1": 0.8509316770186336, |
|
"eval_PERSON_number": 152, |
|
"eval_PERSON_precision": 0.8058823529411765, |
|
"eval_PERSON_recall": 0.9013157894736842, |
|
"eval_QUANTITY_f1": 0.7164179104477612, |
|
"eval_QUANTITY_number": 30, |
|
"eval_QUANTITY_precision": 0.6486486486486487, |
|
"eval_QUANTITY_recall": 0.8, |
|
"eval_TIME_f1": 0.7741935483870968, |
|
"eval_TIME_number": 29, |
|
"eval_TIME_precision": 0.7272727272727273, |
|
"eval_TIME_recall": 0.8275862068965517, |
|
"eval_loss": 0.13292378187179565, |
|
"eval_overall_accuracy": 0.9587708066581306, |
|
"eval_overall_f1": 0.8066298342541437, |
|
"eval_overall_precision": 0.7564766839378239, |
|
"eval_overall_recall": 0.863905325443787, |
|
"eval_runtime": 0.2869, |
|
"eval_samples_per_second": 651.864, |
|
"eval_steps_per_second": 10.458, |
|
"step": 4558 |
|
}, |
|
{ |
|
"epoch": 44.0, |
|
"grad_norm": 4.577354907989502, |
|
"learning_rate": 2.8000000000000003e-05, |
|
"loss": 0.1024, |
|
"step": 4664 |
|
}, |
|
{ |
|
"epoch": 44.0, |
|
"eval_LOCATION_f1": 0.863013698630137, |
|
"eval_LOCATION_number": 69, |
|
"eval_LOCATION_precision": 0.8181818181818182, |
|
"eval_LOCATION_recall": 0.9130434782608695, |
|
"eval_ORGANIZATION_f1": 0.711864406779661, |
|
"eval_ORGANIZATION_number": 58, |
|
"eval_ORGANIZATION_precision": 0.7, |
|
"eval_ORGANIZATION_recall": 0.7241379310344828, |
|
"eval_PERSON_f1": 0.8490566037735849, |
|
"eval_PERSON_number": 152, |
|
"eval_PERSON_precision": 0.8132530120481928, |
|
"eval_PERSON_recall": 0.8881578947368421, |
|
"eval_QUANTITY_f1": 0.7272727272727272, |
|
"eval_QUANTITY_number": 30, |
|
"eval_QUANTITY_precision": 0.6666666666666666, |
|
"eval_QUANTITY_recall": 0.8, |
|
"eval_TIME_f1": 0.8196721311475409, |
|
"eval_TIME_number": 29, |
|
"eval_TIME_precision": 0.78125, |
|
"eval_TIME_recall": 0.8620689655172413, |
|
"eval_loss": 0.12674523890018463, |
|
"eval_overall_accuracy": 0.9613316261203585, |
|
"eval_overall_f1": 0.8152327221438647, |
|
"eval_overall_precision": 0.7789757412398922, |
|
"eval_overall_recall": 0.8550295857988166, |
|
"eval_runtime": 0.2861, |
|
"eval_samples_per_second": 653.585, |
|
"eval_steps_per_second": 10.485, |
|
"step": 4664 |
|
}, |
|
{ |
|
"epoch": 45.0, |
|
"grad_norm": 1.4018518924713135, |
|
"learning_rate": 2.7500000000000004e-05, |
|
"loss": 0.1002, |
|
"step": 4770 |
|
}, |
|
{ |
|
"epoch": 45.0, |
|
"eval_LOCATION_f1": 0.863013698630137, |
|
"eval_LOCATION_number": 69, |
|
"eval_LOCATION_precision": 0.8181818181818182, |
|
"eval_LOCATION_recall": 0.9130434782608695, |
|
"eval_ORGANIZATION_f1": 0.7301587301587301, |
|
"eval_ORGANIZATION_number": 58, |
|
"eval_ORGANIZATION_precision": 0.6764705882352942, |
|
"eval_ORGANIZATION_recall": 0.7931034482758621, |
|
"eval_PERSON_f1": 0.8526645768025078, |
|
"eval_PERSON_number": 152, |
|
"eval_PERSON_precision": 0.8143712574850299, |
|
"eval_PERSON_recall": 0.8947368421052632, |
|
"eval_QUANTITY_f1": 0.7692307692307692, |
|
"eval_QUANTITY_number": 30, |
|
"eval_QUANTITY_precision": 0.7142857142857143, |
|
"eval_QUANTITY_recall": 0.8333333333333334, |
|
"eval_TIME_f1": 0.7868852459016394, |
|
"eval_TIME_number": 29, |
|
"eval_TIME_precision": 0.75, |
|
"eval_TIME_recall": 0.8275862068965517, |
|
"eval_loss": 0.13057196140289307, |
|
"eval_overall_accuracy": 0.9610755441741358, |
|
"eval_overall_f1": 0.8200836820083682, |
|
"eval_overall_precision": 0.7757255936675461, |
|
"eval_overall_recall": 0.8698224852071006, |
|
"eval_runtime": 0.2862, |
|
"eval_samples_per_second": 653.329, |
|
"eval_steps_per_second": 10.481, |
|
"step": 4770 |
|
}, |
|
{ |
|
"epoch": 46.0, |
|
"grad_norm": 1.6696031093597412, |
|
"learning_rate": 2.7000000000000002e-05, |
|
"loss": 0.1001, |
|
"step": 4876 |
|
}, |
|
{ |
|
"epoch": 46.0, |
|
"eval_LOCATION_f1": 0.863013698630137, |
|
"eval_LOCATION_number": 69, |
|
"eval_LOCATION_precision": 0.8181818181818182, |
|
"eval_LOCATION_recall": 0.9130434782608695, |
|
"eval_ORGANIZATION_f1": 0.7580645161290323, |
|
"eval_ORGANIZATION_number": 58, |
|
"eval_ORGANIZATION_precision": 0.7121212121212122, |
|
"eval_ORGANIZATION_recall": 0.8103448275862069, |
|
"eval_PERSON_f1": 0.8526645768025078, |
|
"eval_PERSON_number": 152, |
|
"eval_PERSON_precision": 0.8143712574850299, |
|
"eval_PERSON_recall": 0.8947368421052632, |
|
"eval_QUANTITY_f1": 0.7692307692307692, |
|
"eval_QUANTITY_number": 30, |
|
"eval_QUANTITY_precision": 0.7142857142857143, |
|
"eval_QUANTITY_recall": 0.8333333333333334, |
|
"eval_TIME_f1": 0.7868852459016394, |
|
"eval_TIME_number": 29, |
|
"eval_TIME_precision": 0.75, |
|
"eval_TIME_recall": 0.8275862068965517, |
|
"eval_loss": 0.12734322249889374, |
|
"eval_overall_accuracy": 0.9623559539052496, |
|
"eval_overall_f1": 0.8251748251748251, |
|
"eval_overall_precision": 0.7824933687002652, |
|
"eval_overall_recall": 0.8727810650887574, |
|
"eval_runtime": 0.285, |
|
"eval_samples_per_second": 656.038, |
|
"eval_steps_per_second": 10.525, |
|
"step": 4876 |
|
}, |
|
{ |
|
"epoch": 47.0, |
|
"grad_norm": 1.0449410676956177, |
|
"learning_rate": 2.6500000000000004e-05, |
|
"loss": 0.0991, |
|
"step": 4982 |
|
}, |
|
{ |
|
"epoch": 47.0, |
|
"eval_LOCATION_f1": 0.863013698630137, |
|
"eval_LOCATION_number": 69, |
|
"eval_LOCATION_precision": 0.8181818181818182, |
|
"eval_LOCATION_recall": 0.9130434782608695, |
|
"eval_ORGANIZATION_f1": 0.7049180327868853, |
|
"eval_ORGANIZATION_number": 58, |
|
"eval_ORGANIZATION_precision": 0.671875, |
|
"eval_ORGANIZATION_recall": 0.7413793103448276, |
|
"eval_PERSON_f1": 0.8553459119496855, |
|
"eval_PERSON_number": 152, |
|
"eval_PERSON_precision": 0.8192771084337349, |
|
"eval_PERSON_recall": 0.8947368421052632, |
|
"eval_QUANTITY_f1": 0.7272727272727272, |
|
"eval_QUANTITY_number": 30, |
|
"eval_QUANTITY_precision": 0.6666666666666666, |
|
"eval_QUANTITY_recall": 0.8, |
|
"eval_TIME_f1": 0.7868852459016394, |
|
"eval_TIME_number": 29, |
|
"eval_TIME_precision": 0.75, |
|
"eval_TIME_recall": 0.8275862068965517, |
|
"eval_loss": 0.13027527928352356, |
|
"eval_overall_accuracy": 0.9605633802816902, |
|
"eval_overall_f1": 0.8134642356241234, |
|
"eval_overall_precision": 0.7733333333333333, |
|
"eval_overall_recall": 0.8579881656804734, |
|
"eval_runtime": 0.2853, |
|
"eval_samples_per_second": 655.416, |
|
"eval_steps_per_second": 10.515, |
|
"step": 4982 |
|
}, |
|
{ |
|
"epoch": 48.0, |
|
"grad_norm": 0.8292348980903625, |
|
"learning_rate": 2.6000000000000002e-05, |
|
"loss": 0.097, |
|
"step": 5088 |
|
}, |
|
{ |
|
"epoch": 48.0, |
|
"eval_LOCATION_f1": 0.863013698630137, |
|
"eval_LOCATION_number": 69, |
|
"eval_LOCATION_precision": 0.8181818181818182, |
|
"eval_LOCATION_recall": 0.9130434782608695, |
|
"eval_ORGANIZATION_f1": 0.7166666666666668, |
|
"eval_ORGANIZATION_number": 58, |
|
"eval_ORGANIZATION_precision": 0.6935483870967742, |
|
"eval_ORGANIZATION_recall": 0.7413793103448276, |
|
"eval_PERSON_f1": 0.8553459119496855, |
|
"eval_PERSON_number": 152, |
|
"eval_PERSON_precision": 0.8192771084337349, |
|
"eval_PERSON_recall": 0.8947368421052632, |
|
"eval_QUANTITY_f1": 0.7692307692307692, |
|
"eval_QUANTITY_number": 30, |
|
"eval_QUANTITY_precision": 0.7142857142857143, |
|
"eval_QUANTITY_recall": 0.8333333333333334, |
|
"eval_TIME_f1": 0.8196721311475409, |
|
"eval_TIME_number": 29, |
|
"eval_TIME_precision": 0.78125, |
|
"eval_TIME_recall": 0.8620689655172413, |
|
"eval_loss": 0.12755466997623444, |
|
"eval_overall_accuracy": 0.9615877080665813, |
|
"eval_overall_f1": 0.8225352112676056, |
|
"eval_overall_precision": 0.7849462365591398, |
|
"eval_overall_recall": 0.863905325443787, |
|
"eval_runtime": 0.287, |
|
"eval_samples_per_second": 651.508, |
|
"eval_steps_per_second": 10.452, |
|
"step": 5088 |
|
}, |
|
{ |
|
"epoch": 49.0, |
|
"grad_norm": 1.932066798210144, |
|
"learning_rate": 2.5500000000000003e-05, |
|
"loss": 0.0977, |
|
"step": 5194 |
|
}, |
|
{ |
|
"epoch": 49.0, |
|
"eval_LOCATION_f1": 0.863013698630137, |
|
"eval_LOCATION_number": 69, |
|
"eval_LOCATION_precision": 0.8181818181818182, |
|
"eval_LOCATION_recall": 0.9130434782608695, |
|
"eval_ORGANIZATION_f1": 0.7317073170731708, |
|
"eval_ORGANIZATION_number": 58, |
|
"eval_ORGANIZATION_precision": 0.6923076923076923, |
|
"eval_ORGANIZATION_recall": 0.7758620689655172, |
|
"eval_PERSON_f1": 0.8553459119496855, |
|
"eval_PERSON_number": 152, |
|
"eval_PERSON_precision": 0.8192771084337349, |
|
"eval_PERSON_recall": 0.8947368421052632, |
|
"eval_QUANTITY_f1": 0.7272727272727272, |
|
"eval_QUANTITY_number": 30, |
|
"eval_QUANTITY_precision": 0.6666666666666666, |
|
"eval_QUANTITY_recall": 0.8, |
|
"eval_TIME_f1": 0.8196721311475409, |
|
"eval_TIME_number": 29, |
|
"eval_TIME_precision": 0.78125, |
|
"eval_TIME_recall": 0.8620689655172413, |
|
"eval_loss": 0.1271757185459137, |
|
"eval_overall_accuracy": 0.9618437900128041, |
|
"eval_overall_f1": 0.8207282913165266, |
|
"eval_overall_precision": 0.7792553191489362, |
|
"eval_overall_recall": 0.8668639053254438, |
|
"eval_runtime": 0.2859, |
|
"eval_samples_per_second": 654.146, |
|
"eval_steps_per_second": 10.494, |
|
"step": 5194 |
|
}, |
|
{ |
|
"epoch": 50.0, |
|
"grad_norm": 3.0932295322418213, |
|
"learning_rate": 2.5e-05, |
|
"loss": 0.0972, |
|
"step": 5300 |
|
}, |
|
{ |
|
"epoch": 50.0, |
|
"eval_LOCATION_f1": 0.863013698630137, |
|
"eval_LOCATION_number": 69, |
|
"eval_LOCATION_precision": 0.8181818181818182, |
|
"eval_LOCATION_recall": 0.9130434782608695, |
|
"eval_ORGANIZATION_f1": 0.6896551724137931, |
|
"eval_ORGANIZATION_number": 58, |
|
"eval_ORGANIZATION_precision": 0.6896551724137931, |
|
"eval_ORGANIZATION_recall": 0.6896551724137931, |
|
"eval_PERSON_f1": 0.8454258675078864, |
|
"eval_PERSON_number": 152, |
|
"eval_PERSON_precision": 0.8121212121212121, |
|
"eval_PERSON_recall": 0.881578947368421, |
|
"eval_QUANTITY_f1": 0.7692307692307692, |
|
"eval_QUANTITY_number": 30, |
|
"eval_QUANTITY_precision": 0.7142857142857143, |
|
"eval_QUANTITY_recall": 0.8333333333333334, |
|
"eval_TIME_f1": 0.8135593220338982, |
|
"eval_TIME_number": 29, |
|
"eval_TIME_precision": 0.8, |
|
"eval_TIME_recall": 0.8275862068965517, |
|
"eval_loss": 0.12482242286205292, |
|
"eval_overall_accuracy": 0.9608194622279129, |
|
"eval_overall_f1": 0.813655761024182, |
|
"eval_overall_precision": 0.7835616438356164, |
|
"eval_overall_recall": 0.8461538461538461, |
|
"eval_runtime": 0.2852, |
|
"eval_samples_per_second": 655.67, |
|
"eval_steps_per_second": 10.519, |
|
"step": 5300 |
|
}, |
|
{ |
|
"epoch": 51.0, |
|
"grad_norm": 2.206186532974243, |
|
"learning_rate": 2.45e-05, |
|
"loss": 0.096, |
|
"step": 5406 |
|
}, |
|
{ |
|
"epoch": 51.0, |
|
"eval_LOCATION_f1": 0.863013698630137, |
|
"eval_LOCATION_number": 69, |
|
"eval_LOCATION_precision": 0.8181818181818182, |
|
"eval_LOCATION_recall": 0.9130434782608695, |
|
"eval_ORGANIZATION_f1": 0.7213114754098361, |
|
"eval_ORGANIZATION_number": 58, |
|
"eval_ORGANIZATION_precision": 0.6875, |
|
"eval_ORGANIZATION_recall": 0.7586206896551724, |
|
"eval_PERSON_f1": 0.8553459119496855, |
|
"eval_PERSON_number": 152, |
|
"eval_PERSON_precision": 0.8192771084337349, |
|
"eval_PERSON_recall": 0.8947368421052632, |
|
"eval_QUANTITY_f1": 0.7692307692307692, |
|
"eval_QUANTITY_number": 30, |
|
"eval_QUANTITY_precision": 0.7142857142857143, |
|
"eval_QUANTITY_recall": 0.8333333333333334, |
|
"eval_TIME_f1": 0.7868852459016394, |
|
"eval_TIME_number": 29, |
|
"eval_TIME_precision": 0.75, |
|
"eval_TIME_recall": 0.8275862068965517, |
|
"eval_loss": 0.12892574071884155, |
|
"eval_overall_accuracy": 0.9615877080665813, |
|
"eval_overall_f1": 0.8202247191011235, |
|
"eval_overall_precision": 0.7807486631016043, |
|
"eval_overall_recall": 0.863905325443787, |
|
"eval_runtime": 0.2876, |
|
"eval_samples_per_second": 650.266, |
|
"eval_steps_per_second": 10.432, |
|
"step": 5406 |
|
}, |
|
{ |
|
"epoch": 52.0, |
|
"grad_norm": 1.056382179260254, |
|
"learning_rate": 2.4e-05, |
|
"loss": 0.0942, |
|
"step": 5512 |
|
}, |
|
{ |
|
"epoch": 52.0, |
|
"eval_LOCATION_f1": 0.863013698630137, |
|
"eval_LOCATION_number": 69, |
|
"eval_LOCATION_precision": 0.8181818181818182, |
|
"eval_LOCATION_recall": 0.9130434782608695, |
|
"eval_ORGANIZATION_f1": 0.7596899224806202, |
|
"eval_ORGANIZATION_number": 58, |
|
"eval_ORGANIZATION_precision": 0.6901408450704225, |
|
"eval_ORGANIZATION_recall": 0.8448275862068966, |
|
"eval_PERSON_f1": 0.8652037617554859, |
|
"eval_PERSON_number": 152, |
|
"eval_PERSON_precision": 0.8263473053892215, |
|
"eval_PERSON_recall": 0.9078947368421053, |
|
"eval_QUANTITY_f1": 0.7164179104477612, |
|
"eval_QUANTITY_number": 30, |
|
"eval_QUANTITY_precision": 0.6486486486486487, |
|
"eval_QUANTITY_recall": 0.8, |
|
"eval_TIME_f1": 0.7741935483870968, |
|
"eval_TIME_number": 29, |
|
"eval_TIME_precision": 0.7272727272727273, |
|
"eval_TIME_recall": 0.8275862068965517, |
|
"eval_loss": 0.13124997913837433, |
|
"eval_overall_accuracy": 0.9613316261203585, |
|
"eval_overall_f1": 0.8243430152143846, |
|
"eval_overall_precision": 0.7740259740259741, |
|
"eval_overall_recall": 0.8816568047337278, |
|
"eval_runtime": 0.2864, |
|
"eval_samples_per_second": 652.86, |
|
"eval_steps_per_second": 10.474, |
|
"step": 5512 |
|
}, |
|
{ |
|
"epoch": 53.0, |
|
"grad_norm": 0.8895484805107117, |
|
"learning_rate": 2.35e-05, |
|
"loss": 0.096, |
|
"step": 5618 |
|
}, |
|
{ |
|
"epoch": 53.0, |
|
"eval_LOCATION_f1": 0.863013698630137, |
|
"eval_LOCATION_number": 69, |
|
"eval_LOCATION_precision": 0.8181818181818182, |
|
"eval_LOCATION_recall": 0.9130434782608695, |
|
"eval_ORGANIZATION_f1": 0.7377049180327868, |
|
"eval_ORGANIZATION_number": 58, |
|
"eval_ORGANIZATION_precision": 0.703125, |
|
"eval_ORGANIZATION_recall": 0.7758620689655172, |
|
"eval_PERSON_f1": 0.8526645768025078, |
|
"eval_PERSON_number": 152, |
|
"eval_PERSON_precision": 0.8143712574850299, |
|
"eval_PERSON_recall": 0.8947368421052632, |
|
"eval_QUANTITY_f1": 0.7692307692307692, |
|
"eval_QUANTITY_number": 30, |
|
"eval_QUANTITY_precision": 0.7142857142857143, |
|
"eval_QUANTITY_recall": 0.8333333333333334, |
|
"eval_TIME_f1": 0.7999999999999999, |
|
"eval_TIME_number": 29, |
|
"eval_TIME_precision": 0.7741935483870968, |
|
"eval_TIME_recall": 0.8275862068965517, |
|
"eval_loss": 0.12694130837917328, |
|
"eval_overall_accuracy": 0.9623559539052496, |
|
"eval_overall_f1": 0.8230337078651686, |
|
"eval_overall_precision": 0.7834224598930482, |
|
"eval_overall_recall": 0.8668639053254438, |
|
"eval_runtime": 0.2864, |
|
"eval_samples_per_second": 652.82, |
|
"eval_steps_per_second": 10.473, |
|
"step": 5618 |
|
}, |
|
{ |
|
"epoch": 54.0, |
|
"grad_norm": 0.746292769908905, |
|
"learning_rate": 2.3000000000000003e-05, |
|
"loss": 0.092, |
|
"step": 5724 |
|
}, |
|
{ |
|
"epoch": 54.0, |
|
"eval_LOCATION_f1": 0.863013698630137, |
|
"eval_LOCATION_number": 69, |
|
"eval_LOCATION_precision": 0.8181818181818182, |
|
"eval_LOCATION_recall": 0.9130434782608695, |
|
"eval_ORGANIZATION_f1": 0.7107438016528926, |
|
"eval_ORGANIZATION_number": 58, |
|
"eval_ORGANIZATION_precision": 0.6825396825396826, |
|
"eval_ORGANIZATION_recall": 0.7413793103448276, |
|
"eval_PERSON_f1": 0.8454258675078864, |
|
"eval_PERSON_number": 152, |
|
"eval_PERSON_precision": 0.8121212121212121, |
|
"eval_PERSON_recall": 0.881578947368421, |
|
"eval_QUANTITY_f1": 0.7575757575757577, |
|
"eval_QUANTITY_number": 30, |
|
"eval_QUANTITY_precision": 0.6944444444444444, |
|
"eval_QUANTITY_recall": 0.8333333333333334, |
|
"eval_TIME_f1": 0.7741935483870968, |
|
"eval_TIME_number": 29, |
|
"eval_TIME_precision": 0.7272727272727273, |
|
"eval_TIME_recall": 0.8275862068965517, |
|
"eval_loss": 0.12707680463790894, |
|
"eval_overall_accuracy": 0.9605633802816902, |
|
"eval_overall_f1": 0.8117977528089887, |
|
"eval_overall_precision": 0.7727272727272727, |
|
"eval_overall_recall": 0.8550295857988166, |
|
"eval_runtime": 0.2859, |
|
"eval_samples_per_second": 654.16, |
|
"eval_steps_per_second": 10.495, |
|
"step": 5724 |
|
}, |
|
{ |
|
"epoch": 55.0, |
|
"grad_norm": 1.227086067199707, |
|
"learning_rate": 2.25e-05, |
|
"loss": 0.0937, |
|
"step": 5830 |
|
}, |
|
{ |
|
"epoch": 55.0, |
|
"eval_LOCATION_f1": 0.863013698630137, |
|
"eval_LOCATION_number": 69, |
|
"eval_LOCATION_precision": 0.8181818181818182, |
|
"eval_LOCATION_recall": 0.9130434782608695, |
|
"eval_ORGANIZATION_f1": 0.75, |
|
"eval_ORGANIZATION_number": 58, |
|
"eval_ORGANIZATION_precision": 0.6857142857142857, |
|
"eval_ORGANIZATION_recall": 0.8275862068965517, |
|
"eval_PERSON_f1": 0.8580441640378549, |
|
"eval_PERSON_number": 152, |
|
"eval_PERSON_precision": 0.8242424242424242, |
|
"eval_PERSON_recall": 0.8947368421052632, |
|
"eval_QUANTITY_f1": 0.746268656716418, |
|
"eval_QUANTITY_number": 30, |
|
"eval_QUANTITY_precision": 0.6756756756756757, |
|
"eval_QUANTITY_recall": 0.8333333333333334, |
|
"eval_TIME_f1": 0.7868852459016394, |
|
"eval_TIME_number": 29, |
|
"eval_TIME_precision": 0.75, |
|
"eval_TIME_recall": 0.8275862068965517, |
|
"eval_loss": 0.12925828993320465, |
|
"eval_overall_accuracy": 0.9613316261203585, |
|
"eval_overall_f1": 0.82336578581363, |
|
"eval_overall_precision": 0.7769028871391076, |
|
"eval_overall_recall": 0.8757396449704142, |
|
"eval_runtime": 0.2871, |
|
"eval_samples_per_second": 651.355, |
|
"eval_steps_per_second": 10.45, |
|
"step": 5830 |
|
}, |
|
{ |
|
"epoch": 56.0, |
|
"grad_norm": 0.898246169090271, |
|
"learning_rate": 2.2000000000000003e-05, |
|
"loss": 0.092, |
|
"step": 5936 |
|
}, |
|
{ |
|
"epoch": 56.0, |
|
"eval_LOCATION_f1": 0.863013698630137, |
|
"eval_LOCATION_number": 69, |
|
"eval_LOCATION_precision": 0.8181818181818182, |
|
"eval_LOCATION_recall": 0.9130434782608695, |
|
"eval_ORGANIZATION_f1": 0.6890756302521007, |
|
"eval_ORGANIZATION_number": 58, |
|
"eval_ORGANIZATION_precision": 0.6721311475409836, |
|
"eval_ORGANIZATION_recall": 0.7068965517241379, |
|
"eval_PERSON_f1": 0.8490566037735849, |
|
"eval_PERSON_number": 152, |
|
"eval_PERSON_precision": 0.8132530120481928, |
|
"eval_PERSON_recall": 0.8881578947368421, |
|
"eval_QUANTITY_f1": 0.7692307692307692, |
|
"eval_QUANTITY_number": 30, |
|
"eval_QUANTITY_precision": 0.7142857142857143, |
|
"eval_QUANTITY_recall": 0.8333333333333334, |
|
"eval_TIME_f1": 0.7741935483870968, |
|
"eval_TIME_number": 29, |
|
"eval_TIME_precision": 0.7272727272727273, |
|
"eval_TIME_recall": 0.8275862068965517, |
|
"eval_loss": 0.12755441665649414, |
|
"eval_overall_accuracy": 0.9605633802816902, |
|
"eval_overall_f1": 0.8112676056338027, |
|
"eval_overall_precision": 0.7741935483870968, |
|
"eval_overall_recall": 0.8520710059171598, |
|
"eval_runtime": 0.287, |
|
"eval_samples_per_second": 651.657, |
|
"eval_steps_per_second": 10.454, |
|
"step": 5936 |
|
}, |
|
{ |
|
"epoch": 57.0, |
|
"grad_norm": 0.8911055326461792, |
|
"learning_rate": 2.15e-05, |
|
"loss": 0.0908, |
|
"step": 6042 |
|
}, |
|
{ |
|
"epoch": 57.0, |
|
"eval_LOCATION_f1": 0.863013698630137, |
|
"eval_LOCATION_number": 69, |
|
"eval_LOCATION_precision": 0.8181818181818182, |
|
"eval_LOCATION_recall": 0.9130434782608695, |
|
"eval_ORGANIZATION_f1": 0.7154471544715447, |
|
"eval_ORGANIZATION_number": 58, |
|
"eval_ORGANIZATION_precision": 0.676923076923077, |
|
"eval_ORGANIZATION_recall": 0.7586206896551724, |
|
"eval_PERSON_f1": 0.8500000000000001, |
|
"eval_PERSON_number": 152, |
|
"eval_PERSON_precision": 0.8095238095238095, |
|
"eval_PERSON_recall": 0.8947368421052632, |
|
"eval_QUANTITY_f1": 0.7692307692307692, |
|
"eval_QUANTITY_number": 30, |
|
"eval_QUANTITY_precision": 0.7142857142857143, |
|
"eval_QUANTITY_recall": 0.8333333333333334, |
|
"eval_TIME_f1": 0.7741935483870968, |
|
"eval_TIME_number": 29, |
|
"eval_TIME_precision": 0.7272727272727273, |
|
"eval_TIME_recall": 0.8275862068965517, |
|
"eval_loss": 0.12887853384017944, |
|
"eval_overall_accuracy": 0.9605633802816902, |
|
"eval_overall_f1": 0.8156424581005586, |
|
"eval_overall_precision": 0.7724867724867724, |
|
"eval_overall_recall": 0.863905325443787, |
|
"eval_runtime": 0.2871, |
|
"eval_samples_per_second": 651.377, |
|
"eval_steps_per_second": 10.45, |
|
"step": 6042 |
|
}, |
|
{ |
|
"epoch": 58.0, |
|
"grad_norm": 1.0402631759643555, |
|
"learning_rate": 2.1e-05, |
|
"loss": 0.089, |
|
"step": 6148 |
|
}, |
|
{ |
|
"epoch": 58.0, |
|
"eval_LOCATION_f1": 0.863013698630137, |
|
"eval_LOCATION_number": 69, |
|
"eval_LOCATION_precision": 0.8181818181818182, |
|
"eval_LOCATION_recall": 0.9130434782608695, |
|
"eval_ORGANIZATION_f1": 0.7642276422764227, |
|
"eval_ORGANIZATION_number": 58, |
|
"eval_ORGANIZATION_precision": 0.7230769230769231, |
|
"eval_ORGANIZATION_recall": 0.8103448275862069, |
|
"eval_PERSON_f1": 0.8500000000000001, |
|
"eval_PERSON_number": 152, |
|
"eval_PERSON_precision": 0.8095238095238095, |
|
"eval_PERSON_recall": 0.8947368421052632, |
|
"eval_QUANTITY_f1": 0.78125, |
|
"eval_QUANTITY_number": 30, |
|
"eval_QUANTITY_precision": 0.7352941176470589, |
|
"eval_QUANTITY_recall": 0.8333333333333334, |
|
"eval_TIME_f1": 0.7868852459016394, |
|
"eval_TIME_number": 29, |
|
"eval_TIME_precision": 0.75, |
|
"eval_TIME_recall": 0.8275862068965517, |
|
"eval_loss": 0.12682482600212097, |
|
"eval_overall_accuracy": 0.9620998719590269, |
|
"eval_overall_f1": 0.8263305322128851, |
|
"eval_overall_precision": 0.7845744680851063, |
|
"eval_overall_recall": 0.8727810650887574, |
|
"eval_runtime": 0.2875, |
|
"eval_samples_per_second": 650.326, |
|
"eval_steps_per_second": 10.433, |
|
"step": 6148 |
|
}, |
|
{ |
|
"epoch": 59.0, |
|
"grad_norm": 1.190384864807129, |
|
"learning_rate": 2.05e-05, |
|
"loss": 0.089, |
|
"step": 6254 |
|
}, |
|
{ |
|
"epoch": 59.0, |
|
"eval_LOCATION_f1": 0.863013698630137, |
|
"eval_LOCATION_number": 69, |
|
"eval_LOCATION_precision": 0.8181818181818182, |
|
"eval_LOCATION_recall": 0.9130434782608695, |
|
"eval_ORGANIZATION_f1": 0.7438016528925621, |
|
"eval_ORGANIZATION_number": 58, |
|
"eval_ORGANIZATION_precision": 0.7142857142857143, |
|
"eval_ORGANIZATION_recall": 0.7758620689655172, |
|
"eval_PERSON_f1": 0.8490566037735849, |
|
"eval_PERSON_number": 152, |
|
"eval_PERSON_precision": 0.8132530120481928, |
|
"eval_PERSON_recall": 0.8881578947368421, |
|
"eval_QUANTITY_f1": 0.7692307692307692, |
|
"eval_QUANTITY_number": 30, |
|
"eval_QUANTITY_precision": 0.7142857142857143, |
|
"eval_QUANTITY_recall": 0.8333333333333334, |
|
"eval_TIME_f1": 0.8135593220338982, |
|
"eval_TIME_number": 29, |
|
"eval_TIME_precision": 0.8, |
|
"eval_TIME_recall": 0.8275862068965517, |
|
"eval_loss": 0.12504172325134277, |
|
"eval_overall_accuracy": 0.9618437900128041, |
|
"eval_overall_f1": 0.8236953455571228, |
|
"eval_overall_precision": 0.7870619946091644, |
|
"eval_overall_recall": 0.863905325443787, |
|
"eval_runtime": 0.2873, |
|
"eval_samples_per_second": 650.873, |
|
"eval_steps_per_second": 10.442, |
|
"step": 6254 |
|
}, |
|
{ |
|
"epoch": 60.0, |
|
"grad_norm": 1.0693303346633911, |
|
"learning_rate": 2e-05, |
|
"loss": 0.0885, |
|
"step": 6360 |
|
}, |
|
{ |
|
"epoch": 60.0, |
|
"eval_LOCATION_f1": 0.863013698630137, |
|
"eval_LOCATION_number": 69, |
|
"eval_LOCATION_precision": 0.8181818181818182, |
|
"eval_LOCATION_recall": 0.9130434782608695, |
|
"eval_ORGANIZATION_f1": 0.736, |
|
"eval_ORGANIZATION_number": 58, |
|
"eval_ORGANIZATION_precision": 0.6865671641791045, |
|
"eval_ORGANIZATION_recall": 0.7931034482758621, |
|
"eval_PERSON_f1": 0.8625, |
|
"eval_PERSON_number": 152, |
|
"eval_PERSON_precision": 0.8214285714285714, |
|
"eval_PERSON_recall": 0.9078947368421053, |
|
"eval_QUANTITY_f1": 0.7164179104477612, |
|
"eval_QUANTITY_number": 30, |
|
"eval_QUANTITY_precision": 0.6486486486486487, |
|
"eval_QUANTITY_recall": 0.8, |
|
"eval_TIME_f1": 0.7741935483870968, |
|
"eval_TIME_number": 29, |
|
"eval_TIME_precision": 0.7272727272727273, |
|
"eval_TIME_recall": 0.8275862068965517, |
|
"eval_loss": 0.13093435764312744, |
|
"eval_overall_accuracy": 0.9600512163892445, |
|
"eval_overall_f1": 0.8194444444444444, |
|
"eval_overall_precision": 0.7722513089005235, |
|
"eval_overall_recall": 0.8727810650887574, |
|
"eval_runtime": 0.2863, |
|
"eval_samples_per_second": 653.072, |
|
"eval_steps_per_second": 10.477, |
|
"step": 6360 |
|
}, |
|
{ |
|
"epoch": 61.0, |
|
"grad_norm": 1.5080128908157349, |
|
"learning_rate": 1.9500000000000003e-05, |
|
"loss": 0.0883, |
|
"step": 6466 |
|
}, |
|
{ |
|
"epoch": 61.0, |
|
"eval_LOCATION_f1": 0.863013698630137, |
|
"eval_LOCATION_number": 69, |
|
"eval_LOCATION_precision": 0.8181818181818182, |
|
"eval_LOCATION_recall": 0.9130434782608695, |
|
"eval_ORGANIZATION_f1": 0.7272727272727273, |
|
"eval_ORGANIZATION_number": 58, |
|
"eval_ORGANIZATION_precision": 0.6984126984126984, |
|
"eval_ORGANIZATION_recall": 0.7586206896551724, |
|
"eval_PERSON_f1": 0.860759493670886, |
|
"eval_PERSON_number": 152, |
|
"eval_PERSON_precision": 0.8292682926829268, |
|
"eval_PERSON_recall": 0.8947368421052632, |
|
"eval_QUANTITY_f1": 0.78125, |
|
"eval_QUANTITY_number": 30, |
|
"eval_QUANTITY_precision": 0.7352941176470589, |
|
"eval_QUANTITY_recall": 0.8333333333333334, |
|
"eval_TIME_f1": 0.7868852459016394, |
|
"eval_TIME_number": 29, |
|
"eval_TIME_precision": 0.75, |
|
"eval_TIME_recall": 0.8275862068965517, |
|
"eval_loss": 0.12579382956027985, |
|
"eval_overall_accuracy": 0.9618437900128041, |
|
"eval_overall_f1": 0.8248587570621468, |
|
"eval_overall_precision": 0.7891891891891892, |
|
"eval_overall_recall": 0.863905325443787, |
|
"eval_runtime": 0.286, |
|
"eval_samples_per_second": 653.832, |
|
"eval_steps_per_second": 10.489, |
|
"step": 6466 |
|
}, |
|
{ |
|
"epoch": 62.0, |
|
"grad_norm": 1.7690495252609253, |
|
"learning_rate": 1.9e-05, |
|
"loss": 0.0896, |
|
"step": 6572 |
|
}, |
|
{ |
|
"epoch": 62.0, |
|
"eval_LOCATION_f1": 0.863013698630137, |
|
"eval_LOCATION_number": 69, |
|
"eval_LOCATION_precision": 0.8181818181818182, |
|
"eval_LOCATION_recall": 0.9130434782608695, |
|
"eval_ORGANIZATION_f1": 0.7166666666666668, |
|
"eval_ORGANIZATION_number": 58, |
|
"eval_ORGANIZATION_precision": 0.6935483870967742, |
|
"eval_ORGANIZATION_recall": 0.7413793103448276, |
|
"eval_PERSON_f1": 0.8616352201257862, |
|
"eval_PERSON_number": 152, |
|
"eval_PERSON_precision": 0.8253012048192772, |
|
"eval_PERSON_recall": 0.9013157894736842, |
|
"eval_QUANTITY_f1": 0.78125, |
|
"eval_QUANTITY_number": 30, |
|
"eval_QUANTITY_precision": 0.7352941176470589, |
|
"eval_QUANTITY_recall": 0.8333333333333334, |
|
"eval_TIME_f1": 0.7868852459016394, |
|
"eval_TIME_number": 29, |
|
"eval_TIME_precision": 0.75, |
|
"eval_TIME_recall": 0.8275862068965517, |
|
"eval_loss": 0.1268462985754013, |
|
"eval_overall_accuracy": 0.9610755441741358, |
|
"eval_overall_f1": 0.8236953455571228, |
|
"eval_overall_precision": 0.7870619946091644, |
|
"eval_overall_recall": 0.863905325443787, |
|
"eval_runtime": 0.2866, |
|
"eval_samples_per_second": 652.454, |
|
"eval_steps_per_second": 10.467, |
|
"step": 6572 |
|
}, |
|
{ |
|
"epoch": 63.0, |
|
"grad_norm": 0.6065536737442017, |
|
"learning_rate": 1.85e-05, |
|
"loss": 0.0893, |
|
"step": 6678 |
|
}, |
|
{ |
|
"epoch": 63.0, |
|
"eval_LOCATION_f1": 0.863013698630137, |
|
"eval_LOCATION_number": 69, |
|
"eval_LOCATION_precision": 0.8181818181818182, |
|
"eval_LOCATION_recall": 0.9130434782608695, |
|
"eval_ORGANIZATION_f1": 0.7226890756302522, |
|
"eval_ORGANIZATION_number": 58, |
|
"eval_ORGANIZATION_precision": 0.7049180327868853, |
|
"eval_ORGANIZATION_recall": 0.7413793103448276, |
|
"eval_PERSON_f1": 0.8643533123028391, |
|
"eval_PERSON_number": 152, |
|
"eval_PERSON_precision": 0.8303030303030303, |
|
"eval_PERSON_recall": 0.9013157894736842, |
|
"eval_QUANTITY_f1": 0.7575757575757577, |
|
"eval_QUANTITY_number": 30, |
|
"eval_QUANTITY_precision": 0.6944444444444444, |
|
"eval_QUANTITY_recall": 0.8333333333333334, |
|
"eval_TIME_f1": 0.7999999999999999, |
|
"eval_TIME_number": 29, |
|
"eval_TIME_precision": 0.7741935483870968, |
|
"eval_TIME_recall": 0.8275862068965517, |
|
"eval_loss": 0.12584134936332703, |
|
"eval_overall_accuracy": 0.9615877080665813, |
|
"eval_overall_f1": 0.8248587570621468, |
|
"eval_overall_precision": 0.7891891891891892, |
|
"eval_overall_recall": 0.863905325443787, |
|
"eval_runtime": 0.287, |
|
"eval_samples_per_second": 651.556, |
|
"eval_steps_per_second": 10.453, |
|
"step": 6678 |
|
}, |
|
{ |
|
"epoch": 64.0, |
|
"grad_norm": 1.3564276695251465, |
|
"learning_rate": 1.8e-05, |
|
"loss": 0.089, |
|
"step": 6784 |
|
}, |
|
{ |
|
"epoch": 64.0, |
|
"eval_LOCATION_f1": 0.8513513513513514, |
|
"eval_LOCATION_number": 69, |
|
"eval_LOCATION_precision": 0.7974683544303798, |
|
"eval_LOCATION_recall": 0.9130434782608695, |
|
"eval_ORGANIZATION_f1": 0.7559055118110236, |
|
"eval_ORGANIZATION_number": 58, |
|
"eval_ORGANIZATION_precision": 0.6956521739130435, |
|
"eval_ORGANIZATION_recall": 0.8275862068965517, |
|
"eval_PERSON_f1": 0.8742138364779874, |
|
"eval_PERSON_number": 152, |
|
"eval_PERSON_precision": 0.8373493975903614, |
|
"eval_PERSON_recall": 0.9144736842105263, |
|
"eval_QUANTITY_f1": 0.7164179104477612, |
|
"eval_QUANTITY_number": 30, |
|
"eval_QUANTITY_precision": 0.6486486486486487, |
|
"eval_QUANTITY_recall": 0.8, |
|
"eval_TIME_f1": 0.7419354838709677, |
|
"eval_TIME_number": 29, |
|
"eval_TIME_precision": 0.696969696969697, |
|
"eval_TIME_recall": 0.7931034482758621, |
|
"eval_loss": 0.1324695646762848, |
|
"eval_overall_accuracy": 0.9603072983354674, |
|
"eval_overall_f1": 0.8227146814404432, |
|
"eval_overall_precision": 0.7734375, |
|
"eval_overall_recall": 0.878698224852071, |
|
"eval_runtime": 0.2869, |
|
"eval_samples_per_second": 651.773, |
|
"eval_steps_per_second": 10.456, |
|
"step": 6784 |
|
}, |
|
{ |
|
"epoch": 65.0, |
|
"grad_norm": 1.3449146747589111, |
|
"learning_rate": 1.75e-05, |
|
"loss": 0.0892, |
|
"step": 6890 |
|
}, |
|
{ |
|
"epoch": 65.0, |
|
"eval_LOCATION_f1": 0.8571428571428572, |
|
"eval_LOCATION_number": 69, |
|
"eval_LOCATION_precision": 0.8076923076923077, |
|
"eval_LOCATION_recall": 0.9130434782608695, |
|
"eval_ORGANIZATION_f1": 0.7559055118110236, |
|
"eval_ORGANIZATION_number": 58, |
|
"eval_ORGANIZATION_precision": 0.6956521739130435, |
|
"eval_ORGANIZATION_recall": 0.8275862068965517, |
|
"eval_PERSON_f1": 0.8742138364779874, |
|
"eval_PERSON_number": 152, |
|
"eval_PERSON_precision": 0.8373493975903614, |
|
"eval_PERSON_recall": 0.9144736842105263, |
|
"eval_QUANTITY_f1": 0.7164179104477612, |
|
"eval_QUANTITY_number": 30, |
|
"eval_QUANTITY_precision": 0.6486486486486487, |
|
"eval_QUANTITY_recall": 0.8, |
|
"eval_TIME_f1": 0.7868852459016394, |
|
"eval_TIME_number": 29, |
|
"eval_TIME_precision": 0.75, |
|
"eval_TIME_recall": 0.8275862068965517, |
|
"eval_loss": 0.13169027864933014, |
|
"eval_overall_accuracy": 0.9613316261203585, |
|
"eval_overall_f1": 0.8277777777777778, |
|
"eval_overall_precision": 0.7801047120418848, |
|
"eval_overall_recall": 0.8816568047337278, |
|
"eval_runtime": 0.2858, |
|
"eval_samples_per_second": 654.304, |
|
"eval_steps_per_second": 10.497, |
|
"step": 6890 |
|
}, |
|
{ |
|
"epoch": 66.0, |
|
"grad_norm": 1.0803149938583374, |
|
"learning_rate": 1.7000000000000003e-05, |
|
"loss": 0.0877, |
|
"step": 6996 |
|
}, |
|
{ |
|
"epoch": 66.0, |
|
"eval_LOCATION_f1": 0.863013698630137, |
|
"eval_LOCATION_number": 69, |
|
"eval_LOCATION_precision": 0.8181818181818182, |
|
"eval_LOCATION_recall": 0.9130434782608695, |
|
"eval_ORGANIZATION_f1": 0.7540983606557378, |
|
"eval_ORGANIZATION_number": 58, |
|
"eval_ORGANIZATION_precision": 0.71875, |
|
"eval_ORGANIZATION_recall": 0.7931034482758621, |
|
"eval_PERSON_f1": 0.8616352201257862, |
|
"eval_PERSON_number": 152, |
|
"eval_PERSON_precision": 0.8253012048192772, |
|
"eval_PERSON_recall": 0.9013157894736842, |
|
"eval_QUANTITY_f1": 0.7575757575757577, |
|
"eval_QUANTITY_number": 30, |
|
"eval_QUANTITY_precision": 0.6944444444444444, |
|
"eval_QUANTITY_recall": 0.8333333333333334, |
|
"eval_TIME_f1": 0.7868852459016394, |
|
"eval_TIME_number": 29, |
|
"eval_TIME_precision": 0.75, |
|
"eval_TIME_recall": 0.8275862068965517, |
|
"eval_loss": 0.12896300852298737, |
|
"eval_overall_accuracy": 0.9620998719590269, |
|
"eval_overall_f1": 0.8274894810659188, |
|
"eval_overall_precision": 0.7866666666666666, |
|
"eval_overall_recall": 0.8727810650887574, |
|
"eval_runtime": 0.287, |
|
"eval_samples_per_second": 651.516, |
|
"eval_steps_per_second": 10.452, |
|
"step": 6996 |
|
}, |
|
{ |
|
"epoch": 67.0, |
|
"grad_norm": 0.9663069248199463, |
|
"learning_rate": 1.65e-05, |
|
"loss": 0.0856, |
|
"step": 7102 |
|
}, |
|
{ |
|
"epoch": 67.0, |
|
"eval_LOCATION_f1": 0.8571428571428572, |
|
"eval_LOCATION_number": 69, |
|
"eval_LOCATION_precision": 0.8076923076923077, |
|
"eval_LOCATION_recall": 0.9130434782608695, |
|
"eval_ORGANIZATION_f1": 0.7540983606557378, |
|
"eval_ORGANIZATION_number": 58, |
|
"eval_ORGANIZATION_precision": 0.71875, |
|
"eval_ORGANIZATION_recall": 0.7931034482758621, |
|
"eval_PERSON_f1": 0.8761904761904762, |
|
"eval_PERSON_number": 152, |
|
"eval_PERSON_precision": 0.8466257668711656, |
|
"eval_PERSON_recall": 0.9078947368421053, |
|
"eval_QUANTITY_f1": 0.746268656716418, |
|
"eval_QUANTITY_number": 30, |
|
"eval_QUANTITY_precision": 0.6756756756756757, |
|
"eval_QUANTITY_recall": 0.8333333333333334, |
|
"eval_TIME_f1": 0.7741935483870968, |
|
"eval_TIME_number": 29, |
|
"eval_TIME_precision": 0.7272727272727273, |
|
"eval_TIME_recall": 0.8275862068965517, |
|
"eval_loss": 0.13050326704978943, |
|
"eval_overall_accuracy": 0.9615877080665813, |
|
"eval_overall_f1": 0.8302945301542777, |
|
"eval_overall_precision": 0.7893333333333333, |
|
"eval_overall_recall": 0.8757396449704142, |
|
"eval_runtime": 0.2875, |
|
"eval_samples_per_second": 650.493, |
|
"eval_steps_per_second": 10.436, |
|
"step": 7102 |
|
}, |
|
{ |
|
"epoch": 68.0, |
|
"grad_norm": 0.8305689692497253, |
|
"learning_rate": 1.6000000000000003e-05, |
|
"loss": 0.0862, |
|
"step": 7208 |
|
}, |
|
{ |
|
"epoch": 68.0, |
|
"eval_LOCATION_f1": 0.8571428571428572, |
|
"eval_LOCATION_number": 69, |
|
"eval_LOCATION_precision": 0.8076923076923077, |
|
"eval_LOCATION_recall": 0.9130434782608695, |
|
"eval_ORGANIZATION_f1": 0.765625, |
|
"eval_ORGANIZATION_number": 58, |
|
"eval_ORGANIZATION_precision": 0.7, |
|
"eval_ORGANIZATION_recall": 0.8448275862068966, |
|
"eval_PERSON_f1": 0.8742138364779874, |
|
"eval_PERSON_number": 152, |
|
"eval_PERSON_precision": 0.8373493975903614, |
|
"eval_PERSON_recall": 0.9144736842105263, |
|
"eval_QUANTITY_f1": 0.7164179104477612, |
|
"eval_QUANTITY_number": 30, |
|
"eval_QUANTITY_precision": 0.6486486486486487, |
|
"eval_QUANTITY_recall": 0.8, |
|
"eval_TIME_f1": 0.7540983606557378, |
|
"eval_TIME_number": 29, |
|
"eval_TIME_precision": 0.71875, |
|
"eval_TIME_recall": 0.7931034482758621, |
|
"eval_loss": 0.1334487646818161, |
|
"eval_overall_accuracy": 0.9610755441741358, |
|
"eval_overall_f1": 0.826629680998613, |
|
"eval_overall_precision": 0.7780678851174935, |
|
"eval_overall_recall": 0.8816568047337278, |
|
"eval_runtime": 0.2862, |
|
"eval_samples_per_second": 653.302, |
|
"eval_steps_per_second": 10.481, |
|
"step": 7208 |
|
}, |
|
{ |
|
"epoch": 69.0, |
|
"grad_norm": 1.218758463859558, |
|
"learning_rate": 1.55e-05, |
|
"loss": 0.0867, |
|
"step": 7314 |
|
}, |
|
{ |
|
"epoch": 69.0, |
|
"eval_LOCATION_f1": 0.8571428571428572, |
|
"eval_LOCATION_number": 69, |
|
"eval_LOCATION_precision": 0.8076923076923077, |
|
"eval_LOCATION_recall": 0.9130434782608695, |
|
"eval_ORGANIZATION_f1": 0.7419354838709677, |
|
"eval_ORGANIZATION_number": 58, |
|
"eval_ORGANIZATION_precision": 0.696969696969697, |
|
"eval_ORGANIZATION_recall": 0.7931034482758621, |
|
"eval_PERSON_f1": 0.8769716088328074, |
|
"eval_PERSON_number": 152, |
|
"eval_PERSON_precision": 0.8424242424242424, |
|
"eval_PERSON_recall": 0.9144736842105263, |
|
"eval_QUANTITY_f1": 0.7692307692307692, |
|
"eval_QUANTITY_number": 30, |
|
"eval_QUANTITY_precision": 0.7142857142857143, |
|
"eval_QUANTITY_recall": 0.8333333333333334, |
|
"eval_TIME_f1": 0.7868852459016394, |
|
"eval_TIME_number": 29, |
|
"eval_TIME_precision": 0.75, |
|
"eval_TIME_recall": 0.8275862068965517, |
|
"eval_loss": 0.13092464208602905, |
|
"eval_overall_accuracy": 0.9620998719590269, |
|
"eval_overall_f1": 0.8319327731092437, |
|
"eval_overall_precision": 0.7898936170212766, |
|
"eval_overall_recall": 0.878698224852071, |
|
"eval_runtime": 0.2862, |
|
"eval_samples_per_second": 653.309, |
|
"eval_steps_per_second": 10.481, |
|
"step": 7314 |
|
}, |
|
{ |
|
"epoch": 70.0, |
|
"grad_norm": 2.1350855827331543, |
|
"learning_rate": 1.5e-05, |
|
"loss": 0.0845, |
|
"step": 7420 |
|
}, |
|
{ |
|
"epoch": 70.0, |
|
"eval_LOCATION_f1": 0.863013698630137, |
|
"eval_LOCATION_number": 69, |
|
"eval_LOCATION_precision": 0.8181818181818182, |
|
"eval_LOCATION_recall": 0.9130434782608695, |
|
"eval_ORGANIZATION_f1": 0.7058823529411765, |
|
"eval_ORGANIZATION_number": 58, |
|
"eval_ORGANIZATION_precision": 0.6885245901639344, |
|
"eval_ORGANIZATION_recall": 0.7241379310344828, |
|
"eval_PERSON_f1": 0.8670886075949367, |
|
"eval_PERSON_number": 152, |
|
"eval_PERSON_precision": 0.8353658536585366, |
|
"eval_PERSON_recall": 0.9013157894736842, |
|
"eval_QUANTITY_f1": 0.78125, |
|
"eval_QUANTITY_number": 30, |
|
"eval_QUANTITY_precision": 0.7352941176470589, |
|
"eval_QUANTITY_recall": 0.8333333333333334, |
|
"eval_TIME_f1": 0.7999999999999999, |
|
"eval_TIME_number": 29, |
|
"eval_TIME_precision": 0.7741935483870968, |
|
"eval_TIME_recall": 0.8275862068965517, |
|
"eval_loss": 0.1256009340286255, |
|
"eval_overall_accuracy": 0.9623559539052496, |
|
"eval_overall_f1": 0.8255319148936171, |
|
"eval_overall_precision": 0.7929155313351499, |
|
"eval_overall_recall": 0.8609467455621301, |
|
"eval_runtime": 0.2864, |
|
"eval_samples_per_second": 652.871, |
|
"eval_steps_per_second": 10.474, |
|
"step": 7420 |
|
}, |
|
{ |
|
"epoch": 71.0, |
|
"grad_norm": 0.7863230109214783, |
|
"learning_rate": 1.45e-05, |
|
"loss": 0.0864, |
|
"step": 7526 |
|
}, |
|
{ |
|
"epoch": 71.0, |
|
"eval_LOCATION_f1": 0.863013698630137, |
|
"eval_LOCATION_number": 69, |
|
"eval_LOCATION_precision": 0.8181818181818182, |
|
"eval_LOCATION_recall": 0.9130434782608695, |
|
"eval_ORGANIZATION_f1": 0.7377049180327868, |
|
"eval_ORGANIZATION_number": 58, |
|
"eval_ORGANIZATION_precision": 0.703125, |
|
"eval_ORGANIZATION_recall": 0.7758620689655172, |
|
"eval_PERSON_f1": 0.8526645768025078, |
|
"eval_PERSON_number": 152, |
|
"eval_PERSON_precision": 0.8143712574850299, |
|
"eval_PERSON_recall": 0.8947368421052632, |
|
"eval_QUANTITY_f1": 0.7936507936507938, |
|
"eval_QUANTITY_number": 30, |
|
"eval_QUANTITY_precision": 0.7575757575757576, |
|
"eval_QUANTITY_recall": 0.8333333333333334, |
|
"eval_TIME_f1": 0.7999999999999999, |
|
"eval_TIME_number": 29, |
|
"eval_TIME_precision": 0.7741935483870968, |
|
"eval_TIME_recall": 0.8275862068965517, |
|
"eval_loss": 0.12498261779546738, |
|
"eval_overall_accuracy": 0.9620998719590269, |
|
"eval_overall_f1": 0.8253521126760562, |
|
"eval_overall_precision": 0.7876344086021505, |
|
"eval_overall_recall": 0.8668639053254438, |
|
"eval_runtime": 0.2858, |
|
"eval_samples_per_second": 654.227, |
|
"eval_steps_per_second": 10.496, |
|
"step": 7526 |
|
}, |
|
{ |
|
"epoch": 72.0, |
|
"grad_norm": 0.7980266809463501, |
|
"learning_rate": 1.4000000000000001e-05, |
|
"loss": 0.0854, |
|
"step": 7632 |
|
}, |
|
{ |
|
"epoch": 72.0, |
|
"eval_LOCATION_f1": 0.8571428571428572, |
|
"eval_LOCATION_number": 69, |
|
"eval_LOCATION_precision": 0.8076923076923077, |
|
"eval_LOCATION_recall": 0.9130434782608695, |
|
"eval_ORGANIZATION_f1": 0.7479674796747967, |
|
"eval_ORGANIZATION_number": 58, |
|
"eval_ORGANIZATION_precision": 0.7076923076923077, |
|
"eval_ORGANIZATION_recall": 0.7931034482758621, |
|
"eval_PERSON_f1": 0.8761904761904762, |
|
"eval_PERSON_number": 152, |
|
"eval_PERSON_precision": 0.8466257668711656, |
|
"eval_PERSON_recall": 0.9078947368421053, |
|
"eval_QUANTITY_f1": 0.7692307692307692, |
|
"eval_QUANTITY_number": 30, |
|
"eval_QUANTITY_precision": 0.7142857142857143, |
|
"eval_QUANTITY_recall": 0.8333333333333334, |
|
"eval_TIME_f1": 0.7999999999999999, |
|
"eval_TIME_number": 29, |
|
"eval_TIME_precision": 0.7741935483870968, |
|
"eval_TIME_recall": 0.8275862068965517, |
|
"eval_loss": 0.12747858464717865, |
|
"eval_overall_accuracy": 0.9633802816901409, |
|
"eval_overall_f1": 0.8338028169014083, |
|
"eval_overall_precision": 0.7956989247311828, |
|
"eval_overall_recall": 0.8757396449704142, |
|
"eval_runtime": 0.2867, |
|
"eval_samples_per_second": 652.26, |
|
"eval_steps_per_second": 10.464, |
|
"step": 7632 |
|
}, |
|
{ |
|
"epoch": 73.0, |
|
"grad_norm": 1.180917739868164, |
|
"learning_rate": 1.3500000000000001e-05, |
|
"loss": 0.0843, |
|
"step": 7738 |
|
}, |
|
{ |
|
"epoch": 73.0, |
|
"eval_LOCATION_f1": 0.8571428571428572, |
|
"eval_LOCATION_number": 69, |
|
"eval_LOCATION_precision": 0.8076923076923077, |
|
"eval_LOCATION_recall": 0.9130434782608695, |
|
"eval_ORGANIZATION_f1": 0.7166666666666668, |
|
"eval_ORGANIZATION_number": 58, |
|
"eval_ORGANIZATION_precision": 0.6935483870967742, |
|
"eval_ORGANIZATION_recall": 0.7413793103448276, |
|
"eval_PERSON_f1": 0.8670886075949367, |
|
"eval_PERSON_number": 152, |
|
"eval_PERSON_precision": 0.8353658536585366, |
|
"eval_PERSON_recall": 0.9013157894736842, |
|
"eval_QUANTITY_f1": 0.761904761904762, |
|
"eval_QUANTITY_number": 30, |
|
"eval_QUANTITY_precision": 0.7272727272727273, |
|
"eval_QUANTITY_recall": 0.8, |
|
"eval_TIME_f1": 0.7999999999999999, |
|
"eval_TIME_number": 29, |
|
"eval_TIME_precision": 0.7741935483870968, |
|
"eval_TIME_recall": 0.8275862068965517, |
|
"eval_loss": 0.12380669265985489, |
|
"eval_overall_accuracy": 0.9618437900128041, |
|
"eval_overall_f1": 0.8243626062322946, |
|
"eval_overall_precision": 0.7907608695652174, |
|
"eval_overall_recall": 0.8609467455621301, |
|
"eval_runtime": 0.2872, |
|
"eval_samples_per_second": 651.041, |
|
"eval_steps_per_second": 10.445, |
|
"step": 7738 |
|
}, |
|
{ |
|
"epoch": 74.0, |
|
"grad_norm": 1.4001702070236206, |
|
"learning_rate": 1.3000000000000001e-05, |
|
"loss": 0.0871, |
|
"step": 7844 |
|
}, |
|
{ |
|
"epoch": 74.0, |
|
"eval_LOCATION_f1": 0.8513513513513514, |
|
"eval_LOCATION_number": 69, |
|
"eval_LOCATION_precision": 0.7974683544303798, |
|
"eval_LOCATION_recall": 0.9130434782608695, |
|
"eval_ORGANIZATION_f1": 0.7741935483870968, |
|
"eval_ORGANIZATION_number": 58, |
|
"eval_ORGANIZATION_precision": 0.7272727272727273, |
|
"eval_ORGANIZATION_recall": 0.8275862068965517, |
|
"eval_PERSON_f1": 0.8734177215189874, |
|
"eval_PERSON_number": 152, |
|
"eval_PERSON_precision": 0.8414634146341463, |
|
"eval_PERSON_recall": 0.9078947368421053, |
|
"eval_QUANTITY_f1": 0.7692307692307692, |
|
"eval_QUANTITY_number": 30, |
|
"eval_QUANTITY_precision": 0.7142857142857143, |
|
"eval_QUANTITY_recall": 0.8333333333333334, |
|
"eval_TIME_f1": 0.7999999999999999, |
|
"eval_TIME_number": 29, |
|
"eval_TIME_precision": 0.7741935483870968, |
|
"eval_TIME_recall": 0.8275862068965517, |
|
"eval_loss": 0.12895327806472778, |
|
"eval_overall_accuracy": 0.9623559539052496, |
|
"eval_overall_f1": 0.8359046283309958, |
|
"eval_overall_precision": 0.7946666666666666, |
|
"eval_overall_recall": 0.8816568047337278, |
|
"eval_runtime": 0.2856, |
|
"eval_samples_per_second": 654.718, |
|
"eval_steps_per_second": 10.503, |
|
"step": 7844 |
|
}, |
|
{ |
|
"epoch": 75.0, |
|
"grad_norm": 2.398920774459839, |
|
"learning_rate": 1.25e-05, |
|
"loss": 0.0836, |
|
"step": 7950 |
|
}, |
|
{ |
|
"epoch": 75.0, |
|
"eval_LOCATION_f1": 0.8571428571428572, |
|
"eval_LOCATION_number": 69, |
|
"eval_LOCATION_precision": 0.8076923076923077, |
|
"eval_LOCATION_recall": 0.9130434782608695, |
|
"eval_ORGANIZATION_f1": 0.7642276422764227, |
|
"eval_ORGANIZATION_number": 58, |
|
"eval_ORGANIZATION_precision": 0.7230769230769231, |
|
"eval_ORGANIZATION_recall": 0.8103448275862069, |
|
"eval_PERSON_f1": 0.8698412698412699, |
|
"eval_PERSON_number": 152, |
|
"eval_PERSON_precision": 0.8404907975460123, |
|
"eval_PERSON_recall": 0.9013157894736842, |
|
"eval_QUANTITY_f1": 0.7692307692307692, |
|
"eval_QUANTITY_number": 30, |
|
"eval_QUANTITY_precision": 0.7142857142857143, |
|
"eval_QUANTITY_recall": 0.8333333333333334, |
|
"eval_TIME_f1": 0.7999999999999999, |
|
"eval_TIME_number": 29, |
|
"eval_TIME_precision": 0.7741935483870968, |
|
"eval_TIME_recall": 0.8275862068965517, |
|
"eval_loss": 0.12761665880680084, |
|
"eval_overall_accuracy": 0.9626120358514725, |
|
"eval_overall_f1": 0.8338028169014083, |
|
"eval_overall_precision": 0.7956989247311828, |
|
"eval_overall_recall": 0.8757396449704142, |
|
"eval_runtime": 0.2871, |
|
"eval_samples_per_second": 651.419, |
|
"eval_steps_per_second": 10.451, |
|
"step": 7950 |
|
}, |
|
{ |
|
"epoch": 76.0, |
|
"grad_norm": 1.136534333229065, |
|
"learning_rate": 1.2e-05, |
|
"loss": 0.0825, |
|
"step": 8056 |
|
}, |
|
{ |
|
"epoch": 76.0, |
|
"eval_LOCATION_f1": 0.8513513513513514, |
|
"eval_LOCATION_number": 69, |
|
"eval_LOCATION_precision": 0.7974683544303798, |
|
"eval_LOCATION_recall": 0.9130434782608695, |
|
"eval_ORGANIZATION_f1": 0.7741935483870968, |
|
"eval_ORGANIZATION_number": 58, |
|
"eval_ORGANIZATION_precision": 0.7272727272727273, |
|
"eval_ORGANIZATION_recall": 0.8275862068965517, |
|
"eval_PERSON_f1": 0.8734177215189874, |
|
"eval_PERSON_number": 152, |
|
"eval_PERSON_precision": 0.8414634146341463, |
|
"eval_PERSON_recall": 0.9078947368421053, |
|
"eval_QUANTITY_f1": 0.7692307692307692, |
|
"eval_QUANTITY_number": 30, |
|
"eval_QUANTITY_precision": 0.7142857142857143, |
|
"eval_QUANTITY_recall": 0.8333333333333334, |
|
"eval_TIME_f1": 0.7999999999999999, |
|
"eval_TIME_number": 29, |
|
"eval_TIME_precision": 0.7741935483870968, |
|
"eval_TIME_recall": 0.8275862068965517, |
|
"eval_loss": 0.12773388624191284, |
|
"eval_overall_accuracy": 0.9623559539052496, |
|
"eval_overall_f1": 0.8359046283309958, |
|
"eval_overall_precision": 0.7946666666666666, |
|
"eval_overall_recall": 0.8816568047337278, |
|
"eval_runtime": 0.2872, |
|
"eval_samples_per_second": 651.096, |
|
"eval_steps_per_second": 10.445, |
|
"step": 8056 |
|
}, |
|
{ |
|
"epoch": 77.0, |
|
"grad_norm": 0.9836848974227905, |
|
"learning_rate": 1.1500000000000002e-05, |
|
"loss": 0.0838, |
|
"step": 8162 |
|
}, |
|
{ |
|
"epoch": 77.0, |
|
"eval_LOCATION_f1": 0.8571428571428572, |
|
"eval_LOCATION_number": 69, |
|
"eval_LOCATION_precision": 0.8076923076923077, |
|
"eval_LOCATION_recall": 0.9130434782608695, |
|
"eval_ORGANIZATION_f1": 0.7642276422764227, |
|
"eval_ORGANIZATION_number": 58, |
|
"eval_ORGANIZATION_precision": 0.7230769230769231, |
|
"eval_ORGANIZATION_recall": 0.8103448275862069, |
|
"eval_PERSON_f1": 0.8634920634920634, |
|
"eval_PERSON_number": 152, |
|
"eval_PERSON_precision": 0.8343558282208589, |
|
"eval_PERSON_recall": 0.8947368421052632, |
|
"eval_QUANTITY_f1": 0.78125, |
|
"eval_QUANTITY_number": 30, |
|
"eval_QUANTITY_precision": 0.7352941176470589, |
|
"eval_QUANTITY_recall": 0.8333333333333334, |
|
"eval_TIME_f1": 0.7999999999999999, |
|
"eval_TIME_number": 29, |
|
"eval_TIME_precision": 0.7741935483870968, |
|
"eval_TIME_recall": 0.8275862068965517, |
|
"eval_loss": 0.12512867152690887, |
|
"eval_overall_accuracy": 0.9620998719590269, |
|
"eval_overall_f1": 0.8321579689703809, |
|
"eval_overall_precision": 0.7951482479784366, |
|
"eval_overall_recall": 0.8727810650887574, |
|
"eval_runtime": 0.2862, |
|
"eval_samples_per_second": 653.375, |
|
"eval_steps_per_second": 10.482, |
|
"step": 8162 |
|
}, |
|
{ |
|
"epoch": 78.0, |
|
"grad_norm": 0.9845781326293945, |
|
"learning_rate": 1.1000000000000001e-05, |
|
"loss": 0.0846, |
|
"step": 8268 |
|
}, |
|
{ |
|
"epoch": 78.0, |
|
"eval_LOCATION_f1": 0.8571428571428572, |
|
"eval_LOCATION_number": 69, |
|
"eval_LOCATION_precision": 0.8076923076923077, |
|
"eval_LOCATION_recall": 0.9130434782608695, |
|
"eval_ORGANIZATION_f1": 0.7580645161290323, |
|
"eval_ORGANIZATION_number": 58, |
|
"eval_ORGANIZATION_precision": 0.7121212121212122, |
|
"eval_ORGANIZATION_recall": 0.8103448275862069, |
|
"eval_PERSON_f1": 0.8698412698412699, |
|
"eval_PERSON_number": 152, |
|
"eval_PERSON_precision": 0.8404907975460123, |
|
"eval_PERSON_recall": 0.9013157894736842, |
|
"eval_QUANTITY_f1": 0.78125, |
|
"eval_QUANTITY_number": 30, |
|
"eval_QUANTITY_precision": 0.7352941176470589, |
|
"eval_QUANTITY_recall": 0.8333333333333334, |
|
"eval_TIME_f1": 0.7999999999999999, |
|
"eval_TIME_number": 29, |
|
"eval_TIME_precision": 0.7741935483870968, |
|
"eval_TIME_recall": 0.8275862068965517, |
|
"eval_loss": 0.12692533433437347, |
|
"eval_overall_accuracy": 0.9626120358514725, |
|
"eval_overall_f1": 0.8338028169014083, |
|
"eval_overall_precision": 0.7956989247311828, |
|
"eval_overall_recall": 0.8757396449704142, |
|
"eval_runtime": 0.2872, |
|
"eval_samples_per_second": 651.198, |
|
"eval_steps_per_second": 10.447, |
|
"step": 8268 |
|
}, |
|
{ |
|
"epoch": 79.0, |
|
"grad_norm": 0.7519234418869019, |
|
"learning_rate": 1.05e-05, |
|
"loss": 0.0845, |
|
"step": 8374 |
|
}, |
|
{ |
|
"epoch": 79.0, |
|
"eval_LOCATION_f1": 0.8571428571428572, |
|
"eval_LOCATION_number": 69, |
|
"eval_LOCATION_precision": 0.8076923076923077, |
|
"eval_LOCATION_recall": 0.9130434782608695, |
|
"eval_ORGANIZATION_f1": 0.7580645161290323, |
|
"eval_ORGANIZATION_number": 58, |
|
"eval_ORGANIZATION_precision": 0.7121212121212122, |
|
"eval_ORGANIZATION_recall": 0.8103448275862069, |
|
"eval_PERSON_f1": 0.8670886075949367, |
|
"eval_PERSON_number": 152, |
|
"eval_PERSON_precision": 0.8353658536585366, |
|
"eval_PERSON_recall": 0.9013157894736842, |
|
"eval_QUANTITY_f1": 0.78125, |
|
"eval_QUANTITY_number": 30, |
|
"eval_QUANTITY_precision": 0.7352941176470589, |
|
"eval_QUANTITY_recall": 0.8333333333333334, |
|
"eval_TIME_f1": 0.7999999999999999, |
|
"eval_TIME_number": 29, |
|
"eval_TIME_precision": 0.7741935483870968, |
|
"eval_TIME_recall": 0.8275862068965517, |
|
"eval_loss": 0.12639828026294708, |
|
"eval_overall_accuracy": 0.9626120358514725, |
|
"eval_overall_f1": 0.8326300984528833, |
|
"eval_overall_precision": 0.7935656836461126, |
|
"eval_overall_recall": 0.8757396449704142, |
|
"eval_runtime": 0.286, |
|
"eval_samples_per_second": 653.821, |
|
"eval_steps_per_second": 10.489, |
|
"step": 8374 |
|
}, |
|
{ |
|
"epoch": 80.0, |
|
"grad_norm": 0.60317462682724, |
|
"learning_rate": 1e-05, |
|
"loss": 0.0816, |
|
"step": 8480 |
|
}, |
|
{ |
|
"epoch": 80.0, |
|
"eval_LOCATION_f1": 0.8513513513513514, |
|
"eval_LOCATION_number": 69, |
|
"eval_LOCATION_precision": 0.7974683544303798, |
|
"eval_LOCATION_recall": 0.9130434782608695, |
|
"eval_ORGANIZATION_f1": 0.7777777777777778, |
|
"eval_ORGANIZATION_number": 58, |
|
"eval_ORGANIZATION_precision": 0.7205882352941176, |
|
"eval_ORGANIZATION_recall": 0.8448275862068966, |
|
"eval_PERSON_f1": 0.8643533123028391, |
|
"eval_PERSON_number": 152, |
|
"eval_PERSON_precision": 0.8303030303030303, |
|
"eval_PERSON_recall": 0.9013157894736842, |
|
"eval_QUANTITY_f1": 0.7692307692307692, |
|
"eval_QUANTITY_number": 30, |
|
"eval_QUANTITY_precision": 0.7142857142857143, |
|
"eval_QUANTITY_recall": 0.8333333333333334, |
|
"eval_TIME_f1": 0.7540983606557378, |
|
"eval_TIME_number": 29, |
|
"eval_TIME_precision": 0.71875, |
|
"eval_TIME_recall": 0.7931034482758621, |
|
"eval_loss": 0.129006490111351, |
|
"eval_overall_accuracy": 0.9623559539052496, |
|
"eval_overall_f1": 0.8284518828451882, |
|
"eval_overall_precision": 0.783641160949868, |
|
"eval_overall_recall": 0.878698224852071, |
|
"eval_runtime": 0.2865, |
|
"eval_samples_per_second": 652.715, |
|
"eval_steps_per_second": 10.471, |
|
"step": 8480 |
|
}, |
|
{ |
|
"epoch": 81.0, |
|
"grad_norm": 1.9326316118240356, |
|
"learning_rate": 9.5e-06, |
|
"loss": 0.0821, |
|
"step": 8586 |
|
}, |
|
{ |
|
"epoch": 81.0, |
|
"eval_LOCATION_f1": 0.8571428571428572, |
|
"eval_LOCATION_number": 69, |
|
"eval_LOCATION_precision": 0.8076923076923077, |
|
"eval_LOCATION_recall": 0.9130434782608695, |
|
"eval_ORGANIZATION_f1": 0.7580645161290323, |
|
"eval_ORGANIZATION_number": 58, |
|
"eval_ORGANIZATION_precision": 0.7121212121212122, |
|
"eval_ORGANIZATION_recall": 0.8103448275862069, |
|
"eval_PERSON_f1": 0.8670886075949367, |
|
"eval_PERSON_number": 152, |
|
"eval_PERSON_precision": 0.8353658536585366, |
|
"eval_PERSON_recall": 0.9013157894736842, |
|
"eval_QUANTITY_f1": 0.78125, |
|
"eval_QUANTITY_number": 30, |
|
"eval_QUANTITY_precision": 0.7352941176470589, |
|
"eval_QUANTITY_recall": 0.8333333333333334, |
|
"eval_TIME_f1": 0.7999999999999999, |
|
"eval_TIME_number": 29, |
|
"eval_TIME_precision": 0.7741935483870968, |
|
"eval_TIME_recall": 0.8275862068965517, |
|
"eval_loss": 0.12803098559379578, |
|
"eval_overall_accuracy": 0.9626120358514725, |
|
"eval_overall_f1": 0.8326300984528833, |
|
"eval_overall_precision": 0.7935656836461126, |
|
"eval_overall_recall": 0.8757396449704142, |
|
"eval_runtime": 0.2882, |
|
"eval_samples_per_second": 648.79, |
|
"eval_steps_per_second": 10.408, |
|
"step": 8586 |
|
}, |
|
{ |
|
"epoch": 82.0, |
|
"grad_norm": 0.8638326525688171, |
|
"learning_rate": 9e-06, |
|
"loss": 0.0823, |
|
"step": 8692 |
|
}, |
|
{ |
|
"epoch": 82.0, |
|
"eval_LOCATION_f1": 0.8571428571428572, |
|
"eval_LOCATION_number": 69, |
|
"eval_LOCATION_precision": 0.8076923076923077, |
|
"eval_LOCATION_recall": 0.9130434782608695, |
|
"eval_ORGANIZATION_f1": 0.7777777777777778, |
|
"eval_ORGANIZATION_number": 58, |
|
"eval_ORGANIZATION_precision": 0.7205882352941176, |
|
"eval_ORGANIZATION_recall": 0.8448275862068966, |
|
"eval_PERSON_f1": 0.8769716088328074, |
|
"eval_PERSON_number": 152, |
|
"eval_PERSON_precision": 0.8424242424242424, |
|
"eval_PERSON_recall": 0.9144736842105263, |
|
"eval_QUANTITY_f1": 0.7692307692307692, |
|
"eval_QUANTITY_number": 30, |
|
"eval_QUANTITY_precision": 0.7142857142857143, |
|
"eval_QUANTITY_recall": 0.8333333333333334, |
|
"eval_TIME_f1": 0.7540983606557378, |
|
"eval_TIME_number": 29, |
|
"eval_TIME_precision": 0.71875, |
|
"eval_TIME_recall": 0.7931034482758621, |
|
"eval_loss": 0.13058307766914368, |
|
"eval_overall_accuracy": 0.963124199743918, |
|
"eval_overall_f1": 0.835195530726257, |
|
"eval_overall_precision": 0.791005291005291, |
|
"eval_overall_recall": 0.8846153846153846, |
|
"eval_runtime": 0.2878, |
|
"eval_samples_per_second": 649.709, |
|
"eval_steps_per_second": 10.423, |
|
"step": 8692 |
|
}, |
|
{ |
|
"epoch": 83.0, |
|
"grad_norm": 1.4908857345581055, |
|
"learning_rate": 8.500000000000002e-06, |
|
"loss": 0.082, |
|
"step": 8798 |
|
}, |
|
{ |
|
"epoch": 83.0, |
|
"eval_LOCATION_f1": 0.8571428571428572, |
|
"eval_LOCATION_number": 69, |
|
"eval_LOCATION_precision": 0.8076923076923077, |
|
"eval_LOCATION_recall": 0.9130434782608695, |
|
"eval_ORGANIZATION_f1": 0.7642276422764227, |
|
"eval_ORGANIZATION_number": 58, |
|
"eval_ORGANIZATION_precision": 0.7230769230769231, |
|
"eval_ORGANIZATION_recall": 0.8103448275862069, |
|
"eval_PERSON_f1": 0.8634920634920634, |
|
"eval_PERSON_number": 152, |
|
"eval_PERSON_precision": 0.8343558282208589, |
|
"eval_PERSON_recall": 0.8947368421052632, |
|
"eval_QUANTITY_f1": 0.78125, |
|
"eval_QUANTITY_number": 30, |
|
"eval_QUANTITY_precision": 0.7352941176470589, |
|
"eval_QUANTITY_recall": 0.8333333333333334, |
|
"eval_TIME_f1": 0.7999999999999999, |
|
"eval_TIME_number": 29, |
|
"eval_TIME_precision": 0.7741935483870968, |
|
"eval_TIME_recall": 0.8275862068965517, |
|
"eval_loss": 0.12721218168735504, |
|
"eval_overall_accuracy": 0.9626120358514725, |
|
"eval_overall_f1": 0.8321579689703809, |
|
"eval_overall_precision": 0.7951482479784366, |
|
"eval_overall_recall": 0.8727810650887574, |
|
"eval_runtime": 0.2865, |
|
"eval_samples_per_second": 652.793, |
|
"eval_steps_per_second": 10.473, |
|
"step": 8798 |
|
}, |
|
{ |
|
"epoch": 84.0, |
|
"grad_norm": 1.9748855829238892, |
|
"learning_rate": 8.000000000000001e-06, |
|
"loss": 0.0796, |
|
"step": 8904 |
|
}, |
|
{ |
|
"epoch": 84.0, |
|
"eval_LOCATION_f1": 0.8571428571428572, |
|
"eval_LOCATION_number": 69, |
|
"eval_LOCATION_precision": 0.8076923076923077, |
|
"eval_LOCATION_recall": 0.9130434782608695, |
|
"eval_ORGANIZATION_f1": 0.7580645161290323, |
|
"eval_ORGANIZATION_number": 58, |
|
"eval_ORGANIZATION_precision": 0.7121212121212122, |
|
"eval_ORGANIZATION_recall": 0.8103448275862069, |
|
"eval_PERSON_f1": 0.8698412698412699, |
|
"eval_PERSON_number": 152, |
|
"eval_PERSON_precision": 0.8404907975460123, |
|
"eval_PERSON_recall": 0.9013157894736842, |
|
"eval_QUANTITY_f1": 0.7692307692307692, |
|
"eval_QUANTITY_number": 30, |
|
"eval_QUANTITY_precision": 0.7142857142857143, |
|
"eval_QUANTITY_recall": 0.8333333333333334, |
|
"eval_TIME_f1": 0.7666666666666667, |
|
"eval_TIME_number": 29, |
|
"eval_TIME_precision": 0.7419354838709677, |
|
"eval_TIME_recall": 0.7931034482758621, |
|
"eval_loss": 0.1286100149154663, |
|
"eval_overall_accuracy": 0.9620998719590269, |
|
"eval_overall_f1": 0.829817158931083, |
|
"eval_overall_precision": 0.7908847184986595, |
|
"eval_overall_recall": 0.8727810650887574, |
|
"eval_runtime": 0.2859, |
|
"eval_samples_per_second": 654.048, |
|
"eval_steps_per_second": 10.493, |
|
"step": 8904 |
|
}, |
|
{ |
|
"epoch": 85.0, |
|
"grad_norm": 1.6315678358078003, |
|
"learning_rate": 7.5e-06, |
|
"loss": 0.082, |
|
"step": 9010 |
|
}, |
|
{ |
|
"epoch": 85.0, |
|
"eval_LOCATION_f1": 0.8571428571428572, |
|
"eval_LOCATION_number": 69, |
|
"eval_LOCATION_precision": 0.8076923076923077, |
|
"eval_LOCATION_recall": 0.9130434782608695, |
|
"eval_ORGANIZATION_f1": 0.7642276422764227, |
|
"eval_ORGANIZATION_number": 58, |
|
"eval_ORGANIZATION_precision": 0.7230769230769231, |
|
"eval_ORGANIZATION_recall": 0.8103448275862069, |
|
"eval_PERSON_f1": 0.8634920634920634, |
|
"eval_PERSON_number": 152, |
|
"eval_PERSON_precision": 0.8343558282208589, |
|
"eval_PERSON_recall": 0.8947368421052632, |
|
"eval_QUANTITY_f1": 0.7692307692307692, |
|
"eval_QUANTITY_number": 30, |
|
"eval_QUANTITY_precision": 0.7142857142857143, |
|
"eval_QUANTITY_recall": 0.8333333333333334, |
|
"eval_TIME_f1": 0.7666666666666667, |
|
"eval_TIME_number": 29, |
|
"eval_TIME_precision": 0.7419354838709677, |
|
"eval_TIME_recall": 0.7931034482758621, |
|
"eval_loss": 0.1274917721748352, |
|
"eval_overall_accuracy": 0.9618437900128041, |
|
"eval_overall_f1": 0.828169014084507, |
|
"eval_overall_precision": 0.7903225806451613, |
|
"eval_overall_recall": 0.8698224852071006, |
|
"eval_runtime": 0.2868, |
|
"eval_samples_per_second": 651.959, |
|
"eval_steps_per_second": 10.459, |
|
"step": 9010 |
|
}, |
|
{ |
|
"epoch": 86.0, |
|
"grad_norm": 2.9988150596618652, |
|
"learning_rate": 7.000000000000001e-06, |
|
"loss": 0.0827, |
|
"step": 9116 |
|
}, |
|
{ |
|
"epoch": 86.0, |
|
"eval_LOCATION_f1": 0.8571428571428572, |
|
"eval_LOCATION_number": 69, |
|
"eval_LOCATION_precision": 0.8076923076923077, |
|
"eval_LOCATION_recall": 0.9130434782608695, |
|
"eval_ORGANIZATION_f1": 0.7642276422764227, |
|
"eval_ORGANIZATION_number": 58, |
|
"eval_ORGANIZATION_precision": 0.7230769230769231, |
|
"eval_ORGANIZATION_recall": 0.8103448275862069, |
|
"eval_PERSON_f1": 0.8698412698412699, |
|
"eval_PERSON_number": 152, |
|
"eval_PERSON_precision": 0.8404907975460123, |
|
"eval_PERSON_recall": 0.9013157894736842, |
|
"eval_QUANTITY_f1": 0.7692307692307692, |
|
"eval_QUANTITY_number": 30, |
|
"eval_QUANTITY_precision": 0.7142857142857143, |
|
"eval_QUANTITY_recall": 0.8333333333333334, |
|
"eval_TIME_f1": 0.7999999999999999, |
|
"eval_TIME_number": 29, |
|
"eval_TIME_precision": 0.7741935483870968, |
|
"eval_TIME_recall": 0.8275862068965517, |
|
"eval_loss": 0.12789824604988098, |
|
"eval_overall_accuracy": 0.9620998719590269, |
|
"eval_overall_f1": 0.8338028169014083, |
|
"eval_overall_precision": 0.7956989247311828, |
|
"eval_overall_recall": 0.8757396449704142, |
|
"eval_runtime": 0.2874, |
|
"eval_samples_per_second": 650.709, |
|
"eval_steps_per_second": 10.439, |
|
"step": 9116 |
|
}, |
|
{ |
|
"epoch": 87.0, |
|
"grad_norm": 2.0143356323242188, |
|
"learning_rate": 6.5000000000000004e-06, |
|
"loss": 0.0819, |
|
"step": 9222 |
|
}, |
|
{ |
|
"epoch": 87.0, |
|
"eval_LOCATION_f1": 0.8571428571428572, |
|
"eval_LOCATION_number": 69, |
|
"eval_LOCATION_precision": 0.8076923076923077, |
|
"eval_LOCATION_recall": 0.9130434782608695, |
|
"eval_ORGANIZATION_f1": 0.7642276422764227, |
|
"eval_ORGANIZATION_number": 58, |
|
"eval_ORGANIZATION_precision": 0.7230769230769231, |
|
"eval_ORGANIZATION_recall": 0.8103448275862069, |
|
"eval_PERSON_f1": 0.8769716088328074, |
|
"eval_PERSON_number": 152, |
|
"eval_PERSON_precision": 0.8424242424242424, |
|
"eval_PERSON_recall": 0.9144736842105263, |
|
"eval_QUANTITY_f1": 0.78125, |
|
"eval_QUANTITY_number": 30, |
|
"eval_QUANTITY_precision": 0.7352941176470589, |
|
"eval_QUANTITY_recall": 0.8333333333333334, |
|
"eval_TIME_f1": 0.7999999999999999, |
|
"eval_TIME_number": 29, |
|
"eval_TIME_precision": 0.7741935483870968, |
|
"eval_TIME_recall": 0.8275862068965517, |
|
"eval_loss": 0.12826670706272125, |
|
"eval_overall_accuracy": 0.9623559539052496, |
|
"eval_overall_f1": 0.8382559774964837, |
|
"eval_overall_precision": 0.7989276139410187, |
|
"eval_overall_recall": 0.8816568047337278, |
|
"eval_runtime": 0.2871, |
|
"eval_samples_per_second": 651.319, |
|
"eval_steps_per_second": 10.449, |
|
"step": 9222 |
|
}, |
|
{ |
|
"epoch": 88.0, |
|
"grad_norm": 1.0121877193450928, |
|
"learning_rate": 6e-06, |
|
"loss": 0.0775, |
|
"step": 9328 |
|
}, |
|
{ |
|
"epoch": 88.0, |
|
"eval_LOCATION_f1": 0.8571428571428572, |
|
"eval_LOCATION_number": 69, |
|
"eval_LOCATION_precision": 0.8076923076923077, |
|
"eval_LOCATION_recall": 0.9130434782608695, |
|
"eval_ORGANIZATION_f1": 0.7642276422764227, |
|
"eval_ORGANIZATION_number": 58, |
|
"eval_ORGANIZATION_precision": 0.7230769230769231, |
|
"eval_ORGANIZATION_recall": 0.8103448275862069, |
|
"eval_PERSON_f1": 0.8643533123028391, |
|
"eval_PERSON_number": 152, |
|
"eval_PERSON_precision": 0.8303030303030303, |
|
"eval_PERSON_recall": 0.9013157894736842, |
|
"eval_QUANTITY_f1": 0.78125, |
|
"eval_QUANTITY_number": 30, |
|
"eval_QUANTITY_precision": 0.7352941176470589, |
|
"eval_QUANTITY_recall": 0.8333333333333334, |
|
"eval_TIME_f1": 0.7999999999999999, |
|
"eval_TIME_number": 29, |
|
"eval_TIME_precision": 0.7741935483870968, |
|
"eval_TIME_recall": 0.8275862068965517, |
|
"eval_loss": 0.12668804824352264, |
|
"eval_overall_accuracy": 0.9626120358514725, |
|
"eval_overall_f1": 0.8326300984528833, |
|
"eval_overall_precision": 0.7935656836461126, |
|
"eval_overall_recall": 0.8757396449704142, |
|
"eval_runtime": 0.286, |
|
"eval_samples_per_second": 653.86, |
|
"eval_steps_per_second": 10.49, |
|
"step": 9328 |
|
}, |
|
{ |
|
"epoch": 89.0, |
|
"grad_norm": 0.6306910514831543, |
|
"learning_rate": 5.500000000000001e-06, |
|
"loss": 0.0784, |
|
"step": 9434 |
|
}, |
|
{ |
|
"epoch": 89.0, |
|
"eval_LOCATION_f1": 0.8571428571428572, |
|
"eval_LOCATION_number": 69, |
|
"eval_LOCATION_precision": 0.8076923076923077, |
|
"eval_LOCATION_recall": 0.9130434782608695, |
|
"eval_ORGANIZATION_f1": 0.7642276422764227, |
|
"eval_ORGANIZATION_number": 58, |
|
"eval_ORGANIZATION_precision": 0.7230769230769231, |
|
"eval_ORGANIZATION_recall": 0.8103448275862069, |
|
"eval_PERSON_f1": 0.8734177215189874, |
|
"eval_PERSON_number": 152, |
|
"eval_PERSON_precision": 0.8414634146341463, |
|
"eval_PERSON_recall": 0.9078947368421053, |
|
"eval_QUANTITY_f1": 0.7692307692307692, |
|
"eval_QUANTITY_number": 30, |
|
"eval_QUANTITY_precision": 0.7142857142857143, |
|
"eval_QUANTITY_recall": 0.8333333333333334, |
|
"eval_TIME_f1": 0.7666666666666667, |
|
"eval_TIME_number": 29, |
|
"eval_TIME_precision": 0.7419354838709677, |
|
"eval_TIME_recall": 0.7931034482758621, |
|
"eval_loss": 0.12889203429222107, |
|
"eval_overall_accuracy": 0.9618437900128041, |
|
"eval_overall_f1": 0.8326300984528833, |
|
"eval_overall_precision": 0.7935656836461126, |
|
"eval_overall_recall": 0.8757396449704142, |
|
"eval_runtime": 0.2862, |
|
"eval_samples_per_second": 653.368, |
|
"eval_steps_per_second": 10.482, |
|
"step": 9434 |
|
}, |
|
{ |
|
"epoch": 90.0, |
|
"grad_norm": 1.8310757875442505, |
|
"learning_rate": 5e-06, |
|
"loss": 0.0789, |
|
"step": 9540 |
|
}, |
|
{ |
|
"epoch": 90.0, |
|
"eval_LOCATION_f1": 0.8571428571428572, |
|
"eval_LOCATION_number": 69, |
|
"eval_LOCATION_precision": 0.8076923076923077, |
|
"eval_LOCATION_recall": 0.9130434782608695, |
|
"eval_ORGANIZATION_f1": 0.7642276422764227, |
|
"eval_ORGANIZATION_number": 58, |
|
"eval_ORGANIZATION_precision": 0.7230769230769231, |
|
"eval_ORGANIZATION_recall": 0.8103448275862069, |
|
"eval_PERSON_f1": 0.8634920634920634, |
|
"eval_PERSON_number": 152, |
|
"eval_PERSON_precision": 0.8343558282208589, |
|
"eval_PERSON_recall": 0.8947368421052632, |
|
"eval_QUANTITY_f1": 0.78125, |
|
"eval_QUANTITY_number": 30, |
|
"eval_QUANTITY_precision": 0.7352941176470589, |
|
"eval_QUANTITY_recall": 0.8333333333333334, |
|
"eval_TIME_f1": 0.7999999999999999, |
|
"eval_TIME_number": 29, |
|
"eval_TIME_precision": 0.7741935483870968, |
|
"eval_TIME_recall": 0.8275862068965517, |
|
"eval_loss": 0.12754952907562256, |
|
"eval_overall_accuracy": 0.9626120358514725, |
|
"eval_overall_f1": 0.8321579689703809, |
|
"eval_overall_precision": 0.7951482479784366, |
|
"eval_overall_recall": 0.8727810650887574, |
|
"eval_runtime": 0.2868, |
|
"eval_samples_per_second": 652.02, |
|
"eval_steps_per_second": 10.46, |
|
"step": 9540 |
|
}, |
|
{ |
|
"epoch": 91.0, |
|
"grad_norm": 1.1900731325149536, |
|
"learning_rate": 4.5e-06, |
|
"loss": 0.0808, |
|
"step": 9646 |
|
}, |
|
{ |
|
"epoch": 91.0, |
|
"eval_LOCATION_f1": 0.8571428571428572, |
|
"eval_LOCATION_number": 69, |
|
"eval_LOCATION_precision": 0.8076923076923077, |
|
"eval_LOCATION_recall": 0.9130434782608695, |
|
"eval_ORGANIZATION_f1": 0.7741935483870968, |
|
"eval_ORGANIZATION_number": 58, |
|
"eval_ORGANIZATION_precision": 0.7272727272727273, |
|
"eval_ORGANIZATION_recall": 0.8275862068965517, |
|
"eval_PERSON_f1": 0.8734177215189874, |
|
"eval_PERSON_number": 152, |
|
"eval_PERSON_precision": 0.8414634146341463, |
|
"eval_PERSON_recall": 0.9078947368421053, |
|
"eval_QUANTITY_f1": 0.7575757575757577, |
|
"eval_QUANTITY_number": 30, |
|
"eval_QUANTITY_precision": 0.6944444444444444, |
|
"eval_QUANTITY_recall": 0.8333333333333334, |
|
"eval_TIME_f1": 0.7666666666666667, |
|
"eval_TIME_number": 29, |
|
"eval_TIME_precision": 0.7419354838709677, |
|
"eval_TIME_recall": 0.7931034482758621, |
|
"eval_loss": 0.1293194442987442, |
|
"eval_overall_accuracy": 0.9623559539052496, |
|
"eval_overall_f1": 0.8330995792426368, |
|
"eval_overall_precision": 0.792, |
|
"eval_overall_recall": 0.878698224852071, |
|
"eval_runtime": 0.2862, |
|
"eval_samples_per_second": 653.306, |
|
"eval_steps_per_second": 10.481, |
|
"step": 9646 |
|
}, |
|
{ |
|
"epoch": 92.0, |
|
"grad_norm": 1.54060959815979, |
|
"learning_rate": 4.000000000000001e-06, |
|
"loss": 0.0788, |
|
"step": 9752 |
|
}, |
|
{ |
|
"epoch": 92.0, |
|
"eval_LOCATION_f1": 0.8571428571428572, |
|
"eval_LOCATION_number": 69, |
|
"eval_LOCATION_precision": 0.8076923076923077, |
|
"eval_LOCATION_recall": 0.9130434782608695, |
|
"eval_ORGANIZATION_f1": 0.7642276422764227, |
|
"eval_ORGANIZATION_number": 58, |
|
"eval_ORGANIZATION_precision": 0.7230769230769231, |
|
"eval_ORGANIZATION_recall": 0.8103448275862069, |
|
"eval_PERSON_f1": 0.8634920634920634, |
|
"eval_PERSON_number": 152, |
|
"eval_PERSON_precision": 0.8343558282208589, |
|
"eval_PERSON_recall": 0.8947368421052632, |
|
"eval_QUANTITY_f1": 0.78125, |
|
"eval_QUANTITY_number": 30, |
|
"eval_QUANTITY_precision": 0.7352941176470589, |
|
"eval_QUANTITY_recall": 0.8333333333333334, |
|
"eval_TIME_f1": 0.7999999999999999, |
|
"eval_TIME_number": 29, |
|
"eval_TIME_precision": 0.7741935483870968, |
|
"eval_TIME_recall": 0.8275862068965517, |
|
"eval_loss": 0.12771408259868622, |
|
"eval_overall_accuracy": 0.9623559539052496, |
|
"eval_overall_f1": 0.8321579689703809, |
|
"eval_overall_precision": 0.7951482479784366, |
|
"eval_overall_recall": 0.8727810650887574, |
|
"eval_runtime": 0.2862, |
|
"eval_samples_per_second": 653.35, |
|
"eval_steps_per_second": 10.482, |
|
"step": 9752 |
|
}, |
|
{ |
|
"epoch": 93.0, |
|
"grad_norm": 0.6988396644592285, |
|
"learning_rate": 3.5000000000000004e-06, |
|
"loss": 0.0791, |
|
"step": 9858 |
|
}, |
|
{ |
|
"epoch": 93.0, |
|
"eval_LOCATION_f1": 0.8571428571428572, |
|
"eval_LOCATION_number": 69, |
|
"eval_LOCATION_precision": 0.8076923076923077, |
|
"eval_LOCATION_recall": 0.9130434782608695, |
|
"eval_ORGANIZATION_f1": 0.7741935483870968, |
|
"eval_ORGANIZATION_number": 58, |
|
"eval_ORGANIZATION_precision": 0.7272727272727273, |
|
"eval_ORGANIZATION_recall": 0.8275862068965517, |
|
"eval_PERSON_f1": 0.8734177215189874, |
|
"eval_PERSON_number": 152, |
|
"eval_PERSON_precision": 0.8414634146341463, |
|
"eval_PERSON_recall": 0.9078947368421053, |
|
"eval_QUANTITY_f1": 0.7575757575757577, |
|
"eval_QUANTITY_number": 30, |
|
"eval_QUANTITY_precision": 0.6944444444444444, |
|
"eval_QUANTITY_recall": 0.8333333333333334, |
|
"eval_TIME_f1": 0.7999999999999999, |
|
"eval_TIME_number": 29, |
|
"eval_TIME_precision": 0.7741935483870968, |
|
"eval_TIME_recall": 0.8275862068965517, |
|
"eval_loss": 0.12927231192588806, |
|
"eval_overall_accuracy": 0.9623559539052496, |
|
"eval_overall_f1": 0.8359046283309958, |
|
"eval_overall_precision": 0.7946666666666666, |
|
"eval_overall_recall": 0.8816568047337278, |
|
"eval_runtime": 0.2858, |
|
"eval_samples_per_second": 654.3, |
|
"eval_steps_per_second": 10.497, |
|
"step": 9858 |
|
}, |
|
{ |
|
"epoch": 94.0, |
|
"grad_norm": 1.71950364112854, |
|
"learning_rate": 3e-06, |
|
"loss": 0.0786, |
|
"step": 9964 |
|
}, |
|
{ |
|
"epoch": 94.0, |
|
"eval_LOCATION_f1": 0.8571428571428572, |
|
"eval_LOCATION_number": 69, |
|
"eval_LOCATION_precision": 0.8076923076923077, |
|
"eval_LOCATION_recall": 0.9130434782608695, |
|
"eval_ORGANIZATION_f1": 0.7642276422764227, |
|
"eval_ORGANIZATION_number": 58, |
|
"eval_ORGANIZATION_precision": 0.7230769230769231, |
|
"eval_ORGANIZATION_recall": 0.8103448275862069, |
|
"eval_PERSON_f1": 0.8670886075949367, |
|
"eval_PERSON_number": 152, |
|
"eval_PERSON_precision": 0.8353658536585366, |
|
"eval_PERSON_recall": 0.9013157894736842, |
|
"eval_QUANTITY_f1": 0.7692307692307692, |
|
"eval_QUANTITY_number": 30, |
|
"eval_QUANTITY_precision": 0.7142857142857143, |
|
"eval_QUANTITY_recall": 0.8333333333333334, |
|
"eval_TIME_f1": 0.7999999999999999, |
|
"eval_TIME_number": 29, |
|
"eval_TIME_precision": 0.7741935483870968, |
|
"eval_TIME_recall": 0.8275862068965517, |
|
"eval_loss": 0.12867045402526855, |
|
"eval_overall_accuracy": 0.9620998719590269, |
|
"eval_overall_f1": 0.8326300984528833, |
|
"eval_overall_precision": 0.7935656836461126, |
|
"eval_overall_recall": 0.8757396449704142, |
|
"eval_runtime": 0.2924, |
|
"eval_samples_per_second": 639.556, |
|
"eval_steps_per_second": 10.26, |
|
"step": 9964 |
|
}, |
|
{ |
|
"epoch": 95.0, |
|
"grad_norm": 0.9361959099769592, |
|
"learning_rate": 2.5e-06, |
|
"loss": 0.0788, |
|
"step": 10070 |
|
}, |
|
{ |
|
"epoch": 95.0, |
|
"eval_LOCATION_f1": 0.8571428571428572, |
|
"eval_LOCATION_number": 69, |
|
"eval_LOCATION_precision": 0.8076923076923077, |
|
"eval_LOCATION_recall": 0.9130434782608695, |
|
"eval_ORGANIZATION_f1": 0.7642276422764227, |
|
"eval_ORGANIZATION_number": 58, |
|
"eval_ORGANIZATION_precision": 0.7230769230769231, |
|
"eval_ORGANIZATION_recall": 0.8103448275862069, |
|
"eval_PERSON_f1": 0.8698412698412699, |
|
"eval_PERSON_number": 152, |
|
"eval_PERSON_precision": 0.8404907975460123, |
|
"eval_PERSON_recall": 0.9013157894736842, |
|
"eval_QUANTITY_f1": 0.7692307692307692, |
|
"eval_QUANTITY_number": 30, |
|
"eval_QUANTITY_precision": 0.7142857142857143, |
|
"eval_QUANTITY_recall": 0.8333333333333334, |
|
"eval_TIME_f1": 0.7999999999999999, |
|
"eval_TIME_number": 29, |
|
"eval_TIME_precision": 0.7741935483870968, |
|
"eval_TIME_recall": 0.8275862068965517, |
|
"eval_loss": 0.1285109966993332, |
|
"eval_overall_accuracy": 0.9620998719590269, |
|
"eval_overall_f1": 0.8338028169014083, |
|
"eval_overall_precision": 0.7956989247311828, |
|
"eval_overall_recall": 0.8757396449704142, |
|
"eval_runtime": 0.2879, |
|
"eval_samples_per_second": 649.541, |
|
"eval_steps_per_second": 10.42, |
|
"step": 10070 |
|
}, |
|
{ |
|
"epoch": 96.0, |
|
"grad_norm": 0.82219398021698, |
|
"learning_rate": 2.0000000000000003e-06, |
|
"loss": 0.0785, |
|
"step": 10176 |
|
}, |
|
{ |
|
"epoch": 96.0, |
|
"eval_LOCATION_f1": 0.8571428571428572, |
|
"eval_LOCATION_number": 69, |
|
"eval_LOCATION_precision": 0.8076923076923077, |
|
"eval_LOCATION_recall": 0.9130434782608695, |
|
"eval_ORGANIZATION_f1": 0.7642276422764227, |
|
"eval_ORGANIZATION_number": 58, |
|
"eval_ORGANIZATION_precision": 0.7230769230769231, |
|
"eval_ORGANIZATION_recall": 0.8103448275862069, |
|
"eval_PERSON_f1": 0.8769716088328074, |
|
"eval_PERSON_number": 152, |
|
"eval_PERSON_precision": 0.8424242424242424, |
|
"eval_PERSON_recall": 0.9144736842105263, |
|
"eval_QUANTITY_f1": 0.7575757575757577, |
|
"eval_QUANTITY_number": 30, |
|
"eval_QUANTITY_precision": 0.6944444444444444, |
|
"eval_QUANTITY_recall": 0.8333333333333334, |
|
"eval_TIME_f1": 0.7999999999999999, |
|
"eval_TIME_number": 29, |
|
"eval_TIME_precision": 0.7741935483870968, |
|
"eval_TIME_recall": 0.8275862068965517, |
|
"eval_loss": 0.12919461727142334, |
|
"eval_overall_accuracy": 0.9626120358514725, |
|
"eval_overall_f1": 0.8359046283309958, |
|
"eval_overall_precision": 0.7946666666666666, |
|
"eval_overall_recall": 0.8816568047337278, |
|
"eval_runtime": 0.2913, |
|
"eval_samples_per_second": 641.926, |
|
"eval_steps_per_second": 10.298, |
|
"step": 10176 |
|
}, |
|
{ |
|
"epoch": 97.0, |
|
"grad_norm": 1.4223874807357788, |
|
"learning_rate": 1.5e-06, |
|
"loss": 0.082, |
|
"step": 10282 |
|
}, |
|
{ |
|
"epoch": 97.0, |
|
"eval_LOCATION_f1": 0.8571428571428572, |
|
"eval_LOCATION_number": 69, |
|
"eval_LOCATION_precision": 0.8076923076923077, |
|
"eval_LOCATION_recall": 0.9130434782608695, |
|
"eval_ORGANIZATION_f1": 0.7642276422764227, |
|
"eval_ORGANIZATION_number": 58, |
|
"eval_ORGANIZATION_precision": 0.7230769230769231, |
|
"eval_ORGANIZATION_recall": 0.8103448275862069, |
|
"eval_PERSON_f1": 0.8698412698412699, |
|
"eval_PERSON_number": 152, |
|
"eval_PERSON_precision": 0.8404907975460123, |
|
"eval_PERSON_recall": 0.9013157894736842, |
|
"eval_QUANTITY_f1": 0.7575757575757577, |
|
"eval_QUANTITY_number": 30, |
|
"eval_QUANTITY_precision": 0.6944444444444444, |
|
"eval_QUANTITY_recall": 0.8333333333333334, |
|
"eval_TIME_f1": 0.7999999999999999, |
|
"eval_TIME_number": 29, |
|
"eval_TIME_precision": 0.7741935483870968, |
|
"eval_TIME_recall": 0.8275862068965517, |
|
"eval_loss": 0.12852250039577484, |
|
"eval_overall_accuracy": 0.9620998719590269, |
|
"eval_overall_f1": 0.8326300984528833, |
|
"eval_overall_precision": 0.7935656836461126, |
|
"eval_overall_recall": 0.8757396449704142, |
|
"eval_runtime": 0.2915, |
|
"eval_samples_per_second": 641.413, |
|
"eval_steps_per_second": 10.29, |
|
"step": 10282 |
|
}, |
|
{ |
|
"epoch": 98.0, |
|
"grad_norm": 0.9472575187683105, |
|
"learning_rate": 1.0000000000000002e-06, |
|
"loss": 0.078, |
|
"step": 10388 |
|
}, |
|
{ |
|
"epoch": 98.0, |
|
"eval_LOCATION_f1": 0.8571428571428572, |
|
"eval_LOCATION_number": 69, |
|
"eval_LOCATION_precision": 0.8076923076923077, |
|
"eval_LOCATION_recall": 0.9130434782608695, |
|
"eval_ORGANIZATION_f1": 0.7642276422764227, |
|
"eval_ORGANIZATION_number": 58, |
|
"eval_ORGANIZATION_precision": 0.7230769230769231, |
|
"eval_ORGANIZATION_recall": 0.8103448275862069, |
|
"eval_PERSON_f1": 0.8698412698412699, |
|
"eval_PERSON_number": 152, |
|
"eval_PERSON_precision": 0.8404907975460123, |
|
"eval_PERSON_recall": 0.9013157894736842, |
|
"eval_QUANTITY_f1": 0.7692307692307692, |
|
"eval_QUANTITY_number": 30, |
|
"eval_QUANTITY_precision": 0.7142857142857143, |
|
"eval_QUANTITY_recall": 0.8333333333333334, |
|
"eval_TIME_f1": 0.7999999999999999, |
|
"eval_TIME_number": 29, |
|
"eval_TIME_precision": 0.7741935483870968, |
|
"eval_TIME_recall": 0.8275862068965517, |
|
"eval_loss": 0.12840475142002106, |
|
"eval_overall_accuracy": 0.9618437900128041, |
|
"eval_overall_f1": 0.8338028169014083, |
|
"eval_overall_precision": 0.7956989247311828, |
|
"eval_overall_recall": 0.8757396449704142, |
|
"eval_runtime": 0.2914, |
|
"eval_samples_per_second": 641.68, |
|
"eval_steps_per_second": 10.294, |
|
"step": 10388 |
|
}, |
|
{ |
|
"epoch": 99.0, |
|
"grad_norm": 0.753296971321106, |
|
"learning_rate": 5.000000000000001e-07, |
|
"loss": 0.0783, |
|
"step": 10494 |
|
}, |
|
{ |
|
"epoch": 99.0, |
|
"eval_LOCATION_f1": 0.8571428571428572, |
|
"eval_LOCATION_number": 69, |
|
"eval_LOCATION_precision": 0.8076923076923077, |
|
"eval_LOCATION_recall": 0.9130434782608695, |
|
"eval_ORGANIZATION_f1": 0.7642276422764227, |
|
"eval_ORGANIZATION_number": 58, |
|
"eval_ORGANIZATION_precision": 0.7230769230769231, |
|
"eval_ORGANIZATION_recall": 0.8103448275862069, |
|
"eval_PERSON_f1": 0.8734177215189874, |
|
"eval_PERSON_number": 152, |
|
"eval_PERSON_precision": 0.8414634146341463, |
|
"eval_PERSON_recall": 0.9078947368421053, |
|
"eval_QUANTITY_f1": 0.7692307692307692, |
|
"eval_QUANTITY_number": 30, |
|
"eval_QUANTITY_precision": 0.7142857142857143, |
|
"eval_QUANTITY_recall": 0.8333333333333334, |
|
"eval_TIME_f1": 0.7999999999999999, |
|
"eval_TIME_number": 29, |
|
"eval_TIME_precision": 0.7741935483870968, |
|
"eval_TIME_recall": 0.8275862068965517, |
|
"eval_loss": 0.12838655710220337, |
|
"eval_overall_accuracy": 0.9623559539052496, |
|
"eval_overall_f1": 0.8354430379746836, |
|
"eval_overall_precision": 0.7962466487935657, |
|
"eval_overall_recall": 0.878698224852071, |
|
"eval_runtime": 0.2918, |
|
"eval_samples_per_second": 640.87, |
|
"eval_steps_per_second": 10.281, |
|
"step": 10494 |
|
}, |
|
{ |
|
"epoch": 100.0, |
|
"grad_norm": 0.6992992758750916, |
|
"learning_rate": 0.0, |
|
"loss": 0.0773, |
|
"step": 10600 |
|
}, |
|
{ |
|
"epoch": 100.0, |
|
"eval_LOCATION_f1": 0.8571428571428572, |
|
"eval_LOCATION_number": 69, |
|
"eval_LOCATION_precision": 0.8076923076923077, |
|
"eval_LOCATION_recall": 0.9130434782608695, |
|
"eval_ORGANIZATION_f1": 0.7642276422764227, |
|
"eval_ORGANIZATION_number": 58, |
|
"eval_ORGANIZATION_precision": 0.7230769230769231, |
|
"eval_ORGANIZATION_recall": 0.8103448275862069, |
|
"eval_PERSON_f1": 0.8734177215189874, |
|
"eval_PERSON_number": 152, |
|
"eval_PERSON_precision": 0.8414634146341463, |
|
"eval_PERSON_recall": 0.9078947368421053, |
|
"eval_QUANTITY_f1": 0.7692307692307692, |
|
"eval_QUANTITY_number": 30, |
|
"eval_QUANTITY_precision": 0.7142857142857143, |
|
"eval_QUANTITY_recall": 0.8333333333333334, |
|
"eval_TIME_f1": 0.7999999999999999, |
|
"eval_TIME_number": 29, |
|
"eval_TIME_precision": 0.7741935483870968, |
|
"eval_TIME_recall": 0.8275862068965517, |
|
"eval_loss": 0.12858808040618896, |
|
"eval_overall_accuracy": 0.9623559539052496, |
|
"eval_overall_f1": 0.8354430379746836, |
|
"eval_overall_precision": 0.7962466487935657, |
|
"eval_overall_recall": 0.878698224852071, |
|
"eval_runtime": 0.2908, |
|
"eval_samples_per_second": 642.981, |
|
"eval_steps_per_second": 10.315, |
|
"step": 10600 |
|
}, |
|
{ |
|
"epoch": 100.0, |
|
"step": 10600, |
|
"total_flos": 4500604309905474.0, |
|
"train_loss": 0.13730014378169797, |
|
"train_runtime": 547.2904, |
|
"train_samples_per_second": 308.246, |
|
"train_steps_per_second": 19.368 |
|
} |
|
], |
|
"logging_steps": 500, |
|
"max_steps": 10600, |
|
"num_input_tokens_seen": 0, |
|
"num_train_epochs": 100, |
|
"save_steps": 500, |
|
"total_flos": 4500604309905474.0, |
|
"train_batch_size": 16, |
|
"trial_name": null, |
|
"trial_params": null |
|
} |
|
|