nerugm-pt-pl20-2 / trainer_state.json
apwic's picture
End of training
5432087 verified
raw
history blame
145 kB
{
"best_metric": null,
"best_model_checkpoint": null,
"epoch": 100.0,
"eval_steps": 500,
"global_step": 10600,
"is_hyper_param_search": false,
"is_local_process_zero": true,
"is_world_process_zero": true,
"log_history": [
{
"epoch": 1.0,
"grad_norm": 1.7605067491531372,
"learning_rate": 4.9500000000000004e-05,
"loss": 0.9861,
"step": 106
},
{
"epoch": 1.0,
"eval_LOCATION_f1": 0.0,
"eval_LOCATION_number": 72,
"eval_LOCATION_precision": 0.0,
"eval_LOCATION_recall": 0.0,
"eval_ORGANIZATION_f1": 0.0,
"eval_ORGANIZATION_number": 75,
"eval_ORGANIZATION_precision": 0.0,
"eval_ORGANIZATION_recall": 0.0,
"eval_PERSON_f1": 0.012820512820512822,
"eval_PERSON_number": 143,
"eval_PERSON_precision": 0.07692307692307693,
"eval_PERSON_recall": 0.006993006993006993,
"eval_QUANTITY_f1": 0.0,
"eval_QUANTITY_number": 23,
"eval_QUANTITY_precision": 0.0,
"eval_QUANTITY_recall": 0.0,
"eval_TIME_f1": 0.0,
"eval_TIME_number": 26,
"eval_TIME_precision": 0.0,
"eval_TIME_recall": 0.0,
"eval_loss": 0.5554673075675964,
"eval_overall_accuracy": 0.8468851638729047,
"eval_overall_f1": 0.0055248618784530384,
"eval_overall_precision": 0.043478260869565216,
"eval_overall_recall": 0.0029498525073746312,
"eval_runtime": 0.9128,
"eval_samples_per_second": 204.873,
"eval_steps_per_second": 3.287,
"step": 106
},
{
"epoch": 2.0,
"grad_norm": 1.7613551616668701,
"learning_rate": 4.9e-05,
"loss": 0.5078,
"step": 212
},
{
"epoch": 2.0,
"eval_LOCATION_f1": 0.2150537634408602,
"eval_LOCATION_number": 72,
"eval_LOCATION_precision": 0.47619047619047616,
"eval_LOCATION_recall": 0.1388888888888889,
"eval_ORGANIZATION_f1": 0.019417475728155338,
"eval_ORGANIZATION_number": 75,
"eval_ORGANIZATION_precision": 0.03571428571428571,
"eval_ORGANIZATION_recall": 0.013333333333333334,
"eval_PERSON_f1": 0.6392961876832844,
"eval_PERSON_number": 143,
"eval_PERSON_precision": 0.5505050505050505,
"eval_PERSON_recall": 0.7622377622377622,
"eval_QUANTITY_f1": 0.0,
"eval_QUANTITY_number": 23,
"eval_QUANTITY_precision": 0.0,
"eval_QUANTITY_recall": 0.0,
"eval_TIME_f1": 0.6206896551724138,
"eval_TIME_number": 26,
"eval_TIME_precision": 0.5625,
"eval_TIME_recall": 0.6923076923076923,
"eval_loss": 0.3412609398365021,
"eval_overall_accuracy": 0.8961721290968226,
"eval_overall_f1": 0.43740095087163233,
"eval_overall_precision": 0.4726027397260274,
"eval_overall_recall": 0.40707964601769914,
"eval_runtime": 0.9577,
"eval_samples_per_second": 195.257,
"eval_steps_per_second": 3.132,
"step": 212
},
{
"epoch": 3.0,
"grad_norm": 1.2087492942810059,
"learning_rate": 4.85e-05,
"loss": 0.3115,
"step": 318
},
{
"epoch": 3.0,
"eval_LOCATION_f1": 0.5696969696969698,
"eval_LOCATION_number": 72,
"eval_LOCATION_precision": 0.5053763440860215,
"eval_LOCATION_recall": 0.6527777777777778,
"eval_ORGANIZATION_f1": 0.5125628140703519,
"eval_ORGANIZATION_number": 75,
"eval_ORGANIZATION_precision": 0.4112903225806452,
"eval_ORGANIZATION_recall": 0.68,
"eval_PERSON_f1": 0.8231511254019294,
"eval_PERSON_number": 143,
"eval_PERSON_precision": 0.7619047619047619,
"eval_PERSON_recall": 0.8951048951048951,
"eval_QUANTITY_f1": 0.4590163934426229,
"eval_QUANTITY_number": 23,
"eval_QUANTITY_precision": 0.3684210526315789,
"eval_QUANTITY_recall": 0.6086956521739131,
"eval_TIME_f1": 0.7777777777777779,
"eval_TIME_number": 26,
"eval_TIME_precision": 0.75,
"eval_TIME_recall": 0.8076923076923077,
"eval_loss": 0.22766432166099548,
"eval_overall_accuracy": 0.9256942707030272,
"eval_overall_f1": 0.6607594936708862,
"eval_overall_precision": 0.5787139689578714,
"eval_overall_recall": 0.7699115044247787,
"eval_runtime": 0.9809,
"eval_samples_per_second": 190.638,
"eval_steps_per_second": 3.058,
"step": 318
},
{
"epoch": 4.0,
"grad_norm": 0.9383460283279419,
"learning_rate": 4.8e-05,
"loss": 0.2203,
"step": 424
},
{
"epoch": 4.0,
"eval_LOCATION_f1": 0.6993865030674847,
"eval_LOCATION_number": 72,
"eval_LOCATION_precision": 0.6263736263736264,
"eval_LOCATION_recall": 0.7916666666666666,
"eval_ORGANIZATION_f1": 0.6162790697674418,
"eval_ORGANIZATION_number": 75,
"eval_ORGANIZATION_precision": 0.5463917525773195,
"eval_ORGANIZATION_recall": 0.7066666666666667,
"eval_PERSON_f1": 0.8498402555910544,
"eval_PERSON_number": 143,
"eval_PERSON_precision": 0.7823529411764706,
"eval_PERSON_recall": 0.9300699300699301,
"eval_QUANTITY_f1": 0.410958904109589,
"eval_QUANTITY_number": 23,
"eval_QUANTITY_precision": 0.3,
"eval_QUANTITY_recall": 0.6521739130434783,
"eval_TIME_f1": 0.7419354838709676,
"eval_TIME_number": 26,
"eval_TIME_precision": 0.6388888888888888,
"eval_TIME_recall": 0.8846153846153846,
"eval_loss": 0.21552342176437378,
"eval_overall_accuracy": 0.9316987740805605,
"eval_overall_f1": 0.7177522349936143,
"eval_overall_precision": 0.6328828828828829,
"eval_overall_recall": 0.8289085545722714,
"eval_runtime": 0.9352,
"eval_samples_per_second": 199.955,
"eval_steps_per_second": 3.208,
"step": 424
},
{
"epoch": 5.0,
"grad_norm": 2.1988296508789062,
"learning_rate": 4.75e-05,
"loss": 0.1816,
"step": 530
},
{
"epoch": 5.0,
"eval_LOCATION_f1": 0.7516778523489932,
"eval_LOCATION_number": 72,
"eval_LOCATION_precision": 0.7272727272727273,
"eval_LOCATION_recall": 0.7777777777777778,
"eval_ORGANIZATION_f1": 0.6553672316384181,
"eval_ORGANIZATION_number": 75,
"eval_ORGANIZATION_precision": 0.5686274509803921,
"eval_ORGANIZATION_recall": 0.7733333333333333,
"eval_PERSON_f1": 0.8794788273615636,
"eval_PERSON_number": 143,
"eval_PERSON_precision": 0.823170731707317,
"eval_PERSON_recall": 0.9440559440559441,
"eval_QUANTITY_f1": 0.7142857142857143,
"eval_QUANTITY_number": 23,
"eval_QUANTITY_precision": 0.6060606060606061,
"eval_QUANTITY_recall": 0.8695652173913043,
"eval_TIME_f1": 0.9230769230769231,
"eval_TIME_number": 26,
"eval_TIME_precision": 0.9230769230769231,
"eval_TIME_recall": 0.9230769230769231,
"eval_loss": 0.15413647890090942,
"eval_overall_accuracy": 0.9489617212909682,
"eval_overall_f1": 0.7908232118758435,
"eval_overall_precision": 0.7288557213930348,
"eval_overall_recall": 0.8643067846607669,
"eval_runtime": 0.9063,
"eval_samples_per_second": 206.339,
"eval_steps_per_second": 3.31,
"step": 530
},
{
"epoch": 6.0,
"grad_norm": 0.9543836116790771,
"learning_rate": 4.7e-05,
"loss": 0.1655,
"step": 636
},
{
"epoch": 6.0,
"eval_LOCATION_f1": 0.7317073170731708,
"eval_LOCATION_number": 72,
"eval_LOCATION_precision": 0.6521739130434783,
"eval_LOCATION_recall": 0.8333333333333334,
"eval_ORGANIZATION_f1": 0.7078651685393258,
"eval_ORGANIZATION_number": 75,
"eval_ORGANIZATION_precision": 0.6116504854368932,
"eval_ORGANIZATION_recall": 0.84,
"eval_PERSON_f1": 0.8918032786885245,
"eval_PERSON_number": 143,
"eval_PERSON_precision": 0.8395061728395061,
"eval_PERSON_recall": 0.951048951048951,
"eval_QUANTITY_f1": 0.6909090909090908,
"eval_QUANTITY_number": 23,
"eval_QUANTITY_precision": 0.59375,
"eval_QUANTITY_recall": 0.8260869565217391,
"eval_TIME_f1": 0.7241379310344829,
"eval_TIME_number": 26,
"eval_TIME_precision": 0.65625,
"eval_TIME_recall": 0.8076923076923077,
"eval_loss": 0.15523788332939148,
"eval_overall_accuracy": 0.9504628471353516,
"eval_overall_f1": 0.7868421052631579,
"eval_overall_precision": 0.7102137767220903,
"eval_overall_recall": 0.8820058997050148,
"eval_runtime": 0.9116,
"eval_samples_per_second": 205.138,
"eval_steps_per_second": 3.291,
"step": 636
},
{
"epoch": 7.0,
"grad_norm": 0.4434598982334137,
"learning_rate": 4.6500000000000005e-05,
"loss": 0.1513,
"step": 742
},
{
"epoch": 7.0,
"eval_LOCATION_f1": 0.7631578947368423,
"eval_LOCATION_number": 72,
"eval_LOCATION_precision": 0.725,
"eval_LOCATION_recall": 0.8055555555555556,
"eval_ORGANIZATION_f1": 0.7111111111111111,
"eval_ORGANIZATION_number": 75,
"eval_ORGANIZATION_precision": 0.6095238095238096,
"eval_ORGANIZATION_recall": 0.8533333333333334,
"eval_PERSON_f1": 0.8758169934640523,
"eval_PERSON_number": 143,
"eval_PERSON_precision": 0.8220858895705522,
"eval_PERSON_recall": 0.9370629370629371,
"eval_QUANTITY_f1": 0.7017543859649124,
"eval_QUANTITY_number": 23,
"eval_QUANTITY_precision": 0.5882352941176471,
"eval_QUANTITY_recall": 0.8695652173913043,
"eval_TIME_f1": 0.7142857142857142,
"eval_TIME_number": 26,
"eval_TIME_precision": 0.6666666666666666,
"eval_TIME_recall": 0.7692307692307693,
"eval_loss": 0.14643213152885437,
"eval_overall_accuracy": 0.952964723542657,
"eval_overall_f1": 0.7882822902796273,
"eval_overall_precision": 0.7184466019417476,
"eval_overall_recall": 0.8731563421828908,
"eval_runtime": 0.9227,
"eval_samples_per_second": 202.669,
"eval_steps_per_second": 3.251,
"step": 742
},
{
"epoch": 8.0,
"grad_norm": 0.7223401069641113,
"learning_rate": 4.600000000000001e-05,
"loss": 0.1403,
"step": 848
},
{
"epoch": 8.0,
"eval_LOCATION_f1": 0.7549668874172185,
"eval_LOCATION_number": 72,
"eval_LOCATION_precision": 0.7215189873417721,
"eval_LOCATION_recall": 0.7916666666666666,
"eval_ORGANIZATION_f1": 0.7093023255813953,
"eval_ORGANIZATION_number": 75,
"eval_ORGANIZATION_precision": 0.6288659793814433,
"eval_ORGANIZATION_recall": 0.8133333333333334,
"eval_PERSON_f1": 0.8829431438127091,
"eval_PERSON_number": 143,
"eval_PERSON_precision": 0.8461538461538461,
"eval_PERSON_recall": 0.9230769230769231,
"eval_QUANTITY_f1": 0.7272727272727273,
"eval_QUANTITY_number": 23,
"eval_QUANTITY_precision": 0.625,
"eval_QUANTITY_recall": 0.8695652173913043,
"eval_TIME_f1": 0.6779661016949152,
"eval_TIME_number": 26,
"eval_TIME_precision": 0.6060606060606061,
"eval_TIME_recall": 0.7692307692307693,
"eval_loss": 0.14050298929214478,
"eval_overall_accuracy": 0.9542156617463098,
"eval_overall_f1": 0.7880434782608694,
"eval_overall_precision": 0.7304785894206549,
"eval_overall_recall": 0.855457227138643,
"eval_runtime": 0.9407,
"eval_samples_per_second": 198.786,
"eval_steps_per_second": 3.189,
"step": 848
},
{
"epoch": 9.0,
"grad_norm": 1.0728905200958252,
"learning_rate": 4.55e-05,
"loss": 0.138,
"step": 954
},
{
"epoch": 9.0,
"eval_LOCATION_f1": 0.8079470198675496,
"eval_LOCATION_number": 72,
"eval_LOCATION_precision": 0.7721518987341772,
"eval_LOCATION_recall": 0.8472222222222222,
"eval_ORGANIZATION_f1": 0.711864406779661,
"eval_ORGANIZATION_number": 75,
"eval_ORGANIZATION_precision": 0.6176470588235294,
"eval_ORGANIZATION_recall": 0.84,
"eval_PERSON_f1": 0.9066666666666667,
"eval_PERSON_number": 143,
"eval_PERSON_precision": 0.8662420382165605,
"eval_PERSON_recall": 0.951048951048951,
"eval_QUANTITY_f1": 0.7169811320754716,
"eval_QUANTITY_number": 23,
"eval_QUANTITY_precision": 0.6333333333333333,
"eval_QUANTITY_recall": 0.8260869565217391,
"eval_TIME_f1": 0.75,
"eval_TIME_number": 26,
"eval_TIME_precision": 0.7,
"eval_TIME_recall": 0.8076923076923077,
"eval_loss": 0.14766837656497955,
"eval_overall_accuracy": 0.9527145359019265,
"eval_overall_f1": 0.814111261872456,
"eval_overall_precision": 0.7537688442211056,
"eval_overall_recall": 0.8849557522123894,
"eval_runtime": 0.9393,
"eval_samples_per_second": 199.079,
"eval_steps_per_second": 3.194,
"step": 954
},
{
"epoch": 10.0,
"grad_norm": 2.3210840225219727,
"learning_rate": 4.5e-05,
"loss": 0.1301,
"step": 1060
},
{
"epoch": 10.0,
"eval_LOCATION_f1": 0.8,
"eval_LOCATION_number": 72,
"eval_LOCATION_precision": 0.7692307692307693,
"eval_LOCATION_recall": 0.8333333333333334,
"eval_ORGANIZATION_f1": 0.7349397590361445,
"eval_ORGANIZATION_number": 75,
"eval_ORGANIZATION_precision": 0.6703296703296703,
"eval_ORGANIZATION_recall": 0.8133333333333334,
"eval_PERSON_f1": 0.8940397350993377,
"eval_PERSON_number": 143,
"eval_PERSON_precision": 0.8490566037735849,
"eval_PERSON_recall": 0.9440559440559441,
"eval_QUANTITY_f1": 0.6666666666666667,
"eval_QUANTITY_number": 23,
"eval_QUANTITY_precision": 0.5588235294117647,
"eval_QUANTITY_recall": 0.8260869565217391,
"eval_TIME_f1": 0.75,
"eval_TIME_number": 26,
"eval_TIME_precision": 0.7,
"eval_TIME_recall": 0.8076923076923077,
"eval_loss": 0.13562895357608795,
"eval_overall_accuracy": 0.9564673505128847,
"eval_overall_f1": 0.8098495212038302,
"eval_overall_precision": 0.7551020408163265,
"eval_overall_recall": 0.8731563421828908,
"eval_runtime": 0.9309,
"eval_samples_per_second": 200.881,
"eval_steps_per_second": 3.223,
"step": 1060
},
{
"epoch": 11.0,
"grad_norm": 0.8354237675666809,
"learning_rate": 4.4500000000000004e-05,
"loss": 0.12,
"step": 1166
},
{
"epoch": 11.0,
"eval_LOCATION_f1": 0.7733333333333334,
"eval_LOCATION_number": 72,
"eval_LOCATION_precision": 0.7435897435897436,
"eval_LOCATION_recall": 0.8055555555555556,
"eval_ORGANIZATION_f1": 0.7682926829268292,
"eval_ORGANIZATION_number": 75,
"eval_ORGANIZATION_precision": 0.7078651685393258,
"eval_ORGANIZATION_recall": 0.84,
"eval_PERSON_f1": 0.8926174496644295,
"eval_PERSON_number": 143,
"eval_PERSON_precision": 0.8580645161290322,
"eval_PERSON_recall": 0.9300699300699301,
"eval_QUANTITY_f1": 0.7037037037037037,
"eval_QUANTITY_number": 23,
"eval_QUANTITY_precision": 0.6129032258064516,
"eval_QUANTITY_recall": 0.8260869565217391,
"eval_TIME_f1": 0.7636363636363636,
"eval_TIME_number": 26,
"eval_TIME_precision": 0.7241379310344828,
"eval_TIME_recall": 0.8076923076923077,
"eval_loss": 0.12984243035316467,
"eval_overall_accuracy": 0.9587190392794596,
"eval_overall_f1": 0.8155339805825244,
"eval_overall_precision": 0.7696335078534031,
"eval_overall_recall": 0.8672566371681416,
"eval_runtime": 0.9242,
"eval_samples_per_second": 202.333,
"eval_steps_per_second": 3.246,
"step": 1166
},
{
"epoch": 12.0,
"grad_norm": 2.3830783367156982,
"learning_rate": 4.4000000000000006e-05,
"loss": 0.1171,
"step": 1272
},
{
"epoch": 12.0,
"eval_LOCATION_f1": 0.7945205479452055,
"eval_LOCATION_number": 72,
"eval_LOCATION_precision": 0.7837837837837838,
"eval_LOCATION_recall": 0.8055555555555556,
"eval_ORGANIZATION_f1": 0.7195121951219511,
"eval_ORGANIZATION_number": 75,
"eval_ORGANIZATION_precision": 0.6629213483146067,
"eval_ORGANIZATION_recall": 0.7866666666666666,
"eval_PERSON_f1": 0.8844884488448846,
"eval_PERSON_number": 143,
"eval_PERSON_precision": 0.8375,
"eval_PERSON_recall": 0.9370629370629371,
"eval_QUANTITY_f1": 0.6428571428571429,
"eval_QUANTITY_number": 23,
"eval_QUANTITY_precision": 0.5454545454545454,
"eval_QUANTITY_recall": 0.782608695652174,
"eval_TIME_f1": 0.8461538461538461,
"eval_TIME_number": 26,
"eval_TIME_precision": 0.8461538461538461,
"eval_TIME_recall": 0.8461538461538461,
"eval_loss": 0.13061821460723877,
"eval_overall_accuracy": 0.9574681010758068,
"eval_overall_f1": 0.8072122052704578,
"eval_overall_precision": 0.7617801047120419,
"eval_overall_recall": 0.8584070796460177,
"eval_runtime": 0.9196,
"eval_samples_per_second": 203.355,
"eval_steps_per_second": 3.262,
"step": 1272
},
{
"epoch": 13.0,
"grad_norm": 0.5705311894416809,
"learning_rate": 4.35e-05,
"loss": 0.1129,
"step": 1378
},
{
"epoch": 13.0,
"eval_LOCATION_f1": 0.781456953642384,
"eval_LOCATION_number": 72,
"eval_LOCATION_precision": 0.7468354430379747,
"eval_LOCATION_recall": 0.8194444444444444,
"eval_ORGANIZATION_f1": 0.7597765363128492,
"eval_ORGANIZATION_number": 75,
"eval_ORGANIZATION_precision": 0.6538461538461539,
"eval_ORGANIZATION_recall": 0.9066666666666666,
"eval_PERSON_f1": 0.8940397350993377,
"eval_PERSON_number": 143,
"eval_PERSON_precision": 0.8490566037735849,
"eval_PERSON_recall": 0.9440559440559441,
"eval_QUANTITY_f1": 0.7142857142857143,
"eval_QUANTITY_number": 23,
"eval_QUANTITY_precision": 0.6060606060606061,
"eval_QUANTITY_recall": 0.8695652173913043,
"eval_TIME_f1": 0.7857142857142856,
"eval_TIME_number": 26,
"eval_TIME_precision": 0.7333333333333333,
"eval_TIME_recall": 0.8461538461538461,
"eval_loss": 0.13694216310977936,
"eval_overall_accuracy": 0.9564673505128847,
"eval_overall_f1": 0.8172043010752689,
"eval_overall_precision": 0.7506172839506173,
"eval_overall_recall": 0.8967551622418879,
"eval_runtime": 0.9213,
"eval_samples_per_second": 202.983,
"eval_steps_per_second": 3.256,
"step": 1378
},
{
"epoch": 14.0,
"grad_norm": 1.2299761772155762,
"learning_rate": 4.3e-05,
"loss": 0.1076,
"step": 1484
},
{
"epoch": 14.0,
"eval_LOCATION_f1": 0.7919463087248323,
"eval_LOCATION_number": 72,
"eval_LOCATION_precision": 0.7662337662337663,
"eval_LOCATION_recall": 0.8194444444444444,
"eval_ORGANIZATION_f1": 0.7613636363636365,
"eval_ORGANIZATION_number": 75,
"eval_ORGANIZATION_precision": 0.6633663366336634,
"eval_ORGANIZATION_recall": 0.8933333333333333,
"eval_PERSON_f1": 0.8910891089108911,
"eval_PERSON_number": 143,
"eval_PERSON_precision": 0.84375,
"eval_PERSON_recall": 0.9440559440559441,
"eval_QUANTITY_f1": 0.6206896551724138,
"eval_QUANTITY_number": 23,
"eval_QUANTITY_precision": 0.5142857142857142,
"eval_QUANTITY_recall": 0.782608695652174,
"eval_TIME_f1": 0.7241379310344829,
"eval_TIME_number": 26,
"eval_TIME_precision": 0.65625,
"eval_TIME_recall": 0.8076923076923077,
"eval_loss": 0.1426171064376831,
"eval_overall_accuracy": 0.9524643482611959,
"eval_overall_f1": 0.8064516129032259,
"eval_overall_precision": 0.7407407407407407,
"eval_overall_recall": 0.8849557522123894,
"eval_runtime": 0.9372,
"eval_samples_per_second": 199.528,
"eval_steps_per_second": 3.201,
"step": 1484
},
{
"epoch": 15.0,
"grad_norm": 0.628875732421875,
"learning_rate": 4.25e-05,
"loss": 0.1056,
"step": 1590
},
{
"epoch": 15.0,
"eval_LOCATION_f1": 0.8082191780821918,
"eval_LOCATION_number": 72,
"eval_LOCATION_precision": 0.7972972972972973,
"eval_LOCATION_recall": 0.8194444444444444,
"eval_ORGANIZATION_f1": 0.7674418604651163,
"eval_ORGANIZATION_number": 75,
"eval_ORGANIZATION_precision": 0.6804123711340206,
"eval_ORGANIZATION_recall": 0.88,
"eval_PERSON_f1": 0.8859060402684563,
"eval_PERSON_number": 143,
"eval_PERSON_precision": 0.8516129032258064,
"eval_PERSON_recall": 0.9230769230769231,
"eval_QUANTITY_f1": 0.6181818181818182,
"eval_QUANTITY_number": 23,
"eval_QUANTITY_precision": 0.53125,
"eval_QUANTITY_recall": 0.7391304347826086,
"eval_TIME_f1": 0.8214285714285715,
"eval_TIME_number": 26,
"eval_TIME_precision": 0.7666666666666667,
"eval_TIME_recall": 0.8846153846153846,
"eval_loss": 0.1336900293827057,
"eval_overall_accuracy": 0.9569677257943457,
"eval_overall_f1": 0.8170563961485556,
"eval_overall_precision": 0.7654639175257731,
"eval_overall_recall": 0.8761061946902655,
"eval_runtime": 0.9357,
"eval_samples_per_second": 199.851,
"eval_steps_per_second": 3.206,
"step": 1590
},
{
"epoch": 16.0,
"grad_norm": 0.9760724902153015,
"learning_rate": 4.2e-05,
"loss": 0.1003,
"step": 1696
},
{
"epoch": 16.0,
"eval_LOCATION_f1": 0.8133333333333332,
"eval_LOCATION_number": 72,
"eval_LOCATION_precision": 0.782051282051282,
"eval_LOCATION_recall": 0.8472222222222222,
"eval_ORGANIZATION_f1": 0.7657142857142857,
"eval_ORGANIZATION_number": 75,
"eval_ORGANIZATION_precision": 0.67,
"eval_ORGANIZATION_recall": 0.8933333333333333,
"eval_PERSON_f1": 0.8963210702341137,
"eval_PERSON_number": 143,
"eval_PERSON_precision": 0.8589743589743589,
"eval_PERSON_recall": 0.9370629370629371,
"eval_QUANTITY_f1": 0.6785714285714286,
"eval_QUANTITY_number": 23,
"eval_QUANTITY_precision": 0.5757575757575758,
"eval_QUANTITY_recall": 0.8260869565217391,
"eval_TIME_f1": 0.75,
"eval_TIME_number": 26,
"eval_TIME_precision": 0.7,
"eval_TIME_recall": 0.8076923076923077,
"eval_loss": 0.145399808883667,
"eval_overall_accuracy": 0.9574681010758068,
"eval_overall_f1": 0.8206521739130435,
"eval_overall_precision": 0.760705289672544,
"eval_overall_recall": 0.8908554572271387,
"eval_runtime": 0.9425,
"eval_samples_per_second": 198.413,
"eval_steps_per_second": 3.183,
"step": 1696
},
{
"epoch": 17.0,
"grad_norm": 0.18460078537464142,
"learning_rate": 4.15e-05,
"loss": 0.0997,
"step": 1802
},
{
"epoch": 17.0,
"eval_LOCATION_f1": 0.8,
"eval_LOCATION_number": 72,
"eval_LOCATION_precision": 0.7692307692307693,
"eval_LOCATION_recall": 0.8333333333333334,
"eval_ORGANIZATION_f1": 0.7602339181286549,
"eval_ORGANIZATION_number": 75,
"eval_ORGANIZATION_precision": 0.6770833333333334,
"eval_ORGANIZATION_recall": 0.8666666666666667,
"eval_PERSON_f1": 0.8851351351351351,
"eval_PERSON_number": 143,
"eval_PERSON_precision": 0.8562091503267973,
"eval_PERSON_recall": 0.916083916083916,
"eval_QUANTITY_f1": 0.6428571428571429,
"eval_QUANTITY_number": 23,
"eval_QUANTITY_precision": 0.5454545454545454,
"eval_QUANTITY_recall": 0.782608695652174,
"eval_TIME_f1": 0.7272727272727274,
"eval_TIME_number": 26,
"eval_TIME_precision": 0.6896551724137931,
"eval_TIME_recall": 0.7692307692307693,
"eval_loss": 0.1395619809627533,
"eval_overall_accuracy": 0.955716787590693,
"eval_overall_f1": 0.8076923076923076,
"eval_overall_precision": 0.7557840616966581,
"eval_overall_recall": 0.8672566371681416,
"eval_runtime": 0.923,
"eval_samples_per_second": 202.596,
"eval_steps_per_second": 3.25,
"step": 1802
},
{
"epoch": 18.0,
"grad_norm": 0.43792226910591125,
"learning_rate": 4.1e-05,
"loss": 0.0956,
"step": 1908
},
{
"epoch": 18.0,
"eval_LOCATION_f1": 0.8169014084507044,
"eval_LOCATION_number": 72,
"eval_LOCATION_precision": 0.8285714285714286,
"eval_LOCATION_recall": 0.8055555555555556,
"eval_ORGANIZATION_f1": 0.726190476190476,
"eval_ORGANIZATION_number": 75,
"eval_ORGANIZATION_precision": 0.6559139784946236,
"eval_ORGANIZATION_recall": 0.8133333333333334,
"eval_PERSON_f1": 0.8926174496644295,
"eval_PERSON_number": 143,
"eval_PERSON_precision": 0.8580645161290322,
"eval_PERSON_recall": 0.9300699300699301,
"eval_QUANTITY_f1": 0.6909090909090908,
"eval_QUANTITY_number": 23,
"eval_QUANTITY_precision": 0.59375,
"eval_QUANTITY_recall": 0.8260869565217391,
"eval_TIME_f1": 0.7636363636363636,
"eval_TIME_number": 26,
"eval_TIME_precision": 0.7241379310344828,
"eval_TIME_recall": 0.8076923076923077,
"eval_loss": 0.13341191411018372,
"eval_overall_accuracy": 0.9587190392794596,
"eval_overall_f1": 0.8133704735376045,
"eval_overall_precision": 0.7704485488126649,
"eval_overall_recall": 0.8613569321533924,
"eval_runtime": 0.9563,
"eval_samples_per_second": 195.551,
"eval_steps_per_second": 3.137,
"step": 1908
},
{
"epoch": 19.0,
"grad_norm": 0.8807380795478821,
"learning_rate": 4.05e-05,
"loss": 0.0906,
"step": 2014
},
{
"epoch": 19.0,
"eval_LOCATION_f1": 0.8,
"eval_LOCATION_number": 72,
"eval_LOCATION_precision": 0.7945205479452054,
"eval_LOCATION_recall": 0.8055555555555556,
"eval_ORGANIZATION_f1": 0.7542857142857142,
"eval_ORGANIZATION_number": 75,
"eval_ORGANIZATION_precision": 0.66,
"eval_ORGANIZATION_recall": 0.88,
"eval_PERSON_f1": 0.8926174496644295,
"eval_PERSON_number": 143,
"eval_PERSON_precision": 0.8580645161290322,
"eval_PERSON_recall": 0.9300699300699301,
"eval_QUANTITY_f1": 0.6428571428571429,
"eval_QUANTITY_number": 23,
"eval_QUANTITY_precision": 0.5454545454545454,
"eval_QUANTITY_recall": 0.782608695652174,
"eval_TIME_f1": 0.7636363636363636,
"eval_TIME_number": 26,
"eval_TIME_precision": 0.7241379310344828,
"eval_TIME_recall": 0.8076923076923077,
"eval_loss": 0.13378730416297913,
"eval_overall_accuracy": 0.9572179134350763,
"eval_overall_f1": 0.8120713305898491,
"eval_overall_precision": 0.7589743589743589,
"eval_overall_recall": 0.8731563421828908,
"eval_runtime": 0.9383,
"eval_samples_per_second": 199.303,
"eval_steps_per_second": 3.197,
"step": 2014
},
{
"epoch": 20.0,
"grad_norm": 0.726658046245575,
"learning_rate": 4e-05,
"loss": 0.0876,
"step": 2120
},
{
"epoch": 20.0,
"eval_LOCATION_f1": 0.8187919463087249,
"eval_LOCATION_number": 72,
"eval_LOCATION_precision": 0.7922077922077922,
"eval_LOCATION_recall": 0.8472222222222222,
"eval_ORGANIZATION_f1": 0.7727272727272727,
"eval_ORGANIZATION_number": 75,
"eval_ORGANIZATION_precision": 0.6732673267326733,
"eval_ORGANIZATION_recall": 0.9066666666666666,
"eval_PERSON_f1": 0.881578947368421,
"eval_PERSON_number": 143,
"eval_PERSON_precision": 0.8322981366459627,
"eval_PERSON_recall": 0.9370629370629371,
"eval_QUANTITY_f1": 0.6909090909090908,
"eval_QUANTITY_number": 23,
"eval_QUANTITY_precision": 0.59375,
"eval_QUANTITY_recall": 0.8260869565217391,
"eval_TIME_f1": 0.7636363636363636,
"eval_TIME_number": 26,
"eval_TIME_precision": 0.7241379310344828,
"eval_TIME_recall": 0.8076923076923077,
"eval_loss": 0.1531873345375061,
"eval_overall_accuracy": 0.9564673505128847,
"eval_overall_f1": 0.8200270635994586,
"eval_overall_precision": 0.7575,
"eval_overall_recall": 0.8938053097345132,
"eval_runtime": 0.9428,
"eval_samples_per_second": 198.355,
"eval_steps_per_second": 3.182,
"step": 2120
},
{
"epoch": 21.0,
"grad_norm": 1.286189317703247,
"learning_rate": 3.9500000000000005e-05,
"loss": 0.0841,
"step": 2226
},
{
"epoch": 21.0,
"eval_LOCATION_f1": 0.8079470198675496,
"eval_LOCATION_number": 72,
"eval_LOCATION_precision": 0.7721518987341772,
"eval_LOCATION_recall": 0.8472222222222222,
"eval_ORGANIZATION_f1": 0.7560975609756098,
"eval_ORGANIZATION_number": 75,
"eval_ORGANIZATION_precision": 0.6966292134831461,
"eval_ORGANIZATION_recall": 0.8266666666666667,
"eval_PERSON_f1": 0.8866666666666668,
"eval_PERSON_number": 143,
"eval_PERSON_precision": 0.8471337579617835,
"eval_PERSON_recall": 0.9300699300699301,
"eval_QUANTITY_f1": 0.6428571428571429,
"eval_QUANTITY_number": 23,
"eval_QUANTITY_precision": 0.5454545454545454,
"eval_QUANTITY_recall": 0.782608695652174,
"eval_TIME_f1": 0.7636363636363636,
"eval_TIME_number": 26,
"eval_TIME_precision": 0.7241379310344828,
"eval_TIME_recall": 0.8076923076923077,
"eval_loss": 0.1474735289812088,
"eval_overall_accuracy": 0.9567175381536153,
"eval_overall_f1": 0.8126721763085399,
"eval_overall_precision": 0.7622739018087855,
"eval_overall_recall": 0.8702064896755162,
"eval_runtime": 0.9368,
"eval_samples_per_second": 199.611,
"eval_steps_per_second": 3.202,
"step": 2226
},
{
"epoch": 22.0,
"grad_norm": 0.40452536940574646,
"learning_rate": 3.9000000000000006e-05,
"loss": 0.0842,
"step": 2332
},
{
"epoch": 22.0,
"eval_LOCATION_f1": 0.8133333333333332,
"eval_LOCATION_number": 72,
"eval_LOCATION_precision": 0.782051282051282,
"eval_LOCATION_recall": 0.8472222222222222,
"eval_ORGANIZATION_f1": 0.7861271676300577,
"eval_ORGANIZATION_number": 75,
"eval_ORGANIZATION_precision": 0.6938775510204082,
"eval_ORGANIZATION_recall": 0.9066666666666666,
"eval_PERSON_f1": 0.8970099667774087,
"eval_PERSON_number": 143,
"eval_PERSON_precision": 0.8544303797468354,
"eval_PERSON_recall": 0.9440559440559441,
"eval_QUANTITY_f1": 0.6428571428571429,
"eval_QUANTITY_number": 23,
"eval_QUANTITY_precision": 0.5454545454545454,
"eval_QUANTITY_recall": 0.782608695652174,
"eval_TIME_f1": 0.7407407407407408,
"eval_TIME_number": 26,
"eval_TIME_precision": 0.7142857142857143,
"eval_TIME_recall": 0.7692307692307693,
"eval_loss": 0.13896140456199646,
"eval_overall_accuracy": 0.9569677257943457,
"eval_overall_f1": 0.8228882833787466,
"eval_overall_precision": 0.7645569620253164,
"eval_overall_recall": 0.8908554572271387,
"eval_runtime": 0.9322,
"eval_samples_per_second": 200.611,
"eval_steps_per_second": 3.218,
"step": 2332
},
{
"epoch": 23.0,
"grad_norm": 0.6667360663414001,
"learning_rate": 3.85e-05,
"loss": 0.0798,
"step": 2438
},
{
"epoch": 23.0,
"eval_LOCATION_f1": 0.7945205479452055,
"eval_LOCATION_number": 72,
"eval_LOCATION_precision": 0.7837837837837838,
"eval_LOCATION_recall": 0.8055555555555556,
"eval_ORGANIZATION_f1": 0.7666666666666667,
"eval_ORGANIZATION_number": 75,
"eval_ORGANIZATION_precision": 0.6571428571428571,
"eval_ORGANIZATION_recall": 0.92,
"eval_PERSON_f1": 0.8933333333333333,
"eval_PERSON_number": 143,
"eval_PERSON_precision": 0.8535031847133758,
"eval_PERSON_recall": 0.9370629370629371,
"eval_QUANTITY_f1": 0.631578947368421,
"eval_QUANTITY_number": 23,
"eval_QUANTITY_precision": 0.5294117647058824,
"eval_QUANTITY_recall": 0.782608695652174,
"eval_TIME_f1": 0.7777777777777779,
"eval_TIME_number": 26,
"eval_TIME_precision": 0.75,
"eval_TIME_recall": 0.8076923076923077,
"eval_loss": 0.15068964660167694,
"eval_overall_accuracy": 0.9542156617463098,
"eval_overall_f1": 0.814111261872456,
"eval_overall_precision": 0.7537688442211056,
"eval_overall_recall": 0.8849557522123894,
"eval_runtime": 1.0035,
"eval_samples_per_second": 186.346,
"eval_steps_per_second": 2.99,
"step": 2438
},
{
"epoch": 24.0,
"grad_norm": 0.6917049884796143,
"learning_rate": 3.8e-05,
"loss": 0.0775,
"step": 2544
},
{
"epoch": 24.0,
"eval_LOCATION_f1": 0.8108108108108109,
"eval_LOCATION_number": 72,
"eval_LOCATION_precision": 0.7894736842105263,
"eval_LOCATION_recall": 0.8333333333333334,
"eval_ORGANIZATION_f1": 0.7721518987341773,
"eval_ORGANIZATION_number": 75,
"eval_ORGANIZATION_precision": 0.7349397590361446,
"eval_ORGANIZATION_recall": 0.8133333333333334,
"eval_PERSON_f1": 0.8970099667774087,
"eval_PERSON_number": 143,
"eval_PERSON_precision": 0.8544303797468354,
"eval_PERSON_recall": 0.9440559440559441,
"eval_QUANTITY_f1": 0.7692307692307693,
"eval_QUANTITY_number": 23,
"eval_QUANTITY_precision": 0.6896551724137931,
"eval_QUANTITY_recall": 0.8695652173913043,
"eval_TIME_f1": 0.7636363636363636,
"eval_TIME_number": 26,
"eval_TIME_precision": 0.7241379310344828,
"eval_TIME_recall": 0.8076923076923077,
"eval_loss": 0.14417295157909393,
"eval_overall_accuracy": 0.9604703527645734,
"eval_overall_f1": 0.8319327731092437,
"eval_overall_precision": 0.792,
"eval_overall_recall": 0.8761061946902655,
"eval_runtime": 0.9311,
"eval_samples_per_second": 200.829,
"eval_steps_per_second": 3.222,
"step": 2544
},
{
"epoch": 25.0,
"grad_norm": 0.38176143169403076,
"learning_rate": 3.7500000000000003e-05,
"loss": 0.0759,
"step": 2650
},
{
"epoch": 25.0,
"eval_LOCATION_f1": 0.8322147651006712,
"eval_LOCATION_number": 72,
"eval_LOCATION_precision": 0.8051948051948052,
"eval_LOCATION_recall": 0.8611111111111112,
"eval_ORGANIZATION_f1": 0.783625730994152,
"eval_ORGANIZATION_number": 75,
"eval_ORGANIZATION_precision": 0.6979166666666666,
"eval_ORGANIZATION_recall": 0.8933333333333333,
"eval_PERSON_f1": 0.8963210702341137,
"eval_PERSON_number": 143,
"eval_PERSON_precision": 0.8589743589743589,
"eval_PERSON_recall": 0.9370629370629371,
"eval_QUANTITY_f1": 0.6440677966101694,
"eval_QUANTITY_number": 23,
"eval_QUANTITY_precision": 0.5277777777777778,
"eval_QUANTITY_recall": 0.8260869565217391,
"eval_TIME_f1": 0.7368421052631579,
"eval_TIME_number": 26,
"eval_TIME_precision": 0.6774193548387096,
"eval_TIME_recall": 0.8076923076923077,
"eval_loss": 0.14586655795574188,
"eval_overall_accuracy": 0.9582186639979985,
"eval_overall_f1": 0.8244897959183674,
"eval_overall_precision": 0.7651515151515151,
"eval_overall_recall": 0.8938053097345132,
"eval_runtime": 0.9333,
"eval_samples_per_second": 200.36,
"eval_steps_per_second": 3.214,
"step": 2650
},
{
"epoch": 26.0,
"grad_norm": 0.690096914768219,
"learning_rate": 3.7e-05,
"loss": 0.0731,
"step": 2756
},
{
"epoch": 26.0,
"eval_LOCATION_f1": 0.8,
"eval_LOCATION_number": 72,
"eval_LOCATION_precision": 0.7945205479452054,
"eval_LOCATION_recall": 0.8055555555555556,
"eval_ORGANIZATION_f1": 0.7975460122699386,
"eval_ORGANIZATION_number": 75,
"eval_ORGANIZATION_precision": 0.7386363636363636,
"eval_ORGANIZATION_recall": 0.8666666666666667,
"eval_PERSON_f1": 0.8940397350993377,
"eval_PERSON_number": 143,
"eval_PERSON_precision": 0.8490566037735849,
"eval_PERSON_recall": 0.9440559440559441,
"eval_QUANTITY_f1": 0.7169811320754716,
"eval_QUANTITY_number": 23,
"eval_QUANTITY_precision": 0.6333333333333333,
"eval_QUANTITY_recall": 0.8260869565217391,
"eval_TIME_f1": 0.7777777777777779,
"eval_TIME_number": 26,
"eval_TIME_precision": 0.75,
"eval_TIME_recall": 0.8076923076923077,
"eval_loss": 0.151327446103096,
"eval_overall_accuracy": 0.9587190392794596,
"eval_overall_f1": 0.8312412831241284,
"eval_overall_precision": 0.7883597883597884,
"eval_overall_recall": 0.8790560471976401,
"eval_runtime": 0.9254,
"eval_samples_per_second": 202.071,
"eval_steps_per_second": 3.242,
"step": 2756
},
{
"epoch": 27.0,
"grad_norm": 0.562192440032959,
"learning_rate": 3.65e-05,
"loss": 0.0714,
"step": 2862
},
{
"epoch": 27.0,
"eval_LOCATION_f1": 0.7891156462585034,
"eval_LOCATION_number": 72,
"eval_LOCATION_precision": 0.7733333333333333,
"eval_LOCATION_recall": 0.8055555555555556,
"eval_ORGANIZATION_f1": 0.7654320987654321,
"eval_ORGANIZATION_number": 75,
"eval_ORGANIZATION_precision": 0.7126436781609196,
"eval_ORGANIZATION_recall": 0.8266666666666667,
"eval_PERSON_f1": 0.8903654485049833,
"eval_PERSON_number": 143,
"eval_PERSON_precision": 0.8481012658227848,
"eval_PERSON_recall": 0.9370629370629371,
"eval_QUANTITY_f1": 0.76,
"eval_QUANTITY_number": 23,
"eval_QUANTITY_precision": 0.7037037037037037,
"eval_QUANTITY_recall": 0.8260869565217391,
"eval_TIME_f1": 0.7407407407407408,
"eval_TIME_number": 26,
"eval_TIME_precision": 0.7142857142857143,
"eval_TIME_recall": 0.7692307692307693,
"eval_loss": 0.15548019111156464,
"eval_overall_accuracy": 0.9577182887165374,
"eval_overall_f1": 0.8207282913165266,
"eval_overall_precision": 0.7813333333333333,
"eval_overall_recall": 0.8643067846607669,
"eval_runtime": 0.9366,
"eval_samples_per_second": 199.663,
"eval_steps_per_second": 3.203,
"step": 2862
},
{
"epoch": 28.0,
"grad_norm": 1.1344366073608398,
"learning_rate": 3.6e-05,
"loss": 0.0697,
"step": 2968
},
{
"epoch": 28.0,
"eval_LOCATION_f1": 0.7808219178082192,
"eval_LOCATION_number": 72,
"eval_LOCATION_precision": 0.7702702702702703,
"eval_LOCATION_recall": 0.7916666666666666,
"eval_ORGANIZATION_f1": 0.7607361963190183,
"eval_ORGANIZATION_number": 75,
"eval_ORGANIZATION_precision": 0.7045454545454546,
"eval_ORGANIZATION_recall": 0.8266666666666667,
"eval_PERSON_f1": 0.8993288590604027,
"eval_PERSON_number": 143,
"eval_PERSON_precision": 0.864516129032258,
"eval_PERSON_recall": 0.9370629370629371,
"eval_QUANTITY_f1": 0.7450980392156864,
"eval_QUANTITY_number": 23,
"eval_QUANTITY_precision": 0.6785714285714286,
"eval_QUANTITY_recall": 0.8260869565217391,
"eval_TIME_f1": 0.7407407407407408,
"eval_TIME_number": 26,
"eval_TIME_precision": 0.7142857142857143,
"eval_TIME_recall": 0.7692307692307693,
"eval_loss": 0.14587517082691193,
"eval_overall_accuracy": 0.9587190392794596,
"eval_overall_f1": 0.8202247191011236,
"eval_overall_precision": 0.7828418230563002,
"eval_overall_recall": 0.8613569321533924,
"eval_runtime": 0.92,
"eval_samples_per_second": 203.25,
"eval_steps_per_second": 3.261,
"step": 2968
},
{
"epoch": 29.0,
"grad_norm": 0.7924529910087585,
"learning_rate": 3.55e-05,
"loss": 0.0701,
"step": 3074
},
{
"epoch": 29.0,
"eval_LOCATION_f1": 0.8356164383561645,
"eval_LOCATION_number": 72,
"eval_LOCATION_precision": 0.8243243243243243,
"eval_LOCATION_recall": 0.8472222222222222,
"eval_ORGANIZATION_f1": 0.7176470588235295,
"eval_ORGANIZATION_number": 75,
"eval_ORGANIZATION_precision": 0.6421052631578947,
"eval_ORGANIZATION_recall": 0.8133333333333334,
"eval_PERSON_f1": 0.8986486486486487,
"eval_PERSON_number": 143,
"eval_PERSON_precision": 0.869281045751634,
"eval_PERSON_recall": 0.9300699300699301,
"eval_QUANTITY_f1": 0.5862068965517241,
"eval_QUANTITY_number": 23,
"eval_QUANTITY_precision": 0.4857142857142857,
"eval_QUANTITY_recall": 0.7391304347826086,
"eval_TIME_f1": 0.7272727272727274,
"eval_TIME_number": 26,
"eval_TIME_precision": 0.6896551724137931,
"eval_TIME_recall": 0.7692307692307693,
"eval_loss": 0.1690864861011505,
"eval_overall_accuracy": 0.9532149111833875,
"eval_overall_f1": 0.8055172413793102,
"eval_overall_precision": 0.7564766839378239,
"eval_overall_recall": 0.8613569321533924,
"eval_runtime": 0.929,
"eval_samples_per_second": 201.295,
"eval_steps_per_second": 3.229,
"step": 3074
},
{
"epoch": 30.0,
"grad_norm": 1.1464416980743408,
"learning_rate": 3.5e-05,
"loss": 0.0678,
"step": 3180
},
{
"epoch": 30.0,
"eval_LOCATION_f1": 0.8251748251748252,
"eval_LOCATION_number": 72,
"eval_LOCATION_precision": 0.8309859154929577,
"eval_LOCATION_recall": 0.8194444444444444,
"eval_ORGANIZATION_f1": 0.7484662576687117,
"eval_ORGANIZATION_number": 75,
"eval_ORGANIZATION_precision": 0.6931818181818182,
"eval_ORGANIZATION_recall": 0.8133333333333334,
"eval_PERSON_f1": 0.8963210702341137,
"eval_PERSON_number": 143,
"eval_PERSON_precision": 0.8589743589743589,
"eval_PERSON_recall": 0.9370629370629371,
"eval_QUANTITY_f1": 0.7450980392156864,
"eval_QUANTITY_number": 23,
"eval_QUANTITY_precision": 0.6785714285714286,
"eval_QUANTITY_recall": 0.8260869565217391,
"eval_TIME_f1": 0.7857142857142856,
"eval_TIME_number": 26,
"eval_TIME_precision": 0.7333333333333333,
"eval_TIME_recall": 0.8461538461538461,
"eval_loss": 0.14405371248722076,
"eval_overall_accuracy": 0.9582186639979985,
"eval_overall_f1": 0.8286516853932584,
"eval_overall_precision": 0.7908847184986595,
"eval_overall_recall": 0.8702064896755162,
"eval_runtime": 1.0504,
"eval_samples_per_second": 178.034,
"eval_steps_per_second": 2.856,
"step": 3180
},
{
"epoch": 31.0,
"grad_norm": 0.38195714354515076,
"learning_rate": 3.45e-05,
"loss": 0.0658,
"step": 3286
},
{
"epoch": 31.0,
"eval_LOCATION_f1": 0.8322147651006712,
"eval_LOCATION_number": 72,
"eval_LOCATION_precision": 0.8051948051948052,
"eval_LOCATION_recall": 0.8611111111111112,
"eval_ORGANIZATION_f1": 0.7861271676300577,
"eval_ORGANIZATION_number": 75,
"eval_ORGANIZATION_precision": 0.6938775510204082,
"eval_ORGANIZATION_recall": 0.9066666666666666,
"eval_PERSON_f1": 0.8993288590604027,
"eval_PERSON_number": 143,
"eval_PERSON_precision": 0.864516129032258,
"eval_PERSON_recall": 0.9370629370629371,
"eval_QUANTITY_f1": 0.7755102040816326,
"eval_QUANTITY_number": 23,
"eval_QUANTITY_precision": 0.7307692307692307,
"eval_QUANTITY_recall": 0.8260869565217391,
"eval_TIME_f1": 0.7407407407407408,
"eval_TIME_number": 26,
"eval_TIME_precision": 0.7142857142857143,
"eval_TIME_recall": 0.7692307692307693,
"eval_loss": 0.15743257105350494,
"eval_overall_accuracy": 0.9584688516387291,
"eval_overall_f1": 0.8381742738589212,
"eval_overall_precision": 0.7890625,
"eval_overall_recall": 0.8938053097345132,
"eval_runtime": 0.9177,
"eval_samples_per_second": 203.771,
"eval_steps_per_second": 3.269,
"step": 3286
},
{
"epoch": 32.0,
"grad_norm": 0.8308860659599304,
"learning_rate": 3.4000000000000007e-05,
"loss": 0.0648,
"step": 3392
},
{
"epoch": 32.0,
"eval_LOCATION_f1": 0.8428571428571429,
"eval_LOCATION_number": 72,
"eval_LOCATION_precision": 0.8676470588235294,
"eval_LOCATION_recall": 0.8194444444444444,
"eval_ORGANIZATION_f1": 0.7619047619047621,
"eval_ORGANIZATION_number": 75,
"eval_ORGANIZATION_precision": 0.6881720430107527,
"eval_ORGANIZATION_recall": 0.8533333333333334,
"eval_PERSON_f1": 0.9016949152542374,
"eval_PERSON_number": 143,
"eval_PERSON_precision": 0.875,
"eval_PERSON_recall": 0.9300699300699301,
"eval_QUANTITY_f1": 0.7169811320754716,
"eval_QUANTITY_number": 23,
"eval_QUANTITY_precision": 0.6333333333333333,
"eval_QUANTITY_recall": 0.8260869565217391,
"eval_TIME_f1": 0.8,
"eval_TIME_number": 26,
"eval_TIME_precision": 0.7586206896551724,
"eval_TIME_recall": 0.8461538461538461,
"eval_loss": 0.1516529768705368,
"eval_overall_accuracy": 0.9597197898423818,
"eval_overall_f1": 0.8354430379746836,
"eval_overall_precision": 0.7983870967741935,
"eval_overall_recall": 0.8761061946902655,
"eval_runtime": 1.0211,
"eval_samples_per_second": 183.135,
"eval_steps_per_second": 2.938,
"step": 3392
},
{
"epoch": 33.0,
"grad_norm": 0.37685203552246094,
"learning_rate": 3.35e-05,
"loss": 0.0626,
"step": 3498
},
{
"epoch": 33.0,
"eval_LOCATION_f1": 0.7945205479452055,
"eval_LOCATION_number": 72,
"eval_LOCATION_precision": 0.7837837837837838,
"eval_LOCATION_recall": 0.8055555555555556,
"eval_ORGANIZATION_f1": 0.7810650887573964,
"eval_ORGANIZATION_number": 75,
"eval_ORGANIZATION_precision": 0.7021276595744681,
"eval_ORGANIZATION_recall": 0.88,
"eval_PERSON_f1": 0.9016949152542374,
"eval_PERSON_number": 143,
"eval_PERSON_precision": 0.875,
"eval_PERSON_recall": 0.9300699300699301,
"eval_QUANTITY_f1": 0.6792452830188679,
"eval_QUANTITY_number": 23,
"eval_QUANTITY_precision": 0.6,
"eval_QUANTITY_recall": 0.782608695652174,
"eval_TIME_f1": 0.75,
"eval_TIME_number": 26,
"eval_TIME_precision": 0.7,
"eval_TIME_recall": 0.8076923076923077,
"eval_loss": 0.15304860472679138,
"eval_overall_accuracy": 0.9584688516387291,
"eval_overall_f1": 0.82336578581363,
"eval_overall_precision": 0.7789473684210526,
"eval_overall_recall": 0.8731563421828908,
"eval_runtime": 0.9446,
"eval_samples_per_second": 197.961,
"eval_steps_per_second": 3.176,
"step": 3498
},
{
"epoch": 34.0,
"grad_norm": 1.1034225225448608,
"learning_rate": 3.3e-05,
"loss": 0.0631,
"step": 3604
},
{
"epoch": 34.0,
"eval_LOCATION_f1": 0.8378378378378377,
"eval_LOCATION_number": 72,
"eval_LOCATION_precision": 0.8157894736842105,
"eval_LOCATION_recall": 0.8611111111111112,
"eval_ORGANIZATION_f1": 0.7953216374269007,
"eval_ORGANIZATION_number": 75,
"eval_ORGANIZATION_precision": 0.7083333333333334,
"eval_ORGANIZATION_recall": 0.9066666666666666,
"eval_PERSON_f1": 0.903010033444816,
"eval_PERSON_number": 143,
"eval_PERSON_precision": 0.8653846153846154,
"eval_PERSON_recall": 0.9440559440559441,
"eval_QUANTITY_f1": 0.6545454545454547,
"eval_QUANTITY_number": 23,
"eval_QUANTITY_precision": 0.5625,
"eval_QUANTITY_recall": 0.782608695652174,
"eval_TIME_f1": 0.7241379310344829,
"eval_TIME_number": 26,
"eval_TIME_precision": 0.65625,
"eval_TIME_recall": 0.8076923076923077,
"eval_loss": 0.16854536533355713,
"eval_overall_accuracy": 0.9572179134350763,
"eval_overall_f1": 0.8317373461012312,
"eval_overall_precision": 0.7755102040816326,
"eval_overall_recall": 0.8967551622418879,
"eval_runtime": 0.937,
"eval_samples_per_second": 199.569,
"eval_steps_per_second": 3.202,
"step": 3604
},
{
"epoch": 35.0,
"grad_norm": 1.6754740476608276,
"learning_rate": 3.2500000000000004e-05,
"loss": 0.0598,
"step": 3710
},
{
"epoch": 35.0,
"eval_LOCATION_f1": 0.8707482993197277,
"eval_LOCATION_number": 72,
"eval_LOCATION_precision": 0.8533333333333334,
"eval_LOCATION_recall": 0.8888888888888888,
"eval_ORGANIZATION_f1": 0.7784431137724551,
"eval_ORGANIZATION_number": 75,
"eval_ORGANIZATION_precision": 0.7065217391304348,
"eval_ORGANIZATION_recall": 0.8666666666666667,
"eval_PERSON_f1": 0.8986486486486487,
"eval_PERSON_number": 143,
"eval_PERSON_precision": 0.869281045751634,
"eval_PERSON_recall": 0.9300699300699301,
"eval_QUANTITY_f1": 0.631578947368421,
"eval_QUANTITY_number": 23,
"eval_QUANTITY_precision": 0.5294117647058824,
"eval_QUANTITY_recall": 0.782608695652174,
"eval_TIME_f1": 0.7547169811320754,
"eval_TIME_number": 26,
"eval_TIME_precision": 0.7407407407407407,
"eval_TIME_recall": 0.7692307692307693,
"eval_loss": 0.1640816181898117,
"eval_overall_accuracy": 0.957968476357268,
"eval_overall_f1": 0.8333333333333335,
"eval_overall_precision": 0.7874015748031497,
"eval_overall_recall": 0.8849557522123894,
"eval_runtime": 0.9325,
"eval_samples_per_second": 200.545,
"eval_steps_per_second": 3.217,
"step": 3710
},
{
"epoch": 36.0,
"grad_norm": 0.5667424201965332,
"learning_rate": 3.2000000000000005e-05,
"loss": 0.06,
"step": 3816
},
{
"epoch": 36.0,
"eval_LOCATION_f1": 0.8053691275167787,
"eval_LOCATION_number": 72,
"eval_LOCATION_precision": 0.7792207792207793,
"eval_LOCATION_recall": 0.8333333333333334,
"eval_ORGANIZATION_f1": 0.7738095238095238,
"eval_ORGANIZATION_number": 75,
"eval_ORGANIZATION_precision": 0.6989247311827957,
"eval_ORGANIZATION_recall": 0.8666666666666667,
"eval_PERSON_f1": 0.8963210702341137,
"eval_PERSON_number": 143,
"eval_PERSON_precision": 0.8589743589743589,
"eval_PERSON_recall": 0.9370629370629371,
"eval_QUANTITY_f1": 0.7346938775510203,
"eval_QUANTITY_number": 23,
"eval_QUANTITY_precision": 0.6923076923076923,
"eval_QUANTITY_recall": 0.782608695652174,
"eval_TIME_f1": 0.75,
"eval_TIME_number": 26,
"eval_TIME_precision": 0.7,
"eval_TIME_recall": 0.8076923076923077,
"eval_loss": 0.1585589498281479,
"eval_overall_accuracy": 0.9589692269201902,
"eval_overall_f1": 0.826629680998613,
"eval_overall_precision": 0.7801047120418848,
"eval_overall_recall": 0.8790560471976401,
"eval_runtime": 0.9262,
"eval_samples_per_second": 201.894,
"eval_steps_per_second": 3.239,
"step": 3816
},
{
"epoch": 37.0,
"grad_norm": 2.2813751697540283,
"learning_rate": 3.15e-05,
"loss": 0.0564,
"step": 3922
},
{
"epoch": 37.0,
"eval_LOCATION_f1": 0.8322147651006712,
"eval_LOCATION_number": 72,
"eval_LOCATION_precision": 0.8051948051948052,
"eval_LOCATION_recall": 0.8611111111111112,
"eval_ORGANIZATION_f1": 0.7701149425287357,
"eval_ORGANIZATION_number": 75,
"eval_ORGANIZATION_precision": 0.6767676767676768,
"eval_ORGANIZATION_recall": 0.8933333333333333,
"eval_PERSON_f1": 0.8993288590604027,
"eval_PERSON_number": 143,
"eval_PERSON_precision": 0.864516129032258,
"eval_PERSON_recall": 0.9370629370629371,
"eval_QUANTITY_f1": 0.7058823529411765,
"eval_QUANTITY_number": 23,
"eval_QUANTITY_precision": 0.6428571428571429,
"eval_QUANTITY_recall": 0.782608695652174,
"eval_TIME_f1": 0.75,
"eval_TIME_number": 26,
"eval_TIME_precision": 0.7,
"eval_TIME_recall": 0.8076923076923077,
"eval_loss": 0.16692771017551422,
"eval_overall_accuracy": 0.9594696022016512,
"eval_overall_f1": 0.8296703296703297,
"eval_overall_precision": 0.7763496143958869,
"eval_overall_recall": 0.8908554572271387,
"eval_runtime": 0.9304,
"eval_samples_per_second": 200.987,
"eval_steps_per_second": 3.224,
"step": 3922
},
{
"epoch": 38.0,
"grad_norm": 1.5005148649215698,
"learning_rate": 3.1e-05,
"loss": 0.0583,
"step": 4028
},
{
"epoch": 38.0,
"eval_LOCATION_f1": 0.8169014084507044,
"eval_LOCATION_number": 72,
"eval_LOCATION_precision": 0.8285714285714286,
"eval_LOCATION_recall": 0.8055555555555556,
"eval_ORGANIZATION_f1": 0.7721518987341773,
"eval_ORGANIZATION_number": 75,
"eval_ORGANIZATION_precision": 0.7349397590361446,
"eval_ORGANIZATION_recall": 0.8133333333333334,
"eval_PERSON_f1": 0.9090909090909092,
"eval_PERSON_number": 143,
"eval_PERSON_precision": 0.8766233766233766,
"eval_PERSON_recall": 0.9440559440559441,
"eval_QUANTITY_f1": 0.72,
"eval_QUANTITY_number": 23,
"eval_QUANTITY_precision": 0.6666666666666666,
"eval_QUANTITY_recall": 0.782608695652174,
"eval_TIME_f1": 0.7924528301886792,
"eval_TIME_number": 26,
"eval_TIME_precision": 0.7777777777777778,
"eval_TIME_recall": 0.8076923076923077,
"eval_loss": 0.15361984074115753,
"eval_overall_accuracy": 0.960720540405304,
"eval_overall_f1": 0.8371428571428572,
"eval_overall_precision": 0.8116343490304709,
"eval_overall_recall": 0.8643067846607669,
"eval_runtime": 0.9285,
"eval_samples_per_second": 201.402,
"eval_steps_per_second": 3.231,
"step": 4028
},
{
"epoch": 39.0,
"grad_norm": 0.37653887271881104,
"learning_rate": 3.05e-05,
"loss": 0.0545,
"step": 4134
},
{
"epoch": 39.0,
"eval_LOCATION_f1": 0.8111888111888113,
"eval_LOCATION_number": 72,
"eval_LOCATION_precision": 0.8169014084507042,
"eval_LOCATION_recall": 0.8055555555555556,
"eval_ORGANIZATION_f1": 0.7647058823529413,
"eval_ORGANIZATION_number": 75,
"eval_ORGANIZATION_precision": 0.6842105263157895,
"eval_ORGANIZATION_recall": 0.8666666666666667,
"eval_PERSON_f1": 0.9,
"eval_PERSON_number": 143,
"eval_PERSON_precision": 0.8598726114649682,
"eval_PERSON_recall": 0.9440559440559441,
"eval_QUANTITY_f1": 0.7307692307692308,
"eval_QUANTITY_number": 23,
"eval_QUANTITY_precision": 0.6551724137931034,
"eval_QUANTITY_recall": 0.8260869565217391,
"eval_TIME_f1": 0.7407407407407408,
"eval_TIME_number": 26,
"eval_TIME_precision": 0.7142857142857143,
"eval_TIME_recall": 0.7692307692307693,
"eval_loss": 0.16966940462589264,
"eval_overall_accuracy": 0.957968476357268,
"eval_overall_f1": 0.8261474269819195,
"eval_overall_precision": 0.781578947368421,
"eval_overall_recall": 0.8761061946902655,
"eval_runtime": 0.9372,
"eval_samples_per_second": 199.533,
"eval_steps_per_second": 3.201,
"step": 4134
},
{
"epoch": 40.0,
"grad_norm": 1.0764912366867065,
"learning_rate": 3e-05,
"loss": 0.0555,
"step": 4240
},
{
"epoch": 40.0,
"eval_LOCATION_f1": 0.8456375838926175,
"eval_LOCATION_number": 72,
"eval_LOCATION_precision": 0.8181818181818182,
"eval_LOCATION_recall": 0.875,
"eval_ORGANIZATION_f1": 0.7784431137724551,
"eval_ORGANIZATION_number": 75,
"eval_ORGANIZATION_precision": 0.7065217391304348,
"eval_ORGANIZATION_recall": 0.8666666666666667,
"eval_PERSON_f1": 0.8963210702341137,
"eval_PERSON_number": 143,
"eval_PERSON_precision": 0.8589743589743589,
"eval_PERSON_recall": 0.9370629370629371,
"eval_QUANTITY_f1": 0.6923076923076923,
"eval_QUANTITY_number": 23,
"eval_QUANTITY_precision": 0.6206896551724138,
"eval_QUANTITY_recall": 0.782608695652174,
"eval_TIME_f1": 0.6896551724137931,
"eval_TIME_number": 26,
"eval_TIME_precision": 0.625,
"eval_TIME_recall": 0.7692307692307693,
"eval_loss": 0.16699136793613434,
"eval_overall_accuracy": 0.9587190392794596,
"eval_overall_f1": 0.8275862068965517,
"eval_overall_precision": 0.7772020725388601,
"eval_overall_recall": 0.8849557522123894,
"eval_runtime": 0.9355,
"eval_samples_per_second": 199.887,
"eval_steps_per_second": 3.207,
"step": 4240
},
{
"epoch": 41.0,
"grad_norm": 1.2565559148788452,
"learning_rate": 2.95e-05,
"loss": 0.0536,
"step": 4346
},
{
"epoch": 41.0,
"eval_LOCATION_f1": 0.8513513513513513,
"eval_LOCATION_number": 72,
"eval_LOCATION_precision": 0.8289473684210527,
"eval_LOCATION_recall": 0.875,
"eval_ORGANIZATION_f1": 0.7928994082840236,
"eval_ORGANIZATION_number": 75,
"eval_ORGANIZATION_precision": 0.7127659574468085,
"eval_ORGANIZATION_recall": 0.8933333333333333,
"eval_PERSON_f1": 0.8963210702341137,
"eval_PERSON_number": 143,
"eval_PERSON_precision": 0.8589743589743589,
"eval_PERSON_recall": 0.9370629370629371,
"eval_QUANTITY_f1": 0.72,
"eval_QUANTITY_number": 23,
"eval_QUANTITY_precision": 0.6666666666666666,
"eval_QUANTITY_recall": 0.782608695652174,
"eval_TIME_f1": 0.7368421052631579,
"eval_TIME_number": 26,
"eval_TIME_precision": 0.6774193548387096,
"eval_TIME_recall": 0.8076923076923077,
"eval_loss": 0.16643501818180084,
"eval_overall_accuracy": 0.9599699774831123,
"eval_overall_f1": 0.8381742738589212,
"eval_overall_precision": 0.7890625,
"eval_overall_recall": 0.8938053097345132,
"eval_runtime": 0.9907,
"eval_samples_per_second": 188.749,
"eval_steps_per_second": 3.028,
"step": 4346
},
{
"epoch": 42.0,
"grad_norm": 0.8656229376792908,
"learning_rate": 2.9e-05,
"loss": 0.0528,
"step": 4452
},
{
"epoch": 42.0,
"eval_LOCATION_f1": 0.8827586206896552,
"eval_LOCATION_number": 72,
"eval_LOCATION_precision": 0.8767123287671232,
"eval_LOCATION_recall": 0.8888888888888888,
"eval_ORGANIZATION_f1": 0.7607361963190183,
"eval_ORGANIZATION_number": 75,
"eval_ORGANIZATION_precision": 0.7045454545454546,
"eval_ORGANIZATION_recall": 0.8266666666666667,
"eval_PERSON_f1": 0.903010033444816,
"eval_PERSON_number": 143,
"eval_PERSON_precision": 0.8653846153846154,
"eval_PERSON_recall": 0.9440559440559441,
"eval_QUANTITY_f1": 0.6206896551724138,
"eval_QUANTITY_number": 23,
"eval_QUANTITY_precision": 0.5142857142857142,
"eval_QUANTITY_recall": 0.782608695652174,
"eval_TIME_f1": 0.7272727272727274,
"eval_TIME_number": 26,
"eval_TIME_precision": 0.6896551724137931,
"eval_TIME_recall": 0.7692307692307693,
"eval_loss": 0.1719001978635788,
"eval_overall_accuracy": 0.9574681010758068,
"eval_overall_f1": 0.8305555555555555,
"eval_overall_precision": 0.7847769028871391,
"eval_overall_recall": 0.8820058997050148,
"eval_runtime": 0.9302,
"eval_samples_per_second": 201.029,
"eval_steps_per_second": 3.225,
"step": 4452
},
{
"epoch": 43.0,
"grad_norm": 0.4717106819152832,
"learning_rate": 2.8499999999999998e-05,
"loss": 0.0505,
"step": 4558
},
{
"epoch": 43.0,
"eval_LOCATION_f1": 0.8413793103448277,
"eval_LOCATION_number": 72,
"eval_LOCATION_precision": 0.8356164383561644,
"eval_LOCATION_recall": 0.8472222222222222,
"eval_ORGANIZATION_f1": 0.7469879518072289,
"eval_ORGANIZATION_number": 75,
"eval_ORGANIZATION_precision": 0.6813186813186813,
"eval_ORGANIZATION_recall": 0.8266666666666667,
"eval_PERSON_f1": 0.8926174496644295,
"eval_PERSON_number": 143,
"eval_PERSON_precision": 0.8580645161290322,
"eval_PERSON_recall": 0.9300699300699301,
"eval_QUANTITY_f1": 0.6428571428571429,
"eval_QUANTITY_number": 23,
"eval_QUANTITY_precision": 0.5454545454545454,
"eval_QUANTITY_recall": 0.782608695652174,
"eval_TIME_f1": 0.7272727272727274,
"eval_TIME_number": 26,
"eval_TIME_precision": 0.6896551724137931,
"eval_TIME_recall": 0.7692307692307693,
"eval_loss": 0.1703517884016037,
"eval_overall_accuracy": 0.9552164123092319,
"eval_overall_f1": 0.8166666666666667,
"eval_overall_precision": 0.7716535433070866,
"eval_overall_recall": 0.8672566371681416,
"eval_runtime": 0.9281,
"eval_samples_per_second": 201.476,
"eval_steps_per_second": 3.232,
"step": 4558
},
{
"epoch": 44.0,
"grad_norm": 0.6283421516418457,
"learning_rate": 2.8000000000000003e-05,
"loss": 0.05,
"step": 4664
},
{
"epoch": 44.0,
"eval_LOCATION_f1": 0.8053691275167787,
"eval_LOCATION_number": 72,
"eval_LOCATION_precision": 0.7792207792207793,
"eval_LOCATION_recall": 0.8333333333333334,
"eval_ORGANIZATION_f1": 0.7607361963190183,
"eval_ORGANIZATION_number": 75,
"eval_ORGANIZATION_precision": 0.7045454545454546,
"eval_ORGANIZATION_recall": 0.8266666666666667,
"eval_PERSON_f1": 0.903010033444816,
"eval_PERSON_number": 143,
"eval_PERSON_precision": 0.8653846153846154,
"eval_PERSON_recall": 0.9440559440559441,
"eval_QUANTITY_f1": 0.6792452830188679,
"eval_QUANTITY_number": 23,
"eval_QUANTITY_precision": 0.6,
"eval_QUANTITY_recall": 0.782608695652174,
"eval_TIME_f1": 0.7272727272727274,
"eval_TIME_number": 26,
"eval_TIME_precision": 0.6896551724137931,
"eval_TIME_recall": 0.7692307692307693,
"eval_loss": 0.16587650775909424,
"eval_overall_accuracy": 0.9574681010758068,
"eval_overall_f1": 0.8205841446453408,
"eval_overall_precision": 0.7763157894736842,
"eval_overall_recall": 0.8702064896755162,
"eval_runtime": 0.933,
"eval_samples_per_second": 200.427,
"eval_steps_per_second": 3.215,
"step": 4664
},
{
"epoch": 45.0,
"grad_norm": 0.7488293051719666,
"learning_rate": 2.7500000000000004e-05,
"loss": 0.0515,
"step": 4770
},
{
"epoch": 45.0,
"eval_LOCATION_f1": 0.8611111111111112,
"eval_LOCATION_number": 72,
"eval_LOCATION_precision": 0.8611111111111112,
"eval_LOCATION_recall": 0.8611111111111112,
"eval_ORGANIZATION_f1": 0.759493670886076,
"eval_ORGANIZATION_number": 75,
"eval_ORGANIZATION_precision": 0.7228915662650602,
"eval_ORGANIZATION_recall": 0.8,
"eval_PERSON_f1": 0.8874172185430464,
"eval_PERSON_number": 143,
"eval_PERSON_precision": 0.8427672955974843,
"eval_PERSON_recall": 0.9370629370629371,
"eval_QUANTITY_f1": 0.631578947368421,
"eval_QUANTITY_number": 23,
"eval_QUANTITY_precision": 0.5294117647058824,
"eval_QUANTITY_recall": 0.782608695652174,
"eval_TIME_f1": 0.7407407407407408,
"eval_TIME_number": 26,
"eval_TIME_precision": 0.7142857142857143,
"eval_TIME_recall": 0.7692307692307693,
"eval_loss": 0.17817422747612,
"eval_overall_accuracy": 0.9544658493870403,
"eval_overall_f1": 0.8223776223776224,
"eval_overall_precision": 0.7819148936170213,
"eval_overall_recall": 0.8672566371681416,
"eval_runtime": 0.9321,
"eval_samples_per_second": 200.616,
"eval_steps_per_second": 3.218,
"step": 4770
},
{
"epoch": 46.0,
"grad_norm": 0.3455760180950165,
"learning_rate": 2.7000000000000002e-05,
"loss": 0.0484,
"step": 4876
},
{
"epoch": 46.0,
"eval_LOCATION_f1": 0.8356164383561645,
"eval_LOCATION_number": 72,
"eval_LOCATION_precision": 0.8243243243243243,
"eval_LOCATION_recall": 0.8472222222222222,
"eval_ORGANIZATION_f1": 0.7672955974842767,
"eval_ORGANIZATION_number": 75,
"eval_ORGANIZATION_precision": 0.7261904761904762,
"eval_ORGANIZATION_recall": 0.8133333333333334,
"eval_PERSON_f1": 0.8750000000000001,
"eval_PERSON_number": 143,
"eval_PERSON_precision": 0.8260869565217391,
"eval_PERSON_recall": 0.9300699300699301,
"eval_QUANTITY_f1": 0.6792452830188679,
"eval_QUANTITY_number": 23,
"eval_QUANTITY_precision": 0.6,
"eval_QUANTITY_recall": 0.782608695652174,
"eval_TIME_f1": 0.7547169811320754,
"eval_TIME_number": 26,
"eval_TIME_precision": 0.7407407407407407,
"eval_TIME_recall": 0.7692307692307693,
"eval_loss": 0.1757228672504425,
"eval_overall_accuracy": 0.9549662246685013,
"eval_overall_f1": 0.8195804195804196,
"eval_overall_precision": 0.7792553191489362,
"eval_overall_recall": 0.8643067846607669,
"eval_runtime": 0.9328,
"eval_samples_per_second": 200.479,
"eval_steps_per_second": 3.216,
"step": 4876
},
{
"epoch": 47.0,
"grad_norm": 0.9659437537193298,
"learning_rate": 2.6500000000000004e-05,
"loss": 0.0477,
"step": 4982
},
{
"epoch": 47.0,
"eval_LOCATION_f1": 0.8413793103448277,
"eval_LOCATION_number": 72,
"eval_LOCATION_precision": 0.8356164383561644,
"eval_LOCATION_recall": 0.8472222222222222,
"eval_ORGANIZATION_f1": 0.7547169811320756,
"eval_ORGANIZATION_number": 75,
"eval_ORGANIZATION_precision": 0.7142857142857143,
"eval_ORGANIZATION_recall": 0.8,
"eval_PERSON_f1": 0.8844884488448846,
"eval_PERSON_number": 143,
"eval_PERSON_precision": 0.8375,
"eval_PERSON_recall": 0.9370629370629371,
"eval_QUANTITY_f1": 0.6545454545454547,
"eval_QUANTITY_number": 23,
"eval_QUANTITY_precision": 0.5625,
"eval_QUANTITY_recall": 0.782608695652174,
"eval_TIME_f1": 0.7272727272727274,
"eval_TIME_number": 26,
"eval_TIME_precision": 0.6896551724137931,
"eval_TIME_recall": 0.7692307692307693,
"eval_loss": 0.17942465841770172,
"eval_overall_accuracy": 0.9549662246685013,
"eval_overall_f1": 0.8172942817294282,
"eval_overall_precision": 0.7751322751322751,
"eval_overall_recall": 0.8643067846607669,
"eval_runtime": 0.9384,
"eval_samples_per_second": 199.28,
"eval_steps_per_second": 3.197,
"step": 4982
},
{
"epoch": 48.0,
"grad_norm": 0.39018484950065613,
"learning_rate": 2.6000000000000002e-05,
"loss": 0.0456,
"step": 5088
},
{
"epoch": 48.0,
"eval_LOCATION_f1": 0.8472222222222222,
"eval_LOCATION_number": 72,
"eval_LOCATION_precision": 0.8472222222222222,
"eval_LOCATION_recall": 0.8472222222222222,
"eval_ORGANIZATION_f1": 0.779874213836478,
"eval_ORGANIZATION_number": 75,
"eval_ORGANIZATION_precision": 0.7380952380952381,
"eval_ORGANIZATION_recall": 0.8266666666666667,
"eval_PERSON_f1": 0.9060402684563759,
"eval_PERSON_number": 143,
"eval_PERSON_precision": 0.8709677419354839,
"eval_PERSON_recall": 0.9440559440559441,
"eval_QUANTITY_f1": 0.7058823529411765,
"eval_QUANTITY_number": 23,
"eval_QUANTITY_precision": 0.6428571428571429,
"eval_QUANTITY_recall": 0.782608695652174,
"eval_TIME_f1": 0.7272727272727274,
"eval_TIME_number": 26,
"eval_TIME_precision": 0.6896551724137931,
"eval_TIME_recall": 0.7692307692307693,
"eval_loss": 0.16816405951976776,
"eval_overall_accuracy": 0.9609707280460346,
"eval_overall_f1": 0.8373408769448375,
"eval_overall_precision": 0.8043478260869565,
"eval_overall_recall": 0.8731563421828908,
"eval_runtime": 0.9286,
"eval_samples_per_second": 201.387,
"eval_steps_per_second": 3.231,
"step": 5088
},
{
"epoch": 49.0,
"grad_norm": 0.4282808303833008,
"learning_rate": 2.5500000000000003e-05,
"loss": 0.0458,
"step": 5194
},
{
"epoch": 49.0,
"eval_LOCATION_f1": 0.8689655172413793,
"eval_LOCATION_number": 72,
"eval_LOCATION_precision": 0.863013698630137,
"eval_LOCATION_recall": 0.875,
"eval_ORGANIZATION_f1": 0.7052023121387283,
"eval_ORGANIZATION_number": 75,
"eval_ORGANIZATION_precision": 0.6224489795918368,
"eval_ORGANIZATION_recall": 0.8133333333333334,
"eval_PERSON_f1": 0.8903654485049833,
"eval_PERSON_number": 143,
"eval_PERSON_precision": 0.8481012658227848,
"eval_PERSON_recall": 0.9370629370629371,
"eval_QUANTITY_f1": 0.6545454545454547,
"eval_QUANTITY_number": 23,
"eval_QUANTITY_precision": 0.5625,
"eval_QUANTITY_recall": 0.782608695652174,
"eval_TIME_f1": 0.7407407407407408,
"eval_TIME_number": 26,
"eval_TIME_precision": 0.7142857142857143,
"eval_TIME_recall": 0.7692307692307693,
"eval_loss": 0.18153227865695953,
"eval_overall_accuracy": 0.9547160370277709,
"eval_overall_f1": 0.8131868131868133,
"eval_overall_precision": 0.7609254498714653,
"eval_overall_recall": 0.8731563421828908,
"eval_runtime": 0.927,
"eval_samples_per_second": 201.727,
"eval_steps_per_second": 3.236,
"step": 5194
},
{
"epoch": 50.0,
"grad_norm": 0.5775999426841736,
"learning_rate": 2.5e-05,
"loss": 0.0449,
"step": 5300
},
{
"epoch": 50.0,
"eval_LOCATION_f1": 0.8571428571428572,
"eval_LOCATION_number": 72,
"eval_LOCATION_precision": 0.84,
"eval_LOCATION_recall": 0.875,
"eval_ORGANIZATION_f1": 0.728395061728395,
"eval_ORGANIZATION_number": 75,
"eval_ORGANIZATION_precision": 0.6781609195402298,
"eval_ORGANIZATION_recall": 0.7866666666666666,
"eval_PERSON_f1": 0.9054054054054055,
"eval_PERSON_number": 143,
"eval_PERSON_precision": 0.8758169934640523,
"eval_PERSON_recall": 0.9370629370629371,
"eval_QUANTITY_f1": 0.6666666666666667,
"eval_QUANTITY_number": 23,
"eval_QUANTITY_precision": 0.5806451612903226,
"eval_QUANTITY_recall": 0.782608695652174,
"eval_TIME_f1": 0.7142857142857142,
"eval_TIME_number": 26,
"eval_TIME_precision": 0.6666666666666666,
"eval_TIME_recall": 0.7692307692307693,
"eval_loss": 0.17358513176441193,
"eval_overall_accuracy": 0.9577182887165374,
"eval_overall_f1": 0.8223776223776224,
"eval_overall_precision": 0.7819148936170213,
"eval_overall_recall": 0.8672566371681416,
"eval_runtime": 0.9332,
"eval_samples_per_second": 200.395,
"eval_steps_per_second": 3.215,
"step": 5300
},
{
"epoch": 51.0,
"grad_norm": 0.8392077684402466,
"learning_rate": 2.45e-05,
"loss": 0.0443,
"step": 5406
},
{
"epoch": 51.0,
"eval_LOCATION_f1": 0.8378378378378377,
"eval_LOCATION_number": 72,
"eval_LOCATION_precision": 0.8157894736842105,
"eval_LOCATION_recall": 0.8611111111111112,
"eval_ORGANIZATION_f1": 0.7636363636363636,
"eval_ORGANIZATION_number": 75,
"eval_ORGANIZATION_precision": 0.7,
"eval_ORGANIZATION_recall": 0.84,
"eval_PERSON_f1": 0.8721311475409836,
"eval_PERSON_number": 143,
"eval_PERSON_precision": 0.8209876543209876,
"eval_PERSON_recall": 0.9300699300699301,
"eval_QUANTITY_f1": 0.7058823529411765,
"eval_QUANTITY_number": 23,
"eval_QUANTITY_precision": 0.6428571428571429,
"eval_QUANTITY_recall": 0.782608695652174,
"eval_TIME_f1": 0.7407407407407408,
"eval_TIME_number": 26,
"eval_TIME_precision": 0.7142857142857143,
"eval_TIME_recall": 0.7692307692307693,
"eval_loss": 0.17768125236034393,
"eval_overall_accuracy": 0.9572179134350763,
"eval_overall_f1": 0.8188105117565698,
"eval_overall_precision": 0.7708333333333334,
"eval_overall_recall": 0.8731563421828908,
"eval_runtime": 0.9419,
"eval_samples_per_second": 198.534,
"eval_steps_per_second": 3.185,
"step": 5406
},
{
"epoch": 52.0,
"grad_norm": 0.5880552530288696,
"learning_rate": 2.4e-05,
"loss": 0.044,
"step": 5512
},
{
"epoch": 52.0,
"eval_LOCATION_f1": 0.8648648648648649,
"eval_LOCATION_number": 72,
"eval_LOCATION_precision": 0.8421052631578947,
"eval_LOCATION_recall": 0.8888888888888888,
"eval_ORGANIZATION_f1": 0.7484662576687117,
"eval_ORGANIZATION_number": 75,
"eval_ORGANIZATION_precision": 0.6931818181818182,
"eval_ORGANIZATION_recall": 0.8133333333333334,
"eval_PERSON_f1": 0.9023569023569024,
"eval_PERSON_number": 143,
"eval_PERSON_precision": 0.8701298701298701,
"eval_PERSON_recall": 0.9370629370629371,
"eval_QUANTITY_f1": 0.6792452830188679,
"eval_QUANTITY_number": 23,
"eval_QUANTITY_precision": 0.6,
"eval_QUANTITY_recall": 0.782608695652174,
"eval_TIME_f1": 0.7272727272727274,
"eval_TIME_number": 26,
"eval_TIME_precision": 0.6896551724137931,
"eval_TIME_recall": 0.7692307692307693,
"eval_loss": 0.17750605940818787,
"eval_overall_accuracy": 0.9574681010758068,
"eval_overall_f1": 0.8296089385474861,
"eval_overall_precision": 0.7877984084880637,
"eval_overall_recall": 0.8761061946902655,
"eval_runtime": 0.9391,
"eval_samples_per_second": 199.121,
"eval_steps_per_second": 3.194,
"step": 5512
},
{
"epoch": 53.0,
"grad_norm": 0.7479882836341858,
"learning_rate": 2.35e-05,
"loss": 0.0436,
"step": 5618
},
{
"epoch": 53.0,
"eval_LOCATION_f1": 0.8648648648648649,
"eval_LOCATION_number": 72,
"eval_LOCATION_precision": 0.8421052631578947,
"eval_LOCATION_recall": 0.8888888888888888,
"eval_ORGANIZATION_f1": 0.7469879518072289,
"eval_ORGANIZATION_number": 75,
"eval_ORGANIZATION_precision": 0.6813186813186813,
"eval_ORGANIZATION_recall": 0.8266666666666667,
"eval_PERSON_f1": 0.8933333333333333,
"eval_PERSON_number": 143,
"eval_PERSON_precision": 0.8535031847133758,
"eval_PERSON_recall": 0.9370629370629371,
"eval_QUANTITY_f1": 0.6545454545454547,
"eval_QUANTITY_number": 23,
"eval_QUANTITY_precision": 0.5625,
"eval_QUANTITY_recall": 0.782608695652174,
"eval_TIME_f1": 0.7142857142857142,
"eval_TIME_number": 26,
"eval_TIME_precision": 0.6666666666666666,
"eval_TIME_recall": 0.7692307692307693,
"eval_loss": 0.17619207501411438,
"eval_overall_accuracy": 0.9572179134350763,
"eval_overall_f1": 0.8220689655172414,
"eval_overall_precision": 0.772020725388601,
"eval_overall_recall": 0.8790560471976401,
"eval_runtime": 0.9329,
"eval_samples_per_second": 200.454,
"eval_steps_per_second": 3.216,
"step": 5618
},
{
"epoch": 54.0,
"grad_norm": 0.6151536703109741,
"learning_rate": 2.3000000000000003e-05,
"loss": 0.0416,
"step": 5724
},
{
"epoch": 54.0,
"eval_LOCATION_f1": 0.8611111111111112,
"eval_LOCATION_number": 72,
"eval_LOCATION_precision": 0.8611111111111112,
"eval_LOCATION_recall": 0.8611111111111112,
"eval_ORGANIZATION_f1": 0.7393939393939395,
"eval_ORGANIZATION_number": 75,
"eval_ORGANIZATION_precision": 0.6777777777777778,
"eval_ORGANIZATION_recall": 0.8133333333333334,
"eval_PERSON_f1": 0.8844884488448846,
"eval_PERSON_number": 143,
"eval_PERSON_precision": 0.8375,
"eval_PERSON_recall": 0.9370629370629371,
"eval_QUANTITY_f1": 0.7058823529411765,
"eval_QUANTITY_number": 23,
"eval_QUANTITY_precision": 0.6428571428571429,
"eval_QUANTITY_recall": 0.782608695652174,
"eval_TIME_f1": 0.7777777777777779,
"eval_TIME_number": 26,
"eval_TIME_precision": 0.75,
"eval_TIME_recall": 0.8076923076923077,
"eval_loss": 0.18319469690322876,
"eval_overall_accuracy": 0.9569677257943457,
"eval_overall_f1": 0.8256624825662482,
"eval_overall_precision": 0.783068783068783,
"eval_overall_recall": 0.8731563421828908,
"eval_runtime": 0.9355,
"eval_samples_per_second": 199.902,
"eval_steps_per_second": 3.207,
"step": 5724
},
{
"epoch": 55.0,
"grad_norm": 0.720840334892273,
"learning_rate": 2.25e-05,
"loss": 0.0403,
"step": 5830
},
{
"epoch": 55.0,
"eval_LOCATION_f1": 0.8322147651006712,
"eval_LOCATION_number": 72,
"eval_LOCATION_precision": 0.8051948051948052,
"eval_LOCATION_recall": 0.8611111111111112,
"eval_ORGANIZATION_f1": 0.7471264367816093,
"eval_ORGANIZATION_number": 75,
"eval_ORGANIZATION_precision": 0.6565656565656566,
"eval_ORGANIZATION_recall": 0.8666666666666667,
"eval_PERSON_f1": 0.8786885245901639,
"eval_PERSON_number": 143,
"eval_PERSON_precision": 0.8271604938271605,
"eval_PERSON_recall": 0.9370629370629371,
"eval_QUANTITY_f1": 0.7058823529411765,
"eval_QUANTITY_number": 23,
"eval_QUANTITY_precision": 0.6428571428571429,
"eval_QUANTITY_recall": 0.782608695652174,
"eval_TIME_f1": 0.7272727272727274,
"eval_TIME_number": 26,
"eval_TIME_precision": 0.6896551724137931,
"eval_TIME_recall": 0.7692307692307693,
"eval_loss": 0.1950027197599411,
"eval_overall_accuracy": 0.9542156617463098,
"eval_overall_f1": 0.8147138964577656,
"eval_overall_precision": 0.7569620253164557,
"eval_overall_recall": 0.8820058997050148,
"eval_runtime": 0.9369,
"eval_samples_per_second": 199.604,
"eval_steps_per_second": 3.202,
"step": 5830
},
{
"epoch": 56.0,
"grad_norm": 0.4839901924133301,
"learning_rate": 2.2000000000000003e-05,
"loss": 0.0422,
"step": 5936
},
{
"epoch": 56.0,
"eval_LOCATION_f1": 0.8275862068965517,
"eval_LOCATION_number": 72,
"eval_LOCATION_precision": 0.821917808219178,
"eval_LOCATION_recall": 0.8333333333333334,
"eval_ORGANIZATION_f1": 0.7439024390243902,
"eval_ORGANIZATION_number": 75,
"eval_ORGANIZATION_precision": 0.6853932584269663,
"eval_ORGANIZATION_recall": 0.8133333333333334,
"eval_PERSON_f1": 0.8933333333333333,
"eval_PERSON_number": 143,
"eval_PERSON_precision": 0.8535031847133758,
"eval_PERSON_recall": 0.9370629370629371,
"eval_QUANTITY_f1": 0.6792452830188679,
"eval_QUANTITY_number": 23,
"eval_QUANTITY_precision": 0.6,
"eval_QUANTITY_recall": 0.782608695652174,
"eval_TIME_f1": 0.7407407407407408,
"eval_TIME_number": 26,
"eval_TIME_precision": 0.7142857142857143,
"eval_TIME_recall": 0.7692307692307693,
"eval_loss": 0.17818213999271393,
"eval_overall_accuracy": 0.9569677257943457,
"eval_overall_f1": 0.8184357541899441,
"eval_overall_precision": 0.7771883289124668,
"eval_overall_recall": 0.8643067846607669,
"eval_runtime": 0.9337,
"eval_samples_per_second": 200.278,
"eval_steps_per_second": 3.213,
"step": 5936
},
{
"epoch": 57.0,
"grad_norm": 0.7197099924087524,
"learning_rate": 2.15e-05,
"loss": 0.0394,
"step": 6042
},
{
"epoch": 57.0,
"eval_LOCATION_f1": 0.8333333333333334,
"eval_LOCATION_number": 72,
"eval_LOCATION_precision": 0.8333333333333334,
"eval_LOCATION_recall": 0.8333333333333334,
"eval_ORGANIZATION_f1": 0.7468354430379747,
"eval_ORGANIZATION_number": 75,
"eval_ORGANIZATION_precision": 0.7108433734939759,
"eval_ORGANIZATION_recall": 0.7866666666666666,
"eval_PERSON_f1": 0.8896321070234114,
"eval_PERSON_number": 143,
"eval_PERSON_precision": 0.8525641025641025,
"eval_PERSON_recall": 0.9300699300699301,
"eval_QUANTITY_f1": 0.7058823529411765,
"eval_QUANTITY_number": 23,
"eval_QUANTITY_precision": 0.6428571428571429,
"eval_QUANTITY_recall": 0.782608695652174,
"eval_TIME_f1": 0.7407407407407408,
"eval_TIME_number": 26,
"eval_TIME_precision": 0.7142857142857143,
"eval_TIME_recall": 0.7692307692307693,
"eval_loss": 0.17426693439483643,
"eval_overall_accuracy": 0.9589692269201902,
"eval_overall_f1": 0.8215297450424929,
"eval_overall_precision": 0.7901907356948229,
"eval_overall_recall": 0.855457227138643,
"eval_runtime": 0.9259,
"eval_samples_per_second": 201.976,
"eval_steps_per_second": 3.24,
"step": 6042
},
{
"epoch": 58.0,
"grad_norm": 0.526695191860199,
"learning_rate": 2.1e-05,
"loss": 0.0409,
"step": 6148
},
{
"epoch": 58.0,
"eval_LOCATION_f1": 0.8299319727891157,
"eval_LOCATION_number": 72,
"eval_LOCATION_precision": 0.8133333333333334,
"eval_LOCATION_recall": 0.8472222222222222,
"eval_ORGANIZATION_f1": 0.7643312101910827,
"eval_ORGANIZATION_number": 75,
"eval_ORGANIZATION_precision": 0.7317073170731707,
"eval_ORGANIZATION_recall": 0.8,
"eval_PERSON_f1": 0.8874172185430464,
"eval_PERSON_number": 143,
"eval_PERSON_precision": 0.8427672955974843,
"eval_PERSON_recall": 0.9370629370629371,
"eval_QUANTITY_f1": 0.6792452830188679,
"eval_QUANTITY_number": 23,
"eval_QUANTITY_precision": 0.6,
"eval_QUANTITY_recall": 0.782608695652174,
"eval_TIME_f1": 0.7142857142857142,
"eval_TIME_number": 26,
"eval_TIME_precision": 0.6666666666666666,
"eval_TIME_recall": 0.7692307692307693,
"eval_loss": 0.17505142092704773,
"eval_overall_accuracy": 0.9567175381536153,
"eval_overall_f1": 0.8195804195804196,
"eval_overall_precision": 0.7792553191489362,
"eval_overall_recall": 0.8643067846607669,
"eval_runtime": 0.9256,
"eval_samples_per_second": 202.037,
"eval_steps_per_second": 3.241,
"step": 6148
},
{
"epoch": 59.0,
"grad_norm": 0.38071247935295105,
"learning_rate": 2.05e-05,
"loss": 0.0384,
"step": 6254
},
{
"epoch": 59.0,
"eval_LOCATION_f1": 0.8133333333333332,
"eval_LOCATION_number": 72,
"eval_LOCATION_precision": 0.782051282051282,
"eval_LOCATION_recall": 0.8472222222222222,
"eval_ORGANIZATION_f1": 0.7749999999999999,
"eval_ORGANIZATION_number": 75,
"eval_ORGANIZATION_precision": 0.7294117647058823,
"eval_ORGANIZATION_recall": 0.8266666666666667,
"eval_PERSON_f1": 0.8896321070234114,
"eval_PERSON_number": 143,
"eval_PERSON_precision": 0.8525641025641025,
"eval_PERSON_recall": 0.9300699300699301,
"eval_QUANTITY_f1": 0.6923076923076923,
"eval_QUANTITY_number": 23,
"eval_QUANTITY_precision": 0.6206896551724138,
"eval_QUANTITY_recall": 0.782608695652174,
"eval_TIME_f1": 0.75,
"eval_TIME_number": 26,
"eval_TIME_precision": 0.7,
"eval_TIME_recall": 0.8076923076923077,
"eval_loss": 0.17447121441364288,
"eval_overall_accuracy": 0.957968476357268,
"eval_overall_f1": 0.8228730822873082,
"eval_overall_precision": 0.7804232804232805,
"eval_overall_recall": 0.8702064896755162,
"eval_runtime": 0.9356,
"eval_samples_per_second": 199.869,
"eval_steps_per_second": 3.206,
"step": 6254
},
{
"epoch": 60.0,
"grad_norm": 0.4309019446372986,
"learning_rate": 2e-05,
"loss": 0.0385,
"step": 6360
},
{
"epoch": 60.0,
"eval_LOCATION_f1": 0.8590604026845637,
"eval_LOCATION_number": 72,
"eval_LOCATION_precision": 0.8311688311688312,
"eval_LOCATION_recall": 0.8888888888888888,
"eval_ORGANIZATION_f1": 0.7757575757575759,
"eval_ORGANIZATION_number": 75,
"eval_ORGANIZATION_precision": 0.7111111111111111,
"eval_ORGANIZATION_recall": 0.8533333333333334,
"eval_PERSON_f1": 0.8874172185430464,
"eval_PERSON_number": 143,
"eval_PERSON_precision": 0.8427672955974843,
"eval_PERSON_recall": 0.9370629370629371,
"eval_QUANTITY_f1": 0.6428571428571429,
"eval_QUANTITY_number": 23,
"eval_QUANTITY_precision": 0.5454545454545454,
"eval_QUANTITY_recall": 0.782608695652174,
"eval_TIME_f1": 0.7407407407407408,
"eval_TIME_number": 26,
"eval_TIME_precision": 0.7142857142857143,
"eval_TIME_recall": 0.7692307692307693,
"eval_loss": 0.18776963651180267,
"eval_overall_accuracy": 0.955716787590693,
"eval_overall_f1": 0.8264462809917357,
"eval_overall_precision": 0.7751937984496124,
"eval_overall_recall": 0.8849557522123894,
"eval_runtime": 0.9372,
"eval_samples_per_second": 199.53,
"eval_steps_per_second": 3.201,
"step": 6360
},
{
"epoch": 61.0,
"grad_norm": 1.0351260900497437,
"learning_rate": 1.9500000000000003e-05,
"loss": 0.0371,
"step": 6466
},
{
"epoch": 61.0,
"eval_LOCATION_f1": 0.8309859154929577,
"eval_LOCATION_number": 72,
"eval_LOCATION_precision": 0.8428571428571429,
"eval_LOCATION_recall": 0.8194444444444444,
"eval_ORGANIZATION_f1": 0.763157894736842,
"eval_ORGANIZATION_number": 75,
"eval_ORGANIZATION_precision": 0.7532467532467533,
"eval_ORGANIZATION_recall": 0.7733333333333333,
"eval_PERSON_f1": 0.8778877887788779,
"eval_PERSON_number": 143,
"eval_PERSON_precision": 0.83125,
"eval_PERSON_recall": 0.9300699300699301,
"eval_QUANTITY_f1": 0.6792452830188679,
"eval_QUANTITY_number": 23,
"eval_QUANTITY_precision": 0.6,
"eval_QUANTITY_recall": 0.782608695652174,
"eval_TIME_f1": 0.7407407407407408,
"eval_TIME_number": 26,
"eval_TIME_precision": 0.7142857142857143,
"eval_TIME_recall": 0.7692307692307693,
"eval_loss": 0.18786616623401642,
"eval_overall_accuracy": 0.9562171628721541,
"eval_overall_f1": 0.8181818181818181,
"eval_overall_precision": 0.7890410958904109,
"eval_overall_recall": 0.8495575221238938,
"eval_runtime": 0.9236,
"eval_samples_per_second": 202.479,
"eval_steps_per_second": 3.248,
"step": 6466
},
{
"epoch": 62.0,
"grad_norm": 0.6741280555725098,
"learning_rate": 1.9e-05,
"loss": 0.0385,
"step": 6572
},
{
"epoch": 62.0,
"eval_LOCATION_f1": 0.7972972972972973,
"eval_LOCATION_number": 72,
"eval_LOCATION_precision": 0.7763157894736842,
"eval_LOCATION_recall": 0.8194444444444444,
"eval_ORGANIZATION_f1": 0.7894736842105264,
"eval_ORGANIZATION_number": 75,
"eval_ORGANIZATION_precision": 0.7792207792207793,
"eval_ORGANIZATION_recall": 0.8,
"eval_PERSON_f1": 0.8940397350993377,
"eval_PERSON_number": 143,
"eval_PERSON_precision": 0.8490566037735849,
"eval_PERSON_recall": 0.9440559440559441,
"eval_QUANTITY_f1": 0.6792452830188679,
"eval_QUANTITY_number": 23,
"eval_QUANTITY_precision": 0.6,
"eval_QUANTITY_recall": 0.782608695652174,
"eval_TIME_f1": 0.7142857142857142,
"eval_TIME_number": 26,
"eval_TIME_precision": 0.6666666666666666,
"eval_TIME_recall": 0.7692307692307693,
"eval_loss": 0.18338263034820557,
"eval_overall_accuracy": 0.9574681010758068,
"eval_overall_f1": 0.8213783403656821,
"eval_overall_precision": 0.7849462365591398,
"eval_overall_recall": 0.8613569321533924,
"eval_runtime": 0.9302,
"eval_samples_per_second": 201.036,
"eval_steps_per_second": 3.225,
"step": 6572
},
{
"epoch": 63.0,
"grad_norm": 0.2608901560306549,
"learning_rate": 1.85e-05,
"loss": 0.0359,
"step": 6678
},
{
"epoch": 63.0,
"eval_LOCATION_f1": 0.816326530612245,
"eval_LOCATION_number": 72,
"eval_LOCATION_precision": 0.8,
"eval_LOCATION_recall": 0.8333333333333334,
"eval_ORGANIZATION_f1": 0.7777777777777777,
"eval_ORGANIZATION_number": 75,
"eval_ORGANIZATION_precision": 0.7241379310344828,
"eval_ORGANIZATION_recall": 0.84,
"eval_PERSON_f1": 0.9084745762711864,
"eval_PERSON_number": 143,
"eval_PERSON_precision": 0.881578947368421,
"eval_PERSON_recall": 0.9370629370629371,
"eval_QUANTITY_f1": 0.6545454545454547,
"eval_QUANTITY_number": 23,
"eval_QUANTITY_precision": 0.5625,
"eval_QUANTITY_recall": 0.782608695652174,
"eval_TIME_f1": 0.7017543859649122,
"eval_TIME_number": 26,
"eval_TIME_precision": 0.6451612903225806,
"eval_TIME_recall": 0.7692307692307693,
"eval_loss": 0.18453986942768097,
"eval_overall_accuracy": 0.9587190392794596,
"eval_overall_f1": 0.8240223463687151,
"eval_overall_precision": 0.7824933687002652,
"eval_overall_recall": 0.8702064896755162,
"eval_runtime": 0.9321,
"eval_samples_per_second": 200.623,
"eval_steps_per_second": 3.219,
"step": 6678
},
{
"epoch": 64.0,
"grad_norm": 0.7726385593414307,
"learning_rate": 1.8e-05,
"loss": 0.0355,
"step": 6784
},
{
"epoch": 64.0,
"eval_LOCATION_f1": 0.816326530612245,
"eval_LOCATION_number": 72,
"eval_LOCATION_precision": 0.8,
"eval_LOCATION_recall": 0.8333333333333334,
"eval_ORGANIZATION_f1": 0.7484662576687117,
"eval_ORGANIZATION_number": 75,
"eval_ORGANIZATION_precision": 0.6931818181818182,
"eval_ORGANIZATION_recall": 0.8133333333333334,
"eval_PERSON_f1": 0.881578947368421,
"eval_PERSON_number": 143,
"eval_PERSON_precision": 0.8322981366459627,
"eval_PERSON_recall": 0.9370629370629371,
"eval_QUANTITY_f1": 0.6792452830188679,
"eval_QUANTITY_number": 23,
"eval_QUANTITY_precision": 0.6,
"eval_QUANTITY_recall": 0.782608695652174,
"eval_TIME_f1": 0.7407407407407408,
"eval_TIME_number": 26,
"eval_TIME_precision": 0.7142857142857143,
"eval_TIME_recall": 0.7692307692307693,
"eval_loss": 0.20165307819843292,
"eval_overall_accuracy": 0.9542156617463098,
"eval_overall_f1": 0.812760055478502,
"eval_overall_precision": 0.7670157068062827,
"eval_overall_recall": 0.8643067846607669,
"eval_runtime": 0.957,
"eval_samples_per_second": 195.402,
"eval_steps_per_second": 3.135,
"step": 6784
},
{
"epoch": 65.0,
"grad_norm": 0.47850877046585083,
"learning_rate": 1.75e-05,
"loss": 0.0338,
"step": 6890
},
{
"epoch": 65.0,
"eval_LOCATION_f1": 0.7972972972972973,
"eval_LOCATION_number": 72,
"eval_LOCATION_precision": 0.7763157894736842,
"eval_LOCATION_recall": 0.8194444444444444,
"eval_ORGANIZATION_f1": 0.7712418300653594,
"eval_ORGANIZATION_number": 75,
"eval_ORGANIZATION_precision": 0.7564102564102564,
"eval_ORGANIZATION_recall": 0.7866666666666666,
"eval_PERSON_f1": 0.8903654485049833,
"eval_PERSON_number": 143,
"eval_PERSON_precision": 0.8481012658227848,
"eval_PERSON_recall": 0.9370629370629371,
"eval_QUANTITY_f1": 0.7058823529411765,
"eval_QUANTITY_number": 23,
"eval_QUANTITY_precision": 0.6428571428571429,
"eval_QUANTITY_recall": 0.782608695652174,
"eval_TIME_f1": 0.7547169811320754,
"eval_TIME_number": 26,
"eval_TIME_precision": 0.7407407407407407,
"eval_TIME_recall": 0.7692307692307693,
"eval_loss": 0.1862517148256302,
"eval_overall_accuracy": 0.9569677257943457,
"eval_overall_f1": 0.8215297450424929,
"eval_overall_precision": 0.7901907356948229,
"eval_overall_recall": 0.855457227138643,
"eval_runtime": 0.9305,
"eval_samples_per_second": 200.976,
"eval_steps_per_second": 3.224,
"step": 6890
},
{
"epoch": 66.0,
"grad_norm": 1.3503855466842651,
"learning_rate": 1.7000000000000003e-05,
"loss": 0.0376,
"step": 6996
},
{
"epoch": 66.0,
"eval_LOCATION_f1": 0.8219178082191781,
"eval_LOCATION_number": 72,
"eval_LOCATION_precision": 0.8108108108108109,
"eval_LOCATION_recall": 0.8333333333333334,
"eval_ORGANIZATION_f1": 0.7792207792207794,
"eval_ORGANIZATION_number": 75,
"eval_ORGANIZATION_precision": 0.759493670886076,
"eval_ORGANIZATION_recall": 0.8,
"eval_PERSON_f1": 0.8852459016393444,
"eval_PERSON_number": 143,
"eval_PERSON_precision": 0.8333333333333334,
"eval_PERSON_recall": 0.9440559440559441,
"eval_QUANTITY_f1": 0.6666666666666667,
"eval_QUANTITY_number": 23,
"eval_QUANTITY_precision": 0.5806451612903226,
"eval_QUANTITY_recall": 0.782608695652174,
"eval_TIME_f1": 0.7407407407407408,
"eval_TIME_number": 26,
"eval_TIME_precision": 0.7142857142857143,
"eval_TIME_recall": 0.7692307692307693,
"eval_loss": 0.1855112761259079,
"eval_overall_accuracy": 0.9564673505128847,
"eval_overall_f1": 0.8218793828892006,
"eval_overall_precision": 0.7834224598930482,
"eval_overall_recall": 0.8643067846607669,
"eval_runtime": 0.9291,
"eval_samples_per_second": 201.265,
"eval_steps_per_second": 3.229,
"step": 6996
},
{
"epoch": 67.0,
"grad_norm": 0.09078435599803925,
"learning_rate": 1.65e-05,
"loss": 0.0324,
"step": 7102
},
{
"epoch": 67.0,
"eval_LOCATION_f1": 0.816326530612245,
"eval_LOCATION_number": 72,
"eval_LOCATION_precision": 0.8,
"eval_LOCATION_recall": 0.8333333333333334,
"eval_ORGANIZATION_f1": 0.7712418300653594,
"eval_ORGANIZATION_number": 75,
"eval_ORGANIZATION_precision": 0.7564102564102564,
"eval_ORGANIZATION_recall": 0.7866666666666666,
"eval_PERSON_f1": 0.8675496688741723,
"eval_PERSON_number": 143,
"eval_PERSON_precision": 0.8238993710691824,
"eval_PERSON_recall": 0.916083916083916,
"eval_QUANTITY_f1": 0.6666666666666667,
"eval_QUANTITY_number": 23,
"eval_QUANTITY_precision": 0.5806451612903226,
"eval_QUANTITY_recall": 0.782608695652174,
"eval_TIME_f1": 0.7272727272727274,
"eval_TIME_number": 26,
"eval_TIME_precision": 0.6896551724137931,
"eval_TIME_recall": 0.7692307692307693,
"eval_loss": 0.19535928964614868,
"eval_overall_accuracy": 0.9547160370277709,
"eval_overall_f1": 0.810126582278481,
"eval_overall_precision": 0.7741935483870968,
"eval_overall_recall": 0.8495575221238938,
"eval_runtime": 0.923,
"eval_samples_per_second": 202.594,
"eval_steps_per_second": 3.25,
"step": 7102
},
{
"epoch": 68.0,
"grad_norm": 0.13197369873523712,
"learning_rate": 1.6000000000000003e-05,
"loss": 0.0361,
"step": 7208
},
{
"epoch": 68.0,
"eval_LOCATION_f1": 0.8299319727891157,
"eval_LOCATION_number": 72,
"eval_LOCATION_precision": 0.8133333333333334,
"eval_LOCATION_recall": 0.8472222222222222,
"eval_ORGANIZATION_f1": 0.7407407407407408,
"eval_ORGANIZATION_number": 75,
"eval_ORGANIZATION_precision": 0.6896551724137931,
"eval_ORGANIZATION_recall": 0.8,
"eval_PERSON_f1": 0.8770764119601329,
"eval_PERSON_number": 143,
"eval_PERSON_precision": 0.8354430379746836,
"eval_PERSON_recall": 0.9230769230769231,
"eval_QUANTITY_f1": 0.6792452830188679,
"eval_QUANTITY_number": 23,
"eval_QUANTITY_precision": 0.6,
"eval_QUANTITY_recall": 0.782608695652174,
"eval_TIME_f1": 0.7407407407407408,
"eval_TIME_number": 26,
"eval_TIME_precision": 0.7142857142857143,
"eval_TIME_recall": 0.7692307692307693,
"eval_loss": 0.2019178867340088,
"eval_overall_accuracy": 0.9534650988241181,
"eval_overall_f1": 0.8117154811715481,
"eval_overall_precision": 0.7698412698412699,
"eval_overall_recall": 0.8584070796460177,
"eval_runtime": 0.9293,
"eval_samples_per_second": 201.226,
"eval_steps_per_second": 3.228,
"step": 7208
},
{
"epoch": 69.0,
"grad_norm": 0.3539793789386749,
"learning_rate": 1.55e-05,
"loss": 0.0329,
"step": 7314
},
{
"epoch": 69.0,
"eval_LOCATION_f1": 0.8243243243243243,
"eval_LOCATION_number": 72,
"eval_LOCATION_precision": 0.8026315789473685,
"eval_LOCATION_recall": 0.8472222222222222,
"eval_ORGANIZATION_f1": 0.7468354430379747,
"eval_ORGANIZATION_number": 75,
"eval_ORGANIZATION_precision": 0.7108433734939759,
"eval_ORGANIZATION_recall": 0.7866666666666666,
"eval_PERSON_f1": 0.8741721854304637,
"eval_PERSON_number": 143,
"eval_PERSON_precision": 0.8301886792452831,
"eval_PERSON_recall": 0.9230769230769231,
"eval_QUANTITY_f1": 0.72,
"eval_QUANTITY_number": 23,
"eval_QUANTITY_precision": 0.6666666666666666,
"eval_QUANTITY_recall": 0.782608695652174,
"eval_TIME_f1": 0.7547169811320754,
"eval_TIME_number": 26,
"eval_TIME_precision": 0.7407407407407407,
"eval_TIME_recall": 0.7692307692307693,
"eval_loss": 0.1934998482465744,
"eval_overall_accuracy": 0.9559669752314236,
"eval_overall_f1": 0.8157524613220816,
"eval_overall_precision": 0.7795698924731183,
"eval_overall_recall": 0.855457227138643,
"eval_runtime": 0.9314,
"eval_samples_per_second": 200.776,
"eval_steps_per_second": 3.221,
"step": 7314
},
{
"epoch": 70.0,
"grad_norm": 0.4102155566215515,
"learning_rate": 1.5e-05,
"loss": 0.0336,
"step": 7420
},
{
"epoch": 70.0,
"eval_LOCATION_f1": 0.8590604026845637,
"eval_LOCATION_number": 72,
"eval_LOCATION_precision": 0.8311688311688312,
"eval_LOCATION_recall": 0.8888888888888888,
"eval_ORGANIZATION_f1": 0.7407407407407408,
"eval_ORGANIZATION_number": 75,
"eval_ORGANIZATION_precision": 0.6896551724137931,
"eval_ORGANIZATION_recall": 0.8,
"eval_PERSON_f1": 0.8844884488448846,
"eval_PERSON_number": 143,
"eval_PERSON_precision": 0.8375,
"eval_PERSON_recall": 0.9370629370629371,
"eval_QUANTITY_f1": 0.72,
"eval_QUANTITY_number": 23,
"eval_QUANTITY_precision": 0.6666666666666666,
"eval_QUANTITY_recall": 0.782608695652174,
"eval_TIME_f1": 0.7547169811320754,
"eval_TIME_number": 26,
"eval_TIME_precision": 0.7407407407407407,
"eval_TIME_recall": 0.7692307692307693,
"eval_loss": 0.18642878532409668,
"eval_overall_accuracy": 0.9582186639979985,
"eval_overall_f1": 0.8256624825662482,
"eval_overall_precision": 0.783068783068783,
"eval_overall_recall": 0.8731563421828908,
"eval_runtime": 0.9273,
"eval_samples_per_second": 201.662,
"eval_steps_per_second": 3.235,
"step": 7420
},
{
"epoch": 71.0,
"grad_norm": 0.9542334675788879,
"learning_rate": 1.45e-05,
"loss": 0.0346,
"step": 7526
},
{
"epoch": 71.0,
"eval_LOCATION_f1": 0.8413793103448277,
"eval_LOCATION_number": 72,
"eval_LOCATION_precision": 0.8356164383561644,
"eval_LOCATION_recall": 0.8472222222222222,
"eval_ORGANIZATION_f1": 0.6987951807228915,
"eval_ORGANIZATION_number": 75,
"eval_ORGANIZATION_precision": 0.6373626373626373,
"eval_ORGANIZATION_recall": 0.7733333333333333,
"eval_PERSON_f1": 0.8721311475409836,
"eval_PERSON_number": 143,
"eval_PERSON_precision": 0.8209876543209876,
"eval_PERSON_recall": 0.9300699300699301,
"eval_QUANTITY_f1": 0.6923076923076923,
"eval_QUANTITY_number": 23,
"eval_QUANTITY_precision": 0.6206896551724138,
"eval_QUANTITY_recall": 0.782608695652174,
"eval_TIME_f1": 0.7547169811320754,
"eval_TIME_number": 26,
"eval_TIME_precision": 0.7407407407407407,
"eval_TIME_recall": 0.7692307692307693,
"eval_loss": 0.18929119408130646,
"eval_overall_accuracy": 0.9549662246685013,
"eval_overall_f1": 0.8044382801664355,
"eval_overall_precision": 0.7591623036649214,
"eval_overall_recall": 0.855457227138643,
"eval_runtime": 0.9224,
"eval_samples_per_second": 202.728,
"eval_steps_per_second": 3.252,
"step": 7526
},
{
"epoch": 72.0,
"grad_norm": 0.808494508266449,
"learning_rate": 1.4000000000000001e-05,
"loss": 0.0312,
"step": 7632
},
{
"epoch": 72.0,
"eval_LOCATION_f1": 0.8493150684931507,
"eval_LOCATION_number": 72,
"eval_LOCATION_precision": 0.8378378378378378,
"eval_LOCATION_recall": 0.8611111111111112,
"eval_ORGANIZATION_f1": 0.7407407407407408,
"eval_ORGANIZATION_number": 75,
"eval_ORGANIZATION_precision": 0.6896551724137931,
"eval_ORGANIZATION_recall": 0.8,
"eval_PERSON_f1": 0.8903654485049833,
"eval_PERSON_number": 143,
"eval_PERSON_precision": 0.8481012658227848,
"eval_PERSON_recall": 0.9370629370629371,
"eval_QUANTITY_f1": 0.6666666666666667,
"eval_QUANTITY_number": 23,
"eval_QUANTITY_precision": 0.5806451612903226,
"eval_QUANTITY_recall": 0.782608695652174,
"eval_TIME_f1": 0.7547169811320754,
"eval_TIME_number": 26,
"eval_TIME_precision": 0.7407407407407407,
"eval_TIME_recall": 0.7692307692307693,
"eval_loss": 0.1959969848394394,
"eval_overall_accuracy": 0.9569677257943457,
"eval_overall_f1": 0.8212290502793296,
"eval_overall_precision": 0.7798408488063661,
"eval_overall_recall": 0.8672566371681416,
"eval_runtime": 0.9295,
"eval_samples_per_second": 201.192,
"eval_steps_per_second": 3.228,
"step": 7632
},
{
"epoch": 73.0,
"grad_norm": 1.9524306058883667,
"learning_rate": 1.3500000000000001e-05,
"loss": 0.0342,
"step": 7738
},
{
"epoch": 73.0,
"eval_LOCATION_f1": 0.8378378378378377,
"eval_LOCATION_number": 72,
"eval_LOCATION_precision": 0.8157894736842105,
"eval_LOCATION_recall": 0.8611111111111112,
"eval_ORGANIZATION_f1": 0.7544910179640718,
"eval_ORGANIZATION_number": 75,
"eval_ORGANIZATION_precision": 0.6847826086956522,
"eval_ORGANIZATION_recall": 0.84,
"eval_PERSON_f1": 0.8800000000000001,
"eval_PERSON_number": 143,
"eval_PERSON_precision": 0.8407643312101911,
"eval_PERSON_recall": 0.9230769230769231,
"eval_QUANTITY_f1": 0.7058823529411765,
"eval_QUANTITY_number": 23,
"eval_QUANTITY_precision": 0.6428571428571429,
"eval_QUANTITY_recall": 0.782608695652174,
"eval_TIME_f1": 0.7272727272727274,
"eval_TIME_number": 26,
"eval_TIME_precision": 0.6896551724137931,
"eval_TIME_recall": 0.7692307692307693,
"eval_loss": 0.19410043954849243,
"eval_overall_accuracy": 0.9554665999499625,
"eval_overall_f1": 0.8183079056865463,
"eval_overall_precision": 0.7722513089005235,
"eval_overall_recall": 0.8702064896755162,
"eval_runtime": 1.0344,
"eval_samples_per_second": 180.783,
"eval_steps_per_second": 2.9,
"step": 7738
},
{
"epoch": 74.0,
"grad_norm": 1.1691898107528687,
"learning_rate": 1.3000000000000001e-05,
"loss": 0.0319,
"step": 7844
},
{
"epoch": 74.0,
"eval_LOCATION_f1": 0.847682119205298,
"eval_LOCATION_number": 72,
"eval_LOCATION_precision": 0.810126582278481,
"eval_LOCATION_recall": 0.8888888888888888,
"eval_ORGANIZATION_f1": 0.7701863354037267,
"eval_ORGANIZATION_number": 75,
"eval_ORGANIZATION_precision": 0.7209302325581395,
"eval_ORGANIZATION_recall": 0.8266666666666667,
"eval_PERSON_f1": 0.8823529411764706,
"eval_PERSON_number": 143,
"eval_PERSON_precision": 0.8282208588957055,
"eval_PERSON_recall": 0.9440559440559441,
"eval_QUANTITY_f1": 0.6923076923076923,
"eval_QUANTITY_number": 23,
"eval_QUANTITY_precision": 0.6206896551724138,
"eval_QUANTITY_recall": 0.782608695652174,
"eval_TIME_f1": 0.7142857142857142,
"eval_TIME_number": 26,
"eval_TIME_precision": 0.6666666666666666,
"eval_TIME_recall": 0.7692307692307693,
"eval_loss": 0.1930677443742752,
"eval_overall_accuracy": 0.9582186639979985,
"eval_overall_f1": 0.8236914600550964,
"eval_overall_precision": 0.772609819121447,
"eval_overall_recall": 0.8820058997050148,
"eval_runtime": 0.9301,
"eval_samples_per_second": 201.064,
"eval_steps_per_second": 3.226,
"step": 7844
},
{
"epoch": 75.0,
"grad_norm": 1.1448065042495728,
"learning_rate": 1.25e-05,
"loss": 0.0293,
"step": 7950
},
{
"epoch": 75.0,
"eval_LOCATION_f1": 0.8322147651006712,
"eval_LOCATION_number": 72,
"eval_LOCATION_precision": 0.8051948051948052,
"eval_LOCATION_recall": 0.8611111111111112,
"eval_ORGANIZATION_f1": 0.7500000000000001,
"eval_ORGANIZATION_number": 75,
"eval_ORGANIZATION_precision": 0.7058823529411765,
"eval_ORGANIZATION_recall": 0.8,
"eval_PERSON_f1": 0.8712871287128713,
"eval_PERSON_number": 143,
"eval_PERSON_precision": 0.825,
"eval_PERSON_recall": 0.9230769230769231,
"eval_QUANTITY_f1": 0.6923076923076923,
"eval_QUANTITY_number": 23,
"eval_QUANTITY_precision": 0.6206896551724138,
"eval_QUANTITY_recall": 0.782608695652174,
"eval_TIME_f1": 0.7547169811320754,
"eval_TIME_number": 26,
"eval_TIME_precision": 0.7407407407407407,
"eval_TIME_recall": 0.7692307692307693,
"eval_loss": 0.1969723254442215,
"eval_overall_accuracy": 0.9552164123092319,
"eval_overall_f1": 0.8145048814504882,
"eval_overall_precision": 0.7724867724867724,
"eval_overall_recall": 0.8613569321533924,
"eval_runtime": 0.934,
"eval_samples_per_second": 200.216,
"eval_steps_per_second": 3.212,
"step": 7950
},
{
"epoch": 76.0,
"grad_norm": 0.8883477449417114,
"learning_rate": 1.2e-05,
"loss": 0.0311,
"step": 8056
},
{
"epoch": 76.0,
"eval_LOCATION_f1": 0.8400000000000001,
"eval_LOCATION_number": 72,
"eval_LOCATION_precision": 0.8076923076923077,
"eval_LOCATION_recall": 0.875,
"eval_ORGANIZATION_f1": 0.7530864197530864,
"eval_ORGANIZATION_number": 75,
"eval_ORGANIZATION_precision": 0.7011494252873564,
"eval_ORGANIZATION_recall": 0.8133333333333334,
"eval_PERSON_f1": 0.8823529411764706,
"eval_PERSON_number": 143,
"eval_PERSON_precision": 0.8282208588957055,
"eval_PERSON_recall": 0.9440559440559441,
"eval_QUANTITY_f1": 0.7058823529411765,
"eval_QUANTITY_number": 23,
"eval_QUANTITY_precision": 0.6428571428571429,
"eval_QUANTITY_recall": 0.782608695652174,
"eval_TIME_f1": 0.7777777777777779,
"eval_TIME_number": 26,
"eval_TIME_precision": 0.75,
"eval_TIME_recall": 0.8076923076923077,
"eval_loss": 0.18665479123592377,
"eval_overall_accuracy": 0.9582186639979985,
"eval_overall_f1": 0.8243430152143844,
"eval_overall_precision": 0.7760416666666666,
"eval_overall_recall": 0.8790560471976401,
"eval_runtime": 0.9252,
"eval_samples_per_second": 202.11,
"eval_steps_per_second": 3.242,
"step": 8056
},
{
"epoch": 77.0,
"grad_norm": 0.35357949137687683,
"learning_rate": 1.1500000000000002e-05,
"loss": 0.0299,
"step": 8162
},
{
"epoch": 77.0,
"eval_LOCATION_f1": 0.8344370860927153,
"eval_LOCATION_number": 72,
"eval_LOCATION_precision": 0.7974683544303798,
"eval_LOCATION_recall": 0.875,
"eval_ORGANIZATION_f1": 0.7530864197530864,
"eval_ORGANIZATION_number": 75,
"eval_ORGANIZATION_precision": 0.7011494252873564,
"eval_ORGANIZATION_recall": 0.8133333333333334,
"eval_PERSON_f1": 0.8852459016393444,
"eval_PERSON_number": 143,
"eval_PERSON_precision": 0.8333333333333334,
"eval_PERSON_recall": 0.9440559440559441,
"eval_QUANTITY_f1": 0.6923076923076923,
"eval_QUANTITY_number": 23,
"eval_QUANTITY_precision": 0.6206896551724138,
"eval_QUANTITY_recall": 0.782608695652174,
"eval_TIME_f1": 0.7142857142857142,
"eval_TIME_number": 26,
"eval_TIME_precision": 0.6666666666666666,
"eval_TIME_recall": 0.7692307692307693,
"eval_loss": 0.19146093726158142,
"eval_overall_accuracy": 0.9564673505128847,
"eval_overall_f1": 0.8181818181818181,
"eval_overall_precision": 0.7674418604651163,
"eval_overall_recall": 0.8761061946902655,
"eval_runtime": 0.9261,
"eval_samples_per_second": 201.927,
"eval_steps_per_second": 3.239,
"step": 8162
},
{
"epoch": 78.0,
"grad_norm": 0.7683406472206116,
"learning_rate": 1.1000000000000001e-05,
"loss": 0.03,
"step": 8268
},
{
"epoch": 78.0,
"eval_LOCATION_f1": 0.8219178082191781,
"eval_LOCATION_number": 72,
"eval_LOCATION_precision": 0.8108108108108109,
"eval_LOCATION_recall": 0.8333333333333334,
"eval_ORGANIZATION_f1": 0.7354838709677418,
"eval_ORGANIZATION_number": 75,
"eval_ORGANIZATION_precision": 0.7125,
"eval_ORGANIZATION_recall": 0.76,
"eval_PERSON_f1": 0.8844884488448846,
"eval_PERSON_number": 143,
"eval_PERSON_precision": 0.8375,
"eval_PERSON_recall": 0.9370629370629371,
"eval_QUANTITY_f1": 0.7058823529411765,
"eval_QUANTITY_number": 23,
"eval_QUANTITY_precision": 0.6428571428571429,
"eval_QUANTITY_recall": 0.782608695652174,
"eval_TIME_f1": 0.7272727272727274,
"eval_TIME_number": 26,
"eval_TIME_precision": 0.6896551724137931,
"eval_TIME_recall": 0.7692307692307693,
"eval_loss": 0.19335182011127472,
"eval_overall_accuracy": 0.9569677257943457,
"eval_overall_f1": 0.8140845070422535,
"eval_overall_precision": 0.7789757412398922,
"eval_overall_recall": 0.8525073746312685,
"eval_runtime": 0.9288,
"eval_samples_per_second": 201.33,
"eval_steps_per_second": 3.23,
"step": 8268
},
{
"epoch": 79.0,
"grad_norm": 1.1292208433151245,
"learning_rate": 1.05e-05,
"loss": 0.0305,
"step": 8374
},
{
"epoch": 79.0,
"eval_LOCATION_f1": 0.816326530612245,
"eval_LOCATION_number": 72,
"eval_LOCATION_precision": 0.8,
"eval_LOCATION_recall": 0.8333333333333334,
"eval_ORGANIZATION_f1": 0.7577639751552795,
"eval_ORGANIZATION_number": 75,
"eval_ORGANIZATION_precision": 0.7093023255813954,
"eval_ORGANIZATION_recall": 0.8133333333333334,
"eval_PERSON_f1": 0.8874172185430464,
"eval_PERSON_number": 143,
"eval_PERSON_precision": 0.8427672955974843,
"eval_PERSON_recall": 0.9370629370629371,
"eval_QUANTITY_f1": 0.6923076923076923,
"eval_QUANTITY_number": 23,
"eval_QUANTITY_precision": 0.6206896551724138,
"eval_QUANTITY_recall": 0.782608695652174,
"eval_TIME_f1": 0.7272727272727274,
"eval_TIME_number": 26,
"eval_TIME_precision": 0.6896551724137931,
"eval_TIME_recall": 0.7692307692307693,
"eval_loss": 0.1943107694387436,
"eval_overall_accuracy": 0.9567175381536153,
"eval_overall_f1": 0.8172942817294282,
"eval_overall_precision": 0.7751322751322751,
"eval_overall_recall": 0.8643067846607669,
"eval_runtime": 0.9335,
"eval_samples_per_second": 200.331,
"eval_steps_per_second": 3.214,
"step": 8374
},
{
"epoch": 80.0,
"grad_norm": 0.6603876948356628,
"learning_rate": 1e-05,
"loss": 0.0306,
"step": 8480
},
{
"epoch": 80.0,
"eval_LOCATION_f1": 0.8,
"eval_LOCATION_number": 72,
"eval_LOCATION_precision": 0.7945205479452054,
"eval_LOCATION_recall": 0.8055555555555556,
"eval_ORGANIZATION_f1": 0.7577639751552795,
"eval_ORGANIZATION_number": 75,
"eval_ORGANIZATION_precision": 0.7093023255813954,
"eval_ORGANIZATION_recall": 0.8133333333333334,
"eval_PERSON_f1": 0.8823529411764706,
"eval_PERSON_number": 143,
"eval_PERSON_precision": 0.8282208588957055,
"eval_PERSON_recall": 0.9440559440559441,
"eval_QUANTITY_f1": 0.7058823529411765,
"eval_QUANTITY_number": 23,
"eval_QUANTITY_precision": 0.6428571428571429,
"eval_QUANTITY_recall": 0.782608695652174,
"eval_TIME_f1": 0.7636363636363636,
"eval_TIME_number": 26,
"eval_TIME_precision": 0.7241379310344828,
"eval_TIME_recall": 0.8076923076923077,
"eval_loss": 0.19313213229179382,
"eval_overall_accuracy": 0.9574681010758068,
"eval_overall_f1": 0.8161559888579387,
"eval_overall_precision": 0.7730870712401056,
"eval_overall_recall": 0.8643067846607669,
"eval_runtime": 0.9289,
"eval_samples_per_second": 201.304,
"eval_steps_per_second": 3.229,
"step": 8480
},
{
"epoch": 81.0,
"grad_norm": 0.466139554977417,
"learning_rate": 9.5e-06,
"loss": 0.0286,
"step": 8586
},
{
"epoch": 81.0,
"eval_LOCATION_f1": 0.802721088435374,
"eval_LOCATION_number": 72,
"eval_LOCATION_precision": 0.7866666666666666,
"eval_LOCATION_recall": 0.8194444444444444,
"eval_ORGANIZATION_f1": 0.7701863354037267,
"eval_ORGANIZATION_number": 75,
"eval_ORGANIZATION_precision": 0.7209302325581395,
"eval_ORGANIZATION_recall": 0.8266666666666667,
"eval_PERSON_f1": 0.8758169934640523,
"eval_PERSON_number": 143,
"eval_PERSON_precision": 0.8220858895705522,
"eval_PERSON_recall": 0.9370629370629371,
"eval_QUANTITY_f1": 0.7058823529411765,
"eval_QUANTITY_number": 23,
"eval_QUANTITY_precision": 0.6428571428571429,
"eval_QUANTITY_recall": 0.782608695652174,
"eval_TIME_f1": 0.7272727272727274,
"eval_TIME_number": 26,
"eval_TIME_precision": 0.6896551724137931,
"eval_TIME_recall": 0.7692307692307693,
"eval_loss": 0.19068394601345062,
"eval_overall_accuracy": 0.955716787590693,
"eval_overall_f1": 0.8138888888888888,
"eval_overall_precision": 0.7690288713910761,
"eval_overall_recall": 0.8643067846607669,
"eval_runtime": 0.9312,
"eval_samples_per_second": 200.826,
"eval_steps_per_second": 3.222,
"step": 8586
},
{
"epoch": 82.0,
"grad_norm": 0.6404593586921692,
"learning_rate": 9e-06,
"loss": 0.0283,
"step": 8692
},
{
"epoch": 82.0,
"eval_LOCATION_f1": 0.8322147651006712,
"eval_LOCATION_number": 72,
"eval_LOCATION_precision": 0.8051948051948052,
"eval_LOCATION_recall": 0.8611111111111112,
"eval_ORGANIZATION_f1": 0.7483870967741936,
"eval_ORGANIZATION_number": 75,
"eval_ORGANIZATION_precision": 0.725,
"eval_ORGANIZATION_recall": 0.7733333333333333,
"eval_PERSON_f1": 0.8692810457516339,
"eval_PERSON_number": 143,
"eval_PERSON_precision": 0.8159509202453987,
"eval_PERSON_recall": 0.9300699300699301,
"eval_QUANTITY_f1": 0.6923076923076923,
"eval_QUANTITY_number": 23,
"eval_QUANTITY_precision": 0.6206896551724138,
"eval_QUANTITY_recall": 0.782608695652174,
"eval_TIME_f1": 0.7142857142857142,
"eval_TIME_number": 26,
"eval_TIME_precision": 0.6666666666666666,
"eval_TIME_recall": 0.7692307692307693,
"eval_loss": 0.19274306297302246,
"eval_overall_accuracy": 0.957968476357268,
"eval_overall_f1": 0.8105849582172702,
"eval_overall_precision": 0.7678100263852242,
"eval_overall_recall": 0.8584070796460177,
"eval_runtime": 0.9998,
"eval_samples_per_second": 187.045,
"eval_steps_per_second": 3.001,
"step": 8692
},
{
"epoch": 83.0,
"grad_norm": 0.17559492588043213,
"learning_rate": 8.500000000000002e-06,
"loss": 0.0289,
"step": 8798
},
{
"epoch": 83.0,
"eval_LOCATION_f1": 0.8,
"eval_LOCATION_number": 72,
"eval_LOCATION_precision": 0.7945205479452054,
"eval_LOCATION_recall": 0.8055555555555556,
"eval_ORGANIZATION_f1": 0.7500000000000001,
"eval_ORGANIZATION_number": 75,
"eval_ORGANIZATION_precision": 0.7058823529411765,
"eval_ORGANIZATION_recall": 0.8,
"eval_PERSON_f1": 0.8750000000000001,
"eval_PERSON_number": 143,
"eval_PERSON_precision": 0.8260869565217391,
"eval_PERSON_recall": 0.9300699300699301,
"eval_QUANTITY_f1": 0.7058823529411765,
"eval_QUANTITY_number": 23,
"eval_QUANTITY_precision": 0.6428571428571429,
"eval_QUANTITY_recall": 0.782608695652174,
"eval_TIME_f1": 0.7272727272727274,
"eval_TIME_number": 26,
"eval_TIME_precision": 0.6896551724137931,
"eval_TIME_recall": 0.7692307692307693,
"eval_loss": 0.1927793323993683,
"eval_overall_accuracy": 0.9564673505128847,
"eval_overall_f1": 0.8083916083916084,
"eval_overall_precision": 0.7686170212765957,
"eval_overall_recall": 0.8525073746312685,
"eval_runtime": 0.9268,
"eval_samples_per_second": 201.759,
"eval_steps_per_second": 3.237,
"step": 8798
},
{
"epoch": 84.0,
"grad_norm": 1.3301130533218384,
"learning_rate": 8.000000000000001e-06,
"loss": 0.0289,
"step": 8904
},
{
"epoch": 84.0,
"eval_LOCATION_f1": 0.8082191780821918,
"eval_LOCATION_number": 72,
"eval_LOCATION_precision": 0.7972972972972973,
"eval_LOCATION_recall": 0.8194444444444444,
"eval_ORGANIZATION_f1": 0.7530864197530864,
"eval_ORGANIZATION_number": 75,
"eval_ORGANIZATION_precision": 0.7011494252873564,
"eval_ORGANIZATION_recall": 0.8133333333333334,
"eval_PERSON_f1": 0.8844884488448846,
"eval_PERSON_number": 143,
"eval_PERSON_precision": 0.8375,
"eval_PERSON_recall": 0.9370629370629371,
"eval_QUANTITY_f1": 0.7058823529411765,
"eval_QUANTITY_number": 23,
"eval_QUANTITY_precision": 0.6428571428571429,
"eval_QUANTITY_recall": 0.782608695652174,
"eval_TIME_f1": 0.7636363636363636,
"eval_TIME_number": 26,
"eval_TIME_precision": 0.7241379310344828,
"eval_TIME_recall": 0.8076923076923077,
"eval_loss": 0.19638177752494812,
"eval_overall_accuracy": 0.9572179134350763,
"eval_overall_f1": 0.8172942817294282,
"eval_overall_precision": 0.7751322751322751,
"eval_overall_recall": 0.8643067846607669,
"eval_runtime": 0.9332,
"eval_samples_per_second": 200.396,
"eval_steps_per_second": 3.215,
"step": 8904
},
{
"epoch": 85.0,
"grad_norm": 0.19960090517997742,
"learning_rate": 7.5e-06,
"loss": 0.0283,
"step": 9010
},
{
"epoch": 85.0,
"eval_LOCATION_f1": 0.8053691275167787,
"eval_LOCATION_number": 72,
"eval_LOCATION_precision": 0.7792207792207793,
"eval_LOCATION_recall": 0.8333333333333334,
"eval_ORGANIZATION_f1": 0.7564102564102564,
"eval_ORGANIZATION_number": 75,
"eval_ORGANIZATION_precision": 0.7283950617283951,
"eval_ORGANIZATION_recall": 0.7866666666666666,
"eval_PERSON_f1": 0.8823529411764706,
"eval_PERSON_number": 143,
"eval_PERSON_precision": 0.8282208588957055,
"eval_PERSON_recall": 0.9440559440559441,
"eval_QUANTITY_f1": 0.6923076923076923,
"eval_QUANTITY_number": 23,
"eval_QUANTITY_precision": 0.6206896551724138,
"eval_QUANTITY_recall": 0.782608695652174,
"eval_TIME_f1": 0.7407407407407408,
"eval_TIME_number": 26,
"eval_TIME_precision": 0.7142857142857143,
"eval_TIME_recall": 0.7692307692307693,
"eval_loss": 0.19612807035446167,
"eval_overall_accuracy": 0.9572179134350763,
"eval_overall_f1": 0.8145048814504882,
"eval_overall_precision": 0.7724867724867724,
"eval_overall_recall": 0.8613569321533924,
"eval_runtime": 0.9383,
"eval_samples_per_second": 199.303,
"eval_steps_per_second": 3.197,
"step": 9010
},
{
"epoch": 86.0,
"grad_norm": 0.7677280306816101,
"learning_rate": 7.000000000000001e-06,
"loss": 0.0279,
"step": 9116
},
{
"epoch": 86.0,
"eval_LOCATION_f1": 0.7919463087248323,
"eval_LOCATION_number": 72,
"eval_LOCATION_precision": 0.7662337662337663,
"eval_LOCATION_recall": 0.8194444444444444,
"eval_ORGANIZATION_f1": 0.7564102564102564,
"eval_ORGANIZATION_number": 75,
"eval_ORGANIZATION_precision": 0.7283950617283951,
"eval_ORGANIZATION_recall": 0.7866666666666666,
"eval_PERSON_f1": 0.8786885245901639,
"eval_PERSON_number": 143,
"eval_PERSON_precision": 0.8271604938271605,
"eval_PERSON_recall": 0.9370629370629371,
"eval_QUANTITY_f1": 0.6923076923076923,
"eval_QUANTITY_number": 23,
"eval_QUANTITY_precision": 0.6206896551724138,
"eval_QUANTITY_recall": 0.782608695652174,
"eval_TIME_f1": 0.7272727272727274,
"eval_TIME_number": 26,
"eval_TIME_precision": 0.6896551724137931,
"eval_TIME_recall": 0.7692307692307693,
"eval_loss": 0.20059086382389069,
"eval_overall_accuracy": 0.9549662246685013,
"eval_overall_f1": 0.8089260808926081,
"eval_overall_precision": 0.7671957671957672,
"eval_overall_recall": 0.855457227138643,
"eval_runtime": 0.9285,
"eval_samples_per_second": 201.396,
"eval_steps_per_second": 3.231,
"step": 9116
},
{
"epoch": 87.0,
"grad_norm": 0.65785813331604,
"learning_rate": 6.5000000000000004e-06,
"loss": 0.0288,
"step": 9222
},
{
"epoch": 87.0,
"eval_LOCATION_f1": 0.8053691275167787,
"eval_LOCATION_number": 72,
"eval_LOCATION_precision": 0.7792207792207793,
"eval_LOCATION_recall": 0.8333333333333334,
"eval_ORGANIZATION_f1": 0.7701863354037267,
"eval_ORGANIZATION_number": 75,
"eval_ORGANIZATION_precision": 0.7209302325581395,
"eval_ORGANIZATION_recall": 0.8266666666666667,
"eval_PERSON_f1": 0.8758169934640523,
"eval_PERSON_number": 143,
"eval_PERSON_precision": 0.8220858895705522,
"eval_PERSON_recall": 0.9370629370629371,
"eval_QUANTITY_f1": 0.6923076923076923,
"eval_QUANTITY_number": 23,
"eval_QUANTITY_precision": 0.6206896551724138,
"eval_QUANTITY_recall": 0.782608695652174,
"eval_TIME_f1": 0.7407407407407408,
"eval_TIME_number": 26,
"eval_TIME_precision": 0.7142857142857143,
"eval_TIME_recall": 0.7692307692307693,
"eval_loss": 0.20255452394485474,
"eval_overall_accuracy": 0.9559669752314236,
"eval_overall_f1": 0.8144044321329639,
"eval_overall_precision": 0.7676240208877284,
"eval_overall_recall": 0.8672566371681416,
"eval_runtime": 0.9402,
"eval_samples_per_second": 198.885,
"eval_steps_per_second": 3.191,
"step": 9222
},
{
"epoch": 88.0,
"grad_norm": 1.4090750217437744,
"learning_rate": 6e-06,
"loss": 0.0275,
"step": 9328
},
{
"epoch": 88.0,
"eval_LOCATION_f1": 0.8026315789473685,
"eval_LOCATION_number": 72,
"eval_LOCATION_precision": 0.7625,
"eval_LOCATION_recall": 0.8472222222222222,
"eval_ORGANIZATION_f1": 0.7450980392156863,
"eval_ORGANIZATION_number": 75,
"eval_ORGANIZATION_precision": 0.7307692307692307,
"eval_ORGANIZATION_recall": 0.76,
"eval_PERSON_f1": 0.8831168831168831,
"eval_PERSON_number": 143,
"eval_PERSON_precision": 0.8242424242424242,
"eval_PERSON_recall": 0.951048951048951,
"eval_QUANTITY_f1": 0.6923076923076923,
"eval_QUANTITY_number": 23,
"eval_QUANTITY_precision": 0.6206896551724138,
"eval_QUANTITY_recall": 0.782608695652174,
"eval_TIME_f1": 0.7407407407407408,
"eval_TIME_number": 26,
"eval_TIME_precision": 0.7142857142857143,
"eval_TIME_recall": 0.7692307692307693,
"eval_loss": 0.19975264370441437,
"eval_overall_accuracy": 0.9569677257943457,
"eval_overall_f1": 0.812239221140473,
"eval_overall_precision": 0.7684210526315789,
"eval_overall_recall": 0.8613569321533924,
"eval_runtime": 0.9248,
"eval_samples_per_second": 202.217,
"eval_steps_per_second": 3.244,
"step": 9328
},
{
"epoch": 89.0,
"grad_norm": 0.6550692319869995,
"learning_rate": 5.500000000000001e-06,
"loss": 0.0272,
"step": 9434
},
{
"epoch": 89.0,
"eval_LOCATION_f1": 0.8211920529801324,
"eval_LOCATION_number": 72,
"eval_LOCATION_precision": 0.7848101265822784,
"eval_LOCATION_recall": 0.8611111111111112,
"eval_ORGANIZATION_f1": 0.7515151515151515,
"eval_ORGANIZATION_number": 75,
"eval_ORGANIZATION_precision": 0.6888888888888889,
"eval_ORGANIZATION_recall": 0.8266666666666667,
"eval_PERSON_f1": 0.8794788273615636,
"eval_PERSON_number": 143,
"eval_PERSON_precision": 0.823170731707317,
"eval_PERSON_recall": 0.9440559440559441,
"eval_QUANTITY_f1": 0.7058823529411765,
"eval_QUANTITY_number": 23,
"eval_QUANTITY_precision": 0.6428571428571429,
"eval_QUANTITY_recall": 0.782608695652174,
"eval_TIME_f1": 0.7407407407407408,
"eval_TIME_number": 26,
"eval_TIME_precision": 0.7142857142857143,
"eval_TIME_recall": 0.7692307692307693,
"eval_loss": 0.19843065738677979,
"eval_overall_accuracy": 0.9562171628721541,
"eval_overall_f1": 0.8159340659340658,
"eval_overall_precision": 0.7634961439588689,
"eval_overall_recall": 0.8761061946902655,
"eval_runtime": 0.9223,
"eval_samples_per_second": 202.76,
"eval_steps_per_second": 3.253,
"step": 9434
},
{
"epoch": 90.0,
"grad_norm": 1.794690489768982,
"learning_rate": 5e-06,
"loss": 0.0265,
"step": 9540
},
{
"epoch": 90.0,
"eval_LOCATION_f1": 0.8275862068965517,
"eval_LOCATION_number": 72,
"eval_LOCATION_precision": 0.821917808219178,
"eval_LOCATION_recall": 0.8333333333333334,
"eval_ORGANIZATION_f1": 0.7770700636942677,
"eval_ORGANIZATION_number": 75,
"eval_ORGANIZATION_precision": 0.7439024390243902,
"eval_ORGANIZATION_recall": 0.8133333333333334,
"eval_PERSON_f1": 0.8823529411764706,
"eval_PERSON_number": 143,
"eval_PERSON_precision": 0.8282208588957055,
"eval_PERSON_recall": 0.9440559440559441,
"eval_QUANTITY_f1": 0.6923076923076923,
"eval_QUANTITY_number": 23,
"eval_QUANTITY_precision": 0.6206896551724138,
"eval_QUANTITY_recall": 0.782608695652174,
"eval_TIME_f1": 0.7272727272727274,
"eval_TIME_number": 26,
"eval_TIME_precision": 0.6896551724137931,
"eval_TIME_recall": 0.7692307692307693,
"eval_loss": 0.20021091401576996,
"eval_overall_accuracy": 0.9574681010758068,
"eval_overall_f1": 0.8223776223776224,
"eval_overall_precision": 0.7819148936170213,
"eval_overall_recall": 0.8672566371681416,
"eval_runtime": 0.9203,
"eval_samples_per_second": 203.198,
"eval_steps_per_second": 3.26,
"step": 9540
},
{
"epoch": 91.0,
"grad_norm": 0.0694357305765152,
"learning_rate": 4.5e-06,
"loss": 0.0258,
"step": 9646
},
{
"epoch": 91.0,
"eval_LOCATION_f1": 0.8187919463087249,
"eval_LOCATION_number": 72,
"eval_LOCATION_precision": 0.7922077922077922,
"eval_LOCATION_recall": 0.8472222222222222,
"eval_ORGANIZATION_f1": 0.7547169811320756,
"eval_ORGANIZATION_number": 75,
"eval_ORGANIZATION_precision": 0.7142857142857143,
"eval_ORGANIZATION_recall": 0.8,
"eval_PERSON_f1": 0.8729641693811075,
"eval_PERSON_number": 143,
"eval_PERSON_precision": 0.8170731707317073,
"eval_PERSON_recall": 0.9370629370629371,
"eval_QUANTITY_f1": 0.6923076923076923,
"eval_QUANTITY_number": 23,
"eval_QUANTITY_precision": 0.6206896551724138,
"eval_QUANTITY_recall": 0.782608695652174,
"eval_TIME_f1": 0.7407407407407408,
"eval_TIME_number": 26,
"eval_TIME_precision": 0.7142857142857143,
"eval_TIME_recall": 0.7692307692307693,
"eval_loss": 0.1959146112203598,
"eval_overall_accuracy": 0.9574681010758068,
"eval_overall_f1": 0.812760055478502,
"eval_overall_precision": 0.7670157068062827,
"eval_overall_recall": 0.8643067846607669,
"eval_runtime": 0.9378,
"eval_samples_per_second": 199.393,
"eval_steps_per_second": 3.199,
"step": 9646
},
{
"epoch": 92.0,
"grad_norm": 0.7855161428451538,
"learning_rate": 4.000000000000001e-06,
"loss": 0.0256,
"step": 9752
},
{
"epoch": 92.0,
"eval_LOCATION_f1": 0.8344370860927153,
"eval_LOCATION_number": 72,
"eval_LOCATION_precision": 0.7974683544303798,
"eval_LOCATION_recall": 0.875,
"eval_ORGANIZATION_f1": 0.7625,
"eval_ORGANIZATION_number": 75,
"eval_ORGANIZATION_precision": 0.7176470588235294,
"eval_ORGANIZATION_recall": 0.8133333333333334,
"eval_PERSON_f1": 0.868421052631579,
"eval_PERSON_number": 143,
"eval_PERSON_precision": 0.8198757763975155,
"eval_PERSON_recall": 0.9230769230769231,
"eval_QUANTITY_f1": 0.7058823529411765,
"eval_QUANTITY_number": 23,
"eval_QUANTITY_precision": 0.6428571428571429,
"eval_QUANTITY_recall": 0.782608695652174,
"eval_TIME_f1": 0.7407407407407408,
"eval_TIME_number": 26,
"eval_TIME_precision": 0.7142857142857143,
"eval_TIME_recall": 0.7692307692307693,
"eval_loss": 0.20366288721561432,
"eval_overall_accuracy": 0.955716787590693,
"eval_overall_f1": 0.8166666666666667,
"eval_overall_precision": 0.7716535433070866,
"eval_overall_recall": 0.8672566371681416,
"eval_runtime": 0.9223,
"eval_samples_per_second": 202.758,
"eval_steps_per_second": 3.253,
"step": 9752
},
{
"epoch": 93.0,
"grad_norm": 0.923471212387085,
"learning_rate": 3.5000000000000004e-06,
"loss": 0.026,
"step": 9858
},
{
"epoch": 93.0,
"eval_LOCATION_f1": 0.8211920529801324,
"eval_LOCATION_number": 72,
"eval_LOCATION_precision": 0.7848101265822784,
"eval_LOCATION_recall": 0.8611111111111112,
"eval_ORGANIZATION_f1": 0.779874213836478,
"eval_ORGANIZATION_number": 75,
"eval_ORGANIZATION_precision": 0.7380952380952381,
"eval_ORGANIZATION_recall": 0.8266666666666667,
"eval_PERSON_f1": 0.8712871287128713,
"eval_PERSON_number": 143,
"eval_PERSON_precision": 0.825,
"eval_PERSON_recall": 0.9230769230769231,
"eval_QUANTITY_f1": 0.6923076923076923,
"eval_QUANTITY_number": 23,
"eval_QUANTITY_precision": 0.6206896551724138,
"eval_QUANTITY_recall": 0.782608695652174,
"eval_TIME_f1": 0.7272727272727274,
"eval_TIME_number": 26,
"eval_TIME_precision": 0.6896551724137931,
"eval_TIME_recall": 0.7692307692307693,
"eval_loss": 0.20790377259254456,
"eval_overall_accuracy": 0.9547160370277709,
"eval_overall_f1": 0.8166666666666667,
"eval_overall_precision": 0.7716535433070866,
"eval_overall_recall": 0.8672566371681416,
"eval_runtime": 0.9308,
"eval_samples_per_second": 200.901,
"eval_steps_per_second": 3.223,
"step": 9858
},
{
"epoch": 94.0,
"grad_norm": 0.5129814147949219,
"learning_rate": 3e-06,
"loss": 0.0269,
"step": 9964
},
{
"epoch": 94.0,
"eval_LOCATION_f1": 0.8211920529801324,
"eval_LOCATION_number": 72,
"eval_LOCATION_precision": 0.7848101265822784,
"eval_LOCATION_recall": 0.8611111111111112,
"eval_ORGANIZATION_f1": 0.7672955974842767,
"eval_ORGANIZATION_number": 75,
"eval_ORGANIZATION_precision": 0.7261904761904762,
"eval_ORGANIZATION_recall": 0.8133333333333334,
"eval_PERSON_f1": 0.868421052631579,
"eval_PERSON_number": 143,
"eval_PERSON_precision": 0.8198757763975155,
"eval_PERSON_recall": 0.9230769230769231,
"eval_QUANTITY_f1": 0.6923076923076923,
"eval_QUANTITY_number": 23,
"eval_QUANTITY_precision": 0.6206896551724138,
"eval_QUANTITY_recall": 0.782608695652174,
"eval_TIME_f1": 0.7407407407407408,
"eval_TIME_number": 26,
"eval_TIME_precision": 0.7142857142857143,
"eval_TIME_recall": 0.7692307692307693,
"eval_loss": 0.2034631371498108,
"eval_overall_accuracy": 0.9552164123092319,
"eval_overall_f1": 0.8138888888888888,
"eval_overall_precision": 0.7690288713910761,
"eval_overall_recall": 0.8643067846607669,
"eval_runtime": 0.9303,
"eval_samples_per_second": 201.002,
"eval_steps_per_second": 3.225,
"step": 9964
},
{
"epoch": 95.0,
"grad_norm": 0.9843897819519043,
"learning_rate": 2.5e-06,
"loss": 0.0254,
"step": 10070
},
{
"epoch": 95.0,
"eval_LOCATION_f1": 0.8211920529801324,
"eval_LOCATION_number": 72,
"eval_LOCATION_precision": 0.7848101265822784,
"eval_LOCATION_recall": 0.8611111111111112,
"eval_ORGANIZATION_f1": 0.7625,
"eval_ORGANIZATION_number": 75,
"eval_ORGANIZATION_precision": 0.7176470588235294,
"eval_ORGANIZATION_recall": 0.8133333333333334,
"eval_PERSON_f1": 0.8721311475409836,
"eval_PERSON_number": 143,
"eval_PERSON_precision": 0.8209876543209876,
"eval_PERSON_recall": 0.9300699300699301,
"eval_QUANTITY_f1": 0.6923076923076923,
"eval_QUANTITY_number": 23,
"eval_QUANTITY_precision": 0.6206896551724138,
"eval_QUANTITY_recall": 0.782608695652174,
"eval_TIME_f1": 0.7407407407407408,
"eval_TIME_number": 26,
"eval_TIME_precision": 0.7142857142857143,
"eval_TIME_recall": 0.7692307692307693,
"eval_loss": 0.20722047984600067,
"eval_overall_accuracy": 0.9549662246685013,
"eval_overall_f1": 0.8144044321329639,
"eval_overall_precision": 0.7676240208877284,
"eval_overall_recall": 0.8672566371681416,
"eval_runtime": 0.9384,
"eval_samples_per_second": 199.274,
"eval_steps_per_second": 3.197,
"step": 10070
},
{
"epoch": 96.0,
"grad_norm": 0.45156100392341614,
"learning_rate": 2.0000000000000003e-06,
"loss": 0.0255,
"step": 10176
},
{
"epoch": 96.0,
"eval_LOCATION_f1": 0.8344370860927153,
"eval_LOCATION_number": 72,
"eval_LOCATION_precision": 0.7974683544303798,
"eval_LOCATION_recall": 0.875,
"eval_ORGANIZATION_f1": 0.759493670886076,
"eval_ORGANIZATION_number": 75,
"eval_ORGANIZATION_precision": 0.7228915662650602,
"eval_ORGANIZATION_recall": 0.8,
"eval_PERSON_f1": 0.868421052631579,
"eval_PERSON_number": 143,
"eval_PERSON_precision": 0.8198757763975155,
"eval_PERSON_recall": 0.9230769230769231,
"eval_QUANTITY_f1": 0.6923076923076923,
"eval_QUANTITY_number": 23,
"eval_QUANTITY_precision": 0.6206896551724138,
"eval_QUANTITY_recall": 0.782608695652174,
"eval_TIME_f1": 0.7407407407407408,
"eval_TIME_number": 26,
"eval_TIME_precision": 0.7142857142857143,
"eval_TIME_recall": 0.7692307692307693,
"eval_loss": 0.20072737336158752,
"eval_overall_accuracy": 0.9554665999499625,
"eval_overall_f1": 0.8150208623087621,
"eval_overall_precision": 0.7710526315789473,
"eval_overall_recall": 0.8643067846607669,
"eval_runtime": 0.93,
"eval_samples_per_second": 201.077,
"eval_steps_per_second": 3.226,
"step": 10176
},
{
"epoch": 97.0,
"grad_norm": 0.905977725982666,
"learning_rate": 1.5e-06,
"loss": 0.0248,
"step": 10282
},
{
"epoch": 97.0,
"eval_LOCATION_f1": 0.8211920529801324,
"eval_LOCATION_number": 72,
"eval_LOCATION_precision": 0.7848101265822784,
"eval_LOCATION_recall": 0.8611111111111112,
"eval_ORGANIZATION_f1": 0.7612903225806452,
"eval_ORGANIZATION_number": 75,
"eval_ORGANIZATION_precision": 0.7375,
"eval_ORGANIZATION_recall": 0.7866666666666666,
"eval_PERSON_f1": 0.8721311475409836,
"eval_PERSON_number": 143,
"eval_PERSON_precision": 0.8209876543209876,
"eval_PERSON_recall": 0.9300699300699301,
"eval_QUANTITY_f1": 0.6923076923076923,
"eval_QUANTITY_number": 23,
"eval_QUANTITY_precision": 0.6206896551724138,
"eval_QUANTITY_recall": 0.782608695652174,
"eval_TIME_f1": 0.7407407407407408,
"eval_TIME_number": 26,
"eval_TIME_precision": 0.7142857142857143,
"eval_TIME_recall": 0.7692307692307693,
"eval_loss": 0.201884463429451,
"eval_overall_accuracy": 0.955716787590693,
"eval_overall_f1": 0.8145048814504882,
"eval_overall_precision": 0.7724867724867724,
"eval_overall_recall": 0.8613569321533924,
"eval_runtime": 0.9411,
"eval_samples_per_second": 198.713,
"eval_steps_per_second": 3.188,
"step": 10282
},
{
"epoch": 98.0,
"grad_norm": 0.701413631439209,
"learning_rate": 1.0000000000000002e-06,
"loss": 0.0258,
"step": 10388
},
{
"epoch": 98.0,
"eval_LOCATION_f1": 0.8211920529801324,
"eval_LOCATION_number": 72,
"eval_LOCATION_precision": 0.7848101265822784,
"eval_LOCATION_recall": 0.8611111111111112,
"eval_ORGANIZATION_f1": 0.759493670886076,
"eval_ORGANIZATION_number": 75,
"eval_ORGANIZATION_precision": 0.7228915662650602,
"eval_ORGANIZATION_recall": 0.8,
"eval_PERSON_f1": 0.868421052631579,
"eval_PERSON_number": 143,
"eval_PERSON_precision": 0.8198757763975155,
"eval_PERSON_recall": 0.9230769230769231,
"eval_QUANTITY_f1": 0.6923076923076923,
"eval_QUANTITY_number": 23,
"eval_QUANTITY_precision": 0.6206896551724138,
"eval_QUANTITY_recall": 0.782608695652174,
"eval_TIME_f1": 0.7407407407407408,
"eval_TIME_number": 26,
"eval_TIME_precision": 0.7142857142857143,
"eval_TIME_recall": 0.7692307692307693,
"eval_loss": 0.20242148637771606,
"eval_overall_accuracy": 0.9554665999499625,
"eval_overall_f1": 0.812239221140473,
"eval_overall_precision": 0.7684210526315789,
"eval_overall_recall": 0.8613569321533924,
"eval_runtime": 0.9222,
"eval_samples_per_second": 202.767,
"eval_steps_per_second": 3.253,
"step": 10388
},
{
"epoch": 99.0,
"grad_norm": 0.5330938696861267,
"learning_rate": 5.000000000000001e-07,
"loss": 0.0251,
"step": 10494
},
{
"epoch": 99.0,
"eval_LOCATION_f1": 0.8211920529801324,
"eval_LOCATION_number": 72,
"eval_LOCATION_precision": 0.7848101265822784,
"eval_LOCATION_recall": 0.8611111111111112,
"eval_ORGANIZATION_f1": 0.7721518987341773,
"eval_ORGANIZATION_number": 75,
"eval_ORGANIZATION_precision": 0.7349397590361446,
"eval_ORGANIZATION_recall": 0.8133333333333334,
"eval_PERSON_f1": 0.8721311475409836,
"eval_PERSON_number": 143,
"eval_PERSON_precision": 0.8209876543209876,
"eval_PERSON_recall": 0.9300699300699301,
"eval_QUANTITY_f1": 0.6923076923076923,
"eval_QUANTITY_number": 23,
"eval_QUANTITY_precision": 0.6206896551724138,
"eval_QUANTITY_recall": 0.782608695652174,
"eval_TIME_f1": 0.7407407407407408,
"eval_TIME_number": 26,
"eval_TIME_precision": 0.7142857142857143,
"eval_TIME_recall": 0.7692307692307693,
"eval_loss": 0.2052735686302185,
"eval_overall_accuracy": 0.9559669752314236,
"eval_overall_f1": 0.8166666666666667,
"eval_overall_precision": 0.7716535433070866,
"eval_overall_recall": 0.8672566371681416,
"eval_runtime": 0.9322,
"eval_samples_per_second": 200.61,
"eval_steps_per_second": 3.218,
"step": 10494
},
{
"epoch": 100.0,
"grad_norm": 0.6201446652412415,
"learning_rate": 0.0,
"loss": 0.0255,
"step": 10600
},
{
"epoch": 100.0,
"eval_LOCATION_f1": 0.8133333333333332,
"eval_LOCATION_number": 72,
"eval_LOCATION_precision": 0.782051282051282,
"eval_LOCATION_recall": 0.8472222222222222,
"eval_ORGANIZATION_f1": 0.7643312101910827,
"eval_ORGANIZATION_number": 75,
"eval_ORGANIZATION_precision": 0.7317073170731707,
"eval_ORGANIZATION_recall": 0.8,
"eval_PERSON_f1": 0.8721311475409836,
"eval_PERSON_number": 143,
"eval_PERSON_precision": 0.8209876543209876,
"eval_PERSON_recall": 0.9300699300699301,
"eval_QUANTITY_f1": 0.6923076923076923,
"eval_QUANTITY_number": 23,
"eval_QUANTITY_precision": 0.6206896551724138,
"eval_QUANTITY_recall": 0.782608695652174,
"eval_TIME_f1": 0.7407407407407408,
"eval_TIME_number": 26,
"eval_TIME_precision": 0.7142857142857143,
"eval_TIME_recall": 0.7692307692307693,
"eval_loss": 0.20351509749889374,
"eval_overall_accuracy": 0.9554665999499625,
"eval_overall_f1": 0.8133704735376045,
"eval_overall_precision": 0.7704485488126649,
"eval_overall_recall": 0.8613569321533924,
"eval_runtime": 0.9365,
"eval_samples_per_second": 199.684,
"eval_steps_per_second": 3.203,
"step": 10600
},
{
"epoch": 100.0,
"step": 10600,
"total_flos": 5023623771566022.0,
"train_loss": 0.07431833881252217,
"train_runtime": 1320.4476,
"train_samples_per_second": 127.76,
"train_steps_per_second": 8.028
}
],
"logging_steps": 500,
"max_steps": 10600,
"num_input_tokens_seen": 0,
"num_train_epochs": 100,
"save_steps": 500,
"total_flos": 5023623771566022.0,
"train_batch_size": 16,
"trial_name": null,
"trial_params": null
}