nerugm-pt-pl50-3 / trainer_state.json
apwic's picture
End of training
8b3c2e5 verified
{
"best_metric": null,
"best_model_checkpoint": null,
"epoch": 100.0,
"eval_steps": 500,
"global_step": 10600,
"is_hyper_param_search": false,
"is_local_process_zero": true,
"is_world_process_zero": true,
"log_history": [
{
"epoch": 1.0,
"grad_norm": 2.1874585151672363,
"learning_rate": 4.9500000000000004e-05,
"loss": 1.0045,
"step": 106
},
{
"epoch": 1.0,
"eval_LOCATION_f1": 0.0,
"eval_LOCATION_number": 71,
"eval_LOCATION_precision": 0.0,
"eval_LOCATION_recall": 0.0,
"eval_ORGANIZATION_f1": 0.0,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.0,
"eval_ORGANIZATION_recall": 0.0,
"eval_PERSON_f1": 0.012121212121212121,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.06666666666666667,
"eval_PERSON_recall": 0.006666666666666667,
"eval_QUANTITY_f1": 0.0,
"eval_QUANTITY_number": 33,
"eval_QUANTITY_precision": 0.0,
"eval_QUANTITY_recall": 0.0,
"eval_TIME_f1": 0.0,
"eval_TIME_number": 28,
"eval_TIME_precision": 0.0,
"eval_TIME_recall": 0.0,
"eval_loss": 0.5767342448234558,
"eval_overall_accuracy": 0.8433559650824443,
"eval_overall_f1": 0.005434782608695652,
"eval_overall_precision": 0.047619047619047616,
"eval_overall_recall": 0.002881844380403458,
"eval_runtime": 0.3512,
"eval_samples_per_second": 532.399,
"eval_steps_per_second": 8.541,
"step": 106
},
{
"epoch": 2.0,
"grad_norm": 1.000261664390564,
"learning_rate": 4.9e-05,
"loss": 0.4985,
"step": 212
},
{
"epoch": 2.0,
"eval_LOCATION_f1": 0.3859649122807017,
"eval_LOCATION_number": 71,
"eval_LOCATION_precision": 0.5116279069767442,
"eval_LOCATION_recall": 0.30985915492957744,
"eval_ORGANIZATION_f1": 0.14184397163120568,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.13157894736842105,
"eval_ORGANIZATION_recall": 0.15384615384615385,
"eval_PERSON_f1": 0.7315634218289085,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.656084656084656,
"eval_PERSON_recall": 0.8266666666666667,
"eval_QUANTITY_f1": 0.15625,
"eval_QUANTITY_number": 33,
"eval_QUANTITY_precision": 0.16129032258064516,
"eval_QUANTITY_recall": 0.15151515151515152,
"eval_TIME_f1": 0.7,
"eval_TIME_number": 28,
"eval_TIME_precision": 0.65625,
"eval_TIME_recall": 0.75,
"eval_loss": 0.34785470366477966,
"eval_overall_accuracy": 0.9083414161008729,
"eval_overall_f1": 0.5069637883008357,
"eval_overall_precision": 0.49056603773584906,
"eval_overall_recall": 0.5244956772334294,
"eval_runtime": 0.3485,
"eval_samples_per_second": 536.657,
"eval_steps_per_second": 8.609,
"step": 212
},
{
"epoch": 3.0,
"grad_norm": 0.8842161297798157,
"learning_rate": 4.85e-05,
"loss": 0.2936,
"step": 318
},
{
"epoch": 3.0,
"eval_LOCATION_f1": 0.6119402985074627,
"eval_LOCATION_number": 71,
"eval_LOCATION_precision": 0.6507936507936508,
"eval_LOCATION_recall": 0.5774647887323944,
"eval_ORGANIZATION_f1": 0.4255319148936171,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.39473684210526316,
"eval_ORGANIZATION_recall": 0.46153846153846156,
"eval_PERSON_f1": 0.8238993710691823,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.7797619047619048,
"eval_PERSON_recall": 0.8733333333333333,
"eval_QUANTITY_f1": 0.5866666666666667,
"eval_QUANTITY_number": 33,
"eval_QUANTITY_precision": 0.5238095238095238,
"eval_QUANTITY_recall": 0.6666666666666666,
"eval_TIME_f1": 0.8571428571428571,
"eval_TIME_number": 28,
"eval_TIME_precision": 0.8571428571428571,
"eval_TIME_recall": 0.8571428571428571,
"eval_loss": 0.2019408941268921,
"eval_overall_accuracy": 0.9340446168768186,
"eval_overall_f1": 0.6850828729281768,
"eval_overall_precision": 0.6578249336870027,
"eval_overall_recall": 0.7146974063400576,
"eval_runtime": 0.3515,
"eval_samples_per_second": 531.999,
"eval_steps_per_second": 8.535,
"step": 318
},
{
"epoch": 4.0,
"grad_norm": 1.0422954559326172,
"learning_rate": 4.8e-05,
"loss": 0.2113,
"step": 424
},
{
"epoch": 4.0,
"eval_LOCATION_f1": 0.6666666666666667,
"eval_LOCATION_number": 71,
"eval_LOCATION_precision": 0.611764705882353,
"eval_LOCATION_recall": 0.7323943661971831,
"eval_ORGANIZATION_f1": 0.6583850931677019,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.5520833333333334,
"eval_ORGANIZATION_recall": 0.8153846153846154,
"eval_PERSON_f1": 0.8473520249221183,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.7953216374269005,
"eval_PERSON_recall": 0.9066666666666666,
"eval_QUANTITY_f1": 0.7012987012987013,
"eval_QUANTITY_number": 33,
"eval_QUANTITY_precision": 0.6136363636363636,
"eval_QUANTITY_recall": 0.8181818181818182,
"eval_TIME_f1": 0.8571428571428571,
"eval_TIME_number": 28,
"eval_TIME_precision": 0.8571428571428571,
"eval_TIME_recall": 0.8571428571428571,
"eval_loss": 0.1662513017654419,
"eval_overall_accuracy": 0.9459262851600388,
"eval_overall_f1": 0.7574578469520102,
"eval_overall_precision": 0.6886792452830188,
"eval_overall_recall": 0.8414985590778098,
"eval_runtime": 0.3504,
"eval_samples_per_second": 533.64,
"eval_steps_per_second": 8.561,
"step": 424
},
{
"epoch": 5.0,
"grad_norm": 1.0871312618255615,
"learning_rate": 4.75e-05,
"loss": 0.1824,
"step": 530
},
{
"epoch": 5.0,
"eval_LOCATION_f1": 0.6951219512195121,
"eval_LOCATION_number": 71,
"eval_LOCATION_precision": 0.6129032258064516,
"eval_LOCATION_recall": 0.8028169014084507,
"eval_ORGANIZATION_f1": 0.6580645161290322,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.5666666666666667,
"eval_ORGANIZATION_recall": 0.7846153846153846,
"eval_PERSON_f1": 0.8607594936708859,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.8192771084337349,
"eval_PERSON_recall": 0.9066666666666666,
"eval_QUANTITY_f1": 0.7088607594936709,
"eval_QUANTITY_number": 33,
"eval_QUANTITY_precision": 0.6086956521739131,
"eval_QUANTITY_recall": 0.8484848484848485,
"eval_TIME_f1": 0.75,
"eval_TIME_number": 28,
"eval_TIME_precision": 0.6666666666666666,
"eval_TIME_recall": 0.8571428571428571,
"eval_loss": 0.15956708788871765,
"eval_overall_accuracy": 0.944713870029098,
"eval_overall_f1": 0.7609254498714653,
"eval_overall_precision": 0.6867749419953596,
"eval_overall_recall": 0.8530259365994236,
"eval_runtime": 0.3507,
"eval_samples_per_second": 533.247,
"eval_steps_per_second": 8.555,
"step": 530
},
{
"epoch": 6.0,
"grad_norm": 1.1978598833084106,
"learning_rate": 4.7e-05,
"loss": 0.1647,
"step": 636
},
{
"epoch": 6.0,
"eval_LOCATION_f1": 0.6946107784431137,
"eval_LOCATION_number": 71,
"eval_LOCATION_precision": 0.6041666666666666,
"eval_LOCATION_recall": 0.8169014084507042,
"eval_ORGANIZATION_f1": 0.651685393258427,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.5132743362831859,
"eval_ORGANIZATION_recall": 0.8923076923076924,
"eval_PERSON_f1": 0.8404907975460122,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.7784090909090909,
"eval_PERSON_recall": 0.9133333333333333,
"eval_QUANTITY_f1": 0.6588235294117647,
"eval_QUANTITY_number": 33,
"eval_QUANTITY_precision": 0.5384615384615384,
"eval_QUANTITY_recall": 0.8484848484848485,
"eval_TIME_f1": 0.7164179104477612,
"eval_TIME_number": 28,
"eval_TIME_precision": 0.6153846153846154,
"eval_TIME_recall": 0.8571428571428571,
"eval_loss": 0.1713540256023407,
"eval_overall_accuracy": 0.9369544131910766,
"eval_overall_f1": 0.741190765492102,
"eval_overall_precision": 0.6407563025210085,
"eval_overall_recall": 0.8789625360230547,
"eval_runtime": 0.3521,
"eval_samples_per_second": 531.071,
"eval_steps_per_second": 8.52,
"step": 636
},
{
"epoch": 7.0,
"grad_norm": 1.5508997440338135,
"learning_rate": 4.6500000000000005e-05,
"loss": 0.1533,
"step": 742
},
{
"epoch": 7.0,
"eval_LOCATION_f1": 0.6993865030674846,
"eval_LOCATION_number": 71,
"eval_LOCATION_precision": 0.6195652173913043,
"eval_LOCATION_recall": 0.8028169014084507,
"eval_ORGANIZATION_f1": 0.6790123456790124,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.5670103092783505,
"eval_ORGANIZATION_recall": 0.8461538461538461,
"eval_PERSON_f1": 0.8598130841121495,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.8070175438596491,
"eval_PERSON_recall": 0.92,
"eval_QUANTITY_f1": 0.7105263157894738,
"eval_QUANTITY_number": 33,
"eval_QUANTITY_precision": 0.627906976744186,
"eval_QUANTITY_recall": 0.8181818181818182,
"eval_TIME_f1": 0.806451612903226,
"eval_TIME_number": 28,
"eval_TIME_precision": 0.7352941176470589,
"eval_TIME_recall": 0.8928571428571429,
"eval_loss": 0.14624279737472534,
"eval_overall_accuracy": 0.9510184287099903,
"eval_overall_f1": 0.770408163265306,
"eval_overall_precision": 0.6910755148741419,
"eval_overall_recall": 0.8703170028818443,
"eval_runtime": 0.3512,
"eval_samples_per_second": 532.397,
"eval_steps_per_second": 8.541,
"step": 742
},
{
"epoch": 8.0,
"grad_norm": 0.8642424941062927,
"learning_rate": 4.600000000000001e-05,
"loss": 0.1405,
"step": 848
},
{
"epoch": 8.0,
"eval_LOCATION_f1": 0.7407407407407407,
"eval_LOCATION_number": 71,
"eval_LOCATION_precision": 0.6593406593406593,
"eval_LOCATION_recall": 0.8450704225352113,
"eval_ORGANIZATION_f1": 0.6783625730994152,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.5471698113207547,
"eval_ORGANIZATION_recall": 0.8923076923076924,
"eval_PERSON_f1": 0.8717948717948718,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.8395061728395061,
"eval_PERSON_recall": 0.9066666666666666,
"eval_QUANTITY_f1": 0.736842105263158,
"eval_QUANTITY_number": 33,
"eval_QUANTITY_precision": 0.6511627906976745,
"eval_QUANTITY_recall": 0.8484848484848485,
"eval_TIME_f1": 0.8333333333333334,
"eval_TIME_number": 28,
"eval_TIME_precision": 0.78125,
"eval_TIME_recall": 0.8928571428571429,
"eval_loss": 0.13807082176208496,
"eval_overall_accuracy": 0.950533462657614,
"eval_overall_f1": 0.7861715749039692,
"eval_overall_precision": 0.7073732718894009,
"eval_overall_recall": 0.8847262247838616,
"eval_runtime": 0.3504,
"eval_samples_per_second": 533.624,
"eval_steps_per_second": 8.561,
"step": 848
},
{
"epoch": 9.0,
"grad_norm": 1.233667254447937,
"learning_rate": 4.55e-05,
"loss": 0.1341,
"step": 954
},
{
"epoch": 9.0,
"eval_LOCATION_f1": 0.7741935483870968,
"eval_LOCATION_number": 71,
"eval_LOCATION_precision": 0.7142857142857143,
"eval_LOCATION_recall": 0.8450704225352113,
"eval_ORGANIZATION_f1": 0.6785714285714285,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.5533980582524272,
"eval_ORGANIZATION_recall": 0.8769230769230769,
"eval_PERSON_f1": 0.8562091503267975,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.8397435897435898,
"eval_PERSON_recall": 0.8733333333333333,
"eval_QUANTITY_f1": 0.7466666666666666,
"eval_QUANTITY_number": 33,
"eval_QUANTITY_precision": 0.6666666666666666,
"eval_QUANTITY_recall": 0.8484848484848485,
"eval_TIME_f1": 0.819672131147541,
"eval_TIME_number": 28,
"eval_TIME_precision": 0.7575757575757576,
"eval_TIME_recall": 0.8928571428571429,
"eval_loss": 0.13261349499225616,
"eval_overall_accuracy": 0.9495635305528612,
"eval_overall_f1": 0.7869281045751635,
"eval_overall_precision": 0.7200956937799043,
"eval_overall_recall": 0.8674351585014409,
"eval_runtime": 0.3537,
"eval_samples_per_second": 528.626,
"eval_steps_per_second": 8.481,
"step": 954
},
{
"epoch": 10.0,
"grad_norm": 1.0353517532348633,
"learning_rate": 4.5e-05,
"loss": 0.1274,
"step": 1060
},
{
"epoch": 10.0,
"eval_LOCATION_f1": 0.8104575163398693,
"eval_LOCATION_number": 71,
"eval_LOCATION_precision": 0.7560975609756098,
"eval_LOCATION_recall": 0.8732394366197183,
"eval_ORGANIZATION_f1": 0.7096774193548387,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.6111111111111112,
"eval_ORGANIZATION_recall": 0.8461538461538461,
"eval_PERSON_f1": 0.8910256410256411,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.8580246913580247,
"eval_PERSON_recall": 0.9266666666666666,
"eval_QUANTITY_f1": 0.7297297297297297,
"eval_QUANTITY_number": 33,
"eval_QUANTITY_precision": 0.6585365853658537,
"eval_QUANTITY_recall": 0.8181818181818182,
"eval_TIME_f1": 0.8620689655172413,
"eval_TIME_number": 28,
"eval_TIME_precision": 0.8333333333333334,
"eval_TIME_recall": 0.8928571428571429,
"eval_loss": 0.1223028227686882,
"eval_overall_accuracy": 0.9590203685741998,
"eval_overall_f1": 0.8191489361702129,
"eval_overall_precision": 0.7604938271604939,
"eval_overall_recall": 0.8876080691642652,
"eval_runtime": 0.3511,
"eval_samples_per_second": 532.631,
"eval_steps_per_second": 8.545,
"step": 1060
},
{
"epoch": 11.0,
"grad_norm": 0.7219051122665405,
"learning_rate": 4.4500000000000004e-05,
"loss": 0.1232,
"step": 1166
},
{
"epoch": 11.0,
"eval_LOCATION_f1": 0.7922077922077921,
"eval_LOCATION_number": 71,
"eval_LOCATION_precision": 0.7349397590361446,
"eval_LOCATION_recall": 0.8591549295774648,
"eval_ORGANIZATION_f1": 0.7204968944099378,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.6041666666666666,
"eval_ORGANIZATION_recall": 0.8923076923076924,
"eval_PERSON_f1": 0.8810289389067525,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.8509316770186336,
"eval_PERSON_recall": 0.9133333333333333,
"eval_QUANTITY_f1": 0.7012987012987013,
"eval_QUANTITY_number": 33,
"eval_QUANTITY_precision": 0.6136363636363636,
"eval_QUANTITY_recall": 0.8181818181818182,
"eval_TIME_f1": 0.8474576271186439,
"eval_TIME_number": 28,
"eval_TIME_precision": 0.8064516129032258,
"eval_TIME_recall": 0.8928571428571429,
"eval_loss": 0.1300116926431656,
"eval_overall_accuracy": 0.9529582929194956,
"eval_overall_f1": 0.8083989501312335,
"eval_overall_precision": 0.7421686746987952,
"eval_overall_recall": 0.8876080691642652,
"eval_runtime": 0.3501,
"eval_samples_per_second": 534.192,
"eval_steps_per_second": 8.57,
"step": 1166
},
{
"epoch": 12.0,
"grad_norm": 1.0894474983215332,
"learning_rate": 4.4000000000000006e-05,
"loss": 0.1195,
"step": 1272
},
{
"epoch": 12.0,
"eval_LOCATION_f1": 0.728395061728395,
"eval_LOCATION_number": 71,
"eval_LOCATION_precision": 0.6483516483516484,
"eval_LOCATION_recall": 0.8309859154929577,
"eval_ORGANIZATION_f1": 0.6909090909090909,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.57,
"eval_ORGANIZATION_recall": 0.8769230769230769,
"eval_PERSON_f1": 0.8910256410256411,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.8580246913580247,
"eval_PERSON_recall": 0.9266666666666666,
"eval_QUANTITY_f1": 0.7297297297297297,
"eval_QUANTITY_number": 33,
"eval_QUANTITY_precision": 0.6585365853658537,
"eval_QUANTITY_recall": 0.8181818181818182,
"eval_TIME_f1": 0.7999999999999999,
"eval_TIME_number": 28,
"eval_TIME_precision": 0.75,
"eval_TIME_recall": 0.8571428571428571,
"eval_loss": 0.14111082255840302,
"eval_overall_accuracy": 0.9522308438409312,
"eval_overall_f1": 0.7917205692108668,
"eval_overall_precision": 0.7183098591549296,
"eval_overall_recall": 0.8818443804034583,
"eval_runtime": 0.3502,
"eval_samples_per_second": 534.002,
"eval_steps_per_second": 8.567,
"step": 1272
},
{
"epoch": 13.0,
"grad_norm": 0.5753965377807617,
"learning_rate": 4.35e-05,
"loss": 0.1138,
"step": 1378
},
{
"epoch": 13.0,
"eval_LOCATION_f1": 0.8157894736842104,
"eval_LOCATION_number": 71,
"eval_LOCATION_precision": 0.7654320987654321,
"eval_LOCATION_recall": 0.8732394366197183,
"eval_ORGANIZATION_f1": 0.7239263803680982,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.6020408163265306,
"eval_ORGANIZATION_recall": 0.9076923076923077,
"eval_PERSON_f1": 0.8838709677419355,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.85625,
"eval_PERSON_recall": 0.9133333333333333,
"eval_QUANTITY_f1": 0.7567567567567567,
"eval_QUANTITY_number": 33,
"eval_QUANTITY_precision": 0.6829268292682927,
"eval_QUANTITY_recall": 0.8484848484848485,
"eval_TIME_f1": 0.9259259259259259,
"eval_TIME_number": 28,
"eval_TIME_precision": 0.9615384615384616,
"eval_TIME_recall": 0.8928571428571429,
"eval_loss": 0.12571823596954346,
"eval_overall_accuracy": 0.9570805043646945,
"eval_overall_f1": 0.8260292164674636,
"eval_overall_precision": 0.7660098522167488,
"eval_overall_recall": 0.8962536023054755,
"eval_runtime": 0.3506,
"eval_samples_per_second": 533.355,
"eval_steps_per_second": 8.556,
"step": 1378
},
{
"epoch": 14.0,
"grad_norm": 1.7395552396774292,
"learning_rate": 4.3e-05,
"loss": 0.1106,
"step": 1484
},
{
"epoch": 14.0,
"eval_LOCATION_f1": 0.7973856209150327,
"eval_LOCATION_number": 71,
"eval_LOCATION_precision": 0.7439024390243902,
"eval_LOCATION_recall": 0.8591549295774648,
"eval_ORGANIZATION_f1": 0.7160493827160493,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.5979381443298969,
"eval_ORGANIZATION_recall": 0.8923076923076924,
"eval_PERSON_f1": 0.8903225806451613,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.8625,
"eval_PERSON_recall": 0.92,
"eval_QUANTITY_f1": 0.7088607594936709,
"eval_QUANTITY_number": 33,
"eval_QUANTITY_precision": 0.6086956521739131,
"eval_QUANTITY_recall": 0.8484848484848485,
"eval_TIME_f1": 0.819672131147541,
"eval_TIME_number": 28,
"eval_TIME_precision": 0.7575757575757576,
"eval_TIME_recall": 0.8928571428571429,
"eval_loss": 0.1278010457754135,
"eval_overall_accuracy": 0.9541707080504365,
"eval_overall_f1": 0.8104575163398693,
"eval_overall_precision": 0.7416267942583732,
"eval_overall_recall": 0.8933717579250721,
"eval_runtime": 0.3503,
"eval_samples_per_second": 533.795,
"eval_steps_per_second": 8.564,
"step": 1484
},
{
"epoch": 15.0,
"grad_norm": 1.1085916757583618,
"learning_rate": 4.25e-05,
"loss": 0.1037,
"step": 1590
},
{
"epoch": 15.0,
"eval_LOCATION_f1": 0.8,
"eval_LOCATION_number": 71,
"eval_LOCATION_precision": 0.7380952380952381,
"eval_LOCATION_recall": 0.8732394366197183,
"eval_ORGANIZATION_f1": 0.7375,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.6210526315789474,
"eval_ORGANIZATION_recall": 0.9076923076923077,
"eval_PERSON_f1": 0.8974358974358974,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.8641975308641975,
"eval_PERSON_recall": 0.9333333333333333,
"eval_QUANTITY_f1": 0.691358024691358,
"eval_QUANTITY_number": 33,
"eval_QUANTITY_precision": 0.5833333333333334,
"eval_QUANTITY_recall": 0.8484848484848485,
"eval_TIME_f1": 0.8474576271186439,
"eval_TIME_number": 28,
"eval_TIME_precision": 0.8064516129032258,
"eval_TIME_recall": 0.8928571428571429,
"eval_loss": 0.1332232654094696,
"eval_overall_accuracy": 0.953443258971872,
"eval_overall_f1": 0.81877444589309,
"eval_overall_precision": 0.7476190476190476,
"eval_overall_recall": 0.9048991354466859,
"eval_runtime": 0.3501,
"eval_samples_per_second": 534.13,
"eval_steps_per_second": 8.569,
"step": 1590
},
{
"epoch": 16.0,
"grad_norm": 1.2298065423965454,
"learning_rate": 4.2e-05,
"loss": 0.1015,
"step": 1696
},
{
"epoch": 16.0,
"eval_LOCATION_f1": 0.7870967741935485,
"eval_LOCATION_number": 71,
"eval_LOCATION_precision": 0.7261904761904762,
"eval_LOCATION_recall": 0.8591549295774648,
"eval_ORGANIZATION_f1": 0.7453416149068324,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.625,
"eval_ORGANIZATION_recall": 0.9230769230769231,
"eval_PERSON_f1": 0.8910256410256411,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.8580246913580247,
"eval_PERSON_recall": 0.9266666666666666,
"eval_QUANTITY_f1": 0.6506024096385542,
"eval_QUANTITY_number": 33,
"eval_QUANTITY_precision": 0.54,
"eval_QUANTITY_recall": 0.8181818181818182,
"eval_TIME_f1": 0.8620689655172413,
"eval_TIME_number": 28,
"eval_TIME_precision": 0.8333333333333334,
"eval_TIME_recall": 0.8928571428571429,
"eval_loss": 0.13960066437721252,
"eval_overall_accuracy": 0.9539282250242483,
"eval_overall_f1": 0.811443433029909,
"eval_overall_precision": 0.7393364928909952,
"eval_overall_recall": 0.899135446685879,
"eval_runtime": 0.3495,
"eval_samples_per_second": 535.049,
"eval_steps_per_second": 8.584,
"step": 1696
},
{
"epoch": 17.0,
"grad_norm": 0.7031758427619934,
"learning_rate": 4.15e-05,
"loss": 0.0958,
"step": 1802
},
{
"epoch": 17.0,
"eval_LOCATION_f1": 0.8104575163398693,
"eval_LOCATION_number": 71,
"eval_LOCATION_precision": 0.7560975609756098,
"eval_LOCATION_recall": 0.8732394366197183,
"eval_ORGANIZATION_f1": 0.728395061728395,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.6082474226804123,
"eval_ORGANIZATION_recall": 0.9076923076923077,
"eval_PERSON_f1": 0.90032154340836,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.8695652173913043,
"eval_PERSON_recall": 0.9333333333333333,
"eval_QUANTITY_f1": 0.7671232876712328,
"eval_QUANTITY_number": 33,
"eval_QUANTITY_precision": 0.7,
"eval_QUANTITY_recall": 0.8484848484848485,
"eval_TIME_f1": 0.8333333333333334,
"eval_TIME_number": 28,
"eval_TIME_precision": 0.78125,
"eval_TIME_recall": 0.8928571428571429,
"eval_loss": 0.12715467810630798,
"eval_overall_accuracy": 0.9580504364694471,
"eval_overall_f1": 0.8274044795783926,
"eval_overall_precision": 0.7621359223300971,
"eval_overall_recall": 0.9048991354466859,
"eval_runtime": 0.3498,
"eval_samples_per_second": 534.552,
"eval_steps_per_second": 8.576,
"step": 1802
},
{
"epoch": 18.0,
"grad_norm": 0.8438174724578857,
"learning_rate": 4.1e-05,
"loss": 0.0957,
"step": 1908
},
{
"epoch": 18.0,
"eval_LOCATION_f1": 0.782051282051282,
"eval_LOCATION_number": 71,
"eval_LOCATION_precision": 0.7176470588235294,
"eval_LOCATION_recall": 0.8591549295774648,
"eval_ORGANIZATION_f1": 0.7017543859649122,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.5660377358490566,
"eval_ORGANIZATION_recall": 0.9230769230769231,
"eval_PERSON_f1": 0.8945686900958466,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.8588957055214724,
"eval_PERSON_recall": 0.9333333333333333,
"eval_QUANTITY_f1": 0.7105263157894738,
"eval_QUANTITY_number": 33,
"eval_QUANTITY_precision": 0.627906976744186,
"eval_QUANTITY_recall": 0.8181818181818182,
"eval_TIME_f1": 0.8333333333333334,
"eval_TIME_number": 28,
"eval_TIME_precision": 0.78125,
"eval_TIME_recall": 0.8928571428571429,
"eval_loss": 0.14869378507137299,
"eval_overall_accuracy": 0.9527158098933075,
"eval_overall_f1": 0.8067010309278351,
"eval_overall_precision": 0.7296037296037297,
"eval_overall_recall": 0.9020172910662824,
"eval_runtime": 0.3502,
"eval_samples_per_second": 534.029,
"eval_steps_per_second": 8.567,
"step": 1908
},
{
"epoch": 19.0,
"grad_norm": 0.7291853427886963,
"learning_rate": 4.05e-05,
"loss": 0.0943,
"step": 2014
},
{
"epoch": 19.0,
"eval_LOCATION_f1": 0.8026315789473684,
"eval_LOCATION_number": 71,
"eval_LOCATION_precision": 0.7530864197530864,
"eval_LOCATION_recall": 0.8591549295774648,
"eval_ORGANIZATION_f1": 0.7195121951219511,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.5959595959595959,
"eval_ORGANIZATION_recall": 0.9076923076923077,
"eval_PERSON_f1": 0.90032154340836,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.8695652173913043,
"eval_PERSON_recall": 0.9333333333333333,
"eval_QUANTITY_f1": 0.7567567567567567,
"eval_QUANTITY_number": 33,
"eval_QUANTITY_precision": 0.6829268292682927,
"eval_QUANTITY_recall": 0.8484848484848485,
"eval_TIME_f1": 0.8771929824561403,
"eval_TIME_number": 28,
"eval_TIME_precision": 0.8620689655172413,
"eval_TIME_recall": 0.8928571428571429,
"eval_loss": 0.12535077333450317,
"eval_overall_accuracy": 0.957807953443259,
"eval_overall_f1": 0.8258575197889182,
"eval_overall_precision": 0.7615571776155717,
"eval_overall_recall": 0.9020172910662824,
"eval_runtime": 0.3513,
"eval_samples_per_second": 532.375,
"eval_steps_per_second": 8.541,
"step": 2014
},
{
"epoch": 20.0,
"grad_norm": 1.0950889587402344,
"learning_rate": 4e-05,
"loss": 0.0915,
"step": 2120
},
{
"epoch": 20.0,
"eval_LOCATION_f1": 0.8026315789473684,
"eval_LOCATION_number": 71,
"eval_LOCATION_precision": 0.7530864197530864,
"eval_LOCATION_recall": 0.8591549295774648,
"eval_ORGANIZATION_f1": 0.7421383647798743,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.6276595744680851,
"eval_ORGANIZATION_recall": 0.9076923076923077,
"eval_PERSON_f1": 0.90032154340836,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.8695652173913043,
"eval_PERSON_recall": 0.9333333333333333,
"eval_QUANTITY_f1": 0.7466666666666666,
"eval_QUANTITY_number": 33,
"eval_QUANTITY_precision": 0.6666666666666666,
"eval_QUANTITY_recall": 0.8484848484848485,
"eval_TIME_f1": 0.9259259259259259,
"eval_TIME_number": 28,
"eval_TIME_precision": 0.9615384615384616,
"eval_TIME_recall": 0.8928571428571429,
"eval_loss": 0.12668967247009277,
"eval_overall_accuracy": 0.9590203685741998,
"eval_overall_f1": 0.8335552596537948,
"eval_overall_precision": 0.7747524752475248,
"eval_overall_recall": 0.9020172910662824,
"eval_runtime": 0.3504,
"eval_samples_per_second": 533.636,
"eval_steps_per_second": 8.561,
"step": 2120
},
{
"epoch": 21.0,
"grad_norm": 1.227335810661316,
"learning_rate": 3.9500000000000005e-05,
"loss": 0.0834,
"step": 2226
},
{
"epoch": 21.0,
"eval_LOCATION_f1": 0.7672955974842768,
"eval_LOCATION_number": 71,
"eval_LOCATION_precision": 0.6931818181818182,
"eval_LOCATION_recall": 0.8591549295774648,
"eval_ORGANIZATION_f1": 0.7239263803680982,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.6020408163265306,
"eval_ORGANIZATION_recall": 0.9076923076923077,
"eval_PERSON_f1": 0.8938906752411575,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.8633540372670807,
"eval_PERSON_recall": 0.9266666666666666,
"eval_QUANTITY_f1": 0.6410256410256411,
"eval_QUANTITY_number": 33,
"eval_QUANTITY_precision": 0.5555555555555556,
"eval_QUANTITY_recall": 0.7575757575757576,
"eval_TIME_f1": 0.8928571428571429,
"eval_TIME_number": 28,
"eval_TIME_precision": 0.8928571428571429,
"eval_TIME_recall": 0.8928571428571429,
"eval_loss": 0.1432582437992096,
"eval_overall_accuracy": 0.953443258971872,
"eval_overall_f1": 0.8057366362451109,
"eval_overall_precision": 0.7357142857142858,
"eval_overall_recall": 0.8904899135446686,
"eval_runtime": 0.3505,
"eval_samples_per_second": 533.585,
"eval_steps_per_second": 8.56,
"step": 2226
},
{
"epoch": 22.0,
"grad_norm": 0.8867971301078796,
"learning_rate": 3.9000000000000006e-05,
"loss": 0.0839,
"step": 2332
},
{
"epoch": 22.0,
"eval_LOCATION_f1": 0.7922077922077921,
"eval_LOCATION_number": 71,
"eval_LOCATION_precision": 0.7349397590361446,
"eval_LOCATION_recall": 0.8591549295774648,
"eval_ORGANIZATION_f1": 0.7329192546583851,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.6145833333333334,
"eval_ORGANIZATION_recall": 0.9076923076923077,
"eval_PERSON_f1": 0.9032258064516129,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.875,
"eval_PERSON_recall": 0.9333333333333333,
"eval_QUANTITY_f1": 0.6582278481012658,
"eval_QUANTITY_number": 33,
"eval_QUANTITY_precision": 0.5652173913043478,
"eval_QUANTITY_recall": 0.7878787878787878,
"eval_TIME_f1": 0.8928571428571429,
"eval_TIME_number": 28,
"eval_TIME_precision": 0.8928571428571429,
"eval_TIME_recall": 0.8928571428571429,
"eval_loss": 0.14338690042495728,
"eval_overall_accuracy": 0.9546556741028128,
"eval_overall_f1": 0.8184210526315788,
"eval_overall_precision": 0.7530266343825666,
"eval_overall_recall": 0.8962536023054755,
"eval_runtime": 0.3497,
"eval_samples_per_second": 534.745,
"eval_steps_per_second": 8.579,
"step": 2332
},
{
"epoch": 23.0,
"grad_norm": 1.0698140859603882,
"learning_rate": 3.85e-05,
"loss": 0.0807,
"step": 2438
},
{
"epoch": 23.0,
"eval_LOCATION_f1": 0.782051282051282,
"eval_LOCATION_number": 71,
"eval_LOCATION_precision": 0.7176470588235294,
"eval_LOCATION_recall": 0.8591549295774648,
"eval_ORGANIZATION_f1": 0.7195121951219511,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.5959595959595959,
"eval_ORGANIZATION_recall": 0.9076923076923077,
"eval_PERSON_f1": 0.912621359223301,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.8867924528301887,
"eval_PERSON_recall": 0.94,
"eval_QUANTITY_f1": 0.7671232876712328,
"eval_QUANTITY_number": 33,
"eval_QUANTITY_precision": 0.7,
"eval_QUANTITY_recall": 0.8484848484848485,
"eval_TIME_f1": 0.8474576271186439,
"eval_TIME_number": 28,
"eval_TIME_precision": 0.8064516129032258,
"eval_TIME_recall": 0.8928571428571429,
"eval_loss": 0.13598859310150146,
"eval_overall_accuracy": 0.9585354025218235,
"eval_overall_f1": 0.8252299605781866,
"eval_overall_precision": 0.7584541062801933,
"eval_overall_recall": 0.9048991354466859,
"eval_runtime": 0.3499,
"eval_samples_per_second": 534.445,
"eval_steps_per_second": 8.574,
"step": 2438
},
{
"epoch": 24.0,
"grad_norm": 0.7420476675033569,
"learning_rate": 3.8e-05,
"loss": 0.0771,
"step": 2544
},
{
"epoch": 24.0,
"eval_LOCATION_f1": 0.7870967741935485,
"eval_LOCATION_number": 71,
"eval_LOCATION_precision": 0.7261904761904762,
"eval_LOCATION_recall": 0.8591549295774648,
"eval_ORGANIZATION_f1": 0.7215189873417722,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.6129032258064516,
"eval_ORGANIZATION_recall": 0.8769230769230769,
"eval_PERSON_f1": 0.9137380191693292,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.8773006134969326,
"eval_PERSON_recall": 0.9533333333333334,
"eval_QUANTITY_f1": 0.6419753086419753,
"eval_QUANTITY_number": 33,
"eval_QUANTITY_precision": 0.5416666666666666,
"eval_QUANTITY_recall": 0.7878787878787878,
"eval_TIME_f1": 0.8571428571428571,
"eval_TIME_number": 28,
"eval_TIME_precision": 0.8571428571428571,
"eval_TIME_recall": 0.8571428571428571,
"eval_loss": 0.14340347051620483,
"eval_overall_accuracy": 0.9539282250242483,
"eval_overall_f1": 0.8152031454783748,
"eval_overall_precision": 0.7475961538461539,
"eval_overall_recall": 0.8962536023054755,
"eval_runtime": 0.3509,
"eval_samples_per_second": 532.923,
"eval_steps_per_second": 8.55,
"step": 2544
},
{
"epoch": 25.0,
"grad_norm": 1.0963969230651855,
"learning_rate": 3.7500000000000003e-05,
"loss": 0.0772,
"step": 2650
},
{
"epoch": 25.0,
"eval_LOCATION_f1": 0.7770700636942676,
"eval_LOCATION_number": 71,
"eval_LOCATION_precision": 0.7093023255813954,
"eval_LOCATION_recall": 0.8591549295774648,
"eval_ORGANIZATION_f1": 0.7065868263473054,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.5784313725490197,
"eval_ORGANIZATION_recall": 0.9076923076923077,
"eval_PERSON_f1": 0.90032154340836,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.8695652173913043,
"eval_PERSON_recall": 0.9333333333333333,
"eval_QUANTITY_f1": 0.6428571428571428,
"eval_QUANTITY_number": 33,
"eval_QUANTITY_precision": 0.5294117647058824,
"eval_QUANTITY_recall": 0.8181818181818182,
"eval_TIME_f1": 0.8333333333333334,
"eval_TIME_number": 28,
"eval_TIME_precision": 0.78125,
"eval_TIME_recall": 0.8928571428571429,
"eval_loss": 0.1520393043756485,
"eval_overall_accuracy": 0.9502909796314258,
"eval_overall_f1": 0.8010269576379975,
"eval_overall_precision": 0.7222222222222222,
"eval_overall_recall": 0.899135446685879,
"eval_runtime": 0.3508,
"eval_samples_per_second": 533.007,
"eval_steps_per_second": 8.551,
"step": 2650
},
{
"epoch": 26.0,
"grad_norm": 0.38709110021591187,
"learning_rate": 3.7e-05,
"loss": 0.0732,
"step": 2756
},
{
"epoch": 26.0,
"eval_LOCATION_f1": 0.7741935483870968,
"eval_LOCATION_number": 71,
"eval_LOCATION_precision": 0.7142857142857143,
"eval_LOCATION_recall": 0.8450704225352113,
"eval_ORGANIZATION_f1": 0.7499999999999999,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.631578947368421,
"eval_ORGANIZATION_recall": 0.9230769230769231,
"eval_PERSON_f1": 0.9032258064516129,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.875,
"eval_PERSON_recall": 0.9333333333333333,
"eval_QUANTITY_f1": 0.6923076923076923,
"eval_QUANTITY_number": 33,
"eval_QUANTITY_precision": 0.6,
"eval_QUANTITY_recall": 0.8181818181818182,
"eval_TIME_f1": 0.9259259259259259,
"eval_TIME_number": 28,
"eval_TIME_precision": 0.9615384615384616,
"eval_TIME_recall": 0.8928571428571429,
"eval_loss": 0.14221937954425812,
"eval_overall_accuracy": 0.9570805043646945,
"eval_overall_f1": 0.8243064729194188,
"eval_overall_precision": 0.7609756097560976,
"eval_overall_recall": 0.899135446685879,
"eval_runtime": 0.3493,
"eval_samples_per_second": 535.398,
"eval_steps_per_second": 8.589,
"step": 2756
},
{
"epoch": 27.0,
"grad_norm": 0.5424766540527344,
"learning_rate": 3.65e-05,
"loss": 0.0731,
"step": 2862
},
{
"epoch": 27.0,
"eval_LOCATION_f1": 0.8026315789473684,
"eval_LOCATION_number": 71,
"eval_LOCATION_precision": 0.7530864197530864,
"eval_LOCATION_recall": 0.8591549295774648,
"eval_ORGANIZATION_f1": 0.7564102564102564,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.6483516483516484,
"eval_ORGANIZATION_recall": 0.9076923076923077,
"eval_PERSON_f1": 0.8938906752411575,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.8633540372670807,
"eval_PERSON_recall": 0.9266666666666666,
"eval_QUANTITY_f1": 0.65,
"eval_QUANTITY_number": 33,
"eval_QUANTITY_precision": 0.5531914893617021,
"eval_QUANTITY_recall": 0.7878787878787878,
"eval_TIME_f1": 0.8524590163934426,
"eval_TIME_number": 28,
"eval_TIME_precision": 0.7878787878787878,
"eval_TIME_recall": 0.9285714285714286,
"eval_loss": 0.13665592670440674,
"eval_overall_accuracy": 0.9556256062075654,
"eval_overall_f1": 0.8184210526315788,
"eval_overall_precision": 0.7530266343825666,
"eval_overall_recall": 0.8962536023054755,
"eval_runtime": 0.3499,
"eval_samples_per_second": 534.475,
"eval_steps_per_second": 8.574,
"step": 2862
},
{
"epoch": 28.0,
"grad_norm": 2.6486599445343018,
"learning_rate": 3.6e-05,
"loss": 0.0697,
"step": 2968
},
{
"epoch": 28.0,
"eval_LOCATION_f1": 0.8026315789473684,
"eval_LOCATION_number": 71,
"eval_LOCATION_precision": 0.7530864197530864,
"eval_LOCATION_recall": 0.8591549295774648,
"eval_ORGANIZATION_f1": 0.7160493827160493,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.5979381443298969,
"eval_ORGANIZATION_recall": 0.8923076923076924,
"eval_PERSON_f1": 0.9142857142857144,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.8727272727272727,
"eval_PERSON_recall": 0.96,
"eval_QUANTITY_f1": 0.6329113924050633,
"eval_QUANTITY_number": 33,
"eval_QUANTITY_precision": 0.5434782608695652,
"eval_QUANTITY_recall": 0.7575757575757576,
"eval_TIME_f1": 0.8333333333333334,
"eval_TIME_number": 28,
"eval_TIME_precision": 0.78125,
"eval_TIME_recall": 0.8928571428571429,
"eval_loss": 0.14497701823711395,
"eval_overall_accuracy": 0.954898157129001,
"eval_overall_f1": 0.8151041666666666,
"eval_overall_precision": 0.7434679334916865,
"eval_overall_recall": 0.9020172910662824,
"eval_runtime": 0.3505,
"eval_samples_per_second": 533.595,
"eval_steps_per_second": 8.56,
"step": 2968
},
{
"epoch": 29.0,
"grad_norm": 0.7765714526176453,
"learning_rate": 3.55e-05,
"loss": 0.0689,
"step": 3074
},
{
"epoch": 29.0,
"eval_LOCATION_f1": 0.8076923076923077,
"eval_LOCATION_number": 71,
"eval_LOCATION_precision": 0.7411764705882353,
"eval_LOCATION_recall": 0.8873239436619719,
"eval_ORGANIZATION_f1": 0.7085714285714286,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.5636363636363636,
"eval_ORGANIZATION_recall": 0.9538461538461539,
"eval_PERSON_f1": 0.887459807073955,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.8571428571428571,
"eval_PERSON_recall": 0.92,
"eval_QUANTITY_f1": 0.7397260273972603,
"eval_QUANTITY_number": 33,
"eval_QUANTITY_precision": 0.675,
"eval_QUANTITY_recall": 0.8181818181818182,
"eval_TIME_f1": 0.7936507936507937,
"eval_TIME_number": 28,
"eval_TIME_precision": 0.7142857142857143,
"eval_TIME_recall": 0.8928571428571429,
"eval_loss": 0.15288624167442322,
"eval_overall_accuracy": 0.9553831231813773,
"eval_overall_f1": 0.8097686375321336,
"eval_overall_precision": 0.7308584686774942,
"eval_overall_recall": 0.9077809798270894,
"eval_runtime": 0.3501,
"eval_samples_per_second": 534.16,
"eval_steps_per_second": 8.569,
"step": 3074
},
{
"epoch": 30.0,
"grad_norm": 0.8394734263420105,
"learning_rate": 3.5e-05,
"loss": 0.0669,
"step": 3180
},
{
"epoch": 30.0,
"eval_LOCATION_f1": 0.7870967741935485,
"eval_LOCATION_number": 71,
"eval_LOCATION_precision": 0.7261904761904762,
"eval_LOCATION_recall": 0.8591549295774648,
"eval_ORGANIZATION_f1": 0.7421383647798743,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.6276595744680851,
"eval_ORGANIZATION_recall": 0.9076923076923077,
"eval_PERSON_f1": 0.887459807073955,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.8571428571428571,
"eval_PERSON_recall": 0.92,
"eval_QUANTITY_f1": 0.736842105263158,
"eval_QUANTITY_number": 33,
"eval_QUANTITY_precision": 0.6511627906976745,
"eval_QUANTITY_recall": 0.8484848484848485,
"eval_TIME_f1": 0.8135593220338982,
"eval_TIME_number": 28,
"eval_TIME_precision": 0.7741935483870968,
"eval_TIME_recall": 0.8571428571428571,
"eval_loss": 0.14122405648231506,
"eval_overall_accuracy": 0.9570805043646945,
"eval_overall_f1": 0.8157894736842105,
"eval_overall_precision": 0.7506053268765133,
"eval_overall_recall": 0.8933717579250721,
"eval_runtime": 0.3503,
"eval_samples_per_second": 533.82,
"eval_steps_per_second": 8.564,
"step": 3180
},
{
"epoch": 31.0,
"grad_norm": 0.43885117769241333,
"learning_rate": 3.45e-05,
"loss": 0.0654,
"step": 3286
},
{
"epoch": 31.0,
"eval_LOCATION_f1": 0.779874213836478,
"eval_LOCATION_number": 71,
"eval_LOCATION_precision": 0.7045454545454546,
"eval_LOCATION_recall": 0.8732394366197183,
"eval_ORGANIZATION_f1": 0.7741935483870968,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.6666666666666666,
"eval_ORGANIZATION_recall": 0.9230769230769231,
"eval_PERSON_f1": 0.8810289389067525,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.8509316770186336,
"eval_PERSON_recall": 0.9133333333333333,
"eval_QUANTITY_f1": 0.7397260273972603,
"eval_QUANTITY_number": 33,
"eval_QUANTITY_precision": 0.675,
"eval_QUANTITY_recall": 0.8181818181818182,
"eval_TIME_f1": 0.8620689655172413,
"eval_TIME_number": 28,
"eval_TIME_precision": 0.8333333333333334,
"eval_TIME_recall": 0.8928571428571429,
"eval_loss": 0.13700760900974274,
"eval_overall_accuracy": 0.9614451988360815,
"eval_overall_f1": 0.8227513227513227,
"eval_overall_precision": 0.7603911980440098,
"eval_overall_recall": 0.8962536023054755,
"eval_runtime": 0.3506,
"eval_samples_per_second": 533.416,
"eval_steps_per_second": 8.557,
"step": 3286
},
{
"epoch": 32.0,
"grad_norm": 0.3841339647769928,
"learning_rate": 3.4000000000000007e-05,
"loss": 0.0639,
"step": 3392
},
{
"epoch": 32.0,
"eval_LOCATION_f1": 0.7922077922077921,
"eval_LOCATION_number": 71,
"eval_LOCATION_precision": 0.7349397590361446,
"eval_LOCATION_recall": 0.8591549295774648,
"eval_ORGANIZATION_f1": 0.7108433734939759,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.5841584158415841,
"eval_ORGANIZATION_recall": 0.9076923076923077,
"eval_PERSON_f1": 0.8903225806451613,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.8625,
"eval_PERSON_recall": 0.92,
"eval_QUANTITY_f1": 0.7012987012987013,
"eval_QUANTITY_number": 33,
"eval_QUANTITY_precision": 0.6136363636363636,
"eval_QUANTITY_recall": 0.8181818181818182,
"eval_TIME_f1": 0.8771929824561403,
"eval_TIME_number": 28,
"eval_TIME_precision": 0.8620689655172413,
"eval_TIME_recall": 0.8928571428571429,
"eval_loss": 0.14966341853141785,
"eval_overall_accuracy": 0.9561105722599418,
"eval_overall_f1": 0.81151832460733,
"eval_overall_precision": 0.7434052757793765,
"eval_overall_recall": 0.8933717579250721,
"eval_runtime": 0.3501,
"eval_samples_per_second": 534.13,
"eval_steps_per_second": 8.569,
"step": 3392
},
{
"epoch": 33.0,
"grad_norm": 0.86671382188797,
"learning_rate": 3.35e-05,
"loss": 0.0637,
"step": 3498
},
{
"epoch": 33.0,
"eval_LOCATION_f1": 0.8051948051948051,
"eval_LOCATION_number": 71,
"eval_LOCATION_precision": 0.7469879518072289,
"eval_LOCATION_recall": 0.8732394366197183,
"eval_ORGANIZATION_f1": 0.7297297297297298,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.6506024096385542,
"eval_ORGANIZATION_recall": 0.8307692307692308,
"eval_PERSON_f1": 0.9009584664536742,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.8650306748466258,
"eval_PERSON_recall": 0.94,
"eval_QUANTITY_f1": 0.7297297297297297,
"eval_QUANTITY_number": 33,
"eval_QUANTITY_precision": 0.6585365853658537,
"eval_QUANTITY_recall": 0.8181818181818182,
"eval_TIME_f1": 0.7868852459016394,
"eval_TIME_number": 28,
"eval_TIME_precision": 0.7272727272727273,
"eval_TIME_recall": 0.8571428571428571,
"eval_loss": 0.13783931732177734,
"eval_overall_accuracy": 0.9597478176527643,
"eval_overall_f1": 0.8213333333333332,
"eval_overall_precision": 0.7642679900744417,
"eval_overall_recall": 0.8876080691642652,
"eval_runtime": 0.3499,
"eval_samples_per_second": 534.488,
"eval_steps_per_second": 8.575,
"step": 3498
},
{
"epoch": 34.0,
"grad_norm": 0.8965917229652405,
"learning_rate": 3.3e-05,
"loss": 0.0625,
"step": 3604
},
{
"epoch": 34.0,
"eval_LOCATION_f1": 0.8181818181818181,
"eval_LOCATION_number": 71,
"eval_LOCATION_precision": 0.7590361445783133,
"eval_LOCATION_recall": 0.8873239436619719,
"eval_ORGANIZATION_f1": 0.759493670886076,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.6451612903225806,
"eval_ORGANIZATION_recall": 0.9230769230769231,
"eval_PERSON_f1": 0.896774193548387,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.86875,
"eval_PERSON_recall": 0.9266666666666666,
"eval_QUANTITY_f1": 0.7297297297297297,
"eval_QUANTITY_number": 33,
"eval_QUANTITY_precision": 0.6585365853658537,
"eval_QUANTITY_recall": 0.8181818181818182,
"eval_TIME_f1": 0.8666666666666666,
"eval_TIME_number": 28,
"eval_TIME_precision": 0.8125,
"eval_TIME_recall": 0.9285714285714286,
"eval_loss": 0.14487268030643463,
"eval_overall_accuracy": 0.9587778855480117,
"eval_overall_f1": 0.8333333333333334,
"eval_overall_precision": 0.7701711491442543,
"eval_overall_recall": 0.9077809798270894,
"eval_runtime": 0.3507,
"eval_samples_per_second": 533.265,
"eval_steps_per_second": 8.555,
"step": 3604
},
{
"epoch": 35.0,
"grad_norm": 0.7054619193077087,
"learning_rate": 3.2500000000000004e-05,
"loss": 0.0634,
"step": 3710
},
{
"epoch": 35.0,
"eval_LOCATION_f1": 0.7898089171974522,
"eval_LOCATION_number": 71,
"eval_LOCATION_precision": 0.7209302325581395,
"eval_LOCATION_recall": 0.8732394366197183,
"eval_ORGANIZATION_f1": 0.7483870967741936,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.6444444444444445,
"eval_ORGANIZATION_recall": 0.8923076923076924,
"eval_PERSON_f1": 0.8903225806451613,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.8625,
"eval_PERSON_recall": 0.92,
"eval_QUANTITY_f1": 0.7012987012987013,
"eval_QUANTITY_number": 33,
"eval_QUANTITY_precision": 0.6136363636363636,
"eval_QUANTITY_recall": 0.8181818181818182,
"eval_TIME_f1": 0.896551724137931,
"eval_TIME_number": 28,
"eval_TIME_precision": 0.8666666666666667,
"eval_TIME_recall": 0.9285714285714286,
"eval_loss": 0.14537405967712402,
"eval_overall_accuracy": 0.9573229873908826,
"eval_overall_f1": 0.821664464993395,
"eval_overall_precision": 0.7585365853658537,
"eval_overall_recall": 0.8962536023054755,
"eval_runtime": 0.35,
"eval_samples_per_second": 534.224,
"eval_steps_per_second": 8.57,
"step": 3710
},
{
"epoch": 36.0,
"grad_norm": 0.9769655466079712,
"learning_rate": 3.2000000000000005e-05,
"loss": 0.0592,
"step": 3816
},
{
"epoch": 36.0,
"eval_LOCATION_f1": 0.8051948051948051,
"eval_LOCATION_number": 71,
"eval_LOCATION_precision": 0.7469879518072289,
"eval_LOCATION_recall": 0.8732394366197183,
"eval_ORGANIZATION_f1": 0.7672955974842768,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.648936170212766,
"eval_ORGANIZATION_recall": 0.9384615384615385,
"eval_PERSON_f1": 0.9067524115755627,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.8757763975155279,
"eval_PERSON_recall": 0.94,
"eval_QUANTITY_f1": 0.6923076923076923,
"eval_QUANTITY_number": 33,
"eval_QUANTITY_precision": 0.6,
"eval_QUANTITY_recall": 0.8181818181818182,
"eval_TIME_f1": 0.8387096774193549,
"eval_TIME_number": 28,
"eval_TIME_precision": 0.7647058823529411,
"eval_TIME_recall": 0.9285714285714286,
"eval_loss": 0.1611613929271698,
"eval_overall_accuracy": 0.9561105722599418,
"eval_overall_f1": 0.8298429319371728,
"eval_overall_precision": 0.7601918465227818,
"eval_overall_recall": 0.9135446685878963,
"eval_runtime": 0.3514,
"eval_samples_per_second": 532.12,
"eval_steps_per_second": 8.537,
"step": 3816
},
{
"epoch": 37.0,
"grad_norm": 0.828741192817688,
"learning_rate": 3.15e-05,
"loss": 0.0597,
"step": 3922
},
{
"epoch": 37.0,
"eval_LOCATION_f1": 0.7643312101910827,
"eval_LOCATION_number": 71,
"eval_LOCATION_precision": 0.6976744186046512,
"eval_LOCATION_recall": 0.8450704225352113,
"eval_ORGANIZATION_f1": 0.7439024390243902,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.6161616161616161,
"eval_ORGANIZATION_recall": 0.9384615384615385,
"eval_PERSON_f1": 0.8974358974358974,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.8641975308641975,
"eval_PERSON_recall": 0.9333333333333333,
"eval_QUANTITY_f1": 0.6666666666666666,
"eval_QUANTITY_number": 33,
"eval_QUANTITY_precision": 0.5777777777777777,
"eval_QUANTITY_recall": 0.7878787878787878,
"eval_TIME_f1": 0.8333333333333334,
"eval_TIME_number": 28,
"eval_TIME_precision": 0.78125,
"eval_TIME_recall": 0.8928571428571429,
"eval_loss": 0.1625693291425705,
"eval_overall_accuracy": 0.953443258971872,
"eval_overall_f1": 0.8093385214007783,
"eval_overall_precision": 0.7358490566037735,
"eval_overall_recall": 0.899135446685879,
"eval_runtime": 0.3504,
"eval_samples_per_second": 533.713,
"eval_steps_per_second": 8.562,
"step": 3922
},
{
"epoch": 38.0,
"grad_norm": 1.4891364574432373,
"learning_rate": 3.1e-05,
"loss": 0.0573,
"step": 4028
},
{
"epoch": 38.0,
"eval_LOCATION_f1": 0.8051948051948051,
"eval_LOCATION_number": 71,
"eval_LOCATION_precision": 0.7469879518072289,
"eval_LOCATION_recall": 0.8732394366197183,
"eval_ORGANIZATION_f1": 0.7297297297297298,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.6506024096385542,
"eval_ORGANIZATION_recall": 0.8307692307692308,
"eval_PERSON_f1": 0.8859934853420196,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.8662420382165605,
"eval_PERSON_recall": 0.9066666666666666,
"eval_QUANTITY_f1": 0.7027027027027027,
"eval_QUANTITY_number": 33,
"eval_QUANTITY_precision": 0.6341463414634146,
"eval_QUANTITY_recall": 0.7878787878787878,
"eval_TIME_f1": 0.8524590163934426,
"eval_TIME_number": 28,
"eval_TIME_precision": 0.7878787878787878,
"eval_TIME_recall": 0.9285714285714286,
"eval_loss": 0.1448131501674652,
"eval_overall_accuracy": 0.9570805043646945,
"eval_overall_f1": 0.8172043010752689,
"eval_overall_precision": 0.7657430730478589,
"eval_overall_recall": 0.8760806916426513,
"eval_runtime": 0.3501,
"eval_samples_per_second": 534.187,
"eval_steps_per_second": 8.57,
"step": 4028
},
{
"epoch": 39.0,
"grad_norm": 0.5322253704071045,
"learning_rate": 3.05e-05,
"loss": 0.0561,
"step": 4134
},
{
"epoch": 39.0,
"eval_LOCATION_f1": 0.7870967741935485,
"eval_LOCATION_number": 71,
"eval_LOCATION_precision": 0.7261904761904762,
"eval_LOCATION_recall": 0.8591549295774648,
"eval_ORGANIZATION_f1": 0.7643312101910829,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.6521739130434783,
"eval_ORGANIZATION_recall": 0.9230769230769231,
"eval_PERSON_f1": 0.8938906752411575,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.8633540372670807,
"eval_PERSON_recall": 0.9266666666666666,
"eval_QUANTITY_f1": 0.7297297297297297,
"eval_QUANTITY_number": 33,
"eval_QUANTITY_precision": 0.6585365853658537,
"eval_QUANTITY_recall": 0.8181818181818182,
"eval_TIME_f1": 0.8333333333333334,
"eval_TIME_number": 28,
"eval_TIME_precision": 0.78125,
"eval_TIME_recall": 0.8928571428571429,
"eval_loss": 0.14745843410491943,
"eval_overall_accuracy": 0.9582929194956353,
"eval_overall_f1": 0.8243064729194188,
"eval_overall_precision": 0.7609756097560976,
"eval_overall_recall": 0.899135446685879,
"eval_runtime": 0.3508,
"eval_samples_per_second": 533.023,
"eval_steps_per_second": 8.551,
"step": 4134
},
{
"epoch": 40.0,
"grad_norm": 1.2674453258514404,
"learning_rate": 3e-05,
"loss": 0.0521,
"step": 4240
},
{
"epoch": 40.0,
"eval_LOCATION_f1": 0.8104575163398693,
"eval_LOCATION_number": 71,
"eval_LOCATION_precision": 0.7560975609756098,
"eval_LOCATION_recall": 0.8732394366197183,
"eval_ORGANIZATION_f1": 0.7169811320754718,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.6063829787234043,
"eval_ORGANIZATION_recall": 0.8769230769230769,
"eval_PERSON_f1": 0.8932038834951457,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.8679245283018868,
"eval_PERSON_recall": 0.92,
"eval_QUANTITY_f1": 0.7222222222222221,
"eval_QUANTITY_number": 33,
"eval_QUANTITY_precision": 0.6666666666666666,
"eval_QUANTITY_recall": 0.7878787878787878,
"eval_TIME_f1": 0.806451612903226,
"eval_TIME_number": 28,
"eval_TIME_precision": 0.7352941176470589,
"eval_TIME_recall": 0.8928571428571429,
"eval_loss": 0.14856770634651184,
"eval_overall_accuracy": 0.9587778855480117,
"eval_overall_f1": 0.8158940397350992,
"eval_overall_precision": 0.7549019607843137,
"eval_overall_recall": 0.8876080691642652,
"eval_runtime": 0.3497,
"eval_samples_per_second": 534.717,
"eval_steps_per_second": 8.578,
"step": 4240
},
{
"epoch": 41.0,
"grad_norm": 0.23710742592811584,
"learning_rate": 2.95e-05,
"loss": 0.0526,
"step": 4346
},
{
"epoch": 41.0,
"eval_LOCATION_f1": 0.7792207792207793,
"eval_LOCATION_number": 71,
"eval_LOCATION_precision": 0.7228915662650602,
"eval_LOCATION_recall": 0.8450704225352113,
"eval_ORGANIZATION_f1": 0.7272727272727274,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.6,
"eval_ORGANIZATION_recall": 0.9230769230769231,
"eval_PERSON_f1": 0.8846153846153846,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.8518518518518519,
"eval_PERSON_recall": 0.92,
"eval_QUANTITY_f1": 0.7272727272727273,
"eval_QUANTITY_number": 33,
"eval_QUANTITY_precision": 0.6363636363636364,
"eval_QUANTITY_recall": 0.8484848484848485,
"eval_TIME_f1": 0.8813559322033899,
"eval_TIME_number": 28,
"eval_TIME_precision": 0.8387096774193549,
"eval_TIME_recall": 0.9285714285714286,
"eval_loss": 0.15941469371318817,
"eval_overall_accuracy": 0.9561105722599418,
"eval_overall_f1": 0.8135593220338984,
"eval_overall_precision": 0.7428571428571429,
"eval_overall_recall": 0.899135446685879,
"eval_runtime": 0.3497,
"eval_samples_per_second": 534.713,
"eval_steps_per_second": 8.578,
"step": 4346
},
{
"epoch": 42.0,
"grad_norm": 0.5749427080154419,
"learning_rate": 2.9e-05,
"loss": 0.0505,
"step": 4452
},
{
"epoch": 42.0,
"eval_LOCATION_f1": 0.8533333333333334,
"eval_LOCATION_number": 71,
"eval_LOCATION_precision": 0.810126582278481,
"eval_LOCATION_recall": 0.9014084507042254,
"eval_ORGANIZATION_f1": 0.7297297297297298,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.6506024096385542,
"eval_ORGANIZATION_recall": 0.8307692307692308,
"eval_PERSON_f1": 0.8903225806451613,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.8625,
"eval_PERSON_recall": 0.92,
"eval_QUANTITY_f1": 0.7397260273972603,
"eval_QUANTITY_number": 33,
"eval_QUANTITY_precision": 0.675,
"eval_QUANTITY_recall": 0.8181818181818182,
"eval_TIME_f1": 0.8387096774193549,
"eval_TIME_number": 28,
"eval_TIME_precision": 0.7647058823529411,
"eval_TIME_recall": 0.9285714285714286,
"eval_loss": 0.1528312712907791,
"eval_overall_accuracy": 0.957807953443259,
"eval_overall_f1": 0.8317631224764469,
"eval_overall_precision": 0.7803030303030303,
"eval_overall_recall": 0.8904899135446686,
"eval_runtime": 0.3505,
"eval_samples_per_second": 533.466,
"eval_steps_per_second": 8.558,
"step": 4452
},
{
"epoch": 43.0,
"grad_norm": 0.5371730923652649,
"learning_rate": 2.8499999999999998e-05,
"loss": 0.0497,
"step": 4558
},
{
"epoch": 43.0,
"eval_LOCATION_f1": 0.7721518987341772,
"eval_LOCATION_number": 71,
"eval_LOCATION_precision": 0.7011494252873564,
"eval_LOCATION_recall": 0.8591549295774648,
"eval_ORGANIZATION_f1": 0.7006369426751592,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.5978260869565217,
"eval_ORGANIZATION_recall": 0.8461538461538461,
"eval_PERSON_f1": 0.8903225806451613,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.8625,
"eval_PERSON_recall": 0.92,
"eval_QUANTITY_f1": 0.7297297297297297,
"eval_QUANTITY_number": 33,
"eval_QUANTITY_precision": 0.6585365853658537,
"eval_QUANTITY_recall": 0.8181818181818182,
"eval_TIME_f1": 0.8387096774193549,
"eval_TIME_number": 28,
"eval_TIME_precision": 0.7647058823529411,
"eval_TIME_recall": 0.9285714285714286,
"eval_loss": 0.14798860251903534,
"eval_overall_accuracy": 0.9573229873908826,
"eval_overall_f1": 0.8068331143232589,
"eval_overall_precision": 0.7415458937198067,
"eval_overall_recall": 0.8847262247838616,
"eval_runtime": 0.3497,
"eval_samples_per_second": 534.734,
"eval_steps_per_second": 8.579,
"step": 4558
},
{
"epoch": 44.0,
"grad_norm": 0.9185490608215332,
"learning_rate": 2.8000000000000003e-05,
"loss": 0.0525,
"step": 4664
},
{
"epoch": 44.0,
"eval_LOCATION_f1": 0.8205128205128205,
"eval_LOCATION_number": 71,
"eval_LOCATION_precision": 0.7529411764705882,
"eval_LOCATION_recall": 0.9014084507042254,
"eval_ORGANIZATION_f1": 0.7320261437908497,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.6363636363636364,
"eval_ORGANIZATION_recall": 0.8615384615384616,
"eval_PERSON_f1": 0.90032154340836,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.8695652173913043,
"eval_PERSON_recall": 0.9333333333333333,
"eval_QUANTITY_f1": 0.6933333333333334,
"eval_QUANTITY_number": 33,
"eval_QUANTITY_precision": 0.6190476190476191,
"eval_QUANTITY_recall": 0.7878787878787878,
"eval_TIME_f1": 0.8387096774193549,
"eval_TIME_number": 28,
"eval_TIME_precision": 0.7647058823529411,
"eval_TIME_recall": 0.9285714285714286,
"eval_loss": 0.15042471885681152,
"eval_overall_accuracy": 0.9602327837051406,
"eval_overall_f1": 0.8243064729194188,
"eval_overall_precision": 0.7609756097560976,
"eval_overall_recall": 0.899135446685879,
"eval_runtime": 0.3507,
"eval_samples_per_second": 533.267,
"eval_steps_per_second": 8.555,
"step": 4664
},
{
"epoch": 45.0,
"grad_norm": 1.4481260776519775,
"learning_rate": 2.7500000000000004e-05,
"loss": 0.0486,
"step": 4770
},
{
"epoch": 45.0,
"eval_LOCATION_f1": 0.8289473684210527,
"eval_LOCATION_number": 71,
"eval_LOCATION_precision": 0.7777777777777778,
"eval_LOCATION_recall": 0.8873239436619719,
"eval_ORGANIZATION_f1": 0.7236842105263158,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.632183908045977,
"eval_ORGANIZATION_recall": 0.8461538461538461,
"eval_PERSON_f1": 0.8996763754045306,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.8742138364779874,
"eval_PERSON_recall": 0.9266666666666666,
"eval_QUANTITY_f1": 0.7671232876712328,
"eval_QUANTITY_number": 33,
"eval_QUANTITY_precision": 0.7,
"eval_QUANTITY_recall": 0.8484848484848485,
"eval_TIME_f1": 0.896551724137931,
"eval_TIME_number": 28,
"eval_TIME_precision": 0.8666666666666667,
"eval_TIME_recall": 0.9285714285714286,
"eval_loss": 0.14780230820178986,
"eval_overall_accuracy": 0.9614451988360815,
"eval_overall_f1": 0.8360215053763441,
"eval_overall_precision": 0.783375314861461,
"eval_overall_recall": 0.8962536023054755,
"eval_runtime": 0.3493,
"eval_samples_per_second": 535.387,
"eval_steps_per_second": 8.589,
"step": 4770
},
{
"epoch": 46.0,
"grad_norm": 0.6384713053703308,
"learning_rate": 2.7000000000000002e-05,
"loss": 0.0454,
"step": 4876
},
{
"epoch": 46.0,
"eval_LOCATION_f1": 0.8311688311688312,
"eval_LOCATION_number": 71,
"eval_LOCATION_precision": 0.7710843373493976,
"eval_LOCATION_recall": 0.9014084507042254,
"eval_ORGANIZATION_f1": 0.7272727272727273,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.6292134831460674,
"eval_ORGANIZATION_recall": 0.8615384615384616,
"eval_PERSON_f1": 0.9155844155844156,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.8924050632911392,
"eval_PERSON_recall": 0.94,
"eval_QUANTITY_f1": 0.732394366197183,
"eval_QUANTITY_number": 33,
"eval_QUANTITY_precision": 0.6842105263157895,
"eval_QUANTITY_recall": 0.7878787878787878,
"eval_TIME_f1": 0.819672131147541,
"eval_TIME_number": 28,
"eval_TIME_precision": 0.7575757575757576,
"eval_TIME_recall": 0.8928571428571429,
"eval_loss": 0.14535315334796906,
"eval_overall_accuracy": 0.9626576139670223,
"eval_overall_f1": 0.8342245989304813,
"eval_overall_precision": 0.7780548628428927,
"eval_overall_recall": 0.899135446685879,
"eval_runtime": 0.3518,
"eval_samples_per_second": 531.582,
"eval_steps_per_second": 8.528,
"step": 4876
},
{
"epoch": 47.0,
"grad_norm": 3.3819124698638916,
"learning_rate": 2.6500000000000004e-05,
"loss": 0.049,
"step": 4982
},
{
"epoch": 47.0,
"eval_LOCATION_f1": 0.7922077922077921,
"eval_LOCATION_number": 71,
"eval_LOCATION_precision": 0.7349397590361446,
"eval_LOCATION_recall": 0.8591549295774648,
"eval_ORGANIZATION_f1": 0.7108433734939759,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.5841584158415841,
"eval_ORGANIZATION_recall": 0.9076923076923077,
"eval_PERSON_f1": 0.896774193548387,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.86875,
"eval_PERSON_recall": 0.9266666666666666,
"eval_QUANTITY_f1": 0.7500000000000001,
"eval_QUANTITY_number": 33,
"eval_QUANTITY_precision": 0.6923076923076923,
"eval_QUANTITY_recall": 0.8181818181818182,
"eval_TIME_f1": 0.8666666666666666,
"eval_TIME_number": 28,
"eval_TIME_precision": 0.8125,
"eval_TIME_recall": 0.9285714285714286,
"eval_loss": 0.15948139131069183,
"eval_overall_accuracy": 0.9551406401551892,
"eval_overall_f1": 0.8188976377952757,
"eval_overall_precision": 0.7518072289156627,
"eval_overall_recall": 0.899135446685879,
"eval_runtime": 0.3491,
"eval_samples_per_second": 535.655,
"eval_steps_per_second": 8.593,
"step": 4982
},
{
"epoch": 48.0,
"grad_norm": 0.692154049873352,
"learning_rate": 2.6000000000000002e-05,
"loss": 0.0467,
"step": 5088
},
{
"epoch": 48.0,
"eval_LOCATION_f1": 0.8076923076923077,
"eval_LOCATION_number": 71,
"eval_LOCATION_precision": 0.7411764705882353,
"eval_LOCATION_recall": 0.8873239436619719,
"eval_ORGANIZATION_f1": 0.7272727272727273,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.6292134831460674,
"eval_ORGANIZATION_recall": 0.8615384615384616,
"eval_PERSON_f1": 0.9090909090909091,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.8860759493670886,
"eval_PERSON_recall": 0.9333333333333333,
"eval_QUANTITY_f1": 0.7200000000000001,
"eval_QUANTITY_number": 33,
"eval_QUANTITY_precision": 0.6428571428571429,
"eval_QUANTITY_recall": 0.8181818181818182,
"eval_TIME_f1": 0.8275862068965518,
"eval_TIME_number": 28,
"eval_TIME_precision": 0.8,
"eval_TIME_recall": 0.8571428571428571,
"eval_loss": 0.14814431965351105,
"eval_overall_accuracy": 0.9587778855480117,
"eval_overall_f1": 0.8255659121171772,
"eval_overall_precision": 0.7673267326732673,
"eval_overall_recall": 0.8933717579250721,
"eval_runtime": 0.35,
"eval_samples_per_second": 534.257,
"eval_steps_per_second": 8.571,
"step": 5088
},
{
"epoch": 49.0,
"grad_norm": 0.21525277197360992,
"learning_rate": 2.5500000000000003e-05,
"loss": 0.0458,
"step": 5194
},
{
"epoch": 49.0,
"eval_LOCATION_f1": 0.8104575163398693,
"eval_LOCATION_number": 71,
"eval_LOCATION_precision": 0.7560975609756098,
"eval_LOCATION_recall": 0.8732394366197183,
"eval_ORGANIZATION_f1": 0.7450980392156863,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.6477272727272727,
"eval_ORGANIZATION_recall": 0.8769230769230769,
"eval_PERSON_f1": 0.9032258064516129,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.875,
"eval_PERSON_recall": 0.9333333333333333,
"eval_QUANTITY_f1": 0.7027027027027027,
"eval_QUANTITY_number": 33,
"eval_QUANTITY_precision": 0.6341463414634146,
"eval_QUANTITY_recall": 0.7878787878787878,
"eval_TIME_f1": 0.8666666666666666,
"eval_TIME_number": 28,
"eval_TIME_precision": 0.8125,
"eval_TIME_recall": 0.9285714285714286,
"eval_loss": 0.15645316243171692,
"eval_overall_accuracy": 0.9592628516003879,
"eval_overall_f1": 0.8293333333333333,
"eval_overall_precision": 0.771712158808933,
"eval_overall_recall": 0.8962536023054755,
"eval_runtime": 0.3516,
"eval_samples_per_second": 531.919,
"eval_steps_per_second": 8.533,
"step": 5194
},
{
"epoch": 50.0,
"grad_norm": 0.6371389031410217,
"learning_rate": 2.5e-05,
"loss": 0.0435,
"step": 5300
},
{
"epoch": 50.0,
"eval_LOCATION_f1": 0.8258064516129031,
"eval_LOCATION_number": 71,
"eval_LOCATION_precision": 0.7619047619047619,
"eval_LOCATION_recall": 0.9014084507042254,
"eval_ORGANIZATION_f1": 0.7105263157894737,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.6206896551724138,
"eval_ORGANIZATION_recall": 0.8307692307692308,
"eval_PERSON_f1": 0.896774193548387,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.86875,
"eval_PERSON_recall": 0.9266666666666666,
"eval_QUANTITY_f1": 0.7297297297297297,
"eval_QUANTITY_number": 33,
"eval_QUANTITY_precision": 0.6585365853658537,
"eval_QUANTITY_recall": 0.8181818181818182,
"eval_TIME_f1": 0.8813559322033899,
"eval_TIME_number": 28,
"eval_TIME_precision": 0.8387096774193549,
"eval_TIME_recall": 0.9285714285714286,
"eval_loss": 0.1588226705789566,
"eval_overall_accuracy": 0.9582929194956353,
"eval_overall_f1": 0.8266666666666667,
"eval_overall_precision": 0.7692307692307693,
"eval_overall_recall": 0.8933717579250721,
"eval_runtime": 0.3498,
"eval_samples_per_second": 534.657,
"eval_steps_per_second": 8.577,
"step": 5300
},
{
"epoch": 51.0,
"grad_norm": 0.3768903613090515,
"learning_rate": 2.45e-05,
"loss": 0.0461,
"step": 5406
},
{
"epoch": 51.0,
"eval_LOCATION_f1": 0.7974683544303797,
"eval_LOCATION_number": 71,
"eval_LOCATION_precision": 0.7241379310344828,
"eval_LOCATION_recall": 0.8873239436619719,
"eval_ORGANIZATION_f1": 0.7044025157232704,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.5957446808510638,
"eval_ORGANIZATION_recall": 0.8615384615384616,
"eval_PERSON_f1": 0.8903225806451613,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.8625,
"eval_PERSON_recall": 0.92,
"eval_QUANTITY_f1": 0.7200000000000001,
"eval_QUANTITY_number": 33,
"eval_QUANTITY_precision": 0.6428571428571429,
"eval_QUANTITY_recall": 0.8181818181818182,
"eval_TIME_f1": 0.8524590163934426,
"eval_TIME_number": 28,
"eval_TIME_precision": 0.7878787878787878,
"eval_TIME_recall": 0.9285714285714286,
"eval_loss": 0.16307169198989868,
"eval_overall_accuracy": 0.9558680892337537,
"eval_overall_f1": 0.8125819134993448,
"eval_overall_precision": 0.7451923076923077,
"eval_overall_recall": 0.8933717579250721,
"eval_runtime": 0.3494,
"eval_samples_per_second": 535.279,
"eval_steps_per_second": 8.587,
"step": 5406
},
{
"epoch": 52.0,
"grad_norm": 0.7790448665618896,
"learning_rate": 2.4e-05,
"loss": 0.0424,
"step": 5512
},
{
"epoch": 52.0,
"eval_LOCATION_f1": 0.8051948051948051,
"eval_LOCATION_number": 71,
"eval_LOCATION_precision": 0.7469879518072289,
"eval_LOCATION_recall": 0.8732394366197183,
"eval_ORGANIZATION_f1": 0.7215189873417722,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.6129032258064516,
"eval_ORGANIZATION_recall": 0.8769230769230769,
"eval_PERSON_f1": 0.9155844155844156,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.8924050632911392,
"eval_PERSON_recall": 0.94,
"eval_QUANTITY_f1": 0.7200000000000001,
"eval_QUANTITY_number": 33,
"eval_QUANTITY_precision": 0.6428571428571429,
"eval_QUANTITY_recall": 0.8181818181818182,
"eval_TIME_f1": 0.8813559322033899,
"eval_TIME_number": 28,
"eval_TIME_precision": 0.8387096774193549,
"eval_TIME_recall": 0.9285714285714286,
"eval_loss": 0.17204023897647858,
"eval_overall_accuracy": 0.9565955383123181,
"eval_overall_f1": 0.8302387267904509,
"eval_overall_precision": 0.769041769041769,
"eval_overall_recall": 0.9020172910662824,
"eval_runtime": 0.3508,
"eval_samples_per_second": 533.066,
"eval_steps_per_second": 8.552,
"step": 5512
},
{
"epoch": 53.0,
"grad_norm": 0.5764625072479248,
"learning_rate": 2.35e-05,
"loss": 0.0436,
"step": 5618
},
{
"epoch": 53.0,
"eval_LOCATION_f1": 0.8025477707006369,
"eval_LOCATION_number": 71,
"eval_LOCATION_precision": 0.7325581395348837,
"eval_LOCATION_recall": 0.8873239436619719,
"eval_ORGANIZATION_f1": 0.7142857142857142,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.5825242718446602,
"eval_ORGANIZATION_recall": 0.9230769230769231,
"eval_PERSON_f1": 0.9102564102564102,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.8765432098765432,
"eval_PERSON_recall": 0.9466666666666667,
"eval_QUANTITY_f1": 0.7012987012987013,
"eval_QUANTITY_number": 33,
"eval_QUANTITY_precision": 0.6136363636363636,
"eval_QUANTITY_recall": 0.8181818181818182,
"eval_TIME_f1": 0.8387096774193549,
"eval_TIME_number": 28,
"eval_TIME_precision": 0.7647058823529411,
"eval_TIME_recall": 0.9285714285714286,
"eval_loss": 0.1814979910850525,
"eval_overall_accuracy": 0.9529582929194956,
"eval_overall_f1": 0.8195876288659794,
"eval_overall_precision": 0.7412587412587412,
"eval_overall_recall": 0.9164265129682997,
"eval_runtime": 0.3501,
"eval_samples_per_second": 534.111,
"eval_steps_per_second": 8.569,
"step": 5618
},
{
"epoch": 54.0,
"grad_norm": 0.7614324688911438,
"learning_rate": 2.3000000000000003e-05,
"loss": 0.0414,
"step": 5724
},
{
"epoch": 54.0,
"eval_LOCATION_f1": 0.823529411764706,
"eval_LOCATION_number": 71,
"eval_LOCATION_precision": 0.7682926829268293,
"eval_LOCATION_recall": 0.8873239436619719,
"eval_ORGANIZATION_f1": 0.7354838709677419,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.6333333333333333,
"eval_ORGANIZATION_recall": 0.8769230769230769,
"eval_PERSON_f1": 0.8903225806451613,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.8625,
"eval_PERSON_recall": 0.92,
"eval_QUANTITY_f1": 0.7500000000000001,
"eval_QUANTITY_number": 33,
"eval_QUANTITY_precision": 0.6923076923076923,
"eval_QUANTITY_recall": 0.8181818181818182,
"eval_TIME_f1": 0.896551724137931,
"eval_TIME_number": 28,
"eval_TIME_precision": 0.8666666666666667,
"eval_TIME_recall": 0.9285714285714286,
"eval_loss": 0.1521797627210617,
"eval_overall_accuracy": 0.9602327837051406,
"eval_overall_f1": 0.8315508021390374,
"eval_overall_precision": 0.7755610972568578,
"eval_overall_recall": 0.8962536023054755,
"eval_runtime": 0.3503,
"eval_samples_per_second": 533.843,
"eval_steps_per_second": 8.564,
"step": 5724
},
{
"epoch": 55.0,
"grad_norm": 0.6456512212753296,
"learning_rate": 2.25e-05,
"loss": 0.0413,
"step": 5830
},
{
"epoch": 55.0,
"eval_LOCATION_f1": 0.8211920529801324,
"eval_LOCATION_number": 71,
"eval_LOCATION_precision": 0.775,
"eval_LOCATION_recall": 0.8732394366197183,
"eval_ORGANIZATION_f1": 0.7450980392156863,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.6477272727272727,
"eval_ORGANIZATION_recall": 0.8769230769230769,
"eval_PERSON_f1": 0.9019607843137256,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.8846153846153846,
"eval_PERSON_recall": 0.92,
"eval_QUANTITY_f1": 0.7297297297297297,
"eval_QUANTITY_number": 33,
"eval_QUANTITY_precision": 0.6585365853658537,
"eval_QUANTITY_recall": 0.8181818181818182,
"eval_TIME_f1": 0.8771929824561403,
"eval_TIME_number": 28,
"eval_TIME_precision": 0.8620689655172413,
"eval_TIME_recall": 0.8928571428571429,
"eval_loss": 0.15478459000587463,
"eval_overall_accuracy": 0.9585354025218235,
"eval_overall_f1": 0.834008097165992,
"eval_overall_precision": 0.7842639593908629,
"eval_overall_recall": 0.8904899135446686,
"eval_runtime": 0.3506,
"eval_samples_per_second": 533.435,
"eval_steps_per_second": 8.558,
"step": 5830
},
{
"epoch": 56.0,
"grad_norm": 1.6711740493774414,
"learning_rate": 2.2000000000000003e-05,
"loss": 0.04,
"step": 5936
},
{
"epoch": 56.0,
"eval_LOCATION_f1": 0.8496732026143791,
"eval_LOCATION_number": 71,
"eval_LOCATION_precision": 0.7926829268292683,
"eval_LOCATION_recall": 0.9154929577464789,
"eval_ORGANIZATION_f1": 0.728476821192053,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.6395348837209303,
"eval_ORGANIZATION_recall": 0.8461538461538461,
"eval_PERSON_f1": 0.896774193548387,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.86875,
"eval_PERSON_recall": 0.9266666666666666,
"eval_QUANTITY_f1": 0.7397260273972603,
"eval_QUANTITY_number": 33,
"eval_QUANTITY_precision": 0.675,
"eval_QUANTITY_recall": 0.8181818181818182,
"eval_TIME_f1": 0.8474576271186439,
"eval_TIME_number": 28,
"eval_TIME_precision": 0.8064516129032258,
"eval_TIME_recall": 0.8928571428571429,
"eval_loss": 0.1626283824443817,
"eval_overall_accuracy": 0.9592628516003879,
"eval_overall_f1": 0.8337801608579088,
"eval_overall_precision": 0.7794486215538847,
"eval_overall_recall": 0.8962536023054755,
"eval_runtime": 0.35,
"eval_samples_per_second": 534.232,
"eval_steps_per_second": 8.571,
"step": 5936
},
{
"epoch": 57.0,
"grad_norm": 0.47535088658332825,
"learning_rate": 2.15e-05,
"loss": 0.0416,
"step": 6042
},
{
"epoch": 57.0,
"eval_LOCATION_f1": 0.823529411764706,
"eval_LOCATION_number": 71,
"eval_LOCATION_precision": 0.7682926829268293,
"eval_LOCATION_recall": 0.8873239436619719,
"eval_ORGANIZATION_f1": 0.7432432432432433,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.6626506024096386,
"eval_ORGANIZATION_recall": 0.8461538461538461,
"eval_PERSON_f1": 0.8938906752411575,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.8633540372670807,
"eval_PERSON_recall": 0.9266666666666666,
"eval_QUANTITY_f1": 0.6923076923076923,
"eval_QUANTITY_number": 33,
"eval_QUANTITY_precision": 0.6,
"eval_QUANTITY_recall": 0.8181818181818182,
"eval_TIME_f1": 0.912280701754386,
"eval_TIME_number": 28,
"eval_TIME_precision": 0.896551724137931,
"eval_TIME_recall": 0.9285714285714286,
"eval_loss": 0.16426201164722443,
"eval_overall_accuracy": 0.9580504364694471,
"eval_overall_f1": 0.8299866131191432,
"eval_overall_precision": 0.775,
"eval_overall_recall": 0.8933717579250721,
"eval_runtime": 0.3497,
"eval_samples_per_second": 534.703,
"eval_steps_per_second": 8.578,
"step": 6042
},
{
"epoch": 58.0,
"grad_norm": 0.42809298634529114,
"learning_rate": 2.1e-05,
"loss": 0.0409,
"step": 6148
},
{
"epoch": 58.0,
"eval_LOCATION_f1": 0.8421052631578947,
"eval_LOCATION_number": 71,
"eval_LOCATION_precision": 0.7901234567901234,
"eval_LOCATION_recall": 0.9014084507042254,
"eval_ORGANIZATION_f1": 0.7272727272727273,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.6292134831460674,
"eval_ORGANIZATION_recall": 0.8615384615384616,
"eval_PERSON_f1": 0.8917197452229298,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.8536585365853658,
"eval_PERSON_recall": 0.9333333333333333,
"eval_QUANTITY_f1": 0.6835443037974683,
"eval_QUANTITY_number": 33,
"eval_QUANTITY_precision": 0.5869565217391305,
"eval_QUANTITY_recall": 0.8181818181818182,
"eval_TIME_f1": 0.896551724137931,
"eval_TIME_number": 28,
"eval_TIME_precision": 0.8666666666666667,
"eval_TIME_recall": 0.9285714285714286,
"eval_loss": 0.15997961163520813,
"eval_overall_accuracy": 0.9580504364694471,
"eval_overall_f1": 0.8269484808454426,
"eval_overall_precision": 0.7634146341463415,
"eval_overall_recall": 0.9020172910662824,
"eval_runtime": 0.3495,
"eval_samples_per_second": 535.11,
"eval_steps_per_second": 8.585,
"step": 6148
},
{
"epoch": 59.0,
"grad_norm": 1.3752318620681763,
"learning_rate": 2.05e-05,
"loss": 0.0392,
"step": 6254
},
{
"epoch": 59.0,
"eval_LOCATION_f1": 0.8,
"eval_LOCATION_number": 71,
"eval_LOCATION_precision": 0.7380952380952381,
"eval_LOCATION_recall": 0.8732394366197183,
"eval_ORGANIZATION_f1": 0.7297297297297298,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.6506024096385542,
"eval_ORGANIZATION_recall": 0.8307692307692308,
"eval_PERSON_f1": 0.8831168831168831,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.8607594936708861,
"eval_PERSON_recall": 0.9066666666666666,
"eval_QUANTITY_f1": 0.7397260273972603,
"eval_QUANTITY_number": 33,
"eval_QUANTITY_precision": 0.675,
"eval_QUANTITY_recall": 0.8181818181818182,
"eval_TIME_f1": 0.912280701754386,
"eval_TIME_number": 28,
"eval_TIME_precision": 0.896551724137931,
"eval_TIME_recall": 0.9285714285714286,
"eval_loss": 0.1547561138868332,
"eval_overall_accuracy": 0.9599903006789525,
"eval_overall_f1": 0.8232118758434548,
"eval_overall_precision": 0.7741116751269036,
"eval_overall_recall": 0.8789625360230547,
"eval_runtime": 0.3499,
"eval_samples_per_second": 534.45,
"eval_steps_per_second": 8.574,
"step": 6254
},
{
"epoch": 60.0,
"grad_norm": 0.807634711265564,
"learning_rate": 2e-05,
"loss": 0.0374,
"step": 6360
},
{
"epoch": 60.0,
"eval_LOCATION_f1": 0.8476821192052981,
"eval_LOCATION_number": 71,
"eval_LOCATION_precision": 0.8,
"eval_LOCATION_recall": 0.9014084507042254,
"eval_ORGANIZATION_f1": 0.7417218543046358,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.6511627906976745,
"eval_ORGANIZATION_recall": 0.8615384615384616,
"eval_PERSON_f1": 0.8932038834951457,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.8679245283018868,
"eval_PERSON_recall": 0.92,
"eval_QUANTITY_f1": 0.7567567567567567,
"eval_QUANTITY_number": 33,
"eval_QUANTITY_precision": 0.6829268292682927,
"eval_QUANTITY_recall": 0.8484848484848485,
"eval_TIME_f1": 0.8928571428571429,
"eval_TIME_number": 28,
"eval_TIME_precision": 0.8928571428571429,
"eval_TIME_recall": 0.8928571428571429,
"eval_loss": 0.15809109807014465,
"eval_overall_accuracy": 0.9609602327837051,
"eval_overall_f1": 0.8394062078272604,
"eval_overall_precision": 0.7893401015228426,
"eval_overall_recall": 0.8962536023054755,
"eval_runtime": 0.3505,
"eval_samples_per_second": 533.596,
"eval_steps_per_second": 8.56,
"step": 6360
},
{
"epoch": 61.0,
"grad_norm": 0.2931790351867676,
"learning_rate": 1.9500000000000003e-05,
"loss": 0.0365,
"step": 6466
},
{
"epoch": 61.0,
"eval_LOCATION_f1": 0.8421052631578947,
"eval_LOCATION_number": 71,
"eval_LOCATION_precision": 0.7901234567901234,
"eval_LOCATION_recall": 0.9014084507042254,
"eval_ORGANIZATION_f1": 0.7515923566878981,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.6413043478260869,
"eval_ORGANIZATION_recall": 0.9076923076923077,
"eval_PERSON_f1": 0.896774193548387,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.86875,
"eval_PERSON_recall": 0.9266666666666666,
"eval_QUANTITY_f1": 0.7397260273972603,
"eval_QUANTITY_number": 33,
"eval_QUANTITY_precision": 0.675,
"eval_QUANTITY_recall": 0.8181818181818182,
"eval_TIME_f1": 0.912280701754386,
"eval_TIME_number": 28,
"eval_TIME_precision": 0.896551724137931,
"eval_TIME_recall": 0.9285714285714286,
"eval_loss": 0.16991622745990753,
"eval_overall_accuracy": 0.9612027158098934,
"eval_overall_f1": 0.8411214953271029,
"eval_overall_precision": 0.7835820895522388,
"eval_overall_recall": 0.9077809798270894,
"eval_runtime": 0.3512,
"eval_samples_per_second": 532.476,
"eval_steps_per_second": 8.542,
"step": 6466
},
{
"epoch": 62.0,
"grad_norm": 0.6080542802810669,
"learning_rate": 1.9e-05,
"loss": 0.0367,
"step": 6572
},
{
"epoch": 62.0,
"eval_LOCATION_f1": 0.8441558441558441,
"eval_LOCATION_number": 71,
"eval_LOCATION_precision": 0.7831325301204819,
"eval_LOCATION_recall": 0.9154929577464789,
"eval_ORGANIZATION_f1": 0.738255033557047,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.6547619047619048,
"eval_ORGANIZATION_recall": 0.8461538461538461,
"eval_PERSON_f1": 0.8859934853420196,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.8662420382165605,
"eval_PERSON_recall": 0.9066666666666666,
"eval_QUANTITY_f1": 0.7297297297297297,
"eval_QUANTITY_number": 33,
"eval_QUANTITY_precision": 0.6585365853658537,
"eval_QUANTITY_recall": 0.8181818181818182,
"eval_TIME_f1": 0.8813559322033899,
"eval_TIME_number": 28,
"eval_TIME_precision": 0.8387096774193549,
"eval_TIME_recall": 0.9285714285714286,
"eval_loss": 0.1723637729883194,
"eval_overall_accuracy": 0.9580504364694471,
"eval_overall_f1": 0.8317631224764469,
"eval_overall_precision": 0.7803030303030303,
"eval_overall_recall": 0.8904899135446686,
"eval_runtime": 0.3492,
"eval_samples_per_second": 535.569,
"eval_steps_per_second": 8.592,
"step": 6572
},
{
"epoch": 63.0,
"grad_norm": 0.6744797825813293,
"learning_rate": 1.85e-05,
"loss": 0.0365,
"step": 6678
},
{
"epoch": 63.0,
"eval_LOCATION_f1": 0.8289473684210527,
"eval_LOCATION_number": 71,
"eval_LOCATION_precision": 0.7777777777777778,
"eval_LOCATION_recall": 0.8873239436619719,
"eval_ORGANIZATION_f1": 0.7169811320754718,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.6063829787234043,
"eval_ORGANIZATION_recall": 0.8769230769230769,
"eval_PERSON_f1": 0.8802588996763754,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.8553459119496856,
"eval_PERSON_recall": 0.9066666666666666,
"eval_QUANTITY_f1": 0.7671232876712328,
"eval_QUANTITY_number": 33,
"eval_QUANTITY_precision": 0.7,
"eval_QUANTITY_recall": 0.8484848484848485,
"eval_TIME_f1": 0.8813559322033899,
"eval_TIME_number": 28,
"eval_TIME_precision": 0.8387096774193549,
"eval_TIME_recall": 0.9285714285714286,
"eval_loss": 0.16163378953933716,
"eval_overall_accuracy": 0.9585354025218235,
"eval_overall_f1": 0.8244680851063829,
"eval_overall_precision": 0.7654320987654321,
"eval_overall_recall": 0.8933717579250721,
"eval_runtime": 0.3516,
"eval_samples_per_second": 531.858,
"eval_steps_per_second": 8.532,
"step": 6678
},
{
"epoch": 64.0,
"grad_norm": 0.468826025724411,
"learning_rate": 1.8e-05,
"loss": 0.0355,
"step": 6784
},
{
"epoch": 64.0,
"eval_LOCATION_f1": 0.8129032258064516,
"eval_LOCATION_number": 71,
"eval_LOCATION_precision": 0.75,
"eval_LOCATION_recall": 0.8873239436619719,
"eval_ORGANIZATION_f1": 0.7534246575342466,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.6790123456790124,
"eval_ORGANIZATION_recall": 0.8461538461538461,
"eval_PERSON_f1": 0.8817891373801918,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.8466257668711656,
"eval_PERSON_recall": 0.92,
"eval_QUANTITY_f1": 0.7012987012987013,
"eval_QUANTITY_number": 33,
"eval_QUANTITY_precision": 0.6136363636363636,
"eval_QUANTITY_recall": 0.8181818181818182,
"eval_TIME_f1": 0.8813559322033899,
"eval_TIME_number": 28,
"eval_TIME_precision": 0.8387096774193549,
"eval_TIME_recall": 0.9285714285714286,
"eval_loss": 0.17165683209896088,
"eval_overall_accuracy": 0.9582929194956353,
"eval_overall_f1": 0.824,
"eval_overall_precision": 0.7667493796526055,
"eval_overall_recall": 0.8904899135446686,
"eval_runtime": 0.3518,
"eval_samples_per_second": 531.527,
"eval_steps_per_second": 8.527,
"step": 6784
},
{
"epoch": 65.0,
"grad_norm": 1.1759960651397705,
"learning_rate": 1.75e-05,
"loss": 0.0372,
"step": 6890
},
{
"epoch": 65.0,
"eval_LOCATION_f1": 0.8258064516129031,
"eval_LOCATION_number": 71,
"eval_LOCATION_precision": 0.7619047619047619,
"eval_LOCATION_recall": 0.9014084507042254,
"eval_ORGANIZATION_f1": 0.7320261437908497,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.6363636363636364,
"eval_ORGANIZATION_recall": 0.8615384615384616,
"eval_PERSON_f1": 0.8938906752411575,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.8633540372670807,
"eval_PERSON_recall": 0.9266666666666666,
"eval_QUANTITY_f1": 0.7500000000000001,
"eval_QUANTITY_number": 33,
"eval_QUANTITY_precision": 0.6923076923076923,
"eval_QUANTITY_recall": 0.8181818181818182,
"eval_TIME_f1": 0.8666666666666666,
"eval_TIME_number": 28,
"eval_TIME_precision": 0.8125,
"eval_TIME_recall": 0.9285714285714286,
"eval_loss": 0.16856727004051208,
"eval_overall_accuracy": 0.9590203685741998,
"eval_overall_f1": 0.8308921438082557,
"eval_overall_precision": 0.7722772277227723,
"eval_overall_recall": 0.899135446685879,
"eval_runtime": 0.3518,
"eval_samples_per_second": 531.563,
"eval_steps_per_second": 8.528,
"step": 6890
},
{
"epoch": 66.0,
"grad_norm": 0.6541854739189148,
"learning_rate": 1.7000000000000003e-05,
"loss": 0.0362,
"step": 6996
},
{
"epoch": 66.0,
"eval_LOCATION_f1": 0.8104575163398693,
"eval_LOCATION_number": 71,
"eval_LOCATION_precision": 0.7560975609756098,
"eval_LOCATION_recall": 0.8732394366197183,
"eval_ORGANIZATION_f1": 0.728395061728395,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.6082474226804123,
"eval_ORGANIZATION_recall": 0.9076923076923077,
"eval_PERSON_f1": 0.8945686900958466,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.8588957055214724,
"eval_PERSON_recall": 0.9333333333333333,
"eval_QUANTITY_f1": 0.7200000000000001,
"eval_QUANTITY_number": 33,
"eval_QUANTITY_precision": 0.6428571428571429,
"eval_QUANTITY_recall": 0.8181818181818182,
"eval_TIME_f1": 0.8813559322033899,
"eval_TIME_number": 28,
"eval_TIME_precision": 0.8387096774193549,
"eval_TIME_recall": 0.9285714285714286,
"eval_loss": 0.18290750682353973,
"eval_overall_accuracy": 0.9561105722599418,
"eval_overall_f1": 0.8241469816272966,
"eval_overall_precision": 0.7566265060240964,
"eval_overall_recall": 0.9048991354466859,
"eval_runtime": 0.3503,
"eval_samples_per_second": 533.882,
"eval_steps_per_second": 8.565,
"step": 6996
},
{
"epoch": 67.0,
"grad_norm": 0.5697064995765686,
"learning_rate": 1.65e-05,
"loss": 0.0333,
"step": 7102
},
{
"epoch": 67.0,
"eval_LOCATION_f1": 0.823529411764706,
"eval_LOCATION_number": 71,
"eval_LOCATION_precision": 0.7682926829268293,
"eval_LOCATION_recall": 0.8873239436619719,
"eval_ORGANIZATION_f1": 0.7388535031847134,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.6304347826086957,
"eval_ORGANIZATION_recall": 0.8923076923076924,
"eval_PERSON_f1": 0.8996763754045306,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.8742138364779874,
"eval_PERSON_recall": 0.9266666666666666,
"eval_QUANTITY_f1": 0.7500000000000001,
"eval_QUANTITY_number": 33,
"eval_QUANTITY_precision": 0.6923076923076923,
"eval_QUANTITY_recall": 0.8181818181818182,
"eval_TIME_f1": 0.8474576271186439,
"eval_TIME_number": 28,
"eval_TIME_precision": 0.8064516129032258,
"eval_TIME_recall": 0.8928571428571429,
"eval_loss": 0.17202883958816528,
"eval_overall_accuracy": 0.9592628516003879,
"eval_overall_f1": 0.8320000000000001,
"eval_overall_precision": 0.7741935483870968,
"eval_overall_recall": 0.899135446685879,
"eval_runtime": 0.3506,
"eval_samples_per_second": 533.421,
"eval_steps_per_second": 8.558,
"step": 7102
},
{
"epoch": 68.0,
"grad_norm": 0.7047253251075745,
"learning_rate": 1.6000000000000003e-05,
"loss": 0.033,
"step": 7208
},
{
"epoch": 68.0,
"eval_LOCATION_f1": 0.8258064516129031,
"eval_LOCATION_number": 71,
"eval_LOCATION_precision": 0.7619047619047619,
"eval_LOCATION_recall": 0.9014084507042254,
"eval_ORGANIZATION_f1": 0.7307692307692307,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.6263736263736264,
"eval_ORGANIZATION_recall": 0.8769230769230769,
"eval_PERSON_f1": 0.8910256410256411,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.8580246913580247,
"eval_PERSON_recall": 0.9266666666666666,
"eval_QUANTITY_f1": 0.7397260273972603,
"eval_QUANTITY_number": 33,
"eval_QUANTITY_precision": 0.675,
"eval_QUANTITY_recall": 0.8181818181818182,
"eval_TIME_f1": 0.912280701754386,
"eval_TIME_number": 28,
"eval_TIME_precision": 0.896551724137931,
"eval_TIME_recall": 0.9285714285714286,
"eval_loss": 0.16683901846408844,
"eval_overall_accuracy": 0.9585354025218235,
"eval_overall_f1": 0.8313413014608233,
"eval_overall_precision": 0.770935960591133,
"eval_overall_recall": 0.9020172910662824,
"eval_runtime": 0.3497,
"eval_samples_per_second": 534.689,
"eval_steps_per_second": 8.578,
"step": 7208
},
{
"epoch": 69.0,
"grad_norm": 0.8004153370857239,
"learning_rate": 1.55e-05,
"loss": 0.0333,
"step": 7314
},
{
"epoch": 69.0,
"eval_LOCATION_f1": 0.8441558441558441,
"eval_LOCATION_number": 71,
"eval_LOCATION_precision": 0.7831325301204819,
"eval_LOCATION_recall": 0.9154929577464789,
"eval_ORGANIZATION_f1": 0.7261146496815286,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.6195652173913043,
"eval_ORGANIZATION_recall": 0.8769230769230769,
"eval_PERSON_f1": 0.896774193548387,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.86875,
"eval_PERSON_recall": 0.9266666666666666,
"eval_QUANTITY_f1": 0.7500000000000001,
"eval_QUANTITY_number": 33,
"eval_QUANTITY_precision": 0.6923076923076923,
"eval_QUANTITY_recall": 0.8181818181818182,
"eval_TIME_f1": 0.8813559322033899,
"eval_TIME_number": 28,
"eval_TIME_precision": 0.8387096774193549,
"eval_TIME_recall": 0.9285714285714286,
"eval_loss": 0.1638197898864746,
"eval_overall_accuracy": 0.9604752667313288,
"eval_overall_f1": 0.8351063829787235,
"eval_overall_precision": 0.7753086419753087,
"eval_overall_recall": 0.9048991354466859,
"eval_runtime": 0.3527,
"eval_samples_per_second": 530.148,
"eval_steps_per_second": 8.505,
"step": 7314
},
{
"epoch": 70.0,
"grad_norm": 0.29508113861083984,
"learning_rate": 1.5e-05,
"loss": 0.0335,
"step": 7420
},
{
"epoch": 70.0,
"eval_LOCATION_f1": 0.8496732026143791,
"eval_LOCATION_number": 71,
"eval_LOCATION_precision": 0.7926829268292683,
"eval_LOCATION_recall": 0.9154929577464789,
"eval_ORGANIZATION_f1": 0.75,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.6551724137931034,
"eval_ORGANIZATION_recall": 0.8769230769230769,
"eval_PERSON_f1": 0.896774193548387,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.86875,
"eval_PERSON_recall": 0.9266666666666666,
"eval_QUANTITY_f1": 0.7397260273972603,
"eval_QUANTITY_number": 33,
"eval_QUANTITY_precision": 0.675,
"eval_QUANTITY_recall": 0.8181818181818182,
"eval_TIME_f1": 0.8474576271186439,
"eval_TIME_number": 28,
"eval_TIME_precision": 0.8064516129032258,
"eval_TIME_recall": 0.8928571428571429,
"eval_loss": 0.17051611840724945,
"eval_overall_accuracy": 0.9592628516003879,
"eval_overall_f1": 0.8380187416331996,
"eval_overall_precision": 0.7825,
"eval_overall_recall": 0.9020172910662824,
"eval_runtime": 0.3495,
"eval_samples_per_second": 535.056,
"eval_steps_per_second": 8.584,
"step": 7420
},
{
"epoch": 71.0,
"grad_norm": 1.538805365562439,
"learning_rate": 1.45e-05,
"loss": 0.0353,
"step": 7526
},
{
"epoch": 71.0,
"eval_LOCATION_f1": 0.8129032258064516,
"eval_LOCATION_number": 71,
"eval_LOCATION_precision": 0.75,
"eval_LOCATION_recall": 0.8873239436619719,
"eval_ORGANIZATION_f1": 0.7080745341614907,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.59375,
"eval_ORGANIZATION_recall": 0.8769230769230769,
"eval_PERSON_f1": 0.8917197452229298,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.8536585365853658,
"eval_PERSON_recall": 0.9333333333333333,
"eval_QUANTITY_f1": 0.7105263157894738,
"eval_QUANTITY_number": 33,
"eval_QUANTITY_precision": 0.627906976744186,
"eval_QUANTITY_recall": 0.8181818181818182,
"eval_TIME_f1": 0.8333333333333334,
"eval_TIME_number": 28,
"eval_TIME_precision": 0.78125,
"eval_TIME_recall": 0.8928571428571429,
"eval_loss": 0.19078566133975983,
"eval_overall_accuracy": 0.9544131910766246,
"eval_overall_f1": 0.814621409921671,
"eval_overall_precision": 0.7446300715990454,
"eval_overall_recall": 0.899135446685879,
"eval_runtime": 0.3503,
"eval_samples_per_second": 533.879,
"eval_steps_per_second": 8.565,
"step": 7526
},
{
"epoch": 72.0,
"grad_norm": 0.9210314750671387,
"learning_rate": 1.4000000000000001e-05,
"loss": 0.0324,
"step": 7632
},
{
"epoch": 72.0,
"eval_LOCATION_f1": 0.8129032258064516,
"eval_LOCATION_number": 71,
"eval_LOCATION_precision": 0.75,
"eval_LOCATION_recall": 0.8873239436619719,
"eval_ORGANIZATION_f1": 0.7236842105263158,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.632183908045977,
"eval_ORGANIZATION_recall": 0.8461538461538461,
"eval_PERSON_f1": 0.8903225806451613,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.8625,
"eval_PERSON_recall": 0.92,
"eval_QUANTITY_f1": 0.7945205479452054,
"eval_QUANTITY_number": 33,
"eval_QUANTITY_precision": 0.725,
"eval_QUANTITY_recall": 0.8787878787878788,
"eval_TIME_f1": 0.8474576271186439,
"eval_TIME_number": 28,
"eval_TIME_precision": 0.8064516129032258,
"eval_TIME_recall": 0.8928571428571429,
"eval_loss": 0.1728380173444748,
"eval_overall_accuracy": 0.9602327837051406,
"eval_overall_f1": 0.8277703604806409,
"eval_overall_precision": 0.7711442786069652,
"eval_overall_recall": 0.8933717579250721,
"eval_runtime": 0.3513,
"eval_samples_per_second": 532.244,
"eval_steps_per_second": 8.539,
"step": 7632
},
{
"epoch": 73.0,
"grad_norm": 0.4661843776702881,
"learning_rate": 1.3500000000000001e-05,
"loss": 0.0323,
"step": 7738
},
{
"epoch": 73.0,
"eval_LOCATION_f1": 0.8157894736842104,
"eval_LOCATION_number": 71,
"eval_LOCATION_precision": 0.7654320987654321,
"eval_LOCATION_recall": 0.8732394366197183,
"eval_ORGANIZATION_f1": 0.7388535031847134,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.6304347826086957,
"eval_ORGANIZATION_recall": 0.8923076923076924,
"eval_PERSON_f1": 0.8903225806451613,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.8625,
"eval_PERSON_recall": 0.92,
"eval_QUANTITY_f1": 0.7105263157894738,
"eval_QUANTITY_number": 33,
"eval_QUANTITY_precision": 0.627906976744186,
"eval_QUANTITY_recall": 0.8181818181818182,
"eval_TIME_f1": 0.896551724137931,
"eval_TIME_number": 28,
"eval_TIME_precision": 0.8666666666666667,
"eval_TIME_recall": 0.9285714285714286,
"eval_loss": 0.17989809811115265,
"eval_overall_accuracy": 0.9573229873908826,
"eval_overall_f1": 0.8260292164674636,
"eval_overall_precision": 0.7660098522167488,
"eval_overall_recall": 0.8962536023054755,
"eval_runtime": 0.3497,
"eval_samples_per_second": 534.723,
"eval_steps_per_second": 8.578,
"step": 7738
},
{
"epoch": 74.0,
"grad_norm": 1.6226832866668701,
"learning_rate": 1.3000000000000001e-05,
"loss": 0.0321,
"step": 7844
},
{
"epoch": 74.0,
"eval_LOCATION_f1": 0.8344370860927152,
"eval_LOCATION_number": 71,
"eval_LOCATION_precision": 0.7875,
"eval_LOCATION_recall": 0.8873239436619719,
"eval_ORGANIZATION_f1": 0.7320261437908497,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.6363636363636364,
"eval_ORGANIZATION_recall": 0.8615384615384616,
"eval_PERSON_f1": 0.896774193548387,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.86875,
"eval_PERSON_recall": 0.9266666666666666,
"eval_QUANTITY_f1": 0.7012987012987013,
"eval_QUANTITY_number": 33,
"eval_QUANTITY_precision": 0.6136363636363636,
"eval_QUANTITY_recall": 0.8181818181818182,
"eval_TIME_f1": 0.8620689655172413,
"eval_TIME_number": 28,
"eval_TIME_precision": 0.8333333333333334,
"eval_TIME_recall": 0.8928571428571429,
"eval_loss": 0.1787552833557129,
"eval_overall_accuracy": 0.9585354025218235,
"eval_overall_f1": 0.8277703604806409,
"eval_overall_precision": 0.7711442786069652,
"eval_overall_recall": 0.8933717579250721,
"eval_runtime": 0.3512,
"eval_samples_per_second": 532.488,
"eval_steps_per_second": 8.543,
"step": 7844
},
{
"epoch": 75.0,
"grad_norm": 0.3848640024662018,
"learning_rate": 1.25e-05,
"loss": 0.0296,
"step": 7950
},
{
"epoch": 75.0,
"eval_LOCATION_f1": 0.8076923076923077,
"eval_LOCATION_number": 71,
"eval_LOCATION_precision": 0.7411764705882353,
"eval_LOCATION_recall": 0.8873239436619719,
"eval_ORGANIZATION_f1": 0.7320261437908497,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.6363636363636364,
"eval_ORGANIZATION_recall": 0.8615384615384616,
"eval_PERSON_f1": 0.8903225806451613,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.8625,
"eval_PERSON_recall": 0.92,
"eval_QUANTITY_f1": 0.7837837837837839,
"eval_QUANTITY_number": 33,
"eval_QUANTITY_precision": 0.7073170731707317,
"eval_QUANTITY_recall": 0.8787878787878788,
"eval_TIME_f1": 0.8474576271186439,
"eval_TIME_number": 28,
"eval_TIME_precision": 0.8064516129032258,
"eval_TIME_recall": 0.8928571428571429,
"eval_loss": 0.18127557635307312,
"eval_overall_accuracy": 0.9582929194956353,
"eval_overall_f1": 0.827127659574468,
"eval_overall_precision": 0.7679012345679013,
"eval_overall_recall": 0.8962536023054755,
"eval_runtime": 0.3512,
"eval_samples_per_second": 532.43,
"eval_steps_per_second": 8.542,
"step": 7950
},
{
"epoch": 76.0,
"grad_norm": 0.07505329698324203,
"learning_rate": 1.2e-05,
"loss": 0.0308,
"step": 8056
},
{
"epoch": 76.0,
"eval_LOCATION_f1": 0.8344370860927152,
"eval_LOCATION_number": 71,
"eval_LOCATION_precision": 0.7875,
"eval_LOCATION_recall": 0.8873239436619719,
"eval_ORGANIZATION_f1": 0.7169811320754718,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.6063829787234043,
"eval_ORGANIZATION_recall": 0.8769230769230769,
"eval_PERSON_f1": 0.8888888888888887,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.8717948717948718,
"eval_PERSON_recall": 0.9066666666666666,
"eval_QUANTITY_f1": 0.7567567567567567,
"eval_QUANTITY_number": 33,
"eval_QUANTITY_precision": 0.6829268292682927,
"eval_QUANTITY_recall": 0.8484848484848485,
"eval_TIME_f1": 0.8813559322033899,
"eval_TIME_number": 28,
"eval_TIME_precision": 0.8387096774193549,
"eval_TIME_recall": 0.9285714285714286,
"eval_loss": 0.17781808972358704,
"eval_overall_accuracy": 0.9582929194956353,
"eval_overall_f1": 0.8277703604806409,
"eval_overall_precision": 0.7711442786069652,
"eval_overall_recall": 0.8933717579250721,
"eval_runtime": 0.3505,
"eval_samples_per_second": 533.468,
"eval_steps_per_second": 8.558,
"step": 8056
},
{
"epoch": 77.0,
"grad_norm": 1.183031439781189,
"learning_rate": 1.1500000000000002e-05,
"loss": 0.0305,
"step": 8162
},
{
"epoch": 77.0,
"eval_LOCATION_f1": 0.8129032258064516,
"eval_LOCATION_number": 71,
"eval_LOCATION_precision": 0.75,
"eval_LOCATION_recall": 0.8873239436619719,
"eval_ORGANIZATION_f1": 0.7199999999999999,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.6352941176470588,
"eval_ORGANIZATION_recall": 0.8307692307692308,
"eval_PERSON_f1": 0.8903225806451613,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.8625,
"eval_PERSON_recall": 0.92,
"eval_QUANTITY_f1": 0.7567567567567567,
"eval_QUANTITY_number": 33,
"eval_QUANTITY_precision": 0.6829268292682927,
"eval_QUANTITY_recall": 0.8484848484848485,
"eval_TIME_f1": 0.8813559322033899,
"eval_TIME_number": 28,
"eval_TIME_precision": 0.8387096774193549,
"eval_TIME_recall": 0.9285714285714286,
"eval_loss": 0.18227067589759827,
"eval_overall_accuracy": 0.9575654704170709,
"eval_overall_f1": 0.8262032085561497,
"eval_overall_precision": 0.770573566084788,
"eval_overall_recall": 0.8904899135446686,
"eval_runtime": 0.3499,
"eval_samples_per_second": 534.482,
"eval_steps_per_second": 8.575,
"step": 8162
},
{
"epoch": 78.0,
"grad_norm": 0.4748055636882782,
"learning_rate": 1.1000000000000001e-05,
"loss": 0.0298,
"step": 8268
},
{
"epoch": 78.0,
"eval_LOCATION_f1": 0.8387096774193548,
"eval_LOCATION_number": 71,
"eval_LOCATION_precision": 0.7738095238095238,
"eval_LOCATION_recall": 0.9154929577464789,
"eval_ORGANIZATION_f1": 0.7236842105263158,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.632183908045977,
"eval_ORGANIZATION_recall": 0.8461538461538461,
"eval_PERSON_f1": 0.8932038834951457,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.8679245283018868,
"eval_PERSON_recall": 0.92,
"eval_QUANTITY_f1": 0.7200000000000001,
"eval_QUANTITY_number": 33,
"eval_QUANTITY_precision": 0.6428571428571429,
"eval_QUANTITY_recall": 0.8181818181818182,
"eval_TIME_f1": 0.912280701754386,
"eval_TIME_number": 28,
"eval_TIME_precision": 0.896551724137931,
"eval_TIME_recall": 0.9285714285714286,
"eval_loss": 0.1802036613225937,
"eval_overall_accuracy": 0.9575654704170709,
"eval_overall_f1": 0.8315508021390374,
"eval_overall_precision": 0.7755610972568578,
"eval_overall_recall": 0.8962536023054755,
"eval_runtime": 0.3497,
"eval_samples_per_second": 534.703,
"eval_steps_per_second": 8.578,
"step": 8268
},
{
"epoch": 79.0,
"grad_norm": 1.2819609642028809,
"learning_rate": 1.05e-05,
"loss": 0.0302,
"step": 8374
},
{
"epoch": 79.0,
"eval_LOCATION_f1": 0.8205128205128205,
"eval_LOCATION_number": 71,
"eval_LOCATION_precision": 0.7529411764705882,
"eval_LOCATION_recall": 0.9014084507042254,
"eval_ORGANIZATION_f1": 0.728476821192053,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.6395348837209303,
"eval_ORGANIZATION_recall": 0.8461538461538461,
"eval_PERSON_f1": 0.90032154340836,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.8695652173913043,
"eval_PERSON_recall": 0.9333333333333333,
"eval_QUANTITY_f1": 0.7105263157894738,
"eval_QUANTITY_number": 33,
"eval_QUANTITY_precision": 0.627906976744186,
"eval_QUANTITY_recall": 0.8181818181818182,
"eval_TIME_f1": 0.8813559322033899,
"eval_TIME_number": 28,
"eval_TIME_precision": 0.8387096774193549,
"eval_TIME_recall": 0.9285714285714286,
"eval_loss": 0.18992583453655243,
"eval_overall_accuracy": 0.9585354025218235,
"eval_overall_f1": 0.8286852589641435,
"eval_overall_precision": 0.7684729064039408,
"eval_overall_recall": 0.899135446685879,
"eval_runtime": 0.3507,
"eval_samples_per_second": 533.193,
"eval_steps_per_second": 8.554,
"step": 8374
},
{
"epoch": 80.0,
"grad_norm": 0.5597596168518066,
"learning_rate": 1e-05,
"loss": 0.0307,
"step": 8480
},
{
"epoch": 80.0,
"eval_LOCATION_f1": 0.8533333333333334,
"eval_LOCATION_number": 71,
"eval_LOCATION_precision": 0.810126582278481,
"eval_LOCATION_recall": 0.9014084507042254,
"eval_ORGANIZATION_f1": 0.7066666666666667,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.6235294117647059,
"eval_ORGANIZATION_recall": 0.8153846153846154,
"eval_PERSON_f1": 0.8932038834951457,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.8679245283018868,
"eval_PERSON_recall": 0.92,
"eval_QUANTITY_f1": 0.6842105263157895,
"eval_QUANTITY_number": 33,
"eval_QUANTITY_precision": 0.6046511627906976,
"eval_QUANTITY_recall": 0.7878787878787878,
"eval_TIME_f1": 0.8524590163934426,
"eval_TIME_number": 28,
"eval_TIME_precision": 0.7878787878787878,
"eval_TIME_recall": 0.9285714285714286,
"eval_loss": 0.18140378594398499,
"eval_overall_accuracy": 0.957807953443259,
"eval_overall_f1": 0.8230563002680964,
"eval_overall_precision": 0.7694235588972431,
"eval_overall_recall": 0.8847262247838616,
"eval_runtime": 0.3504,
"eval_samples_per_second": 533.729,
"eval_steps_per_second": 8.562,
"step": 8480
},
{
"epoch": 81.0,
"grad_norm": 0.40338334441185,
"learning_rate": 9.5e-06,
"loss": 0.0275,
"step": 8586
},
{
"epoch": 81.0,
"eval_LOCATION_f1": 0.8366013071895425,
"eval_LOCATION_number": 71,
"eval_LOCATION_precision": 0.7804878048780488,
"eval_LOCATION_recall": 0.9014084507042254,
"eval_ORGANIZATION_f1": 0.7058823529411765,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.6136363636363636,
"eval_ORGANIZATION_recall": 0.8307692307692308,
"eval_PERSON_f1": 0.896103896103896,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.8734177215189873,
"eval_PERSON_recall": 0.92,
"eval_QUANTITY_f1": 0.7200000000000001,
"eval_QUANTITY_number": 33,
"eval_QUANTITY_precision": 0.6428571428571429,
"eval_QUANTITY_recall": 0.8181818181818182,
"eval_TIME_f1": 0.8813559322033899,
"eval_TIME_number": 28,
"eval_TIME_precision": 0.8387096774193549,
"eval_TIME_recall": 0.9285714285714286,
"eval_loss": 0.18396371603012085,
"eval_overall_accuracy": 0.9585354025218235,
"eval_overall_f1": 0.8262032085561497,
"eval_overall_precision": 0.770573566084788,
"eval_overall_recall": 0.8904899135446686,
"eval_runtime": 0.3499,
"eval_samples_per_second": 534.509,
"eval_steps_per_second": 8.575,
"step": 8586
},
{
"epoch": 82.0,
"grad_norm": 0.6464970111846924,
"learning_rate": 9e-06,
"loss": 0.0285,
"step": 8692
},
{
"epoch": 82.0,
"eval_LOCATION_f1": 0.8496732026143791,
"eval_LOCATION_number": 71,
"eval_LOCATION_precision": 0.7926829268292683,
"eval_LOCATION_recall": 0.9154929577464789,
"eval_ORGANIZATION_f1": 0.7142857142857143,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.6179775280898876,
"eval_ORGANIZATION_recall": 0.8461538461538461,
"eval_PERSON_f1": 0.8903225806451613,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.8625,
"eval_PERSON_recall": 0.92,
"eval_QUANTITY_f1": 0.7200000000000001,
"eval_QUANTITY_number": 33,
"eval_QUANTITY_precision": 0.6428571428571429,
"eval_QUANTITY_recall": 0.8181818181818182,
"eval_TIME_f1": 0.8474576271186439,
"eval_TIME_number": 28,
"eval_TIME_precision": 0.8064516129032258,
"eval_TIME_recall": 0.8928571428571429,
"eval_loss": 0.18916206061840057,
"eval_overall_accuracy": 0.9570805043646945,
"eval_overall_f1": 0.8255659121171772,
"eval_overall_precision": 0.7673267326732673,
"eval_overall_recall": 0.8933717579250721,
"eval_runtime": 0.3508,
"eval_samples_per_second": 533.079,
"eval_steps_per_second": 8.552,
"step": 8692
},
{
"epoch": 83.0,
"grad_norm": 0.22236359119415283,
"learning_rate": 8.500000000000002e-06,
"loss": 0.0303,
"step": 8798
},
{
"epoch": 83.0,
"eval_LOCATION_f1": 0.8366013071895425,
"eval_LOCATION_number": 71,
"eval_LOCATION_precision": 0.7804878048780488,
"eval_LOCATION_recall": 0.9014084507042254,
"eval_ORGANIZATION_f1": 0.7051282051282052,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.6043956043956044,
"eval_ORGANIZATION_recall": 0.8461538461538461,
"eval_PERSON_f1": 0.8903225806451613,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.8625,
"eval_PERSON_recall": 0.92,
"eval_QUANTITY_f1": 0.7200000000000001,
"eval_QUANTITY_number": 33,
"eval_QUANTITY_precision": 0.6428571428571429,
"eval_QUANTITY_recall": 0.8181818181818182,
"eval_TIME_f1": 0.8474576271186439,
"eval_TIME_number": 28,
"eval_TIME_precision": 0.8064516129032258,
"eval_TIME_recall": 0.8928571428571429,
"eval_loss": 0.18220850825309753,
"eval_overall_accuracy": 0.9573229873908826,
"eval_overall_f1": 0.8207171314741034,
"eval_overall_precision": 0.7610837438423645,
"eval_overall_recall": 0.8904899135446686,
"eval_runtime": 0.3506,
"eval_samples_per_second": 533.426,
"eval_steps_per_second": 8.558,
"step": 8798
},
{
"epoch": 84.0,
"grad_norm": 0.35181981325149536,
"learning_rate": 8.000000000000001e-06,
"loss": 0.0291,
"step": 8904
},
{
"epoch": 84.0,
"eval_LOCATION_f1": 0.8076923076923077,
"eval_LOCATION_number": 71,
"eval_LOCATION_precision": 0.7411764705882353,
"eval_LOCATION_recall": 0.8873239436619719,
"eval_ORGANIZATION_f1": 0.6973684210526315,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.6091954022988506,
"eval_ORGANIZATION_recall": 0.8153846153846154,
"eval_PERSON_f1": 0.8903225806451613,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.8625,
"eval_PERSON_recall": 0.92,
"eval_QUANTITY_f1": 0.7200000000000001,
"eval_QUANTITY_number": 33,
"eval_QUANTITY_precision": 0.6428571428571429,
"eval_QUANTITY_recall": 0.8181818181818182,
"eval_TIME_f1": 0.8813559322033899,
"eval_TIME_number": 28,
"eval_TIME_precision": 0.8387096774193549,
"eval_TIME_recall": 0.9285714285714286,
"eval_loss": 0.1842212826013565,
"eval_overall_accuracy": 0.95635305528613,
"eval_overall_f1": 0.8164893617021276,
"eval_overall_precision": 0.7580246913580246,
"eval_overall_recall": 0.8847262247838616,
"eval_runtime": 0.3505,
"eval_samples_per_second": 533.572,
"eval_steps_per_second": 8.56,
"step": 8904
},
{
"epoch": 85.0,
"grad_norm": 0.7243216037750244,
"learning_rate": 7.5e-06,
"loss": 0.0275,
"step": 9010
},
{
"epoch": 85.0,
"eval_LOCATION_f1": 0.8311688311688312,
"eval_LOCATION_number": 71,
"eval_LOCATION_precision": 0.7710843373493976,
"eval_LOCATION_recall": 0.9014084507042254,
"eval_ORGANIZATION_f1": 0.6883116883116883,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.5955056179775281,
"eval_ORGANIZATION_recall": 0.8153846153846154,
"eval_PERSON_f1": 0.8903225806451613,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.8625,
"eval_PERSON_recall": 0.92,
"eval_QUANTITY_f1": 0.7200000000000001,
"eval_QUANTITY_number": 33,
"eval_QUANTITY_precision": 0.6428571428571429,
"eval_QUANTITY_recall": 0.8181818181818182,
"eval_TIME_f1": 0.8813559322033899,
"eval_TIME_number": 28,
"eval_TIME_precision": 0.8387096774193549,
"eval_TIME_recall": 0.9285714285714286,
"eval_loss": 0.18761229515075684,
"eval_overall_accuracy": 0.9573229873908826,
"eval_overall_f1": 0.8191489361702129,
"eval_overall_precision": 0.7604938271604939,
"eval_overall_recall": 0.8876080691642652,
"eval_runtime": 0.3509,
"eval_samples_per_second": 532.932,
"eval_steps_per_second": 8.55,
"step": 9010
},
{
"epoch": 86.0,
"grad_norm": 0.5909172296524048,
"learning_rate": 7.000000000000001e-06,
"loss": 0.0286,
"step": 9116
},
{
"epoch": 86.0,
"eval_LOCATION_f1": 0.8311688311688312,
"eval_LOCATION_number": 71,
"eval_LOCATION_precision": 0.7710843373493976,
"eval_LOCATION_recall": 0.9014084507042254,
"eval_ORGANIZATION_f1": 0.7388535031847134,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.6304347826086957,
"eval_ORGANIZATION_recall": 0.8923076923076924,
"eval_PERSON_f1": 0.8954248366013071,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.8782051282051282,
"eval_PERSON_recall": 0.9133333333333333,
"eval_QUANTITY_f1": 0.7200000000000001,
"eval_QUANTITY_number": 33,
"eval_QUANTITY_precision": 0.6428571428571429,
"eval_QUANTITY_recall": 0.8181818181818182,
"eval_TIME_f1": 0.8474576271186439,
"eval_TIME_number": 28,
"eval_TIME_precision": 0.8064516129032258,
"eval_TIME_recall": 0.8928571428571429,
"eval_loss": 0.1853346824645996,
"eval_overall_accuracy": 0.9582929194956353,
"eval_overall_f1": 0.8282290279627165,
"eval_overall_precision": 0.7698019801980198,
"eval_overall_recall": 0.8962536023054755,
"eval_runtime": 0.3502,
"eval_samples_per_second": 533.924,
"eval_steps_per_second": 8.566,
"step": 9116
},
{
"epoch": 87.0,
"grad_norm": 0.7483916878700256,
"learning_rate": 6.5000000000000004e-06,
"loss": 0.0283,
"step": 9222
},
{
"epoch": 87.0,
"eval_LOCATION_f1": 0.8289473684210527,
"eval_LOCATION_number": 71,
"eval_LOCATION_precision": 0.7777777777777778,
"eval_LOCATION_recall": 0.8873239436619719,
"eval_ORGANIZATION_f1": 0.7295597484276729,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.6170212765957447,
"eval_ORGANIZATION_recall": 0.8923076923076924,
"eval_PERSON_f1": 0.8867313915857605,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.8616352201257862,
"eval_PERSON_recall": 0.9133333333333333,
"eval_QUANTITY_f1": 0.7397260273972603,
"eval_QUANTITY_number": 33,
"eval_QUANTITY_precision": 0.675,
"eval_QUANTITY_recall": 0.8181818181818182,
"eval_TIME_f1": 0.8474576271186439,
"eval_TIME_number": 28,
"eval_TIME_precision": 0.8064516129032258,
"eval_TIME_recall": 0.8928571428571429,
"eval_loss": 0.1859874278306961,
"eval_overall_accuracy": 0.9580504364694471,
"eval_overall_f1": 0.8244680851063829,
"eval_overall_precision": 0.7654320987654321,
"eval_overall_recall": 0.8933717579250721,
"eval_runtime": 0.3491,
"eval_samples_per_second": 535.601,
"eval_steps_per_second": 8.593,
"step": 9222
},
{
"epoch": 88.0,
"grad_norm": 0.6192948222160339,
"learning_rate": 6e-06,
"loss": 0.0278,
"step": 9328
},
{
"epoch": 88.0,
"eval_LOCATION_f1": 0.8289473684210527,
"eval_LOCATION_number": 71,
"eval_LOCATION_precision": 0.7777777777777778,
"eval_LOCATION_recall": 0.8873239436619719,
"eval_ORGANIZATION_f1": 0.7354838709677419,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.6333333333333333,
"eval_ORGANIZATION_recall": 0.8769230769230769,
"eval_PERSON_f1": 0.8903225806451613,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.8625,
"eval_PERSON_recall": 0.92,
"eval_QUANTITY_f1": 0.7777777777777778,
"eval_QUANTITY_number": 33,
"eval_QUANTITY_precision": 0.717948717948718,
"eval_QUANTITY_recall": 0.8484848484848485,
"eval_TIME_f1": 0.8474576271186439,
"eval_TIME_number": 28,
"eval_TIME_precision": 0.8064516129032258,
"eval_TIME_recall": 0.8928571428571429,
"eval_loss": 0.1810171753168106,
"eval_overall_accuracy": 0.9592628516003879,
"eval_overall_f1": 0.8315508021390374,
"eval_overall_precision": 0.7755610972568578,
"eval_overall_recall": 0.8962536023054755,
"eval_runtime": 0.3504,
"eval_samples_per_second": 533.64,
"eval_steps_per_second": 8.561,
"step": 9328
},
{
"epoch": 89.0,
"grad_norm": 0.5605934858322144,
"learning_rate": 5.500000000000001e-06,
"loss": 0.0277,
"step": 9434
},
{
"epoch": 89.0,
"eval_LOCATION_f1": 0.8421052631578947,
"eval_LOCATION_number": 71,
"eval_LOCATION_precision": 0.7901234567901234,
"eval_LOCATION_recall": 0.9014084507042254,
"eval_ORGANIZATION_f1": 0.7124999999999999,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.6,
"eval_ORGANIZATION_recall": 0.8769230769230769,
"eval_PERSON_f1": 0.887459807073955,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.8571428571428571,
"eval_PERSON_recall": 0.92,
"eval_QUANTITY_f1": 0.7105263157894738,
"eval_QUANTITY_number": 33,
"eval_QUANTITY_precision": 0.627906976744186,
"eval_QUANTITY_recall": 0.8181818181818182,
"eval_TIME_f1": 0.8474576271186439,
"eval_TIME_number": 28,
"eval_TIME_precision": 0.8064516129032258,
"eval_TIME_recall": 0.8928571428571429,
"eval_loss": 0.18933603167533875,
"eval_overall_accuracy": 0.95635305528613,
"eval_overall_f1": 0.820580474934037,
"eval_overall_precision": 0.7566909975669099,
"eval_overall_recall": 0.8962536023054755,
"eval_runtime": 0.3526,
"eval_samples_per_second": 530.391,
"eval_steps_per_second": 8.509,
"step": 9434
},
{
"epoch": 90.0,
"grad_norm": 0.2893717586994171,
"learning_rate": 5e-06,
"loss": 0.0274,
"step": 9540
},
{
"epoch": 90.0,
"eval_LOCATION_f1": 0.8157894736842104,
"eval_LOCATION_number": 71,
"eval_LOCATION_precision": 0.7654320987654321,
"eval_LOCATION_recall": 0.8732394366197183,
"eval_ORGANIZATION_f1": 0.7142857142857143,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.6179775280898876,
"eval_ORGANIZATION_recall": 0.8461538461538461,
"eval_PERSON_f1": 0.8925081433224756,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.8726114649681529,
"eval_PERSON_recall": 0.9133333333333333,
"eval_QUANTITY_f1": 0.7123287671232875,
"eval_QUANTITY_number": 33,
"eval_QUANTITY_precision": 0.65,
"eval_QUANTITY_recall": 0.7878787878787878,
"eval_TIME_f1": 0.8333333333333334,
"eval_TIME_number": 28,
"eval_TIME_precision": 0.78125,
"eval_TIME_recall": 0.8928571428571429,
"eval_loss": 0.18061868846416473,
"eval_overall_accuracy": 0.9582929194956353,
"eval_overall_f1": 0.8176943699731903,
"eval_overall_precision": 0.7644110275689223,
"eval_overall_recall": 0.8789625360230547,
"eval_runtime": 0.3513,
"eval_samples_per_second": 532.297,
"eval_steps_per_second": 8.54,
"step": 9540
},
{
"epoch": 91.0,
"grad_norm": 0.9740373492240906,
"learning_rate": 4.5e-06,
"loss": 0.0262,
"step": 9646
},
{
"epoch": 91.0,
"eval_LOCATION_f1": 0.8104575163398693,
"eval_LOCATION_number": 71,
"eval_LOCATION_precision": 0.7560975609756098,
"eval_LOCATION_recall": 0.8732394366197183,
"eval_ORGANIZATION_f1": 0.708860759493671,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.6021505376344086,
"eval_ORGANIZATION_recall": 0.8615384615384616,
"eval_PERSON_f1": 0.8782051282051282,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.845679012345679,
"eval_PERSON_recall": 0.9133333333333333,
"eval_QUANTITY_f1": 0.7105263157894738,
"eval_QUANTITY_number": 33,
"eval_QUANTITY_precision": 0.627906976744186,
"eval_QUANTITY_recall": 0.8181818181818182,
"eval_TIME_f1": 0.8474576271186439,
"eval_TIME_number": 28,
"eval_TIME_precision": 0.8064516129032258,
"eval_TIME_recall": 0.8928571428571429,
"eval_loss": 0.18925167620182037,
"eval_overall_accuracy": 0.95635305528613,
"eval_overall_f1": 0.8100263852242744,
"eval_overall_precision": 0.7469586374695864,
"eval_overall_recall": 0.8847262247838616,
"eval_runtime": 0.3493,
"eval_samples_per_second": 535.417,
"eval_steps_per_second": 8.59,
"step": 9646
},
{
"epoch": 92.0,
"grad_norm": 0.1865842491388321,
"learning_rate": 4.000000000000001e-06,
"loss": 0.0263,
"step": 9752
},
{
"epoch": 92.0,
"eval_LOCATION_f1": 0.8157894736842104,
"eval_LOCATION_number": 71,
"eval_LOCATION_precision": 0.7654320987654321,
"eval_LOCATION_recall": 0.8732394366197183,
"eval_ORGANIZATION_f1": 0.7466666666666668,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.6588235294117647,
"eval_ORGANIZATION_recall": 0.8615384615384616,
"eval_PERSON_f1": 0.8810289389067525,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.8509316770186336,
"eval_PERSON_recall": 0.9133333333333333,
"eval_QUANTITY_f1": 0.7123287671232875,
"eval_QUANTITY_number": 33,
"eval_QUANTITY_precision": 0.65,
"eval_QUANTITY_recall": 0.7878787878787878,
"eval_TIME_f1": 0.8333333333333334,
"eval_TIME_number": 28,
"eval_TIME_precision": 0.78125,
"eval_TIME_recall": 0.8928571428571429,
"eval_loss": 0.18539157509803772,
"eval_overall_accuracy": 0.9587778855480117,
"eval_overall_f1": 0.8203753351206434,
"eval_overall_precision": 0.7669172932330827,
"eval_overall_recall": 0.8818443804034583,
"eval_runtime": 0.3492,
"eval_samples_per_second": 535.496,
"eval_steps_per_second": 8.591,
"step": 9752
},
{
"epoch": 93.0,
"grad_norm": 0.1964859962463379,
"learning_rate": 3.5000000000000004e-06,
"loss": 0.0253,
"step": 9858
},
{
"epoch": 93.0,
"eval_LOCATION_f1": 0.823529411764706,
"eval_LOCATION_number": 71,
"eval_LOCATION_precision": 0.7682926829268293,
"eval_LOCATION_recall": 0.8873239436619719,
"eval_ORGANIZATION_f1": 0.713375796178344,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.6086956521739131,
"eval_ORGANIZATION_recall": 0.8615384615384616,
"eval_PERSON_f1": 0.8782051282051282,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.845679012345679,
"eval_PERSON_recall": 0.9133333333333333,
"eval_QUANTITY_f1": 0.7297297297297297,
"eval_QUANTITY_number": 33,
"eval_QUANTITY_precision": 0.6585365853658537,
"eval_QUANTITY_recall": 0.8181818181818182,
"eval_TIME_f1": 0.8474576271186439,
"eval_TIME_number": 28,
"eval_TIME_precision": 0.8064516129032258,
"eval_TIME_recall": 0.8928571428571429,
"eval_loss": 0.189639613032341,
"eval_overall_accuracy": 0.957807953443259,
"eval_overall_f1": 0.8158940397350992,
"eval_overall_precision": 0.7549019607843137,
"eval_overall_recall": 0.8876080691642652,
"eval_runtime": 0.351,
"eval_samples_per_second": 532.764,
"eval_steps_per_second": 8.547,
"step": 9858
},
{
"epoch": 94.0,
"grad_norm": 0.6065542101860046,
"learning_rate": 3e-06,
"loss": 0.0246,
"step": 9964
},
{
"epoch": 94.0,
"eval_LOCATION_f1": 0.8157894736842104,
"eval_LOCATION_number": 71,
"eval_LOCATION_precision": 0.7654320987654321,
"eval_LOCATION_recall": 0.8732394366197183,
"eval_ORGANIZATION_f1": 0.713375796178344,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.6086956521739131,
"eval_ORGANIZATION_recall": 0.8615384615384616,
"eval_PERSON_f1": 0.8766233766233766,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.8544303797468354,
"eval_PERSON_recall": 0.9,
"eval_QUANTITY_f1": 0.7397260273972603,
"eval_QUANTITY_number": 33,
"eval_QUANTITY_precision": 0.675,
"eval_QUANTITY_recall": 0.8181818181818182,
"eval_TIME_f1": 0.8474576271186439,
"eval_TIME_number": 28,
"eval_TIME_precision": 0.8064516129032258,
"eval_TIME_recall": 0.8928571428571429,
"eval_loss": 0.18659386038780212,
"eval_overall_accuracy": 0.957807953443259,
"eval_overall_f1": 0.8144192256341789,
"eval_overall_precision": 0.7587064676616916,
"eval_overall_recall": 0.8789625360230547,
"eval_runtime": 0.3514,
"eval_samples_per_second": 532.142,
"eval_steps_per_second": 8.537,
"step": 9964
},
{
"epoch": 95.0,
"grad_norm": 0.47104644775390625,
"learning_rate": 2.5e-06,
"loss": 0.0277,
"step": 10070
},
{
"epoch": 95.0,
"eval_LOCATION_f1": 0.8104575163398693,
"eval_LOCATION_number": 71,
"eval_LOCATION_precision": 0.7560975609756098,
"eval_LOCATION_recall": 0.8732394366197183,
"eval_ORGANIZATION_f1": 0.7368421052631579,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.6436781609195402,
"eval_ORGANIZATION_recall": 0.8615384615384616,
"eval_PERSON_f1": 0.8737864077669903,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.8490566037735849,
"eval_PERSON_recall": 0.9,
"eval_QUANTITY_f1": 0.7200000000000001,
"eval_QUANTITY_number": 33,
"eval_QUANTITY_precision": 0.6428571428571429,
"eval_QUANTITY_recall": 0.8181818181818182,
"eval_TIME_f1": 0.8474576271186439,
"eval_TIME_number": 28,
"eval_TIME_precision": 0.8064516129032258,
"eval_TIME_recall": 0.8928571428571429,
"eval_loss": 0.18918968737125397,
"eval_overall_accuracy": 0.9573229873908826,
"eval_overall_f1": 0.8155080213903744,
"eval_overall_precision": 0.7605985037406484,
"eval_overall_recall": 0.8789625360230547,
"eval_runtime": 0.3518,
"eval_samples_per_second": 531.589,
"eval_steps_per_second": 8.528,
"step": 10070
},
{
"epoch": 96.0,
"grad_norm": 0.6074219346046448,
"learning_rate": 2.0000000000000003e-06,
"loss": 0.0261,
"step": 10176
},
{
"epoch": 96.0,
"eval_LOCATION_f1": 0.8157894736842104,
"eval_LOCATION_number": 71,
"eval_LOCATION_precision": 0.7654320987654321,
"eval_LOCATION_recall": 0.8732394366197183,
"eval_ORGANIZATION_f1": 0.717948717948718,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.6153846153846154,
"eval_ORGANIZATION_recall": 0.8615384615384616,
"eval_PERSON_f1": 0.8810289389067525,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.8509316770186336,
"eval_PERSON_recall": 0.9133333333333333,
"eval_QUANTITY_f1": 0.7397260273972603,
"eval_QUANTITY_number": 33,
"eval_QUANTITY_precision": 0.675,
"eval_QUANTITY_recall": 0.8181818181818182,
"eval_TIME_f1": 0.8474576271186439,
"eval_TIME_number": 28,
"eval_TIME_precision": 0.8064516129032258,
"eval_TIME_recall": 0.8928571428571429,
"eval_loss": 0.18794935941696167,
"eval_overall_accuracy": 0.9575654704170709,
"eval_overall_f1": 0.8175765645805593,
"eval_overall_precision": 0.7599009900990099,
"eval_overall_recall": 0.8847262247838616,
"eval_runtime": 0.3495,
"eval_samples_per_second": 534.995,
"eval_steps_per_second": 8.583,
"step": 10176
},
{
"epoch": 97.0,
"grad_norm": 0.5106649398803711,
"learning_rate": 1.5e-06,
"loss": 0.025,
"step": 10282
},
{
"epoch": 97.0,
"eval_LOCATION_f1": 0.8157894736842104,
"eval_LOCATION_number": 71,
"eval_LOCATION_precision": 0.7654320987654321,
"eval_LOCATION_recall": 0.8732394366197183,
"eval_ORGANIZATION_f1": 0.7189542483660131,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.625,
"eval_ORGANIZATION_recall": 0.8461538461538461,
"eval_PERSON_f1": 0.8810289389067525,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.8509316770186336,
"eval_PERSON_recall": 0.9133333333333333,
"eval_QUANTITY_f1": 0.7200000000000001,
"eval_QUANTITY_number": 33,
"eval_QUANTITY_precision": 0.6428571428571429,
"eval_QUANTITY_recall": 0.8181818181818182,
"eval_TIME_f1": 0.8474576271186439,
"eval_TIME_number": 28,
"eval_TIME_precision": 0.8064516129032258,
"eval_TIME_recall": 0.8928571428571429,
"eval_loss": 0.18944178521633148,
"eval_overall_accuracy": 0.9575654704170709,
"eval_overall_f1": 0.816,
"eval_overall_precision": 0.7593052109181141,
"eval_overall_recall": 0.8818443804034583,
"eval_runtime": 0.3495,
"eval_samples_per_second": 535.094,
"eval_steps_per_second": 8.584,
"step": 10282
},
{
"epoch": 98.0,
"grad_norm": 0.6887297034263611,
"learning_rate": 1.0000000000000002e-06,
"loss": 0.0257,
"step": 10388
},
{
"epoch": 98.0,
"eval_LOCATION_f1": 0.823529411764706,
"eval_LOCATION_number": 71,
"eval_LOCATION_precision": 0.7682926829268293,
"eval_LOCATION_recall": 0.8873239436619719,
"eval_ORGANIZATION_f1": 0.713375796178344,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.6086956521739131,
"eval_ORGANIZATION_recall": 0.8615384615384616,
"eval_PERSON_f1": 0.8782051282051282,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.845679012345679,
"eval_PERSON_recall": 0.9133333333333333,
"eval_QUANTITY_f1": 0.7200000000000001,
"eval_QUANTITY_number": 33,
"eval_QUANTITY_precision": 0.6428571428571429,
"eval_QUANTITY_recall": 0.8181818181818182,
"eval_TIME_f1": 0.8474576271186439,
"eval_TIME_number": 28,
"eval_TIME_precision": 0.8064516129032258,
"eval_TIME_recall": 0.8928571428571429,
"eval_loss": 0.19144974648952484,
"eval_overall_accuracy": 0.9570805043646945,
"eval_overall_f1": 0.8148148148148148,
"eval_overall_precision": 0.7530562347188264,
"eval_overall_recall": 0.8876080691642652,
"eval_runtime": 0.3502,
"eval_samples_per_second": 533.939,
"eval_steps_per_second": 8.566,
"step": 10388
},
{
"epoch": 99.0,
"grad_norm": 0.14230668544769287,
"learning_rate": 5.000000000000001e-07,
"loss": 0.0274,
"step": 10494
},
{
"epoch": 99.0,
"eval_LOCATION_f1": 0.823529411764706,
"eval_LOCATION_number": 71,
"eval_LOCATION_precision": 0.7682926829268293,
"eval_LOCATION_recall": 0.8873239436619719,
"eval_ORGANIZATION_f1": 0.713375796178344,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.6086956521739131,
"eval_ORGANIZATION_recall": 0.8615384615384616,
"eval_PERSON_f1": 0.8810289389067525,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.8509316770186336,
"eval_PERSON_recall": 0.9133333333333333,
"eval_QUANTITY_f1": 0.7200000000000001,
"eval_QUANTITY_number": 33,
"eval_QUANTITY_precision": 0.6428571428571429,
"eval_QUANTITY_recall": 0.8181818181818182,
"eval_TIME_f1": 0.8474576271186439,
"eval_TIME_number": 28,
"eval_TIME_precision": 0.8064516129032258,
"eval_TIME_recall": 0.8928571428571429,
"eval_loss": 0.19010868668556213,
"eval_overall_accuracy": 0.9568380213385063,
"eval_overall_f1": 0.8158940397350992,
"eval_overall_precision": 0.7549019607843137,
"eval_overall_recall": 0.8876080691642652,
"eval_runtime": 0.3511,
"eval_samples_per_second": 532.588,
"eval_steps_per_second": 8.544,
"step": 10494
},
{
"epoch": 100.0,
"grad_norm": 0.5434573292732239,
"learning_rate": 0.0,
"loss": 0.0256,
"step": 10600
},
{
"epoch": 100.0,
"eval_LOCATION_f1": 0.823529411764706,
"eval_LOCATION_number": 71,
"eval_LOCATION_precision": 0.7682926829268293,
"eval_LOCATION_recall": 0.8873239436619719,
"eval_ORGANIZATION_f1": 0.717948717948718,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.6153846153846154,
"eval_ORGANIZATION_recall": 0.8615384615384616,
"eval_PERSON_f1": 0.8782051282051282,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.845679012345679,
"eval_PERSON_recall": 0.9133333333333333,
"eval_QUANTITY_f1": 0.7297297297297297,
"eval_QUANTITY_number": 33,
"eval_QUANTITY_precision": 0.6585365853658537,
"eval_QUANTITY_recall": 0.8181818181818182,
"eval_TIME_f1": 0.8474576271186439,
"eval_TIME_number": 28,
"eval_TIME_precision": 0.8064516129032258,
"eval_TIME_recall": 0.8928571428571429,
"eval_loss": 0.18971124291419983,
"eval_overall_accuracy": 0.9573229873908826,
"eval_overall_f1": 0.816976127320955,
"eval_overall_precision": 0.7567567567567568,
"eval_overall_recall": 0.8876080691642652,
"eval_runtime": 0.3511,
"eval_samples_per_second": 532.586,
"eval_steps_per_second": 8.544,
"step": 10600
},
{
"epoch": 100.0,
"step": 10600,
"total_flos": 5123217774191952.0,
"train_loss": 0.07423505819068765,
"train_runtime": 606.268,
"train_samples_per_second": 278.425,
"train_steps_per_second": 17.484
}
],
"logging_steps": 500,
"max_steps": 10600,
"num_input_tokens_seen": 0,
"num_train_epochs": 100,
"save_steps": 500,
"total_flos": 5123217774191952.0,
"train_batch_size": 16,
"trial_name": null,
"trial_params": null
}