nerugm-seq_bn-rf16-3 / trainer_state.json
apwic's picture
End of training
fc0b73c verified
{
"best_metric": null,
"best_model_checkpoint": null,
"epoch": 100.0,
"eval_steps": 500,
"global_step": 10600,
"is_hyper_param_search": false,
"is_local_process_zero": true,
"is_world_process_zero": true,
"log_history": [
{
"epoch": 1.0,
"grad_norm": 2.184743642807007,
"learning_rate": 4.9500000000000004e-05,
"loss": 0.9441,
"step": 106
},
{
"epoch": 1.0,
"eval_LOCATION_f1": 0.0,
"eval_LOCATION_number": 71,
"eval_LOCATION_precision": 0.0,
"eval_LOCATION_recall": 0.0,
"eval_ORGANIZATION_f1": 0.0,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.0,
"eval_ORGANIZATION_recall": 0.0,
"eval_PERSON_f1": 0.013071895424836602,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.3333333333333333,
"eval_PERSON_recall": 0.006666666666666667,
"eval_QUANTITY_f1": 0.0,
"eval_QUANTITY_number": 33,
"eval_QUANTITY_precision": 0.0,
"eval_QUANTITY_recall": 0.0,
"eval_TIME_f1": 0.0,
"eval_TIME_number": 28,
"eval_TIME_precision": 0.0,
"eval_TIME_recall": 0.0,
"eval_loss": 0.6184682846069336,
"eval_overall_accuracy": 0.8414161008729389,
"eval_overall_f1": 0.005714285714285714,
"eval_overall_precision": 0.3333333333333333,
"eval_overall_recall": 0.002881844380403458,
"eval_runtime": 0.3392,
"eval_samples_per_second": 551.333,
"eval_steps_per_second": 8.845,
"step": 106
},
{
"epoch": 2.0,
"grad_norm": 1.0305746793746948,
"learning_rate": 4.9e-05,
"loss": 0.5645,
"step": 212
},
{
"epoch": 2.0,
"eval_LOCATION_f1": 0.22916666666666669,
"eval_LOCATION_number": 71,
"eval_LOCATION_precision": 0.44,
"eval_LOCATION_recall": 0.15492957746478872,
"eval_ORGANIZATION_f1": 0.04,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.05714285714285714,
"eval_ORGANIZATION_recall": 0.03076923076923077,
"eval_PERSON_f1": 0.5449438202247192,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.470873786407767,
"eval_PERSON_recall": 0.6466666666666666,
"eval_QUANTITY_f1": 0.0,
"eval_QUANTITY_number": 33,
"eval_QUANTITY_precision": 0.0,
"eval_QUANTITY_recall": 0.0,
"eval_TIME_f1": 0.43478260869565216,
"eval_TIME_number": 28,
"eval_TIME_precision": 0.5555555555555556,
"eval_TIME_recall": 0.35714285714285715,
"eval_loss": 0.41943466663360596,
"eval_overall_accuracy": 0.8877303588748787,
"eval_overall_f1": 0.3803486529318542,
"eval_overall_precision": 0.4225352112676056,
"eval_overall_recall": 0.345821325648415,
"eval_runtime": 0.3288,
"eval_samples_per_second": 568.708,
"eval_steps_per_second": 9.124,
"step": 212
},
{
"epoch": 3.0,
"grad_norm": 1.2039958238601685,
"learning_rate": 4.85e-05,
"loss": 0.3968,
"step": 318
},
{
"epoch": 3.0,
"eval_LOCATION_f1": 0.5153374233128835,
"eval_LOCATION_number": 71,
"eval_LOCATION_precision": 0.45652173913043476,
"eval_LOCATION_recall": 0.5915492957746479,
"eval_ORGANIZATION_f1": 0.3278688524590164,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.3508771929824561,
"eval_ORGANIZATION_recall": 0.3076923076923077,
"eval_PERSON_f1": 0.6829268292682927,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.5753424657534246,
"eval_PERSON_recall": 0.84,
"eval_QUANTITY_f1": 0.1846153846153846,
"eval_QUANTITY_number": 33,
"eval_QUANTITY_precision": 0.1875,
"eval_QUANTITY_recall": 0.18181818181818182,
"eval_TIME_f1": 0.8076923076923077,
"eval_TIME_number": 28,
"eval_TIME_precision": 0.875,
"eval_TIME_recall": 0.75,
"eval_loss": 0.30941861867904663,
"eval_overall_accuracy": 0.9202230843840931,
"eval_overall_f1": 0.5577172503242542,
"eval_overall_precision": 0.5070754716981132,
"eval_overall_recall": 0.6195965417867435,
"eval_runtime": 0.3381,
"eval_samples_per_second": 553.069,
"eval_steps_per_second": 8.873,
"step": 318
},
{
"epoch": 4.0,
"grad_norm": 4.7056145668029785,
"learning_rate": 4.8e-05,
"loss": 0.2937,
"step": 424
},
{
"epoch": 4.0,
"eval_LOCATION_f1": 0.5465116279069767,
"eval_LOCATION_number": 71,
"eval_LOCATION_precision": 0.46534653465346537,
"eval_LOCATION_recall": 0.6619718309859155,
"eval_ORGANIZATION_f1": 0.4878048780487805,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.5172413793103449,
"eval_ORGANIZATION_recall": 0.46153846153846156,
"eval_PERSON_f1": 0.8036809815950918,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.7443181818181818,
"eval_PERSON_recall": 0.8733333333333333,
"eval_QUANTITY_f1": 0.47368421052631576,
"eval_QUANTITY_number": 33,
"eval_QUANTITY_precision": 0.4186046511627907,
"eval_QUANTITY_recall": 0.5454545454545454,
"eval_TIME_f1": 0.8363636363636364,
"eval_TIME_number": 28,
"eval_TIME_precision": 0.8518518518518519,
"eval_TIME_recall": 0.8214285714285714,
"eval_loss": 0.2222605049610138,
"eval_overall_accuracy": 0.9369544131910766,
"eval_overall_f1": 0.6622340425531915,
"eval_overall_precision": 0.6148148148148148,
"eval_overall_recall": 0.7175792507204611,
"eval_runtime": 0.3282,
"eval_samples_per_second": 569.698,
"eval_steps_per_second": 9.14,
"step": 424
},
{
"epoch": 5.0,
"grad_norm": 1.303191900253296,
"learning_rate": 4.75e-05,
"loss": 0.2294,
"step": 530
},
{
"epoch": 5.0,
"eval_LOCATION_f1": 0.6496815286624205,
"eval_LOCATION_number": 71,
"eval_LOCATION_precision": 0.5930232558139535,
"eval_LOCATION_recall": 0.7183098591549296,
"eval_ORGANIZATION_f1": 0.562962962962963,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.5428571428571428,
"eval_ORGANIZATION_recall": 0.5846153846153846,
"eval_PERSON_f1": 0.8176100628930819,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.7738095238095238,
"eval_PERSON_recall": 0.8666666666666667,
"eval_QUANTITY_f1": 0.5316455696202532,
"eval_QUANTITY_number": 33,
"eval_QUANTITY_precision": 0.45652173913043476,
"eval_QUANTITY_recall": 0.6363636363636364,
"eval_TIME_f1": 0.888888888888889,
"eval_TIME_number": 28,
"eval_TIME_precision": 0.9230769230769231,
"eval_TIME_recall": 0.8571428571428571,
"eval_loss": 0.18041133880615234,
"eval_overall_accuracy": 0.9427740058195926,
"eval_overall_f1": 0.7106325706594886,
"eval_overall_precision": 0.6666666666666666,
"eval_overall_recall": 0.760806916426513,
"eval_runtime": 0.3291,
"eval_samples_per_second": 568.165,
"eval_steps_per_second": 9.115,
"step": 530
},
{
"epoch": 6.0,
"grad_norm": 1.6567788124084473,
"learning_rate": 4.7e-05,
"loss": 0.1955,
"step": 636
},
{
"epoch": 6.0,
"eval_LOCATION_f1": 0.7052023121387284,
"eval_LOCATION_number": 71,
"eval_LOCATION_precision": 0.5980392156862745,
"eval_LOCATION_recall": 0.8591549295774648,
"eval_ORGANIZATION_f1": 0.5903614457831325,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.48514851485148514,
"eval_ORGANIZATION_recall": 0.7538461538461538,
"eval_PERSON_f1": 0.8109756097560976,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.7471910112359551,
"eval_PERSON_recall": 0.8866666666666667,
"eval_QUANTITY_f1": 0.5517241379310345,
"eval_QUANTITY_number": 33,
"eval_QUANTITY_precision": 0.4444444444444444,
"eval_QUANTITY_recall": 0.7272727272727273,
"eval_TIME_f1": 0.793103448275862,
"eval_TIME_number": 28,
"eval_TIME_precision": 0.7666666666666667,
"eval_TIME_recall": 0.8214285714285714,
"eval_loss": 0.19565138220787048,
"eval_overall_accuracy": 0.9396217264791464,
"eval_overall_f1": 0.7142857142857143,
"eval_overall_precision": 0.6236559139784946,
"eval_overall_recall": 0.8357348703170029,
"eval_runtime": 0.3291,
"eval_samples_per_second": 568.21,
"eval_steps_per_second": 9.116,
"step": 636
},
{
"epoch": 7.0,
"grad_norm": 2.8131422996520996,
"learning_rate": 4.6500000000000005e-05,
"loss": 0.1799,
"step": 742
},
{
"epoch": 7.0,
"eval_LOCATION_f1": 0.7374999999999999,
"eval_LOCATION_number": 71,
"eval_LOCATION_precision": 0.6629213483146067,
"eval_LOCATION_recall": 0.8309859154929577,
"eval_ORGANIZATION_f1": 0.6482758620689656,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.5875,
"eval_ORGANIZATION_recall": 0.7230769230769231,
"eval_PERSON_f1": 0.81875,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.7705882352941177,
"eval_PERSON_recall": 0.8733333333333333,
"eval_QUANTITY_f1": 0.6585365853658536,
"eval_QUANTITY_number": 33,
"eval_QUANTITY_precision": 0.5510204081632653,
"eval_QUANTITY_recall": 0.8181818181818182,
"eval_TIME_f1": 0.8275862068965518,
"eval_TIME_number": 28,
"eval_TIME_precision": 0.8,
"eval_TIME_recall": 0.8571428571428571,
"eval_loss": 0.16057299077510834,
"eval_overall_accuracy": 0.9468962172647915,
"eval_overall_f1": 0.7529411764705883,
"eval_overall_precision": 0.6889952153110048,
"eval_overall_recall": 0.829971181556196,
"eval_runtime": 0.3295,
"eval_samples_per_second": 567.569,
"eval_steps_per_second": 9.105,
"step": 742
},
{
"epoch": 8.0,
"grad_norm": 0.7265537977218628,
"learning_rate": 4.600000000000001e-05,
"loss": 0.1628,
"step": 848
},
{
"epoch": 8.0,
"eval_LOCATION_f1": 0.7349397590361445,
"eval_LOCATION_number": 71,
"eval_LOCATION_precision": 0.6421052631578947,
"eval_LOCATION_recall": 0.8591549295774648,
"eval_ORGANIZATION_f1": 0.6451612903225806,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.5555555555555556,
"eval_ORGANIZATION_recall": 0.7692307692307693,
"eval_PERSON_f1": 0.8275862068965518,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.7810650887573964,
"eval_PERSON_recall": 0.88,
"eval_QUANTITY_f1": 0.6923076923076923,
"eval_QUANTITY_number": 33,
"eval_QUANTITY_precision": 0.6,
"eval_QUANTITY_recall": 0.8181818181818182,
"eval_TIME_f1": 0.8421052631578947,
"eval_TIME_number": 28,
"eval_TIME_precision": 0.8275862068965517,
"eval_TIME_recall": 0.8571428571428571,
"eval_loss": 0.15270720422267914,
"eval_overall_accuracy": 0.9510184287099903,
"eval_overall_f1": 0.7587096774193549,
"eval_overall_precision": 0.6869158878504673,
"eval_overall_recall": 0.8472622478386167,
"eval_runtime": 0.3291,
"eval_samples_per_second": 568.147,
"eval_steps_per_second": 9.115,
"step": 848
},
{
"epoch": 9.0,
"grad_norm": 1.15663743019104,
"learning_rate": 4.55e-05,
"loss": 0.1528,
"step": 954
},
{
"epoch": 9.0,
"eval_LOCATION_f1": 0.7564102564102564,
"eval_LOCATION_number": 71,
"eval_LOCATION_precision": 0.6941176470588235,
"eval_LOCATION_recall": 0.8309859154929577,
"eval_ORGANIZATION_f1": 0.6351351351351351,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.5662650602409639,
"eval_ORGANIZATION_recall": 0.7230769230769231,
"eval_PERSON_f1": 0.8397435897435898,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.808641975308642,
"eval_PERSON_recall": 0.8733333333333333,
"eval_QUANTITY_f1": 0.7200000000000001,
"eval_QUANTITY_number": 33,
"eval_QUANTITY_precision": 0.6428571428571429,
"eval_QUANTITY_recall": 0.8181818181818182,
"eval_TIME_f1": 0.8771929824561403,
"eval_TIME_number": 28,
"eval_TIME_precision": 0.8620689655172413,
"eval_TIME_recall": 0.8928571428571429,
"eval_loss": 0.14164027571678162,
"eval_overall_accuracy": 0.9522308438409312,
"eval_overall_f1": 0.7727272727272728,
"eval_overall_precision": 0.7206982543640897,
"eval_overall_recall": 0.8328530259365994,
"eval_runtime": 0.3351,
"eval_samples_per_second": 558.073,
"eval_steps_per_second": 8.953,
"step": 954
},
{
"epoch": 10.0,
"grad_norm": 1.8798385858535767,
"learning_rate": 4.5e-05,
"loss": 0.1466,
"step": 1060
},
{
"epoch": 10.0,
"eval_LOCATION_f1": 0.7307692307692307,
"eval_LOCATION_number": 71,
"eval_LOCATION_precision": 0.6705882352941176,
"eval_LOCATION_recall": 0.8028169014084507,
"eval_ORGANIZATION_f1": 0.625,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.569620253164557,
"eval_ORGANIZATION_recall": 0.6923076923076923,
"eval_PERSON_f1": 0.8387096774193549,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.8125,
"eval_PERSON_recall": 0.8666666666666667,
"eval_QUANTITY_f1": 0.736842105263158,
"eval_QUANTITY_number": 33,
"eval_QUANTITY_precision": 0.6511627906976745,
"eval_QUANTITY_recall": 0.8484848484848485,
"eval_TIME_f1": 0.8620689655172413,
"eval_TIME_number": 28,
"eval_TIME_precision": 0.8333333333333334,
"eval_TIME_recall": 0.8928571428571429,
"eval_loss": 0.14073340594768524,
"eval_overall_accuracy": 0.9522308438409312,
"eval_overall_f1": 0.7661290322580645,
"eval_overall_precision": 0.7178841309823678,
"eval_overall_recall": 0.8213256484149856,
"eval_runtime": 0.3345,
"eval_samples_per_second": 559.032,
"eval_steps_per_second": 8.968,
"step": 1060
},
{
"epoch": 11.0,
"grad_norm": 0.9395531415939331,
"learning_rate": 4.4500000000000004e-05,
"loss": 0.138,
"step": 1166
},
{
"epoch": 11.0,
"eval_LOCATION_f1": 0.775,
"eval_LOCATION_number": 71,
"eval_LOCATION_precision": 0.6966292134831461,
"eval_LOCATION_recall": 0.8732394366197183,
"eval_ORGANIZATION_f1": 0.6666666666666666,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.5975609756097561,
"eval_ORGANIZATION_recall": 0.7538461538461538,
"eval_PERSON_f1": 0.8360128617363344,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.8074534161490683,
"eval_PERSON_recall": 0.8666666666666667,
"eval_QUANTITY_f1": 0.736842105263158,
"eval_QUANTITY_number": 33,
"eval_QUANTITY_precision": 0.6511627906976745,
"eval_QUANTITY_recall": 0.8484848484848485,
"eval_TIME_f1": 0.8620689655172413,
"eval_TIME_number": 28,
"eval_TIME_precision": 0.8333333333333334,
"eval_TIME_recall": 0.8928571428571429,
"eval_loss": 0.14058995246887207,
"eval_overall_accuracy": 0.9536857419980601,
"eval_overall_f1": 0.7819148936170213,
"eval_overall_precision": 0.725925925925926,
"eval_overall_recall": 0.8472622478386167,
"eval_runtime": 0.3303,
"eval_samples_per_second": 566.135,
"eval_steps_per_second": 9.082,
"step": 1166
},
{
"epoch": 12.0,
"grad_norm": 1.2153416872024536,
"learning_rate": 4.4000000000000006e-05,
"loss": 0.1314,
"step": 1272
},
{
"epoch": 12.0,
"eval_LOCATION_f1": 0.775,
"eval_LOCATION_number": 71,
"eval_LOCATION_precision": 0.6966292134831461,
"eval_LOCATION_recall": 0.8732394366197183,
"eval_ORGANIZATION_f1": 0.6578947368421053,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.5747126436781609,
"eval_ORGANIZATION_recall": 0.7692307692307693,
"eval_PERSON_f1": 0.8407643312101911,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.8048780487804879,
"eval_PERSON_recall": 0.88,
"eval_QUANTITY_f1": 0.736842105263158,
"eval_QUANTITY_number": 33,
"eval_QUANTITY_precision": 0.6511627906976745,
"eval_QUANTITY_recall": 0.8484848484848485,
"eval_TIME_f1": 0.7999999999999999,
"eval_TIME_number": 28,
"eval_TIME_precision": 0.75,
"eval_TIME_recall": 0.8571428571428571,
"eval_loss": 0.14196860790252686,
"eval_overall_accuracy": 0.953443258971872,
"eval_overall_f1": 0.7769028871391075,
"eval_overall_precision": 0.7132530120481928,
"eval_overall_recall": 0.8530259365994236,
"eval_runtime": 0.3295,
"eval_samples_per_second": 567.586,
"eval_steps_per_second": 9.106,
"step": 1272
},
{
"epoch": 13.0,
"grad_norm": 0.6423377990722656,
"learning_rate": 4.35e-05,
"loss": 0.1285,
"step": 1378
},
{
"epoch": 13.0,
"eval_LOCATION_f1": 0.7261146496815286,
"eval_LOCATION_number": 71,
"eval_LOCATION_precision": 0.6627906976744186,
"eval_LOCATION_recall": 0.8028169014084507,
"eval_ORGANIZATION_f1": 0.6493506493506495,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.5617977528089888,
"eval_ORGANIZATION_recall": 0.7692307692307693,
"eval_PERSON_f1": 0.8461538461538461,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.8148148148148148,
"eval_PERSON_recall": 0.88,
"eval_QUANTITY_f1": 0.7466666666666666,
"eval_QUANTITY_number": 33,
"eval_QUANTITY_precision": 0.6666666666666666,
"eval_QUANTITY_recall": 0.8484848484848485,
"eval_TIME_f1": 0.9090909090909091,
"eval_TIME_number": 28,
"eval_TIME_precision": 0.9259259259259259,
"eval_TIME_recall": 0.8928571428571429,
"eval_loss": 0.13416315615177155,
"eval_overall_accuracy": 0.954898157129001,
"eval_overall_f1": 0.7755644090305446,
"eval_overall_precision": 0.7192118226600985,
"eval_overall_recall": 0.8414985590778098,
"eval_runtime": 0.3353,
"eval_samples_per_second": 557.743,
"eval_steps_per_second": 8.948,
"step": 1378
},
{
"epoch": 14.0,
"grad_norm": 3.325246572494507,
"learning_rate": 4.3e-05,
"loss": 0.1301,
"step": 1484
},
{
"epoch": 14.0,
"eval_LOCATION_f1": 0.7792207792207793,
"eval_LOCATION_number": 71,
"eval_LOCATION_precision": 0.7228915662650602,
"eval_LOCATION_recall": 0.8450704225352113,
"eval_ORGANIZATION_f1": 0.5915492957746479,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.5454545454545454,
"eval_ORGANIZATION_recall": 0.6461538461538462,
"eval_PERSON_f1": 0.8488745980707395,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.8198757763975155,
"eval_PERSON_recall": 0.88,
"eval_QUANTITY_f1": 0.7777777777777778,
"eval_QUANTITY_number": 33,
"eval_QUANTITY_precision": 0.717948717948718,
"eval_QUANTITY_recall": 0.8484848484848485,
"eval_TIME_f1": 0.8620689655172413,
"eval_TIME_number": 28,
"eval_TIME_precision": 0.8333333333333334,
"eval_TIME_recall": 0.8928571428571429,
"eval_loss": 0.12784981727600098,
"eval_overall_accuracy": 0.95635305528613,
"eval_overall_f1": 0.778833107191316,
"eval_overall_precision": 0.735897435897436,
"eval_overall_recall": 0.8270893371757925,
"eval_runtime": 0.3291,
"eval_samples_per_second": 568.237,
"eval_steps_per_second": 9.116,
"step": 1484
},
{
"epoch": 15.0,
"grad_norm": 1.1983723640441895,
"learning_rate": 4.25e-05,
"loss": 0.1197,
"step": 1590
},
{
"epoch": 15.0,
"eval_LOCATION_f1": 0.779874213836478,
"eval_LOCATION_number": 71,
"eval_LOCATION_precision": 0.7045454545454546,
"eval_LOCATION_recall": 0.8732394366197183,
"eval_ORGANIZATION_f1": 0.7012987012987013,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.6067415730337079,
"eval_ORGANIZATION_recall": 0.8307692307692308,
"eval_PERSON_f1": 0.8471337579617835,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.8109756097560976,
"eval_PERSON_recall": 0.8866666666666667,
"eval_QUANTITY_f1": 0.7012987012987013,
"eval_QUANTITY_number": 33,
"eval_QUANTITY_precision": 0.6136363636363636,
"eval_QUANTITY_recall": 0.8181818181818182,
"eval_TIME_f1": 0.8275862068965518,
"eval_TIME_number": 28,
"eval_TIME_precision": 0.8,
"eval_TIME_recall": 0.8571428571428571,
"eval_loss": 0.1395217925310135,
"eval_overall_accuracy": 0.9539282250242483,
"eval_overall_f1": 0.7874015748031495,
"eval_overall_precision": 0.7228915662650602,
"eval_overall_recall": 0.8645533141210374,
"eval_runtime": 0.3284,
"eval_samples_per_second": 569.403,
"eval_steps_per_second": 9.135,
"step": 1590
},
{
"epoch": 16.0,
"grad_norm": 2.9908885955810547,
"learning_rate": 4.2e-05,
"loss": 0.1147,
"step": 1696
},
{
"epoch": 16.0,
"eval_LOCATION_f1": 0.8,
"eval_LOCATION_number": 71,
"eval_LOCATION_precision": 0.7380952380952381,
"eval_LOCATION_recall": 0.8732394366197183,
"eval_ORGANIZATION_f1": 0.6853146853146853,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.6282051282051282,
"eval_ORGANIZATION_recall": 0.7538461538461538,
"eval_PERSON_f1": 0.8461538461538461,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.8148148148148148,
"eval_PERSON_recall": 0.88,
"eval_QUANTITY_f1": 0.7088607594936709,
"eval_QUANTITY_number": 33,
"eval_QUANTITY_precision": 0.6086956521739131,
"eval_QUANTITY_recall": 0.8484848484848485,
"eval_TIME_f1": 0.7999999999999999,
"eval_TIME_number": 28,
"eval_TIME_precision": 0.75,
"eval_TIME_recall": 0.8571428571428571,
"eval_loss": 0.13548891246318817,
"eval_overall_accuracy": 0.9556256062075654,
"eval_overall_f1": 0.787716955941255,
"eval_overall_precision": 0.7338308457711443,
"eval_overall_recall": 0.8501440922190202,
"eval_runtime": 0.3343,
"eval_samples_per_second": 559.383,
"eval_steps_per_second": 8.974,
"step": 1696
},
{
"epoch": 17.0,
"grad_norm": 0.7757030129432678,
"learning_rate": 4.15e-05,
"loss": 0.1134,
"step": 1802
},
{
"epoch": 17.0,
"eval_LOCATION_f1": 0.7922077922077921,
"eval_LOCATION_number": 71,
"eval_LOCATION_precision": 0.7349397590361446,
"eval_LOCATION_recall": 0.8591549295774648,
"eval_ORGANIZATION_f1": 0.6618705035971223,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.6216216216216216,
"eval_ORGANIZATION_recall": 0.7076923076923077,
"eval_PERSON_f1": 0.8498402555910542,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.8159509202453987,
"eval_PERSON_recall": 0.8866666666666667,
"eval_QUANTITY_f1": 0.7105263157894738,
"eval_QUANTITY_number": 33,
"eval_QUANTITY_precision": 0.627906976744186,
"eval_QUANTITY_recall": 0.8181818181818182,
"eval_TIME_f1": 0.8421052631578947,
"eval_TIME_number": 28,
"eval_TIME_precision": 0.8275862068965517,
"eval_TIME_recall": 0.8571428571428571,
"eval_loss": 0.12935349345207214,
"eval_overall_accuracy": 0.95635305528613,
"eval_overall_f1": 0.7875507442489851,
"eval_overall_precision": 0.7423469387755102,
"eval_overall_recall": 0.8386167146974063,
"eval_runtime": 0.3301,
"eval_samples_per_second": 566.53,
"eval_steps_per_second": 9.089,
"step": 1802
},
{
"epoch": 18.0,
"grad_norm": 1.1819586753845215,
"learning_rate": 4.1e-05,
"loss": 0.1103,
"step": 1908
},
{
"epoch": 18.0,
"eval_LOCATION_f1": 0.8,
"eval_LOCATION_number": 71,
"eval_LOCATION_precision": 0.7380952380952381,
"eval_LOCATION_recall": 0.8732394366197183,
"eval_ORGANIZATION_f1": 0.7162162162162162,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.6385542168674698,
"eval_ORGANIZATION_recall": 0.8153846153846154,
"eval_PERSON_f1": 0.8507936507936508,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.8121212121212121,
"eval_PERSON_recall": 0.8933333333333333,
"eval_QUANTITY_f1": 0.736842105263158,
"eval_QUANTITY_number": 33,
"eval_QUANTITY_precision": 0.6511627906976745,
"eval_QUANTITY_recall": 0.8484848484848485,
"eval_TIME_f1": 0.8421052631578947,
"eval_TIME_number": 28,
"eval_TIME_precision": 0.8275862068965517,
"eval_TIME_recall": 0.8571428571428571,
"eval_loss": 0.13496747612953186,
"eval_overall_accuracy": 0.9568380213385063,
"eval_overall_f1": 0.8015978695073236,
"eval_overall_precision": 0.745049504950495,
"eval_overall_recall": 0.8674351585014409,
"eval_runtime": 0.3289,
"eval_samples_per_second": 568.537,
"eval_steps_per_second": 9.121,
"step": 1908
},
{
"epoch": 19.0,
"grad_norm": 1.253257393836975,
"learning_rate": 4.05e-05,
"loss": 0.1078,
"step": 2014
},
{
"epoch": 19.0,
"eval_LOCATION_f1": 0.7973856209150327,
"eval_LOCATION_number": 71,
"eval_LOCATION_precision": 0.7439024390243902,
"eval_LOCATION_recall": 0.8591549295774648,
"eval_ORGANIZATION_f1": 0.7162162162162162,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.6385542168674698,
"eval_ORGANIZATION_recall": 0.8153846153846154,
"eval_PERSON_f1": 0.8498402555910542,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.8159509202453987,
"eval_PERSON_recall": 0.8866666666666667,
"eval_QUANTITY_f1": 0.7200000000000001,
"eval_QUANTITY_number": 33,
"eval_QUANTITY_precision": 0.6428571428571429,
"eval_QUANTITY_recall": 0.8181818181818182,
"eval_TIME_f1": 0.8571428571428571,
"eval_TIME_number": 28,
"eval_TIME_precision": 0.8571428571428571,
"eval_TIME_recall": 0.8571428571428571,
"eval_loss": 0.13079425692558289,
"eval_overall_accuracy": 0.957807953443259,
"eval_overall_f1": 0.7999999999999999,
"eval_overall_precision": 0.7487437185929648,
"eval_overall_recall": 0.8587896253602305,
"eval_runtime": 0.3341,
"eval_samples_per_second": 559.714,
"eval_steps_per_second": 8.979,
"step": 2014
},
{
"epoch": 20.0,
"grad_norm": 1.522292137145996,
"learning_rate": 4e-05,
"loss": 0.1051,
"step": 2120
},
{
"epoch": 20.0,
"eval_LOCATION_f1": 0.7948717948717949,
"eval_LOCATION_number": 71,
"eval_LOCATION_precision": 0.7294117647058823,
"eval_LOCATION_recall": 0.8732394366197183,
"eval_ORGANIZATION_f1": 0.6814814814814816,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.6571428571428571,
"eval_ORGANIZATION_recall": 0.7076923076923077,
"eval_PERSON_f1": 0.858974358974359,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.8271604938271605,
"eval_PERSON_recall": 0.8933333333333333,
"eval_QUANTITY_f1": 0.7777777777777778,
"eval_QUANTITY_number": 33,
"eval_QUANTITY_precision": 0.717948717948718,
"eval_QUANTITY_recall": 0.8484848484848485,
"eval_TIME_f1": 0.8727272727272727,
"eval_TIME_number": 28,
"eval_TIME_precision": 0.8888888888888888,
"eval_TIME_recall": 0.8571428571428571,
"eval_loss": 0.12830358743667603,
"eval_overall_accuracy": 0.9587778855480117,
"eval_overall_f1": 0.8054794520547945,
"eval_overall_precision": 0.7676240208877284,
"eval_overall_recall": 0.8472622478386167,
"eval_runtime": 0.3284,
"eval_samples_per_second": 569.369,
"eval_steps_per_second": 9.134,
"step": 2120
},
{
"epoch": 21.0,
"grad_norm": 1.3046311140060425,
"learning_rate": 3.9500000000000005e-05,
"loss": 0.1013,
"step": 2226
},
{
"epoch": 21.0,
"eval_LOCATION_f1": 0.8,
"eval_LOCATION_number": 71,
"eval_LOCATION_precision": 0.7380952380952381,
"eval_LOCATION_recall": 0.8732394366197183,
"eval_ORGANIZATION_f1": 0.7210884353741497,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.6463414634146342,
"eval_ORGANIZATION_recall": 0.8153846153846154,
"eval_PERSON_f1": 0.8507936507936508,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.8121212121212121,
"eval_PERSON_recall": 0.8933333333333333,
"eval_QUANTITY_f1": 0.736842105263158,
"eval_QUANTITY_number": 33,
"eval_QUANTITY_precision": 0.6511627906976745,
"eval_QUANTITY_recall": 0.8484848484848485,
"eval_TIME_f1": 0.8727272727272727,
"eval_TIME_number": 28,
"eval_TIME_precision": 0.8888888888888888,
"eval_TIME_recall": 0.8571428571428571,
"eval_loss": 0.1330733597278595,
"eval_overall_accuracy": 0.9585354025218235,
"eval_overall_f1": 0.8048128342245989,
"eval_overall_precision": 0.7506234413965087,
"eval_overall_recall": 0.8674351585014409,
"eval_runtime": 0.335,
"eval_samples_per_second": 558.137,
"eval_steps_per_second": 8.954,
"step": 2226
},
{
"epoch": 22.0,
"grad_norm": 1.648231863975525,
"learning_rate": 3.9000000000000006e-05,
"loss": 0.1015,
"step": 2332
},
{
"epoch": 22.0,
"eval_LOCATION_f1": 0.7625,
"eval_LOCATION_number": 71,
"eval_LOCATION_precision": 0.6853932584269663,
"eval_LOCATION_recall": 0.8591549295774648,
"eval_ORGANIZATION_f1": 0.7044025157232704,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.5957446808510638,
"eval_ORGANIZATION_recall": 0.8615384615384616,
"eval_PERSON_f1": 0.8481012658227848,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.8072289156626506,
"eval_PERSON_recall": 0.8933333333333333,
"eval_QUANTITY_f1": 0.736842105263158,
"eval_QUANTITY_number": 33,
"eval_QUANTITY_precision": 0.6511627906976745,
"eval_QUANTITY_recall": 0.8484848484848485,
"eval_TIME_f1": 0.8571428571428571,
"eval_TIME_number": 28,
"eval_TIME_precision": 0.8571428571428571,
"eval_TIME_recall": 0.8571428571428571,
"eval_loss": 0.1461816430091858,
"eval_overall_accuracy": 0.9529582929194956,
"eval_overall_f1": 0.7900912646675358,
"eval_overall_precision": 0.7214285714285714,
"eval_overall_recall": 0.8731988472622478,
"eval_runtime": 0.3294,
"eval_samples_per_second": 567.654,
"eval_steps_per_second": 9.107,
"step": 2332
},
{
"epoch": 23.0,
"grad_norm": 1.236881136894226,
"learning_rate": 3.85e-05,
"loss": 0.0952,
"step": 2438
},
{
"epoch": 23.0,
"eval_LOCATION_f1": 0.8157894736842104,
"eval_LOCATION_number": 71,
"eval_LOCATION_precision": 0.7654320987654321,
"eval_LOCATION_recall": 0.8732394366197183,
"eval_ORGANIZATION_f1": 0.7375886524822695,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.6842105263157895,
"eval_ORGANIZATION_recall": 0.8,
"eval_PERSON_f1": 0.8525641025641025,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.8209876543209876,
"eval_PERSON_recall": 0.8866666666666667,
"eval_QUANTITY_f1": 0.7777777777777778,
"eval_QUANTITY_number": 33,
"eval_QUANTITY_precision": 0.717948717948718,
"eval_QUANTITY_recall": 0.8484848484848485,
"eval_TIME_f1": 0.888888888888889,
"eval_TIME_number": 28,
"eval_TIME_precision": 0.9230769230769231,
"eval_TIME_recall": 0.8571428571428571,
"eval_loss": 0.12616348266601562,
"eval_overall_accuracy": 0.9612027158098934,
"eval_overall_f1": 0.8180574555403557,
"eval_overall_precision": 0.7786458333333334,
"eval_overall_recall": 0.861671469740634,
"eval_runtime": 0.3359,
"eval_samples_per_second": 556.671,
"eval_steps_per_second": 8.931,
"step": 2438
},
{
"epoch": 24.0,
"grad_norm": 1.727121353149414,
"learning_rate": 3.8e-05,
"loss": 0.0957,
"step": 2544
},
{
"epoch": 24.0,
"eval_LOCATION_f1": 0.7870967741935485,
"eval_LOCATION_number": 71,
"eval_LOCATION_precision": 0.7261904761904762,
"eval_LOCATION_recall": 0.8591549295774648,
"eval_ORGANIZATION_f1": 0.7105263157894737,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.6206896551724138,
"eval_ORGANIZATION_recall": 0.8307692307692308,
"eval_PERSON_f1": 0.8454258675078864,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.8023952095808383,
"eval_PERSON_recall": 0.8933333333333333,
"eval_QUANTITY_f1": 0.736842105263158,
"eval_QUANTITY_number": 33,
"eval_QUANTITY_precision": 0.6511627906976745,
"eval_QUANTITY_recall": 0.8484848484848485,
"eval_TIME_f1": 0.8571428571428571,
"eval_TIME_number": 28,
"eval_TIME_precision": 0.8571428571428571,
"eval_TIME_recall": 0.8571428571428571,
"eval_loss": 0.14105214178562164,
"eval_overall_accuracy": 0.9556256062075654,
"eval_overall_f1": 0.7962962962962963,
"eval_overall_precision": 0.7359413202933985,
"eval_overall_recall": 0.8674351585014409,
"eval_runtime": 0.3291,
"eval_samples_per_second": 568.152,
"eval_steps_per_second": 9.115,
"step": 2544
},
{
"epoch": 25.0,
"grad_norm": 1.6316332817077637,
"learning_rate": 3.7500000000000003e-05,
"loss": 0.0913,
"step": 2650
},
{
"epoch": 25.0,
"eval_LOCATION_f1": 0.8104575163398693,
"eval_LOCATION_number": 71,
"eval_LOCATION_precision": 0.7560975609756098,
"eval_LOCATION_recall": 0.8732394366197183,
"eval_ORGANIZATION_f1": 0.7534246575342466,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.6790123456790124,
"eval_ORGANIZATION_recall": 0.8461538461538461,
"eval_PERSON_f1": 0.8544303797468354,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.8132530120481928,
"eval_PERSON_recall": 0.9,
"eval_QUANTITY_f1": 0.7272727272727273,
"eval_QUANTITY_number": 33,
"eval_QUANTITY_precision": 0.6363636363636364,
"eval_QUANTITY_recall": 0.8484848484848485,
"eval_TIME_f1": 0.8421052631578947,
"eval_TIME_number": 28,
"eval_TIME_precision": 0.8275862068965517,
"eval_TIME_recall": 0.8571428571428571,
"eval_loss": 0.13811782002449036,
"eval_overall_accuracy": 0.9582929194956353,
"eval_overall_f1": 0.8117489986648865,
"eval_overall_precision": 0.7562189054726368,
"eval_overall_recall": 0.8760806916426513,
"eval_runtime": 0.3289,
"eval_samples_per_second": 568.489,
"eval_steps_per_second": 9.12,
"step": 2650
},
{
"epoch": 26.0,
"grad_norm": 0.5518941879272461,
"learning_rate": 3.7e-05,
"loss": 0.091,
"step": 2756
},
{
"epoch": 26.0,
"eval_LOCATION_f1": 0.782051282051282,
"eval_LOCATION_number": 71,
"eval_LOCATION_precision": 0.7176470588235294,
"eval_LOCATION_recall": 0.8591549295774648,
"eval_ORGANIZATION_f1": 0.7361111111111112,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.6708860759493671,
"eval_ORGANIZATION_recall": 0.8153846153846154,
"eval_PERSON_f1": 0.8643533123028392,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.8203592814371258,
"eval_PERSON_recall": 0.9133333333333333,
"eval_QUANTITY_f1": 0.7179487179487178,
"eval_QUANTITY_number": 33,
"eval_QUANTITY_precision": 0.6222222222222222,
"eval_QUANTITY_recall": 0.8484848484848485,
"eval_TIME_f1": 0.8727272727272727,
"eval_TIME_number": 28,
"eval_TIME_precision": 0.8888888888888888,
"eval_TIME_recall": 0.8571428571428571,
"eval_loss": 0.13771426677703857,
"eval_overall_accuracy": 0.9575654704170709,
"eval_overall_f1": 0.808,
"eval_overall_precision": 0.7518610421836228,
"eval_overall_recall": 0.8731988472622478,
"eval_runtime": 0.3343,
"eval_samples_per_second": 559.442,
"eval_steps_per_second": 8.975,
"step": 2756
},
{
"epoch": 27.0,
"grad_norm": 1.4636467695236206,
"learning_rate": 3.65e-05,
"loss": 0.0902,
"step": 2862
},
{
"epoch": 27.0,
"eval_LOCATION_f1": 0.7770700636942676,
"eval_LOCATION_number": 71,
"eval_LOCATION_precision": 0.7093023255813954,
"eval_LOCATION_recall": 0.8591549295774648,
"eval_ORGANIZATION_f1": 0.7248322147651007,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.6428571428571429,
"eval_ORGANIZATION_recall": 0.8307692307692308,
"eval_PERSON_f1": 0.8517350157728706,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.8083832335329342,
"eval_PERSON_recall": 0.9,
"eval_QUANTITY_f1": 0.6582278481012658,
"eval_QUANTITY_number": 33,
"eval_QUANTITY_precision": 0.5652173913043478,
"eval_QUANTITY_recall": 0.7878787878787878,
"eval_TIME_f1": 0.8275862068965518,
"eval_TIME_number": 28,
"eval_TIME_precision": 0.8,
"eval_TIME_recall": 0.8571428571428571,
"eval_loss": 0.14399109780788422,
"eval_overall_accuracy": 0.9546556741028128,
"eval_overall_f1": 0.7894736842105263,
"eval_overall_precision": 0.7263922518159807,
"eval_overall_recall": 0.8645533141210374,
"eval_runtime": 0.3358,
"eval_samples_per_second": 556.812,
"eval_steps_per_second": 8.933,
"step": 2862
},
{
"epoch": 28.0,
"grad_norm": 1.3473738431930542,
"learning_rate": 3.6e-05,
"loss": 0.087,
"step": 2968
},
{
"epoch": 28.0,
"eval_LOCATION_f1": 0.794701986754967,
"eval_LOCATION_number": 71,
"eval_LOCATION_precision": 0.75,
"eval_LOCATION_recall": 0.8450704225352113,
"eval_ORGANIZATION_f1": 0.7142857142857143,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.6179775280898876,
"eval_ORGANIZATION_recall": 0.8461538461538461,
"eval_PERSON_f1": 0.8626198083067093,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.8282208588957055,
"eval_PERSON_recall": 0.9,
"eval_QUANTITY_f1": 0.7777777777777778,
"eval_QUANTITY_number": 33,
"eval_QUANTITY_precision": 0.717948717948718,
"eval_QUANTITY_recall": 0.8484848484848485,
"eval_TIME_f1": 0.888888888888889,
"eval_TIME_number": 28,
"eval_TIME_precision": 0.9230769230769231,
"eval_TIME_recall": 0.8571428571428571,
"eval_loss": 0.1355486363172531,
"eval_overall_accuracy": 0.9582929194956353,
"eval_overall_f1": 0.8118279569892473,
"eval_overall_precision": 0.760705289672544,
"eval_overall_recall": 0.8703170028818443,
"eval_runtime": 0.3366,
"eval_samples_per_second": 555.494,
"eval_steps_per_second": 8.912,
"step": 2968
},
{
"epoch": 29.0,
"grad_norm": 0.5319921970367432,
"learning_rate": 3.55e-05,
"loss": 0.0849,
"step": 3074
},
{
"epoch": 29.0,
"eval_LOCATION_f1": 0.7922077922077921,
"eval_LOCATION_number": 71,
"eval_LOCATION_precision": 0.7349397590361446,
"eval_LOCATION_recall": 0.8591549295774648,
"eval_ORGANIZATION_f1": 0.6923076923076923,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.5934065934065934,
"eval_ORGANIZATION_recall": 0.8307692307692308,
"eval_PERSON_f1": 0.8507936507936508,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.8121212121212121,
"eval_PERSON_recall": 0.8933333333333333,
"eval_QUANTITY_f1": 0.7500000000000001,
"eval_QUANTITY_number": 33,
"eval_QUANTITY_precision": 0.6923076923076923,
"eval_QUANTITY_recall": 0.8181818181818182,
"eval_TIME_f1": 0.888888888888889,
"eval_TIME_number": 28,
"eval_TIME_precision": 0.9230769230769231,
"eval_TIME_recall": 0.8571428571428571,
"eval_loss": 0.13350827991962433,
"eval_overall_accuracy": 0.9585354025218235,
"eval_overall_f1": 0.7989347536617842,
"eval_overall_precision": 0.7425742574257426,
"eval_overall_recall": 0.8645533141210374,
"eval_runtime": 0.3368,
"eval_samples_per_second": 555.248,
"eval_steps_per_second": 8.908,
"step": 3074
},
{
"epoch": 30.0,
"grad_norm": 1.0683906078338623,
"learning_rate": 3.5e-05,
"loss": 0.0815,
"step": 3180
},
{
"epoch": 30.0,
"eval_LOCATION_f1": 0.7973856209150327,
"eval_LOCATION_number": 71,
"eval_LOCATION_precision": 0.7439024390243902,
"eval_LOCATION_recall": 0.8591549295774648,
"eval_ORGANIZATION_f1": 0.7310344827586207,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.6625,
"eval_ORGANIZATION_recall": 0.8153846153846154,
"eval_PERSON_f1": 0.8717948717948718,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.8395061728395061,
"eval_PERSON_recall": 0.9066666666666666,
"eval_QUANTITY_f1": 0.7567567567567567,
"eval_QUANTITY_number": 33,
"eval_QUANTITY_precision": 0.6829268292682927,
"eval_QUANTITY_recall": 0.8484848484848485,
"eval_TIME_f1": 0.888888888888889,
"eval_TIME_number": 28,
"eval_TIME_precision": 0.9230769230769231,
"eval_TIME_recall": 0.8571428571428571,
"eval_loss": 0.13375303149223328,
"eval_overall_accuracy": 0.9612027158098934,
"eval_overall_f1": 0.8184281842818427,
"eval_overall_precision": 0.7723785166240409,
"eval_overall_recall": 0.8703170028818443,
"eval_runtime": 0.3368,
"eval_samples_per_second": 555.175,
"eval_steps_per_second": 8.907,
"step": 3180
},
{
"epoch": 31.0,
"grad_norm": 0.8525239825248718,
"learning_rate": 3.45e-05,
"loss": 0.0838,
"step": 3286
},
{
"epoch": 31.0,
"eval_LOCATION_f1": 0.782051282051282,
"eval_LOCATION_number": 71,
"eval_LOCATION_precision": 0.7176470588235294,
"eval_LOCATION_recall": 0.8591549295774648,
"eval_ORGANIZATION_f1": 0.7333333333333334,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.6470588235294118,
"eval_ORGANIZATION_recall": 0.8461538461538461,
"eval_PERSON_f1": 0.8670886075949367,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.8253012048192772,
"eval_PERSON_recall": 0.9133333333333333,
"eval_QUANTITY_f1": 0.7567567567567567,
"eval_QUANTITY_number": 33,
"eval_QUANTITY_precision": 0.6829268292682927,
"eval_QUANTITY_recall": 0.8484848484848485,
"eval_TIME_f1": 0.888888888888889,
"eval_TIME_number": 28,
"eval_TIME_precision": 0.9230769230769231,
"eval_TIME_recall": 0.8571428571428571,
"eval_loss": 0.13723136484622955,
"eval_overall_accuracy": 0.9587778855480117,
"eval_overall_f1": 0.8133333333333335,
"eval_overall_precision": 0.7568238213399504,
"eval_overall_recall": 0.8789625360230547,
"eval_runtime": 0.334,
"eval_samples_per_second": 559.823,
"eval_steps_per_second": 8.981,
"step": 3286
},
{
"epoch": 32.0,
"grad_norm": 1.4616408348083496,
"learning_rate": 3.4000000000000007e-05,
"loss": 0.076,
"step": 3392
},
{
"epoch": 32.0,
"eval_LOCATION_f1": 0.7770700636942676,
"eval_LOCATION_number": 71,
"eval_LOCATION_precision": 0.7093023255813954,
"eval_LOCATION_recall": 0.8591549295774648,
"eval_ORGANIZATION_f1": 0.708860759493671,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.6021505376344086,
"eval_ORGANIZATION_recall": 0.8615384615384616,
"eval_PERSON_f1": 0.8643533123028392,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.8203592814371258,
"eval_PERSON_recall": 0.9133333333333333,
"eval_QUANTITY_f1": 0.7088607594936709,
"eval_QUANTITY_number": 33,
"eval_QUANTITY_precision": 0.6086956521739131,
"eval_QUANTITY_recall": 0.8484848484848485,
"eval_TIME_f1": 0.8727272727272727,
"eval_TIME_number": 28,
"eval_TIME_precision": 0.8888888888888888,
"eval_TIME_recall": 0.8571428571428571,
"eval_loss": 0.1504770815372467,
"eval_overall_accuracy": 0.954898157129001,
"eval_overall_f1": 0.7989556135770235,
"eval_overall_precision": 0.7303102625298329,
"eval_overall_recall": 0.8818443804034583,
"eval_runtime": 0.3282,
"eval_samples_per_second": 569.822,
"eval_steps_per_second": 9.142,
"step": 3392
},
{
"epoch": 33.0,
"grad_norm": 2.1258466243743896,
"learning_rate": 3.35e-05,
"loss": 0.0775,
"step": 3498
},
{
"epoch": 33.0,
"eval_LOCATION_f1": 0.8104575163398693,
"eval_LOCATION_number": 71,
"eval_LOCATION_precision": 0.7560975609756098,
"eval_LOCATION_recall": 0.8732394366197183,
"eval_ORGANIZATION_f1": 0.72992700729927,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.6944444444444444,
"eval_ORGANIZATION_recall": 0.7692307692307693,
"eval_PERSON_f1": 0.8717948717948718,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.8395061728395061,
"eval_PERSON_recall": 0.9066666666666666,
"eval_QUANTITY_f1": 0.8000000000000002,
"eval_QUANTITY_number": 33,
"eval_QUANTITY_precision": 0.7567567567567568,
"eval_QUANTITY_recall": 0.8484848484848485,
"eval_TIME_f1": 0.888888888888889,
"eval_TIME_number": 28,
"eval_TIME_precision": 0.9230769230769231,
"eval_TIME_recall": 0.8571428571428571,
"eval_loss": 0.13078542053699493,
"eval_overall_accuracy": 0.9633850630455868,
"eval_overall_f1": 0.8264462809917356,
"eval_overall_precision": 0.7915567282321899,
"eval_overall_recall": 0.8645533141210374,
"eval_runtime": 0.3348,
"eval_samples_per_second": 558.49,
"eval_steps_per_second": 8.96,
"step": 3498
},
{
"epoch": 34.0,
"grad_norm": 1.6660958528518677,
"learning_rate": 3.3e-05,
"loss": 0.0768,
"step": 3604
},
{
"epoch": 34.0,
"eval_LOCATION_f1": 0.8104575163398693,
"eval_LOCATION_number": 71,
"eval_LOCATION_precision": 0.7560975609756098,
"eval_LOCATION_recall": 0.8732394366197183,
"eval_ORGANIZATION_f1": 0.7516778523489933,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.6666666666666666,
"eval_ORGANIZATION_recall": 0.8615384615384616,
"eval_PERSON_f1": 0.8681672025723473,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.8385093167701864,
"eval_PERSON_recall": 0.9,
"eval_QUANTITY_f1": 0.7777777777777778,
"eval_QUANTITY_number": 33,
"eval_QUANTITY_precision": 0.717948717948718,
"eval_QUANTITY_recall": 0.8484848484848485,
"eval_TIME_f1": 0.888888888888889,
"eval_TIME_number": 28,
"eval_TIME_precision": 0.9230769230769231,
"eval_TIME_recall": 0.8571428571428571,
"eval_loss": 0.13354364037513733,
"eval_overall_accuracy": 0.9612027158098934,
"eval_overall_f1": 0.8254397834912043,
"eval_overall_precision": 0.7780612244897959,
"eval_overall_recall": 0.8789625360230547,
"eval_runtime": 0.3339,
"eval_samples_per_second": 560.029,
"eval_steps_per_second": 8.984,
"step": 3604
},
{
"epoch": 35.0,
"grad_norm": 0.7892407774925232,
"learning_rate": 3.2500000000000004e-05,
"loss": 0.0746,
"step": 3710
},
{
"epoch": 35.0,
"eval_LOCATION_f1": 0.7870967741935485,
"eval_LOCATION_number": 71,
"eval_LOCATION_precision": 0.7261904761904762,
"eval_LOCATION_recall": 0.8591549295774648,
"eval_ORGANIZATION_f1": 0.7549668874172185,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.6627906976744186,
"eval_ORGANIZATION_recall": 0.8769230769230769,
"eval_PERSON_f1": 0.8745980707395499,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.84472049689441,
"eval_PERSON_recall": 0.9066666666666666,
"eval_QUANTITY_f1": 0.7671232876712328,
"eval_QUANTITY_number": 33,
"eval_QUANTITY_precision": 0.7,
"eval_QUANTITY_recall": 0.8484848484848485,
"eval_TIME_f1": 0.888888888888889,
"eval_TIME_number": 28,
"eval_TIME_precision": 0.9230769230769231,
"eval_TIME_recall": 0.8571428571428571,
"eval_loss": 0.1393873244524002,
"eval_overall_accuracy": 0.9587778855480117,
"eval_overall_f1": 0.8225806451612904,
"eval_overall_precision": 0.7707808564231738,
"eval_overall_recall": 0.8818443804034583,
"eval_runtime": 0.3337,
"eval_samples_per_second": 560.376,
"eval_steps_per_second": 8.99,
"step": 3710
},
{
"epoch": 36.0,
"grad_norm": 1.38412344455719,
"learning_rate": 3.2000000000000005e-05,
"loss": 0.0724,
"step": 3816
},
{
"epoch": 36.0,
"eval_LOCATION_f1": 0.7948717948717949,
"eval_LOCATION_number": 71,
"eval_LOCATION_precision": 0.7294117647058823,
"eval_LOCATION_recall": 0.8732394366197183,
"eval_ORGANIZATION_f1": 0.7051282051282052,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.6043956043956044,
"eval_ORGANIZATION_recall": 0.8461538461538461,
"eval_PERSON_f1": 0.8589341692789968,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.8106508875739645,
"eval_PERSON_recall": 0.9133333333333333,
"eval_QUANTITY_f1": 0.8169014084507042,
"eval_QUANTITY_number": 33,
"eval_QUANTITY_precision": 0.7631578947368421,
"eval_QUANTITY_recall": 0.8787878787878788,
"eval_TIME_f1": 0.8727272727272727,
"eval_TIME_number": 28,
"eval_TIME_precision": 0.8888888888888888,
"eval_TIME_recall": 0.8571428571428571,
"eval_loss": 0.14194774627685547,
"eval_overall_accuracy": 0.957807953443259,
"eval_overall_f1": 0.8110964332892999,
"eval_overall_precision": 0.748780487804878,
"eval_overall_recall": 0.8847262247838616,
"eval_runtime": 0.3344,
"eval_samples_per_second": 559.292,
"eval_steps_per_second": 8.973,
"step": 3816
},
{
"epoch": 37.0,
"grad_norm": 1.6571606397628784,
"learning_rate": 3.15e-05,
"loss": 0.0703,
"step": 3922
},
{
"epoch": 37.0,
"eval_LOCATION_f1": 0.7672955974842768,
"eval_LOCATION_number": 71,
"eval_LOCATION_precision": 0.6931818181818182,
"eval_LOCATION_recall": 0.8591549295774648,
"eval_ORGANIZATION_f1": 0.708860759493671,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.6021505376344086,
"eval_ORGANIZATION_recall": 0.8615384615384616,
"eval_PERSON_f1": 0.8698412698412699,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.8303030303030303,
"eval_PERSON_recall": 0.9133333333333333,
"eval_QUANTITY_f1": 0.6923076923076923,
"eval_QUANTITY_number": 33,
"eval_QUANTITY_precision": 0.6,
"eval_QUANTITY_recall": 0.8181818181818182,
"eval_TIME_f1": 0.8727272727272727,
"eval_TIME_number": 28,
"eval_TIME_precision": 0.8888888888888888,
"eval_TIME_recall": 0.8571428571428571,
"eval_loss": 0.15663577616214752,
"eval_overall_accuracy": 0.9517458777885548,
"eval_overall_f1": 0.7973856209150326,
"eval_overall_precision": 0.7296650717703349,
"eval_overall_recall": 0.8789625360230547,
"eval_runtime": 0.3366,
"eval_samples_per_second": 555.525,
"eval_steps_per_second": 8.912,
"step": 3922
},
{
"epoch": 38.0,
"grad_norm": 0.8099401593208313,
"learning_rate": 3.1e-05,
"loss": 0.07,
"step": 4028
},
{
"epoch": 38.0,
"eval_LOCATION_f1": 0.7770700636942676,
"eval_LOCATION_number": 71,
"eval_LOCATION_precision": 0.7093023255813954,
"eval_LOCATION_recall": 0.8591549295774648,
"eval_ORGANIZATION_f1": 0.7432432432432433,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.6626506024096386,
"eval_ORGANIZATION_recall": 0.8461538461538461,
"eval_PERSON_f1": 0.8789808917197452,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.8414634146341463,
"eval_PERSON_recall": 0.92,
"eval_QUANTITY_f1": 0.6835443037974683,
"eval_QUANTITY_number": 33,
"eval_QUANTITY_precision": 0.5869565217391305,
"eval_QUANTITY_recall": 0.8181818181818182,
"eval_TIME_f1": 0.8571428571428571,
"eval_TIME_number": 28,
"eval_TIME_precision": 0.8571428571428571,
"eval_TIME_recall": 0.8571428571428571,
"eval_loss": 0.14580821990966797,
"eval_overall_accuracy": 0.9570805043646945,
"eval_overall_f1": 0.8090185676392573,
"eval_overall_precision": 0.7493857493857494,
"eval_overall_recall": 0.8789625360230547,
"eval_runtime": 0.3346,
"eval_samples_per_second": 558.844,
"eval_steps_per_second": 8.965,
"step": 4028
},
{
"epoch": 39.0,
"grad_norm": 1.7465280294418335,
"learning_rate": 3.05e-05,
"loss": 0.0688,
"step": 4134
},
{
"epoch": 39.0,
"eval_LOCATION_f1": 0.7721518987341772,
"eval_LOCATION_number": 71,
"eval_LOCATION_precision": 0.7011494252873564,
"eval_LOCATION_recall": 0.8591549295774648,
"eval_ORGANIZATION_f1": 0.713375796178344,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.6086956521739131,
"eval_ORGANIZATION_recall": 0.8615384615384616,
"eval_PERSON_f1": 0.8789808917197452,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.8414634146341463,
"eval_PERSON_recall": 0.92,
"eval_QUANTITY_f1": 0.8055555555555556,
"eval_QUANTITY_number": 33,
"eval_QUANTITY_precision": 0.7435897435897436,
"eval_QUANTITY_recall": 0.8787878787878788,
"eval_TIME_f1": 0.888888888888889,
"eval_TIME_number": 28,
"eval_TIME_precision": 0.9230769230769231,
"eval_TIME_recall": 0.8571428571428571,
"eval_loss": 0.14488695561885834,
"eval_overall_accuracy": 0.9582929194956353,
"eval_overall_f1": 0.8158940397350992,
"eval_overall_precision": 0.7549019607843137,
"eval_overall_recall": 0.8876080691642652,
"eval_runtime": 0.3336,
"eval_samples_per_second": 560.471,
"eval_steps_per_second": 8.992,
"step": 4134
},
{
"epoch": 40.0,
"grad_norm": 0.8754693269729614,
"learning_rate": 3e-05,
"loss": 0.0691,
"step": 4240
},
{
"epoch": 40.0,
"eval_LOCATION_f1": 0.8,
"eval_LOCATION_number": 71,
"eval_LOCATION_precision": 0.7380952380952381,
"eval_LOCATION_recall": 0.8732394366197183,
"eval_ORGANIZATION_f1": 0.7448275862068966,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.675,
"eval_ORGANIZATION_recall": 0.8307692307692308,
"eval_PERSON_f1": 0.8789808917197452,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.8414634146341463,
"eval_PERSON_recall": 0.92,
"eval_QUANTITY_f1": 0.7887323943661972,
"eval_QUANTITY_number": 33,
"eval_QUANTITY_precision": 0.7368421052631579,
"eval_QUANTITY_recall": 0.8484848484848485,
"eval_TIME_f1": 0.888888888888889,
"eval_TIME_number": 28,
"eval_TIME_precision": 0.9230769230769231,
"eval_TIME_recall": 0.8571428571428571,
"eval_loss": 0.13563859462738037,
"eval_overall_accuracy": 0.9614451988360815,
"eval_overall_f1": 0.8281461434370772,
"eval_overall_precision": 0.7806122448979592,
"eval_overall_recall": 0.8818443804034583,
"eval_runtime": 0.3295,
"eval_samples_per_second": 567.559,
"eval_steps_per_second": 9.105,
"step": 4240
},
{
"epoch": 41.0,
"grad_norm": 0.3340809941291809,
"learning_rate": 2.95e-05,
"loss": 0.0673,
"step": 4346
},
{
"epoch": 41.0,
"eval_LOCATION_f1": 0.7721518987341772,
"eval_LOCATION_number": 71,
"eval_LOCATION_precision": 0.7011494252873564,
"eval_LOCATION_recall": 0.8591549295774648,
"eval_ORGANIZATION_f1": 0.6962025316455697,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.5913978494623656,
"eval_ORGANIZATION_recall": 0.8461538461538461,
"eval_PERSON_f1": 0.8698412698412699,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.8303030303030303,
"eval_PERSON_recall": 0.9133333333333333,
"eval_QUANTITY_f1": 0.7012987012987013,
"eval_QUANTITY_number": 33,
"eval_QUANTITY_precision": 0.6136363636363636,
"eval_QUANTITY_recall": 0.8181818181818182,
"eval_TIME_f1": 0.8571428571428571,
"eval_TIME_number": 28,
"eval_TIME_precision": 0.8571428571428571,
"eval_TIME_recall": 0.8571428571428571,
"eval_loss": 0.15314164757728577,
"eval_overall_accuracy": 0.9539282250242483,
"eval_overall_f1": 0.7958115183246073,
"eval_overall_precision": 0.7290167865707434,
"eval_overall_recall": 0.8760806916426513,
"eval_runtime": 0.3349,
"eval_samples_per_second": 558.392,
"eval_steps_per_second": 8.958,
"step": 4346
},
{
"epoch": 42.0,
"grad_norm": 0.9933107495307922,
"learning_rate": 2.9e-05,
"loss": 0.0663,
"step": 4452
},
{
"epoch": 42.0,
"eval_LOCATION_f1": 0.8,
"eval_LOCATION_number": 71,
"eval_LOCATION_precision": 0.7380952380952381,
"eval_LOCATION_recall": 0.8732394366197183,
"eval_ORGANIZATION_f1": 0.7320261437908497,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.6363636363636364,
"eval_ORGANIZATION_recall": 0.8615384615384616,
"eval_PERSON_f1": 0.8653846153846153,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.8333333333333334,
"eval_PERSON_recall": 0.9,
"eval_QUANTITY_f1": 0.7466666666666666,
"eval_QUANTITY_number": 33,
"eval_QUANTITY_precision": 0.6666666666666666,
"eval_QUANTITY_recall": 0.8484848484848485,
"eval_TIME_f1": 0.888888888888889,
"eval_TIME_number": 28,
"eval_TIME_precision": 0.9230769230769231,
"eval_TIME_recall": 0.8571428571428571,
"eval_loss": 0.1424974650144577,
"eval_overall_accuracy": 0.9580504364694471,
"eval_overall_f1": 0.8144192256341789,
"eval_overall_precision": 0.7587064676616916,
"eval_overall_recall": 0.8789625360230547,
"eval_runtime": 0.3341,
"eval_samples_per_second": 559.709,
"eval_steps_per_second": 8.979,
"step": 4452
},
{
"epoch": 43.0,
"grad_norm": 0.6678488254547119,
"learning_rate": 2.8499999999999998e-05,
"loss": 0.0639,
"step": 4558
},
{
"epoch": 43.0,
"eval_LOCATION_f1": 0.7948717948717949,
"eval_LOCATION_number": 71,
"eval_LOCATION_precision": 0.7294117647058823,
"eval_LOCATION_recall": 0.8732394366197183,
"eval_ORGANIZATION_f1": 0.7285714285714285,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.68,
"eval_ORGANIZATION_recall": 0.7846153846153846,
"eval_PERSON_f1": 0.8562300319488818,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.8220858895705522,
"eval_PERSON_recall": 0.8933333333333333,
"eval_QUANTITY_f1": 0.7671232876712328,
"eval_QUANTITY_number": 33,
"eval_QUANTITY_precision": 0.7,
"eval_QUANTITY_recall": 0.8484848484848485,
"eval_TIME_f1": 0.8727272727272727,
"eval_TIME_number": 28,
"eval_TIME_precision": 0.8888888888888888,
"eval_TIME_recall": 0.8571428571428571,
"eval_loss": 0.1413319855928421,
"eval_overall_accuracy": 0.9592628516003879,
"eval_overall_f1": 0.8113975576662144,
"eval_overall_precision": 0.7666666666666667,
"eval_overall_recall": 0.861671469740634,
"eval_runtime": 0.3285,
"eval_samples_per_second": 569.242,
"eval_steps_per_second": 9.132,
"step": 4558
},
{
"epoch": 44.0,
"grad_norm": 0.8438284993171692,
"learning_rate": 2.8000000000000003e-05,
"loss": 0.064,
"step": 4664
},
{
"epoch": 44.0,
"eval_LOCATION_f1": 0.8104575163398693,
"eval_LOCATION_number": 71,
"eval_LOCATION_precision": 0.7560975609756098,
"eval_LOCATION_recall": 0.8732394366197183,
"eval_ORGANIZATION_f1": 0.7152317880794703,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.627906976744186,
"eval_ORGANIZATION_recall": 0.8307692307692308,
"eval_PERSON_f1": 0.8698412698412699,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.8303030303030303,
"eval_PERSON_recall": 0.9133333333333333,
"eval_QUANTITY_f1": 0.7777777777777778,
"eval_QUANTITY_number": 33,
"eval_QUANTITY_precision": 0.717948717948718,
"eval_QUANTITY_recall": 0.8484848484848485,
"eval_TIME_f1": 0.888888888888889,
"eval_TIME_number": 28,
"eval_TIME_precision": 0.9230769230769231,
"eval_TIME_recall": 0.8571428571428571,
"eval_loss": 0.14022959768772125,
"eval_overall_accuracy": 0.9604752667313288,
"eval_overall_f1": 0.8187919463087249,
"eval_overall_precision": 0.7663316582914573,
"eval_overall_recall": 0.8789625360230547,
"eval_runtime": 0.3337,
"eval_samples_per_second": 560.437,
"eval_steps_per_second": 8.991,
"step": 4664
},
{
"epoch": 45.0,
"grad_norm": 3.699862241744995,
"learning_rate": 2.7500000000000004e-05,
"loss": 0.0615,
"step": 4770
},
{
"epoch": 45.0,
"eval_LOCATION_f1": 0.7721518987341772,
"eval_LOCATION_number": 71,
"eval_LOCATION_precision": 0.7011494252873564,
"eval_LOCATION_recall": 0.8591549295774648,
"eval_ORGANIZATION_f1": 0.7189542483660131,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.625,
"eval_ORGANIZATION_recall": 0.8461538461538461,
"eval_PERSON_f1": 0.8782051282051282,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.845679012345679,
"eval_PERSON_recall": 0.9133333333333333,
"eval_QUANTITY_f1": 0.6923076923076923,
"eval_QUANTITY_number": 33,
"eval_QUANTITY_precision": 0.6,
"eval_QUANTITY_recall": 0.8181818181818182,
"eval_TIME_f1": 0.8727272727272727,
"eval_TIME_number": 28,
"eval_TIME_precision": 0.8888888888888888,
"eval_TIME_recall": 0.8571428571428571,
"eval_loss": 0.15338602662086487,
"eval_overall_accuracy": 0.9553831231813773,
"eval_overall_f1": 0.8042328042328041,
"eval_overall_precision": 0.7432762836185819,
"eval_overall_recall": 0.8760806916426513,
"eval_runtime": 0.329,
"eval_samples_per_second": 568.326,
"eval_steps_per_second": 9.118,
"step": 4770
},
{
"epoch": 46.0,
"grad_norm": 0.7766585946083069,
"learning_rate": 2.7000000000000002e-05,
"loss": 0.0614,
"step": 4876
},
{
"epoch": 46.0,
"eval_LOCATION_f1": 0.8104575163398693,
"eval_LOCATION_number": 71,
"eval_LOCATION_precision": 0.7560975609756098,
"eval_LOCATION_recall": 0.8732394366197183,
"eval_ORGANIZATION_f1": 0.7236842105263158,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.632183908045977,
"eval_ORGANIZATION_recall": 0.8461538461538461,
"eval_PERSON_f1": 0.8717948717948718,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.8395061728395061,
"eval_PERSON_recall": 0.9066666666666666,
"eval_QUANTITY_f1": 0.7887323943661972,
"eval_QUANTITY_number": 33,
"eval_QUANTITY_precision": 0.7368421052631579,
"eval_QUANTITY_recall": 0.8484848484848485,
"eval_TIME_f1": 0.888888888888889,
"eval_TIME_number": 28,
"eval_TIME_precision": 0.9230769230769231,
"eval_TIME_recall": 0.8571428571428571,
"eval_loss": 0.14268124103546143,
"eval_overall_accuracy": 0.9612027158098934,
"eval_overall_f1": 0.8221024258760108,
"eval_overall_precision": 0.7721518987341772,
"eval_overall_recall": 0.8789625360230547,
"eval_runtime": 0.3343,
"eval_samples_per_second": 559.326,
"eval_steps_per_second": 8.973,
"step": 4876
},
{
"epoch": 47.0,
"grad_norm": 1.664536476135254,
"learning_rate": 2.6500000000000004e-05,
"loss": 0.0595,
"step": 4982
},
{
"epoch": 47.0,
"eval_LOCATION_f1": 0.7924528301886792,
"eval_LOCATION_number": 71,
"eval_LOCATION_precision": 0.7159090909090909,
"eval_LOCATION_recall": 0.8873239436619719,
"eval_ORGANIZATION_f1": 0.7320261437908497,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.6363636363636364,
"eval_ORGANIZATION_recall": 0.8615384615384616,
"eval_PERSON_f1": 0.8761904761904761,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.8363636363636363,
"eval_PERSON_recall": 0.92,
"eval_QUANTITY_f1": 0.7671232876712328,
"eval_QUANTITY_number": 33,
"eval_QUANTITY_precision": 0.7,
"eval_QUANTITY_recall": 0.8484848484848485,
"eval_TIME_f1": 0.8571428571428571,
"eval_TIME_number": 28,
"eval_TIME_precision": 0.8571428571428571,
"eval_TIME_recall": 0.8571428571428571,
"eval_loss": 0.154044508934021,
"eval_overall_accuracy": 0.9573229873908826,
"eval_overall_f1": 0.8174603174603176,
"eval_overall_precision": 0.7555012224938875,
"eval_overall_recall": 0.8904899135446686,
"eval_runtime": 0.3363,
"eval_samples_per_second": 555.98,
"eval_steps_per_second": 8.919,
"step": 4982
},
{
"epoch": 48.0,
"grad_norm": 1.3004956245422363,
"learning_rate": 2.6000000000000002e-05,
"loss": 0.0594,
"step": 5088
},
{
"epoch": 48.0,
"eval_LOCATION_f1": 0.7974683544303797,
"eval_LOCATION_number": 71,
"eval_LOCATION_precision": 0.7241379310344828,
"eval_LOCATION_recall": 0.8873239436619719,
"eval_ORGANIZATION_f1": 0.7189542483660131,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.625,
"eval_ORGANIZATION_recall": 0.8461538461538461,
"eval_PERSON_f1": 0.8690095846645367,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.8343558282208589,
"eval_PERSON_recall": 0.9066666666666666,
"eval_QUANTITY_f1": 0.7837837837837839,
"eval_QUANTITY_number": 33,
"eval_QUANTITY_precision": 0.7073170731707317,
"eval_QUANTITY_recall": 0.8787878787878788,
"eval_TIME_f1": 0.8727272727272727,
"eval_TIME_number": 28,
"eval_TIME_precision": 0.8888888888888888,
"eval_TIME_recall": 0.8571428571428571,
"eval_loss": 0.1491357684135437,
"eval_overall_accuracy": 0.9587778855480117,
"eval_overall_f1": 0.8154050464807437,
"eval_overall_precision": 0.7561576354679803,
"eval_overall_recall": 0.8847262247838616,
"eval_runtime": 0.3302,
"eval_samples_per_second": 566.352,
"eval_steps_per_second": 9.086,
"step": 5088
},
{
"epoch": 49.0,
"grad_norm": 1.524907112121582,
"learning_rate": 2.5500000000000003e-05,
"loss": 0.0579,
"step": 5194
},
{
"epoch": 49.0,
"eval_LOCATION_f1": 0.7974683544303797,
"eval_LOCATION_number": 71,
"eval_LOCATION_precision": 0.7241379310344828,
"eval_LOCATION_recall": 0.8873239436619719,
"eval_ORGANIZATION_f1": 0.697986577181208,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.6190476190476191,
"eval_ORGANIZATION_recall": 0.8,
"eval_PERSON_f1": 0.8726114649681529,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.8353658536585366,
"eval_PERSON_recall": 0.9133333333333333,
"eval_QUANTITY_f1": 0.7466666666666666,
"eval_QUANTITY_number": 33,
"eval_QUANTITY_precision": 0.6666666666666666,
"eval_QUANTITY_recall": 0.8484848484848485,
"eval_TIME_f1": 0.8727272727272727,
"eval_TIME_number": 28,
"eval_TIME_precision": 0.8888888888888888,
"eval_TIME_recall": 0.8571428571428571,
"eval_loss": 0.14881013333797455,
"eval_overall_accuracy": 0.957807953443259,
"eval_overall_f1": 0.8095872170439414,
"eval_overall_precision": 0.7524752475247525,
"eval_overall_recall": 0.8760806916426513,
"eval_runtime": 0.3347,
"eval_samples_per_second": 558.754,
"eval_steps_per_second": 8.964,
"step": 5194
},
{
"epoch": 50.0,
"grad_norm": 1.4106496572494507,
"learning_rate": 2.5e-05,
"loss": 0.0561,
"step": 5300
},
{
"epoch": 50.0,
"eval_LOCATION_f1": 0.8051948051948051,
"eval_LOCATION_number": 71,
"eval_LOCATION_precision": 0.7469879518072289,
"eval_LOCATION_recall": 0.8732394366197183,
"eval_ORGANIZATION_f1": 0.6933333333333334,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.611764705882353,
"eval_ORGANIZATION_recall": 0.8,
"eval_PERSON_f1": 0.8717948717948718,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.8395061728395061,
"eval_PERSON_recall": 0.9066666666666666,
"eval_QUANTITY_f1": 0.7887323943661972,
"eval_QUANTITY_number": 33,
"eval_QUANTITY_precision": 0.7368421052631579,
"eval_QUANTITY_recall": 0.8484848484848485,
"eval_TIME_f1": 0.888888888888889,
"eval_TIME_number": 28,
"eval_TIME_precision": 0.9230769230769231,
"eval_TIME_recall": 0.8571428571428571,
"eval_loss": 0.1435040831565857,
"eval_overall_accuracy": 0.9604752667313288,
"eval_overall_f1": 0.8151147098515519,
"eval_overall_precision": 0.766497461928934,
"eval_overall_recall": 0.8703170028818443,
"eval_runtime": 0.3346,
"eval_samples_per_second": 558.815,
"eval_steps_per_second": 8.965,
"step": 5300
},
{
"epoch": 51.0,
"grad_norm": 0.9782974123954773,
"learning_rate": 2.45e-05,
"loss": 0.056,
"step": 5406
},
{
"epoch": 51.0,
"eval_LOCATION_f1": 0.7924528301886792,
"eval_LOCATION_number": 71,
"eval_LOCATION_precision": 0.7159090909090909,
"eval_LOCATION_recall": 0.8873239436619719,
"eval_ORGANIZATION_f1": 0.6891891891891891,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.6144578313253012,
"eval_ORGANIZATION_recall": 0.7846153846153846,
"eval_PERSON_f1": 0.8670886075949367,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.8253012048192772,
"eval_PERSON_recall": 0.9133333333333333,
"eval_QUANTITY_f1": 0.7777777777777778,
"eval_QUANTITY_number": 33,
"eval_QUANTITY_precision": 0.717948717948718,
"eval_QUANTITY_recall": 0.8484848484848485,
"eval_TIME_f1": 0.8727272727272727,
"eval_TIME_number": 28,
"eval_TIME_precision": 0.8888888888888888,
"eval_TIME_recall": 0.8571428571428571,
"eval_loss": 0.15163768827915192,
"eval_overall_accuracy": 0.9573229873908826,
"eval_overall_f1": 0.808,
"eval_overall_precision": 0.7518610421836228,
"eval_overall_recall": 0.8731988472622478,
"eval_runtime": 0.3285,
"eval_samples_per_second": 569.298,
"eval_steps_per_second": 9.133,
"step": 5406
},
{
"epoch": 52.0,
"grad_norm": 0.8598395586013794,
"learning_rate": 2.4e-05,
"loss": 0.0547,
"step": 5512
},
{
"epoch": 52.0,
"eval_LOCATION_f1": 0.8051948051948051,
"eval_LOCATION_number": 71,
"eval_LOCATION_precision": 0.7469879518072289,
"eval_LOCATION_recall": 0.8732394366197183,
"eval_ORGANIZATION_f1": 0.7019867549668873,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.6162790697674418,
"eval_ORGANIZATION_recall": 0.8153846153846154,
"eval_PERSON_f1": 0.870967741935484,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.84375,
"eval_PERSON_recall": 0.9,
"eval_QUANTITY_f1": 0.7297297297297297,
"eval_QUANTITY_number": 33,
"eval_QUANTITY_precision": 0.6585365853658537,
"eval_QUANTITY_recall": 0.8181818181818182,
"eval_TIME_f1": 0.8727272727272727,
"eval_TIME_number": 28,
"eval_TIME_precision": 0.8888888888888888,
"eval_TIME_recall": 0.8571428571428571,
"eval_loss": 0.15105435252189636,
"eval_overall_accuracy": 0.9587778855480117,
"eval_overall_f1": 0.8091397849462366,
"eval_overall_precision": 0.7581863979848866,
"eval_overall_recall": 0.8674351585014409,
"eval_runtime": 0.3341,
"eval_samples_per_second": 559.773,
"eval_steps_per_second": 8.98,
"step": 5512
},
{
"epoch": 53.0,
"grad_norm": 1.4993176460266113,
"learning_rate": 2.35e-05,
"loss": 0.0534,
"step": 5618
},
{
"epoch": 53.0,
"eval_LOCATION_f1": 0.7974683544303797,
"eval_LOCATION_number": 71,
"eval_LOCATION_precision": 0.7241379310344828,
"eval_LOCATION_recall": 0.8873239436619719,
"eval_ORGANIZATION_f1": 0.713375796178344,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.6086956521739131,
"eval_ORGANIZATION_recall": 0.8615384615384616,
"eval_PERSON_f1": 0.8670886075949367,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.8253012048192772,
"eval_PERSON_recall": 0.9133333333333333,
"eval_QUANTITY_f1": 0.7200000000000001,
"eval_QUANTITY_number": 33,
"eval_QUANTITY_precision": 0.6428571428571429,
"eval_QUANTITY_recall": 0.8181818181818182,
"eval_TIME_f1": 0.8727272727272727,
"eval_TIME_number": 28,
"eval_TIME_precision": 0.8888888888888888,
"eval_TIME_recall": 0.8571428571428571,
"eval_loss": 0.16154761612415314,
"eval_overall_accuracy": 0.9553831231813773,
"eval_overall_f1": 0.8068331143232589,
"eval_overall_precision": 0.7415458937198067,
"eval_overall_recall": 0.8847262247838616,
"eval_runtime": 0.3295,
"eval_samples_per_second": 567.521,
"eval_steps_per_second": 9.105,
"step": 5618
},
{
"epoch": 54.0,
"grad_norm": 1.0407500267028809,
"learning_rate": 2.3000000000000003e-05,
"loss": 0.0526,
"step": 5724
},
{
"epoch": 54.0,
"eval_LOCATION_f1": 0.8,
"eval_LOCATION_number": 71,
"eval_LOCATION_precision": 0.7380952380952381,
"eval_LOCATION_recall": 0.8732394366197183,
"eval_ORGANIZATION_f1": 0.6967741935483871,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.6,
"eval_ORGANIZATION_recall": 0.8307692307692308,
"eval_PERSON_f1": 0.8717948717948718,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.8395061728395061,
"eval_PERSON_recall": 0.9066666666666666,
"eval_QUANTITY_f1": 0.8055555555555556,
"eval_QUANTITY_number": 33,
"eval_QUANTITY_precision": 0.7435897435897436,
"eval_QUANTITY_recall": 0.8787878787878788,
"eval_TIME_f1": 0.888888888888889,
"eval_TIME_number": 28,
"eval_TIME_precision": 0.9230769230769231,
"eval_TIME_recall": 0.8571428571428571,
"eval_loss": 0.15213675796985626,
"eval_overall_accuracy": 0.9580504364694471,
"eval_overall_f1": 0.8155080213903744,
"eval_overall_precision": 0.7605985037406484,
"eval_overall_recall": 0.8789625360230547,
"eval_runtime": 0.3348,
"eval_samples_per_second": 558.56,
"eval_steps_per_second": 8.961,
"step": 5724
},
{
"epoch": 55.0,
"grad_norm": 0.6406387686729431,
"learning_rate": 2.25e-05,
"loss": 0.0538,
"step": 5830
},
{
"epoch": 55.0,
"eval_LOCATION_f1": 0.7875000000000001,
"eval_LOCATION_number": 71,
"eval_LOCATION_precision": 0.7078651685393258,
"eval_LOCATION_recall": 0.8873239436619719,
"eval_ORGANIZATION_f1": 0.7051282051282052,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.6043956043956044,
"eval_ORGANIZATION_recall": 0.8461538461538461,
"eval_PERSON_f1": 0.8717948717948718,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.8395061728395061,
"eval_PERSON_recall": 0.9066666666666666,
"eval_QUANTITY_f1": 0.6923076923076923,
"eval_QUANTITY_number": 33,
"eval_QUANTITY_precision": 0.6,
"eval_QUANTITY_recall": 0.8181818181818182,
"eval_TIME_f1": 0.8727272727272727,
"eval_TIME_number": 28,
"eval_TIME_precision": 0.8888888888888888,
"eval_TIME_recall": 0.8571428571428571,
"eval_loss": 0.15997092425823212,
"eval_overall_accuracy": 0.9551406401551892,
"eval_overall_f1": 0.8015768725361366,
"eval_overall_precision": 0.7367149758454107,
"eval_overall_recall": 0.8789625360230547,
"eval_runtime": 0.3348,
"eval_samples_per_second": 558.524,
"eval_steps_per_second": 8.96,
"step": 5830
},
{
"epoch": 56.0,
"grad_norm": 2.387361526489258,
"learning_rate": 2.2000000000000003e-05,
"loss": 0.0529,
"step": 5936
},
{
"epoch": 56.0,
"eval_LOCATION_f1": 0.7974683544303797,
"eval_LOCATION_number": 71,
"eval_LOCATION_precision": 0.7241379310344828,
"eval_LOCATION_recall": 0.8873239436619719,
"eval_ORGANIZATION_f1": 0.7096774193548387,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.6111111111111112,
"eval_ORGANIZATION_recall": 0.8461538461538461,
"eval_PERSON_f1": 0.8726114649681529,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.8353658536585366,
"eval_PERSON_recall": 0.9133333333333333,
"eval_QUANTITY_f1": 0.7200000000000001,
"eval_QUANTITY_number": 33,
"eval_QUANTITY_precision": 0.6428571428571429,
"eval_QUANTITY_recall": 0.8181818181818182,
"eval_TIME_f1": 0.888888888888889,
"eval_TIME_number": 28,
"eval_TIME_precision": 0.9230769230769231,
"eval_TIME_recall": 0.8571428571428571,
"eval_loss": 0.1578657031059265,
"eval_overall_accuracy": 0.9570805043646945,
"eval_overall_f1": 0.8095238095238096,
"eval_overall_precision": 0.7481662591687042,
"eval_overall_recall": 0.8818443804034583,
"eval_runtime": 0.336,
"eval_samples_per_second": 556.493,
"eval_steps_per_second": 8.928,
"step": 5936
},
{
"epoch": 57.0,
"grad_norm": 1.3003697395324707,
"learning_rate": 2.15e-05,
"loss": 0.05,
"step": 6042
},
{
"epoch": 57.0,
"eval_LOCATION_f1": 0.8,
"eval_LOCATION_number": 71,
"eval_LOCATION_precision": 0.7380952380952381,
"eval_LOCATION_recall": 0.8732394366197183,
"eval_ORGANIZATION_f1": 0.6950354609929077,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.6447368421052632,
"eval_ORGANIZATION_recall": 0.7538461538461538,
"eval_PERSON_f1": 0.8745980707395499,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.84472049689441,
"eval_PERSON_recall": 0.9066666666666666,
"eval_QUANTITY_f1": 0.8055555555555556,
"eval_QUANTITY_number": 33,
"eval_QUANTITY_precision": 0.7435897435897436,
"eval_QUANTITY_recall": 0.8787878787878788,
"eval_TIME_f1": 0.888888888888889,
"eval_TIME_number": 28,
"eval_TIME_precision": 0.9230769230769231,
"eval_TIME_recall": 0.8571428571428571,
"eval_loss": 0.14940249919891357,
"eval_overall_accuracy": 0.9602327837051406,
"eval_overall_f1": 0.8185538881309686,
"eval_overall_precision": 0.7772020725388601,
"eval_overall_recall": 0.8645533141210374,
"eval_runtime": 0.3282,
"eval_samples_per_second": 569.855,
"eval_steps_per_second": 9.142,
"step": 6042
},
{
"epoch": 58.0,
"grad_norm": 0.7399232387542725,
"learning_rate": 2.1e-05,
"loss": 0.0512,
"step": 6148
},
{
"epoch": 58.0,
"eval_LOCATION_f1": 0.7948717948717949,
"eval_LOCATION_number": 71,
"eval_LOCATION_precision": 0.7294117647058823,
"eval_LOCATION_recall": 0.8732394366197183,
"eval_ORGANIZATION_f1": 0.7042253521126761,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.6493506493506493,
"eval_ORGANIZATION_recall": 0.7692307692307693,
"eval_PERSON_f1": 0.8717948717948718,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.8395061728395061,
"eval_PERSON_recall": 0.9066666666666666,
"eval_QUANTITY_f1": 0.7887323943661972,
"eval_QUANTITY_number": 33,
"eval_QUANTITY_precision": 0.7368421052631579,
"eval_QUANTITY_recall": 0.8484848484848485,
"eval_TIME_f1": 0.888888888888889,
"eval_TIME_number": 28,
"eval_TIME_precision": 0.9230769230769231,
"eval_TIME_recall": 0.8571428571428571,
"eval_loss": 0.14740602672100067,
"eval_overall_accuracy": 0.9597478176527643,
"eval_overall_f1": 0.8163265306122449,
"eval_overall_precision": 0.7731958762886598,
"eval_overall_recall": 0.8645533141210374,
"eval_runtime": 0.335,
"eval_samples_per_second": 558.203,
"eval_steps_per_second": 8.955,
"step": 6148
},
{
"epoch": 59.0,
"grad_norm": 1.4280949831008911,
"learning_rate": 2.05e-05,
"loss": 0.047,
"step": 6254
},
{
"epoch": 59.0,
"eval_LOCATION_f1": 0.7848101265822784,
"eval_LOCATION_number": 71,
"eval_LOCATION_precision": 0.7126436781609196,
"eval_LOCATION_recall": 0.8732394366197183,
"eval_ORGANIZATION_f1": 0.7248322147651007,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.6428571428571429,
"eval_ORGANIZATION_recall": 0.8307692307692308,
"eval_PERSON_f1": 0.8782051282051282,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.845679012345679,
"eval_PERSON_recall": 0.9133333333333333,
"eval_QUANTITY_f1": 0.7777777777777778,
"eval_QUANTITY_number": 33,
"eval_QUANTITY_precision": 0.717948717948718,
"eval_QUANTITY_recall": 0.8484848484848485,
"eval_TIME_f1": 0.888888888888889,
"eval_TIME_number": 28,
"eval_TIME_precision": 0.9230769230769231,
"eval_TIME_recall": 0.8571428571428571,
"eval_loss": 0.15319204330444336,
"eval_overall_accuracy": 0.9595053346265762,
"eval_overall_f1": 0.8187919463087249,
"eval_overall_precision": 0.7663316582914573,
"eval_overall_recall": 0.8789625360230547,
"eval_runtime": 0.3345,
"eval_samples_per_second": 558.972,
"eval_steps_per_second": 8.967,
"step": 6254
},
{
"epoch": 60.0,
"grad_norm": 1.479651689529419,
"learning_rate": 2e-05,
"loss": 0.047,
"step": 6360
},
{
"epoch": 60.0,
"eval_LOCATION_f1": 0.7948717948717949,
"eval_LOCATION_number": 71,
"eval_LOCATION_precision": 0.7294117647058823,
"eval_LOCATION_recall": 0.8732394366197183,
"eval_ORGANIZATION_f1": 0.7096774193548387,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.6111111111111112,
"eval_ORGANIZATION_recall": 0.8461538461538461,
"eval_PERSON_f1": 0.870967741935484,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.84375,
"eval_PERSON_recall": 0.9,
"eval_QUANTITY_f1": 0.8169014084507042,
"eval_QUANTITY_number": 33,
"eval_QUANTITY_precision": 0.7631578947368421,
"eval_QUANTITY_recall": 0.8787878787878788,
"eval_TIME_f1": 0.888888888888889,
"eval_TIME_number": 28,
"eval_TIME_precision": 0.9230769230769231,
"eval_TIME_recall": 0.8571428571428571,
"eval_loss": 0.15390989184379578,
"eval_overall_accuracy": 0.9590203685741998,
"eval_overall_f1": 0.8176943699731903,
"eval_overall_precision": 0.7644110275689223,
"eval_overall_recall": 0.8789625360230547,
"eval_runtime": 0.3361,
"eval_samples_per_second": 556.409,
"eval_steps_per_second": 8.926,
"step": 6360
},
{
"epoch": 61.0,
"grad_norm": 0.868341326713562,
"learning_rate": 1.9500000000000003e-05,
"loss": 0.0465,
"step": 6466
},
{
"epoch": 61.0,
"eval_LOCATION_f1": 0.7924528301886792,
"eval_LOCATION_number": 71,
"eval_LOCATION_precision": 0.7159090909090909,
"eval_LOCATION_recall": 0.8873239436619719,
"eval_ORGANIZATION_f1": 0.7105263157894737,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.6206896551724138,
"eval_ORGANIZATION_recall": 0.8307692307692308,
"eval_PERSON_f1": 0.8726114649681529,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.8353658536585366,
"eval_PERSON_recall": 0.9133333333333333,
"eval_QUANTITY_f1": 0.7887323943661972,
"eval_QUANTITY_number": 33,
"eval_QUANTITY_precision": 0.7368421052631579,
"eval_QUANTITY_recall": 0.8484848484848485,
"eval_TIME_f1": 0.888888888888889,
"eval_TIME_number": 28,
"eval_TIME_precision": 0.9230769230769231,
"eval_TIME_recall": 0.8571428571428571,
"eval_loss": 0.15987202525138855,
"eval_overall_accuracy": 0.9585354025218235,
"eval_overall_f1": 0.816,
"eval_overall_precision": 0.7593052109181141,
"eval_overall_recall": 0.8818443804034583,
"eval_runtime": 0.3357,
"eval_samples_per_second": 557.069,
"eval_steps_per_second": 8.937,
"step": 6466
},
{
"epoch": 62.0,
"grad_norm": 1.9663652181625366,
"learning_rate": 1.9e-05,
"loss": 0.045,
"step": 6572
},
{
"epoch": 62.0,
"eval_LOCATION_f1": 0.8,
"eval_LOCATION_number": 71,
"eval_LOCATION_precision": 0.7380952380952381,
"eval_LOCATION_recall": 0.8732394366197183,
"eval_ORGANIZATION_f1": 0.6973684210526315,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.6091954022988506,
"eval_ORGANIZATION_recall": 0.8153846153846154,
"eval_PERSON_f1": 0.8753993610223643,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.8404907975460123,
"eval_PERSON_recall": 0.9133333333333333,
"eval_QUANTITY_f1": 0.8055555555555556,
"eval_QUANTITY_number": 33,
"eval_QUANTITY_precision": 0.7435897435897436,
"eval_QUANTITY_recall": 0.8787878787878788,
"eval_TIME_f1": 0.888888888888889,
"eval_TIME_number": 28,
"eval_TIME_precision": 0.9230769230769231,
"eval_TIME_recall": 0.8571428571428571,
"eval_loss": 0.1569298505783081,
"eval_overall_accuracy": 0.9595053346265762,
"eval_overall_f1": 0.8176943699731903,
"eval_overall_precision": 0.7644110275689223,
"eval_overall_recall": 0.8789625360230547,
"eval_runtime": 0.334,
"eval_samples_per_second": 559.847,
"eval_steps_per_second": 8.982,
"step": 6572
},
{
"epoch": 63.0,
"grad_norm": 4.453447341918945,
"learning_rate": 1.85e-05,
"loss": 0.0468,
"step": 6678
},
{
"epoch": 63.0,
"eval_LOCATION_f1": 0.8104575163398693,
"eval_LOCATION_number": 71,
"eval_LOCATION_precision": 0.7560975609756098,
"eval_LOCATION_recall": 0.8732394366197183,
"eval_ORGANIZATION_f1": 0.7114093959731543,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.6309523809523809,
"eval_ORGANIZATION_recall": 0.8153846153846154,
"eval_PERSON_f1": 0.870967741935484,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.84375,
"eval_PERSON_recall": 0.9,
"eval_QUANTITY_f1": 0.7887323943661972,
"eval_QUANTITY_number": 33,
"eval_QUANTITY_precision": 0.7368421052631579,
"eval_QUANTITY_recall": 0.8484848484848485,
"eval_TIME_f1": 0.888888888888889,
"eval_TIME_number": 28,
"eval_TIME_precision": 0.9230769230769231,
"eval_TIME_recall": 0.8571428571428571,
"eval_loss": 0.1518780142068863,
"eval_overall_accuracy": 0.9612027158098934,
"eval_overall_f1": 0.8195386702849389,
"eval_overall_precision": 0.7743589743589744,
"eval_overall_recall": 0.8703170028818443,
"eval_runtime": 0.3347,
"eval_samples_per_second": 558.764,
"eval_steps_per_second": 8.964,
"step": 6678
},
{
"epoch": 64.0,
"grad_norm": 0.6715424656867981,
"learning_rate": 1.8e-05,
"loss": 0.0446,
"step": 6784
},
{
"epoch": 64.0,
"eval_LOCATION_f1": 0.7922077922077921,
"eval_LOCATION_number": 71,
"eval_LOCATION_precision": 0.7349397590361446,
"eval_LOCATION_recall": 0.8591549295774648,
"eval_ORGANIZATION_f1": 0.7272727272727272,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.6666666666666666,
"eval_ORGANIZATION_recall": 0.8,
"eval_PERSON_f1": 0.8782051282051282,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.845679012345679,
"eval_PERSON_recall": 0.9133333333333333,
"eval_QUANTITY_f1": 0.7605633802816901,
"eval_QUANTITY_number": 33,
"eval_QUANTITY_precision": 0.7105263157894737,
"eval_QUANTITY_recall": 0.8181818181818182,
"eval_TIME_f1": 0.888888888888889,
"eval_TIME_number": 28,
"eval_TIME_precision": 0.9230769230769231,
"eval_TIME_recall": 0.8571428571428571,
"eval_loss": 0.15471045672893524,
"eval_overall_accuracy": 0.9609602327837051,
"eval_overall_f1": 0.8201634877384196,
"eval_overall_precision": 0.7777777777777778,
"eval_overall_recall": 0.8674351585014409,
"eval_runtime": 0.3347,
"eval_samples_per_second": 558.76,
"eval_steps_per_second": 8.964,
"step": 6784
},
{
"epoch": 65.0,
"grad_norm": 1.4069435596466064,
"learning_rate": 1.75e-05,
"loss": 0.0452,
"step": 6890
},
{
"epoch": 65.0,
"eval_LOCATION_f1": 0.7948717948717949,
"eval_LOCATION_number": 71,
"eval_LOCATION_precision": 0.7294117647058823,
"eval_LOCATION_recall": 0.8732394366197183,
"eval_ORGANIZATION_f1": 0.7051282051282052,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.6043956043956044,
"eval_ORGANIZATION_recall": 0.8461538461538461,
"eval_PERSON_f1": 0.8810289389067525,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.8509316770186336,
"eval_PERSON_recall": 0.9133333333333333,
"eval_QUANTITY_f1": 0.7567567567567567,
"eval_QUANTITY_number": 33,
"eval_QUANTITY_precision": 0.6829268292682927,
"eval_QUANTITY_recall": 0.8484848484848485,
"eval_TIME_f1": 0.888888888888889,
"eval_TIME_number": 28,
"eval_TIME_precision": 0.9230769230769231,
"eval_TIME_recall": 0.8571428571428571,
"eval_loss": 0.16312921047210693,
"eval_overall_accuracy": 0.9575654704170709,
"eval_overall_f1": 0.8149134487350199,
"eval_overall_precision": 0.7574257425742574,
"eval_overall_recall": 0.8818443804034583,
"eval_runtime": 0.3337,
"eval_samples_per_second": 560.419,
"eval_steps_per_second": 8.991,
"step": 6890
},
{
"epoch": 66.0,
"grad_norm": 0.9711624383926392,
"learning_rate": 1.7000000000000003e-05,
"loss": 0.0442,
"step": 6996
},
{
"epoch": 66.0,
"eval_LOCATION_f1": 0.7948717948717949,
"eval_LOCATION_number": 71,
"eval_LOCATION_precision": 0.7294117647058823,
"eval_LOCATION_recall": 0.8732394366197183,
"eval_ORGANIZATION_f1": 0.7051282051282052,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.6043956043956044,
"eval_ORGANIZATION_recall": 0.8461538461538461,
"eval_PERSON_f1": 0.8838709677419355,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.85625,
"eval_PERSON_recall": 0.9133333333333333,
"eval_QUANTITY_f1": 0.7837837837837839,
"eval_QUANTITY_number": 33,
"eval_QUANTITY_precision": 0.7073170731707317,
"eval_QUANTITY_recall": 0.8787878787878788,
"eval_TIME_f1": 0.8727272727272727,
"eval_TIME_number": 28,
"eval_TIME_precision": 0.8888888888888888,
"eval_TIME_recall": 0.8571428571428571,
"eval_loss": 0.1615941822528839,
"eval_overall_accuracy": 0.957807953443259,
"eval_overall_f1": 0.8175765645805593,
"eval_overall_precision": 0.7599009900990099,
"eval_overall_recall": 0.8847262247838616,
"eval_runtime": 0.3285,
"eval_samples_per_second": 569.32,
"eval_steps_per_second": 9.133,
"step": 6996
},
{
"epoch": 67.0,
"grad_norm": 0.3948928415775299,
"learning_rate": 1.65e-05,
"loss": 0.0431,
"step": 7102
},
{
"epoch": 67.0,
"eval_LOCATION_f1": 0.7898089171974522,
"eval_LOCATION_number": 71,
"eval_LOCATION_precision": 0.7209302325581395,
"eval_LOCATION_recall": 0.8732394366197183,
"eval_ORGANIZATION_f1": 0.7019867549668873,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.6162790697674418,
"eval_ORGANIZATION_recall": 0.8153846153846154,
"eval_PERSON_f1": 0.8690095846645367,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.8343558282208589,
"eval_PERSON_recall": 0.9066666666666666,
"eval_QUANTITY_f1": 0.7837837837837839,
"eval_QUANTITY_number": 33,
"eval_QUANTITY_precision": 0.7073170731707317,
"eval_QUANTITY_recall": 0.8787878787878788,
"eval_TIME_f1": 0.888888888888889,
"eval_TIME_number": 28,
"eval_TIME_precision": 0.9230769230769231,
"eval_TIME_recall": 0.8571428571428571,
"eval_loss": 0.16082525253295898,
"eval_overall_accuracy": 0.9582929194956353,
"eval_overall_f1": 0.8117489986648865,
"eval_overall_precision": 0.7562189054726368,
"eval_overall_recall": 0.8760806916426513,
"eval_runtime": 0.3338,
"eval_samples_per_second": 560.26,
"eval_steps_per_second": 8.988,
"step": 7102
},
{
"epoch": 68.0,
"grad_norm": 1.975942611694336,
"learning_rate": 1.6000000000000003e-05,
"loss": 0.0427,
"step": 7208
},
{
"epoch": 68.0,
"eval_LOCATION_f1": 0.7924528301886792,
"eval_LOCATION_number": 71,
"eval_LOCATION_precision": 0.7159090909090909,
"eval_LOCATION_recall": 0.8873239436619719,
"eval_ORGANIZATION_f1": 0.7142857142857143,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.6179775280898876,
"eval_ORGANIZATION_recall": 0.8461538461538461,
"eval_PERSON_f1": 0.8690095846645367,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.8343558282208589,
"eval_PERSON_recall": 0.9066666666666666,
"eval_QUANTITY_f1": 0.7012987012987013,
"eval_QUANTITY_number": 33,
"eval_QUANTITY_precision": 0.6136363636363636,
"eval_QUANTITY_recall": 0.8181818181818182,
"eval_TIME_f1": 0.8727272727272727,
"eval_TIME_number": 28,
"eval_TIME_precision": 0.8888888888888888,
"eval_TIME_recall": 0.8571428571428571,
"eval_loss": 0.16873115301132202,
"eval_overall_accuracy": 0.9556256062075654,
"eval_overall_f1": 0.8047493403693932,
"eval_overall_precision": 0.7420924574209246,
"eval_overall_recall": 0.8789625360230547,
"eval_runtime": 0.3298,
"eval_samples_per_second": 567.09,
"eval_steps_per_second": 9.098,
"step": 7208
},
{
"epoch": 69.0,
"grad_norm": 0.47350606322288513,
"learning_rate": 1.55e-05,
"loss": 0.043,
"step": 7314
},
{
"epoch": 69.0,
"eval_LOCATION_f1": 0.7924528301886792,
"eval_LOCATION_number": 71,
"eval_LOCATION_precision": 0.7159090909090909,
"eval_LOCATION_recall": 0.8873239436619719,
"eval_ORGANIZATION_f1": 0.7012987012987013,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.6067415730337079,
"eval_ORGANIZATION_recall": 0.8307692307692308,
"eval_PERSON_f1": 0.8717948717948718,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.8395061728395061,
"eval_PERSON_recall": 0.9066666666666666,
"eval_QUANTITY_f1": 0.7945205479452054,
"eval_QUANTITY_number": 33,
"eval_QUANTITY_precision": 0.725,
"eval_QUANTITY_recall": 0.8787878787878788,
"eval_TIME_f1": 0.888888888888889,
"eval_TIME_number": 28,
"eval_TIME_precision": 0.9230769230769231,
"eval_TIME_recall": 0.8571428571428571,
"eval_loss": 0.16365033388137817,
"eval_overall_accuracy": 0.9573229873908826,
"eval_overall_f1": 0.8138297872340426,
"eval_overall_precision": 0.7555555555555555,
"eval_overall_recall": 0.8818443804034583,
"eval_runtime": 0.3349,
"eval_samples_per_second": 558.297,
"eval_steps_per_second": 8.957,
"step": 7314
},
{
"epoch": 70.0,
"grad_norm": 0.45649945735931396,
"learning_rate": 1.5e-05,
"loss": 0.0426,
"step": 7420
},
{
"epoch": 70.0,
"eval_LOCATION_f1": 0.7974683544303797,
"eval_LOCATION_number": 71,
"eval_LOCATION_precision": 0.7241379310344828,
"eval_LOCATION_recall": 0.8873239436619719,
"eval_ORGANIZATION_f1": 0.7058823529411765,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.6136363636363636,
"eval_ORGANIZATION_recall": 0.8307692307692308,
"eval_PERSON_f1": 0.8717948717948718,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.8395061728395061,
"eval_PERSON_recall": 0.9066666666666666,
"eval_QUANTITY_f1": 0.7945205479452054,
"eval_QUANTITY_number": 33,
"eval_QUANTITY_precision": 0.725,
"eval_QUANTITY_recall": 0.8787878787878788,
"eval_TIME_f1": 0.888888888888889,
"eval_TIME_number": 28,
"eval_TIME_precision": 0.9230769230769231,
"eval_TIME_recall": 0.8571428571428571,
"eval_loss": 0.16292014718055725,
"eval_overall_accuracy": 0.9580504364694471,
"eval_overall_f1": 0.816,
"eval_overall_precision": 0.7593052109181141,
"eval_overall_recall": 0.8818443804034583,
"eval_runtime": 0.3342,
"eval_samples_per_second": 559.604,
"eval_steps_per_second": 8.978,
"step": 7420
},
{
"epoch": 71.0,
"grad_norm": 2.033871650695801,
"learning_rate": 1.45e-05,
"loss": 0.0439,
"step": 7526
},
{
"epoch": 71.0,
"eval_LOCATION_f1": 0.775,
"eval_LOCATION_number": 71,
"eval_LOCATION_precision": 0.6966292134831461,
"eval_LOCATION_recall": 0.8732394366197183,
"eval_ORGANIZATION_f1": 0.7080745341614907,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.59375,
"eval_ORGANIZATION_recall": 0.8769230769230769,
"eval_PERSON_f1": 0.8817891373801918,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.8466257668711656,
"eval_PERSON_recall": 0.92,
"eval_QUANTITY_f1": 0.7631578947368421,
"eval_QUANTITY_number": 33,
"eval_QUANTITY_precision": 0.6744186046511628,
"eval_QUANTITY_recall": 0.8787878787878788,
"eval_TIME_f1": 0.888888888888889,
"eval_TIME_number": 28,
"eval_TIME_precision": 0.9230769230769231,
"eval_TIME_recall": 0.8571428571428571,
"eval_loss": 0.1787422150373459,
"eval_overall_accuracy": 0.9541707080504365,
"eval_overall_f1": 0.81151832460733,
"eval_overall_precision": 0.7434052757793765,
"eval_overall_recall": 0.8933717579250721,
"eval_runtime": 0.3358,
"eval_samples_per_second": 556.823,
"eval_steps_per_second": 8.933,
"step": 7526
},
{
"epoch": 72.0,
"grad_norm": 1.839992642402649,
"learning_rate": 1.4000000000000001e-05,
"loss": 0.0409,
"step": 7632
},
{
"epoch": 72.0,
"eval_LOCATION_f1": 0.7922077922077921,
"eval_LOCATION_number": 71,
"eval_LOCATION_precision": 0.7349397590361446,
"eval_LOCATION_recall": 0.8591549295774648,
"eval_ORGANIZATION_f1": 0.7105263157894737,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.6206896551724138,
"eval_ORGANIZATION_recall": 0.8307692307692308,
"eval_PERSON_f1": 0.8745980707395499,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.84472049689441,
"eval_PERSON_recall": 0.9066666666666666,
"eval_QUANTITY_f1": 0.7945205479452054,
"eval_QUANTITY_number": 33,
"eval_QUANTITY_precision": 0.725,
"eval_QUANTITY_recall": 0.8787878787878788,
"eval_TIME_f1": 0.888888888888889,
"eval_TIME_number": 28,
"eval_TIME_precision": 0.9230769230769231,
"eval_TIME_recall": 0.8571428571428571,
"eval_loss": 0.16144876182079315,
"eval_overall_accuracy": 0.9590203685741998,
"eval_overall_f1": 0.8172043010752689,
"eval_overall_precision": 0.7657430730478589,
"eval_overall_recall": 0.8760806916426513,
"eval_runtime": 0.3288,
"eval_samples_per_second": 568.779,
"eval_steps_per_second": 9.125,
"step": 7632
},
{
"epoch": 73.0,
"grad_norm": 0.7383960485458374,
"learning_rate": 1.3500000000000001e-05,
"loss": 0.0404,
"step": 7738
},
{
"epoch": 73.0,
"eval_LOCATION_f1": 0.7974683544303797,
"eval_LOCATION_number": 71,
"eval_LOCATION_precision": 0.7241379310344828,
"eval_LOCATION_recall": 0.8873239436619719,
"eval_ORGANIZATION_f1": 0.6928104575163399,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.6022727272727273,
"eval_ORGANIZATION_recall": 0.8153846153846154,
"eval_PERSON_f1": 0.8717948717948718,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.8395061728395061,
"eval_PERSON_recall": 0.9066666666666666,
"eval_QUANTITY_f1": 0.7837837837837839,
"eval_QUANTITY_number": 33,
"eval_QUANTITY_precision": 0.7073170731707317,
"eval_QUANTITY_recall": 0.8787878787878788,
"eval_TIME_f1": 0.888888888888889,
"eval_TIME_number": 28,
"eval_TIME_precision": 0.9230769230769231,
"eval_TIME_recall": 0.8571428571428571,
"eval_loss": 0.16545303165912628,
"eval_overall_accuracy": 0.957807953443259,
"eval_overall_f1": 0.8122503328894807,
"eval_overall_precision": 0.754950495049505,
"eval_overall_recall": 0.8789625360230547,
"eval_runtime": 0.3357,
"eval_samples_per_second": 557.128,
"eval_steps_per_second": 8.938,
"step": 7738
},
{
"epoch": 74.0,
"grad_norm": 1.1772239208221436,
"learning_rate": 1.3000000000000001e-05,
"loss": 0.0399,
"step": 7844
},
{
"epoch": 74.0,
"eval_LOCATION_f1": 0.8076923076923077,
"eval_LOCATION_number": 71,
"eval_LOCATION_precision": 0.7411764705882353,
"eval_LOCATION_recall": 0.8873239436619719,
"eval_ORGANIZATION_f1": 0.6883116883116883,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.5955056179775281,
"eval_ORGANIZATION_recall": 0.8153846153846154,
"eval_PERSON_f1": 0.8717948717948718,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.8395061728395061,
"eval_PERSON_recall": 0.9066666666666666,
"eval_QUANTITY_f1": 0.7837837837837839,
"eval_QUANTITY_number": 33,
"eval_QUANTITY_precision": 0.7073170731707317,
"eval_QUANTITY_recall": 0.8787878787878788,
"eval_TIME_f1": 0.888888888888889,
"eval_TIME_number": 28,
"eval_TIME_precision": 0.9230769230769231,
"eval_TIME_recall": 0.8571428571428571,
"eval_loss": 0.16691727936267853,
"eval_overall_accuracy": 0.9585354025218235,
"eval_overall_f1": 0.8133333333333335,
"eval_overall_precision": 0.7568238213399504,
"eval_overall_recall": 0.8789625360230547,
"eval_runtime": 0.3275,
"eval_samples_per_second": 570.978,
"eval_steps_per_second": 9.16,
"step": 7844
},
{
"epoch": 75.0,
"grad_norm": 0.3011506497859955,
"learning_rate": 1.25e-05,
"loss": 0.04,
"step": 7950
},
{
"epoch": 75.0,
"eval_LOCATION_f1": 0.7974683544303797,
"eval_LOCATION_number": 71,
"eval_LOCATION_precision": 0.7241379310344828,
"eval_LOCATION_recall": 0.8873239436619719,
"eval_ORGANIZATION_f1": 0.7105263157894737,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.6206896551724138,
"eval_ORGANIZATION_recall": 0.8307692307692308,
"eval_PERSON_f1": 0.8774193548387097,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.85,
"eval_PERSON_recall": 0.9066666666666666,
"eval_QUANTITY_f1": 0.7837837837837839,
"eval_QUANTITY_number": 33,
"eval_QUANTITY_precision": 0.7073170731707317,
"eval_QUANTITY_recall": 0.8787878787878788,
"eval_TIME_f1": 0.888888888888889,
"eval_TIME_number": 28,
"eval_TIME_precision": 0.9230769230769231,
"eval_TIME_recall": 0.8571428571428571,
"eval_loss": 0.16395699977874756,
"eval_overall_accuracy": 0.9582929194956353,
"eval_overall_f1": 0.8181818181818181,
"eval_overall_precision": 0.7630922693266833,
"eval_overall_recall": 0.8818443804034583,
"eval_runtime": 0.3338,
"eval_samples_per_second": 560.152,
"eval_steps_per_second": 8.986,
"step": 7950
},
{
"epoch": 76.0,
"grad_norm": 1.2410697937011719,
"learning_rate": 1.2e-05,
"loss": 0.0402,
"step": 8056
},
{
"epoch": 76.0,
"eval_LOCATION_f1": 0.7924528301886792,
"eval_LOCATION_number": 71,
"eval_LOCATION_precision": 0.7159090909090909,
"eval_LOCATION_recall": 0.8873239436619719,
"eval_ORGANIZATION_f1": 0.7012987012987013,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.6067415730337079,
"eval_ORGANIZATION_recall": 0.8307692307692308,
"eval_PERSON_f1": 0.8717948717948718,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.8395061728395061,
"eval_PERSON_recall": 0.9066666666666666,
"eval_QUANTITY_f1": 0.7837837837837839,
"eval_QUANTITY_number": 33,
"eval_QUANTITY_precision": 0.7073170731707317,
"eval_QUANTITY_recall": 0.8787878787878788,
"eval_TIME_f1": 0.888888888888889,
"eval_TIME_number": 28,
"eval_TIME_precision": 0.9230769230769231,
"eval_TIME_recall": 0.8571428571428571,
"eval_loss": 0.16832870244979858,
"eval_overall_accuracy": 0.957807953443259,
"eval_overall_f1": 0.8127490039840637,
"eval_overall_precision": 0.7536945812807881,
"eval_overall_recall": 0.8818443804034583,
"eval_runtime": 0.3293,
"eval_samples_per_second": 567.933,
"eval_steps_per_second": 9.111,
"step": 8056
},
{
"epoch": 77.0,
"grad_norm": 1.8908904790878296,
"learning_rate": 1.1500000000000002e-05,
"loss": 0.0402,
"step": 8162
},
{
"epoch": 77.0,
"eval_LOCATION_f1": 0.7875000000000001,
"eval_LOCATION_number": 71,
"eval_LOCATION_precision": 0.7078651685393258,
"eval_LOCATION_recall": 0.8873239436619719,
"eval_ORGANIZATION_f1": 0.7066666666666667,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.6235294117647059,
"eval_ORGANIZATION_recall": 0.8153846153846154,
"eval_PERSON_f1": 0.8690095846645367,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.8343558282208589,
"eval_PERSON_recall": 0.9066666666666666,
"eval_QUANTITY_f1": 0.7567567567567567,
"eval_QUANTITY_number": 33,
"eval_QUANTITY_precision": 0.6829268292682927,
"eval_QUANTITY_recall": 0.8484848484848485,
"eval_TIME_f1": 0.888888888888889,
"eval_TIME_number": 28,
"eval_TIME_precision": 0.9230769230769231,
"eval_TIME_recall": 0.8571428571428571,
"eval_loss": 0.17024052143096924,
"eval_overall_accuracy": 0.9575654704170709,
"eval_overall_f1": 0.8095872170439414,
"eval_overall_precision": 0.7524752475247525,
"eval_overall_recall": 0.8760806916426513,
"eval_runtime": 0.3354,
"eval_samples_per_second": 557.526,
"eval_steps_per_second": 8.944,
"step": 8162
},
{
"epoch": 78.0,
"grad_norm": 0.9162412881851196,
"learning_rate": 1.1000000000000001e-05,
"loss": 0.0379,
"step": 8268
},
{
"epoch": 78.0,
"eval_LOCATION_f1": 0.7924528301886792,
"eval_LOCATION_number": 71,
"eval_LOCATION_precision": 0.7159090909090909,
"eval_LOCATION_recall": 0.8873239436619719,
"eval_ORGANIZATION_f1": 0.6928104575163399,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.6022727272727273,
"eval_ORGANIZATION_recall": 0.8153846153846154,
"eval_PERSON_f1": 0.8653846153846153,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.8333333333333334,
"eval_PERSON_recall": 0.9,
"eval_QUANTITY_f1": 0.7945205479452054,
"eval_QUANTITY_number": 33,
"eval_QUANTITY_precision": 0.725,
"eval_QUANTITY_recall": 0.8787878787878788,
"eval_TIME_f1": 0.888888888888889,
"eval_TIME_number": 28,
"eval_TIME_precision": 0.9230769230769231,
"eval_TIME_recall": 0.8571428571428571,
"eval_loss": 0.16936184465885162,
"eval_overall_accuracy": 0.9582929194956353,
"eval_overall_f1": 0.8095872170439414,
"eval_overall_precision": 0.7524752475247525,
"eval_overall_recall": 0.8760806916426513,
"eval_runtime": 0.3352,
"eval_samples_per_second": 557.918,
"eval_steps_per_second": 8.951,
"step": 8268
},
{
"epoch": 79.0,
"grad_norm": 0.6435752511024475,
"learning_rate": 1.05e-05,
"loss": 0.0371,
"step": 8374
},
{
"epoch": 79.0,
"eval_LOCATION_f1": 0.7924528301886792,
"eval_LOCATION_number": 71,
"eval_LOCATION_precision": 0.7159090909090909,
"eval_LOCATION_recall": 0.8873239436619719,
"eval_ORGANIZATION_f1": 0.6883116883116883,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.5955056179775281,
"eval_ORGANIZATION_recall": 0.8153846153846154,
"eval_PERSON_f1": 0.8810289389067525,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.8509316770186336,
"eval_PERSON_recall": 0.9133333333333333,
"eval_QUANTITY_f1": 0.7567567567567567,
"eval_QUANTITY_number": 33,
"eval_QUANTITY_precision": 0.6829268292682927,
"eval_QUANTITY_recall": 0.8484848484848485,
"eval_TIME_f1": 0.8727272727272727,
"eval_TIME_number": 28,
"eval_TIME_precision": 0.8888888888888888,
"eval_TIME_recall": 0.8571428571428571,
"eval_loss": 0.1731194704771042,
"eval_overall_accuracy": 0.9575654704170709,
"eval_overall_f1": 0.8100929614873836,
"eval_overall_precision": 0.7512315270935961,
"eval_overall_recall": 0.8789625360230547,
"eval_runtime": 0.3345,
"eval_samples_per_second": 559.06,
"eval_steps_per_second": 8.969,
"step": 8374
},
{
"epoch": 80.0,
"grad_norm": 0.5504117608070374,
"learning_rate": 1e-05,
"loss": 0.0375,
"step": 8480
},
{
"epoch": 80.0,
"eval_LOCATION_f1": 0.8025477707006369,
"eval_LOCATION_number": 71,
"eval_LOCATION_precision": 0.7325581395348837,
"eval_LOCATION_recall": 0.8873239436619719,
"eval_ORGANIZATION_f1": 0.6883116883116883,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.5955056179775281,
"eval_ORGANIZATION_recall": 0.8153846153846154,
"eval_PERSON_f1": 0.8810289389067525,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.8509316770186336,
"eval_PERSON_recall": 0.9133333333333333,
"eval_QUANTITY_f1": 0.7671232876712328,
"eval_QUANTITY_number": 33,
"eval_QUANTITY_precision": 0.7,
"eval_QUANTITY_recall": 0.8484848484848485,
"eval_TIME_f1": 0.888888888888889,
"eval_TIME_number": 28,
"eval_TIME_precision": 0.9230769230769231,
"eval_TIME_recall": 0.8571428571428571,
"eval_loss": 0.17014098167419434,
"eval_overall_accuracy": 0.9575654704170709,
"eval_overall_f1": 0.8144192256341789,
"eval_overall_precision": 0.7587064676616916,
"eval_overall_recall": 0.8789625360230547,
"eval_runtime": 0.3343,
"eval_samples_per_second": 559.339,
"eval_steps_per_second": 8.973,
"step": 8480
},
{
"epoch": 81.0,
"grad_norm": 0.46581876277923584,
"learning_rate": 9.5e-06,
"loss": 0.0367,
"step": 8586
},
{
"epoch": 81.0,
"eval_LOCATION_f1": 0.7898089171974522,
"eval_LOCATION_number": 71,
"eval_LOCATION_precision": 0.7209302325581395,
"eval_LOCATION_recall": 0.8732394366197183,
"eval_ORGANIZATION_f1": 0.6883116883116883,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.5955056179775281,
"eval_ORGANIZATION_recall": 0.8153846153846154,
"eval_PERSON_f1": 0.8726114649681529,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.8353658536585366,
"eval_PERSON_recall": 0.9133333333333333,
"eval_QUANTITY_f1": 0.7837837837837839,
"eval_QUANTITY_number": 33,
"eval_QUANTITY_precision": 0.7073170731707317,
"eval_QUANTITY_recall": 0.8787878787878788,
"eval_TIME_f1": 0.888888888888889,
"eval_TIME_number": 28,
"eval_TIME_precision": 0.9230769230769231,
"eval_TIME_recall": 0.8571428571428571,
"eval_loss": 0.16831910610198975,
"eval_overall_accuracy": 0.9575654704170709,
"eval_overall_f1": 0.8100929614873836,
"eval_overall_precision": 0.7512315270935961,
"eval_overall_recall": 0.8789625360230547,
"eval_runtime": 0.3306,
"eval_samples_per_second": 565.697,
"eval_steps_per_second": 9.075,
"step": 8586
},
{
"epoch": 82.0,
"grad_norm": 1.1437621116638184,
"learning_rate": 9e-06,
"loss": 0.0369,
"step": 8692
},
{
"epoch": 82.0,
"eval_LOCATION_f1": 0.7974683544303797,
"eval_LOCATION_number": 71,
"eval_LOCATION_precision": 0.7241379310344828,
"eval_LOCATION_recall": 0.8873239436619719,
"eval_ORGANIZATION_f1": 0.6794871794871795,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.5824175824175825,
"eval_ORGANIZATION_recall": 0.8153846153846154,
"eval_PERSON_f1": 0.8846153846153846,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.8518518518518519,
"eval_PERSON_recall": 0.92,
"eval_QUANTITY_f1": 0.7837837837837839,
"eval_QUANTITY_number": 33,
"eval_QUANTITY_precision": 0.7073170731707317,
"eval_QUANTITY_recall": 0.8787878787878788,
"eval_TIME_f1": 0.8727272727272727,
"eval_TIME_number": 28,
"eval_TIME_precision": 0.8888888888888888,
"eval_TIME_recall": 0.8571428571428571,
"eval_loss": 0.17457380890846252,
"eval_overall_accuracy": 0.9570805043646945,
"eval_overall_f1": 0.8132450331125827,
"eval_overall_precision": 0.7524509803921569,
"eval_overall_recall": 0.8847262247838616,
"eval_runtime": 0.3281,
"eval_samples_per_second": 569.937,
"eval_steps_per_second": 9.143,
"step": 8692
},
{
"epoch": 83.0,
"grad_norm": 1.673567771911621,
"learning_rate": 8.500000000000002e-06,
"loss": 0.0382,
"step": 8798
},
{
"epoch": 83.0,
"eval_LOCATION_f1": 0.7848101265822784,
"eval_LOCATION_number": 71,
"eval_LOCATION_precision": 0.7126436781609196,
"eval_LOCATION_recall": 0.8732394366197183,
"eval_ORGANIZATION_f1": 0.7019867549668873,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.6162790697674418,
"eval_ORGANIZATION_recall": 0.8153846153846154,
"eval_PERSON_f1": 0.8690095846645367,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.8343558282208589,
"eval_PERSON_recall": 0.9066666666666666,
"eval_QUANTITY_f1": 0.7837837837837839,
"eval_QUANTITY_number": 33,
"eval_QUANTITY_precision": 0.7073170731707317,
"eval_QUANTITY_recall": 0.8787878787878788,
"eval_TIME_f1": 0.888888888888889,
"eval_TIME_number": 28,
"eval_TIME_precision": 0.9230769230769231,
"eval_TIME_recall": 0.8571428571428571,
"eval_loss": 0.16617552936077118,
"eval_overall_accuracy": 0.9580504364694471,
"eval_overall_f1": 0.8106666666666668,
"eval_overall_precision": 0.7543424317617866,
"eval_overall_recall": 0.8760806916426513,
"eval_runtime": 0.3288,
"eval_samples_per_second": 568.811,
"eval_steps_per_second": 9.125,
"step": 8798
},
{
"epoch": 84.0,
"grad_norm": 0.8704581260681152,
"learning_rate": 8.000000000000001e-06,
"loss": 0.0376,
"step": 8904
},
{
"epoch": 84.0,
"eval_LOCATION_f1": 0.7974683544303797,
"eval_LOCATION_number": 71,
"eval_LOCATION_precision": 0.7241379310344828,
"eval_LOCATION_recall": 0.8873239436619719,
"eval_ORGANIZATION_f1": 0.6973684210526315,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.6091954022988506,
"eval_ORGANIZATION_recall": 0.8153846153846154,
"eval_PERSON_f1": 0.8782051282051282,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.845679012345679,
"eval_PERSON_recall": 0.9133333333333333,
"eval_QUANTITY_f1": 0.7567567567567567,
"eval_QUANTITY_number": 33,
"eval_QUANTITY_precision": 0.6829268292682927,
"eval_QUANTITY_recall": 0.8484848484848485,
"eval_TIME_f1": 0.888888888888889,
"eval_TIME_number": 28,
"eval_TIME_precision": 0.9230769230769231,
"eval_TIME_recall": 0.8571428571428571,
"eval_loss": 0.16935382783412933,
"eval_overall_accuracy": 0.9582929194956353,
"eval_overall_f1": 0.8133333333333335,
"eval_overall_precision": 0.7568238213399504,
"eval_overall_recall": 0.8789625360230547,
"eval_runtime": 0.3375,
"eval_samples_per_second": 554.036,
"eval_steps_per_second": 8.888,
"step": 8904
},
{
"epoch": 85.0,
"grad_norm": 2.838458299636841,
"learning_rate": 7.5e-06,
"loss": 0.0372,
"step": 9010
},
{
"epoch": 85.0,
"eval_LOCATION_f1": 0.7974683544303797,
"eval_LOCATION_number": 71,
"eval_LOCATION_precision": 0.7241379310344828,
"eval_LOCATION_recall": 0.8873239436619719,
"eval_ORGANIZATION_f1": 0.7006369426751592,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.5978260869565217,
"eval_ORGANIZATION_recall": 0.8461538461538461,
"eval_PERSON_f1": 0.8810289389067525,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.8509316770186336,
"eval_PERSON_recall": 0.9133333333333333,
"eval_QUANTITY_f1": 0.7671232876712328,
"eval_QUANTITY_number": 33,
"eval_QUANTITY_precision": 0.7,
"eval_QUANTITY_recall": 0.8484848484848485,
"eval_TIME_f1": 0.8727272727272727,
"eval_TIME_number": 28,
"eval_TIME_precision": 0.8888888888888888,
"eval_TIME_recall": 0.8571428571428571,
"eval_loss": 0.17407700419425964,
"eval_overall_accuracy": 0.9570805043646945,
"eval_overall_f1": 0.8143236074270557,
"eval_overall_precision": 0.7542997542997543,
"eval_overall_recall": 0.8847262247838616,
"eval_runtime": 0.3278,
"eval_samples_per_second": 570.491,
"eval_steps_per_second": 9.152,
"step": 9010
},
{
"epoch": 86.0,
"grad_norm": 0.5828319191932678,
"learning_rate": 7.000000000000001e-06,
"loss": 0.0351,
"step": 9116
},
{
"epoch": 86.0,
"eval_LOCATION_f1": 0.7924528301886792,
"eval_LOCATION_number": 71,
"eval_LOCATION_precision": 0.7159090909090909,
"eval_LOCATION_recall": 0.8873239436619719,
"eval_ORGANIZATION_f1": 0.6928104575163399,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.6022727272727273,
"eval_ORGANIZATION_recall": 0.8153846153846154,
"eval_PERSON_f1": 0.8745980707395499,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.84472049689441,
"eval_PERSON_recall": 0.9066666666666666,
"eval_QUANTITY_f1": 0.7837837837837839,
"eval_QUANTITY_number": 33,
"eval_QUANTITY_precision": 0.7073170731707317,
"eval_QUANTITY_recall": 0.8787878787878788,
"eval_TIME_f1": 0.8727272727272727,
"eval_TIME_number": 28,
"eval_TIME_precision": 0.8888888888888888,
"eval_TIME_recall": 0.8571428571428571,
"eval_loss": 0.17182248830795288,
"eval_overall_accuracy": 0.957807953443259,
"eval_overall_f1": 0.8111702127659575,
"eval_overall_precision": 0.7530864197530864,
"eval_overall_recall": 0.8789625360230547,
"eval_runtime": 0.3288,
"eval_samples_per_second": 568.789,
"eval_steps_per_second": 9.125,
"step": 9116
},
{
"epoch": 87.0,
"grad_norm": 0.9350789189338684,
"learning_rate": 6.5000000000000004e-06,
"loss": 0.0348,
"step": 9222
},
{
"epoch": 87.0,
"eval_LOCATION_f1": 0.7974683544303797,
"eval_LOCATION_number": 71,
"eval_LOCATION_precision": 0.7241379310344828,
"eval_LOCATION_recall": 0.8873239436619719,
"eval_ORGANIZATION_f1": 0.6838709677419356,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.5888888888888889,
"eval_ORGANIZATION_recall": 0.8153846153846154,
"eval_PERSON_f1": 0.8717948717948718,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.8395061728395061,
"eval_PERSON_recall": 0.9066666666666666,
"eval_QUANTITY_f1": 0.7837837837837839,
"eval_QUANTITY_number": 33,
"eval_QUANTITY_precision": 0.7073170731707317,
"eval_QUANTITY_recall": 0.8787878787878788,
"eval_TIME_f1": 0.888888888888889,
"eval_TIME_number": 28,
"eval_TIME_precision": 0.9230769230769231,
"eval_TIME_recall": 0.8571428571428571,
"eval_loss": 0.17128072679042816,
"eval_overall_accuracy": 0.9580504364694471,
"eval_overall_f1": 0.8100929614873836,
"eval_overall_precision": 0.7512315270935961,
"eval_overall_recall": 0.8789625360230547,
"eval_runtime": 0.3283,
"eval_samples_per_second": 569.617,
"eval_steps_per_second": 9.138,
"step": 9222
},
{
"epoch": 88.0,
"grad_norm": 1.2203199863433838,
"learning_rate": 6e-06,
"loss": 0.0363,
"step": 9328
},
{
"epoch": 88.0,
"eval_LOCATION_f1": 0.7974683544303797,
"eval_LOCATION_number": 71,
"eval_LOCATION_precision": 0.7241379310344828,
"eval_LOCATION_recall": 0.8873239436619719,
"eval_ORGANIZATION_f1": 0.6973684210526315,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.6091954022988506,
"eval_ORGANIZATION_recall": 0.8153846153846154,
"eval_PERSON_f1": 0.8745980707395499,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.84472049689441,
"eval_PERSON_recall": 0.9066666666666666,
"eval_QUANTITY_f1": 0.7837837837837839,
"eval_QUANTITY_number": 33,
"eval_QUANTITY_precision": 0.7073170731707317,
"eval_QUANTITY_recall": 0.8787878787878788,
"eval_TIME_f1": 0.888888888888889,
"eval_TIME_number": 28,
"eval_TIME_precision": 0.9230769230769231,
"eval_TIME_recall": 0.8571428571428571,
"eval_loss": 0.17074672877788544,
"eval_overall_accuracy": 0.9585354025218235,
"eval_overall_f1": 0.8144192256341789,
"eval_overall_precision": 0.7587064676616916,
"eval_overall_recall": 0.8789625360230547,
"eval_runtime": 0.3349,
"eval_samples_per_second": 558.334,
"eval_steps_per_second": 8.957,
"step": 9328
},
{
"epoch": 89.0,
"grad_norm": 0.67624431848526,
"learning_rate": 5.500000000000001e-06,
"loss": 0.0371,
"step": 9434
},
{
"epoch": 89.0,
"eval_LOCATION_f1": 0.7924528301886792,
"eval_LOCATION_number": 71,
"eval_LOCATION_precision": 0.7159090909090909,
"eval_LOCATION_recall": 0.8873239436619719,
"eval_ORGANIZATION_f1": 0.6883116883116883,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.5955056179775281,
"eval_ORGANIZATION_recall": 0.8153846153846154,
"eval_PERSON_f1": 0.8753993610223643,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.8404907975460123,
"eval_PERSON_recall": 0.9133333333333333,
"eval_QUANTITY_f1": 0.7837837837837839,
"eval_QUANTITY_number": 33,
"eval_QUANTITY_precision": 0.7073170731707317,
"eval_QUANTITY_recall": 0.8787878787878788,
"eval_TIME_f1": 0.888888888888889,
"eval_TIME_number": 28,
"eval_TIME_precision": 0.9230769230769231,
"eval_TIME_recall": 0.8571428571428571,
"eval_loss": 0.17176063358783722,
"eval_overall_accuracy": 0.9575654704170709,
"eval_overall_f1": 0.8116710875331565,
"eval_overall_precision": 0.7518427518427518,
"eval_overall_recall": 0.8818443804034583,
"eval_runtime": 0.3296,
"eval_samples_per_second": 567.418,
"eval_steps_per_second": 9.103,
"step": 9434
},
{
"epoch": 90.0,
"grad_norm": 1.9259661436080933,
"learning_rate": 5e-06,
"loss": 0.0367,
"step": 9540
},
{
"epoch": 90.0,
"eval_LOCATION_f1": 0.8025477707006369,
"eval_LOCATION_number": 71,
"eval_LOCATION_precision": 0.7325581395348837,
"eval_LOCATION_recall": 0.8873239436619719,
"eval_ORGANIZATION_f1": 0.6973684210526315,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.6091954022988506,
"eval_ORGANIZATION_recall": 0.8153846153846154,
"eval_PERSON_f1": 0.887459807073955,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.8571428571428571,
"eval_PERSON_recall": 0.92,
"eval_QUANTITY_f1": 0.7837837837837839,
"eval_QUANTITY_number": 33,
"eval_QUANTITY_precision": 0.7073170731707317,
"eval_QUANTITY_recall": 0.8787878787878788,
"eval_TIME_f1": 0.888888888888889,
"eval_TIME_number": 28,
"eval_TIME_precision": 0.9230769230769231,
"eval_TIME_recall": 0.8571428571428571,
"eval_loss": 0.17073224484920502,
"eval_overall_accuracy": 0.9590203685741998,
"eval_overall_f1": 0.820855614973262,
"eval_overall_precision": 0.7655860349127181,
"eval_overall_recall": 0.8847262247838616,
"eval_runtime": 0.3289,
"eval_samples_per_second": 568.538,
"eval_steps_per_second": 9.121,
"step": 9540
},
{
"epoch": 91.0,
"grad_norm": 0.5366353392601013,
"learning_rate": 4.5e-06,
"loss": 0.0349,
"step": 9646
},
{
"epoch": 91.0,
"eval_LOCATION_f1": 0.7974683544303797,
"eval_LOCATION_number": 71,
"eval_LOCATION_precision": 0.7241379310344828,
"eval_LOCATION_recall": 0.8873239436619719,
"eval_ORGANIZATION_f1": 0.7096774193548387,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.6111111111111112,
"eval_ORGANIZATION_recall": 0.8461538461538461,
"eval_PERSON_f1": 0.8717948717948718,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.8395061728395061,
"eval_PERSON_recall": 0.9066666666666666,
"eval_QUANTITY_f1": 0.7837837837837839,
"eval_QUANTITY_number": 33,
"eval_QUANTITY_precision": 0.7073170731707317,
"eval_QUANTITY_recall": 0.8787878787878788,
"eval_TIME_f1": 0.888888888888889,
"eval_TIME_number": 28,
"eval_TIME_precision": 0.9230769230769231,
"eval_TIME_recall": 0.8571428571428571,
"eval_loss": 0.17369931936264038,
"eval_overall_accuracy": 0.957807953443259,
"eval_overall_f1": 0.8154050464807437,
"eval_overall_precision": 0.7561576354679803,
"eval_overall_recall": 0.8847262247838616,
"eval_runtime": 0.3356,
"eval_samples_per_second": 557.153,
"eval_steps_per_second": 8.938,
"step": 9646
},
{
"epoch": 92.0,
"grad_norm": 0.7619331479072571,
"learning_rate": 4.000000000000001e-06,
"loss": 0.0357,
"step": 9752
},
{
"epoch": 92.0,
"eval_LOCATION_f1": 0.8025477707006369,
"eval_LOCATION_number": 71,
"eval_LOCATION_precision": 0.7325581395348837,
"eval_LOCATION_recall": 0.8873239436619719,
"eval_ORGANIZATION_f1": 0.7066666666666667,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.6235294117647059,
"eval_ORGANIZATION_recall": 0.8153846153846154,
"eval_PERSON_f1": 0.8782051282051282,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.845679012345679,
"eval_PERSON_recall": 0.9133333333333333,
"eval_QUANTITY_f1": 0.7837837837837839,
"eval_QUANTITY_number": 33,
"eval_QUANTITY_precision": 0.7073170731707317,
"eval_QUANTITY_recall": 0.8787878787878788,
"eval_TIME_f1": 0.888888888888889,
"eval_TIME_number": 28,
"eval_TIME_precision": 0.9230769230769231,
"eval_TIME_recall": 0.8571428571428571,
"eval_loss": 0.16904906928539276,
"eval_overall_accuracy": 0.9590203685741998,
"eval_overall_f1": 0.8192771084337349,
"eval_overall_precision": 0.765,
"eval_overall_recall": 0.8818443804034583,
"eval_runtime": 0.3298,
"eval_samples_per_second": 567.039,
"eval_steps_per_second": 9.097,
"step": 9752
},
{
"epoch": 93.0,
"grad_norm": 0.7772564888000488,
"learning_rate": 3.5000000000000004e-06,
"loss": 0.0345,
"step": 9858
},
{
"epoch": 93.0,
"eval_LOCATION_f1": 0.7974683544303797,
"eval_LOCATION_number": 71,
"eval_LOCATION_precision": 0.7241379310344828,
"eval_LOCATION_recall": 0.8873239436619719,
"eval_ORGANIZATION_f1": 0.7019867549668873,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.6162790697674418,
"eval_ORGANIZATION_recall": 0.8153846153846154,
"eval_PERSON_f1": 0.8782051282051282,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.845679012345679,
"eval_PERSON_recall": 0.9133333333333333,
"eval_QUANTITY_f1": 0.7837837837837839,
"eval_QUANTITY_number": 33,
"eval_QUANTITY_precision": 0.7073170731707317,
"eval_QUANTITY_recall": 0.8787878787878788,
"eval_TIME_f1": 0.888888888888889,
"eval_TIME_number": 28,
"eval_TIME_precision": 0.9230769230769231,
"eval_TIME_recall": 0.8571428571428571,
"eval_loss": 0.17138922214508057,
"eval_overall_accuracy": 0.9585354025218235,
"eval_overall_f1": 0.8170894526034712,
"eval_overall_precision": 0.7611940298507462,
"eval_overall_recall": 0.8818443804034583,
"eval_runtime": 0.3291,
"eval_samples_per_second": 568.133,
"eval_steps_per_second": 9.114,
"step": 9858
},
{
"epoch": 94.0,
"grad_norm": 1.5932378768920898,
"learning_rate": 3e-06,
"loss": 0.0349,
"step": 9964
},
{
"epoch": 94.0,
"eval_LOCATION_f1": 0.7974683544303797,
"eval_LOCATION_number": 71,
"eval_LOCATION_precision": 0.7241379310344828,
"eval_LOCATION_recall": 0.8873239436619719,
"eval_ORGANIZATION_f1": 0.6838709677419356,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.5888888888888889,
"eval_ORGANIZATION_recall": 0.8153846153846154,
"eval_PERSON_f1": 0.8810289389067525,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.8509316770186336,
"eval_PERSON_recall": 0.9133333333333333,
"eval_QUANTITY_f1": 0.7837837837837839,
"eval_QUANTITY_number": 33,
"eval_QUANTITY_precision": 0.7073170731707317,
"eval_QUANTITY_recall": 0.8787878787878788,
"eval_TIME_f1": 0.888888888888889,
"eval_TIME_number": 28,
"eval_TIME_precision": 0.9230769230769231,
"eval_TIME_recall": 0.8571428571428571,
"eval_loss": 0.1765890270471573,
"eval_overall_accuracy": 0.9575654704170709,
"eval_overall_f1": 0.8138297872340426,
"eval_overall_precision": 0.7555555555555555,
"eval_overall_recall": 0.8818443804034583,
"eval_runtime": 0.3307,
"eval_samples_per_second": 565.487,
"eval_steps_per_second": 9.072,
"step": 9964
},
{
"epoch": 95.0,
"grad_norm": 0.8269696235656738,
"learning_rate": 2.5e-06,
"loss": 0.0352,
"step": 10070
},
{
"epoch": 95.0,
"eval_LOCATION_f1": 0.7974683544303797,
"eval_LOCATION_number": 71,
"eval_LOCATION_precision": 0.7241379310344828,
"eval_LOCATION_recall": 0.8873239436619719,
"eval_ORGANIZATION_f1": 0.6838709677419356,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.5888888888888889,
"eval_ORGANIZATION_recall": 0.8153846153846154,
"eval_PERSON_f1": 0.8810289389067525,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.8509316770186336,
"eval_PERSON_recall": 0.9133333333333333,
"eval_QUANTITY_f1": 0.7837837837837839,
"eval_QUANTITY_number": 33,
"eval_QUANTITY_precision": 0.7073170731707317,
"eval_QUANTITY_recall": 0.8787878787878788,
"eval_TIME_f1": 0.8727272727272727,
"eval_TIME_number": 28,
"eval_TIME_precision": 0.8888888888888888,
"eval_TIME_recall": 0.8571428571428571,
"eval_loss": 0.17644113302230835,
"eval_overall_accuracy": 0.9575654704170709,
"eval_overall_f1": 0.8127490039840637,
"eval_overall_precision": 0.7536945812807881,
"eval_overall_recall": 0.8818443804034583,
"eval_runtime": 0.3354,
"eval_samples_per_second": 557.581,
"eval_steps_per_second": 8.945,
"step": 10070
},
{
"epoch": 96.0,
"grad_norm": 1.2851319313049316,
"learning_rate": 2.0000000000000003e-06,
"loss": 0.0367,
"step": 10176
},
{
"epoch": 96.0,
"eval_LOCATION_f1": 0.7974683544303797,
"eval_LOCATION_number": 71,
"eval_LOCATION_precision": 0.7241379310344828,
"eval_LOCATION_recall": 0.8873239436619719,
"eval_ORGANIZATION_f1": 0.6973684210526315,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.6091954022988506,
"eval_ORGANIZATION_recall": 0.8153846153846154,
"eval_PERSON_f1": 0.8782051282051282,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.845679012345679,
"eval_PERSON_recall": 0.9133333333333333,
"eval_QUANTITY_f1": 0.7837837837837839,
"eval_QUANTITY_number": 33,
"eval_QUANTITY_precision": 0.7073170731707317,
"eval_QUANTITY_recall": 0.8787878787878788,
"eval_TIME_f1": 0.888888888888889,
"eval_TIME_number": 28,
"eval_TIME_precision": 0.9230769230769231,
"eval_TIME_recall": 0.8571428571428571,
"eval_loss": 0.17299894988536835,
"eval_overall_accuracy": 0.9582929194956353,
"eval_overall_f1": 0.816,
"eval_overall_precision": 0.7593052109181141,
"eval_overall_recall": 0.8818443804034583,
"eval_runtime": 0.3376,
"eval_samples_per_second": 553.982,
"eval_steps_per_second": 8.887,
"step": 10176
},
{
"epoch": 97.0,
"grad_norm": 1.469909906387329,
"learning_rate": 1.5e-06,
"loss": 0.0352,
"step": 10282
},
{
"epoch": 97.0,
"eval_LOCATION_f1": 0.7974683544303797,
"eval_LOCATION_number": 71,
"eval_LOCATION_precision": 0.7241379310344828,
"eval_LOCATION_recall": 0.8873239436619719,
"eval_ORGANIZATION_f1": 0.6928104575163399,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.6022727272727273,
"eval_ORGANIZATION_recall": 0.8153846153846154,
"eval_PERSON_f1": 0.8838709677419355,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.85625,
"eval_PERSON_recall": 0.9133333333333333,
"eval_QUANTITY_f1": 0.7837837837837839,
"eval_QUANTITY_number": 33,
"eval_QUANTITY_precision": 0.7073170731707317,
"eval_QUANTITY_recall": 0.8787878787878788,
"eval_TIME_f1": 0.888888888888889,
"eval_TIME_number": 28,
"eval_TIME_precision": 0.9230769230769231,
"eval_TIME_recall": 0.8571428571428571,
"eval_loss": 0.1724460870027542,
"eval_overall_accuracy": 0.9580504364694471,
"eval_overall_f1": 0.8170894526034712,
"eval_overall_precision": 0.7611940298507462,
"eval_overall_recall": 0.8818443804034583,
"eval_runtime": 0.3347,
"eval_samples_per_second": 558.712,
"eval_steps_per_second": 8.963,
"step": 10282
},
{
"epoch": 98.0,
"grad_norm": 0.9896478652954102,
"learning_rate": 1.0000000000000002e-06,
"loss": 0.0341,
"step": 10388
},
{
"epoch": 98.0,
"eval_LOCATION_f1": 0.7974683544303797,
"eval_LOCATION_number": 71,
"eval_LOCATION_precision": 0.7241379310344828,
"eval_LOCATION_recall": 0.8873239436619719,
"eval_ORGANIZATION_f1": 0.6794871794871795,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.5824175824175825,
"eval_ORGANIZATION_recall": 0.8153846153846154,
"eval_PERSON_f1": 0.8745980707395499,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.84472049689441,
"eval_PERSON_recall": 0.9066666666666666,
"eval_QUANTITY_f1": 0.7837837837837839,
"eval_QUANTITY_number": 33,
"eval_QUANTITY_precision": 0.7073170731707317,
"eval_QUANTITY_recall": 0.8787878787878788,
"eval_TIME_f1": 0.888888888888889,
"eval_TIME_number": 28,
"eval_TIME_precision": 0.9230769230769231,
"eval_TIME_recall": 0.8571428571428571,
"eval_loss": 0.1747630089521408,
"eval_overall_accuracy": 0.9570805043646945,
"eval_overall_f1": 0.8100929614873836,
"eval_overall_precision": 0.7512315270935961,
"eval_overall_recall": 0.8789625360230547,
"eval_runtime": 0.3294,
"eval_samples_per_second": 567.729,
"eval_steps_per_second": 9.108,
"step": 10388
},
{
"epoch": 99.0,
"grad_norm": 1.395708441734314,
"learning_rate": 5.000000000000001e-07,
"loss": 0.0331,
"step": 10494
},
{
"epoch": 99.0,
"eval_LOCATION_f1": 0.7974683544303797,
"eval_LOCATION_number": 71,
"eval_LOCATION_precision": 0.7241379310344828,
"eval_LOCATION_recall": 0.8873239436619719,
"eval_ORGANIZATION_f1": 0.6928104575163399,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.6022727272727273,
"eval_ORGANIZATION_recall": 0.8153846153846154,
"eval_PERSON_f1": 0.8745980707395499,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.84472049689441,
"eval_PERSON_recall": 0.9066666666666666,
"eval_QUANTITY_f1": 0.7837837837837839,
"eval_QUANTITY_number": 33,
"eval_QUANTITY_precision": 0.7073170731707317,
"eval_QUANTITY_recall": 0.8787878787878788,
"eval_TIME_f1": 0.888888888888889,
"eval_TIME_number": 28,
"eval_TIME_precision": 0.9230769230769231,
"eval_TIME_recall": 0.8571428571428571,
"eval_loss": 0.17256887257099152,
"eval_overall_accuracy": 0.9580504364694471,
"eval_overall_f1": 0.8133333333333335,
"eval_overall_precision": 0.7568238213399504,
"eval_overall_recall": 0.8789625360230547,
"eval_runtime": 0.3298,
"eval_samples_per_second": 567.096,
"eval_steps_per_second": 9.098,
"step": 10494
},
{
"epoch": 100.0,
"grad_norm": 0.4935811758041382,
"learning_rate": 0.0,
"loss": 0.0347,
"step": 10600
},
{
"epoch": 100.0,
"eval_LOCATION_f1": 0.7974683544303797,
"eval_LOCATION_number": 71,
"eval_LOCATION_precision": 0.7241379310344828,
"eval_LOCATION_recall": 0.8873239436619719,
"eval_ORGANIZATION_f1": 0.6928104575163399,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.6022727272727273,
"eval_ORGANIZATION_recall": 0.8153846153846154,
"eval_PERSON_f1": 0.8745980707395499,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.84472049689441,
"eval_PERSON_recall": 0.9066666666666666,
"eval_QUANTITY_f1": 0.7837837837837839,
"eval_QUANTITY_number": 33,
"eval_QUANTITY_precision": 0.7073170731707317,
"eval_QUANTITY_recall": 0.8787878787878788,
"eval_TIME_f1": 0.888888888888889,
"eval_TIME_number": 28,
"eval_TIME_precision": 0.9230769230769231,
"eval_TIME_recall": 0.8571428571428571,
"eval_loss": 0.17283295094966888,
"eval_overall_accuracy": 0.9580504364694471,
"eval_overall_f1": 0.8133333333333335,
"eval_overall_precision": 0.7568238213399504,
"eval_overall_recall": 0.8789625360230547,
"eval_runtime": 0.33,
"eval_samples_per_second": 566.66,
"eval_steps_per_second": 9.091,
"step": 10600
},
{
"epoch": 100.0,
"step": 10600,
"total_flos": 4639858441347408.0,
"train_loss": 0.08816910017211482,
"train_runtime": 595.5845,
"train_samples_per_second": 283.419,
"train_steps_per_second": 17.798
}
],
"logging_steps": 500,
"max_steps": 10600,
"num_input_tokens_seen": 0,
"num_train_epochs": 100,
"save_steps": 500,
"total_flos": 4639858441347408.0,
"train_batch_size": 16,
"trial_name": null,
"trial_params": null
}