nerugm-pt-pl30-3 / trainer_state.json
apwic's picture
End of training
fab52a0 verified
raw
history blame
144 kB
{
"best_metric": null,
"best_model_checkpoint": null,
"epoch": 100.0,
"eval_steps": 500,
"global_step": 10600,
"is_hyper_param_search": false,
"is_local_process_zero": true,
"is_world_process_zero": true,
"log_history": [
{
"epoch": 1.0,
"grad_norm": 2.5185272693634033,
"learning_rate": 4.9500000000000004e-05,
"loss": 0.9922,
"step": 106
},
{
"epoch": 1.0,
"eval_LOCATION_f1": 0.0,
"eval_LOCATION_number": 71,
"eval_LOCATION_precision": 0.0,
"eval_LOCATION_recall": 0.0,
"eval_ORGANIZATION_f1": 0.0,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.0,
"eval_ORGANIZATION_recall": 0.0,
"eval_PERSON_f1": 0.012048192771084338,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.0625,
"eval_PERSON_recall": 0.006666666666666667,
"eval_QUANTITY_f1": 0.0,
"eval_QUANTITY_number": 33,
"eval_QUANTITY_precision": 0.0,
"eval_QUANTITY_recall": 0.0,
"eval_TIME_f1": 0.0,
"eval_TIME_number": 28,
"eval_TIME_precision": 0.0,
"eval_TIME_recall": 0.0,
"eval_loss": 0.5609568953514099,
"eval_overall_accuracy": 0.8435984481086324,
"eval_overall_f1": 0.005347593582887699,
"eval_overall_precision": 0.037037037037037035,
"eval_overall_recall": 0.002881844380403458,
"eval_runtime": 0.3848,
"eval_samples_per_second": 485.953,
"eval_steps_per_second": 7.796,
"step": 106
},
{
"epoch": 2.0,
"grad_norm": 1.2335773706436157,
"learning_rate": 4.9e-05,
"loss": 0.4811,
"step": 212
},
{
"epoch": 2.0,
"eval_LOCATION_f1": 0.416,
"eval_LOCATION_number": 71,
"eval_LOCATION_precision": 0.48148148148148145,
"eval_LOCATION_recall": 0.36619718309859156,
"eval_ORGANIZATION_f1": 0.14285714285714285,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.14754098360655737,
"eval_ORGANIZATION_recall": 0.13846153846153847,
"eval_PERSON_f1": 0.6887052341597797,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.5868544600938967,
"eval_PERSON_recall": 0.8333333333333334,
"eval_QUANTITY_f1": 0.3692307692307692,
"eval_QUANTITY_number": 33,
"eval_QUANTITY_precision": 0.375,
"eval_QUANTITY_recall": 0.36363636363636365,
"eval_TIME_f1": 0.7586206896551724,
"eval_TIME_number": 28,
"eval_TIME_precision": 0.7333333333333333,
"eval_TIME_recall": 0.7857142857142857,
"eval_loss": 0.32625189423561096,
"eval_overall_accuracy": 0.9093113482056256,
"eval_overall_f1": 0.5264586160108549,
"eval_overall_precision": 0.49743589743589745,
"eval_overall_recall": 0.5590778097982709,
"eval_runtime": 0.3833,
"eval_samples_per_second": 487.897,
"eval_steps_per_second": 7.827,
"step": 212
},
{
"epoch": 3.0,
"grad_norm": 0.693739652633667,
"learning_rate": 4.85e-05,
"loss": 0.2923,
"step": 318
},
{
"epoch": 3.0,
"eval_LOCATION_f1": 0.6103896103896105,
"eval_LOCATION_number": 71,
"eval_LOCATION_precision": 0.5662650602409639,
"eval_LOCATION_recall": 0.6619718309859155,
"eval_ORGANIZATION_f1": 0.47619047619047616,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.4268292682926829,
"eval_ORGANIZATION_recall": 0.5384615384615384,
"eval_PERSON_f1": 0.8348909657320873,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.783625730994152,
"eval_PERSON_recall": 0.8933333333333333,
"eval_QUANTITY_f1": 0.6133333333333334,
"eval_QUANTITY_number": 33,
"eval_QUANTITY_precision": 0.5476190476190477,
"eval_QUANTITY_recall": 0.696969696969697,
"eval_TIME_f1": 0.7999999999999999,
"eval_TIME_number": 28,
"eval_TIME_precision": 0.75,
"eval_TIME_recall": 0.8571428571428571,
"eval_loss": 0.19018957018852234,
"eval_overall_accuracy": 0.9338021338506305,
"eval_overall_f1": 0.6948480845442536,
"eval_overall_precision": 0.6414634146341464,
"eval_overall_recall": 0.7579250720461095,
"eval_runtime": 0.3878,
"eval_samples_per_second": 482.181,
"eval_steps_per_second": 7.736,
"step": 318
},
{
"epoch": 4.0,
"grad_norm": 1.1100132465362549,
"learning_rate": 4.8e-05,
"loss": 0.2082,
"step": 424
},
{
"epoch": 4.0,
"eval_LOCATION_f1": 0.7388535031847132,
"eval_LOCATION_number": 71,
"eval_LOCATION_precision": 0.6744186046511628,
"eval_LOCATION_recall": 0.8169014084507042,
"eval_ORGANIZATION_f1": 0.638036809815951,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.5306122448979592,
"eval_ORGANIZATION_recall": 0.8,
"eval_PERSON_f1": 0.8589341692789968,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.8106508875739645,
"eval_PERSON_recall": 0.9133333333333333,
"eval_QUANTITY_f1": 0.7012987012987013,
"eval_QUANTITY_number": 33,
"eval_QUANTITY_precision": 0.6136363636363636,
"eval_QUANTITY_recall": 0.8181818181818182,
"eval_TIME_f1": 0.8275862068965518,
"eval_TIME_number": 28,
"eval_TIME_precision": 0.8,
"eval_TIME_recall": 0.8571428571428571,
"eval_loss": 0.15403173863887787,
"eval_overall_accuracy": 0.9459262851600388,
"eval_overall_f1": 0.7700258397932818,
"eval_overall_precision": 0.6978922716627635,
"eval_overall_recall": 0.8587896253602305,
"eval_runtime": 0.3873,
"eval_samples_per_second": 482.781,
"eval_steps_per_second": 7.745,
"step": 424
},
{
"epoch": 5.0,
"grad_norm": 1.3037128448486328,
"learning_rate": 4.75e-05,
"loss": 0.1772,
"step": 530
},
{
"epoch": 5.0,
"eval_LOCATION_f1": 0.7612903225806451,
"eval_LOCATION_number": 71,
"eval_LOCATION_precision": 0.7023809523809523,
"eval_LOCATION_recall": 0.8309859154929577,
"eval_ORGANIZATION_f1": 0.6756756756756758,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.6024096385542169,
"eval_ORGANIZATION_recall": 0.7692307692307693,
"eval_PERSON_f1": 0.8698412698412699,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.8303030303030303,
"eval_PERSON_recall": 0.9133333333333333,
"eval_QUANTITY_f1": 0.6835443037974683,
"eval_QUANTITY_number": 33,
"eval_QUANTITY_precision": 0.5869565217391305,
"eval_QUANTITY_recall": 0.8181818181818182,
"eval_TIME_f1": 0.8524590163934426,
"eval_TIME_number": 28,
"eval_TIME_precision": 0.7878787878787878,
"eval_TIME_recall": 0.9285714285714286,
"eval_loss": 0.14435262978076935,
"eval_overall_accuracy": 0.9512609117361784,
"eval_overall_f1": 0.7889182058047493,
"eval_overall_precision": 0.7274939172749392,
"eval_overall_recall": 0.861671469740634,
"eval_runtime": 0.3878,
"eval_samples_per_second": 482.157,
"eval_steps_per_second": 7.735,
"step": 530
},
{
"epoch": 6.0,
"grad_norm": 0.9674538969993591,
"learning_rate": 4.7e-05,
"loss": 0.1576,
"step": 636
},
{
"epoch": 6.0,
"eval_LOCATION_f1": 0.7151515151515151,
"eval_LOCATION_number": 71,
"eval_LOCATION_precision": 0.6276595744680851,
"eval_LOCATION_recall": 0.8309859154929577,
"eval_ORGANIZATION_f1": 0.674698795180723,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.5544554455445545,
"eval_ORGANIZATION_recall": 0.8615384615384616,
"eval_PERSON_f1": 0.866043613707165,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.8128654970760234,
"eval_PERSON_recall": 0.9266666666666666,
"eval_QUANTITY_f1": 0.6363636363636364,
"eval_QUANTITY_number": 33,
"eval_QUANTITY_precision": 0.509090909090909,
"eval_QUANTITY_recall": 0.8484848484848485,
"eval_TIME_f1": 0.78125,
"eval_TIME_number": 28,
"eval_TIME_precision": 0.6944444444444444,
"eval_TIME_recall": 0.8928571428571429,
"eval_loss": 0.1679927557706833,
"eval_overall_accuracy": 0.9413191076624636,
"eval_overall_f1": 0.763681592039801,
"eval_overall_precision": 0.6717724288840262,
"eval_overall_recall": 0.8847262247838616,
"eval_runtime": 0.3864,
"eval_samples_per_second": 483.937,
"eval_steps_per_second": 7.764,
"step": 636
},
{
"epoch": 7.0,
"grad_norm": 1.824372410774231,
"learning_rate": 4.6500000000000005e-05,
"loss": 0.147,
"step": 742
},
{
"epoch": 7.0,
"eval_LOCATION_f1": 0.7741935483870968,
"eval_LOCATION_number": 71,
"eval_LOCATION_precision": 0.7142857142857143,
"eval_LOCATION_recall": 0.8450704225352113,
"eval_ORGANIZATION_f1": 0.7124999999999999,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.6,
"eval_ORGANIZATION_recall": 0.8769230769230769,
"eval_PERSON_f1": 0.8606811145510835,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.8034682080924855,
"eval_PERSON_recall": 0.9266666666666666,
"eval_QUANTITY_f1": 0.7012987012987013,
"eval_QUANTITY_number": 33,
"eval_QUANTITY_precision": 0.6136363636363636,
"eval_QUANTITY_recall": 0.8181818181818182,
"eval_TIME_f1": 0.806451612903226,
"eval_TIME_number": 28,
"eval_TIME_precision": 0.7352941176470589,
"eval_TIME_recall": 0.8928571428571429,
"eval_loss": 0.1446426808834076,
"eval_overall_accuracy": 0.9519883608147429,
"eval_overall_f1": 0.7927927927927928,
"eval_overall_precision": 0.7162790697674418,
"eval_overall_recall": 0.8876080691642652,
"eval_runtime": 0.4021,
"eval_samples_per_second": 465.047,
"eval_steps_per_second": 7.461,
"step": 742
},
{
"epoch": 8.0,
"grad_norm": 0.6194243431091309,
"learning_rate": 4.600000000000001e-05,
"loss": 0.1329,
"step": 848
},
{
"epoch": 8.0,
"eval_LOCATION_f1": 0.7453416149068322,
"eval_LOCATION_number": 71,
"eval_LOCATION_precision": 0.6666666666666666,
"eval_LOCATION_recall": 0.8450704225352113,
"eval_ORGANIZATION_f1": 0.6993865030674845,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.5816326530612245,
"eval_ORGANIZATION_recall": 0.8769230769230769,
"eval_PERSON_f1": 0.8643533123028392,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.8203592814371258,
"eval_PERSON_recall": 0.9133333333333333,
"eval_QUANTITY_f1": 0.7567567567567567,
"eval_QUANTITY_number": 33,
"eval_QUANTITY_precision": 0.6829268292682927,
"eval_QUANTITY_recall": 0.8484848484848485,
"eval_TIME_f1": 0.8666666666666666,
"eval_TIME_number": 28,
"eval_TIME_precision": 0.8125,
"eval_TIME_recall": 0.9285714285714286,
"eval_loss": 0.14050208032131195,
"eval_overall_accuracy": 0.9517458777885548,
"eval_overall_f1": 0.7948387096774193,
"eval_overall_precision": 0.719626168224299,
"eval_overall_recall": 0.8876080691642652,
"eval_runtime": 0.3833,
"eval_samples_per_second": 487.894,
"eval_steps_per_second": 7.827,
"step": 848
},
{
"epoch": 9.0,
"grad_norm": 0.7105451226234436,
"learning_rate": 4.55e-05,
"loss": 0.1309,
"step": 954
},
{
"epoch": 9.0,
"eval_LOCATION_f1": 0.7814569536423841,
"eval_LOCATION_number": 71,
"eval_LOCATION_precision": 0.7375,
"eval_LOCATION_recall": 0.8309859154929577,
"eval_ORGANIZATION_f1": 0.6628571428571428,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.5272727272727272,
"eval_ORGANIZATION_recall": 0.8923076923076924,
"eval_PERSON_f1": 0.8717948717948718,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.8395061728395061,
"eval_PERSON_recall": 0.9066666666666666,
"eval_QUANTITY_f1": 0.6419753086419753,
"eval_QUANTITY_number": 33,
"eval_QUANTITY_precision": 0.5416666666666666,
"eval_QUANTITY_recall": 0.7878787878787878,
"eval_TIME_f1": 0.7936507936507937,
"eval_TIME_number": 28,
"eval_TIME_precision": 0.7142857142857143,
"eval_TIME_recall": 0.8928571428571429,
"eval_loss": 0.13999436795711517,
"eval_overall_accuracy": 0.9471387002909797,
"eval_overall_f1": 0.7774936061381075,
"eval_overall_precision": 0.6988505747126437,
"eval_overall_recall": 0.8760806916426513,
"eval_runtime": 0.3878,
"eval_samples_per_second": 482.216,
"eval_steps_per_second": 7.736,
"step": 954
},
{
"epoch": 10.0,
"grad_norm": 1.1783398389816284,
"learning_rate": 4.5e-05,
"loss": 0.1247,
"step": 1060
},
{
"epoch": 10.0,
"eval_LOCATION_f1": 0.778523489932886,
"eval_LOCATION_number": 71,
"eval_LOCATION_precision": 0.7435897435897436,
"eval_LOCATION_recall": 0.8169014084507042,
"eval_ORGANIZATION_f1": 0.7346938775510204,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.6585365853658537,
"eval_ORGANIZATION_recall": 0.8307692307692308,
"eval_PERSON_f1": 0.8653846153846153,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.8333333333333334,
"eval_PERSON_recall": 0.9,
"eval_QUANTITY_f1": 0.6666666666666666,
"eval_QUANTITY_number": 33,
"eval_QUANTITY_precision": 0.5777777777777777,
"eval_QUANTITY_recall": 0.7878787878787878,
"eval_TIME_f1": 0.8333333333333334,
"eval_TIME_number": 28,
"eval_TIME_precision": 0.78125,
"eval_TIME_recall": 0.8928571428571429,
"eval_loss": 0.1291128396987915,
"eval_overall_accuracy": 0.953443258971872,
"eval_overall_f1": 0.7989276139410187,
"eval_overall_precision": 0.7468671679197995,
"eval_overall_recall": 0.8587896253602305,
"eval_runtime": 0.3867,
"eval_samples_per_second": 483.627,
"eval_steps_per_second": 7.759,
"step": 1060
},
{
"epoch": 11.0,
"grad_norm": 0.8099766969680786,
"learning_rate": 4.4500000000000004e-05,
"loss": 0.1149,
"step": 1166
},
{
"epoch": 11.0,
"eval_LOCATION_f1": 0.7763157894736843,
"eval_LOCATION_number": 71,
"eval_LOCATION_precision": 0.7283950617283951,
"eval_LOCATION_recall": 0.8309859154929577,
"eval_ORGANIZATION_f1": 0.708860759493671,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.6021505376344086,
"eval_ORGANIZATION_recall": 0.8615384615384616,
"eval_PERSON_f1": 0.870967741935484,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.84375,
"eval_PERSON_recall": 0.9,
"eval_QUANTITY_f1": 0.7012987012987013,
"eval_QUANTITY_number": 33,
"eval_QUANTITY_precision": 0.6136363636363636,
"eval_QUANTITY_recall": 0.8181818181818182,
"eval_TIME_f1": 0.7384615384615384,
"eval_TIME_number": 28,
"eval_TIME_precision": 0.6486486486486487,
"eval_TIME_recall": 0.8571428571428571,
"eval_loss": 0.1423446536064148,
"eval_overall_accuracy": 0.9493210475266731,
"eval_overall_f1": 0.7900262467191601,
"eval_overall_precision": 0.7253012048192771,
"eval_overall_recall": 0.8674351585014409,
"eval_runtime": 0.3857,
"eval_samples_per_second": 484.776,
"eval_steps_per_second": 7.777,
"step": 1166
},
{
"epoch": 12.0,
"grad_norm": 0.6322067975997925,
"learning_rate": 4.4000000000000006e-05,
"loss": 0.1118,
"step": 1272
},
{
"epoch": 12.0,
"eval_LOCATION_f1": 0.7239263803680982,
"eval_LOCATION_number": 71,
"eval_LOCATION_precision": 0.6413043478260869,
"eval_LOCATION_recall": 0.8309859154929577,
"eval_ORGANIZATION_f1": 0.7124999999999999,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.6,
"eval_ORGANIZATION_recall": 0.8769230769230769,
"eval_PERSON_f1": 0.8789808917197452,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.8414634146341463,
"eval_PERSON_recall": 0.92,
"eval_QUANTITY_f1": 0.7105263157894738,
"eval_QUANTITY_number": 33,
"eval_QUANTITY_precision": 0.627906976744186,
"eval_QUANTITY_recall": 0.8181818181818182,
"eval_TIME_f1": 0.8125000000000001,
"eval_TIME_number": 28,
"eval_TIME_precision": 0.7222222222222222,
"eval_TIME_recall": 0.9285714285714286,
"eval_loss": 0.15240532159805298,
"eval_overall_accuracy": 0.9493210475266731,
"eval_overall_f1": 0.7902187902187902,
"eval_overall_precision": 0.713953488372093,
"eval_overall_recall": 0.8847262247838616,
"eval_runtime": 0.3901,
"eval_samples_per_second": 479.371,
"eval_steps_per_second": 7.69,
"step": 1272
},
{
"epoch": 13.0,
"grad_norm": 0.8599780797958374,
"learning_rate": 4.35e-05,
"loss": 0.1051,
"step": 1378
},
{
"epoch": 13.0,
"eval_LOCATION_f1": 0.8,
"eval_LOCATION_number": 71,
"eval_LOCATION_precision": 0.759493670886076,
"eval_LOCATION_recall": 0.8450704225352113,
"eval_ORGANIZATION_f1": 0.7307692307692307,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.6263736263736264,
"eval_ORGANIZATION_recall": 0.8769230769230769,
"eval_PERSON_f1": 0.8717948717948718,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.8395061728395061,
"eval_PERSON_recall": 0.9066666666666666,
"eval_QUANTITY_f1": 0.7297297297297297,
"eval_QUANTITY_number": 33,
"eval_QUANTITY_precision": 0.6585365853658537,
"eval_QUANTITY_recall": 0.8181818181818182,
"eval_TIME_f1": 0.9090909090909091,
"eval_TIME_number": 28,
"eval_TIME_precision": 0.9259259259259259,
"eval_TIME_recall": 0.8928571428571429,
"eval_loss": 0.1298385113477707,
"eval_overall_accuracy": 0.9573229873908826,
"eval_overall_f1": 0.8165997322623828,
"eval_overall_precision": 0.7625,
"eval_overall_recall": 0.8789625360230547,
"eval_runtime": 0.3867,
"eval_samples_per_second": 483.589,
"eval_steps_per_second": 7.758,
"step": 1378
},
{
"epoch": 14.0,
"grad_norm": 1.4172143936157227,
"learning_rate": 4.3e-05,
"loss": 0.1071,
"step": 1484
},
{
"epoch": 14.0,
"eval_LOCATION_f1": 0.8051948051948051,
"eval_LOCATION_number": 71,
"eval_LOCATION_precision": 0.7469879518072289,
"eval_LOCATION_recall": 0.8732394366197183,
"eval_ORGANIZATION_f1": 0.7346938775510204,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.6585365853658537,
"eval_ORGANIZATION_recall": 0.8307692307692308,
"eval_PERSON_f1": 0.858974358974359,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.8271604938271605,
"eval_PERSON_recall": 0.8933333333333333,
"eval_QUANTITY_f1": 0.7012987012987013,
"eval_QUANTITY_number": 33,
"eval_QUANTITY_precision": 0.6136363636363636,
"eval_QUANTITY_recall": 0.8181818181818182,
"eval_TIME_f1": 0.75,
"eval_TIME_number": 28,
"eval_TIME_precision": 0.6666666666666666,
"eval_TIME_recall": 0.8571428571428571,
"eval_loss": 0.13883614540100098,
"eval_overall_accuracy": 0.9524733268671193,
"eval_overall_f1": 0.7984084880636606,
"eval_overall_precision": 0.7395577395577395,
"eval_overall_recall": 0.8674351585014409,
"eval_runtime": 0.3854,
"eval_samples_per_second": 485.176,
"eval_steps_per_second": 7.784,
"step": 1484
},
{
"epoch": 15.0,
"grad_norm": 1.1519190073013306,
"learning_rate": 4.25e-05,
"loss": 0.1001,
"step": 1590
},
{
"epoch": 15.0,
"eval_LOCATION_f1": 0.7948717948717949,
"eval_LOCATION_number": 71,
"eval_LOCATION_precision": 0.7294117647058823,
"eval_LOCATION_recall": 0.8732394366197183,
"eval_ORGANIZATION_f1": 0.7261146496815286,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.6195652173913043,
"eval_ORGANIZATION_recall": 0.8769230769230769,
"eval_PERSON_f1": 0.887459807073955,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.8571428571428571,
"eval_PERSON_recall": 0.92,
"eval_QUANTITY_f1": 0.7397260273972603,
"eval_QUANTITY_number": 33,
"eval_QUANTITY_precision": 0.675,
"eval_QUANTITY_recall": 0.8181818181818182,
"eval_TIME_f1": 0.819672131147541,
"eval_TIME_number": 28,
"eval_TIME_precision": 0.7575757575757576,
"eval_TIME_recall": 0.8928571428571429,
"eval_loss": 0.14001114666461945,
"eval_overall_accuracy": 0.9556256062075654,
"eval_overall_f1": 0.8153034300791556,
"eval_overall_precision": 0.7518248175182481,
"eval_overall_recall": 0.8904899135446686,
"eval_runtime": 0.3855,
"eval_samples_per_second": 485.068,
"eval_steps_per_second": 7.782,
"step": 1590
},
{
"epoch": 16.0,
"grad_norm": 1.1742072105407715,
"learning_rate": 4.2e-05,
"loss": 0.0955,
"step": 1696
},
{
"epoch": 16.0,
"eval_LOCATION_f1": 0.8025477707006369,
"eval_LOCATION_number": 71,
"eval_LOCATION_precision": 0.7325581395348837,
"eval_LOCATION_recall": 0.8873239436619719,
"eval_ORGANIZATION_f1": 0.7080745341614907,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.59375,
"eval_ORGANIZATION_recall": 0.8769230769230769,
"eval_PERSON_f1": 0.8903225806451613,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.8625,
"eval_PERSON_recall": 0.92,
"eval_QUANTITY_f1": 0.6753246753246752,
"eval_QUANTITY_number": 33,
"eval_QUANTITY_precision": 0.5909090909090909,
"eval_QUANTITY_recall": 0.7878787878787878,
"eval_TIME_f1": 0.8135593220338982,
"eval_TIME_number": 28,
"eval_TIME_precision": 0.7741935483870968,
"eval_TIME_recall": 0.8571428571428571,
"eval_loss": 0.14204736053943634,
"eval_overall_accuracy": 0.9541707080504365,
"eval_overall_f1": 0.806282722513089,
"eval_overall_precision": 0.7386091127098321,
"eval_overall_recall": 0.8876080691642652,
"eval_runtime": 0.3883,
"eval_samples_per_second": 481.631,
"eval_steps_per_second": 7.727,
"step": 1696
},
{
"epoch": 17.0,
"grad_norm": 1.7436004877090454,
"learning_rate": 4.15e-05,
"loss": 0.0905,
"step": 1802
},
{
"epoch": 17.0,
"eval_LOCATION_f1": 0.7919463087248323,
"eval_LOCATION_number": 71,
"eval_LOCATION_precision": 0.7564102564102564,
"eval_LOCATION_recall": 0.8309859154929577,
"eval_ORGANIZATION_f1": 0.7417218543046358,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.6511627906976745,
"eval_ORGANIZATION_recall": 0.8615384615384616,
"eval_PERSON_f1": 0.8745980707395499,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.84472049689441,
"eval_PERSON_recall": 0.9066666666666666,
"eval_QUANTITY_f1": 0.7105263157894738,
"eval_QUANTITY_number": 33,
"eval_QUANTITY_precision": 0.627906976744186,
"eval_QUANTITY_recall": 0.8181818181818182,
"eval_TIME_f1": 0.7936507936507937,
"eval_TIME_number": 28,
"eval_TIME_precision": 0.7142857142857143,
"eval_TIME_recall": 0.8928571428571429,
"eval_loss": 0.1411171555519104,
"eval_overall_accuracy": 0.9565955383123181,
"eval_overall_f1": 0.808,
"eval_overall_precision": 0.7518610421836228,
"eval_overall_recall": 0.8731988472622478,
"eval_runtime": 0.3859,
"eval_samples_per_second": 484.578,
"eval_steps_per_second": 7.774,
"step": 1802
},
{
"epoch": 18.0,
"grad_norm": 0.690143346786499,
"learning_rate": 4.1e-05,
"loss": 0.0882,
"step": 1908
},
{
"epoch": 18.0,
"eval_LOCATION_f1": 0.8,
"eval_LOCATION_number": 71,
"eval_LOCATION_precision": 0.759493670886076,
"eval_LOCATION_recall": 0.8450704225352113,
"eval_ORGANIZATION_f1": 0.7006369426751592,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.5978260869565217,
"eval_ORGANIZATION_recall": 0.8461538461538461,
"eval_PERSON_f1": 0.8903225806451613,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.8625,
"eval_PERSON_recall": 0.92,
"eval_QUANTITY_f1": 0.6315789473684211,
"eval_QUANTITY_number": 33,
"eval_QUANTITY_precision": 0.5581395348837209,
"eval_QUANTITY_recall": 0.7272727272727273,
"eval_TIME_f1": 0.8474576271186439,
"eval_TIME_number": 28,
"eval_TIME_precision": 0.8064516129032258,
"eval_TIME_recall": 0.8928571428571429,
"eval_loss": 0.14777430891990662,
"eval_overall_accuracy": 0.9536857419980601,
"eval_overall_f1": 0.8031914893617021,
"eval_overall_precision": 0.745679012345679,
"eval_overall_recall": 0.8703170028818443,
"eval_runtime": 0.3876,
"eval_samples_per_second": 482.459,
"eval_steps_per_second": 7.74,
"step": 1908
},
{
"epoch": 19.0,
"grad_norm": 0.7800413370132446,
"learning_rate": 4.05e-05,
"loss": 0.0867,
"step": 2014
},
{
"epoch": 19.0,
"eval_LOCATION_f1": 0.7755102040816326,
"eval_LOCATION_number": 71,
"eval_LOCATION_precision": 0.75,
"eval_LOCATION_recall": 0.8028169014084507,
"eval_ORGANIZATION_f1": 0.7272727272727272,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.6666666666666666,
"eval_ORGANIZATION_recall": 0.8,
"eval_PERSON_f1": 0.8774193548387097,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.85,
"eval_PERSON_recall": 0.9066666666666666,
"eval_QUANTITY_f1": 0.7027027027027027,
"eval_QUANTITY_number": 33,
"eval_QUANTITY_precision": 0.6341463414634146,
"eval_QUANTITY_recall": 0.7878787878787878,
"eval_TIME_f1": 0.8135593220338982,
"eval_TIME_number": 28,
"eval_TIME_precision": 0.7741935483870968,
"eval_TIME_recall": 0.8571428571428571,
"eval_loss": 0.1365654617547989,
"eval_overall_accuracy": 0.9580504364694471,
"eval_overall_f1": 0.8049113233287859,
"eval_overall_precision": 0.7642487046632125,
"eval_overall_recall": 0.8501440922190202,
"eval_runtime": 0.3898,
"eval_samples_per_second": 479.734,
"eval_steps_per_second": 7.696,
"step": 2014
},
{
"epoch": 20.0,
"grad_norm": 1.5175530910491943,
"learning_rate": 4e-05,
"loss": 0.083,
"step": 2120
},
{
"epoch": 20.0,
"eval_LOCATION_f1": 0.8053691275167785,
"eval_LOCATION_number": 71,
"eval_LOCATION_precision": 0.7692307692307693,
"eval_LOCATION_recall": 0.8450704225352113,
"eval_ORGANIZATION_f1": 0.7096774193548387,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.6111111111111112,
"eval_ORGANIZATION_recall": 0.8461538461538461,
"eval_PERSON_f1": 0.8766233766233766,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.8544303797468354,
"eval_PERSON_recall": 0.9,
"eval_QUANTITY_f1": 0.732394366197183,
"eval_QUANTITY_number": 33,
"eval_QUANTITY_precision": 0.6842105263157895,
"eval_QUANTITY_recall": 0.7878787878787878,
"eval_TIME_f1": 0.8771929824561403,
"eval_TIME_number": 28,
"eval_TIME_precision": 0.8620689655172413,
"eval_TIME_recall": 0.8928571428571429,
"eval_loss": 0.14018449187278748,
"eval_overall_accuracy": 0.957807953443259,
"eval_overall_f1": 0.8135135135135135,
"eval_overall_precision": 0.7659033078880407,
"eval_overall_recall": 0.8674351585014409,
"eval_runtime": 0.3866,
"eval_samples_per_second": 483.701,
"eval_steps_per_second": 7.76,
"step": 2120
},
{
"epoch": 21.0,
"grad_norm": 0.6179842352867126,
"learning_rate": 3.9500000000000005e-05,
"loss": 0.0818,
"step": 2226
},
{
"epoch": 21.0,
"eval_LOCATION_f1": 0.8026315789473684,
"eval_LOCATION_number": 71,
"eval_LOCATION_precision": 0.7530864197530864,
"eval_LOCATION_recall": 0.8591549295774648,
"eval_ORGANIZATION_f1": 0.6993865030674845,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.5816326530612245,
"eval_ORGANIZATION_recall": 0.8769230769230769,
"eval_PERSON_f1": 0.9049180327868852,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.8903225806451613,
"eval_PERSON_recall": 0.92,
"eval_QUANTITY_f1": 0.6419753086419753,
"eval_QUANTITY_number": 33,
"eval_QUANTITY_precision": 0.5416666666666666,
"eval_QUANTITY_recall": 0.7878787878787878,
"eval_TIME_f1": 0.8474576271186439,
"eval_TIME_number": 28,
"eval_TIME_precision": 0.8064516129032258,
"eval_TIME_recall": 0.8928571428571429,
"eval_loss": 0.15062209963798523,
"eval_overall_accuracy": 0.9524733268671193,
"eval_overall_f1": 0.8078947368421052,
"eval_overall_precision": 0.7433414043583535,
"eval_overall_recall": 0.8847262247838616,
"eval_runtime": 0.3883,
"eval_samples_per_second": 481.579,
"eval_steps_per_second": 7.726,
"step": 2226
},
{
"epoch": 22.0,
"grad_norm": 0.7422575354576111,
"learning_rate": 3.9000000000000006e-05,
"loss": 0.0824,
"step": 2332
},
{
"epoch": 22.0,
"eval_LOCATION_f1": 0.8129032258064516,
"eval_LOCATION_number": 71,
"eval_LOCATION_precision": 0.75,
"eval_LOCATION_recall": 0.8873239436619719,
"eval_ORGANIZATION_f1": 0.7006369426751592,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.5978260869565217,
"eval_ORGANIZATION_recall": 0.8461538461538461,
"eval_PERSON_f1": 0.8580441640378549,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.8143712574850299,
"eval_PERSON_recall": 0.9066666666666666,
"eval_QUANTITY_f1": 0.7105263157894738,
"eval_QUANTITY_number": 33,
"eval_QUANTITY_precision": 0.627906976744186,
"eval_QUANTITY_recall": 0.8181818181818182,
"eval_TIME_f1": 0.8474576271186439,
"eval_TIME_number": 28,
"eval_TIME_precision": 0.8064516129032258,
"eval_TIME_recall": 0.8928571428571429,
"eval_loss": 0.14866971969604492,
"eval_overall_accuracy": 0.9546556741028128,
"eval_overall_f1": 0.8010471204188482,
"eval_overall_precision": 0.7338129496402878,
"eval_overall_recall": 0.8818443804034583,
"eval_runtime": 0.3904,
"eval_samples_per_second": 478.947,
"eval_steps_per_second": 7.684,
"step": 2332
},
{
"epoch": 23.0,
"grad_norm": 0.7634256482124329,
"learning_rate": 3.85e-05,
"loss": 0.076,
"step": 2438
},
{
"epoch": 23.0,
"eval_LOCATION_f1": 0.8053691275167785,
"eval_LOCATION_number": 71,
"eval_LOCATION_precision": 0.7692307692307693,
"eval_LOCATION_recall": 0.8450704225352113,
"eval_ORGANIZATION_f1": 0.7225806451612903,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.6222222222222222,
"eval_ORGANIZATION_recall": 0.8615384615384616,
"eval_PERSON_f1": 0.8823529411764707,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.8653846153846154,
"eval_PERSON_recall": 0.9,
"eval_QUANTITY_f1": 0.7500000000000001,
"eval_QUANTITY_number": 33,
"eval_QUANTITY_precision": 0.6923076923076923,
"eval_QUANTITY_recall": 0.8181818181818182,
"eval_TIME_f1": 0.888888888888889,
"eval_TIME_number": 28,
"eval_TIME_precision": 0.9230769230769231,
"eval_TIME_recall": 0.8571428571428571,
"eval_loss": 0.13874635100364685,
"eval_overall_accuracy": 0.9580504364694471,
"eval_overall_f1": 0.8206521739130433,
"eval_overall_precision": 0.7763496143958869,
"eval_overall_recall": 0.8703170028818443,
"eval_runtime": 0.3855,
"eval_samples_per_second": 485.092,
"eval_steps_per_second": 7.782,
"step": 2438
},
{
"epoch": 24.0,
"grad_norm": 0.7481046915054321,
"learning_rate": 3.8e-05,
"loss": 0.0745,
"step": 2544
},
{
"epoch": 24.0,
"eval_LOCATION_f1": 0.8129032258064516,
"eval_LOCATION_number": 71,
"eval_LOCATION_precision": 0.75,
"eval_LOCATION_recall": 0.8873239436619719,
"eval_ORGANIZATION_f1": 0.7215189873417722,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.6129032258064516,
"eval_ORGANIZATION_recall": 0.8769230769230769,
"eval_PERSON_f1": 0.8938906752411575,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.8633540372670807,
"eval_PERSON_recall": 0.9266666666666666,
"eval_QUANTITY_f1": 0.7027027027027027,
"eval_QUANTITY_number": 33,
"eval_QUANTITY_precision": 0.6341463414634146,
"eval_QUANTITY_recall": 0.7878787878787878,
"eval_TIME_f1": 0.8813559322033899,
"eval_TIME_number": 28,
"eval_TIME_precision": 0.8387096774193549,
"eval_TIME_recall": 0.9285714285714286,
"eval_loss": 0.14388589560985565,
"eval_overall_accuracy": 0.9580504364694471,
"eval_overall_f1": 0.821664464993395,
"eval_overall_precision": 0.7585365853658537,
"eval_overall_recall": 0.8962536023054755,
"eval_runtime": 0.387,
"eval_samples_per_second": 483.235,
"eval_steps_per_second": 7.752,
"step": 2544
},
{
"epoch": 25.0,
"grad_norm": 0.7572817206382751,
"learning_rate": 3.7500000000000003e-05,
"loss": 0.0731,
"step": 2650
},
{
"epoch": 25.0,
"eval_LOCATION_f1": 0.8026315789473684,
"eval_LOCATION_number": 71,
"eval_LOCATION_precision": 0.7530864197530864,
"eval_LOCATION_recall": 0.8591549295774648,
"eval_ORGANIZATION_f1": 0.7169811320754718,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.6063829787234043,
"eval_ORGANIZATION_recall": 0.8769230769230769,
"eval_PERSON_f1": 0.90032154340836,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.8695652173913043,
"eval_PERSON_recall": 0.9333333333333333,
"eval_QUANTITY_f1": 0.7200000000000001,
"eval_QUANTITY_number": 33,
"eval_QUANTITY_precision": 0.6428571428571429,
"eval_QUANTITY_recall": 0.8181818181818182,
"eval_TIME_f1": 0.8771929824561403,
"eval_TIME_number": 28,
"eval_TIME_precision": 0.8620689655172413,
"eval_TIME_recall": 0.8928571428571429,
"eval_loss": 0.1537763774394989,
"eval_overall_accuracy": 0.9570805043646945,
"eval_overall_f1": 0.8222811671087533,
"eval_overall_precision": 0.7616707616707616,
"eval_overall_recall": 0.8933717579250721,
"eval_runtime": 0.3899,
"eval_samples_per_second": 479.593,
"eval_steps_per_second": 7.694,
"step": 2650
},
{
"epoch": 26.0,
"grad_norm": 0.5087524652481079,
"learning_rate": 3.7e-05,
"loss": 0.0713,
"step": 2756
},
{
"epoch": 26.0,
"eval_LOCATION_f1": 0.8076923076923077,
"eval_LOCATION_number": 71,
"eval_LOCATION_precision": 0.7411764705882353,
"eval_LOCATION_recall": 0.8873239436619719,
"eval_ORGANIZATION_f1": 0.7482993197278912,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.6707317073170732,
"eval_ORGANIZATION_recall": 0.8461538461538461,
"eval_PERSON_f1": 0.8838709677419355,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.85625,
"eval_PERSON_recall": 0.9133333333333333,
"eval_QUANTITY_f1": 0.6493506493506495,
"eval_QUANTITY_number": 33,
"eval_QUANTITY_precision": 0.5681818181818182,
"eval_QUANTITY_recall": 0.7575757575757576,
"eval_TIME_f1": 0.8474576271186439,
"eval_TIME_number": 28,
"eval_TIME_precision": 0.8064516129032258,
"eval_TIME_recall": 0.8928571428571429,
"eval_loss": 0.14748218655586243,
"eval_overall_accuracy": 0.9568380213385063,
"eval_overall_f1": 0.8144192256341789,
"eval_overall_precision": 0.7587064676616916,
"eval_overall_recall": 0.8789625360230547,
"eval_runtime": 0.3893,
"eval_samples_per_second": 480.312,
"eval_steps_per_second": 7.706,
"step": 2756
},
{
"epoch": 27.0,
"grad_norm": 1.3006908893585205,
"learning_rate": 3.65e-05,
"loss": 0.0712,
"step": 2862
},
{
"epoch": 27.0,
"eval_LOCATION_f1": 0.7712418300653594,
"eval_LOCATION_number": 71,
"eval_LOCATION_precision": 0.7195121951219512,
"eval_LOCATION_recall": 0.8309859154929577,
"eval_ORGANIZATION_f1": 0.7421383647798743,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.6276595744680851,
"eval_ORGANIZATION_recall": 0.9076923076923077,
"eval_PERSON_f1": 0.8789808917197452,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.8414634146341463,
"eval_PERSON_recall": 0.92,
"eval_QUANTITY_f1": 0.6666666666666666,
"eval_QUANTITY_number": 33,
"eval_QUANTITY_precision": 0.5777777777777777,
"eval_QUANTITY_recall": 0.7878787878787878,
"eval_TIME_f1": 0.9090909090909091,
"eval_TIME_number": 28,
"eval_TIME_precision": 0.9259259259259259,
"eval_TIME_recall": 0.8928571428571429,
"eval_loss": 0.1678486168384552,
"eval_overall_accuracy": 0.9517458777885548,
"eval_overall_f1": 0.8089591567852438,
"eval_overall_precision": 0.7451456310679612,
"eval_overall_recall": 0.8847262247838616,
"eval_runtime": 0.3855,
"eval_samples_per_second": 485.032,
"eval_steps_per_second": 7.781,
"step": 2862
},
{
"epoch": 28.0,
"grad_norm": 0.8932152986526489,
"learning_rate": 3.6e-05,
"loss": 0.07,
"step": 2968
},
{
"epoch": 28.0,
"eval_LOCATION_f1": 0.8,
"eval_LOCATION_number": 71,
"eval_LOCATION_precision": 0.759493670886076,
"eval_LOCATION_recall": 0.8450704225352113,
"eval_ORGANIZATION_f1": 0.7532467532467532,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.651685393258427,
"eval_ORGANIZATION_recall": 0.8923076923076924,
"eval_PERSON_f1": 0.8774193548387097,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.85,
"eval_PERSON_recall": 0.9066666666666666,
"eval_QUANTITY_f1": 0.6486486486486487,
"eval_QUANTITY_number": 33,
"eval_QUANTITY_precision": 0.5853658536585366,
"eval_QUANTITY_recall": 0.7272727272727273,
"eval_TIME_f1": 0.8928571428571429,
"eval_TIME_number": 28,
"eval_TIME_precision": 0.8928571428571429,
"eval_TIME_recall": 0.8928571428571429,
"eval_loss": 0.15593300759792328,
"eval_overall_accuracy": 0.9544131910766246,
"eval_overall_f1": 0.814516129032258,
"eval_overall_precision": 0.7632241813602015,
"eval_overall_recall": 0.8731988472622478,
"eval_runtime": 0.3874,
"eval_samples_per_second": 482.726,
"eval_steps_per_second": 7.744,
"step": 2968
},
{
"epoch": 29.0,
"grad_norm": 0.7077963948249817,
"learning_rate": 3.55e-05,
"loss": 0.0687,
"step": 3074
},
{
"epoch": 29.0,
"eval_LOCATION_f1": 0.802721088435374,
"eval_LOCATION_number": 71,
"eval_LOCATION_precision": 0.7763157894736842,
"eval_LOCATION_recall": 0.8309859154929577,
"eval_ORGANIZATION_f1": 0.728395061728395,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.6082474226804123,
"eval_ORGANIZATION_recall": 0.9076923076923077,
"eval_PERSON_f1": 0.8737864077669903,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.8490566037735849,
"eval_PERSON_recall": 0.9,
"eval_QUANTITY_f1": 0.732394366197183,
"eval_QUANTITY_number": 33,
"eval_QUANTITY_precision": 0.6842105263157895,
"eval_QUANTITY_recall": 0.7878787878787878,
"eval_TIME_f1": 0.8524590163934426,
"eval_TIME_number": 28,
"eval_TIME_precision": 0.7878787878787878,
"eval_TIME_recall": 0.9285714285714286,
"eval_loss": 0.14312958717346191,
"eval_overall_accuracy": 0.9582929194956353,
"eval_overall_f1": 0.8133333333333335,
"eval_overall_precision": 0.7568238213399504,
"eval_overall_recall": 0.8789625360230547,
"eval_runtime": 0.3863,
"eval_samples_per_second": 484.115,
"eval_steps_per_second": 7.767,
"step": 3074
},
{
"epoch": 30.0,
"grad_norm": 0.8946846723556519,
"learning_rate": 3.5e-05,
"loss": 0.0665,
"step": 3180
},
{
"epoch": 30.0,
"eval_LOCATION_f1": 0.8053691275167785,
"eval_LOCATION_number": 71,
"eval_LOCATION_precision": 0.7692307692307693,
"eval_LOCATION_recall": 0.8450704225352113,
"eval_ORGANIZATION_f1": 0.7662337662337663,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.6629213483146067,
"eval_ORGANIZATION_recall": 0.9076923076923077,
"eval_PERSON_f1": 0.8838709677419355,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.85625,
"eval_PERSON_recall": 0.9133333333333333,
"eval_QUANTITY_f1": 0.7605633802816901,
"eval_QUANTITY_number": 33,
"eval_QUANTITY_precision": 0.7105263157894737,
"eval_QUANTITY_recall": 0.8181818181818182,
"eval_TIME_f1": 0.8620689655172413,
"eval_TIME_number": 28,
"eval_TIME_precision": 0.8333333333333334,
"eval_TIME_recall": 0.8928571428571429,
"eval_loss": 0.1464053988456726,
"eval_overall_accuracy": 0.9595053346265762,
"eval_overall_f1": 0.830188679245283,
"eval_overall_precision": 0.779746835443038,
"eval_overall_recall": 0.8876080691642652,
"eval_runtime": 0.3853,
"eval_samples_per_second": 485.352,
"eval_steps_per_second": 7.786,
"step": 3180
},
{
"epoch": 31.0,
"grad_norm": 0.43450927734375,
"learning_rate": 3.45e-05,
"loss": 0.0634,
"step": 3286
},
{
"epoch": 31.0,
"eval_LOCATION_f1": 0.8051948051948051,
"eval_LOCATION_number": 71,
"eval_LOCATION_precision": 0.7469879518072289,
"eval_LOCATION_recall": 0.8732394366197183,
"eval_ORGANIZATION_f1": 0.7733333333333334,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.6823529411764706,
"eval_ORGANIZATION_recall": 0.8923076923076924,
"eval_PERSON_f1": 0.888888888888889,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.8484848484848485,
"eval_PERSON_recall": 0.9333333333333333,
"eval_QUANTITY_f1": 0.7222222222222221,
"eval_QUANTITY_number": 33,
"eval_QUANTITY_precision": 0.6666666666666666,
"eval_QUANTITY_recall": 0.7878787878787878,
"eval_TIME_f1": 0.8813559322033899,
"eval_TIME_number": 28,
"eval_TIME_precision": 0.8387096774193549,
"eval_TIME_recall": 0.9285714285714286,
"eval_loss": 0.15990784764289856,
"eval_overall_accuracy": 0.9568380213385063,
"eval_overall_f1": 0.8320000000000001,
"eval_overall_precision": 0.7741935483870968,
"eval_overall_recall": 0.899135446685879,
"eval_runtime": 0.386,
"eval_samples_per_second": 484.508,
"eval_steps_per_second": 7.773,
"step": 3286
},
{
"epoch": 32.0,
"grad_norm": 0.4396691620349884,
"learning_rate": 3.4000000000000007e-05,
"loss": 0.0602,
"step": 3392
},
{
"epoch": 32.0,
"eval_LOCATION_f1": 0.7741935483870968,
"eval_LOCATION_number": 71,
"eval_LOCATION_precision": 0.7142857142857143,
"eval_LOCATION_recall": 0.8450704225352113,
"eval_ORGANIZATION_f1": 0.7388535031847134,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.6304347826086957,
"eval_ORGANIZATION_recall": 0.8923076923076924,
"eval_PERSON_f1": 0.8910256410256411,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.8580246913580247,
"eval_PERSON_recall": 0.9266666666666666,
"eval_QUANTITY_f1": 0.6666666666666667,
"eval_QUANTITY_number": 33,
"eval_QUANTITY_precision": 0.5952380952380952,
"eval_QUANTITY_recall": 0.7575757575757576,
"eval_TIME_f1": 0.8666666666666666,
"eval_TIME_number": 28,
"eval_TIME_precision": 0.8125,
"eval_TIME_recall": 0.9285714285714286,
"eval_loss": 0.17173334956169128,
"eval_overall_accuracy": 0.9529582929194956,
"eval_overall_f1": 0.8115942028985507,
"eval_overall_precision": 0.7475728155339806,
"eval_overall_recall": 0.8876080691642652,
"eval_runtime": 0.387,
"eval_samples_per_second": 483.26,
"eval_steps_per_second": 7.753,
"step": 3392
},
{
"epoch": 33.0,
"grad_norm": 0.7759618163108826,
"learning_rate": 3.35e-05,
"loss": 0.0633,
"step": 3498
},
{
"epoch": 33.0,
"eval_LOCATION_f1": 0.7866666666666666,
"eval_LOCATION_number": 71,
"eval_LOCATION_precision": 0.7468354430379747,
"eval_LOCATION_recall": 0.8309859154929577,
"eval_ORGANIZATION_f1": 0.7534246575342466,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.6790123456790124,
"eval_ORGANIZATION_recall": 0.8461538461538461,
"eval_PERSON_f1": 0.8903225806451613,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.8625,
"eval_PERSON_recall": 0.92,
"eval_QUANTITY_f1": 0.7222222222222221,
"eval_QUANTITY_number": 33,
"eval_QUANTITY_precision": 0.6666666666666666,
"eval_QUANTITY_recall": 0.7878787878787878,
"eval_TIME_f1": 0.8571428571428571,
"eval_TIME_number": 28,
"eval_TIME_precision": 0.8571428571428571,
"eval_TIME_recall": 0.8571428571428571,
"eval_loss": 0.1525535136461258,
"eval_overall_accuracy": 0.9556256062075654,
"eval_overall_f1": 0.8228882833787465,
"eval_overall_precision": 0.7803617571059431,
"eval_overall_recall": 0.8703170028818443,
"eval_runtime": 0.386,
"eval_samples_per_second": 484.395,
"eval_steps_per_second": 7.771,
"step": 3498
},
{
"epoch": 34.0,
"grad_norm": 1.0217112302780151,
"learning_rate": 3.3e-05,
"loss": 0.0596,
"step": 3604
},
{
"epoch": 34.0,
"eval_LOCATION_f1": 0.8051948051948051,
"eval_LOCATION_number": 71,
"eval_LOCATION_precision": 0.7469879518072289,
"eval_LOCATION_recall": 0.8732394366197183,
"eval_ORGANIZATION_f1": 0.7261146496815286,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.6195652173913043,
"eval_ORGANIZATION_recall": 0.8769230769230769,
"eval_PERSON_f1": 0.8910256410256411,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.8580246913580247,
"eval_PERSON_recall": 0.9266666666666666,
"eval_QUANTITY_f1": 0.7123287671232875,
"eval_QUANTITY_number": 33,
"eval_QUANTITY_precision": 0.65,
"eval_QUANTITY_recall": 0.7878787878787878,
"eval_TIME_f1": 0.8070175438596492,
"eval_TIME_number": 28,
"eval_TIME_precision": 0.7931034482758621,
"eval_TIME_recall": 0.8214285714285714,
"eval_loss": 0.15602585673332214,
"eval_overall_accuracy": 0.95635305528613,
"eval_overall_f1": 0.8154050464807437,
"eval_overall_precision": 0.7561576354679803,
"eval_overall_recall": 0.8847262247838616,
"eval_runtime": 0.385,
"eval_samples_per_second": 485.685,
"eval_steps_per_second": 7.792,
"step": 3604
},
{
"epoch": 35.0,
"grad_norm": 0.47391146421432495,
"learning_rate": 3.2500000000000004e-05,
"loss": 0.0591,
"step": 3710
},
{
"epoch": 35.0,
"eval_LOCATION_f1": 0.8051948051948051,
"eval_LOCATION_number": 71,
"eval_LOCATION_precision": 0.7469879518072289,
"eval_LOCATION_recall": 0.8732394366197183,
"eval_ORGANIZATION_f1": 0.7261146496815286,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.6195652173913043,
"eval_ORGANIZATION_recall": 0.8769230769230769,
"eval_PERSON_f1": 0.8896103896103896,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.8670886075949367,
"eval_PERSON_recall": 0.9133333333333333,
"eval_QUANTITY_f1": 0.7222222222222221,
"eval_QUANTITY_number": 33,
"eval_QUANTITY_precision": 0.6666666666666666,
"eval_QUANTITY_recall": 0.7878787878787878,
"eval_TIME_f1": 0.8474576271186439,
"eval_TIME_number": 28,
"eval_TIME_precision": 0.8064516129032258,
"eval_TIME_recall": 0.8928571428571429,
"eval_loss": 0.1562255322933197,
"eval_overall_accuracy": 0.9556256062075654,
"eval_overall_f1": 0.8186666666666667,
"eval_overall_precision": 0.7617866004962779,
"eval_overall_recall": 0.8847262247838616,
"eval_runtime": 0.3871,
"eval_samples_per_second": 483.118,
"eval_steps_per_second": 7.751,
"step": 3710
},
{
"epoch": 36.0,
"grad_norm": 1.473497748374939,
"learning_rate": 3.2000000000000005e-05,
"loss": 0.0582,
"step": 3816
},
{
"epoch": 36.0,
"eval_LOCATION_f1": 0.7948717948717949,
"eval_LOCATION_number": 71,
"eval_LOCATION_precision": 0.7294117647058823,
"eval_LOCATION_recall": 0.8732394366197183,
"eval_ORGANIZATION_f1": 0.7160493827160493,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.5979381443298969,
"eval_ORGANIZATION_recall": 0.8923076923076924,
"eval_PERSON_f1": 0.8932038834951457,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.8679245283018868,
"eval_PERSON_recall": 0.92,
"eval_QUANTITY_f1": 0.7200000000000001,
"eval_QUANTITY_number": 33,
"eval_QUANTITY_precision": 0.6428571428571429,
"eval_QUANTITY_recall": 0.8181818181818182,
"eval_TIME_f1": 0.896551724137931,
"eval_TIME_number": 28,
"eval_TIME_precision": 0.8666666666666667,
"eval_TIME_recall": 0.9285714285714286,
"eval_loss": 0.1698862910270691,
"eval_overall_accuracy": 0.9524733268671193,
"eval_overall_f1": 0.8184210526315788,
"eval_overall_precision": 0.7530266343825666,
"eval_overall_recall": 0.8962536023054755,
"eval_runtime": 0.3888,
"eval_samples_per_second": 480.937,
"eval_steps_per_second": 7.716,
"step": 3816
},
{
"epoch": 37.0,
"grad_norm": 0.5742448568344116,
"learning_rate": 3.15e-05,
"loss": 0.0567,
"step": 3922
},
{
"epoch": 37.0,
"eval_LOCATION_f1": 0.775,
"eval_LOCATION_number": 71,
"eval_LOCATION_precision": 0.6966292134831461,
"eval_LOCATION_recall": 0.8732394366197183,
"eval_ORGANIZATION_f1": 0.7169811320754718,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.6063829787234043,
"eval_ORGANIZATION_recall": 0.8769230769230769,
"eval_PERSON_f1": 0.8838709677419355,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.85625,
"eval_PERSON_recall": 0.9133333333333333,
"eval_QUANTITY_f1": 0.7105263157894738,
"eval_QUANTITY_number": 33,
"eval_QUANTITY_precision": 0.627906976744186,
"eval_QUANTITY_recall": 0.8181818181818182,
"eval_TIME_f1": 0.8620689655172413,
"eval_TIME_number": 28,
"eval_TIME_precision": 0.8333333333333334,
"eval_TIME_recall": 0.8928571428571429,
"eval_loss": 0.17796191573143005,
"eval_overall_accuracy": 0.9498060135790495,
"eval_overall_f1": 0.8073394495412844,
"eval_overall_precision": 0.7403846153846154,
"eval_overall_recall": 0.8876080691642652,
"eval_runtime": 0.3904,
"eval_samples_per_second": 479.01,
"eval_steps_per_second": 7.685,
"step": 3922
},
{
"epoch": 38.0,
"grad_norm": 0.6908618211746216,
"learning_rate": 3.1e-05,
"loss": 0.0568,
"step": 4028
},
{
"epoch": 38.0,
"eval_LOCATION_f1": 0.8053691275167785,
"eval_LOCATION_number": 71,
"eval_LOCATION_precision": 0.7692307692307693,
"eval_LOCATION_recall": 0.8450704225352113,
"eval_ORGANIZATION_f1": 0.7482993197278912,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.6707317073170732,
"eval_ORGANIZATION_recall": 0.8461538461538461,
"eval_PERSON_f1": 0.887459807073955,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.8571428571428571,
"eval_PERSON_recall": 0.92,
"eval_QUANTITY_f1": 0.6933333333333334,
"eval_QUANTITY_number": 33,
"eval_QUANTITY_precision": 0.6190476190476191,
"eval_QUANTITY_recall": 0.7878787878787878,
"eval_TIME_f1": 0.8620689655172413,
"eval_TIME_number": 28,
"eval_TIME_precision": 0.8333333333333334,
"eval_TIME_recall": 0.8928571428571429,
"eval_loss": 0.1589268296957016,
"eval_overall_accuracy": 0.9568380213385063,
"eval_overall_f1": 0.8216216216216217,
"eval_overall_precision": 0.7735368956743003,
"eval_overall_recall": 0.8760806916426513,
"eval_runtime": 0.387,
"eval_samples_per_second": 483.227,
"eval_steps_per_second": 7.752,
"step": 4028
},
{
"epoch": 39.0,
"grad_norm": 0.37814459204673767,
"learning_rate": 3.05e-05,
"loss": 0.0553,
"step": 4134
},
{
"epoch": 39.0,
"eval_LOCATION_f1": 0.759493670886076,
"eval_LOCATION_number": 71,
"eval_LOCATION_precision": 0.6896551724137931,
"eval_LOCATION_recall": 0.8450704225352113,
"eval_ORGANIZATION_f1": 0.7195121951219511,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.5959595959595959,
"eval_ORGANIZATION_recall": 0.9076923076923077,
"eval_PERSON_f1": 0.8853503184713376,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.8475609756097561,
"eval_PERSON_recall": 0.9266666666666666,
"eval_QUANTITY_f1": 0.7500000000000001,
"eval_QUANTITY_number": 33,
"eval_QUANTITY_precision": 0.6923076923076923,
"eval_QUANTITY_recall": 0.8181818181818182,
"eval_TIME_f1": 0.896551724137931,
"eval_TIME_number": 28,
"eval_TIME_precision": 0.8666666666666667,
"eval_TIME_recall": 0.9285714285714286,
"eval_loss": 0.17944246530532837,
"eval_overall_accuracy": 0.9500484966052376,
"eval_overall_f1": 0.8120104438642298,
"eval_overall_precision": 0.7422434367541766,
"eval_overall_recall": 0.8962536023054755,
"eval_runtime": 0.3856,
"eval_samples_per_second": 484.921,
"eval_steps_per_second": 7.779,
"step": 4134
},
{
"epoch": 40.0,
"grad_norm": 0.3985283672809601,
"learning_rate": 3e-05,
"loss": 0.0522,
"step": 4240
},
{
"epoch": 40.0,
"eval_LOCATION_f1": 0.7924528301886792,
"eval_LOCATION_number": 71,
"eval_LOCATION_precision": 0.7159090909090909,
"eval_LOCATION_recall": 0.8873239436619719,
"eval_ORGANIZATION_f1": 0.7516778523489933,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.6666666666666666,
"eval_ORGANIZATION_recall": 0.8615384615384616,
"eval_PERSON_f1": 0.8825396825396825,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.8424242424242424,
"eval_PERSON_recall": 0.9266666666666666,
"eval_QUANTITY_f1": 0.732394366197183,
"eval_QUANTITY_number": 33,
"eval_QUANTITY_precision": 0.6842105263157895,
"eval_QUANTITY_recall": 0.7878787878787878,
"eval_TIME_f1": 0.8333333333333334,
"eval_TIME_number": 28,
"eval_TIME_precision": 0.78125,
"eval_TIME_recall": 0.8928571428571429,
"eval_loss": 0.16948159039020538,
"eval_overall_accuracy": 0.9551406401551892,
"eval_overall_f1": 0.8196286472148541,
"eval_overall_precision": 0.7592137592137592,
"eval_overall_recall": 0.8904899135446686,
"eval_runtime": 0.3866,
"eval_samples_per_second": 483.76,
"eval_steps_per_second": 7.761,
"step": 4240
},
{
"epoch": 41.0,
"grad_norm": 0.4095101058483124,
"learning_rate": 2.95e-05,
"loss": 0.0535,
"step": 4346
},
{
"epoch": 41.0,
"eval_LOCATION_f1": 0.7922077922077921,
"eval_LOCATION_number": 71,
"eval_LOCATION_precision": 0.7349397590361446,
"eval_LOCATION_recall": 0.8591549295774648,
"eval_ORGANIZATION_f1": 0.7417218543046358,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.6511627906976745,
"eval_ORGANIZATION_recall": 0.8615384615384616,
"eval_PERSON_f1": 0.8753993610223643,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.8404907975460123,
"eval_PERSON_recall": 0.9133333333333333,
"eval_QUANTITY_f1": 0.6842105263157895,
"eval_QUANTITY_number": 33,
"eval_QUANTITY_precision": 0.6046511627906976,
"eval_QUANTITY_recall": 0.7878787878787878,
"eval_TIME_f1": 0.8333333333333334,
"eval_TIME_number": 28,
"eval_TIME_precision": 0.78125,
"eval_TIME_recall": 0.8928571428571429,
"eval_loss": 0.16789713501930237,
"eval_overall_accuracy": 0.9517458777885548,
"eval_overall_f1": 0.8090185676392573,
"eval_overall_precision": 0.7493857493857494,
"eval_overall_recall": 0.8789625360230547,
"eval_runtime": 0.3862,
"eval_samples_per_second": 484.225,
"eval_steps_per_second": 7.768,
"step": 4346
},
{
"epoch": 42.0,
"grad_norm": 0.30107811093330383,
"learning_rate": 2.9e-05,
"loss": 0.0507,
"step": 4452
},
{
"epoch": 42.0,
"eval_LOCATION_f1": 0.8026315789473684,
"eval_LOCATION_number": 71,
"eval_LOCATION_precision": 0.7530864197530864,
"eval_LOCATION_recall": 0.8591549295774648,
"eval_ORGANIZATION_f1": 0.7248322147651007,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.6428571428571429,
"eval_ORGANIZATION_recall": 0.8307692307692308,
"eval_PERSON_f1": 0.8867313915857605,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.8616352201257862,
"eval_PERSON_recall": 0.9133333333333333,
"eval_QUANTITY_f1": 0.7397260273972603,
"eval_QUANTITY_number": 33,
"eval_QUANTITY_precision": 0.675,
"eval_QUANTITY_recall": 0.8181818181818182,
"eval_TIME_f1": 0.8813559322033899,
"eval_TIME_number": 28,
"eval_TIME_precision": 0.8387096774193549,
"eval_TIME_recall": 0.9285714285714286,
"eval_loss": 0.15727120637893677,
"eval_overall_accuracy": 0.9561105722599418,
"eval_overall_f1": 0.8221024258760108,
"eval_overall_precision": 0.7721518987341772,
"eval_overall_recall": 0.8789625360230547,
"eval_runtime": 0.3852,
"eval_samples_per_second": 485.428,
"eval_steps_per_second": 7.788,
"step": 4452
},
{
"epoch": 43.0,
"grad_norm": 0.3901791274547577,
"learning_rate": 2.8499999999999998e-05,
"loss": 0.0501,
"step": 4558
},
{
"epoch": 43.0,
"eval_LOCATION_f1": 0.7974683544303797,
"eval_LOCATION_number": 71,
"eval_LOCATION_precision": 0.7241379310344828,
"eval_LOCATION_recall": 0.8873239436619719,
"eval_ORGANIZATION_f1": 0.6967741935483871,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.6,
"eval_ORGANIZATION_recall": 0.8307692307692308,
"eval_PERSON_f1": 0.887459807073955,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.8571428571428571,
"eval_PERSON_recall": 0.92,
"eval_QUANTITY_f1": 0.7105263157894738,
"eval_QUANTITY_number": 33,
"eval_QUANTITY_precision": 0.627906976744186,
"eval_QUANTITY_recall": 0.8181818181818182,
"eval_TIME_f1": 0.8620689655172413,
"eval_TIME_number": 28,
"eval_TIME_precision": 0.8333333333333334,
"eval_TIME_recall": 0.8928571428571429,
"eval_loss": 0.1803949922323227,
"eval_overall_accuracy": 0.9524733268671193,
"eval_overall_f1": 0.8100263852242744,
"eval_overall_precision": 0.7469586374695864,
"eval_overall_recall": 0.8847262247838616,
"eval_runtime": 0.3846,
"eval_samples_per_second": 486.267,
"eval_steps_per_second": 7.801,
"step": 4558
},
{
"epoch": 44.0,
"grad_norm": 0.7794935703277588,
"learning_rate": 2.8000000000000003e-05,
"loss": 0.0491,
"step": 4664
},
{
"epoch": 44.0,
"eval_LOCATION_f1": 0.7870967741935485,
"eval_LOCATION_number": 71,
"eval_LOCATION_precision": 0.7261904761904762,
"eval_LOCATION_recall": 0.8591549295774648,
"eval_ORGANIZATION_f1": 0.6918238993710691,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.5851063829787234,
"eval_ORGANIZATION_recall": 0.8461538461538461,
"eval_PERSON_f1": 0.887459807073955,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.8571428571428571,
"eval_PERSON_recall": 0.92,
"eval_QUANTITY_f1": 0.7500000000000001,
"eval_QUANTITY_number": 33,
"eval_QUANTITY_precision": 0.6923076923076923,
"eval_QUANTITY_recall": 0.8181818181818182,
"eval_TIME_f1": 0.8620689655172413,
"eval_TIME_number": 28,
"eval_TIME_precision": 0.8333333333333334,
"eval_TIME_recall": 0.8928571428571429,
"eval_loss": 0.1680927574634552,
"eval_overall_accuracy": 0.953443258971872,
"eval_overall_f1": 0.8105960264900663,
"eval_overall_precision": 0.75,
"eval_overall_recall": 0.8818443804034583,
"eval_runtime": 0.387,
"eval_samples_per_second": 483.206,
"eval_steps_per_second": 7.752,
"step": 4664
},
{
"epoch": 45.0,
"grad_norm": 1.7887659072875977,
"learning_rate": 2.7500000000000004e-05,
"loss": 0.0478,
"step": 4770
},
{
"epoch": 45.0,
"eval_LOCATION_f1": 0.8,
"eval_LOCATION_number": 71,
"eval_LOCATION_precision": 0.7380952380952381,
"eval_LOCATION_recall": 0.8732394366197183,
"eval_ORGANIZATION_f1": 0.7448275862068966,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.675,
"eval_ORGANIZATION_recall": 0.8307692307692308,
"eval_PERSON_f1": 0.8903225806451613,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.8625,
"eval_PERSON_recall": 0.92,
"eval_QUANTITY_f1": 0.7500000000000001,
"eval_QUANTITY_number": 33,
"eval_QUANTITY_precision": 0.6923076923076923,
"eval_QUANTITY_recall": 0.8181818181818182,
"eval_TIME_f1": 0.896551724137931,
"eval_TIME_number": 28,
"eval_TIME_precision": 0.8666666666666667,
"eval_TIME_recall": 0.9285714285714286,
"eval_loss": 0.16480599343776703,
"eval_overall_accuracy": 0.957807953443259,
"eval_overall_f1": 0.8297297297297298,
"eval_overall_precision": 0.7811704834605598,
"eval_overall_recall": 0.8847262247838616,
"eval_runtime": 0.3859,
"eval_samples_per_second": 484.601,
"eval_steps_per_second": 7.774,
"step": 4770
},
{
"epoch": 46.0,
"grad_norm": 0.7143243551254272,
"learning_rate": 2.7000000000000002e-05,
"loss": 0.0475,
"step": 4876
},
{
"epoch": 46.0,
"eval_LOCATION_f1": 0.7898089171974522,
"eval_LOCATION_number": 71,
"eval_LOCATION_precision": 0.7209302325581395,
"eval_LOCATION_recall": 0.8732394366197183,
"eval_ORGANIZATION_f1": 0.738255033557047,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.6547619047619048,
"eval_ORGANIZATION_recall": 0.8461538461538461,
"eval_PERSON_f1": 0.8903225806451613,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.8625,
"eval_PERSON_recall": 0.92,
"eval_QUANTITY_f1": 0.7605633802816901,
"eval_QUANTITY_number": 33,
"eval_QUANTITY_precision": 0.7105263157894737,
"eval_QUANTITY_recall": 0.8181818181818182,
"eval_TIME_f1": 0.8666666666666666,
"eval_TIME_number": 28,
"eval_TIME_precision": 0.8125,
"eval_TIME_recall": 0.9285714285714286,
"eval_loss": 0.15505646169185638,
"eval_overall_accuracy": 0.9580504364694471,
"eval_overall_f1": 0.824631860776439,
"eval_overall_precision": 0.77,
"eval_overall_recall": 0.8876080691642652,
"eval_runtime": 0.3863,
"eval_samples_per_second": 484.039,
"eval_steps_per_second": 7.765,
"step": 4876
},
{
"epoch": 47.0,
"grad_norm": 0.987457811832428,
"learning_rate": 2.6500000000000004e-05,
"loss": 0.0462,
"step": 4982
},
{
"epoch": 47.0,
"eval_LOCATION_f1": 0.8026315789473684,
"eval_LOCATION_number": 71,
"eval_LOCATION_precision": 0.7530864197530864,
"eval_LOCATION_recall": 0.8591549295774648,
"eval_ORGANIZATION_f1": 0.7189542483660131,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.625,
"eval_ORGANIZATION_recall": 0.8461538461538461,
"eval_PERSON_f1": 0.8782051282051282,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.845679012345679,
"eval_PERSON_recall": 0.9133333333333333,
"eval_QUANTITY_f1": 0.7428571428571429,
"eval_QUANTITY_number": 33,
"eval_QUANTITY_precision": 0.7027027027027027,
"eval_QUANTITY_recall": 0.7878787878787878,
"eval_TIME_f1": 0.8333333333333334,
"eval_TIME_number": 28,
"eval_TIME_precision": 0.78125,
"eval_TIME_recall": 0.8928571428571429,
"eval_loss": 0.16851799190044403,
"eval_overall_accuracy": 0.954898157129001,
"eval_overall_f1": 0.8139223560910308,
"eval_overall_precision": 0.76,
"eval_overall_recall": 0.8760806916426513,
"eval_runtime": 0.3876,
"eval_samples_per_second": 482.46,
"eval_steps_per_second": 7.74,
"step": 4982
},
{
"epoch": 48.0,
"grad_norm": 0.8889041543006897,
"learning_rate": 2.6000000000000002e-05,
"loss": 0.0467,
"step": 5088
},
{
"epoch": 48.0,
"eval_LOCATION_f1": 0.8129032258064516,
"eval_LOCATION_number": 71,
"eval_LOCATION_precision": 0.75,
"eval_LOCATION_recall": 0.8873239436619719,
"eval_ORGANIZATION_f1": 0.7333333333333334,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.6470588235294118,
"eval_ORGANIZATION_recall": 0.8461538461538461,
"eval_PERSON_f1": 0.8903225806451613,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.8625,
"eval_PERSON_recall": 0.92,
"eval_QUANTITY_f1": 0.7605633802816901,
"eval_QUANTITY_number": 33,
"eval_QUANTITY_precision": 0.7105263157894737,
"eval_QUANTITY_recall": 0.8181818181818182,
"eval_TIME_f1": 0.896551724137931,
"eval_TIME_number": 28,
"eval_TIME_precision": 0.8666666666666667,
"eval_TIME_recall": 0.9285714285714286,
"eval_loss": 0.17139677703380585,
"eval_overall_accuracy": 0.9573229873908826,
"eval_overall_f1": 0.8306451612903226,
"eval_overall_precision": 0.7783375314861462,
"eval_overall_recall": 0.8904899135446686,
"eval_runtime": 0.3868,
"eval_samples_per_second": 483.496,
"eval_steps_per_second": 7.757,
"step": 5088
},
{
"epoch": 49.0,
"grad_norm": 0.43323248624801636,
"learning_rate": 2.5500000000000003e-05,
"loss": 0.0462,
"step": 5194
},
{
"epoch": 49.0,
"eval_LOCATION_f1": 0.7973856209150327,
"eval_LOCATION_number": 71,
"eval_LOCATION_precision": 0.7439024390243902,
"eval_LOCATION_recall": 0.8591549295774648,
"eval_ORGANIZATION_f1": 0.7448275862068966,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.675,
"eval_ORGANIZATION_recall": 0.8307692307692308,
"eval_PERSON_f1": 0.887459807073955,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.8571428571428571,
"eval_PERSON_recall": 0.92,
"eval_QUANTITY_f1": 0.7714285714285715,
"eval_QUANTITY_number": 33,
"eval_QUANTITY_precision": 0.7297297297297297,
"eval_QUANTITY_recall": 0.8181818181818182,
"eval_TIME_f1": 0.8771929824561403,
"eval_TIME_number": 28,
"eval_TIME_precision": 0.8620689655172413,
"eval_TIME_recall": 0.8928571428571429,
"eval_loss": 0.1640593409538269,
"eval_overall_accuracy": 0.9575654704170709,
"eval_overall_f1": 0.8288043478260869,
"eval_overall_precision": 0.7840616966580977,
"eval_overall_recall": 0.8789625360230547,
"eval_runtime": 0.3874,
"eval_samples_per_second": 482.695,
"eval_steps_per_second": 7.744,
"step": 5194
},
{
"epoch": 50.0,
"grad_norm": 1.8610317707061768,
"learning_rate": 2.5e-05,
"loss": 0.0467,
"step": 5300
},
{
"epoch": 50.0,
"eval_LOCATION_f1": 0.8026315789473684,
"eval_LOCATION_number": 71,
"eval_LOCATION_precision": 0.7530864197530864,
"eval_LOCATION_recall": 0.8591549295774648,
"eval_ORGANIZATION_f1": 0.7297297297297298,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.6506024096385542,
"eval_ORGANIZATION_recall": 0.8307692307692308,
"eval_PERSON_f1": 0.8782051282051282,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.845679012345679,
"eval_PERSON_recall": 0.9133333333333333,
"eval_QUANTITY_f1": 0.7397260273972603,
"eval_QUANTITY_number": 33,
"eval_QUANTITY_precision": 0.675,
"eval_QUANTITY_recall": 0.8181818181818182,
"eval_TIME_f1": 0.8620689655172413,
"eval_TIME_number": 28,
"eval_TIME_precision": 0.8333333333333334,
"eval_TIME_recall": 0.8928571428571429,
"eval_loss": 0.16927781701087952,
"eval_overall_accuracy": 0.9556256062075654,
"eval_overall_f1": 0.8183041722745625,
"eval_overall_precision": 0.7676767676767676,
"eval_overall_recall": 0.8760806916426513,
"eval_runtime": 0.3864,
"eval_samples_per_second": 483.901,
"eval_steps_per_second": 7.763,
"step": 5300
},
{
"epoch": 51.0,
"grad_norm": 0.744925320148468,
"learning_rate": 2.45e-05,
"loss": 0.0437,
"step": 5406
},
{
"epoch": 51.0,
"eval_LOCATION_f1": 0.7898089171974522,
"eval_LOCATION_number": 71,
"eval_LOCATION_precision": 0.7209302325581395,
"eval_LOCATION_recall": 0.8732394366197183,
"eval_ORGANIZATION_f1": 0.6896551724137931,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.625,
"eval_ORGANIZATION_recall": 0.7692307692307693,
"eval_PERSON_f1": 0.8745980707395499,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.84472049689441,
"eval_PERSON_recall": 0.9066666666666666,
"eval_QUANTITY_f1": 0.7500000000000001,
"eval_QUANTITY_number": 33,
"eval_QUANTITY_precision": 0.6923076923076923,
"eval_QUANTITY_recall": 0.8181818181818182,
"eval_TIME_f1": 0.8620689655172413,
"eval_TIME_number": 28,
"eval_TIME_precision": 0.8333333333333334,
"eval_TIME_recall": 0.8928571428571429,
"eval_loss": 0.17594219744205475,
"eval_overall_accuracy": 0.9551406401551892,
"eval_overall_f1": 0.8075370121130553,
"eval_overall_precision": 0.7575757575757576,
"eval_overall_recall": 0.8645533141210374,
"eval_runtime": 0.3854,
"eval_samples_per_second": 485.269,
"eval_steps_per_second": 7.785,
"step": 5406
},
{
"epoch": 52.0,
"grad_norm": 0.9806845784187317,
"learning_rate": 2.4e-05,
"loss": 0.0435,
"step": 5512
},
{
"epoch": 52.0,
"eval_LOCATION_f1": 0.8025477707006369,
"eval_LOCATION_number": 71,
"eval_LOCATION_precision": 0.7325581395348837,
"eval_LOCATION_recall": 0.8873239436619719,
"eval_ORGANIZATION_f1": 0.7567567567567568,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.6746987951807228,
"eval_ORGANIZATION_recall": 0.8615384615384616,
"eval_PERSON_f1": 0.887459807073955,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.8571428571428571,
"eval_PERSON_recall": 0.92,
"eval_QUANTITY_f1": 0.7500000000000001,
"eval_QUANTITY_number": 33,
"eval_QUANTITY_precision": 0.6923076923076923,
"eval_QUANTITY_recall": 0.8181818181818182,
"eval_TIME_f1": 0.8474576271186439,
"eval_TIME_number": 28,
"eval_TIME_precision": 0.8064516129032258,
"eval_TIME_recall": 0.8928571428571429,
"eval_loss": 0.18336325883865356,
"eval_overall_accuracy": 0.9556256062075654,
"eval_overall_f1": 0.8273092369477911,
"eval_overall_precision": 0.7725,
"eval_overall_recall": 0.8904899135446686,
"eval_runtime": 0.387,
"eval_samples_per_second": 483.258,
"eval_steps_per_second": 7.753,
"step": 5512
},
{
"epoch": 53.0,
"grad_norm": 0.8235753178596497,
"learning_rate": 2.35e-05,
"loss": 0.0441,
"step": 5618
},
{
"epoch": 53.0,
"eval_LOCATION_f1": 0.8,
"eval_LOCATION_number": 71,
"eval_LOCATION_precision": 0.7380952380952381,
"eval_LOCATION_recall": 0.8732394366197183,
"eval_ORGANIZATION_f1": 0.7307692307692307,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.6263736263736264,
"eval_ORGANIZATION_recall": 0.8769230769230769,
"eval_PERSON_f1": 0.8910256410256411,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.8580246913580247,
"eval_PERSON_recall": 0.9266666666666666,
"eval_QUANTITY_f1": 0.7500000000000001,
"eval_QUANTITY_number": 33,
"eval_QUANTITY_precision": 0.6923076923076923,
"eval_QUANTITY_recall": 0.8181818181818182,
"eval_TIME_f1": 0.8813559322033899,
"eval_TIME_number": 28,
"eval_TIME_precision": 0.8387096774193549,
"eval_TIME_recall": 0.9285714285714286,
"eval_loss": 0.1896522045135498,
"eval_overall_accuracy": 0.9546556741028128,
"eval_overall_f1": 0.8249336870026525,
"eval_overall_precision": 0.7641277641277642,
"eval_overall_recall": 0.8962536023054755,
"eval_runtime": 0.3882,
"eval_samples_per_second": 481.674,
"eval_steps_per_second": 7.727,
"step": 5618
},
{
"epoch": 54.0,
"grad_norm": 0.6915778517723083,
"learning_rate": 2.3000000000000003e-05,
"loss": 0.042,
"step": 5724
},
{
"epoch": 54.0,
"eval_LOCATION_f1": 0.782051282051282,
"eval_LOCATION_number": 71,
"eval_LOCATION_precision": 0.7176470588235294,
"eval_LOCATION_recall": 0.8591549295774648,
"eval_ORGANIZATION_f1": 0.7402597402597403,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.6404494382022472,
"eval_ORGANIZATION_recall": 0.8769230769230769,
"eval_PERSON_f1": 0.8938906752411575,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.8633540372670807,
"eval_PERSON_recall": 0.9266666666666666,
"eval_QUANTITY_f1": 0.7397260273972603,
"eval_QUANTITY_number": 33,
"eval_QUANTITY_precision": 0.675,
"eval_QUANTITY_recall": 0.8181818181818182,
"eval_TIME_f1": 0.8333333333333334,
"eval_TIME_number": 28,
"eval_TIME_precision": 0.78125,
"eval_TIME_recall": 0.8928571428571429,
"eval_loss": 0.18752093613147736,
"eval_overall_accuracy": 0.9539282250242483,
"eval_overall_f1": 0.8196286472148541,
"eval_overall_precision": 0.7592137592137592,
"eval_overall_recall": 0.8904899135446686,
"eval_runtime": 0.3905,
"eval_samples_per_second": 478.818,
"eval_steps_per_second": 7.682,
"step": 5724
},
{
"epoch": 55.0,
"grad_norm": 0.8931111097335815,
"learning_rate": 2.25e-05,
"loss": 0.0414,
"step": 5830
},
{
"epoch": 55.0,
"eval_LOCATION_f1": 0.7974683544303797,
"eval_LOCATION_number": 71,
"eval_LOCATION_precision": 0.7241379310344828,
"eval_LOCATION_recall": 0.8873239436619719,
"eval_ORGANIZATION_f1": 0.6923076923076923,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.5934065934065934,
"eval_ORGANIZATION_recall": 0.8307692307692308,
"eval_PERSON_f1": 0.8846153846153846,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.8518518518518519,
"eval_PERSON_recall": 0.92,
"eval_QUANTITY_f1": 0.6842105263157895,
"eval_QUANTITY_number": 33,
"eval_QUANTITY_precision": 0.6046511627906976,
"eval_QUANTITY_recall": 0.7878787878787878,
"eval_TIME_f1": 0.8333333333333334,
"eval_TIME_number": 28,
"eval_TIME_precision": 0.78125,
"eval_TIME_recall": 0.8928571428571429,
"eval_loss": 0.18678565323352814,
"eval_overall_accuracy": 0.9544131910766246,
"eval_overall_f1": 0.8031496062992126,
"eval_overall_precision": 0.7373493975903614,
"eval_overall_recall": 0.8818443804034583,
"eval_runtime": 0.3856,
"eval_samples_per_second": 485.009,
"eval_steps_per_second": 7.781,
"step": 5830
},
{
"epoch": 56.0,
"grad_norm": 0.4860210418701172,
"learning_rate": 2.2000000000000003e-05,
"loss": 0.0408,
"step": 5936
},
{
"epoch": 56.0,
"eval_LOCATION_f1": 0.8104575163398693,
"eval_LOCATION_number": 71,
"eval_LOCATION_precision": 0.7560975609756098,
"eval_LOCATION_recall": 0.8732394366197183,
"eval_ORGANIZATION_f1": 0.7152317880794703,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.627906976744186,
"eval_ORGANIZATION_recall": 0.8307692307692308,
"eval_PERSON_f1": 0.8838709677419355,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.85625,
"eval_PERSON_recall": 0.9133333333333333,
"eval_QUANTITY_f1": 0.732394366197183,
"eval_QUANTITY_number": 33,
"eval_QUANTITY_precision": 0.6842105263157895,
"eval_QUANTITY_recall": 0.7878787878787878,
"eval_TIME_f1": 0.8333333333333334,
"eval_TIME_number": 28,
"eval_TIME_precision": 0.78125,
"eval_TIME_recall": 0.8928571428571429,
"eval_loss": 0.17208231985569,
"eval_overall_accuracy": 0.9556256062075654,
"eval_overall_f1": 0.8161073825503355,
"eval_overall_precision": 0.7638190954773869,
"eval_overall_recall": 0.8760806916426513,
"eval_runtime": 0.3889,
"eval_samples_per_second": 480.88,
"eval_steps_per_second": 7.715,
"step": 5936
},
{
"epoch": 57.0,
"grad_norm": 0.5651527047157288,
"learning_rate": 2.15e-05,
"loss": 0.0388,
"step": 6042
},
{
"epoch": 57.0,
"eval_LOCATION_f1": 0.8051948051948051,
"eval_LOCATION_number": 71,
"eval_LOCATION_precision": 0.7469879518072289,
"eval_LOCATION_recall": 0.8732394366197183,
"eval_ORGANIZATION_f1": 0.7222222222222222,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.6582278481012658,
"eval_ORGANIZATION_recall": 0.8,
"eval_PERSON_f1": 0.8938906752411575,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.8633540372670807,
"eval_PERSON_recall": 0.9266666666666666,
"eval_QUANTITY_f1": 0.7123287671232875,
"eval_QUANTITY_number": 33,
"eval_QUANTITY_precision": 0.65,
"eval_QUANTITY_recall": 0.7878787878787878,
"eval_TIME_f1": 0.8135593220338982,
"eval_TIME_number": 28,
"eval_TIME_precision": 0.7741935483870968,
"eval_TIME_recall": 0.8571428571428571,
"eval_loss": 0.18390165269374847,
"eval_overall_accuracy": 0.9565955383123181,
"eval_overall_f1": 0.8178137651821863,
"eval_overall_precision": 0.7690355329949239,
"eval_overall_recall": 0.8731988472622478,
"eval_runtime": 0.3888,
"eval_samples_per_second": 481.0,
"eval_steps_per_second": 7.717,
"step": 6042
},
{
"epoch": 58.0,
"grad_norm": 0.2999099791049957,
"learning_rate": 2.1e-05,
"loss": 0.039,
"step": 6148
},
{
"epoch": 58.0,
"eval_LOCATION_f1": 0.7894736842105262,
"eval_LOCATION_number": 71,
"eval_LOCATION_precision": 0.7407407407407407,
"eval_LOCATION_recall": 0.8450704225352113,
"eval_ORGANIZATION_f1": 0.7006369426751592,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.5978260869565217,
"eval_ORGANIZATION_recall": 0.8461538461538461,
"eval_PERSON_f1": 0.887459807073955,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.8571428571428571,
"eval_PERSON_recall": 0.92,
"eval_QUANTITY_f1": 0.7123287671232875,
"eval_QUANTITY_number": 33,
"eval_QUANTITY_precision": 0.65,
"eval_QUANTITY_recall": 0.7878787878787878,
"eval_TIME_f1": 0.8620689655172413,
"eval_TIME_number": 28,
"eval_TIME_precision": 0.8333333333333334,
"eval_TIME_recall": 0.8928571428571429,
"eval_loss": 0.17726965248584747,
"eval_overall_accuracy": 0.9527158098933075,
"eval_overall_f1": 0.8095872170439414,
"eval_overall_precision": 0.7524752475247525,
"eval_overall_recall": 0.8760806916426513,
"eval_runtime": 0.3872,
"eval_samples_per_second": 482.921,
"eval_steps_per_second": 7.747,
"step": 6148
},
{
"epoch": 59.0,
"grad_norm": 0.43868881464004517,
"learning_rate": 2.05e-05,
"loss": 0.0414,
"step": 6254
},
{
"epoch": 59.0,
"eval_LOCATION_f1": 0.8026315789473684,
"eval_LOCATION_number": 71,
"eval_LOCATION_precision": 0.7530864197530864,
"eval_LOCATION_recall": 0.8591549295774648,
"eval_ORGANIZATION_f1": 0.7297297297297298,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.6506024096385542,
"eval_ORGANIZATION_recall": 0.8307692307692308,
"eval_PERSON_f1": 0.8774193548387097,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.85,
"eval_PERSON_recall": 0.9066666666666666,
"eval_QUANTITY_f1": 0.7428571428571429,
"eval_QUANTITY_number": 33,
"eval_QUANTITY_precision": 0.7027027027027027,
"eval_QUANTITY_recall": 0.7878787878787878,
"eval_TIME_f1": 0.8620689655172413,
"eval_TIME_number": 28,
"eval_TIME_precision": 0.8333333333333334,
"eval_TIME_recall": 0.8928571428571429,
"eval_loss": 0.16531790792942047,
"eval_overall_accuracy": 0.957807953443259,
"eval_overall_f1": 0.8184281842818427,
"eval_overall_precision": 0.7723785166240409,
"eval_overall_recall": 0.8703170028818443,
"eval_runtime": 0.3889,
"eval_samples_per_second": 480.89,
"eval_steps_per_second": 7.715,
"step": 6254
},
{
"epoch": 60.0,
"grad_norm": 0.5318551659584045,
"learning_rate": 2e-05,
"loss": 0.0379,
"step": 6360
},
{
"epoch": 60.0,
"eval_LOCATION_f1": 0.7808219178082192,
"eval_LOCATION_number": 71,
"eval_LOCATION_precision": 0.76,
"eval_LOCATION_recall": 0.8028169014084507,
"eval_ORGANIZATION_f1": 0.7172413793103448,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.65,
"eval_ORGANIZATION_recall": 0.8,
"eval_PERSON_f1": 0.8810289389067525,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.8509316770186336,
"eval_PERSON_recall": 0.9133333333333333,
"eval_QUANTITY_f1": 0.7605633802816901,
"eval_QUANTITY_number": 33,
"eval_QUANTITY_precision": 0.7105263157894737,
"eval_QUANTITY_recall": 0.8181818181818182,
"eval_TIME_f1": 0.8474576271186439,
"eval_TIME_number": 28,
"eval_TIME_precision": 0.8064516129032258,
"eval_TIME_recall": 0.8928571428571429,
"eval_loss": 0.1694074124097824,
"eval_overall_accuracy": 0.9561105722599418,
"eval_overall_f1": 0.8142076502732241,
"eval_overall_precision": 0.7740259740259741,
"eval_overall_recall": 0.8587896253602305,
"eval_runtime": 0.3853,
"eval_samples_per_second": 485.37,
"eval_steps_per_second": 7.787,
"step": 6360
},
{
"epoch": 61.0,
"grad_norm": 1.2059674263000488,
"learning_rate": 1.9500000000000003e-05,
"loss": 0.0391,
"step": 6466
},
{
"epoch": 61.0,
"eval_LOCATION_f1": 0.8,
"eval_LOCATION_number": 71,
"eval_LOCATION_precision": 0.7380952380952381,
"eval_LOCATION_recall": 0.8732394366197183,
"eval_ORGANIZATION_f1": 0.7058823529411765,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.6136363636363636,
"eval_ORGANIZATION_recall": 0.8307692307692308,
"eval_PERSON_f1": 0.8910256410256411,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.8580246913580247,
"eval_PERSON_recall": 0.9266666666666666,
"eval_QUANTITY_f1": 0.7123287671232875,
"eval_QUANTITY_number": 33,
"eval_QUANTITY_precision": 0.65,
"eval_QUANTITY_recall": 0.7878787878787878,
"eval_TIME_f1": 0.8474576271186439,
"eval_TIME_number": 28,
"eval_TIME_precision": 0.8064516129032258,
"eval_TIME_recall": 0.8928571428571429,
"eval_loss": 0.1873074322938919,
"eval_overall_accuracy": 0.9551406401551892,
"eval_overall_f1": 0.8138297872340426,
"eval_overall_precision": 0.7555555555555555,
"eval_overall_recall": 0.8818443804034583,
"eval_runtime": 0.393,
"eval_samples_per_second": 475.865,
"eval_steps_per_second": 7.634,
"step": 6466
},
{
"epoch": 62.0,
"grad_norm": 0.812824010848999,
"learning_rate": 1.9e-05,
"loss": 0.0372,
"step": 6572
},
{
"epoch": 62.0,
"eval_LOCATION_f1": 0.7948717948717949,
"eval_LOCATION_number": 71,
"eval_LOCATION_precision": 0.7294117647058823,
"eval_LOCATION_recall": 0.8732394366197183,
"eval_ORGANIZATION_f1": 0.7248322147651007,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.6428571428571429,
"eval_ORGANIZATION_recall": 0.8307692307692308,
"eval_PERSON_f1": 0.8774193548387097,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.85,
"eval_PERSON_recall": 0.9066666666666666,
"eval_QUANTITY_f1": 0.7500000000000001,
"eval_QUANTITY_number": 33,
"eval_QUANTITY_precision": 0.6923076923076923,
"eval_QUANTITY_recall": 0.8181818181818182,
"eval_TIME_f1": 0.8813559322033899,
"eval_TIME_number": 28,
"eval_TIME_precision": 0.8387096774193549,
"eval_TIME_recall": 0.9285714285714286,
"eval_loss": 0.17852064967155457,
"eval_overall_accuracy": 0.9558680892337537,
"eval_overall_f1": 0.8176943699731903,
"eval_overall_precision": 0.7644110275689223,
"eval_overall_recall": 0.8789625360230547,
"eval_runtime": 0.3865,
"eval_samples_per_second": 483.888,
"eval_steps_per_second": 7.763,
"step": 6572
},
{
"epoch": 63.0,
"grad_norm": 0.8590715527534485,
"learning_rate": 1.85e-05,
"loss": 0.0371,
"step": 6678
},
{
"epoch": 63.0,
"eval_LOCATION_f1": 0.7922077922077921,
"eval_LOCATION_number": 71,
"eval_LOCATION_precision": 0.7349397590361446,
"eval_LOCATION_recall": 0.8591549295774648,
"eval_ORGANIZATION_f1": 0.738255033557047,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.6547619047619048,
"eval_ORGANIZATION_recall": 0.8461538461538461,
"eval_PERSON_f1": 0.8838709677419355,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.85625,
"eval_PERSON_recall": 0.9133333333333333,
"eval_QUANTITY_f1": 0.7605633802816901,
"eval_QUANTITY_number": 33,
"eval_QUANTITY_precision": 0.7105263157894737,
"eval_QUANTITY_recall": 0.8181818181818182,
"eval_TIME_f1": 0.8771929824561403,
"eval_TIME_number": 28,
"eval_TIME_precision": 0.8620689655172413,
"eval_TIME_recall": 0.8928571428571429,
"eval_loss": 0.17511434853076935,
"eval_overall_accuracy": 0.9568380213385063,
"eval_overall_f1": 0.8232118758434548,
"eval_overall_precision": 0.7741116751269036,
"eval_overall_recall": 0.8789625360230547,
"eval_runtime": 0.3898,
"eval_samples_per_second": 479.785,
"eval_steps_per_second": 7.697,
"step": 6678
},
{
"epoch": 64.0,
"grad_norm": 0.4557998478412628,
"learning_rate": 1.8e-05,
"loss": 0.0348,
"step": 6784
},
{
"epoch": 64.0,
"eval_LOCATION_f1": 0.8,
"eval_LOCATION_number": 71,
"eval_LOCATION_precision": 0.7380952380952381,
"eval_LOCATION_recall": 0.8732394366197183,
"eval_ORGANIZATION_f1": 0.7248322147651007,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.6428571428571429,
"eval_ORGANIZATION_recall": 0.8307692307692308,
"eval_PERSON_f1": 0.8938906752411575,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.8633540372670807,
"eval_PERSON_recall": 0.9266666666666666,
"eval_QUANTITY_f1": 0.7714285714285715,
"eval_QUANTITY_number": 33,
"eval_QUANTITY_precision": 0.7297297297297297,
"eval_QUANTITY_recall": 0.8181818181818182,
"eval_TIME_f1": 0.8474576271186439,
"eval_TIME_number": 28,
"eval_TIME_precision": 0.8064516129032258,
"eval_TIME_recall": 0.8928571428571429,
"eval_loss": 0.1811322569847107,
"eval_overall_accuracy": 0.9561105722599418,
"eval_overall_f1": 0.825268817204301,
"eval_overall_precision": 0.7732997481108312,
"eval_overall_recall": 0.8847262247838616,
"eval_runtime": 0.3884,
"eval_samples_per_second": 481.467,
"eval_steps_per_second": 7.724,
"step": 6784
},
{
"epoch": 65.0,
"grad_norm": 0.6341075897216797,
"learning_rate": 1.75e-05,
"loss": 0.0338,
"step": 6890
},
{
"epoch": 65.0,
"eval_LOCATION_f1": 0.7922077922077921,
"eval_LOCATION_number": 71,
"eval_LOCATION_precision": 0.7349397590361446,
"eval_LOCATION_recall": 0.8591549295774648,
"eval_ORGANIZATION_f1": 0.7417218543046358,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.6511627906976745,
"eval_ORGANIZATION_recall": 0.8615384615384616,
"eval_PERSON_f1": 0.887459807073955,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.8571428571428571,
"eval_PERSON_recall": 0.92,
"eval_QUANTITY_f1": 0.7428571428571429,
"eval_QUANTITY_number": 33,
"eval_QUANTITY_precision": 0.7027027027027027,
"eval_QUANTITY_recall": 0.7878787878787878,
"eval_TIME_f1": 0.8333333333333334,
"eval_TIME_number": 28,
"eval_TIME_precision": 0.78125,
"eval_TIME_recall": 0.8928571428571429,
"eval_loss": 0.1845623105764389,
"eval_overall_accuracy": 0.9561105722599418,
"eval_overall_f1": 0.8203753351206434,
"eval_overall_precision": 0.7669172932330827,
"eval_overall_recall": 0.8818443804034583,
"eval_runtime": 0.3877,
"eval_samples_per_second": 482.316,
"eval_steps_per_second": 7.738,
"step": 6890
},
{
"epoch": 66.0,
"grad_norm": 0.8572676777839661,
"learning_rate": 1.7000000000000003e-05,
"loss": 0.033,
"step": 6996
},
{
"epoch": 66.0,
"eval_LOCATION_f1": 0.7848101265822784,
"eval_LOCATION_number": 71,
"eval_LOCATION_precision": 0.7126436781609196,
"eval_LOCATION_recall": 0.8732394366197183,
"eval_ORGANIZATION_f1": 0.728476821192053,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.6395348837209303,
"eval_ORGANIZATION_recall": 0.8461538461538461,
"eval_PERSON_f1": 0.8910256410256411,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.8580246913580247,
"eval_PERSON_recall": 0.9266666666666666,
"eval_QUANTITY_f1": 0.7500000000000001,
"eval_QUANTITY_number": 33,
"eval_QUANTITY_precision": 0.6923076923076923,
"eval_QUANTITY_recall": 0.8181818181818182,
"eval_TIME_f1": 0.8666666666666666,
"eval_TIME_number": 28,
"eval_TIME_precision": 0.8125,
"eval_TIME_recall": 0.9285714285714286,
"eval_loss": 0.1916947364807129,
"eval_overall_accuracy": 0.9553831231813773,
"eval_overall_f1": 0.8207171314741034,
"eval_overall_precision": 0.7610837438423645,
"eval_overall_recall": 0.8904899135446686,
"eval_runtime": 0.3895,
"eval_samples_per_second": 480.163,
"eval_steps_per_second": 7.703,
"step": 6996
},
{
"epoch": 67.0,
"grad_norm": 0.2351032942533493,
"learning_rate": 1.65e-05,
"loss": 0.0347,
"step": 7102
},
{
"epoch": 67.0,
"eval_LOCATION_f1": 0.8079470198675496,
"eval_LOCATION_number": 71,
"eval_LOCATION_precision": 0.7625,
"eval_LOCATION_recall": 0.8591549295774648,
"eval_ORGANIZATION_f1": 0.7019867549668873,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.6162790697674418,
"eval_ORGANIZATION_recall": 0.8153846153846154,
"eval_PERSON_f1": 0.8838709677419355,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.85625,
"eval_PERSON_recall": 0.9133333333333333,
"eval_QUANTITY_f1": 0.7605633802816901,
"eval_QUANTITY_number": 33,
"eval_QUANTITY_precision": 0.7105263157894737,
"eval_QUANTITY_recall": 0.8181818181818182,
"eval_TIME_f1": 0.8771929824561403,
"eval_TIME_number": 28,
"eval_TIME_precision": 0.8620689655172413,
"eval_TIME_recall": 0.8928571428571429,
"eval_loss": 0.18072670698165894,
"eval_overall_accuracy": 0.9570805043646945,
"eval_overall_f1": 0.8189189189189189,
"eval_overall_precision": 0.7709923664122137,
"eval_overall_recall": 0.8731988472622478,
"eval_runtime": 0.3888,
"eval_samples_per_second": 481.006,
"eval_steps_per_second": 7.717,
"step": 7102
},
{
"epoch": 68.0,
"grad_norm": 0.4664683938026428,
"learning_rate": 1.6000000000000003e-05,
"loss": 0.034,
"step": 7208
},
{
"epoch": 68.0,
"eval_LOCATION_f1": 0.782051282051282,
"eval_LOCATION_number": 71,
"eval_LOCATION_precision": 0.7176470588235294,
"eval_LOCATION_recall": 0.8591549295774648,
"eval_ORGANIZATION_f1": 0.738255033557047,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.6547619047619048,
"eval_ORGANIZATION_recall": 0.8461538461538461,
"eval_PERSON_f1": 0.8896103896103896,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.8670886075949367,
"eval_PERSON_recall": 0.9133333333333333,
"eval_QUANTITY_f1": 0.7200000000000001,
"eval_QUANTITY_number": 33,
"eval_QUANTITY_precision": 0.6428571428571429,
"eval_QUANTITY_recall": 0.8181818181818182,
"eval_TIME_f1": 0.8474576271186439,
"eval_TIME_number": 28,
"eval_TIME_precision": 0.8064516129032258,
"eval_TIME_recall": 0.8928571428571429,
"eval_loss": 0.1870609074831009,
"eval_overall_accuracy": 0.9558680892337537,
"eval_overall_f1": 0.8165997322623828,
"eval_overall_precision": 0.7625,
"eval_overall_recall": 0.8789625360230547,
"eval_runtime": 0.3882,
"eval_samples_per_second": 481.675,
"eval_steps_per_second": 7.727,
"step": 7208
},
{
"epoch": 69.0,
"grad_norm": 0.3841381072998047,
"learning_rate": 1.55e-05,
"loss": 0.0319,
"step": 7314
},
{
"epoch": 69.0,
"eval_LOCATION_f1": 0.775,
"eval_LOCATION_number": 71,
"eval_LOCATION_precision": 0.6966292134831461,
"eval_LOCATION_recall": 0.8732394366197183,
"eval_ORGANIZATION_f1": 0.726027397260274,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.654320987654321,
"eval_ORGANIZATION_recall": 0.8153846153846154,
"eval_PERSON_f1": 0.8910256410256411,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.8580246913580247,
"eval_PERSON_recall": 0.9266666666666666,
"eval_QUANTITY_f1": 0.7605633802816901,
"eval_QUANTITY_number": 33,
"eval_QUANTITY_precision": 0.7105263157894737,
"eval_QUANTITY_recall": 0.8181818181818182,
"eval_TIME_f1": 0.8474576271186439,
"eval_TIME_number": 28,
"eval_TIME_precision": 0.8064516129032258,
"eval_TIME_recall": 0.8928571428571429,
"eval_loss": 0.18617138266563416,
"eval_overall_accuracy": 0.954898157129001,
"eval_overall_f1": 0.8181818181818181,
"eval_overall_precision": 0.7630922693266833,
"eval_overall_recall": 0.8818443804034583,
"eval_runtime": 0.3893,
"eval_samples_per_second": 480.405,
"eval_steps_per_second": 7.707,
"step": 7314
},
{
"epoch": 70.0,
"grad_norm": 0.48607921600341797,
"learning_rate": 1.5e-05,
"loss": 0.0338,
"step": 7420
},
{
"epoch": 70.0,
"eval_LOCATION_f1": 0.7948717948717949,
"eval_LOCATION_number": 71,
"eval_LOCATION_precision": 0.7294117647058823,
"eval_LOCATION_recall": 0.8732394366197183,
"eval_ORGANIZATION_f1": 0.7199999999999999,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.6352941176470588,
"eval_ORGANIZATION_recall": 0.8307692307692308,
"eval_PERSON_f1": 0.896774193548387,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.86875,
"eval_PERSON_recall": 0.9266666666666666,
"eval_QUANTITY_f1": 0.7397260273972603,
"eval_QUANTITY_number": 33,
"eval_QUANTITY_precision": 0.675,
"eval_QUANTITY_recall": 0.8181818181818182,
"eval_TIME_f1": 0.896551724137931,
"eval_TIME_number": 28,
"eval_TIME_precision": 0.8666666666666667,
"eval_TIME_recall": 0.9285714285714286,
"eval_loss": 0.1894809454679489,
"eval_overall_accuracy": 0.9570805043646945,
"eval_overall_f1": 0.824631860776439,
"eval_overall_precision": 0.77,
"eval_overall_recall": 0.8876080691642652,
"eval_runtime": 0.3875,
"eval_samples_per_second": 482.595,
"eval_steps_per_second": 7.742,
"step": 7420
},
{
"epoch": 71.0,
"grad_norm": 0.6728916168212891,
"learning_rate": 1.45e-05,
"loss": 0.0306,
"step": 7526
},
{
"epoch": 71.0,
"eval_LOCATION_f1": 0.7948717948717949,
"eval_LOCATION_number": 71,
"eval_LOCATION_precision": 0.7294117647058823,
"eval_LOCATION_recall": 0.8732394366197183,
"eval_ORGANIZATION_f1": 0.728476821192053,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.6395348837209303,
"eval_ORGANIZATION_recall": 0.8461538461538461,
"eval_PERSON_f1": 0.896774193548387,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.86875,
"eval_PERSON_recall": 0.9266666666666666,
"eval_QUANTITY_f1": 0.7397260273972603,
"eval_QUANTITY_number": 33,
"eval_QUANTITY_precision": 0.675,
"eval_QUANTITY_recall": 0.8181818181818182,
"eval_TIME_f1": 0.819672131147541,
"eval_TIME_number": 28,
"eval_TIME_precision": 0.7575757575757576,
"eval_TIME_recall": 0.8928571428571429,
"eval_loss": 0.20611025393009186,
"eval_overall_accuracy": 0.9558680892337537,
"eval_overall_f1": 0.8202396804260986,
"eval_overall_precision": 0.7623762376237624,
"eval_overall_recall": 0.8876080691642652,
"eval_runtime": 0.3866,
"eval_samples_per_second": 483.747,
"eval_steps_per_second": 7.761,
"step": 7526
},
{
"epoch": 72.0,
"grad_norm": 0.954484760761261,
"learning_rate": 1.4000000000000001e-05,
"loss": 0.0343,
"step": 7632
},
{
"epoch": 72.0,
"eval_LOCATION_f1": 0.7721518987341772,
"eval_LOCATION_number": 71,
"eval_LOCATION_precision": 0.7011494252873564,
"eval_LOCATION_recall": 0.8591549295774648,
"eval_ORGANIZATION_f1": 0.7417218543046358,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.6511627906976745,
"eval_ORGANIZATION_recall": 0.8615384615384616,
"eval_PERSON_f1": 0.8938906752411575,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.8633540372670807,
"eval_PERSON_recall": 0.9266666666666666,
"eval_QUANTITY_f1": 0.7397260273972603,
"eval_QUANTITY_number": 33,
"eval_QUANTITY_precision": 0.675,
"eval_QUANTITY_recall": 0.8181818181818182,
"eval_TIME_f1": 0.8620689655172413,
"eval_TIME_number": 28,
"eval_TIME_precision": 0.8333333333333334,
"eval_TIME_recall": 0.8928571428571429,
"eval_loss": 0.19823096692562103,
"eval_overall_accuracy": 0.9541707080504365,
"eval_overall_f1": 0.8202396804260986,
"eval_overall_precision": 0.7623762376237624,
"eval_overall_recall": 0.8876080691642652,
"eval_runtime": 0.3914,
"eval_samples_per_second": 477.758,
"eval_steps_per_second": 7.665,
"step": 7632
},
{
"epoch": 73.0,
"grad_norm": 0.27965471148490906,
"learning_rate": 1.3500000000000001e-05,
"loss": 0.0308,
"step": 7738
},
{
"epoch": 73.0,
"eval_LOCATION_f1": 0.782051282051282,
"eval_LOCATION_number": 71,
"eval_LOCATION_precision": 0.7176470588235294,
"eval_LOCATION_recall": 0.8591549295774648,
"eval_ORGANIZATION_f1": 0.7586206896551724,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.6875,
"eval_ORGANIZATION_recall": 0.8461538461538461,
"eval_PERSON_f1": 0.896774193548387,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.86875,
"eval_PERSON_recall": 0.9266666666666666,
"eval_QUANTITY_f1": 0.732394366197183,
"eval_QUANTITY_number": 33,
"eval_QUANTITY_precision": 0.6842105263157895,
"eval_QUANTITY_recall": 0.7878787878787878,
"eval_TIME_f1": 0.8333333333333334,
"eval_TIME_number": 28,
"eval_TIME_precision": 0.78125,
"eval_TIME_recall": 0.8928571428571429,
"eval_loss": 0.19675639271736145,
"eval_overall_accuracy": 0.9573229873908826,
"eval_overall_f1": 0.8247978436657682,
"eval_overall_precision": 0.7746835443037975,
"eval_overall_recall": 0.8818443804034583,
"eval_runtime": 0.3896,
"eval_samples_per_second": 480.01,
"eval_steps_per_second": 7.701,
"step": 7738
},
{
"epoch": 74.0,
"grad_norm": 1.283292531967163,
"learning_rate": 1.3000000000000001e-05,
"loss": 0.0328,
"step": 7844
},
{
"epoch": 74.0,
"eval_LOCATION_f1": 0.7770700636942676,
"eval_LOCATION_number": 71,
"eval_LOCATION_precision": 0.7093023255813954,
"eval_LOCATION_recall": 0.8591549295774648,
"eval_ORGANIZATION_f1": 0.726027397260274,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.654320987654321,
"eval_ORGANIZATION_recall": 0.8153846153846154,
"eval_PERSON_f1": 0.8938906752411575,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.8633540372670807,
"eval_PERSON_recall": 0.9266666666666666,
"eval_QUANTITY_f1": 0.7428571428571429,
"eval_QUANTITY_number": 33,
"eval_QUANTITY_precision": 0.7027027027027027,
"eval_QUANTITY_recall": 0.7878787878787878,
"eval_TIME_f1": 0.8333333333333334,
"eval_TIME_number": 28,
"eval_TIME_precision": 0.78125,
"eval_TIME_recall": 0.8928571428571429,
"eval_loss": 0.19934506714344025,
"eval_overall_accuracy": 0.95635305528613,
"eval_overall_f1": 0.8172043010752689,
"eval_overall_precision": 0.7657430730478589,
"eval_overall_recall": 0.8760806916426513,
"eval_runtime": 0.3876,
"eval_samples_per_second": 482.397,
"eval_steps_per_second": 7.739,
"step": 7844
},
{
"epoch": 75.0,
"grad_norm": 1.0608142614364624,
"learning_rate": 1.25e-05,
"loss": 0.0328,
"step": 7950
},
{
"epoch": 75.0,
"eval_LOCATION_f1": 0.7741935483870968,
"eval_LOCATION_number": 71,
"eval_LOCATION_precision": 0.7142857142857143,
"eval_LOCATION_recall": 0.8450704225352113,
"eval_ORGANIZATION_f1": 0.7333333333333334,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.6470588235294118,
"eval_ORGANIZATION_recall": 0.8461538461538461,
"eval_PERSON_f1": 0.8867313915857605,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.8616352201257862,
"eval_PERSON_recall": 0.9133333333333333,
"eval_QUANTITY_f1": 0.7428571428571429,
"eval_QUANTITY_number": 33,
"eval_QUANTITY_precision": 0.7027027027027027,
"eval_QUANTITY_recall": 0.7878787878787878,
"eval_TIME_f1": 0.8333333333333334,
"eval_TIME_number": 28,
"eval_TIME_precision": 0.78125,
"eval_TIME_recall": 0.8928571428571429,
"eval_loss": 0.19247645139694214,
"eval_overall_accuracy": 0.9558680892337537,
"eval_overall_f1": 0.814516129032258,
"eval_overall_precision": 0.7632241813602015,
"eval_overall_recall": 0.8731988472622478,
"eval_runtime": 0.3884,
"eval_samples_per_second": 481.515,
"eval_steps_per_second": 7.725,
"step": 7950
},
{
"epoch": 76.0,
"grad_norm": 0.5310276746749878,
"learning_rate": 1.2e-05,
"loss": 0.0314,
"step": 8056
},
{
"epoch": 76.0,
"eval_LOCATION_f1": 0.7631578947368421,
"eval_LOCATION_number": 71,
"eval_LOCATION_precision": 0.7160493827160493,
"eval_LOCATION_recall": 0.8169014084507042,
"eval_ORGANIZATION_f1": 0.738255033557047,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.6547619047619048,
"eval_ORGANIZATION_recall": 0.8461538461538461,
"eval_PERSON_f1": 0.8903225806451613,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.8625,
"eval_PERSON_recall": 0.92,
"eval_QUANTITY_f1": 0.732394366197183,
"eval_QUANTITY_number": 33,
"eval_QUANTITY_precision": 0.6842105263157895,
"eval_QUANTITY_recall": 0.7878787878787878,
"eval_TIME_f1": 0.8474576271186439,
"eval_TIME_number": 28,
"eval_TIME_precision": 0.8064516129032258,
"eval_TIME_recall": 0.8928571428571429,
"eval_loss": 0.19101466238498688,
"eval_overall_accuracy": 0.9553831231813773,
"eval_overall_f1": 0.8151147098515519,
"eval_overall_precision": 0.766497461928934,
"eval_overall_recall": 0.8703170028818443,
"eval_runtime": 0.389,
"eval_samples_per_second": 480.741,
"eval_steps_per_second": 7.712,
"step": 8056
},
{
"epoch": 77.0,
"grad_norm": 0.7759119868278503,
"learning_rate": 1.1500000000000002e-05,
"loss": 0.0304,
"step": 8162
},
{
"epoch": 77.0,
"eval_LOCATION_f1": 0.7721518987341772,
"eval_LOCATION_number": 71,
"eval_LOCATION_precision": 0.7011494252873564,
"eval_LOCATION_recall": 0.8591549295774648,
"eval_ORGANIZATION_f1": 0.7027027027027027,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.6265060240963856,
"eval_ORGANIZATION_recall": 0.8,
"eval_PERSON_f1": 0.8753993610223643,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.8404907975460123,
"eval_PERSON_recall": 0.9133333333333333,
"eval_QUANTITY_f1": 0.7428571428571429,
"eval_QUANTITY_number": 33,
"eval_QUANTITY_precision": 0.7027027027027027,
"eval_QUANTITY_recall": 0.7878787878787878,
"eval_TIME_f1": 0.8333333333333334,
"eval_TIME_number": 28,
"eval_TIME_precision": 0.78125,
"eval_TIME_recall": 0.8928571428571429,
"eval_loss": 0.19821016490459442,
"eval_overall_accuracy": 0.9544131910766246,
"eval_overall_f1": 0.8037383177570094,
"eval_overall_precision": 0.7487562189054726,
"eval_overall_recall": 0.8674351585014409,
"eval_runtime": 0.3876,
"eval_samples_per_second": 482.51,
"eval_steps_per_second": 7.741,
"step": 8162
},
{
"epoch": 78.0,
"grad_norm": 0.5382179021835327,
"learning_rate": 1.1000000000000001e-05,
"loss": 0.0318,
"step": 8268
},
{
"epoch": 78.0,
"eval_LOCATION_f1": 0.7721518987341772,
"eval_LOCATION_number": 71,
"eval_LOCATION_precision": 0.7011494252873564,
"eval_LOCATION_recall": 0.8591549295774648,
"eval_ORGANIZATION_f1": 0.7105263157894737,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.6206896551724138,
"eval_ORGANIZATION_recall": 0.8307692307692308,
"eval_PERSON_f1": 0.8817891373801918,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.8466257668711656,
"eval_PERSON_recall": 0.92,
"eval_QUANTITY_f1": 0.6578947368421053,
"eval_QUANTITY_number": 33,
"eval_QUANTITY_precision": 0.5813953488372093,
"eval_QUANTITY_recall": 0.7575757575757576,
"eval_TIME_f1": 0.8474576271186439,
"eval_TIME_number": 28,
"eval_TIME_precision": 0.8064516129032258,
"eval_TIME_recall": 0.8928571428571429,
"eval_loss": 0.2088189721107483,
"eval_overall_accuracy": 0.9527158098933075,
"eval_overall_f1": 0.7994722955145119,
"eval_overall_precision": 0.7372262773722628,
"eval_overall_recall": 0.8731988472622478,
"eval_runtime": 0.3895,
"eval_samples_per_second": 480.105,
"eval_steps_per_second": 7.702,
"step": 8268
},
{
"epoch": 79.0,
"grad_norm": 0.7348619103431702,
"learning_rate": 1.05e-05,
"loss": 0.0303,
"step": 8374
},
{
"epoch": 79.0,
"eval_LOCATION_f1": 0.7721518987341772,
"eval_LOCATION_number": 71,
"eval_LOCATION_precision": 0.7011494252873564,
"eval_LOCATION_recall": 0.8591549295774648,
"eval_ORGANIZATION_f1": 0.726027397260274,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.654320987654321,
"eval_ORGANIZATION_recall": 0.8153846153846154,
"eval_PERSON_f1": 0.8817891373801918,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.8466257668711656,
"eval_PERSON_recall": 0.92,
"eval_QUANTITY_f1": 0.704225352112676,
"eval_QUANTITY_number": 33,
"eval_QUANTITY_precision": 0.6578947368421053,
"eval_QUANTITY_recall": 0.7575757575757576,
"eval_TIME_f1": 0.8333333333333334,
"eval_TIME_number": 28,
"eval_TIME_precision": 0.78125,
"eval_TIME_recall": 0.8928571428571429,
"eval_loss": 0.20289956033229828,
"eval_overall_accuracy": 0.9539282250242483,
"eval_overall_f1": 0.8074866310160428,
"eval_overall_precision": 0.7531172069825436,
"eval_overall_recall": 0.8703170028818443,
"eval_runtime": 0.392,
"eval_samples_per_second": 476.992,
"eval_steps_per_second": 7.652,
"step": 8374
},
{
"epoch": 80.0,
"grad_norm": 0.42746540904045105,
"learning_rate": 1e-05,
"loss": 0.0289,
"step": 8480
},
{
"epoch": 80.0,
"eval_LOCATION_f1": 0.7682119205298014,
"eval_LOCATION_number": 71,
"eval_LOCATION_precision": 0.725,
"eval_LOCATION_recall": 0.8169014084507042,
"eval_ORGANIZATION_f1": 0.7210884353741497,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.6463414634146342,
"eval_ORGANIZATION_recall": 0.8153846153846154,
"eval_PERSON_f1": 0.8782051282051282,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.845679012345679,
"eval_PERSON_recall": 0.9133333333333333,
"eval_QUANTITY_f1": 0.6944444444444444,
"eval_QUANTITY_number": 33,
"eval_QUANTITY_precision": 0.6410256410256411,
"eval_QUANTITY_recall": 0.7575757575757576,
"eval_TIME_f1": 0.8333333333333334,
"eval_TIME_number": 28,
"eval_TIME_precision": 0.78125,
"eval_TIME_recall": 0.8928571428571429,
"eval_loss": 0.2005331665277481,
"eval_overall_accuracy": 0.9539282250242483,
"eval_overall_f1": 0.8032345013477089,
"eval_overall_precision": 0.7544303797468355,
"eval_overall_recall": 0.8587896253602305,
"eval_runtime": 0.3897,
"eval_samples_per_second": 479.848,
"eval_steps_per_second": 7.698,
"step": 8480
},
{
"epoch": 81.0,
"grad_norm": 0.303906112909317,
"learning_rate": 9.5e-06,
"loss": 0.0283,
"step": 8586
},
{
"epoch": 81.0,
"eval_LOCATION_f1": 0.7692307692307694,
"eval_LOCATION_number": 71,
"eval_LOCATION_precision": 0.7058823529411765,
"eval_LOCATION_recall": 0.8450704225352113,
"eval_ORGANIZATION_f1": 0.7448275862068966,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.675,
"eval_ORGANIZATION_recall": 0.8307692307692308,
"eval_PERSON_f1": 0.8838709677419355,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.85625,
"eval_PERSON_recall": 0.9133333333333333,
"eval_QUANTITY_f1": 0.704225352112676,
"eval_QUANTITY_number": 33,
"eval_QUANTITY_precision": 0.6578947368421053,
"eval_QUANTITY_recall": 0.7575757575757576,
"eval_TIME_f1": 0.8333333333333334,
"eval_TIME_number": 28,
"eval_TIME_precision": 0.78125,
"eval_TIME_recall": 0.8928571428571429,
"eval_loss": 0.20049220323562622,
"eval_overall_accuracy": 0.9558680892337537,
"eval_overall_f1": 0.8113207547169812,
"eval_overall_precision": 0.7620253164556962,
"eval_overall_recall": 0.8674351585014409,
"eval_runtime": 0.3866,
"eval_samples_per_second": 483.757,
"eval_steps_per_second": 7.761,
"step": 8586
},
{
"epoch": 82.0,
"grad_norm": 1.8275718688964844,
"learning_rate": 9e-06,
"loss": 0.0303,
"step": 8692
},
{
"epoch": 82.0,
"eval_LOCATION_f1": 0.7922077922077921,
"eval_LOCATION_number": 71,
"eval_LOCATION_precision": 0.7349397590361446,
"eval_LOCATION_recall": 0.8591549295774648,
"eval_ORGANIZATION_f1": 0.7333333333333334,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.6470588235294118,
"eval_ORGANIZATION_recall": 0.8461538461538461,
"eval_PERSON_f1": 0.8838709677419355,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.85625,
"eval_PERSON_recall": 0.9133333333333333,
"eval_QUANTITY_f1": 0.7142857142857142,
"eval_QUANTITY_number": 33,
"eval_QUANTITY_precision": 0.6756756756756757,
"eval_QUANTITY_recall": 0.7575757575757576,
"eval_TIME_f1": 0.8620689655172413,
"eval_TIME_number": 28,
"eval_TIME_precision": 0.8333333333333334,
"eval_TIME_recall": 0.8928571428571429,
"eval_loss": 0.19804218411445618,
"eval_overall_accuracy": 0.9570805043646945,
"eval_overall_f1": 0.8167115902964959,
"eval_overall_precision": 0.7670886075949367,
"eval_overall_recall": 0.8731988472622478,
"eval_runtime": 0.3912,
"eval_samples_per_second": 478.031,
"eval_steps_per_second": 7.669,
"step": 8692
},
{
"epoch": 83.0,
"grad_norm": 3.0445024967193604,
"learning_rate": 8.500000000000002e-06,
"loss": 0.0281,
"step": 8798
},
{
"epoch": 83.0,
"eval_LOCATION_f1": 0.7843137254901961,
"eval_LOCATION_number": 71,
"eval_LOCATION_precision": 0.7317073170731707,
"eval_LOCATION_recall": 0.8450704225352113,
"eval_ORGANIZATION_f1": 0.7346938775510204,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.6585365853658537,
"eval_ORGANIZATION_recall": 0.8307692307692308,
"eval_PERSON_f1": 0.8810289389067525,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.8509316770186336,
"eval_PERSON_recall": 0.9133333333333333,
"eval_QUANTITY_f1": 0.704225352112676,
"eval_QUANTITY_number": 33,
"eval_QUANTITY_precision": 0.6578947368421053,
"eval_QUANTITY_recall": 0.7575757575757576,
"eval_TIME_f1": 0.8333333333333334,
"eval_TIME_number": 28,
"eval_TIME_precision": 0.78125,
"eval_TIME_recall": 0.8928571428571429,
"eval_loss": 0.19731304049491882,
"eval_overall_accuracy": 0.9551406401551892,
"eval_overall_f1": 0.8113207547169812,
"eval_overall_precision": 0.7620253164556962,
"eval_overall_recall": 0.8674351585014409,
"eval_runtime": 0.3907,
"eval_samples_per_second": 478.583,
"eval_steps_per_second": 7.678,
"step": 8798
},
{
"epoch": 84.0,
"grad_norm": 0.6099753379821777,
"learning_rate": 8.000000000000001e-06,
"loss": 0.0281,
"step": 8904
},
{
"epoch": 84.0,
"eval_LOCATION_f1": 0.7848101265822784,
"eval_LOCATION_number": 71,
"eval_LOCATION_precision": 0.7126436781609196,
"eval_LOCATION_recall": 0.8732394366197183,
"eval_ORGANIZATION_f1": 0.7432432432432433,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.6626506024096386,
"eval_ORGANIZATION_recall": 0.8461538461538461,
"eval_PERSON_f1": 0.8846153846153846,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.8518518518518519,
"eval_PERSON_recall": 0.92,
"eval_QUANTITY_f1": 0.7142857142857142,
"eval_QUANTITY_number": 33,
"eval_QUANTITY_precision": 0.6756756756756757,
"eval_QUANTITY_recall": 0.7575757575757576,
"eval_TIME_f1": 0.8474576271186439,
"eval_TIME_number": 28,
"eval_TIME_precision": 0.8064516129032258,
"eval_TIME_recall": 0.8928571428571429,
"eval_loss": 0.20074868202209473,
"eval_overall_accuracy": 0.9570805043646945,
"eval_overall_f1": 0.8165997322623828,
"eval_overall_precision": 0.7625,
"eval_overall_recall": 0.8789625360230547,
"eval_runtime": 0.3897,
"eval_samples_per_second": 479.814,
"eval_steps_per_second": 7.698,
"step": 8904
},
{
"epoch": 85.0,
"grad_norm": 0.7372535467147827,
"learning_rate": 7.5e-06,
"loss": 0.0291,
"step": 9010
},
{
"epoch": 85.0,
"eval_LOCATION_f1": 0.7692307692307694,
"eval_LOCATION_number": 71,
"eval_LOCATION_precision": 0.7058823529411765,
"eval_LOCATION_recall": 0.8450704225352113,
"eval_ORGANIZATION_f1": 0.738255033557047,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.6547619047619048,
"eval_ORGANIZATION_recall": 0.8461538461538461,
"eval_PERSON_f1": 0.8846153846153846,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.8518518518518519,
"eval_PERSON_recall": 0.92,
"eval_QUANTITY_f1": 0.7142857142857142,
"eval_QUANTITY_number": 33,
"eval_QUANTITY_precision": 0.6756756756756757,
"eval_QUANTITY_recall": 0.7575757575757576,
"eval_TIME_f1": 0.8474576271186439,
"eval_TIME_number": 28,
"eval_TIME_precision": 0.8064516129032258,
"eval_TIME_recall": 0.8928571428571429,
"eval_loss": 0.20446744561195374,
"eval_overall_accuracy": 0.9553831231813773,
"eval_overall_f1": 0.8123324396782842,
"eval_overall_precision": 0.7593984962406015,
"eval_overall_recall": 0.8731988472622478,
"eval_runtime": 0.3955,
"eval_samples_per_second": 472.842,
"eval_steps_per_second": 7.586,
"step": 9010
},
{
"epoch": 86.0,
"grad_norm": 0.5419071316719055,
"learning_rate": 7.000000000000001e-06,
"loss": 0.0286,
"step": 9116
},
{
"epoch": 86.0,
"eval_LOCATION_f1": 0.8051948051948051,
"eval_LOCATION_number": 71,
"eval_LOCATION_precision": 0.7469879518072289,
"eval_LOCATION_recall": 0.8732394366197183,
"eval_ORGANIZATION_f1": 0.7466666666666668,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.6588235294117647,
"eval_ORGANIZATION_recall": 0.8615384615384616,
"eval_PERSON_f1": 0.8838709677419355,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.85625,
"eval_PERSON_recall": 0.9133333333333333,
"eval_QUANTITY_f1": 0.7428571428571429,
"eval_QUANTITY_number": 33,
"eval_QUANTITY_precision": 0.7027027027027027,
"eval_QUANTITY_recall": 0.7878787878787878,
"eval_TIME_f1": 0.8620689655172413,
"eval_TIME_number": 28,
"eval_TIME_precision": 0.8333333333333334,
"eval_TIME_recall": 0.8928571428571429,
"eval_loss": 0.19124767184257507,
"eval_overall_accuracy": 0.9587778855480117,
"eval_overall_f1": 0.8247978436657682,
"eval_overall_precision": 0.7746835443037975,
"eval_overall_recall": 0.8818443804034583,
"eval_runtime": 0.3984,
"eval_samples_per_second": 469.353,
"eval_steps_per_second": 7.53,
"step": 9116
},
{
"epoch": 87.0,
"grad_norm": 1.295188546180725,
"learning_rate": 6.5000000000000004e-06,
"loss": 0.0267,
"step": 9222
},
{
"epoch": 87.0,
"eval_LOCATION_f1": 0.782051282051282,
"eval_LOCATION_number": 71,
"eval_LOCATION_precision": 0.7176470588235294,
"eval_LOCATION_recall": 0.8591549295774648,
"eval_ORGANIZATION_f1": 0.7466666666666668,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.6588235294117647,
"eval_ORGANIZATION_recall": 0.8615384615384616,
"eval_PERSON_f1": 0.896774193548387,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.86875,
"eval_PERSON_recall": 0.9266666666666666,
"eval_QUANTITY_f1": 0.7428571428571429,
"eval_QUANTITY_number": 33,
"eval_QUANTITY_precision": 0.7027027027027027,
"eval_QUANTITY_recall": 0.7878787878787878,
"eval_TIME_f1": 0.8474576271186439,
"eval_TIME_number": 28,
"eval_TIME_precision": 0.8064516129032258,
"eval_TIME_recall": 0.8928571428571429,
"eval_loss": 0.1960640400648117,
"eval_overall_accuracy": 0.9575654704170709,
"eval_overall_f1": 0.8241610738255033,
"eval_overall_precision": 0.7713567839195979,
"eval_overall_recall": 0.8847262247838616,
"eval_runtime": 0.3949,
"eval_samples_per_second": 473.507,
"eval_steps_per_second": 7.596,
"step": 9222
},
{
"epoch": 88.0,
"grad_norm": 0.27405989170074463,
"learning_rate": 6e-06,
"loss": 0.0282,
"step": 9328
},
{
"epoch": 88.0,
"eval_LOCATION_f1": 0.782051282051282,
"eval_LOCATION_number": 71,
"eval_LOCATION_precision": 0.7176470588235294,
"eval_LOCATION_recall": 0.8591549295774648,
"eval_ORGANIZATION_f1": 0.7567567567567568,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.6746987951807228,
"eval_ORGANIZATION_recall": 0.8615384615384616,
"eval_PERSON_f1": 0.8867313915857605,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.8616352201257862,
"eval_PERSON_recall": 0.9133333333333333,
"eval_QUANTITY_f1": 0.6849315068493151,
"eval_QUANTITY_number": 33,
"eval_QUANTITY_precision": 0.625,
"eval_QUANTITY_recall": 0.7575757575757576,
"eval_TIME_f1": 0.8333333333333334,
"eval_TIME_number": 28,
"eval_TIME_precision": 0.78125,
"eval_TIME_recall": 0.8928571428571429,
"eval_loss": 0.19417804479599,
"eval_overall_accuracy": 0.9570805043646945,
"eval_overall_f1": 0.8150134048257373,
"eval_overall_precision": 0.7619047619047619,
"eval_overall_recall": 0.8760806916426513,
"eval_runtime": 0.3924,
"eval_samples_per_second": 476.565,
"eval_steps_per_second": 7.645,
"step": 9328
},
{
"epoch": 89.0,
"grad_norm": 0.466235876083374,
"learning_rate": 5.500000000000001e-06,
"loss": 0.0251,
"step": 9434
},
{
"epoch": 89.0,
"eval_LOCATION_f1": 0.7948717948717949,
"eval_LOCATION_number": 71,
"eval_LOCATION_precision": 0.7294117647058823,
"eval_LOCATION_recall": 0.8732394366197183,
"eval_ORGANIZATION_f1": 0.7619047619047619,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.6829268292682927,
"eval_ORGANIZATION_recall": 0.8615384615384616,
"eval_PERSON_f1": 0.8903225806451613,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.8625,
"eval_PERSON_recall": 0.92,
"eval_QUANTITY_f1": 0.6849315068493151,
"eval_QUANTITY_number": 33,
"eval_QUANTITY_precision": 0.625,
"eval_QUANTITY_recall": 0.7575757575757576,
"eval_TIME_f1": 0.8333333333333334,
"eval_TIME_number": 28,
"eval_TIME_precision": 0.78125,
"eval_TIME_recall": 0.8928571428571429,
"eval_loss": 0.2023736834526062,
"eval_overall_accuracy": 0.95635305528613,
"eval_overall_f1": 0.8203753351206434,
"eval_overall_precision": 0.7669172932330827,
"eval_overall_recall": 0.8818443804034583,
"eval_runtime": 0.3932,
"eval_samples_per_second": 475.644,
"eval_steps_per_second": 7.631,
"step": 9434
},
{
"epoch": 90.0,
"grad_norm": 0.620521068572998,
"learning_rate": 5e-06,
"loss": 0.027,
"step": 9540
},
{
"epoch": 90.0,
"eval_LOCATION_f1": 0.8051948051948051,
"eval_LOCATION_number": 71,
"eval_LOCATION_precision": 0.7469879518072289,
"eval_LOCATION_recall": 0.8732394366197183,
"eval_ORGANIZATION_f1": 0.7567567567567568,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.6746987951807228,
"eval_ORGANIZATION_recall": 0.8615384615384616,
"eval_PERSON_f1": 0.8838709677419355,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.85625,
"eval_PERSON_recall": 0.9133333333333333,
"eval_QUANTITY_f1": 0.7714285714285715,
"eval_QUANTITY_number": 33,
"eval_QUANTITY_precision": 0.7297297297297297,
"eval_QUANTITY_recall": 0.8181818181818182,
"eval_TIME_f1": 0.8620689655172413,
"eval_TIME_number": 28,
"eval_TIME_precision": 0.8333333333333334,
"eval_TIME_recall": 0.8928571428571429,
"eval_loss": 0.19653601944446564,
"eval_overall_accuracy": 0.9582929194956353,
"eval_overall_f1": 0.8297297297297298,
"eval_overall_precision": 0.7811704834605598,
"eval_overall_recall": 0.8847262247838616,
"eval_runtime": 0.3926,
"eval_samples_per_second": 476.265,
"eval_steps_per_second": 7.641,
"step": 9540
},
{
"epoch": 91.0,
"grad_norm": 1.394244909286499,
"learning_rate": 4.5e-06,
"loss": 0.0268,
"step": 9646
},
{
"epoch": 91.0,
"eval_LOCATION_f1": 0.7741935483870968,
"eval_LOCATION_number": 71,
"eval_LOCATION_precision": 0.7142857142857143,
"eval_LOCATION_recall": 0.8450704225352113,
"eval_ORGANIZATION_f1": 0.7567567567567568,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.6746987951807228,
"eval_ORGANIZATION_recall": 0.8615384615384616,
"eval_PERSON_f1": 0.887459807073955,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.8571428571428571,
"eval_PERSON_recall": 0.92,
"eval_QUANTITY_f1": 0.7605633802816901,
"eval_QUANTITY_number": 33,
"eval_QUANTITY_precision": 0.7105263157894737,
"eval_QUANTITY_recall": 0.8181818181818182,
"eval_TIME_f1": 0.8620689655172413,
"eval_TIME_number": 28,
"eval_TIME_precision": 0.8333333333333334,
"eval_TIME_recall": 0.8928571428571429,
"eval_loss": 0.2078668475151062,
"eval_overall_accuracy": 0.9561105722599418,
"eval_overall_f1": 0.8236877523553162,
"eval_overall_precision": 0.7727272727272727,
"eval_overall_recall": 0.8818443804034583,
"eval_runtime": 0.3926,
"eval_samples_per_second": 476.299,
"eval_steps_per_second": 7.641,
"step": 9646
},
{
"epoch": 92.0,
"grad_norm": 0.33064666390419006,
"learning_rate": 4.000000000000001e-06,
"loss": 0.0256,
"step": 9752
},
{
"epoch": 92.0,
"eval_LOCATION_f1": 0.8076923076923077,
"eval_LOCATION_number": 71,
"eval_LOCATION_precision": 0.7411764705882353,
"eval_LOCATION_recall": 0.8873239436619719,
"eval_ORGANIZATION_f1": 0.7466666666666668,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.6588235294117647,
"eval_ORGANIZATION_recall": 0.8615384615384616,
"eval_PERSON_f1": 0.8903225806451613,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.8625,
"eval_PERSON_recall": 0.92,
"eval_QUANTITY_f1": 0.7428571428571429,
"eval_QUANTITY_number": 33,
"eval_QUANTITY_precision": 0.7027027027027027,
"eval_QUANTITY_recall": 0.7878787878787878,
"eval_TIME_f1": 0.8333333333333334,
"eval_TIME_number": 28,
"eval_TIME_precision": 0.78125,
"eval_TIME_recall": 0.8928571428571429,
"eval_loss": 0.19762425124645233,
"eval_overall_accuracy": 0.957807953443259,
"eval_overall_f1": 0.8257372654155496,
"eval_overall_precision": 0.7719298245614035,
"eval_overall_recall": 0.8876080691642652,
"eval_runtime": 0.3911,
"eval_samples_per_second": 478.123,
"eval_steps_per_second": 7.67,
"step": 9752
},
{
"epoch": 93.0,
"grad_norm": 0.47633665800094604,
"learning_rate": 3.5000000000000004e-06,
"loss": 0.0258,
"step": 9858
},
{
"epoch": 93.0,
"eval_LOCATION_f1": 0.8051948051948051,
"eval_LOCATION_number": 71,
"eval_LOCATION_precision": 0.7469879518072289,
"eval_LOCATION_recall": 0.8732394366197183,
"eval_ORGANIZATION_f1": 0.7417218543046358,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.6511627906976745,
"eval_ORGANIZATION_recall": 0.8615384615384616,
"eval_PERSON_f1": 0.8838709677419355,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.85625,
"eval_PERSON_recall": 0.9133333333333333,
"eval_QUANTITY_f1": 0.7428571428571429,
"eval_QUANTITY_number": 33,
"eval_QUANTITY_precision": 0.7027027027027027,
"eval_QUANTITY_recall": 0.7878787878787878,
"eval_TIME_f1": 0.8333333333333334,
"eval_TIME_number": 28,
"eval_TIME_precision": 0.78125,
"eval_TIME_recall": 0.8928571428571429,
"eval_loss": 0.1961781531572342,
"eval_overall_accuracy": 0.957807953443259,
"eval_overall_f1": 0.8214765100671141,
"eval_overall_precision": 0.7688442211055276,
"eval_overall_recall": 0.8818443804034583,
"eval_runtime": 0.3912,
"eval_samples_per_second": 478.005,
"eval_steps_per_second": 7.669,
"step": 9858
},
{
"epoch": 94.0,
"grad_norm": 0.8689398169517517,
"learning_rate": 3e-06,
"loss": 0.0233,
"step": 9964
},
{
"epoch": 94.0,
"eval_LOCATION_f1": 0.8,
"eval_LOCATION_number": 71,
"eval_LOCATION_precision": 0.7380952380952381,
"eval_LOCATION_recall": 0.8732394366197183,
"eval_ORGANIZATION_f1": 0.7466666666666668,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.6588235294117647,
"eval_ORGANIZATION_recall": 0.8615384615384616,
"eval_PERSON_f1": 0.8838709677419355,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.85625,
"eval_PERSON_recall": 0.9133333333333333,
"eval_QUANTITY_f1": 0.7428571428571429,
"eval_QUANTITY_number": 33,
"eval_QUANTITY_precision": 0.7027027027027027,
"eval_QUANTITY_recall": 0.7878787878787878,
"eval_TIME_f1": 0.8333333333333334,
"eval_TIME_number": 28,
"eval_TIME_precision": 0.78125,
"eval_TIME_recall": 0.8928571428571429,
"eval_loss": 0.19755157828330994,
"eval_overall_accuracy": 0.9570805043646945,
"eval_overall_f1": 0.8214765100671141,
"eval_overall_precision": 0.7688442211055276,
"eval_overall_recall": 0.8818443804034583,
"eval_runtime": 0.3938,
"eval_samples_per_second": 474.89,
"eval_steps_per_second": 7.619,
"step": 9964
},
{
"epoch": 95.0,
"grad_norm": 0.12069670855998993,
"learning_rate": 2.5e-06,
"loss": 0.0259,
"step": 10070
},
{
"epoch": 95.0,
"eval_LOCATION_f1": 0.8,
"eval_LOCATION_number": 71,
"eval_LOCATION_precision": 0.7380952380952381,
"eval_LOCATION_recall": 0.8732394366197183,
"eval_ORGANIZATION_f1": 0.7482993197278912,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.6707317073170732,
"eval_ORGANIZATION_recall": 0.8461538461538461,
"eval_PERSON_f1": 0.8838709677419355,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.85625,
"eval_PERSON_recall": 0.9133333333333333,
"eval_QUANTITY_f1": 0.7428571428571429,
"eval_QUANTITY_number": 33,
"eval_QUANTITY_precision": 0.7027027027027027,
"eval_QUANTITY_recall": 0.7878787878787878,
"eval_TIME_f1": 0.8333333333333334,
"eval_TIME_number": 28,
"eval_TIME_precision": 0.78125,
"eval_TIME_recall": 0.8928571428571429,
"eval_loss": 0.19969353079795837,
"eval_overall_accuracy": 0.9582929194956353,
"eval_overall_f1": 0.8221024258760108,
"eval_overall_precision": 0.7721518987341772,
"eval_overall_recall": 0.8789625360230547,
"eval_runtime": 0.3908,
"eval_samples_per_second": 478.563,
"eval_steps_per_second": 7.677,
"step": 10070
},
{
"epoch": 96.0,
"grad_norm": 0.6587622761726379,
"learning_rate": 2.0000000000000003e-06,
"loss": 0.0253,
"step": 10176
},
{
"epoch": 96.0,
"eval_LOCATION_f1": 0.782051282051282,
"eval_LOCATION_number": 71,
"eval_LOCATION_precision": 0.7176470588235294,
"eval_LOCATION_recall": 0.8591549295774648,
"eval_ORGANIZATION_f1": 0.7516778523489933,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.6666666666666666,
"eval_ORGANIZATION_recall": 0.8615384615384616,
"eval_PERSON_f1": 0.887459807073955,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.8571428571428571,
"eval_PERSON_recall": 0.92,
"eval_QUANTITY_f1": 0.7428571428571429,
"eval_QUANTITY_number": 33,
"eval_QUANTITY_precision": 0.7027027027027027,
"eval_QUANTITY_recall": 0.7878787878787878,
"eval_TIME_f1": 0.8333333333333334,
"eval_TIME_number": 28,
"eval_TIME_precision": 0.78125,
"eval_TIME_recall": 0.8928571428571429,
"eval_loss": 0.20329639315605164,
"eval_overall_accuracy": 0.95635305528613,
"eval_overall_f1": 0.8203753351206434,
"eval_overall_precision": 0.7669172932330827,
"eval_overall_recall": 0.8818443804034583,
"eval_runtime": 0.391,
"eval_samples_per_second": 478.228,
"eval_steps_per_second": 7.672,
"step": 10176
},
{
"epoch": 97.0,
"grad_norm": 0.5734129548072815,
"learning_rate": 1.5e-06,
"loss": 0.0251,
"step": 10282
},
{
"epoch": 97.0,
"eval_LOCATION_f1": 0.7870967741935485,
"eval_LOCATION_number": 71,
"eval_LOCATION_precision": 0.7261904761904762,
"eval_LOCATION_recall": 0.8591549295774648,
"eval_ORGANIZATION_f1": 0.7516778523489933,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.6666666666666666,
"eval_ORGANIZATION_recall": 0.8615384615384616,
"eval_PERSON_f1": 0.8903225806451613,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.8625,
"eval_PERSON_recall": 0.92,
"eval_QUANTITY_f1": 0.7428571428571429,
"eval_QUANTITY_number": 33,
"eval_QUANTITY_precision": 0.7027027027027027,
"eval_QUANTITY_recall": 0.7878787878787878,
"eval_TIME_f1": 0.8333333333333334,
"eval_TIME_number": 28,
"eval_TIME_precision": 0.78125,
"eval_TIME_recall": 0.8928571428571429,
"eval_loss": 0.20106351375579834,
"eval_overall_accuracy": 0.9573229873908826,
"eval_overall_f1": 0.8225806451612904,
"eval_overall_precision": 0.7707808564231738,
"eval_overall_recall": 0.8818443804034583,
"eval_runtime": 0.3918,
"eval_samples_per_second": 477.341,
"eval_steps_per_second": 7.658,
"step": 10282
},
{
"epoch": 98.0,
"grad_norm": 0.6452818512916565,
"learning_rate": 1.0000000000000002e-06,
"loss": 0.0237,
"step": 10388
},
{
"epoch": 98.0,
"eval_LOCATION_f1": 0.7948717948717949,
"eval_LOCATION_number": 71,
"eval_LOCATION_precision": 0.7294117647058823,
"eval_LOCATION_recall": 0.8732394366197183,
"eval_ORGANIZATION_f1": 0.7417218543046358,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.6511627906976745,
"eval_ORGANIZATION_recall": 0.8615384615384616,
"eval_PERSON_f1": 0.8938906752411575,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.8633540372670807,
"eval_PERSON_recall": 0.9266666666666666,
"eval_QUANTITY_f1": 0.7428571428571429,
"eval_QUANTITY_number": 33,
"eval_QUANTITY_precision": 0.7027027027027027,
"eval_QUANTITY_recall": 0.7878787878787878,
"eval_TIME_f1": 0.8333333333333334,
"eval_TIME_number": 28,
"eval_TIME_precision": 0.78125,
"eval_TIME_recall": 0.8928571428571429,
"eval_loss": 0.20484283566474915,
"eval_overall_accuracy": 0.9565955383123181,
"eval_overall_f1": 0.823529411764706,
"eval_overall_precision": 0.7680798004987531,
"eval_overall_recall": 0.8876080691642652,
"eval_runtime": 0.3905,
"eval_samples_per_second": 478.82,
"eval_steps_per_second": 7.682,
"step": 10388
},
{
"epoch": 99.0,
"grad_norm": 0.052759163081645966,
"learning_rate": 5.000000000000001e-07,
"loss": 0.024,
"step": 10494
},
{
"epoch": 99.0,
"eval_LOCATION_f1": 0.8,
"eval_LOCATION_number": 71,
"eval_LOCATION_precision": 0.7380952380952381,
"eval_LOCATION_recall": 0.8732394366197183,
"eval_ORGANIZATION_f1": 0.7516778523489933,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.6666666666666666,
"eval_ORGANIZATION_recall": 0.8615384615384616,
"eval_PERSON_f1": 0.8938906752411575,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.8633540372670807,
"eval_PERSON_recall": 0.9266666666666666,
"eval_QUANTITY_f1": 0.7428571428571429,
"eval_QUANTITY_number": 33,
"eval_QUANTITY_precision": 0.7027027027027027,
"eval_QUANTITY_recall": 0.7878787878787878,
"eval_TIME_f1": 0.8333333333333334,
"eval_TIME_number": 28,
"eval_TIME_precision": 0.78125,
"eval_TIME_recall": 0.8928571428571429,
"eval_loss": 0.20229747891426086,
"eval_overall_accuracy": 0.9573229873908826,
"eval_overall_f1": 0.8268456375838926,
"eval_overall_precision": 0.7738693467336684,
"eval_overall_recall": 0.8876080691642652,
"eval_runtime": 0.3938,
"eval_samples_per_second": 474.901,
"eval_steps_per_second": 7.619,
"step": 10494
},
{
"epoch": 100.0,
"grad_norm": 0.5731909871101379,
"learning_rate": 0.0,
"loss": 0.0257,
"step": 10600
},
{
"epoch": 100.0,
"eval_LOCATION_f1": 0.8,
"eval_LOCATION_number": 71,
"eval_LOCATION_precision": 0.7380952380952381,
"eval_LOCATION_recall": 0.8732394366197183,
"eval_ORGANIZATION_f1": 0.7567567567567568,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.6746987951807228,
"eval_ORGANIZATION_recall": 0.8615384615384616,
"eval_PERSON_f1": 0.8938906752411575,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.8633540372670807,
"eval_PERSON_recall": 0.9266666666666666,
"eval_QUANTITY_f1": 0.7428571428571429,
"eval_QUANTITY_number": 33,
"eval_QUANTITY_precision": 0.7027027027027027,
"eval_QUANTITY_recall": 0.7878787878787878,
"eval_TIME_f1": 0.8333333333333334,
"eval_TIME_number": 28,
"eval_TIME_precision": 0.78125,
"eval_TIME_recall": 0.8928571428571429,
"eval_loss": 0.2022850662469864,
"eval_overall_accuracy": 0.9575654704170709,
"eval_overall_f1": 0.8279569892473119,
"eval_overall_precision": 0.7758186397984886,
"eval_overall_recall": 0.8876080691642652,
"eval_runtime": 0.3925,
"eval_samples_per_second": 476.464,
"eval_steps_per_second": 7.644,
"step": 10600
},
{
"epoch": 100.0,
"step": 10600,
"total_flos": 5123217774191952.0,
"train_loss": 0.07238403747666557,
"train_runtime": 634.3549,
"train_samples_per_second": 266.097,
"train_steps_per_second": 16.71
}
],
"logging_steps": 500,
"max_steps": 10600,
"num_input_tokens_seen": 0,
"num_train_epochs": 100,
"save_steps": 500,
"total_flos": 5123217774191952.0,
"train_batch_size": 16,
"trial_name": null,
"trial_params": null
}