nerugm-lora-r8-2 / trainer_state.json
apwic's picture
End of training
59470e3 verified
raw
history blame
144 kB
{
"best_metric": null,
"best_model_checkpoint": null,
"epoch": 100.0,
"eval_steps": 500,
"global_step": 10600,
"is_hyper_param_search": false,
"is_local_process_zero": true,
"is_world_process_zero": true,
"log_history": [
{
"epoch": 1.0,
"grad_norm": 1.7324131727218628,
"learning_rate": 4.9500000000000004e-05,
"loss": 1.2621,
"step": 106
},
{
"epoch": 1.0,
"eval_LOCATION_f1": 0.0,
"eval_LOCATION_number": 72,
"eval_LOCATION_precision": 0.0,
"eval_LOCATION_recall": 0.0,
"eval_ORGANIZATION_f1": 0.0,
"eval_ORGANIZATION_number": 75,
"eval_ORGANIZATION_precision": 0.0,
"eval_ORGANIZATION_recall": 0.0,
"eval_PERSON_f1": 0.0,
"eval_PERSON_number": 143,
"eval_PERSON_precision": 0.0,
"eval_PERSON_recall": 0.0,
"eval_QUANTITY_f1": 0.0,
"eval_QUANTITY_number": 23,
"eval_QUANTITY_precision": 0.0,
"eval_QUANTITY_recall": 0.0,
"eval_TIME_f1": 0.0,
"eval_TIME_number": 26,
"eval_TIME_precision": 0.0,
"eval_TIME_recall": 0.0,
"eval_loss": 0.7093822360038757,
"eval_overall_accuracy": 0.8448836627470603,
"eval_overall_f1": 0.0,
"eval_overall_precision": 0.0,
"eval_overall_recall": 0.0,
"eval_runtime": 1.1248,
"eval_samples_per_second": 166.252,
"eval_steps_per_second": 2.667,
"step": 106
},
{
"epoch": 2.0,
"grad_norm": 1.321110725402832,
"learning_rate": 4.9e-05,
"loss": 0.7066,
"step": 212
},
{
"epoch": 2.0,
"eval_LOCATION_f1": 0.0,
"eval_LOCATION_number": 72,
"eval_LOCATION_precision": 0.0,
"eval_LOCATION_recall": 0.0,
"eval_ORGANIZATION_f1": 0.0,
"eval_ORGANIZATION_number": 75,
"eval_ORGANIZATION_precision": 0.0,
"eval_ORGANIZATION_recall": 0.0,
"eval_PERSON_f1": 0.0,
"eval_PERSON_number": 143,
"eval_PERSON_precision": 0.0,
"eval_PERSON_recall": 0.0,
"eval_QUANTITY_f1": 0.0,
"eval_QUANTITY_number": 23,
"eval_QUANTITY_precision": 0.0,
"eval_QUANTITY_recall": 0.0,
"eval_TIME_f1": 0.0,
"eval_TIME_number": 26,
"eval_TIME_precision": 0.0,
"eval_TIME_recall": 0.0,
"eval_loss": 0.5970483422279358,
"eval_overall_accuracy": 0.845634225669252,
"eval_overall_f1": 0.0,
"eval_overall_precision": 0.0,
"eval_overall_recall": 0.0,
"eval_runtime": 0.9359,
"eval_samples_per_second": 199.818,
"eval_steps_per_second": 3.206,
"step": 212
},
{
"epoch": 3.0,
"grad_norm": 1.2591755390167236,
"learning_rate": 4.85e-05,
"loss": 0.6211,
"step": 318
},
{
"epoch": 3.0,
"eval_LOCATION_f1": 0.02702702702702703,
"eval_LOCATION_number": 72,
"eval_LOCATION_precision": 0.5,
"eval_LOCATION_recall": 0.013888888888888888,
"eval_ORGANIZATION_f1": 0.0,
"eval_ORGANIZATION_number": 75,
"eval_ORGANIZATION_precision": 0.0,
"eval_ORGANIZATION_recall": 0.0,
"eval_PERSON_f1": 0.06211180124223603,
"eval_PERSON_number": 143,
"eval_PERSON_precision": 0.2777777777777778,
"eval_PERSON_recall": 0.03496503496503497,
"eval_QUANTITY_f1": 0.0,
"eval_QUANTITY_number": 23,
"eval_QUANTITY_precision": 0.0,
"eval_QUANTITY_recall": 0.0,
"eval_TIME_f1": 0.0,
"eval_TIME_number": 26,
"eval_TIME_precision": 0.0,
"eval_TIME_recall": 0.0,
"eval_loss": 0.5052209496498108,
"eval_overall_accuracy": 0.8516387290467851,
"eval_overall_f1": 0.03252032520325203,
"eval_overall_precision": 0.2,
"eval_overall_recall": 0.017699115044247787,
"eval_runtime": 0.9647,
"eval_samples_per_second": 193.841,
"eval_steps_per_second": 3.11,
"step": 318
},
{
"epoch": 4.0,
"grad_norm": 1.9562969207763672,
"learning_rate": 4.8e-05,
"loss": 0.5308,
"step": 424
},
{
"epoch": 4.0,
"eval_LOCATION_f1": 0.14457831325301204,
"eval_LOCATION_number": 72,
"eval_LOCATION_precision": 0.5454545454545454,
"eval_LOCATION_recall": 0.08333333333333333,
"eval_ORGANIZATION_f1": 0.02197802197802198,
"eval_ORGANIZATION_number": 75,
"eval_ORGANIZATION_precision": 0.0625,
"eval_ORGANIZATION_recall": 0.013333333333333334,
"eval_PERSON_f1": 0.31666666666666665,
"eval_PERSON_number": 143,
"eval_PERSON_precision": 0.3917525773195876,
"eval_PERSON_recall": 0.26573426573426573,
"eval_QUANTITY_f1": 0.0,
"eval_QUANTITY_number": 23,
"eval_QUANTITY_precision": 0.0,
"eval_QUANTITY_recall": 0.0,
"eval_TIME_f1": 0.3181818181818182,
"eval_TIME_number": 26,
"eval_TIME_precision": 0.3888888888888889,
"eval_TIME_recall": 0.2692307692307692,
"eval_loss": 0.4113342761993408,
"eval_overall_accuracy": 0.879909932449337,
"eval_overall_f1": 0.2162162162162162,
"eval_overall_precision": 0.36619718309859156,
"eval_overall_recall": 0.15339233038348082,
"eval_runtime": 0.9301,
"eval_samples_per_second": 201.053,
"eval_steps_per_second": 3.225,
"step": 424
},
{
"epoch": 5.0,
"grad_norm": 1.885956883430481,
"learning_rate": 4.75e-05,
"loss": 0.427,
"step": 530
},
{
"epoch": 5.0,
"eval_LOCATION_f1": 0.4424778761061947,
"eval_LOCATION_number": 72,
"eval_LOCATION_precision": 0.6097560975609756,
"eval_LOCATION_recall": 0.3472222222222222,
"eval_ORGANIZATION_f1": 0.27272727272727276,
"eval_ORGANIZATION_number": 75,
"eval_ORGANIZATION_precision": 0.42857142857142855,
"eval_ORGANIZATION_recall": 0.2,
"eval_PERSON_f1": 0.6179401993355481,
"eval_PERSON_number": 143,
"eval_PERSON_precision": 0.5886075949367089,
"eval_PERSON_recall": 0.6503496503496503,
"eval_QUANTITY_f1": 0.0,
"eval_QUANTITY_number": 23,
"eval_QUANTITY_precision": 0.0,
"eval_QUANTITY_recall": 0.0,
"eval_TIME_f1": 0.6382978723404256,
"eval_TIME_number": 26,
"eval_TIME_precision": 0.7142857142857143,
"eval_TIME_recall": 0.5769230769230769,
"eval_loss": 0.3248092830181122,
"eval_overall_accuracy": 0.9101826369777333,
"eval_overall_f1": 0.49006622516556286,
"eval_overall_precision": 0.5584905660377358,
"eval_overall_recall": 0.4365781710914454,
"eval_runtime": 0.8911,
"eval_samples_per_second": 209.848,
"eval_steps_per_second": 3.367,
"step": 530
},
{
"epoch": 6.0,
"grad_norm": 1.2173807621002197,
"learning_rate": 4.7e-05,
"loss": 0.3429,
"step": 636
},
{
"epoch": 6.0,
"eval_LOCATION_f1": 0.593103448275862,
"eval_LOCATION_number": 72,
"eval_LOCATION_precision": 0.589041095890411,
"eval_LOCATION_recall": 0.5972222222222222,
"eval_ORGANIZATION_f1": 0.4729729729729729,
"eval_ORGANIZATION_number": 75,
"eval_ORGANIZATION_precision": 0.4794520547945205,
"eval_ORGANIZATION_recall": 0.4666666666666667,
"eval_PERSON_f1": 0.7538940809968847,
"eval_PERSON_number": 143,
"eval_PERSON_precision": 0.6797752808988764,
"eval_PERSON_recall": 0.8461538461538461,
"eval_QUANTITY_f1": 0.15999999999999998,
"eval_QUANTITY_number": 23,
"eval_QUANTITY_precision": 0.14814814814814814,
"eval_QUANTITY_recall": 0.17391304347826086,
"eval_TIME_f1": 0.6666666666666666,
"eval_TIME_number": 26,
"eval_TIME_precision": 0.6428571428571429,
"eval_TIME_recall": 0.6923076923076923,
"eval_loss": 0.2732473909854889,
"eval_overall_accuracy": 0.9274455841881412,
"eval_overall_f1": 0.6155988857938719,
"eval_overall_precision": 0.58311345646438,
"eval_overall_recall": 0.6519174041297935,
"eval_runtime": 0.887,
"eval_samples_per_second": 210.819,
"eval_steps_per_second": 3.382,
"step": 636
},
{
"epoch": 7.0,
"grad_norm": 0.8688632845878601,
"learning_rate": 4.6500000000000005e-05,
"loss": 0.2873,
"step": 742
},
{
"epoch": 7.0,
"eval_LOCATION_f1": 0.6623376623376623,
"eval_LOCATION_number": 72,
"eval_LOCATION_precision": 0.6219512195121951,
"eval_LOCATION_recall": 0.7083333333333334,
"eval_ORGANIZATION_f1": 0.4968152866242038,
"eval_ORGANIZATION_number": 75,
"eval_ORGANIZATION_precision": 0.47560975609756095,
"eval_ORGANIZATION_recall": 0.52,
"eval_PERSON_f1": 0.80625,
"eval_PERSON_number": 143,
"eval_PERSON_precision": 0.7288135593220338,
"eval_PERSON_recall": 0.9020979020979021,
"eval_QUANTITY_f1": 0.2962962962962963,
"eval_QUANTITY_number": 23,
"eval_QUANTITY_precision": 0.25806451612903225,
"eval_QUANTITY_recall": 0.34782608695652173,
"eval_TIME_f1": 0.7272727272727274,
"eval_TIME_number": 26,
"eval_TIME_precision": 0.6896551724137931,
"eval_TIME_recall": 0.7692307692307693,
"eval_loss": 0.23371461033821106,
"eval_overall_accuracy": 0.9329497122842132,
"eval_overall_f1": 0.6675675675675676,
"eval_overall_precision": 0.6159600997506235,
"eval_overall_recall": 0.7286135693215339,
"eval_runtime": 0.9045,
"eval_samples_per_second": 206.749,
"eval_steps_per_second": 3.317,
"step": 742
},
{
"epoch": 8.0,
"grad_norm": 1.5551362037658691,
"learning_rate": 4.600000000000001e-05,
"loss": 0.249,
"step": 848
},
{
"epoch": 8.0,
"eval_LOCATION_f1": 0.732919254658385,
"eval_LOCATION_number": 72,
"eval_LOCATION_precision": 0.6629213483146067,
"eval_LOCATION_recall": 0.8194444444444444,
"eval_ORGANIZATION_f1": 0.5813953488372093,
"eval_ORGANIZATION_number": 75,
"eval_ORGANIZATION_precision": 0.5154639175257731,
"eval_ORGANIZATION_recall": 0.6666666666666666,
"eval_PERSON_f1": 0.832807570977918,
"eval_PERSON_number": 143,
"eval_PERSON_precision": 0.7586206896551724,
"eval_PERSON_recall": 0.9230769230769231,
"eval_QUANTITY_f1": 0.2962962962962963,
"eval_QUANTITY_number": 23,
"eval_QUANTITY_precision": 0.25806451612903225,
"eval_QUANTITY_recall": 0.34782608695652173,
"eval_TIME_f1": 0.7272727272727274,
"eval_TIME_number": 26,
"eval_TIME_precision": 0.6896551724137931,
"eval_TIME_recall": 0.7692307692307693,
"eval_loss": 0.2129368931055069,
"eval_overall_accuracy": 0.9367025268951714,
"eval_overall_f1": 0.7088274044795784,
"eval_overall_precision": 0.6404761904761904,
"eval_overall_recall": 0.7935103244837758,
"eval_runtime": 0.9166,
"eval_samples_per_second": 204.019,
"eval_steps_per_second": 3.273,
"step": 848
},
{
"epoch": 9.0,
"grad_norm": 1.3527239561080933,
"learning_rate": 4.55e-05,
"loss": 0.2259,
"step": 954
},
{
"epoch": 9.0,
"eval_LOCATION_f1": 0.7625000000000001,
"eval_LOCATION_number": 72,
"eval_LOCATION_precision": 0.6931818181818182,
"eval_LOCATION_recall": 0.8472222222222222,
"eval_ORGANIZATION_f1": 0.6046511627906977,
"eval_ORGANIZATION_number": 75,
"eval_ORGANIZATION_precision": 0.5360824742268041,
"eval_ORGANIZATION_recall": 0.6933333333333334,
"eval_PERSON_f1": 0.8360128617363344,
"eval_PERSON_number": 143,
"eval_PERSON_precision": 0.7738095238095238,
"eval_PERSON_recall": 0.9090909090909091,
"eval_QUANTITY_f1": 0.3103448275862069,
"eval_QUANTITY_number": 23,
"eval_QUANTITY_precision": 0.2571428571428571,
"eval_QUANTITY_recall": 0.391304347826087,
"eval_TIME_f1": 0.7272727272727274,
"eval_TIME_number": 26,
"eval_TIME_precision": 0.6896551724137931,
"eval_TIME_recall": 0.7692307692307693,
"eval_loss": 0.19730736315250397,
"eval_overall_accuracy": 0.9384538403802852,
"eval_overall_f1": 0.7195767195767195,
"eval_overall_precision": 0.6522781774580336,
"eval_overall_recall": 0.8023598820058997,
"eval_runtime": 0.9257,
"eval_samples_per_second": 202.019,
"eval_steps_per_second": 3.241,
"step": 954
},
{
"epoch": 10.0,
"grad_norm": 2.4482581615448,
"learning_rate": 4.5e-05,
"loss": 0.2088,
"step": 1060
},
{
"epoch": 10.0,
"eval_LOCATION_f1": 0.7654320987654321,
"eval_LOCATION_number": 72,
"eval_LOCATION_precision": 0.6888888888888889,
"eval_LOCATION_recall": 0.8611111111111112,
"eval_ORGANIZATION_f1": 0.5847953216374269,
"eval_ORGANIZATION_number": 75,
"eval_ORGANIZATION_precision": 0.5208333333333334,
"eval_ORGANIZATION_recall": 0.6666666666666666,
"eval_PERSON_f1": 0.840764331210191,
"eval_PERSON_number": 143,
"eval_PERSON_precision": 0.7719298245614035,
"eval_PERSON_recall": 0.9230769230769231,
"eval_QUANTITY_f1": 0.4137931034482759,
"eval_QUANTITY_number": 23,
"eval_QUANTITY_precision": 0.34285714285714286,
"eval_QUANTITY_recall": 0.5217391304347826,
"eval_TIME_f1": 0.6666666666666667,
"eval_TIME_number": 26,
"eval_TIME_precision": 0.6129032258064516,
"eval_TIME_recall": 0.7307692307692307,
"eval_loss": 0.18520984053611755,
"eval_overall_accuracy": 0.9392044033024769,
"eval_overall_f1": 0.7217847769028872,
"eval_overall_precision": 0.6501182033096927,
"eval_overall_recall": 0.8112094395280236,
"eval_runtime": 0.9227,
"eval_samples_per_second": 202.666,
"eval_steps_per_second": 3.251,
"step": 1060
},
{
"epoch": 11.0,
"grad_norm": 1.6825419664382935,
"learning_rate": 4.4500000000000004e-05,
"loss": 0.196,
"step": 1166
},
{
"epoch": 11.0,
"eval_LOCATION_f1": 0.7974683544303797,
"eval_LOCATION_number": 72,
"eval_LOCATION_precision": 0.7325581395348837,
"eval_LOCATION_recall": 0.875,
"eval_ORGANIZATION_f1": 0.5868263473053893,
"eval_ORGANIZATION_number": 75,
"eval_ORGANIZATION_precision": 0.532608695652174,
"eval_ORGANIZATION_recall": 0.6533333333333333,
"eval_PERSON_f1": 0.8488745980707394,
"eval_PERSON_number": 143,
"eval_PERSON_precision": 0.7857142857142857,
"eval_PERSON_recall": 0.9230769230769231,
"eval_QUANTITY_f1": 0.3928571428571428,
"eval_QUANTITY_number": 23,
"eval_QUANTITY_precision": 0.3333333333333333,
"eval_QUANTITY_recall": 0.4782608695652174,
"eval_TIME_f1": 0.7142857142857142,
"eval_TIME_number": 26,
"eval_TIME_precision": 0.6666666666666666,
"eval_TIME_recall": 0.7692307692307693,
"eval_loss": 0.1723126471042633,
"eval_overall_accuracy": 0.9434575931948962,
"eval_overall_f1": 0.7352941176470589,
"eval_overall_precision": 0.6723716381418093,
"eval_overall_recall": 0.8112094395280236,
"eval_runtime": 0.9093,
"eval_samples_per_second": 205.658,
"eval_steps_per_second": 3.299,
"step": 1166
},
{
"epoch": 12.0,
"grad_norm": 2.3418383598327637,
"learning_rate": 4.4000000000000006e-05,
"loss": 0.1884,
"step": 1272
},
{
"epoch": 12.0,
"eval_LOCATION_f1": 0.7973856209150327,
"eval_LOCATION_number": 72,
"eval_LOCATION_precision": 0.7530864197530864,
"eval_LOCATION_recall": 0.8472222222222222,
"eval_ORGANIZATION_f1": 0.6473988439306357,
"eval_ORGANIZATION_number": 75,
"eval_ORGANIZATION_precision": 0.5714285714285714,
"eval_ORGANIZATION_recall": 0.7466666666666667,
"eval_PERSON_f1": 0.8461538461538461,
"eval_PERSON_number": 143,
"eval_PERSON_precision": 0.7810650887573964,
"eval_PERSON_recall": 0.9230769230769231,
"eval_QUANTITY_f1": 0.4814814814814815,
"eval_QUANTITY_number": 23,
"eval_QUANTITY_precision": 0.41935483870967744,
"eval_QUANTITY_recall": 0.5652173913043478,
"eval_TIME_f1": 0.7,
"eval_TIME_number": 26,
"eval_TIME_precision": 0.6176470588235294,
"eval_TIME_recall": 0.8076923076923077,
"eval_loss": 0.1679195761680603,
"eval_overall_accuracy": 0.9444583437578183,
"eval_overall_f1": 0.7526595744680852,
"eval_overall_precision": 0.6852300242130751,
"eval_overall_recall": 0.8348082595870207,
"eval_runtime": 0.9102,
"eval_samples_per_second": 205.442,
"eval_steps_per_second": 3.296,
"step": 1272
},
{
"epoch": 13.0,
"grad_norm": 1.0822410583496094,
"learning_rate": 4.35e-05,
"loss": 0.1791,
"step": 1378
},
{
"epoch": 13.0,
"eval_LOCATION_f1": 0.781456953642384,
"eval_LOCATION_number": 72,
"eval_LOCATION_precision": 0.7468354430379747,
"eval_LOCATION_recall": 0.8194444444444444,
"eval_ORGANIZATION_f1": 0.6744186046511628,
"eval_ORGANIZATION_number": 75,
"eval_ORGANIZATION_precision": 0.5979381443298969,
"eval_ORGANIZATION_recall": 0.7733333333333333,
"eval_PERSON_f1": 0.8488745980707394,
"eval_PERSON_number": 143,
"eval_PERSON_precision": 0.7857142857142857,
"eval_PERSON_recall": 0.9230769230769231,
"eval_QUANTITY_f1": 0.5185185185185185,
"eval_QUANTITY_number": 23,
"eval_QUANTITY_precision": 0.45161290322580644,
"eval_QUANTITY_recall": 0.6086956521739131,
"eval_TIME_f1": 0.7118644067796609,
"eval_TIME_number": 26,
"eval_TIME_precision": 0.6363636363636364,
"eval_TIME_recall": 0.8076923076923077,
"eval_loss": 0.16172969341278076,
"eval_overall_accuracy": 0.9467100325243933,
"eval_overall_f1": 0.7603748326639893,
"eval_overall_precision": 0.696078431372549,
"eval_overall_recall": 0.8377581120943953,
"eval_runtime": 0.9055,
"eval_samples_per_second": 206.514,
"eval_steps_per_second": 3.313,
"step": 1378
},
{
"epoch": 14.0,
"grad_norm": 1.5624088048934937,
"learning_rate": 4.3e-05,
"loss": 0.1713,
"step": 1484
},
{
"epoch": 14.0,
"eval_LOCATION_f1": 0.7837837837837838,
"eval_LOCATION_number": 72,
"eval_LOCATION_precision": 0.7631578947368421,
"eval_LOCATION_recall": 0.8055555555555556,
"eval_ORGANIZATION_f1": 0.6704545454545454,
"eval_ORGANIZATION_number": 75,
"eval_ORGANIZATION_precision": 0.5841584158415841,
"eval_ORGANIZATION_recall": 0.7866666666666666,
"eval_PERSON_f1": 0.8636363636363636,
"eval_PERSON_number": 143,
"eval_PERSON_precision": 0.806060606060606,
"eval_PERSON_recall": 0.9300699300699301,
"eval_QUANTITY_f1": 0.5098039215686274,
"eval_QUANTITY_number": 23,
"eval_QUANTITY_precision": 0.4642857142857143,
"eval_QUANTITY_recall": 0.5652173913043478,
"eval_TIME_f1": 0.7857142857142856,
"eval_TIME_number": 26,
"eval_TIME_precision": 0.7333333333333333,
"eval_TIME_recall": 0.8461538461538461,
"eval_loss": 0.15461112558841705,
"eval_overall_accuracy": 0.9497122842131599,
"eval_overall_f1": 0.7713125845737482,
"eval_overall_precision": 0.7125,
"eval_overall_recall": 0.8407079646017699,
"eval_runtime": 0.9063,
"eval_samples_per_second": 206.328,
"eval_steps_per_second": 3.31,
"step": 1484
},
{
"epoch": 15.0,
"grad_norm": 0.8365355730056763,
"learning_rate": 4.25e-05,
"loss": 0.1674,
"step": 1590
},
{
"epoch": 15.0,
"eval_LOCATION_f1": 0.7843137254901961,
"eval_LOCATION_number": 72,
"eval_LOCATION_precision": 0.7407407407407407,
"eval_LOCATION_recall": 0.8333333333333334,
"eval_ORGANIZATION_f1": 0.6704545454545454,
"eval_ORGANIZATION_number": 75,
"eval_ORGANIZATION_precision": 0.5841584158415841,
"eval_ORGANIZATION_recall": 0.7866666666666666,
"eval_PERSON_f1": 0.8543689320388351,
"eval_PERSON_number": 143,
"eval_PERSON_precision": 0.7951807228915663,
"eval_PERSON_recall": 0.9230769230769231,
"eval_QUANTITY_f1": 0.49056603773584906,
"eval_QUANTITY_number": 23,
"eval_QUANTITY_precision": 0.43333333333333335,
"eval_QUANTITY_recall": 0.5652173913043478,
"eval_TIME_f1": 0.7241379310344829,
"eval_TIME_number": 26,
"eval_TIME_precision": 0.65625,
"eval_TIME_recall": 0.8076923076923077,
"eval_loss": 0.1564231663942337,
"eval_overall_accuracy": 0.9494620965724293,
"eval_overall_f1": 0.761014686248331,
"eval_overall_precision": 0.6951219512195121,
"eval_overall_recall": 0.8407079646017699,
"eval_runtime": 0.9118,
"eval_samples_per_second": 205.09,
"eval_steps_per_second": 3.29,
"step": 1590
},
{
"epoch": 16.0,
"grad_norm": 1.1776515245437622,
"learning_rate": 4.2e-05,
"loss": 0.1623,
"step": 1696
},
{
"epoch": 16.0,
"eval_LOCATION_f1": 0.7843137254901961,
"eval_LOCATION_number": 72,
"eval_LOCATION_precision": 0.7407407407407407,
"eval_LOCATION_recall": 0.8333333333333334,
"eval_ORGANIZATION_f1": 0.6818181818181819,
"eval_ORGANIZATION_number": 75,
"eval_ORGANIZATION_precision": 0.594059405940594,
"eval_ORGANIZATION_recall": 0.8,
"eval_PERSON_f1": 0.8571428571428571,
"eval_PERSON_number": 143,
"eval_PERSON_precision": 0.8,
"eval_PERSON_recall": 0.9230769230769231,
"eval_QUANTITY_f1": 0.6296296296296297,
"eval_QUANTITY_number": 23,
"eval_QUANTITY_precision": 0.5483870967741935,
"eval_QUANTITY_recall": 0.7391304347826086,
"eval_TIME_f1": 0.7719298245614036,
"eval_TIME_number": 26,
"eval_TIME_precision": 0.7096774193548387,
"eval_TIME_recall": 0.8461538461538461,
"eval_loss": 0.15418055653572083,
"eval_overall_accuracy": 0.9509632224168126,
"eval_overall_f1": 0.7780748663101604,
"eval_overall_precision": 0.7114914425427873,
"eval_overall_recall": 0.8584070796460177,
"eval_runtime": 0.9082,
"eval_samples_per_second": 205.891,
"eval_steps_per_second": 3.303,
"step": 1696
},
{
"epoch": 17.0,
"grad_norm": 0.6350365877151489,
"learning_rate": 4.15e-05,
"loss": 0.158,
"step": 1802
},
{
"epoch": 17.0,
"eval_LOCATION_f1": 0.751592356687898,
"eval_LOCATION_number": 72,
"eval_LOCATION_precision": 0.6941176470588235,
"eval_LOCATION_recall": 0.8194444444444444,
"eval_ORGANIZATION_f1": 0.6666666666666666,
"eval_ORGANIZATION_number": 75,
"eval_ORGANIZATION_precision": 0.5784313725490197,
"eval_ORGANIZATION_recall": 0.7866666666666666,
"eval_PERSON_f1": 0.8636363636363636,
"eval_PERSON_number": 143,
"eval_PERSON_precision": 0.806060606060606,
"eval_PERSON_recall": 0.9300699300699301,
"eval_QUANTITY_f1": 0.6428571428571429,
"eval_QUANTITY_number": 23,
"eval_QUANTITY_precision": 0.5454545454545454,
"eval_QUANTITY_recall": 0.782608695652174,
"eval_TIME_f1": 0.7719298245614036,
"eval_TIME_number": 26,
"eval_TIME_precision": 0.7096774193548387,
"eval_TIME_recall": 0.8461538461538461,
"eval_loss": 0.15079031884670258,
"eval_overall_accuracy": 0.950212659494621,
"eval_overall_f1": 0.7708609271523179,
"eval_overall_precision": 0.6995192307692307,
"eval_overall_recall": 0.8584070796460177,
"eval_runtime": 0.9247,
"eval_samples_per_second": 202.221,
"eval_steps_per_second": 3.244,
"step": 1802
},
{
"epoch": 18.0,
"grad_norm": 0.8113768100738525,
"learning_rate": 4.1e-05,
"loss": 0.1518,
"step": 1908
},
{
"epoch": 18.0,
"eval_LOCATION_f1": 0.759493670886076,
"eval_LOCATION_number": 72,
"eval_LOCATION_precision": 0.6976744186046512,
"eval_LOCATION_recall": 0.8333333333333334,
"eval_ORGANIZATION_f1": 0.6666666666666666,
"eval_ORGANIZATION_number": 75,
"eval_ORGANIZATION_precision": 0.5784313725490197,
"eval_ORGANIZATION_recall": 0.7866666666666666,
"eval_PERSON_f1": 0.8580645161290323,
"eval_PERSON_number": 143,
"eval_PERSON_precision": 0.7964071856287425,
"eval_PERSON_recall": 0.9300699300699301,
"eval_QUANTITY_f1": 0.6428571428571429,
"eval_QUANTITY_number": 23,
"eval_QUANTITY_precision": 0.5454545454545454,
"eval_QUANTITY_recall": 0.782608695652174,
"eval_TIME_f1": 0.7719298245614036,
"eval_TIME_number": 26,
"eval_TIME_precision": 0.7096774193548387,
"eval_TIME_recall": 0.8461538461538461,
"eval_loss": 0.1505645364522934,
"eval_overall_accuracy": 0.9497122842131599,
"eval_overall_f1": 0.770448548812665,
"eval_overall_precision": 0.6968973747016707,
"eval_overall_recall": 0.8613569321533924,
"eval_runtime": 0.9072,
"eval_samples_per_second": 206.139,
"eval_steps_per_second": 3.307,
"step": 1908
},
{
"epoch": 19.0,
"grad_norm": 1.1493066549301147,
"learning_rate": 4.05e-05,
"loss": 0.1508,
"step": 2014
},
{
"epoch": 19.0,
"eval_LOCATION_f1": 0.7763157894736842,
"eval_LOCATION_number": 72,
"eval_LOCATION_precision": 0.7375,
"eval_LOCATION_recall": 0.8194444444444444,
"eval_ORGANIZATION_f1": 0.6820809248554913,
"eval_ORGANIZATION_number": 75,
"eval_ORGANIZATION_precision": 0.6020408163265306,
"eval_ORGANIZATION_recall": 0.7866666666666666,
"eval_PERSON_f1": 0.8721311475409836,
"eval_PERSON_number": 143,
"eval_PERSON_precision": 0.8209876543209876,
"eval_PERSON_recall": 0.9300699300699301,
"eval_QUANTITY_f1": 0.6428571428571429,
"eval_QUANTITY_number": 23,
"eval_QUANTITY_precision": 0.5454545454545454,
"eval_QUANTITY_recall": 0.782608695652174,
"eval_TIME_f1": 0.8363636363636363,
"eval_TIME_number": 26,
"eval_TIME_precision": 0.7931034482758621,
"eval_TIME_recall": 0.8846153846153846,
"eval_loss": 0.14393331110477448,
"eval_overall_accuracy": 0.9532149111833875,
"eval_overall_f1": 0.7881241565452092,
"eval_overall_precision": 0.7263681592039801,
"eval_overall_recall": 0.8613569321533924,
"eval_runtime": 0.9095,
"eval_samples_per_second": 205.605,
"eval_steps_per_second": 3.298,
"step": 2014
},
{
"epoch": 20.0,
"grad_norm": 1.1086537837982178,
"learning_rate": 4e-05,
"loss": 0.1435,
"step": 2120
},
{
"epoch": 20.0,
"eval_LOCATION_f1": 0.7848101265822784,
"eval_LOCATION_number": 72,
"eval_LOCATION_precision": 0.7209302325581395,
"eval_LOCATION_recall": 0.8611111111111112,
"eval_ORGANIZATION_f1": 0.6666666666666666,
"eval_ORGANIZATION_number": 75,
"eval_ORGANIZATION_precision": 0.5585585585585585,
"eval_ORGANIZATION_recall": 0.8266666666666667,
"eval_PERSON_f1": 0.8627450980392156,
"eval_PERSON_number": 143,
"eval_PERSON_precision": 0.8098159509202454,
"eval_PERSON_recall": 0.9230769230769231,
"eval_QUANTITY_f1": 0.6545454545454547,
"eval_QUANTITY_number": 23,
"eval_QUANTITY_precision": 0.5625,
"eval_QUANTITY_recall": 0.782608695652174,
"eval_TIME_f1": 0.7719298245614036,
"eval_TIME_number": 26,
"eval_TIME_precision": 0.7096774193548387,
"eval_TIME_recall": 0.8461538461538461,
"eval_loss": 0.15614458918571472,
"eval_overall_accuracy": 0.950212659494621,
"eval_overall_f1": 0.7769028871391076,
"eval_overall_precision": 0.6997635933806147,
"eval_overall_recall": 0.8731563421828908,
"eval_runtime": 0.9172,
"eval_samples_per_second": 203.874,
"eval_steps_per_second": 3.271,
"step": 2120
},
{
"epoch": 21.0,
"grad_norm": 0.9740850925445557,
"learning_rate": 3.9500000000000005e-05,
"loss": 0.1456,
"step": 2226
},
{
"epoch": 21.0,
"eval_LOCATION_f1": 0.7662337662337662,
"eval_LOCATION_number": 72,
"eval_LOCATION_precision": 0.7195121951219512,
"eval_LOCATION_recall": 0.8194444444444444,
"eval_ORGANIZATION_f1": 0.6705202312138728,
"eval_ORGANIZATION_number": 75,
"eval_ORGANIZATION_precision": 0.5918367346938775,
"eval_ORGANIZATION_recall": 0.7733333333333333,
"eval_PERSON_f1": 0.8721311475409836,
"eval_PERSON_number": 143,
"eval_PERSON_precision": 0.8209876543209876,
"eval_PERSON_recall": 0.9300699300699301,
"eval_QUANTITY_f1": 0.6296296296296297,
"eval_QUANTITY_number": 23,
"eval_QUANTITY_precision": 0.5483870967741935,
"eval_QUANTITY_recall": 0.7391304347826086,
"eval_TIME_f1": 0.8214285714285715,
"eval_TIME_number": 26,
"eval_TIME_precision": 0.7666666666666667,
"eval_TIME_recall": 0.8846153846153846,
"eval_loss": 0.14360801875591278,
"eval_overall_accuracy": 0.9537152864648486,
"eval_overall_f1": 0.7816711590296497,
"eval_overall_precision": 0.7196029776674938,
"eval_overall_recall": 0.855457227138643,
"eval_runtime": 0.9095,
"eval_samples_per_second": 205.608,
"eval_steps_per_second": 3.299,
"step": 2226
},
{
"epoch": 22.0,
"grad_norm": 0.8203905820846558,
"learning_rate": 3.9000000000000006e-05,
"loss": 0.1384,
"step": 2332
},
{
"epoch": 22.0,
"eval_LOCATION_f1": 0.8051948051948052,
"eval_LOCATION_number": 72,
"eval_LOCATION_precision": 0.7560975609756098,
"eval_LOCATION_recall": 0.8611111111111112,
"eval_ORGANIZATION_f1": 0.7126436781609197,
"eval_ORGANIZATION_number": 75,
"eval_ORGANIZATION_precision": 0.6262626262626263,
"eval_ORGANIZATION_recall": 0.8266666666666667,
"eval_PERSON_f1": 0.8758169934640523,
"eval_PERSON_number": 143,
"eval_PERSON_precision": 0.8220858895705522,
"eval_PERSON_recall": 0.9370629370629371,
"eval_QUANTITY_f1": 0.6428571428571429,
"eval_QUANTITY_number": 23,
"eval_QUANTITY_precision": 0.5454545454545454,
"eval_QUANTITY_recall": 0.782608695652174,
"eval_TIME_f1": 0.8214285714285715,
"eval_TIME_number": 26,
"eval_TIME_precision": 0.7666666666666667,
"eval_TIME_recall": 0.8846153846153846,
"eval_loss": 0.14492544531822205,
"eval_overall_accuracy": 0.9542156617463098,
"eval_overall_f1": 0.8016085790884719,
"eval_overall_precision": 0.7346437346437347,
"eval_overall_recall": 0.8820058997050148,
"eval_runtime": 0.9167,
"eval_samples_per_second": 203.986,
"eval_steps_per_second": 3.273,
"step": 2332
},
{
"epoch": 23.0,
"grad_norm": 5.496976375579834,
"learning_rate": 3.85e-05,
"loss": 0.1384,
"step": 2438
},
{
"epoch": 23.0,
"eval_LOCATION_f1": 0.7922077922077924,
"eval_LOCATION_number": 72,
"eval_LOCATION_precision": 0.7439024390243902,
"eval_LOCATION_recall": 0.8472222222222222,
"eval_ORGANIZATION_f1": 0.7011494252873564,
"eval_ORGANIZATION_number": 75,
"eval_ORGANIZATION_precision": 0.6161616161616161,
"eval_ORGANIZATION_recall": 0.8133333333333334,
"eval_PERSON_f1": 0.8786885245901639,
"eval_PERSON_number": 143,
"eval_PERSON_precision": 0.8271604938271605,
"eval_PERSON_recall": 0.9370629370629371,
"eval_QUANTITY_f1": 0.6666666666666667,
"eval_QUANTITY_number": 23,
"eval_QUANTITY_precision": 0.5806451612903226,
"eval_QUANTITY_recall": 0.782608695652174,
"eval_TIME_f1": 0.8363636363636363,
"eval_TIME_number": 26,
"eval_TIME_precision": 0.7931034482758621,
"eval_TIME_recall": 0.8846153846153846,
"eval_loss": 0.14144913852214813,
"eval_overall_accuracy": 0.9562171628721541,
"eval_overall_f1": 0.8005390835579514,
"eval_overall_precision": 0.7369727047146402,
"eval_overall_recall": 0.8761061946902655,
"eval_runtime": 0.9123,
"eval_samples_per_second": 204.982,
"eval_steps_per_second": 3.288,
"step": 2438
},
{
"epoch": 24.0,
"grad_norm": 1.060779333114624,
"learning_rate": 3.8e-05,
"loss": 0.1369,
"step": 2544
},
{
"epoch": 24.0,
"eval_LOCATION_f1": 0.7898089171974522,
"eval_LOCATION_number": 72,
"eval_LOCATION_precision": 0.7294117647058823,
"eval_LOCATION_recall": 0.8611111111111112,
"eval_ORGANIZATION_f1": 0.6775956284153005,
"eval_ORGANIZATION_number": 75,
"eval_ORGANIZATION_precision": 0.5740740740740741,
"eval_ORGANIZATION_recall": 0.8266666666666667,
"eval_PERSON_f1": 0.8627450980392156,
"eval_PERSON_number": 143,
"eval_PERSON_precision": 0.8098159509202454,
"eval_PERSON_recall": 0.9230769230769231,
"eval_QUANTITY_f1": 0.6428571428571429,
"eval_QUANTITY_number": 23,
"eval_QUANTITY_precision": 0.5454545454545454,
"eval_QUANTITY_recall": 0.782608695652174,
"eval_TIME_f1": 0.8,
"eval_TIME_number": 26,
"eval_TIME_precision": 0.7586206896551724,
"eval_TIME_recall": 0.8461538461538461,
"eval_loss": 0.1503037065267563,
"eval_overall_accuracy": 0.9509632224168126,
"eval_overall_f1": 0.7820343461030383,
"eval_overall_precision": 0.7081339712918661,
"eval_overall_recall": 0.8731563421828908,
"eval_runtime": 0.9133,
"eval_samples_per_second": 204.754,
"eval_steps_per_second": 3.285,
"step": 2544
},
{
"epoch": 25.0,
"grad_norm": 0.9608832001686096,
"learning_rate": 3.7500000000000003e-05,
"loss": 0.136,
"step": 2650
},
{
"epoch": 25.0,
"eval_LOCATION_f1": 0.7870967741935484,
"eval_LOCATION_number": 72,
"eval_LOCATION_precision": 0.7349397590361446,
"eval_LOCATION_recall": 0.8472222222222222,
"eval_ORGANIZATION_f1": 0.7058823529411765,
"eval_ORGANIZATION_number": 75,
"eval_ORGANIZATION_precision": 0.631578947368421,
"eval_ORGANIZATION_recall": 0.8,
"eval_PERSON_f1": 0.8758169934640523,
"eval_PERSON_number": 143,
"eval_PERSON_precision": 0.8220858895705522,
"eval_PERSON_recall": 0.9370629370629371,
"eval_QUANTITY_f1": 0.6428571428571429,
"eval_QUANTITY_number": 23,
"eval_QUANTITY_precision": 0.5454545454545454,
"eval_QUANTITY_recall": 0.782608695652174,
"eval_TIME_f1": 0.8,
"eval_TIME_number": 26,
"eval_TIME_precision": 0.7586206896551724,
"eval_TIME_recall": 0.8461538461538461,
"eval_loss": 0.1423281729221344,
"eval_overall_accuracy": 0.955716787590693,
"eval_overall_f1": 0.7951482479784365,
"eval_overall_precision": 0.7320099255583127,
"eval_overall_recall": 0.8702064896755162,
"eval_runtime": 0.9155,
"eval_samples_per_second": 204.256,
"eval_steps_per_second": 3.277,
"step": 2650
},
{
"epoch": 26.0,
"grad_norm": 1.9149385690689087,
"learning_rate": 3.7e-05,
"loss": 0.1322,
"step": 2756
},
{
"epoch": 26.0,
"eval_LOCATION_f1": 0.7922077922077924,
"eval_LOCATION_number": 72,
"eval_LOCATION_precision": 0.7439024390243902,
"eval_LOCATION_recall": 0.8472222222222222,
"eval_ORGANIZATION_f1": 0.7209302325581395,
"eval_ORGANIZATION_number": 75,
"eval_ORGANIZATION_precision": 0.6391752577319587,
"eval_ORGANIZATION_recall": 0.8266666666666667,
"eval_PERSON_f1": 0.8758169934640523,
"eval_PERSON_number": 143,
"eval_PERSON_precision": 0.8220858895705522,
"eval_PERSON_recall": 0.9370629370629371,
"eval_QUANTITY_f1": 0.6545454545454547,
"eval_QUANTITY_number": 23,
"eval_QUANTITY_precision": 0.5625,
"eval_QUANTITY_recall": 0.782608695652174,
"eval_TIME_f1": 0.7857142857142856,
"eval_TIME_number": 26,
"eval_TIME_precision": 0.7333333333333333,
"eval_TIME_recall": 0.8461538461538461,
"eval_loss": 0.14195844531059265,
"eval_overall_accuracy": 0.9554665999499625,
"eval_overall_f1": 0.7994616419919246,
"eval_overall_precision": 0.7351485148514851,
"eval_overall_recall": 0.8761061946902655,
"eval_runtime": 0.9182,
"eval_samples_per_second": 203.651,
"eval_steps_per_second": 3.267,
"step": 2756
},
{
"epoch": 27.0,
"grad_norm": 4.680337905883789,
"learning_rate": 3.65e-05,
"loss": 0.1323,
"step": 2862
},
{
"epoch": 27.0,
"eval_LOCATION_f1": 0.7948717948717949,
"eval_LOCATION_number": 72,
"eval_LOCATION_precision": 0.7380952380952381,
"eval_LOCATION_recall": 0.8611111111111112,
"eval_ORGANIZATION_f1": 0.7305389221556886,
"eval_ORGANIZATION_number": 75,
"eval_ORGANIZATION_precision": 0.6630434782608695,
"eval_ORGANIZATION_recall": 0.8133333333333334,
"eval_PERSON_f1": 0.8910891089108911,
"eval_PERSON_number": 143,
"eval_PERSON_precision": 0.84375,
"eval_PERSON_recall": 0.9440559440559441,
"eval_QUANTITY_f1": 0.6071428571428571,
"eval_QUANTITY_number": 23,
"eval_QUANTITY_precision": 0.5151515151515151,
"eval_QUANTITY_recall": 0.7391304347826086,
"eval_TIME_f1": 0.8,
"eval_TIME_number": 26,
"eval_TIME_precision": 0.7586206896551724,
"eval_TIME_recall": 0.8461538461538461,
"eval_loss": 0.14178352057933807,
"eval_overall_accuracy": 0.9569677257943457,
"eval_overall_f1": 0.8059701492537314,
"eval_overall_precision": 0.7462311557788944,
"eval_overall_recall": 0.8761061946902655,
"eval_runtime": 0.9164,
"eval_samples_per_second": 204.054,
"eval_steps_per_second": 3.274,
"step": 2862
},
{
"epoch": 28.0,
"grad_norm": 1.5706373453140259,
"learning_rate": 3.6e-05,
"loss": 0.1306,
"step": 2968
},
{
"epoch": 28.0,
"eval_LOCATION_f1": 0.7682119205298013,
"eval_LOCATION_number": 72,
"eval_LOCATION_precision": 0.7341772151898734,
"eval_LOCATION_recall": 0.8055555555555556,
"eval_ORGANIZATION_f1": 0.7151515151515152,
"eval_ORGANIZATION_number": 75,
"eval_ORGANIZATION_precision": 0.6555555555555556,
"eval_ORGANIZATION_recall": 0.7866666666666666,
"eval_PERSON_f1": 0.8750000000000001,
"eval_PERSON_number": 143,
"eval_PERSON_precision": 0.8260869565217391,
"eval_PERSON_recall": 0.9300699300699301,
"eval_QUANTITY_f1": 0.6792452830188679,
"eval_QUANTITY_number": 23,
"eval_QUANTITY_precision": 0.6,
"eval_QUANTITY_recall": 0.782608695652174,
"eval_TIME_f1": 0.8518518518518519,
"eval_TIME_number": 26,
"eval_TIME_precision": 0.8214285714285714,
"eval_TIME_recall": 0.8846153846153846,
"eval_loss": 0.13230037689208984,
"eval_overall_accuracy": 0.9584688516387291,
"eval_overall_f1": 0.8005502063273728,
"eval_overall_precision": 0.75,
"eval_overall_recall": 0.8584070796460177,
"eval_runtime": 0.9167,
"eval_samples_per_second": 203.989,
"eval_steps_per_second": 3.273,
"step": 2968
},
{
"epoch": 29.0,
"grad_norm": 1.6984310150146484,
"learning_rate": 3.55e-05,
"loss": 0.1282,
"step": 3074
},
{
"epoch": 29.0,
"eval_LOCATION_f1": 0.8026315789473685,
"eval_LOCATION_number": 72,
"eval_LOCATION_precision": 0.7625,
"eval_LOCATION_recall": 0.8472222222222222,
"eval_ORGANIZATION_f1": 0.7176470588235295,
"eval_ORGANIZATION_number": 75,
"eval_ORGANIZATION_precision": 0.6421052631578947,
"eval_ORGANIZATION_recall": 0.8133333333333334,
"eval_PERSON_f1": 0.8963210702341137,
"eval_PERSON_number": 143,
"eval_PERSON_precision": 0.8589743589743589,
"eval_PERSON_recall": 0.9370629370629371,
"eval_QUANTITY_f1": 0.6792452830188679,
"eval_QUANTITY_number": 23,
"eval_QUANTITY_precision": 0.6,
"eval_QUANTITY_recall": 0.782608695652174,
"eval_TIME_f1": 0.8518518518518519,
"eval_TIME_number": 26,
"eval_TIME_precision": 0.8214285714285714,
"eval_TIME_recall": 0.8846153846153846,
"eval_loss": 0.13585858047008514,
"eval_overall_accuracy": 0.9584688516387291,
"eval_overall_f1": 0.8159340659340658,
"eval_overall_precision": 0.7634961439588689,
"eval_overall_recall": 0.8761061946902655,
"eval_runtime": 0.9131,
"eval_samples_per_second": 204.804,
"eval_steps_per_second": 3.286,
"step": 3074
},
{
"epoch": 30.0,
"grad_norm": 0.8933135271072388,
"learning_rate": 3.5e-05,
"loss": 0.1235,
"step": 3180
},
{
"epoch": 30.0,
"eval_LOCATION_f1": 0.7973856209150327,
"eval_LOCATION_number": 72,
"eval_LOCATION_precision": 0.7530864197530864,
"eval_LOCATION_recall": 0.8472222222222222,
"eval_ORGANIZATION_f1": 0.7159090909090909,
"eval_ORGANIZATION_number": 75,
"eval_ORGANIZATION_precision": 0.6237623762376238,
"eval_ORGANIZATION_recall": 0.84,
"eval_PERSON_f1": 0.8903654485049833,
"eval_PERSON_number": 143,
"eval_PERSON_precision": 0.8481012658227848,
"eval_PERSON_recall": 0.9370629370629371,
"eval_QUANTITY_f1": 0.6545454545454547,
"eval_QUANTITY_number": 23,
"eval_QUANTITY_precision": 0.5625,
"eval_QUANTITY_recall": 0.782608695652174,
"eval_TIME_f1": 0.8,
"eval_TIME_number": 26,
"eval_TIME_precision": 0.7586206896551724,
"eval_TIME_recall": 0.8461538461538461,
"eval_loss": 0.13996899127960205,
"eval_overall_accuracy": 0.9559669752314236,
"eval_overall_f1": 0.8054054054054054,
"eval_overall_precision": 0.743142144638404,
"eval_overall_recall": 0.8790560471976401,
"eval_runtime": 0.9167,
"eval_samples_per_second": 203.988,
"eval_steps_per_second": 3.273,
"step": 3180
},
{
"epoch": 31.0,
"grad_norm": 0.8632007837295532,
"learning_rate": 3.45e-05,
"loss": 0.124,
"step": 3286
},
{
"epoch": 31.0,
"eval_LOCATION_f1": 0.7741935483870969,
"eval_LOCATION_number": 72,
"eval_LOCATION_precision": 0.7228915662650602,
"eval_LOCATION_recall": 0.8333333333333334,
"eval_ORGANIZATION_f1": 0.7176470588235295,
"eval_ORGANIZATION_number": 75,
"eval_ORGANIZATION_precision": 0.6421052631578947,
"eval_ORGANIZATION_recall": 0.8133333333333334,
"eval_PERSON_f1": 0.8874172185430464,
"eval_PERSON_number": 143,
"eval_PERSON_precision": 0.8427672955974843,
"eval_PERSON_recall": 0.9370629370629371,
"eval_QUANTITY_f1": 0.6428571428571429,
"eval_QUANTITY_number": 23,
"eval_QUANTITY_precision": 0.5454545454545454,
"eval_QUANTITY_recall": 0.782608695652174,
"eval_TIME_f1": 0.8363636363636363,
"eval_TIME_number": 26,
"eval_TIME_precision": 0.7931034482758621,
"eval_TIME_recall": 0.8846153846153846,
"eval_loss": 0.13782481849193573,
"eval_overall_accuracy": 0.9552164123092319,
"eval_overall_f1": 0.8021680216802167,
"eval_overall_precision": 0.7418546365914787,
"eval_overall_recall": 0.8731563421828908,
"eval_runtime": 0.9178,
"eval_samples_per_second": 203.741,
"eval_steps_per_second": 3.269,
"step": 3286
},
{
"epoch": 32.0,
"grad_norm": 1.97568941116333,
"learning_rate": 3.4000000000000007e-05,
"loss": 0.1222,
"step": 3392
},
{
"epoch": 32.0,
"eval_LOCATION_f1": 0.7894736842105262,
"eval_LOCATION_number": 72,
"eval_LOCATION_precision": 0.75,
"eval_LOCATION_recall": 0.8333333333333334,
"eval_ORGANIZATION_f1": 0.7361963190184048,
"eval_ORGANIZATION_number": 75,
"eval_ORGANIZATION_precision": 0.6818181818181818,
"eval_ORGANIZATION_recall": 0.8,
"eval_PERSON_f1": 0.8896321070234114,
"eval_PERSON_number": 143,
"eval_PERSON_precision": 0.8525641025641025,
"eval_PERSON_recall": 0.9300699300699301,
"eval_QUANTITY_f1": 0.6792452830188679,
"eval_QUANTITY_number": 23,
"eval_QUANTITY_precision": 0.6,
"eval_QUANTITY_recall": 0.782608695652174,
"eval_TIME_f1": 0.8363636363636363,
"eval_TIME_number": 26,
"eval_TIME_precision": 0.7931034482758621,
"eval_TIME_recall": 0.8846153846153846,
"eval_loss": 0.13005581498146057,
"eval_overall_accuracy": 0.9597197898423818,
"eval_overall_f1": 0.8144044321329639,
"eval_overall_precision": 0.7676240208877284,
"eval_overall_recall": 0.8672566371681416,
"eval_runtime": 0.9102,
"eval_samples_per_second": 205.446,
"eval_steps_per_second": 3.296,
"step": 3392
},
{
"epoch": 33.0,
"grad_norm": 1.2445570230484009,
"learning_rate": 3.35e-05,
"loss": 0.1243,
"step": 3498
},
{
"epoch": 33.0,
"eval_LOCATION_f1": 0.7870967741935484,
"eval_LOCATION_number": 72,
"eval_LOCATION_precision": 0.7349397590361446,
"eval_LOCATION_recall": 0.8472222222222222,
"eval_ORGANIZATION_f1": 0.7380952380952381,
"eval_ORGANIZATION_number": 75,
"eval_ORGANIZATION_precision": 0.6666666666666666,
"eval_ORGANIZATION_recall": 0.8266666666666667,
"eval_PERSON_f1": 0.8866666666666668,
"eval_PERSON_number": 143,
"eval_PERSON_precision": 0.8471337579617835,
"eval_PERSON_recall": 0.9300699300699301,
"eval_QUANTITY_f1": 0.6545454545454547,
"eval_QUANTITY_number": 23,
"eval_QUANTITY_precision": 0.5625,
"eval_QUANTITY_recall": 0.782608695652174,
"eval_TIME_f1": 0.8,
"eval_TIME_number": 26,
"eval_TIME_precision": 0.7586206896551724,
"eval_TIME_recall": 0.8461538461538461,
"eval_loss": 0.13504153490066528,
"eval_overall_accuracy": 0.957968476357268,
"eval_overall_f1": 0.8076398362892225,
"eval_overall_precision": 0.751269035532995,
"eval_overall_recall": 0.8731563421828908,
"eval_runtime": 0.9062,
"eval_samples_per_second": 206.352,
"eval_steps_per_second": 3.31,
"step": 3498
},
{
"epoch": 34.0,
"grad_norm": 0.8017980456352234,
"learning_rate": 3.3e-05,
"loss": 0.1198,
"step": 3604
},
{
"epoch": 34.0,
"eval_LOCATION_f1": 0.7922077922077924,
"eval_LOCATION_number": 72,
"eval_LOCATION_precision": 0.7439024390243902,
"eval_LOCATION_recall": 0.8472222222222222,
"eval_ORGANIZATION_f1": 0.7209302325581395,
"eval_ORGANIZATION_number": 75,
"eval_ORGANIZATION_precision": 0.6391752577319587,
"eval_ORGANIZATION_recall": 0.8266666666666667,
"eval_PERSON_f1": 0.8852459016393444,
"eval_PERSON_number": 143,
"eval_PERSON_precision": 0.8333333333333334,
"eval_PERSON_recall": 0.9440559440559441,
"eval_QUANTITY_f1": 0.6181818181818182,
"eval_QUANTITY_number": 23,
"eval_QUANTITY_precision": 0.53125,
"eval_QUANTITY_recall": 0.7391304347826086,
"eval_TIME_f1": 0.75,
"eval_TIME_number": 26,
"eval_TIME_precision": 0.7,
"eval_TIME_recall": 0.8076923076923077,
"eval_loss": 0.1404941827058792,
"eval_overall_accuracy": 0.9567175381536153,
"eval_overall_f1": 0.797843665768194,
"eval_overall_precision": 0.7344913151364765,
"eval_overall_recall": 0.8731563421828908,
"eval_runtime": 0.9094,
"eval_samples_per_second": 205.619,
"eval_steps_per_second": 3.299,
"step": 3604
},
{
"epoch": 35.0,
"grad_norm": 1.849617600440979,
"learning_rate": 3.2500000000000004e-05,
"loss": 0.1186,
"step": 3710
},
{
"epoch": 35.0,
"eval_LOCATION_f1": 0.7973856209150327,
"eval_LOCATION_number": 72,
"eval_LOCATION_precision": 0.7530864197530864,
"eval_LOCATION_recall": 0.8472222222222222,
"eval_ORGANIZATION_f1": 0.72,
"eval_ORGANIZATION_number": 75,
"eval_ORGANIZATION_precision": 0.63,
"eval_ORGANIZATION_recall": 0.84,
"eval_PERSON_f1": 0.8903654485049833,
"eval_PERSON_number": 143,
"eval_PERSON_precision": 0.8481012658227848,
"eval_PERSON_recall": 0.9370629370629371,
"eval_QUANTITY_f1": 0.6181818181818182,
"eval_QUANTITY_number": 23,
"eval_QUANTITY_precision": 0.53125,
"eval_QUANTITY_recall": 0.7391304347826086,
"eval_TIME_f1": 0.8,
"eval_TIME_number": 26,
"eval_TIME_precision": 0.7586206896551724,
"eval_TIME_recall": 0.8461538461538461,
"eval_loss": 0.1358003318309784,
"eval_overall_accuracy": 0.9567175381536153,
"eval_overall_f1": 0.803788903924222,
"eval_overall_precision": 0.7425,
"eval_overall_recall": 0.8761061946902655,
"eval_runtime": 0.9073,
"eval_samples_per_second": 206.098,
"eval_steps_per_second": 3.306,
"step": 3710
},
{
"epoch": 36.0,
"grad_norm": 1.2370284795761108,
"learning_rate": 3.2000000000000005e-05,
"loss": 0.1177,
"step": 3816
},
{
"epoch": 36.0,
"eval_LOCATION_f1": 0.7763157894736842,
"eval_LOCATION_number": 72,
"eval_LOCATION_precision": 0.7375,
"eval_LOCATION_recall": 0.8194444444444444,
"eval_ORGANIZATION_f1": 0.7272727272727272,
"eval_ORGANIZATION_number": 75,
"eval_ORGANIZATION_precision": 0.6666666666666666,
"eval_ORGANIZATION_recall": 0.8,
"eval_PERSON_f1": 0.8844884488448846,
"eval_PERSON_number": 143,
"eval_PERSON_precision": 0.8375,
"eval_PERSON_recall": 0.9370629370629371,
"eval_QUANTITY_f1": 0.6181818181818182,
"eval_QUANTITY_number": 23,
"eval_QUANTITY_precision": 0.53125,
"eval_QUANTITY_recall": 0.7391304347826086,
"eval_TIME_f1": 0.8363636363636363,
"eval_TIME_number": 26,
"eval_TIME_precision": 0.7931034482758621,
"eval_TIME_recall": 0.8846153846153846,
"eval_loss": 0.1319529414176941,
"eval_overall_accuracy": 0.9584688516387291,
"eval_overall_f1": 0.8027397260273973,
"eval_overall_precision": 0.7493606138107417,
"eval_overall_recall": 0.8643067846607669,
"eval_runtime": 0.9101,
"eval_samples_per_second": 205.474,
"eval_steps_per_second": 3.296,
"step": 3816
},
{
"epoch": 37.0,
"grad_norm": 2.0164999961853027,
"learning_rate": 3.15e-05,
"loss": 0.1183,
"step": 3922
},
{
"epoch": 37.0,
"eval_LOCATION_f1": 0.782051282051282,
"eval_LOCATION_number": 72,
"eval_LOCATION_precision": 0.7261904761904762,
"eval_LOCATION_recall": 0.8472222222222222,
"eval_ORGANIZATION_f1": 0.757396449704142,
"eval_ORGANIZATION_number": 75,
"eval_ORGANIZATION_precision": 0.6808510638297872,
"eval_ORGANIZATION_recall": 0.8533333333333334,
"eval_PERSON_f1": 0.8910891089108911,
"eval_PERSON_number": 143,
"eval_PERSON_precision": 0.84375,
"eval_PERSON_recall": 0.9440559440559441,
"eval_QUANTITY_f1": 0.6071428571428571,
"eval_QUANTITY_number": 23,
"eval_QUANTITY_precision": 0.5151515151515151,
"eval_QUANTITY_recall": 0.7391304347826086,
"eval_TIME_f1": 0.8363636363636363,
"eval_TIME_number": 26,
"eval_TIME_precision": 0.7931034482758621,
"eval_TIME_recall": 0.8846153846153846,
"eval_loss": 0.13670241832733154,
"eval_overall_accuracy": 0.9572179134350763,
"eval_overall_f1": 0.8119079837618404,
"eval_overall_precision": 0.75,
"eval_overall_recall": 0.8849557522123894,
"eval_runtime": 0.9293,
"eval_samples_per_second": 201.235,
"eval_steps_per_second": 3.228,
"step": 3922
},
{
"epoch": 38.0,
"grad_norm": 1.5912907123565674,
"learning_rate": 3.1e-05,
"loss": 0.1145,
"step": 4028
},
{
"epoch": 38.0,
"eval_LOCATION_f1": 0.7763157894736842,
"eval_LOCATION_number": 72,
"eval_LOCATION_precision": 0.7375,
"eval_LOCATION_recall": 0.8194444444444444,
"eval_ORGANIZATION_f1": 0.75,
"eval_ORGANIZATION_number": 75,
"eval_ORGANIZATION_precision": 0.6774193548387096,
"eval_ORGANIZATION_recall": 0.84,
"eval_PERSON_f1": 0.8794788273615636,
"eval_PERSON_number": 143,
"eval_PERSON_precision": 0.823170731707317,
"eval_PERSON_recall": 0.9440559440559441,
"eval_QUANTITY_f1": 0.5964912280701754,
"eval_QUANTITY_number": 23,
"eval_QUANTITY_precision": 0.5,
"eval_QUANTITY_recall": 0.7391304347826086,
"eval_TIME_f1": 0.7636363636363636,
"eval_TIME_number": 26,
"eval_TIME_precision": 0.7241379310344828,
"eval_TIME_recall": 0.8076923076923077,
"eval_loss": 0.13946709036827087,
"eval_overall_accuracy": 0.9562171628721541,
"eval_overall_f1": 0.7983761840324762,
"eval_overall_precision": 0.7375,
"eval_overall_recall": 0.8702064896755162,
"eval_runtime": 0.918,
"eval_samples_per_second": 203.705,
"eval_steps_per_second": 3.268,
"step": 4028
},
{
"epoch": 39.0,
"grad_norm": 0.7153412103652954,
"learning_rate": 3.05e-05,
"loss": 0.1138,
"step": 4134
},
{
"epoch": 39.0,
"eval_LOCATION_f1": 0.8133333333333332,
"eval_LOCATION_number": 72,
"eval_LOCATION_precision": 0.782051282051282,
"eval_LOCATION_recall": 0.8472222222222222,
"eval_ORGANIZATION_f1": 0.7251461988304094,
"eval_ORGANIZATION_number": 75,
"eval_ORGANIZATION_precision": 0.6458333333333334,
"eval_ORGANIZATION_recall": 0.8266666666666667,
"eval_PERSON_f1": 0.8963210702341137,
"eval_PERSON_number": 143,
"eval_PERSON_precision": 0.8589743589743589,
"eval_PERSON_recall": 0.9370629370629371,
"eval_QUANTITY_f1": 0.5818181818181818,
"eval_QUANTITY_number": 23,
"eval_QUANTITY_precision": 0.5,
"eval_QUANTITY_recall": 0.6956521739130435,
"eval_TIME_f1": 0.8363636363636363,
"eval_TIME_number": 26,
"eval_TIME_precision": 0.7931034482758621,
"eval_TIME_recall": 0.8846153846153846,
"eval_loss": 0.1324165016412735,
"eval_overall_accuracy": 0.957968476357268,
"eval_overall_f1": 0.810958904109589,
"eval_overall_precision": 0.7570332480818415,
"eval_overall_recall": 0.8731563421828908,
"eval_runtime": 0.9158,
"eval_samples_per_second": 204.202,
"eval_steps_per_second": 3.276,
"step": 4134
},
{
"epoch": 40.0,
"grad_norm": 1.3694576025009155,
"learning_rate": 3e-05,
"loss": 0.1131,
"step": 4240
},
{
"epoch": 40.0,
"eval_LOCATION_f1": 0.781456953642384,
"eval_LOCATION_number": 72,
"eval_LOCATION_precision": 0.7468354430379747,
"eval_LOCATION_recall": 0.8194444444444444,
"eval_ORGANIZATION_f1": 0.7469879518072289,
"eval_ORGANIZATION_number": 75,
"eval_ORGANIZATION_precision": 0.6813186813186813,
"eval_ORGANIZATION_recall": 0.8266666666666667,
"eval_PERSON_f1": 0.8940397350993377,
"eval_PERSON_number": 143,
"eval_PERSON_precision": 0.8490566037735849,
"eval_PERSON_recall": 0.9440559440559441,
"eval_QUANTITY_f1": 0.5925925925925926,
"eval_QUANTITY_number": 23,
"eval_QUANTITY_precision": 0.5161290322580645,
"eval_QUANTITY_recall": 0.6956521739130435,
"eval_TIME_f1": 0.7636363636363636,
"eval_TIME_number": 26,
"eval_TIME_precision": 0.7241379310344828,
"eval_TIME_recall": 0.8076923076923077,
"eval_loss": 0.13166731595993042,
"eval_overall_accuracy": 0.9584688516387291,
"eval_overall_f1": 0.8049450549450551,
"eval_overall_precision": 0.7532133676092545,
"eval_overall_recall": 0.8643067846607669,
"eval_runtime": 0.9126,
"eval_samples_per_second": 204.913,
"eval_steps_per_second": 3.287,
"step": 4240
},
{
"epoch": 41.0,
"grad_norm": 1.4050893783569336,
"learning_rate": 2.95e-05,
"loss": 0.1123,
"step": 4346
},
{
"epoch": 41.0,
"eval_LOCATION_f1": 0.7792207792207793,
"eval_LOCATION_number": 72,
"eval_LOCATION_precision": 0.7317073170731707,
"eval_LOCATION_recall": 0.8333333333333334,
"eval_ORGANIZATION_f1": 0.7529411764705883,
"eval_ORGANIZATION_number": 75,
"eval_ORGANIZATION_precision": 0.6736842105263158,
"eval_ORGANIZATION_recall": 0.8533333333333334,
"eval_PERSON_f1": 0.8729641693811075,
"eval_PERSON_number": 143,
"eval_PERSON_precision": 0.8170731707317073,
"eval_PERSON_recall": 0.9370629370629371,
"eval_QUANTITY_f1": 0.5818181818181818,
"eval_QUANTITY_number": 23,
"eval_QUANTITY_precision": 0.5,
"eval_QUANTITY_recall": 0.6956521739130435,
"eval_TIME_f1": 0.8,
"eval_TIME_number": 26,
"eval_TIME_precision": 0.7586206896551724,
"eval_TIME_recall": 0.8461538461538461,
"eval_loss": 0.13514545559883118,
"eval_overall_accuracy": 0.9569677257943457,
"eval_overall_f1": 0.7989203778677463,
"eval_overall_precision": 0.736318407960199,
"eval_overall_recall": 0.8731563421828908,
"eval_runtime": 0.9113,
"eval_samples_per_second": 205.195,
"eval_steps_per_second": 3.292,
"step": 4346
},
{
"epoch": 42.0,
"grad_norm": 1.5570241212844849,
"learning_rate": 2.9e-05,
"loss": 0.1123,
"step": 4452
},
{
"epoch": 42.0,
"eval_LOCATION_f1": 0.7973856209150327,
"eval_LOCATION_number": 72,
"eval_LOCATION_precision": 0.7530864197530864,
"eval_LOCATION_recall": 0.8472222222222222,
"eval_ORGANIZATION_f1": 0.7425149700598803,
"eval_ORGANIZATION_number": 75,
"eval_ORGANIZATION_precision": 0.6739130434782609,
"eval_ORGANIZATION_recall": 0.8266666666666667,
"eval_PERSON_f1": 0.8852459016393444,
"eval_PERSON_number": 143,
"eval_PERSON_precision": 0.8333333333333334,
"eval_PERSON_recall": 0.9440559440559441,
"eval_QUANTITY_f1": 0.5964912280701754,
"eval_QUANTITY_number": 23,
"eval_QUANTITY_precision": 0.5,
"eval_QUANTITY_recall": 0.7391304347826086,
"eval_TIME_f1": 0.8,
"eval_TIME_number": 26,
"eval_TIME_precision": 0.7586206896551724,
"eval_TIME_recall": 0.8461538461538461,
"eval_loss": 0.13604854047298431,
"eval_overall_accuracy": 0.9572179134350763,
"eval_overall_f1": 0.8059701492537314,
"eval_overall_precision": 0.7462311557788944,
"eval_overall_recall": 0.8761061946902655,
"eval_runtime": 0.9129,
"eval_samples_per_second": 204.836,
"eval_steps_per_second": 3.286,
"step": 4452
},
{
"epoch": 43.0,
"grad_norm": 0.9890122413635254,
"learning_rate": 2.8499999999999998e-05,
"loss": 0.1106,
"step": 4558
},
{
"epoch": 43.0,
"eval_LOCATION_f1": 0.7763157894736842,
"eval_LOCATION_number": 72,
"eval_LOCATION_precision": 0.7375,
"eval_LOCATION_recall": 0.8194444444444444,
"eval_ORGANIZATION_f1": 0.7425149700598803,
"eval_ORGANIZATION_number": 75,
"eval_ORGANIZATION_precision": 0.6739130434782609,
"eval_ORGANIZATION_recall": 0.8266666666666667,
"eval_PERSON_f1": 0.881578947368421,
"eval_PERSON_number": 143,
"eval_PERSON_precision": 0.8322981366459627,
"eval_PERSON_recall": 0.9370629370629371,
"eval_QUANTITY_f1": 0.6181818181818182,
"eval_QUANTITY_number": 23,
"eval_QUANTITY_precision": 0.53125,
"eval_QUANTITY_recall": 0.7391304347826086,
"eval_TIME_f1": 0.8,
"eval_TIME_number": 26,
"eval_TIME_precision": 0.7586206896551724,
"eval_TIME_recall": 0.8461538461538461,
"eval_loss": 0.13483330607414246,
"eval_overall_accuracy": 0.9572179134350763,
"eval_overall_f1": 0.8021828103683494,
"eval_overall_precision": 0.7461928934010152,
"eval_overall_recall": 0.8672566371681416,
"eval_runtime": 0.9143,
"eval_samples_per_second": 204.536,
"eval_steps_per_second": 3.281,
"step": 4558
},
{
"epoch": 44.0,
"grad_norm": 1.2907875776290894,
"learning_rate": 2.8000000000000003e-05,
"loss": 0.1104,
"step": 4664
},
{
"epoch": 44.0,
"eval_LOCATION_f1": 0.7894736842105262,
"eval_LOCATION_number": 72,
"eval_LOCATION_precision": 0.75,
"eval_LOCATION_recall": 0.8333333333333334,
"eval_ORGANIZATION_f1": 0.7484662576687117,
"eval_ORGANIZATION_number": 75,
"eval_ORGANIZATION_precision": 0.6931818181818182,
"eval_ORGANIZATION_recall": 0.8133333333333334,
"eval_PERSON_f1": 0.881578947368421,
"eval_PERSON_number": 143,
"eval_PERSON_precision": 0.8322981366459627,
"eval_PERSON_recall": 0.9370629370629371,
"eval_QUANTITY_f1": 0.6153846153846154,
"eval_QUANTITY_number": 23,
"eval_QUANTITY_precision": 0.5517241379310345,
"eval_QUANTITY_recall": 0.6956521739130435,
"eval_TIME_f1": 0.8363636363636363,
"eval_TIME_number": 26,
"eval_TIME_precision": 0.7931034482758621,
"eval_TIME_recall": 0.8846153846153846,
"eval_loss": 0.13180701434612274,
"eval_overall_accuracy": 0.9589692269201902,
"eval_overall_f1": 0.8099173553719009,
"eval_overall_precision": 0.7596899224806202,
"eval_overall_recall": 0.8672566371681416,
"eval_runtime": 0.9205,
"eval_samples_per_second": 203.159,
"eval_steps_per_second": 3.259,
"step": 4664
},
{
"epoch": 45.0,
"grad_norm": 1.4953218698501587,
"learning_rate": 2.7500000000000004e-05,
"loss": 0.1084,
"step": 4770
},
{
"epoch": 45.0,
"eval_LOCATION_f1": 0.7792207792207793,
"eval_LOCATION_number": 72,
"eval_LOCATION_precision": 0.7317073170731707,
"eval_LOCATION_recall": 0.8333333333333334,
"eval_ORGANIZATION_f1": 0.7294117647058824,
"eval_ORGANIZATION_number": 75,
"eval_ORGANIZATION_precision": 0.6526315789473685,
"eval_ORGANIZATION_recall": 0.8266666666666667,
"eval_PERSON_f1": 0.8947368421052632,
"eval_PERSON_number": 143,
"eval_PERSON_precision": 0.84472049689441,
"eval_PERSON_recall": 0.951048951048951,
"eval_QUANTITY_f1": 0.6071428571428571,
"eval_QUANTITY_number": 23,
"eval_QUANTITY_precision": 0.5151515151515151,
"eval_QUANTITY_recall": 0.7391304347826086,
"eval_TIME_f1": 0.7636363636363636,
"eval_TIME_number": 26,
"eval_TIME_precision": 0.7241379310344828,
"eval_TIME_recall": 0.8076923076923077,
"eval_loss": 0.13945060968399048,
"eval_overall_accuracy": 0.9554665999499625,
"eval_overall_f1": 0.8010825439783491,
"eval_overall_precision": 0.74,
"eval_overall_recall": 0.8731563421828908,
"eval_runtime": 0.9155,
"eval_samples_per_second": 204.271,
"eval_steps_per_second": 3.277,
"step": 4770
},
{
"epoch": 46.0,
"grad_norm": 0.8582813143730164,
"learning_rate": 2.7000000000000002e-05,
"loss": 0.1084,
"step": 4876
},
{
"epoch": 46.0,
"eval_LOCATION_f1": 0.7922077922077924,
"eval_LOCATION_number": 72,
"eval_LOCATION_precision": 0.7439024390243902,
"eval_LOCATION_recall": 0.8472222222222222,
"eval_ORGANIZATION_f1": 0.7619047619047621,
"eval_ORGANIZATION_number": 75,
"eval_ORGANIZATION_precision": 0.6881720430107527,
"eval_ORGANIZATION_recall": 0.8533333333333334,
"eval_PERSON_f1": 0.8881578947368421,
"eval_PERSON_number": 143,
"eval_PERSON_precision": 0.8385093167701864,
"eval_PERSON_recall": 0.9440559440559441,
"eval_QUANTITY_f1": 0.6415094339622641,
"eval_QUANTITY_number": 23,
"eval_QUANTITY_precision": 0.5666666666666667,
"eval_QUANTITY_recall": 0.7391304347826086,
"eval_TIME_f1": 0.8,
"eval_TIME_number": 26,
"eval_TIME_precision": 0.7586206896551724,
"eval_TIME_recall": 0.8461538461538461,
"eval_loss": 0.1349920630455017,
"eval_overall_accuracy": 0.957968476357268,
"eval_overall_f1": 0.8147138964577656,
"eval_overall_precision": 0.7569620253164557,
"eval_overall_recall": 0.8820058997050148,
"eval_runtime": 0.9125,
"eval_samples_per_second": 204.932,
"eval_steps_per_second": 3.288,
"step": 4876
},
{
"epoch": 47.0,
"grad_norm": 0.8841750621795654,
"learning_rate": 2.6500000000000004e-05,
"loss": 0.109,
"step": 4982
},
{
"epoch": 47.0,
"eval_LOCATION_f1": 0.7741935483870969,
"eval_LOCATION_number": 72,
"eval_LOCATION_precision": 0.7228915662650602,
"eval_LOCATION_recall": 0.8333333333333334,
"eval_ORGANIZATION_f1": 0.736842105263158,
"eval_ORGANIZATION_number": 75,
"eval_ORGANIZATION_precision": 0.65625,
"eval_ORGANIZATION_recall": 0.84,
"eval_PERSON_f1": 0.8910891089108911,
"eval_PERSON_number": 143,
"eval_PERSON_precision": 0.84375,
"eval_PERSON_recall": 0.9440559440559441,
"eval_QUANTITY_f1": 0.6071428571428571,
"eval_QUANTITY_number": 23,
"eval_QUANTITY_precision": 0.5151515151515151,
"eval_QUANTITY_recall": 0.7391304347826086,
"eval_TIME_f1": 0.7636363636363636,
"eval_TIME_number": 26,
"eval_TIME_precision": 0.7241379310344828,
"eval_TIME_recall": 0.8076923076923077,
"eval_loss": 0.13927918672561646,
"eval_overall_accuracy": 0.955716787590693,
"eval_overall_f1": 0.7999999999999999,
"eval_overall_precision": 0.7381546134663342,
"eval_overall_recall": 0.8731563421828908,
"eval_runtime": 0.904,
"eval_samples_per_second": 206.86,
"eval_steps_per_second": 3.319,
"step": 4982
},
{
"epoch": 48.0,
"grad_norm": 1.2972251176834106,
"learning_rate": 2.6000000000000002e-05,
"loss": 0.1058,
"step": 5088
},
{
"epoch": 48.0,
"eval_LOCATION_f1": 0.7741935483870969,
"eval_LOCATION_number": 72,
"eval_LOCATION_precision": 0.7228915662650602,
"eval_LOCATION_recall": 0.8333333333333334,
"eval_ORGANIZATION_f1": 0.7126436781609197,
"eval_ORGANIZATION_number": 75,
"eval_ORGANIZATION_precision": 0.6262626262626263,
"eval_ORGANIZATION_recall": 0.8266666666666667,
"eval_PERSON_f1": 0.8976897689768978,
"eval_PERSON_number": 143,
"eval_PERSON_precision": 0.85,
"eval_PERSON_recall": 0.951048951048951,
"eval_QUANTITY_f1": 0.5818181818181818,
"eval_QUANTITY_number": 23,
"eval_QUANTITY_precision": 0.5,
"eval_QUANTITY_recall": 0.6956521739130435,
"eval_TIME_f1": 0.7636363636363636,
"eval_TIME_number": 26,
"eval_TIME_precision": 0.7241379310344828,
"eval_TIME_recall": 0.8076923076923077,
"eval_loss": 0.13838200271129608,
"eval_overall_accuracy": 0.9552164123092319,
"eval_overall_f1": 0.7951482479784365,
"eval_overall_precision": 0.7320099255583127,
"eval_overall_recall": 0.8702064896755162,
"eval_runtime": 0.9049,
"eval_samples_per_second": 206.648,
"eval_steps_per_second": 3.315,
"step": 5088
},
{
"epoch": 49.0,
"grad_norm": 5.139357566833496,
"learning_rate": 2.5500000000000003e-05,
"loss": 0.1072,
"step": 5194
},
{
"epoch": 49.0,
"eval_LOCATION_f1": 0.7922077922077924,
"eval_LOCATION_number": 72,
"eval_LOCATION_precision": 0.7439024390243902,
"eval_LOCATION_recall": 0.8472222222222222,
"eval_ORGANIZATION_f1": 0.7469879518072289,
"eval_ORGANIZATION_number": 75,
"eval_ORGANIZATION_precision": 0.6813186813186813,
"eval_ORGANIZATION_recall": 0.8266666666666667,
"eval_PERSON_f1": 0.8874172185430464,
"eval_PERSON_number": 143,
"eval_PERSON_precision": 0.8427672955974843,
"eval_PERSON_recall": 0.9370629370629371,
"eval_QUANTITY_f1": 0.6153846153846154,
"eval_QUANTITY_number": 23,
"eval_QUANTITY_precision": 0.5517241379310345,
"eval_QUANTITY_recall": 0.6956521739130435,
"eval_TIME_f1": 0.8,
"eval_TIME_number": 26,
"eval_TIME_precision": 0.7586206896551724,
"eval_TIME_recall": 0.8461538461538461,
"eval_loss": 0.1352456659078598,
"eval_overall_accuracy": 0.9567175381536153,
"eval_overall_f1": 0.8093278463648834,
"eval_overall_precision": 0.7564102564102564,
"eval_overall_recall": 0.8702064896755162,
"eval_runtime": 0.912,
"eval_samples_per_second": 205.038,
"eval_steps_per_second": 3.289,
"step": 5194
},
{
"epoch": 50.0,
"grad_norm": 1.3401834964752197,
"learning_rate": 2.5e-05,
"loss": 0.1048,
"step": 5300
},
{
"epoch": 50.0,
"eval_LOCATION_f1": 0.7843137254901961,
"eval_LOCATION_number": 72,
"eval_LOCATION_precision": 0.7407407407407407,
"eval_LOCATION_recall": 0.8333333333333334,
"eval_ORGANIZATION_f1": 0.7469879518072289,
"eval_ORGANIZATION_number": 75,
"eval_ORGANIZATION_precision": 0.6813186813186813,
"eval_ORGANIZATION_recall": 0.8266666666666667,
"eval_PERSON_f1": 0.8881578947368421,
"eval_PERSON_number": 143,
"eval_PERSON_precision": 0.8385093167701864,
"eval_PERSON_recall": 0.9440559440559441,
"eval_QUANTITY_f1": 0.6181818181818182,
"eval_QUANTITY_number": 23,
"eval_QUANTITY_precision": 0.53125,
"eval_QUANTITY_recall": 0.7391304347826086,
"eval_TIME_f1": 0.8,
"eval_TIME_number": 26,
"eval_TIME_precision": 0.7586206896551724,
"eval_TIME_recall": 0.8461538461538461,
"eval_loss": 0.13750846683979034,
"eval_overall_accuracy": 0.9559669752314236,
"eval_overall_f1": 0.8076398362892225,
"eval_overall_precision": 0.751269035532995,
"eval_overall_recall": 0.8731563421828908,
"eval_runtime": 0.9784,
"eval_samples_per_second": 191.121,
"eval_steps_per_second": 3.066,
"step": 5300
},
{
"epoch": 51.0,
"grad_norm": 1.4734350442886353,
"learning_rate": 2.45e-05,
"loss": 0.1052,
"step": 5406
},
{
"epoch": 51.0,
"eval_LOCATION_f1": 0.7662337662337662,
"eval_LOCATION_number": 72,
"eval_LOCATION_precision": 0.7195121951219512,
"eval_LOCATION_recall": 0.8194444444444444,
"eval_ORGANIZATION_f1": 0.7294117647058824,
"eval_ORGANIZATION_number": 75,
"eval_ORGANIZATION_precision": 0.6526315789473685,
"eval_ORGANIZATION_recall": 0.8266666666666667,
"eval_PERSON_f1": 0.8881578947368421,
"eval_PERSON_number": 143,
"eval_PERSON_precision": 0.8385093167701864,
"eval_PERSON_recall": 0.9440559440559441,
"eval_QUANTITY_f1": 0.6037735849056605,
"eval_QUANTITY_number": 23,
"eval_QUANTITY_precision": 0.5333333333333333,
"eval_QUANTITY_recall": 0.6956521739130435,
"eval_TIME_f1": 0.8,
"eval_TIME_number": 26,
"eval_TIME_precision": 0.7586206896551724,
"eval_TIME_recall": 0.8461538461538461,
"eval_loss": 0.13331173360347748,
"eval_overall_accuracy": 0.9569677257943457,
"eval_overall_f1": 0.7989130434782608,
"eval_overall_precision": 0.7405541561712846,
"eval_overall_recall": 0.8672566371681416,
"eval_runtime": 0.9147,
"eval_samples_per_second": 204.445,
"eval_steps_per_second": 3.28,
"step": 5406
},
{
"epoch": 52.0,
"grad_norm": 1.5722417831420898,
"learning_rate": 2.4e-05,
"loss": 0.1028,
"step": 5512
},
{
"epoch": 52.0,
"eval_LOCATION_f1": 0.7712418300653595,
"eval_LOCATION_number": 72,
"eval_LOCATION_precision": 0.7283950617283951,
"eval_LOCATION_recall": 0.8194444444444444,
"eval_ORGANIZATION_f1": 0.7411764705882353,
"eval_ORGANIZATION_number": 75,
"eval_ORGANIZATION_precision": 0.6631578947368421,
"eval_ORGANIZATION_recall": 0.84,
"eval_PERSON_f1": 0.8940397350993377,
"eval_PERSON_number": 143,
"eval_PERSON_precision": 0.8490566037735849,
"eval_PERSON_recall": 0.9440559440559441,
"eval_QUANTITY_f1": 0.6071428571428571,
"eval_QUANTITY_number": 23,
"eval_QUANTITY_precision": 0.5151515151515151,
"eval_QUANTITY_recall": 0.7391304347826086,
"eval_TIME_f1": 0.8,
"eval_TIME_number": 26,
"eval_TIME_precision": 0.7586206896551724,
"eval_TIME_recall": 0.8461538461538461,
"eval_loss": 0.13255049288272858,
"eval_overall_accuracy": 0.9577182887165374,
"eval_overall_f1": 0.8043478260869565,
"eval_overall_precision": 0.7455919395465995,
"eval_overall_recall": 0.8731563421828908,
"eval_runtime": 0.9289,
"eval_samples_per_second": 201.318,
"eval_steps_per_second": 3.23,
"step": 5512
},
{
"epoch": 53.0,
"grad_norm": 2.0618319511413574,
"learning_rate": 2.35e-05,
"loss": 0.1022,
"step": 5618
},
{
"epoch": 53.0,
"eval_LOCATION_f1": 0.7792207792207793,
"eval_LOCATION_number": 72,
"eval_LOCATION_precision": 0.7317073170731707,
"eval_LOCATION_recall": 0.8333333333333334,
"eval_ORGANIZATION_f1": 0.7294117647058824,
"eval_ORGANIZATION_number": 75,
"eval_ORGANIZATION_precision": 0.6526315789473685,
"eval_ORGANIZATION_recall": 0.8266666666666667,
"eval_PERSON_f1": 0.8844884488448846,
"eval_PERSON_number": 143,
"eval_PERSON_precision": 0.8375,
"eval_PERSON_recall": 0.9370629370629371,
"eval_QUANTITY_f1": 0.6037735849056605,
"eval_QUANTITY_number": 23,
"eval_QUANTITY_precision": 0.5333333333333333,
"eval_QUANTITY_recall": 0.6956521739130435,
"eval_TIME_f1": 0.8,
"eval_TIME_number": 26,
"eval_TIME_precision": 0.7586206896551724,
"eval_TIME_recall": 0.8461538461538461,
"eval_loss": 0.1327483206987381,
"eval_overall_accuracy": 0.9564673505128847,
"eval_overall_f1": 0.7999999999999999,
"eval_overall_precision": 0.7424242424242424,
"eval_overall_recall": 0.8672566371681416,
"eval_runtime": 0.91,
"eval_samples_per_second": 205.495,
"eval_steps_per_second": 3.297,
"step": 5618
},
{
"epoch": 54.0,
"grad_norm": 2.0054030418395996,
"learning_rate": 2.3000000000000003e-05,
"loss": 0.103,
"step": 5724
},
{
"epoch": 54.0,
"eval_LOCATION_f1": 0.7792207792207793,
"eval_LOCATION_number": 72,
"eval_LOCATION_precision": 0.7317073170731707,
"eval_LOCATION_recall": 0.8333333333333334,
"eval_ORGANIZATION_f1": 0.7664670658682634,
"eval_ORGANIZATION_number": 75,
"eval_ORGANIZATION_precision": 0.6956521739130435,
"eval_ORGANIZATION_recall": 0.8533333333333334,
"eval_PERSON_f1": 0.8874172185430464,
"eval_PERSON_number": 143,
"eval_PERSON_precision": 0.8427672955974843,
"eval_PERSON_recall": 0.9370629370629371,
"eval_QUANTITY_f1": 0.6296296296296297,
"eval_QUANTITY_number": 23,
"eval_QUANTITY_precision": 0.5483870967741935,
"eval_QUANTITY_recall": 0.7391304347826086,
"eval_TIME_f1": 0.8,
"eval_TIME_number": 26,
"eval_TIME_precision": 0.7586206896551724,
"eval_TIME_recall": 0.8461538461538461,
"eval_loss": 0.1331961452960968,
"eval_overall_accuracy": 0.9577182887165374,
"eval_overall_f1": 0.8114754098360656,
"eval_overall_precision": 0.7557251908396947,
"eval_overall_recall": 0.8761061946902655,
"eval_runtime": 0.912,
"eval_samples_per_second": 205.05,
"eval_steps_per_second": 3.29,
"step": 5724
},
{
"epoch": 55.0,
"grad_norm": 2.02776837348938,
"learning_rate": 2.25e-05,
"loss": 0.1018,
"step": 5830
},
{
"epoch": 55.0,
"eval_LOCATION_f1": 0.7692307692307692,
"eval_LOCATION_number": 72,
"eval_LOCATION_precision": 0.7142857142857143,
"eval_LOCATION_recall": 0.8333333333333334,
"eval_ORGANIZATION_f1": 0.7222222222222222,
"eval_ORGANIZATION_number": 75,
"eval_ORGANIZATION_precision": 0.6190476190476191,
"eval_ORGANIZATION_recall": 0.8666666666666667,
"eval_PERSON_f1": 0.8910891089108911,
"eval_PERSON_number": 143,
"eval_PERSON_precision": 0.84375,
"eval_PERSON_recall": 0.9440559440559441,
"eval_QUANTITY_f1": 0.5964912280701754,
"eval_QUANTITY_number": 23,
"eval_QUANTITY_precision": 0.5,
"eval_QUANTITY_recall": 0.7391304347826086,
"eval_TIME_f1": 0.7636363636363636,
"eval_TIME_number": 26,
"eval_TIME_precision": 0.7241379310344828,
"eval_TIME_recall": 0.8076923076923077,
"eval_loss": 0.14076703786849976,
"eval_overall_accuracy": 0.9542156617463098,
"eval_overall_f1": 0.7936085219707057,
"eval_overall_precision": 0.7233009708737864,
"eval_overall_recall": 0.8790560471976401,
"eval_runtime": 0.9914,
"eval_samples_per_second": 188.627,
"eval_steps_per_second": 3.026,
"step": 5830
},
{
"epoch": 56.0,
"grad_norm": 1.5651822090148926,
"learning_rate": 2.2000000000000003e-05,
"loss": 0.1008,
"step": 5936
},
{
"epoch": 56.0,
"eval_LOCATION_f1": 0.7712418300653595,
"eval_LOCATION_number": 72,
"eval_LOCATION_precision": 0.7283950617283951,
"eval_LOCATION_recall": 0.8194444444444444,
"eval_ORGANIZATION_f1": 0.7804878048780487,
"eval_ORGANIZATION_number": 75,
"eval_ORGANIZATION_precision": 0.7191011235955056,
"eval_ORGANIZATION_recall": 0.8533333333333334,
"eval_PERSON_f1": 0.881578947368421,
"eval_PERSON_number": 143,
"eval_PERSON_precision": 0.8322981366459627,
"eval_PERSON_recall": 0.9370629370629371,
"eval_QUANTITY_f1": 0.6181818181818182,
"eval_QUANTITY_number": 23,
"eval_QUANTITY_precision": 0.53125,
"eval_QUANTITY_recall": 0.7391304347826086,
"eval_TIME_f1": 0.8,
"eval_TIME_number": 26,
"eval_TIME_precision": 0.7586206896551724,
"eval_TIME_recall": 0.8461538461538461,
"eval_loss": 0.13218992948532104,
"eval_overall_accuracy": 0.9577182887165374,
"eval_overall_f1": 0.8098495212038302,
"eval_overall_precision": 0.7551020408163265,
"eval_overall_recall": 0.8731563421828908,
"eval_runtime": 0.9174,
"eval_samples_per_second": 203.846,
"eval_steps_per_second": 3.27,
"step": 5936
},
{
"epoch": 57.0,
"grad_norm": 1.6610524654388428,
"learning_rate": 2.15e-05,
"loss": 0.0998,
"step": 6042
},
{
"epoch": 57.0,
"eval_LOCATION_f1": 0.7712418300653595,
"eval_LOCATION_number": 72,
"eval_LOCATION_precision": 0.7283950617283951,
"eval_LOCATION_recall": 0.8194444444444444,
"eval_ORGANIZATION_f1": 0.7607361963190183,
"eval_ORGANIZATION_number": 75,
"eval_ORGANIZATION_precision": 0.7045454545454546,
"eval_ORGANIZATION_recall": 0.8266666666666667,
"eval_PERSON_f1": 0.8844884488448846,
"eval_PERSON_number": 143,
"eval_PERSON_precision": 0.8375,
"eval_PERSON_recall": 0.9370629370629371,
"eval_QUANTITY_f1": 0.6296296296296297,
"eval_QUANTITY_number": 23,
"eval_QUANTITY_precision": 0.5483870967741935,
"eval_QUANTITY_recall": 0.7391304347826086,
"eval_TIME_f1": 0.8,
"eval_TIME_number": 26,
"eval_TIME_precision": 0.7586206896551724,
"eval_TIME_recall": 0.8461538461538461,
"eval_loss": 0.13176319003105164,
"eval_overall_accuracy": 0.9574681010758068,
"eval_overall_f1": 0.8076923076923076,
"eval_overall_precision": 0.7557840616966581,
"eval_overall_recall": 0.8672566371681416,
"eval_runtime": 0.9137,
"eval_samples_per_second": 204.653,
"eval_steps_per_second": 3.283,
"step": 6042
},
{
"epoch": 58.0,
"grad_norm": 0.7417497038841248,
"learning_rate": 2.1e-05,
"loss": 0.0985,
"step": 6148
},
{
"epoch": 58.0,
"eval_LOCATION_f1": 0.7792207792207793,
"eval_LOCATION_number": 72,
"eval_LOCATION_precision": 0.7317073170731707,
"eval_LOCATION_recall": 0.8333333333333334,
"eval_ORGANIZATION_f1": 0.7710843373493976,
"eval_ORGANIZATION_number": 75,
"eval_ORGANIZATION_precision": 0.7032967032967034,
"eval_ORGANIZATION_recall": 0.8533333333333334,
"eval_PERSON_f1": 0.8976897689768978,
"eval_PERSON_number": 143,
"eval_PERSON_precision": 0.85,
"eval_PERSON_recall": 0.951048951048951,
"eval_QUANTITY_f1": 0.6296296296296297,
"eval_QUANTITY_number": 23,
"eval_QUANTITY_precision": 0.5483870967741935,
"eval_QUANTITY_recall": 0.7391304347826086,
"eval_TIME_f1": 0.8,
"eval_TIME_number": 26,
"eval_TIME_precision": 0.7586206896551724,
"eval_TIME_recall": 0.8461538461538461,
"eval_loss": 0.13647660613059998,
"eval_overall_accuracy": 0.9582186639979985,
"eval_overall_f1": 0.8169398907103824,
"eval_overall_precision": 0.7608142493638677,
"eval_overall_recall": 0.8820058997050148,
"eval_runtime": 0.9157,
"eval_samples_per_second": 204.204,
"eval_steps_per_second": 3.276,
"step": 6148
},
{
"epoch": 59.0,
"grad_norm": 0.8337518572807312,
"learning_rate": 2.05e-05,
"loss": 0.0977,
"step": 6254
},
{
"epoch": 59.0,
"eval_LOCATION_f1": 0.7922077922077924,
"eval_LOCATION_number": 72,
"eval_LOCATION_precision": 0.7439024390243902,
"eval_LOCATION_recall": 0.8472222222222222,
"eval_ORGANIZATION_f1": 0.7529411764705883,
"eval_ORGANIZATION_number": 75,
"eval_ORGANIZATION_precision": 0.6736842105263158,
"eval_ORGANIZATION_recall": 0.8533333333333334,
"eval_PERSON_f1": 0.8976897689768978,
"eval_PERSON_number": 143,
"eval_PERSON_precision": 0.85,
"eval_PERSON_recall": 0.951048951048951,
"eval_QUANTITY_f1": 0.6071428571428571,
"eval_QUANTITY_number": 23,
"eval_QUANTITY_precision": 0.5151515151515151,
"eval_QUANTITY_recall": 0.7391304347826086,
"eval_TIME_f1": 0.7636363636363636,
"eval_TIME_number": 26,
"eval_TIME_precision": 0.7241379310344828,
"eval_TIME_recall": 0.8076923076923077,
"eval_loss": 0.1379348784685135,
"eval_overall_accuracy": 0.9562171628721541,
"eval_overall_f1": 0.8102981029810299,
"eval_overall_precision": 0.7493734335839599,
"eval_overall_recall": 0.8820058997050148,
"eval_runtime": 0.9422,
"eval_samples_per_second": 198.465,
"eval_steps_per_second": 3.184,
"step": 6254
},
{
"epoch": 60.0,
"grad_norm": 0.6735620498657227,
"learning_rate": 2e-05,
"loss": 0.0991,
"step": 6360
},
{
"epoch": 60.0,
"eval_LOCATION_f1": 0.7922077922077924,
"eval_LOCATION_number": 72,
"eval_LOCATION_precision": 0.7439024390243902,
"eval_LOCATION_recall": 0.8472222222222222,
"eval_ORGANIZATION_f1": 0.7602339181286549,
"eval_ORGANIZATION_number": 75,
"eval_ORGANIZATION_precision": 0.6770833333333334,
"eval_ORGANIZATION_recall": 0.8666666666666667,
"eval_PERSON_f1": 0.8976897689768978,
"eval_PERSON_number": 143,
"eval_PERSON_precision": 0.85,
"eval_PERSON_recall": 0.951048951048951,
"eval_QUANTITY_f1": 0.6181818181818182,
"eval_QUANTITY_number": 23,
"eval_QUANTITY_precision": 0.53125,
"eval_QUANTITY_recall": 0.7391304347826086,
"eval_TIME_f1": 0.7636363636363636,
"eval_TIME_number": 26,
"eval_TIME_precision": 0.7241379310344828,
"eval_TIME_recall": 0.8076923076923077,
"eval_loss": 0.13909530639648438,
"eval_overall_accuracy": 0.9567175381536153,
"eval_overall_f1": 0.8130081300813008,
"eval_overall_precision": 0.7518796992481203,
"eval_overall_recall": 0.8849557522123894,
"eval_runtime": 0.9803,
"eval_samples_per_second": 190.75,
"eval_steps_per_second": 3.06,
"step": 6360
},
{
"epoch": 61.0,
"grad_norm": 1.355182409286499,
"learning_rate": 1.9500000000000003e-05,
"loss": 0.0987,
"step": 6466
},
{
"epoch": 61.0,
"eval_LOCATION_f1": 0.7741935483870969,
"eval_LOCATION_number": 72,
"eval_LOCATION_precision": 0.7228915662650602,
"eval_LOCATION_recall": 0.8333333333333334,
"eval_ORGANIZATION_f1": 0.7428571428571429,
"eval_ORGANIZATION_number": 75,
"eval_ORGANIZATION_precision": 0.65,
"eval_ORGANIZATION_recall": 0.8666666666666667,
"eval_PERSON_f1": 0.8976897689768978,
"eval_PERSON_number": 143,
"eval_PERSON_precision": 0.85,
"eval_PERSON_recall": 0.951048951048951,
"eval_QUANTITY_f1": 0.6181818181818182,
"eval_QUANTITY_number": 23,
"eval_QUANTITY_precision": 0.53125,
"eval_QUANTITY_recall": 0.7391304347826086,
"eval_TIME_f1": 0.8,
"eval_TIME_number": 26,
"eval_TIME_precision": 0.7586206896551724,
"eval_TIME_recall": 0.8461538461538461,
"eval_loss": 0.14097541570663452,
"eval_overall_accuracy": 0.9559669752314236,
"eval_overall_f1": 0.8075370121130552,
"eval_overall_precision": 0.7425742574257426,
"eval_overall_recall": 0.8849557522123894,
"eval_runtime": 0.914,
"eval_samples_per_second": 204.604,
"eval_steps_per_second": 3.282,
"step": 6466
},
{
"epoch": 62.0,
"grad_norm": 0.8147560358047485,
"learning_rate": 1.9e-05,
"loss": 0.099,
"step": 6572
},
{
"epoch": 62.0,
"eval_LOCATION_f1": 0.781456953642384,
"eval_LOCATION_number": 72,
"eval_LOCATION_precision": 0.7468354430379747,
"eval_LOCATION_recall": 0.8194444444444444,
"eval_ORGANIZATION_f1": 0.7636363636363636,
"eval_ORGANIZATION_number": 75,
"eval_ORGANIZATION_precision": 0.7,
"eval_ORGANIZATION_recall": 0.84,
"eval_PERSON_f1": 0.8881578947368421,
"eval_PERSON_number": 143,
"eval_PERSON_precision": 0.8385093167701864,
"eval_PERSON_recall": 0.9440559440559441,
"eval_QUANTITY_f1": 0.5925925925925926,
"eval_QUANTITY_number": 23,
"eval_QUANTITY_precision": 0.5161290322580645,
"eval_QUANTITY_recall": 0.6956521739130435,
"eval_TIME_f1": 0.8,
"eval_TIME_number": 26,
"eval_TIME_precision": 0.7586206896551724,
"eval_TIME_recall": 0.8461538461538461,
"eval_loss": 0.13552354276180267,
"eval_overall_accuracy": 0.9572179134350763,
"eval_overall_f1": 0.8093278463648834,
"eval_overall_precision": 0.7564102564102564,
"eval_overall_recall": 0.8702064896755162,
"eval_runtime": 0.9112,
"eval_samples_per_second": 205.226,
"eval_steps_per_second": 3.292,
"step": 6572
},
{
"epoch": 63.0,
"grad_norm": 0.5771262049674988,
"learning_rate": 1.85e-05,
"loss": 0.0967,
"step": 6678
},
{
"epoch": 63.0,
"eval_LOCATION_f1": 0.781456953642384,
"eval_LOCATION_number": 72,
"eval_LOCATION_precision": 0.7468354430379747,
"eval_LOCATION_recall": 0.8194444444444444,
"eval_ORGANIZATION_f1": 0.7619047619047621,
"eval_ORGANIZATION_number": 75,
"eval_ORGANIZATION_precision": 0.6881720430107527,
"eval_ORGANIZATION_recall": 0.8533333333333334,
"eval_PERSON_f1": 0.8976897689768978,
"eval_PERSON_number": 143,
"eval_PERSON_precision": 0.85,
"eval_PERSON_recall": 0.951048951048951,
"eval_QUANTITY_f1": 0.5925925925925926,
"eval_QUANTITY_number": 23,
"eval_QUANTITY_precision": 0.5161290322580645,
"eval_QUANTITY_recall": 0.6956521739130435,
"eval_TIME_f1": 0.8,
"eval_TIME_number": 26,
"eval_TIME_precision": 0.7586206896551724,
"eval_TIME_recall": 0.8461538461538461,
"eval_loss": 0.13627471029758453,
"eval_overall_accuracy": 0.9574681010758068,
"eval_overall_f1": 0.8125854993160055,
"eval_overall_precision": 0.7576530612244898,
"eval_overall_recall": 0.8761061946902655,
"eval_runtime": 0.9093,
"eval_samples_per_second": 205.662,
"eval_steps_per_second": 3.299,
"step": 6678
},
{
"epoch": 64.0,
"grad_norm": 1.4576925039291382,
"learning_rate": 1.8e-05,
"loss": 0.0976,
"step": 6784
},
{
"epoch": 64.0,
"eval_LOCATION_f1": 0.7741935483870969,
"eval_LOCATION_number": 72,
"eval_LOCATION_precision": 0.7228915662650602,
"eval_LOCATION_recall": 0.8333333333333334,
"eval_ORGANIZATION_f1": 0.7398843930635838,
"eval_ORGANIZATION_number": 75,
"eval_ORGANIZATION_precision": 0.6530612244897959,
"eval_ORGANIZATION_recall": 0.8533333333333334,
"eval_PERSON_f1": 0.8976897689768978,
"eval_PERSON_number": 143,
"eval_PERSON_precision": 0.85,
"eval_PERSON_recall": 0.951048951048951,
"eval_QUANTITY_f1": 0.5714285714285715,
"eval_QUANTITY_number": 23,
"eval_QUANTITY_precision": 0.48484848484848486,
"eval_QUANTITY_recall": 0.6956521739130435,
"eval_TIME_f1": 0.8,
"eval_TIME_number": 26,
"eval_TIME_precision": 0.7586206896551724,
"eval_TIME_recall": 0.8461538461538461,
"eval_loss": 0.13925473392009735,
"eval_overall_accuracy": 0.9559669752314236,
"eval_overall_f1": 0.8032345013477089,
"eval_overall_precision": 0.739454094292804,
"eval_overall_recall": 0.8790560471976401,
"eval_runtime": 0.9093,
"eval_samples_per_second": 205.657,
"eval_steps_per_second": 3.299,
"step": 6784
},
{
"epoch": 65.0,
"grad_norm": 12.998764991760254,
"learning_rate": 1.75e-05,
"loss": 0.0977,
"step": 6890
},
{
"epoch": 65.0,
"eval_LOCATION_f1": 0.7712418300653595,
"eval_LOCATION_number": 72,
"eval_LOCATION_precision": 0.7283950617283951,
"eval_LOCATION_recall": 0.8194444444444444,
"eval_ORGANIZATION_f1": 0.7664670658682634,
"eval_ORGANIZATION_number": 75,
"eval_ORGANIZATION_precision": 0.6956521739130435,
"eval_ORGANIZATION_recall": 0.8533333333333334,
"eval_PERSON_f1": 0.8910891089108911,
"eval_PERSON_number": 143,
"eval_PERSON_precision": 0.84375,
"eval_PERSON_recall": 0.9440559440559441,
"eval_QUANTITY_f1": 0.6181818181818182,
"eval_QUANTITY_number": 23,
"eval_QUANTITY_precision": 0.53125,
"eval_QUANTITY_recall": 0.7391304347826086,
"eval_TIME_f1": 0.8,
"eval_TIME_number": 26,
"eval_TIME_precision": 0.7586206896551724,
"eval_TIME_recall": 0.8461538461538461,
"eval_loss": 0.13550983369350433,
"eval_overall_accuracy": 0.9577182887165374,
"eval_overall_f1": 0.8103683492496591,
"eval_overall_precision": 0.7538071065989848,
"eval_overall_recall": 0.8761061946902655,
"eval_runtime": 0.9302,
"eval_samples_per_second": 201.031,
"eval_steps_per_second": 3.225,
"step": 6890
},
{
"epoch": 66.0,
"grad_norm": 1.033444881439209,
"learning_rate": 1.7000000000000003e-05,
"loss": 0.096,
"step": 6996
},
{
"epoch": 66.0,
"eval_LOCATION_f1": 0.7712418300653595,
"eval_LOCATION_number": 72,
"eval_LOCATION_precision": 0.7283950617283951,
"eval_LOCATION_recall": 0.8194444444444444,
"eval_ORGANIZATION_f1": 0.7619047619047621,
"eval_ORGANIZATION_number": 75,
"eval_ORGANIZATION_precision": 0.6881720430107527,
"eval_ORGANIZATION_recall": 0.8533333333333334,
"eval_PERSON_f1": 0.8910891089108911,
"eval_PERSON_number": 143,
"eval_PERSON_precision": 0.84375,
"eval_PERSON_recall": 0.9440559440559441,
"eval_QUANTITY_f1": 0.5818181818181818,
"eval_QUANTITY_number": 23,
"eval_QUANTITY_precision": 0.5,
"eval_QUANTITY_recall": 0.6956521739130435,
"eval_TIME_f1": 0.8,
"eval_TIME_number": 26,
"eval_TIME_precision": 0.7586206896551724,
"eval_TIME_recall": 0.8461538461538461,
"eval_loss": 0.13633564114570618,
"eval_overall_accuracy": 0.9574681010758068,
"eval_overall_f1": 0.8065395095367849,
"eval_overall_precision": 0.7493670886075949,
"eval_overall_recall": 0.8731563421828908,
"eval_runtime": 0.9065,
"eval_samples_per_second": 206.297,
"eval_steps_per_second": 3.31,
"step": 6996
},
{
"epoch": 67.0,
"grad_norm": 0.6555174589157104,
"learning_rate": 1.65e-05,
"loss": 0.0958,
"step": 7102
},
{
"epoch": 67.0,
"eval_LOCATION_f1": 0.7712418300653595,
"eval_LOCATION_number": 72,
"eval_LOCATION_precision": 0.7283950617283951,
"eval_LOCATION_recall": 0.8194444444444444,
"eval_ORGANIZATION_f1": 0.7710843373493976,
"eval_ORGANIZATION_number": 75,
"eval_ORGANIZATION_precision": 0.7032967032967034,
"eval_ORGANIZATION_recall": 0.8533333333333334,
"eval_PERSON_f1": 0.8940397350993377,
"eval_PERSON_number": 143,
"eval_PERSON_precision": 0.8490566037735849,
"eval_PERSON_recall": 0.9440559440559441,
"eval_QUANTITY_f1": 0.6296296296296297,
"eval_QUANTITY_number": 23,
"eval_QUANTITY_precision": 0.5483870967741935,
"eval_QUANTITY_recall": 0.7391304347826086,
"eval_TIME_f1": 0.8,
"eval_TIME_number": 26,
"eval_TIME_precision": 0.7586206896551724,
"eval_TIME_recall": 0.8461538461538461,
"eval_loss": 0.13482040166854858,
"eval_overall_accuracy": 0.9582186639979985,
"eval_overall_f1": 0.8136986301369864,
"eval_overall_precision": 0.7595907928388747,
"eval_overall_recall": 0.8761061946902655,
"eval_runtime": 0.9171,
"eval_samples_per_second": 203.894,
"eval_steps_per_second": 3.271,
"step": 7102
},
{
"epoch": 68.0,
"grad_norm": 1.1487456560134888,
"learning_rate": 1.6000000000000003e-05,
"loss": 0.096,
"step": 7208
},
{
"epoch": 68.0,
"eval_LOCATION_f1": 0.7792207792207793,
"eval_LOCATION_number": 72,
"eval_LOCATION_precision": 0.7317073170731707,
"eval_LOCATION_recall": 0.8333333333333334,
"eval_ORGANIZATION_f1": 0.7831325301204819,
"eval_ORGANIZATION_number": 75,
"eval_ORGANIZATION_precision": 0.7142857142857143,
"eval_ORGANIZATION_recall": 0.8666666666666667,
"eval_PERSON_f1": 0.9006622516556291,
"eval_PERSON_number": 143,
"eval_PERSON_precision": 0.8553459119496856,
"eval_PERSON_recall": 0.951048951048951,
"eval_QUANTITY_f1": 0.5818181818181818,
"eval_QUANTITY_number": 23,
"eval_QUANTITY_precision": 0.5,
"eval_QUANTITY_recall": 0.6956521739130435,
"eval_TIME_f1": 0.7636363636363636,
"eval_TIME_number": 26,
"eval_TIME_precision": 0.7241379310344828,
"eval_TIME_recall": 0.8076923076923077,
"eval_loss": 0.13745680451393127,
"eval_overall_accuracy": 0.9582186639979985,
"eval_overall_f1": 0.8142076502732241,
"eval_overall_precision": 0.7582697201017812,
"eval_overall_recall": 0.8790560471976401,
"eval_runtime": 0.9069,
"eval_samples_per_second": 206.198,
"eval_steps_per_second": 3.308,
"step": 7208
},
{
"epoch": 69.0,
"grad_norm": 1.4904353618621826,
"learning_rate": 1.55e-05,
"loss": 0.0956,
"step": 7314
},
{
"epoch": 69.0,
"eval_LOCATION_f1": 0.7631578947368423,
"eval_LOCATION_number": 72,
"eval_LOCATION_precision": 0.725,
"eval_LOCATION_recall": 0.8055555555555556,
"eval_ORGANIZATION_f1": 0.7590361445783131,
"eval_ORGANIZATION_number": 75,
"eval_ORGANIZATION_precision": 0.6923076923076923,
"eval_ORGANIZATION_recall": 0.84,
"eval_PERSON_f1": 0.8940397350993377,
"eval_PERSON_number": 143,
"eval_PERSON_precision": 0.8490566037735849,
"eval_PERSON_recall": 0.9440559440559441,
"eval_QUANTITY_f1": 0.5925925925925926,
"eval_QUANTITY_number": 23,
"eval_QUANTITY_precision": 0.5161290322580645,
"eval_QUANTITY_recall": 0.6956521739130435,
"eval_TIME_f1": 0.8,
"eval_TIME_number": 26,
"eval_TIME_precision": 0.7586206896551724,
"eval_TIME_recall": 0.8461538461538461,
"eval_loss": 0.13514593243598938,
"eval_overall_accuracy": 0.957968476357268,
"eval_overall_f1": 0.8065843621399177,
"eval_overall_precision": 0.7538461538461538,
"eval_overall_recall": 0.8672566371681416,
"eval_runtime": 0.9093,
"eval_samples_per_second": 205.654,
"eval_steps_per_second": 3.299,
"step": 7314
},
{
"epoch": 70.0,
"grad_norm": 0.8389599919319153,
"learning_rate": 1.5e-05,
"loss": 0.0952,
"step": 7420
},
{
"epoch": 70.0,
"eval_LOCATION_f1": 0.7712418300653595,
"eval_LOCATION_number": 72,
"eval_LOCATION_precision": 0.7283950617283951,
"eval_LOCATION_recall": 0.8194444444444444,
"eval_ORGANIZATION_f1": 0.7425149700598803,
"eval_ORGANIZATION_number": 75,
"eval_ORGANIZATION_precision": 0.6739130434782609,
"eval_ORGANIZATION_recall": 0.8266666666666667,
"eval_PERSON_f1": 0.881578947368421,
"eval_PERSON_number": 143,
"eval_PERSON_precision": 0.8322981366459627,
"eval_PERSON_recall": 0.9370629370629371,
"eval_QUANTITY_f1": 0.6037735849056605,
"eval_QUANTITY_number": 23,
"eval_QUANTITY_precision": 0.5333333333333333,
"eval_QUANTITY_recall": 0.6956521739130435,
"eval_TIME_f1": 0.8,
"eval_TIME_number": 26,
"eval_TIME_precision": 0.7586206896551724,
"eval_TIME_recall": 0.8461538461538461,
"eval_loss": 0.13362941145896912,
"eval_overall_accuracy": 0.9567175381536153,
"eval_overall_f1": 0.8005464480874317,
"eval_overall_precision": 0.7455470737913485,
"eval_overall_recall": 0.8643067846607669,
"eval_runtime": 0.9037,
"eval_samples_per_second": 206.933,
"eval_steps_per_second": 3.32,
"step": 7420
},
{
"epoch": 71.0,
"grad_norm": 1.3361512422561646,
"learning_rate": 1.45e-05,
"loss": 0.0956,
"step": 7526
},
{
"epoch": 71.0,
"eval_LOCATION_f1": 0.7792207792207793,
"eval_LOCATION_number": 72,
"eval_LOCATION_precision": 0.7317073170731707,
"eval_LOCATION_recall": 0.8333333333333334,
"eval_ORGANIZATION_f1": 0.7619047619047621,
"eval_ORGANIZATION_number": 75,
"eval_ORGANIZATION_precision": 0.6881720430107527,
"eval_ORGANIZATION_recall": 0.8533333333333334,
"eval_PERSON_f1": 0.8844884488448846,
"eval_PERSON_number": 143,
"eval_PERSON_precision": 0.8375,
"eval_PERSON_recall": 0.9370629370629371,
"eval_QUANTITY_f1": 0.5925925925925926,
"eval_QUANTITY_number": 23,
"eval_QUANTITY_precision": 0.5161290322580645,
"eval_QUANTITY_recall": 0.6956521739130435,
"eval_TIME_f1": 0.7636363636363636,
"eval_TIME_number": 26,
"eval_TIME_precision": 0.7241379310344828,
"eval_TIME_recall": 0.8076923076923077,
"eval_loss": 0.13655199110507965,
"eval_overall_accuracy": 0.9567175381536153,
"eval_overall_f1": 0.8038147138964578,
"eval_overall_precision": 0.7468354430379747,
"eval_overall_recall": 0.8702064896755162,
"eval_runtime": 0.9117,
"eval_samples_per_second": 205.103,
"eval_steps_per_second": 3.29,
"step": 7526
},
{
"epoch": 72.0,
"grad_norm": 1.1266378164291382,
"learning_rate": 1.4000000000000001e-05,
"loss": 0.0948,
"step": 7632
},
{
"epoch": 72.0,
"eval_LOCATION_f1": 0.7792207792207793,
"eval_LOCATION_number": 72,
"eval_LOCATION_precision": 0.7317073170731707,
"eval_LOCATION_recall": 0.8333333333333334,
"eval_ORGANIZATION_f1": 0.7692307692307693,
"eval_ORGANIZATION_number": 75,
"eval_ORGANIZATION_precision": 0.6914893617021277,
"eval_ORGANIZATION_recall": 0.8666666666666667,
"eval_PERSON_f1": 0.8910891089108911,
"eval_PERSON_number": 143,
"eval_PERSON_precision": 0.84375,
"eval_PERSON_recall": 0.9440559440559441,
"eval_QUANTITY_f1": 0.5925925925925926,
"eval_QUANTITY_number": 23,
"eval_QUANTITY_precision": 0.5161290322580645,
"eval_QUANTITY_recall": 0.6956521739130435,
"eval_TIME_f1": 0.7636363636363636,
"eval_TIME_number": 26,
"eval_TIME_precision": 0.7241379310344828,
"eval_TIME_recall": 0.8076923076923077,
"eval_loss": 0.13651823997497559,
"eval_overall_accuracy": 0.9582186639979985,
"eval_overall_f1": 0.8081632653061224,
"eval_overall_precision": 0.75,
"eval_overall_recall": 0.8761061946902655,
"eval_runtime": 0.9168,
"eval_samples_per_second": 203.972,
"eval_steps_per_second": 3.272,
"step": 7632
},
{
"epoch": 73.0,
"grad_norm": 1.7619799375534058,
"learning_rate": 1.3500000000000001e-05,
"loss": 0.096,
"step": 7738
},
{
"epoch": 73.0,
"eval_LOCATION_f1": 0.7712418300653595,
"eval_LOCATION_number": 72,
"eval_LOCATION_precision": 0.7283950617283951,
"eval_LOCATION_recall": 0.8194444444444444,
"eval_ORGANIZATION_f1": 0.7619047619047621,
"eval_ORGANIZATION_number": 75,
"eval_ORGANIZATION_precision": 0.6881720430107527,
"eval_ORGANIZATION_recall": 0.8533333333333334,
"eval_PERSON_f1": 0.8903654485049833,
"eval_PERSON_number": 143,
"eval_PERSON_precision": 0.8481012658227848,
"eval_PERSON_recall": 0.9370629370629371,
"eval_QUANTITY_f1": 0.6037735849056605,
"eval_QUANTITY_number": 23,
"eval_QUANTITY_precision": 0.5333333333333333,
"eval_QUANTITY_recall": 0.6956521739130435,
"eval_TIME_f1": 0.8,
"eval_TIME_number": 26,
"eval_TIME_precision": 0.7586206896551724,
"eval_TIME_recall": 0.8461538461538461,
"eval_loss": 0.13442060351371765,
"eval_overall_accuracy": 0.9574681010758068,
"eval_overall_f1": 0.8082191780821917,
"eval_overall_precision": 0.7544757033248082,
"eval_overall_recall": 0.8702064896755162,
"eval_runtime": 0.9164,
"eval_samples_per_second": 204.061,
"eval_steps_per_second": 3.274,
"step": 7738
},
{
"epoch": 74.0,
"grad_norm": 1.590961217880249,
"learning_rate": 1.3000000000000001e-05,
"loss": 0.0939,
"step": 7844
},
{
"epoch": 74.0,
"eval_LOCATION_f1": 0.7612903225806451,
"eval_LOCATION_number": 72,
"eval_LOCATION_precision": 0.7108433734939759,
"eval_LOCATION_recall": 0.8194444444444444,
"eval_ORGANIZATION_f1": 0.7692307692307693,
"eval_ORGANIZATION_number": 75,
"eval_ORGANIZATION_precision": 0.6914893617021277,
"eval_ORGANIZATION_recall": 0.8666666666666667,
"eval_PERSON_f1": 0.8844884488448846,
"eval_PERSON_number": 143,
"eval_PERSON_precision": 0.8375,
"eval_PERSON_recall": 0.9370629370629371,
"eval_QUANTITY_f1": 0.5818181818181818,
"eval_QUANTITY_number": 23,
"eval_QUANTITY_precision": 0.5,
"eval_QUANTITY_recall": 0.6956521739130435,
"eval_TIME_f1": 0.7636363636363636,
"eval_TIME_number": 26,
"eval_TIME_precision": 0.7241379310344828,
"eval_TIME_recall": 0.8076923076923077,
"eval_loss": 0.14096762239933014,
"eval_overall_accuracy": 0.9559669752314236,
"eval_overall_f1": 0.8005427408412482,
"eval_overall_precision": 0.7412060301507538,
"eval_overall_recall": 0.8702064896755162,
"eval_runtime": 0.9114,
"eval_samples_per_second": 205.17,
"eval_steps_per_second": 3.291,
"step": 7844
},
{
"epoch": 75.0,
"grad_norm": 1.3473641872406006,
"learning_rate": 1.25e-05,
"loss": 0.0936,
"step": 7950
},
{
"epoch": 75.0,
"eval_LOCATION_f1": 0.7712418300653595,
"eval_LOCATION_number": 72,
"eval_LOCATION_precision": 0.7283950617283951,
"eval_LOCATION_recall": 0.8194444444444444,
"eval_ORGANIZATION_f1": 0.7558139534883721,
"eval_ORGANIZATION_number": 75,
"eval_ORGANIZATION_precision": 0.6701030927835051,
"eval_ORGANIZATION_recall": 0.8666666666666667,
"eval_PERSON_f1": 0.8940397350993377,
"eval_PERSON_number": 143,
"eval_PERSON_precision": 0.8490566037735849,
"eval_PERSON_recall": 0.9440559440559441,
"eval_QUANTITY_f1": 0.5818181818181818,
"eval_QUANTITY_number": 23,
"eval_QUANTITY_precision": 0.5,
"eval_QUANTITY_recall": 0.6956521739130435,
"eval_TIME_f1": 0.7636363636363636,
"eval_TIME_number": 26,
"eval_TIME_precision": 0.7241379310344828,
"eval_TIME_recall": 0.8076923076923077,
"eval_loss": 0.13918167352676392,
"eval_overall_accuracy": 0.9559669752314236,
"eval_overall_f1": 0.8032564450474898,
"eval_overall_precision": 0.7437185929648241,
"eval_overall_recall": 0.8731563421828908,
"eval_runtime": 0.9163,
"eval_samples_per_second": 204.086,
"eval_steps_per_second": 3.274,
"step": 7950
},
{
"epoch": 76.0,
"grad_norm": 1.2699788808822632,
"learning_rate": 1.2e-05,
"loss": 0.0923,
"step": 8056
},
{
"epoch": 76.0,
"eval_LOCATION_f1": 0.7712418300653595,
"eval_LOCATION_number": 72,
"eval_LOCATION_precision": 0.7283950617283951,
"eval_LOCATION_recall": 0.8194444444444444,
"eval_ORGANIZATION_f1": 0.7647058823529413,
"eval_ORGANIZATION_number": 75,
"eval_ORGANIZATION_precision": 0.6842105263157895,
"eval_ORGANIZATION_recall": 0.8666666666666667,
"eval_PERSON_f1": 0.8910891089108911,
"eval_PERSON_number": 143,
"eval_PERSON_precision": 0.84375,
"eval_PERSON_recall": 0.9440559440559441,
"eval_QUANTITY_f1": 0.5818181818181818,
"eval_QUANTITY_number": 23,
"eval_QUANTITY_precision": 0.5,
"eval_QUANTITY_recall": 0.6956521739130435,
"eval_TIME_f1": 0.8,
"eval_TIME_number": 26,
"eval_TIME_precision": 0.7586206896551724,
"eval_TIME_recall": 0.8461538461538461,
"eval_loss": 0.1376781463623047,
"eval_overall_accuracy": 0.9569677257943457,
"eval_overall_f1": 0.8070652173913044,
"eval_overall_precision": 0.7481108312342569,
"eval_overall_recall": 0.8761061946902655,
"eval_runtime": 0.9152,
"eval_samples_per_second": 204.323,
"eval_steps_per_second": 3.278,
"step": 8056
},
{
"epoch": 77.0,
"grad_norm": 0.7005648612976074,
"learning_rate": 1.1500000000000002e-05,
"loss": 0.0914,
"step": 8162
},
{
"epoch": 77.0,
"eval_LOCATION_f1": 0.7662337662337662,
"eval_LOCATION_number": 72,
"eval_LOCATION_precision": 0.7195121951219512,
"eval_LOCATION_recall": 0.8194444444444444,
"eval_ORGANIZATION_f1": 0.7558139534883721,
"eval_ORGANIZATION_number": 75,
"eval_ORGANIZATION_precision": 0.6701030927835051,
"eval_ORGANIZATION_recall": 0.8666666666666667,
"eval_PERSON_f1": 0.8903654485049833,
"eval_PERSON_number": 143,
"eval_PERSON_precision": 0.8481012658227848,
"eval_PERSON_recall": 0.9370629370629371,
"eval_QUANTITY_f1": 0.5925925925925926,
"eval_QUANTITY_number": 23,
"eval_QUANTITY_precision": 0.5161290322580645,
"eval_QUANTITY_recall": 0.6956521739130435,
"eval_TIME_f1": 0.7636363636363636,
"eval_TIME_number": 26,
"eval_TIME_precision": 0.7241379310344828,
"eval_TIME_recall": 0.8076923076923077,
"eval_loss": 0.13786636292934418,
"eval_overall_accuracy": 0.9564673505128847,
"eval_overall_f1": 0.8016304347826085,
"eval_overall_precision": 0.743073047858942,
"eval_overall_recall": 0.8702064896755162,
"eval_runtime": 0.9115,
"eval_samples_per_second": 205.158,
"eval_steps_per_second": 3.291,
"step": 8162
},
{
"epoch": 78.0,
"grad_norm": 1.3490372896194458,
"learning_rate": 1.1000000000000001e-05,
"loss": 0.0921,
"step": 8268
},
{
"epoch": 78.0,
"eval_LOCATION_f1": 0.7712418300653595,
"eval_LOCATION_number": 72,
"eval_LOCATION_precision": 0.7283950617283951,
"eval_LOCATION_recall": 0.8194444444444444,
"eval_ORGANIZATION_f1": 0.7515151515151515,
"eval_ORGANIZATION_number": 75,
"eval_ORGANIZATION_precision": 0.6888888888888889,
"eval_ORGANIZATION_recall": 0.8266666666666667,
"eval_PERSON_f1": 0.8940397350993377,
"eval_PERSON_number": 143,
"eval_PERSON_precision": 0.8490566037735849,
"eval_PERSON_recall": 0.9440559440559441,
"eval_QUANTITY_f1": 0.5925925925925926,
"eval_QUANTITY_number": 23,
"eval_QUANTITY_precision": 0.5161290322580645,
"eval_QUANTITY_recall": 0.6956521739130435,
"eval_TIME_f1": 0.8,
"eval_TIME_number": 26,
"eval_TIME_precision": 0.7586206896551724,
"eval_TIME_recall": 0.8461538461538461,
"eval_loss": 0.1341177523136139,
"eval_overall_accuracy": 0.957968476357268,
"eval_overall_f1": 0.8065843621399177,
"eval_overall_precision": 0.7538461538461538,
"eval_overall_recall": 0.8672566371681416,
"eval_runtime": 0.9056,
"eval_samples_per_second": 206.504,
"eval_steps_per_second": 3.313,
"step": 8268
},
{
"epoch": 79.0,
"grad_norm": 1.7868270874023438,
"learning_rate": 1.05e-05,
"loss": 0.0917,
"step": 8374
},
{
"epoch": 79.0,
"eval_LOCATION_f1": 0.7631578947368423,
"eval_LOCATION_number": 72,
"eval_LOCATION_precision": 0.725,
"eval_LOCATION_recall": 0.8055555555555556,
"eval_ORGANIZATION_f1": 0.7619047619047621,
"eval_ORGANIZATION_number": 75,
"eval_ORGANIZATION_precision": 0.6881720430107527,
"eval_ORGANIZATION_recall": 0.8533333333333334,
"eval_PERSON_f1": 0.9,
"eval_PERSON_number": 143,
"eval_PERSON_precision": 0.8598726114649682,
"eval_PERSON_recall": 0.9440559440559441,
"eval_QUANTITY_f1": 0.6037735849056605,
"eval_QUANTITY_number": 23,
"eval_QUANTITY_precision": 0.5333333333333333,
"eval_QUANTITY_recall": 0.6956521739130435,
"eval_TIME_f1": 0.8,
"eval_TIME_number": 26,
"eval_TIME_precision": 0.7586206896551724,
"eval_TIME_recall": 0.8461538461538461,
"eval_loss": 0.1321086883544922,
"eval_overall_accuracy": 0.957968476357268,
"eval_overall_f1": 0.8104395604395604,
"eval_overall_precision": 0.7583547557840618,
"eval_overall_recall": 0.8702064896755162,
"eval_runtime": 0.912,
"eval_samples_per_second": 205.039,
"eval_steps_per_second": 3.289,
"step": 8374
},
{
"epoch": 80.0,
"grad_norm": 0.7334626913070679,
"learning_rate": 1e-05,
"loss": 0.0918,
"step": 8480
},
{
"epoch": 80.0,
"eval_LOCATION_f1": 0.7662337662337662,
"eval_LOCATION_number": 72,
"eval_LOCATION_precision": 0.7195121951219512,
"eval_LOCATION_recall": 0.8194444444444444,
"eval_ORGANIZATION_f1": 0.7692307692307693,
"eval_ORGANIZATION_number": 75,
"eval_ORGANIZATION_precision": 0.6914893617021277,
"eval_ORGANIZATION_recall": 0.8666666666666667,
"eval_PERSON_f1": 0.8874172185430464,
"eval_PERSON_number": 143,
"eval_PERSON_precision": 0.8427672955974843,
"eval_PERSON_recall": 0.9370629370629371,
"eval_QUANTITY_f1": 0.5818181818181818,
"eval_QUANTITY_number": 23,
"eval_QUANTITY_precision": 0.5,
"eval_QUANTITY_recall": 0.6956521739130435,
"eval_TIME_f1": 0.7636363636363636,
"eval_TIME_number": 26,
"eval_TIME_precision": 0.7241379310344828,
"eval_TIME_recall": 0.8076923076923077,
"eval_loss": 0.1394556760787964,
"eval_overall_accuracy": 0.9572179134350763,
"eval_overall_f1": 0.8027210884353742,
"eval_overall_precision": 0.7449494949494949,
"eval_overall_recall": 0.8702064896755162,
"eval_runtime": 0.9129,
"eval_samples_per_second": 204.847,
"eval_steps_per_second": 3.286,
"step": 8480
},
{
"epoch": 81.0,
"grad_norm": 1.6766005754470825,
"learning_rate": 9.5e-06,
"loss": 0.0925,
"step": 8586
},
{
"epoch": 81.0,
"eval_LOCATION_f1": 0.7712418300653595,
"eval_LOCATION_number": 72,
"eval_LOCATION_precision": 0.7283950617283951,
"eval_LOCATION_recall": 0.8194444444444444,
"eval_ORGANIZATION_f1": 0.757396449704142,
"eval_ORGANIZATION_number": 75,
"eval_ORGANIZATION_precision": 0.6808510638297872,
"eval_ORGANIZATION_recall": 0.8533333333333334,
"eval_PERSON_f1": 0.8874172185430464,
"eval_PERSON_number": 143,
"eval_PERSON_precision": 0.8427672955974843,
"eval_PERSON_recall": 0.9370629370629371,
"eval_QUANTITY_f1": 0.5925925925925926,
"eval_QUANTITY_number": 23,
"eval_QUANTITY_precision": 0.5161290322580645,
"eval_QUANTITY_recall": 0.6956521739130435,
"eval_TIME_f1": 0.7636363636363636,
"eval_TIME_number": 26,
"eval_TIME_precision": 0.7241379310344828,
"eval_TIME_recall": 0.8076923076923077,
"eval_loss": 0.137154683470726,
"eval_overall_accuracy": 0.9572179134350763,
"eval_overall_f1": 0.8021828103683494,
"eval_overall_precision": 0.7461928934010152,
"eval_overall_recall": 0.8672566371681416,
"eval_runtime": 0.9114,
"eval_samples_per_second": 205.177,
"eval_steps_per_second": 3.292,
"step": 8586
},
{
"epoch": 82.0,
"grad_norm": 1.6531654596328735,
"learning_rate": 9e-06,
"loss": 0.0901,
"step": 8692
},
{
"epoch": 82.0,
"eval_LOCATION_f1": 0.7712418300653595,
"eval_LOCATION_number": 72,
"eval_LOCATION_precision": 0.7283950617283951,
"eval_LOCATION_recall": 0.8194444444444444,
"eval_ORGANIZATION_f1": 0.757396449704142,
"eval_ORGANIZATION_number": 75,
"eval_ORGANIZATION_precision": 0.6808510638297872,
"eval_ORGANIZATION_recall": 0.8533333333333334,
"eval_PERSON_f1": 0.8874172185430464,
"eval_PERSON_number": 143,
"eval_PERSON_precision": 0.8427672955974843,
"eval_PERSON_recall": 0.9370629370629371,
"eval_QUANTITY_f1": 0.5925925925925926,
"eval_QUANTITY_number": 23,
"eval_QUANTITY_precision": 0.5161290322580645,
"eval_QUANTITY_recall": 0.6956521739130435,
"eval_TIME_f1": 0.7636363636363636,
"eval_TIME_number": 26,
"eval_TIME_precision": 0.7241379310344828,
"eval_TIME_recall": 0.8076923076923077,
"eval_loss": 0.13694968819618225,
"eval_overall_accuracy": 0.9572179134350763,
"eval_overall_f1": 0.8021828103683494,
"eval_overall_precision": 0.7461928934010152,
"eval_overall_recall": 0.8672566371681416,
"eval_runtime": 0.9646,
"eval_samples_per_second": 193.863,
"eval_steps_per_second": 3.11,
"step": 8692
},
{
"epoch": 83.0,
"grad_norm": 3.4270708560943604,
"learning_rate": 8.500000000000002e-06,
"loss": 0.0914,
"step": 8798
},
{
"epoch": 83.0,
"eval_LOCATION_f1": 0.7712418300653595,
"eval_LOCATION_number": 72,
"eval_LOCATION_precision": 0.7283950617283951,
"eval_LOCATION_recall": 0.8194444444444444,
"eval_ORGANIZATION_f1": 0.757396449704142,
"eval_ORGANIZATION_number": 75,
"eval_ORGANIZATION_precision": 0.6808510638297872,
"eval_ORGANIZATION_recall": 0.8533333333333334,
"eval_PERSON_f1": 0.8903654485049833,
"eval_PERSON_number": 143,
"eval_PERSON_precision": 0.8481012658227848,
"eval_PERSON_recall": 0.9370629370629371,
"eval_QUANTITY_f1": 0.5925925925925926,
"eval_QUANTITY_number": 23,
"eval_QUANTITY_precision": 0.5161290322580645,
"eval_QUANTITY_recall": 0.6956521739130435,
"eval_TIME_f1": 0.7636363636363636,
"eval_TIME_number": 26,
"eval_TIME_precision": 0.7241379310344828,
"eval_TIME_recall": 0.8076923076923077,
"eval_loss": 0.1351262480020523,
"eval_overall_accuracy": 0.9574681010758068,
"eval_overall_f1": 0.8032786885245901,
"eval_overall_precision": 0.7480916030534351,
"eval_overall_recall": 0.8672566371681416,
"eval_runtime": 0.908,
"eval_samples_per_second": 205.949,
"eval_steps_per_second": 3.304,
"step": 8798
},
{
"epoch": 84.0,
"grad_norm": 1.2858631610870361,
"learning_rate": 8.000000000000001e-06,
"loss": 0.0908,
"step": 8904
},
{
"epoch": 84.0,
"eval_LOCATION_f1": 0.7712418300653595,
"eval_LOCATION_number": 72,
"eval_LOCATION_precision": 0.7283950617283951,
"eval_LOCATION_recall": 0.8194444444444444,
"eval_ORGANIZATION_f1": 0.7647058823529413,
"eval_ORGANIZATION_number": 75,
"eval_ORGANIZATION_precision": 0.6842105263157895,
"eval_ORGANIZATION_recall": 0.8666666666666667,
"eval_PERSON_f1": 0.8903654485049833,
"eval_PERSON_number": 143,
"eval_PERSON_precision": 0.8481012658227848,
"eval_PERSON_recall": 0.9370629370629371,
"eval_QUANTITY_f1": 0.5925925925925926,
"eval_QUANTITY_number": 23,
"eval_QUANTITY_precision": 0.5161290322580645,
"eval_QUANTITY_recall": 0.6956521739130435,
"eval_TIME_f1": 0.7636363636363636,
"eval_TIME_number": 26,
"eval_TIME_precision": 0.7241379310344828,
"eval_TIME_recall": 0.8076923076923077,
"eval_loss": 0.13691945374011993,
"eval_overall_accuracy": 0.9572179134350763,
"eval_overall_f1": 0.8049113233287858,
"eval_overall_precision": 0.748730964467005,
"eval_overall_recall": 0.8702064896755162,
"eval_runtime": 0.9149,
"eval_samples_per_second": 204.386,
"eval_steps_per_second": 3.279,
"step": 8904
},
{
"epoch": 85.0,
"grad_norm": 2.4220991134643555,
"learning_rate": 7.5e-06,
"loss": 0.0937,
"step": 9010
},
{
"epoch": 85.0,
"eval_LOCATION_f1": 0.7792207792207793,
"eval_LOCATION_number": 72,
"eval_LOCATION_precision": 0.7317073170731707,
"eval_LOCATION_recall": 0.8333333333333334,
"eval_ORGANIZATION_f1": 0.7647058823529413,
"eval_ORGANIZATION_number": 75,
"eval_ORGANIZATION_precision": 0.6842105263157895,
"eval_ORGANIZATION_recall": 0.8666666666666667,
"eval_PERSON_f1": 0.8903654485049833,
"eval_PERSON_number": 143,
"eval_PERSON_precision": 0.8481012658227848,
"eval_PERSON_recall": 0.9370629370629371,
"eval_QUANTITY_f1": 0.5925925925925926,
"eval_QUANTITY_number": 23,
"eval_QUANTITY_precision": 0.5161290322580645,
"eval_QUANTITY_recall": 0.6956521739130435,
"eval_TIME_f1": 0.7636363636363636,
"eval_TIME_number": 26,
"eval_TIME_precision": 0.7241379310344828,
"eval_TIME_recall": 0.8076923076923077,
"eval_loss": 0.13628537952899933,
"eval_overall_accuracy": 0.9574681010758068,
"eval_overall_f1": 0.8065395095367849,
"eval_overall_precision": 0.7493670886075949,
"eval_overall_recall": 0.8731563421828908,
"eval_runtime": 0.91,
"eval_samples_per_second": 205.496,
"eval_steps_per_second": 3.297,
"step": 9010
},
{
"epoch": 86.0,
"grad_norm": 1.8708733320236206,
"learning_rate": 7.000000000000001e-06,
"loss": 0.0926,
"step": 9116
},
{
"epoch": 86.0,
"eval_LOCATION_f1": 0.7662337662337662,
"eval_LOCATION_number": 72,
"eval_LOCATION_precision": 0.7195121951219512,
"eval_LOCATION_recall": 0.8194444444444444,
"eval_ORGANIZATION_f1": 0.7380952380952381,
"eval_ORGANIZATION_number": 75,
"eval_ORGANIZATION_precision": 0.6666666666666666,
"eval_ORGANIZATION_recall": 0.8266666666666667,
"eval_PERSON_f1": 0.8903654485049833,
"eval_PERSON_number": 143,
"eval_PERSON_precision": 0.8481012658227848,
"eval_PERSON_recall": 0.9370629370629371,
"eval_QUANTITY_f1": 0.5925925925925926,
"eval_QUANTITY_number": 23,
"eval_QUANTITY_precision": 0.5161290322580645,
"eval_QUANTITY_recall": 0.6956521739130435,
"eval_TIME_f1": 0.7636363636363636,
"eval_TIME_number": 26,
"eval_TIME_precision": 0.7241379310344828,
"eval_TIME_recall": 0.8076923076923077,
"eval_loss": 0.1368514746427536,
"eval_overall_accuracy": 0.9569677257943457,
"eval_overall_f1": 0.7978142076502732,
"eval_overall_precision": 0.7430025445292621,
"eval_overall_recall": 0.8613569321533924,
"eval_runtime": 0.9121,
"eval_samples_per_second": 205.021,
"eval_steps_per_second": 3.289,
"step": 9116
},
{
"epoch": 87.0,
"grad_norm": 1.4662730693817139,
"learning_rate": 6.5000000000000004e-06,
"loss": 0.09,
"step": 9222
},
{
"epoch": 87.0,
"eval_LOCATION_f1": 0.7712418300653595,
"eval_LOCATION_number": 72,
"eval_LOCATION_precision": 0.7283950617283951,
"eval_LOCATION_recall": 0.8194444444444444,
"eval_ORGANIZATION_f1": 0.7425149700598803,
"eval_ORGANIZATION_number": 75,
"eval_ORGANIZATION_precision": 0.6739130434782609,
"eval_ORGANIZATION_recall": 0.8266666666666667,
"eval_PERSON_f1": 0.8933333333333333,
"eval_PERSON_number": 143,
"eval_PERSON_precision": 0.8535031847133758,
"eval_PERSON_recall": 0.9370629370629371,
"eval_QUANTITY_f1": 0.5925925925925926,
"eval_QUANTITY_number": 23,
"eval_QUANTITY_precision": 0.5161290322580645,
"eval_QUANTITY_recall": 0.6956521739130435,
"eval_TIME_f1": 0.8,
"eval_TIME_number": 26,
"eval_TIME_precision": 0.7586206896551724,
"eval_TIME_recall": 0.8461538461538461,
"eval_loss": 0.1350514441728592,
"eval_overall_accuracy": 0.9577182887165374,
"eval_overall_f1": 0.803840877914952,
"eval_overall_precision": 0.7512820512820513,
"eval_overall_recall": 0.8643067846607669,
"eval_runtime": 0.9064,
"eval_samples_per_second": 206.321,
"eval_steps_per_second": 3.31,
"step": 9222
},
{
"epoch": 88.0,
"grad_norm": 0.9708890318870544,
"learning_rate": 6e-06,
"loss": 0.0895,
"step": 9328
},
{
"epoch": 88.0,
"eval_LOCATION_f1": 0.7662337662337662,
"eval_LOCATION_number": 72,
"eval_LOCATION_precision": 0.7195121951219512,
"eval_LOCATION_recall": 0.8194444444444444,
"eval_ORGANIZATION_f1": 0.75,
"eval_ORGANIZATION_number": 75,
"eval_ORGANIZATION_precision": 0.6774193548387096,
"eval_ORGANIZATION_recall": 0.84,
"eval_PERSON_f1": 0.8903654485049833,
"eval_PERSON_number": 143,
"eval_PERSON_precision": 0.8481012658227848,
"eval_PERSON_recall": 0.9370629370629371,
"eval_QUANTITY_f1": 0.5925925925925926,
"eval_QUANTITY_number": 23,
"eval_QUANTITY_precision": 0.5161290322580645,
"eval_QUANTITY_recall": 0.6956521739130435,
"eval_TIME_f1": 0.8,
"eval_TIME_number": 26,
"eval_TIME_precision": 0.7586206896551724,
"eval_TIME_recall": 0.8461538461538461,
"eval_loss": 0.13717986643314362,
"eval_overall_accuracy": 0.9574681010758068,
"eval_overall_f1": 0.8032786885245901,
"eval_overall_precision": 0.7480916030534351,
"eval_overall_recall": 0.8672566371681416,
"eval_runtime": 0.9061,
"eval_samples_per_second": 206.382,
"eval_steps_per_second": 3.311,
"step": 9328
},
{
"epoch": 89.0,
"grad_norm": 0.9818236231803894,
"learning_rate": 5.500000000000001e-06,
"loss": 0.0907,
"step": 9434
},
{
"epoch": 89.0,
"eval_LOCATION_f1": 0.7662337662337662,
"eval_LOCATION_number": 72,
"eval_LOCATION_precision": 0.7195121951219512,
"eval_LOCATION_recall": 0.8194444444444444,
"eval_ORGANIZATION_f1": 0.7619047619047621,
"eval_ORGANIZATION_number": 75,
"eval_ORGANIZATION_precision": 0.6881720430107527,
"eval_ORGANIZATION_recall": 0.8533333333333334,
"eval_PERSON_f1": 0.8874172185430464,
"eval_PERSON_number": 143,
"eval_PERSON_precision": 0.8427672955974843,
"eval_PERSON_recall": 0.9370629370629371,
"eval_QUANTITY_f1": 0.5818181818181818,
"eval_QUANTITY_number": 23,
"eval_QUANTITY_precision": 0.5,
"eval_QUANTITY_recall": 0.6956521739130435,
"eval_TIME_f1": 0.7636363636363636,
"eval_TIME_number": 26,
"eval_TIME_precision": 0.7241379310344828,
"eval_TIME_recall": 0.8076923076923077,
"eval_loss": 0.13800707459449768,
"eval_overall_accuracy": 0.9564673505128847,
"eval_overall_f1": 0.8010899182561309,
"eval_overall_precision": 0.7443037974683544,
"eval_overall_recall": 0.8672566371681416,
"eval_runtime": 0.9188,
"eval_samples_per_second": 203.525,
"eval_steps_per_second": 3.265,
"step": 9434
},
{
"epoch": 90.0,
"grad_norm": 1.852787971496582,
"learning_rate": 5e-06,
"loss": 0.0876,
"step": 9540
},
{
"epoch": 90.0,
"eval_LOCATION_f1": 0.7792207792207793,
"eval_LOCATION_number": 72,
"eval_LOCATION_precision": 0.7317073170731707,
"eval_LOCATION_recall": 0.8333333333333334,
"eval_ORGANIZATION_f1": 0.7692307692307693,
"eval_ORGANIZATION_number": 75,
"eval_ORGANIZATION_precision": 0.6914893617021277,
"eval_ORGANIZATION_recall": 0.8666666666666667,
"eval_PERSON_f1": 0.8903654485049833,
"eval_PERSON_number": 143,
"eval_PERSON_precision": 0.8481012658227848,
"eval_PERSON_recall": 0.9370629370629371,
"eval_QUANTITY_f1": 0.5925925925925926,
"eval_QUANTITY_number": 23,
"eval_QUANTITY_precision": 0.5161290322580645,
"eval_QUANTITY_recall": 0.6956521739130435,
"eval_TIME_f1": 0.7636363636363636,
"eval_TIME_number": 26,
"eval_TIME_precision": 0.7241379310344828,
"eval_TIME_recall": 0.8076923076923077,
"eval_loss": 0.137681245803833,
"eval_overall_accuracy": 0.9574681010758068,
"eval_overall_f1": 0.8076398362892225,
"eval_overall_precision": 0.751269035532995,
"eval_overall_recall": 0.8731563421828908,
"eval_runtime": 0.9141,
"eval_samples_per_second": 204.564,
"eval_steps_per_second": 3.282,
"step": 9540
},
{
"epoch": 91.0,
"grad_norm": 1.275254487991333,
"learning_rate": 4.5e-06,
"loss": 0.0901,
"step": 9646
},
{
"epoch": 91.0,
"eval_LOCATION_f1": 0.7792207792207793,
"eval_LOCATION_number": 72,
"eval_LOCATION_precision": 0.7317073170731707,
"eval_LOCATION_recall": 0.8333333333333334,
"eval_ORGANIZATION_f1": 0.7738095238095238,
"eval_ORGANIZATION_number": 75,
"eval_ORGANIZATION_precision": 0.6989247311827957,
"eval_ORGANIZATION_recall": 0.8666666666666667,
"eval_PERSON_f1": 0.8874172185430464,
"eval_PERSON_number": 143,
"eval_PERSON_precision": 0.8427672955974843,
"eval_PERSON_recall": 0.9370629370629371,
"eval_QUANTITY_f1": 0.5925925925925926,
"eval_QUANTITY_number": 23,
"eval_QUANTITY_precision": 0.5161290322580645,
"eval_QUANTITY_recall": 0.6956521739130435,
"eval_TIME_f1": 0.7636363636363636,
"eval_TIME_number": 26,
"eval_TIME_precision": 0.7241379310344828,
"eval_TIME_recall": 0.8076923076923077,
"eval_loss": 0.1385199874639511,
"eval_overall_accuracy": 0.9577182887165374,
"eval_overall_f1": 0.8076398362892225,
"eval_overall_precision": 0.751269035532995,
"eval_overall_recall": 0.8731563421828908,
"eval_runtime": 0.9137,
"eval_samples_per_second": 204.659,
"eval_steps_per_second": 3.283,
"step": 9646
},
{
"epoch": 92.0,
"grad_norm": 6.197476387023926,
"learning_rate": 4.000000000000001e-06,
"loss": 0.0937,
"step": 9752
},
{
"epoch": 92.0,
"eval_LOCATION_f1": 0.7662337662337662,
"eval_LOCATION_number": 72,
"eval_LOCATION_precision": 0.7195121951219512,
"eval_LOCATION_recall": 0.8194444444444444,
"eval_ORGANIZATION_f1": 0.757396449704142,
"eval_ORGANIZATION_number": 75,
"eval_ORGANIZATION_precision": 0.6808510638297872,
"eval_ORGANIZATION_recall": 0.8533333333333334,
"eval_PERSON_f1": 0.8903654485049833,
"eval_PERSON_number": 143,
"eval_PERSON_precision": 0.8481012658227848,
"eval_PERSON_recall": 0.9370629370629371,
"eval_QUANTITY_f1": 0.5925925925925926,
"eval_QUANTITY_number": 23,
"eval_QUANTITY_precision": 0.5161290322580645,
"eval_QUANTITY_recall": 0.6956521739130435,
"eval_TIME_f1": 0.8,
"eval_TIME_number": 26,
"eval_TIME_precision": 0.7586206896551724,
"eval_TIME_recall": 0.8461538461538461,
"eval_loss": 0.1368849277496338,
"eval_overall_accuracy": 0.9577182887165374,
"eval_overall_f1": 0.8049113233287858,
"eval_overall_precision": 0.748730964467005,
"eval_overall_recall": 0.8702064896755162,
"eval_runtime": 0.9187,
"eval_samples_per_second": 203.55,
"eval_steps_per_second": 3.266,
"step": 9752
},
{
"epoch": 93.0,
"grad_norm": 0.66109699010849,
"learning_rate": 3.5000000000000004e-06,
"loss": 0.0879,
"step": 9858
},
{
"epoch": 93.0,
"eval_LOCATION_f1": 0.7662337662337662,
"eval_LOCATION_number": 72,
"eval_LOCATION_precision": 0.7195121951219512,
"eval_LOCATION_recall": 0.8194444444444444,
"eval_ORGANIZATION_f1": 0.7692307692307693,
"eval_ORGANIZATION_number": 75,
"eval_ORGANIZATION_precision": 0.6914893617021277,
"eval_ORGANIZATION_recall": 0.8666666666666667,
"eval_PERSON_f1": 0.8903654485049833,
"eval_PERSON_number": 143,
"eval_PERSON_precision": 0.8481012658227848,
"eval_PERSON_recall": 0.9370629370629371,
"eval_QUANTITY_f1": 0.5818181818181818,
"eval_QUANTITY_number": 23,
"eval_QUANTITY_precision": 0.5,
"eval_QUANTITY_recall": 0.6956521739130435,
"eval_TIME_f1": 0.7636363636363636,
"eval_TIME_number": 26,
"eval_TIME_precision": 0.7241379310344828,
"eval_TIME_recall": 0.8076923076923077,
"eval_loss": 0.13911746442317963,
"eval_overall_accuracy": 0.9569677257943457,
"eval_overall_f1": 0.8038147138964578,
"eval_overall_precision": 0.7468354430379747,
"eval_overall_recall": 0.8702064896755162,
"eval_runtime": 0.9162,
"eval_samples_per_second": 204.094,
"eval_steps_per_second": 3.274,
"step": 9858
},
{
"epoch": 94.0,
"grad_norm": 0.9965635538101196,
"learning_rate": 3e-06,
"loss": 0.0903,
"step": 9964
},
{
"epoch": 94.0,
"eval_LOCATION_f1": 0.7662337662337662,
"eval_LOCATION_number": 72,
"eval_LOCATION_precision": 0.7195121951219512,
"eval_LOCATION_recall": 0.8194444444444444,
"eval_ORGANIZATION_f1": 0.7692307692307693,
"eval_ORGANIZATION_number": 75,
"eval_ORGANIZATION_precision": 0.6914893617021277,
"eval_ORGANIZATION_recall": 0.8666666666666667,
"eval_PERSON_f1": 0.8903654485049833,
"eval_PERSON_number": 143,
"eval_PERSON_precision": 0.8481012658227848,
"eval_PERSON_recall": 0.9370629370629371,
"eval_QUANTITY_f1": 0.5818181818181818,
"eval_QUANTITY_number": 23,
"eval_QUANTITY_precision": 0.5,
"eval_QUANTITY_recall": 0.6956521739130435,
"eval_TIME_f1": 0.8,
"eval_TIME_number": 26,
"eval_TIME_precision": 0.7586206896551724,
"eval_TIME_recall": 0.8461538461538461,
"eval_loss": 0.13771039247512817,
"eval_overall_accuracy": 0.9572179134350763,
"eval_overall_f1": 0.8065395095367849,
"eval_overall_precision": 0.7493670886075949,
"eval_overall_recall": 0.8731563421828908,
"eval_runtime": 0.9132,
"eval_samples_per_second": 204.777,
"eval_steps_per_second": 3.285,
"step": 9964
},
{
"epoch": 95.0,
"grad_norm": 0.8963160514831543,
"learning_rate": 2.5e-06,
"loss": 0.0895,
"step": 10070
},
{
"epoch": 95.0,
"eval_LOCATION_f1": 0.7662337662337662,
"eval_LOCATION_number": 72,
"eval_LOCATION_precision": 0.7195121951219512,
"eval_LOCATION_recall": 0.8194444444444444,
"eval_ORGANIZATION_f1": 0.7692307692307693,
"eval_ORGANIZATION_number": 75,
"eval_ORGANIZATION_precision": 0.6914893617021277,
"eval_ORGANIZATION_recall": 0.8666666666666667,
"eval_PERSON_f1": 0.8903654485049833,
"eval_PERSON_number": 143,
"eval_PERSON_precision": 0.8481012658227848,
"eval_PERSON_recall": 0.9370629370629371,
"eval_QUANTITY_f1": 0.5925925925925926,
"eval_QUANTITY_number": 23,
"eval_QUANTITY_precision": 0.5161290322580645,
"eval_QUANTITY_recall": 0.6956521739130435,
"eval_TIME_f1": 0.8,
"eval_TIME_number": 26,
"eval_TIME_precision": 0.7586206896551724,
"eval_TIME_recall": 0.8461538461538461,
"eval_loss": 0.13782991468906403,
"eval_overall_accuracy": 0.9574681010758068,
"eval_overall_f1": 0.8076398362892225,
"eval_overall_precision": 0.751269035532995,
"eval_overall_recall": 0.8731563421828908,
"eval_runtime": 0.9219,
"eval_samples_per_second": 202.849,
"eval_steps_per_second": 3.254,
"step": 10070
},
{
"epoch": 96.0,
"grad_norm": 0.9854846000671387,
"learning_rate": 2.0000000000000003e-06,
"loss": 0.0923,
"step": 10176
},
{
"epoch": 96.0,
"eval_LOCATION_f1": 0.7662337662337662,
"eval_LOCATION_number": 72,
"eval_LOCATION_precision": 0.7195121951219512,
"eval_LOCATION_recall": 0.8194444444444444,
"eval_ORGANIZATION_f1": 0.7692307692307693,
"eval_ORGANIZATION_number": 75,
"eval_ORGANIZATION_precision": 0.6914893617021277,
"eval_ORGANIZATION_recall": 0.8666666666666667,
"eval_PERSON_f1": 0.8903654485049833,
"eval_PERSON_number": 143,
"eval_PERSON_precision": 0.8481012658227848,
"eval_PERSON_recall": 0.9370629370629371,
"eval_QUANTITY_f1": 0.5818181818181818,
"eval_QUANTITY_number": 23,
"eval_QUANTITY_precision": 0.5,
"eval_QUANTITY_recall": 0.6956521739130435,
"eval_TIME_f1": 0.7636363636363636,
"eval_TIME_number": 26,
"eval_TIME_precision": 0.7241379310344828,
"eval_TIME_recall": 0.8076923076923077,
"eval_loss": 0.1382056623697281,
"eval_overall_accuracy": 0.9569677257943457,
"eval_overall_f1": 0.8038147138964578,
"eval_overall_precision": 0.7468354430379747,
"eval_overall_recall": 0.8702064896755162,
"eval_runtime": 0.9084,
"eval_samples_per_second": 205.85,
"eval_steps_per_second": 3.302,
"step": 10176
},
{
"epoch": 97.0,
"grad_norm": 0.8474765419960022,
"learning_rate": 1.5e-06,
"loss": 0.0893,
"step": 10282
},
{
"epoch": 97.0,
"eval_LOCATION_f1": 0.7792207792207793,
"eval_LOCATION_number": 72,
"eval_LOCATION_precision": 0.7317073170731707,
"eval_LOCATION_recall": 0.8333333333333334,
"eval_ORGANIZATION_f1": 0.7692307692307693,
"eval_ORGANIZATION_number": 75,
"eval_ORGANIZATION_precision": 0.6914893617021277,
"eval_ORGANIZATION_recall": 0.8666666666666667,
"eval_PERSON_f1": 0.8903654485049833,
"eval_PERSON_number": 143,
"eval_PERSON_precision": 0.8481012658227848,
"eval_PERSON_recall": 0.9370629370629371,
"eval_QUANTITY_f1": 0.5818181818181818,
"eval_QUANTITY_number": 23,
"eval_QUANTITY_precision": 0.5,
"eval_QUANTITY_recall": 0.6956521739130435,
"eval_TIME_f1": 0.8,
"eval_TIME_number": 26,
"eval_TIME_precision": 0.7586206896551724,
"eval_TIME_recall": 0.8461538461538461,
"eval_loss": 0.13706086575984955,
"eval_overall_accuracy": 0.9574681010758068,
"eval_overall_f1": 0.8092643051771118,
"eval_overall_precision": 0.7518987341772152,
"eval_overall_recall": 0.8761061946902655,
"eval_runtime": 0.9212,
"eval_samples_per_second": 202.999,
"eval_steps_per_second": 3.257,
"step": 10282
},
{
"epoch": 98.0,
"grad_norm": 2.321481704711914,
"learning_rate": 1.0000000000000002e-06,
"loss": 0.0884,
"step": 10388
},
{
"epoch": 98.0,
"eval_LOCATION_f1": 0.7792207792207793,
"eval_LOCATION_number": 72,
"eval_LOCATION_precision": 0.7317073170731707,
"eval_LOCATION_recall": 0.8333333333333334,
"eval_ORGANIZATION_f1": 0.7692307692307693,
"eval_ORGANIZATION_number": 75,
"eval_ORGANIZATION_precision": 0.6914893617021277,
"eval_ORGANIZATION_recall": 0.8666666666666667,
"eval_PERSON_f1": 0.8903654485049833,
"eval_PERSON_number": 143,
"eval_PERSON_precision": 0.8481012658227848,
"eval_PERSON_recall": 0.9370629370629371,
"eval_QUANTITY_f1": 0.5925925925925926,
"eval_QUANTITY_number": 23,
"eval_QUANTITY_precision": 0.5161290322580645,
"eval_QUANTITY_recall": 0.6956521739130435,
"eval_TIME_f1": 0.8,
"eval_TIME_number": 26,
"eval_TIME_precision": 0.7586206896551724,
"eval_TIME_recall": 0.8461538461538461,
"eval_loss": 0.13722318410873413,
"eval_overall_accuracy": 0.9577182887165374,
"eval_overall_f1": 0.8103683492496591,
"eval_overall_precision": 0.7538071065989848,
"eval_overall_recall": 0.8761061946902655,
"eval_runtime": 0.9082,
"eval_samples_per_second": 205.909,
"eval_steps_per_second": 3.303,
"step": 10388
},
{
"epoch": 99.0,
"grad_norm": 0.8234521150588989,
"learning_rate": 5.000000000000001e-07,
"loss": 0.0881,
"step": 10494
},
{
"epoch": 99.0,
"eval_LOCATION_f1": 0.7792207792207793,
"eval_LOCATION_number": 72,
"eval_LOCATION_precision": 0.7317073170731707,
"eval_LOCATION_recall": 0.8333333333333334,
"eval_ORGANIZATION_f1": 0.7692307692307693,
"eval_ORGANIZATION_number": 75,
"eval_ORGANIZATION_precision": 0.6914893617021277,
"eval_ORGANIZATION_recall": 0.8666666666666667,
"eval_PERSON_f1": 0.8903654485049833,
"eval_PERSON_number": 143,
"eval_PERSON_precision": 0.8481012658227848,
"eval_PERSON_recall": 0.9370629370629371,
"eval_QUANTITY_f1": 0.5925925925925926,
"eval_QUANTITY_number": 23,
"eval_QUANTITY_precision": 0.5161290322580645,
"eval_QUANTITY_recall": 0.6956521739130435,
"eval_TIME_f1": 0.8,
"eval_TIME_number": 26,
"eval_TIME_precision": 0.7586206896551724,
"eval_TIME_recall": 0.8461538461538461,
"eval_loss": 0.13734257221221924,
"eval_overall_accuracy": 0.9577182887165374,
"eval_overall_f1": 0.8103683492496591,
"eval_overall_precision": 0.7538071065989848,
"eval_overall_recall": 0.8761061946902655,
"eval_runtime": 0.9101,
"eval_samples_per_second": 205.475,
"eval_steps_per_second": 3.296,
"step": 10494
},
{
"epoch": 100.0,
"grad_norm": 0.8098838925361633,
"learning_rate": 0.0,
"loss": 0.0886,
"step": 10600
},
{
"epoch": 100.0,
"eval_LOCATION_f1": 0.7792207792207793,
"eval_LOCATION_number": 72,
"eval_LOCATION_precision": 0.7317073170731707,
"eval_LOCATION_recall": 0.8333333333333334,
"eval_ORGANIZATION_f1": 0.7692307692307693,
"eval_ORGANIZATION_number": 75,
"eval_ORGANIZATION_precision": 0.6914893617021277,
"eval_ORGANIZATION_recall": 0.8666666666666667,
"eval_PERSON_f1": 0.8903654485049833,
"eval_PERSON_number": 143,
"eval_PERSON_precision": 0.8481012658227848,
"eval_PERSON_recall": 0.9370629370629371,
"eval_QUANTITY_f1": 0.5925925925925926,
"eval_QUANTITY_number": 23,
"eval_QUANTITY_precision": 0.5161290322580645,
"eval_QUANTITY_recall": 0.6956521739130435,
"eval_TIME_f1": 0.8,
"eval_TIME_number": 26,
"eval_TIME_precision": 0.7586206896551724,
"eval_TIME_recall": 0.8461538461538461,
"eval_loss": 0.13735896348953247,
"eval_overall_accuracy": 0.9577182887165374,
"eval_overall_f1": 0.8103683492496591,
"eval_overall_precision": 0.7538071065989848,
"eval_overall_recall": 0.8761061946902655,
"eval_runtime": 0.9149,
"eval_samples_per_second": 204.394,
"eval_steps_per_second": 3.279,
"step": 10600
},
{
"epoch": 100.0,
"step": 10600,
"total_flos": 4517924176755654.0,
"train_loss": 0.14866713703803297,
"train_runtime": 1220.9124,
"train_samples_per_second": 138.175,
"train_steps_per_second": 8.682
}
],
"logging_steps": 500,
"max_steps": 10600,
"num_input_tokens_seen": 0,
"num_train_epochs": 100,
"save_steps": 500,
"total_flos": 4517924176755654.0,
"train_batch_size": 16,
"trial_name": null,
"trial_params": null
}